diff --git a/SpecForge-ext/.pre-commit-config.yaml b/SpecForge-ext/.pre-commit-config.yaml
new file mode 100644
index 0000000000000000000000000000000000000000..8191551a215425aa3884516a770175af784bd097
--- /dev/null
+++ b/SpecForge-ext/.pre-commit-config.yaml
@@ -0,0 +1,53 @@
+default_stages: [pre-commit, pre-push, manual]
+
+repos:
+ - repo: https://github.com/PyCQA/autoflake
+ rev: v2.3.1
+ hooks:
+ - id: autoflake
+ args: [--remove-all-unused-imports, --in-place]
+ - repo: https://github.com/pre-commit/pre-commit-hooks
+ rev: v5.0.0
+ hooks:
+ - id: check-symlinks
+ - id: destroyed-symlinks
+ - id: trailing-whitespace
+ - id: end-of-file-fixer
+ - id: check-yaml
+ args: [--allow-multiple-documents]
+ - id: check-toml
+ - id: check-ast
+ - id: check-added-large-files
+ - id: check-merge-conflict
+ - id: check-shebang-scripts-are-executable
+ - id: detect-private-key
+ - id: debug-statements
+ - id: no-commit-to-branch
+ - repo: https://github.com/PyCQA/isort
+ rev: 5.13.2
+ hooks:
+ - id: isort
+ - repo: https://github.com/astral-sh/ruff-pre-commit
+ rev: v0.11.10
+ hooks:
+ - id: ruff
+ args: [--select=F401, --fixable=F401]
+ files: ^(benchmark/|docs/|examples/)
+ exclude: \.ipynb$
+ - repo: https://github.com/psf/black
+ rev: 24.10.0
+ hooks:
+ - id: black-jupyter
+ - repo: https://github.com/pre-commit/mirrors-clang-format
+ rev: v18.1.8
+ hooks:
+ - id: clang-format
+ types_or: [c++, cuda]
+ args: [--style=file, --verbose]
+ - repo: https://github.com/kynan/nbstripout
+ rev: 0.8.1
+ hooks:
+ - id: nbstripout
+ args:
+ - '--keep-output'
+ - '--extra-keys=metadata.kernelspec metadata.language_info.version'
diff --git a/SpecForge-ext/convert_mtbench.py b/SpecForge-ext/convert_mtbench.py
new file mode 100644
index 0000000000000000000000000000000000000000..0908aa7be758120c936ede8630caf64bb1a788c9
--- /dev/null
+++ b/SpecForge-ext/convert_mtbench.py
@@ -0,0 +1,22 @@
+#!/usr/bin/env python3
+import json
+import os
+
+# 读取 JSON 文件并转换为 JSONL
+input_file = "/workspace/hanrui/SpecForge-ext/mtbench_sample.json"
+with open(input_file, 'r') as f:
+ data = json.load(f)
+
+# 保存为 jsonl
+cache_dir = os.path.expanduser("~/.cache/sglang")
+os.makedirs(cache_dir, exist_ok=True)
+output_file = os.path.join(cache_dir, "mtbench.jsonl")
+
+with open(output_file, 'w') as f:
+ for item in data:
+ f.write(json.dumps(item) + '\n')
+
+print(f"Converted {len(data)} questions")
+print(f"Saved to {output_file}")
+print(f"\nFirst question:")
+print(json.dumps(data[0], indent=2))
diff --git a/SpecForge-ext/download_datasets.py b/SpecForge-ext/download_datasets.py
new file mode 100644
index 0000000000000000000000000000000000000000..9b620497a1a50d25a41248833802172a21dca6b6
--- /dev/null
+++ b/SpecForge-ext/download_datasets.py
@@ -0,0 +1,64 @@
+#!/usr/bin/env python3
+"""
+下载 GSM8K 和 HumanEval 数据集到本地
+"""
+import os
+import json
+import requests
+from datasets import load_dataset
+
+DATA_DIR = "/workspace/hanrui/datasets"
+os.makedirs(DATA_DIR, exist_ok=True)
+
+print("=" * 60)
+print("下载 GSM8K 数据集")
+print("=" * 60)
+
+try:
+ # 下载 GSM8K
+ gsm8k_dir = os.path.join(DATA_DIR, "gsm8k")
+ os.makedirs(gsm8k_dir, exist_ok=True)
+
+ print("Loading GSM8K from HuggingFace...")
+ dataset = load_dataset("gsm8k", "main", split="test")
+
+ # 保存为 jsonl
+ output_file = os.path.join(gsm8k_dir, "test.jsonl")
+ with open(output_file, 'w') as f:
+ for item in dataset:
+ f.write(json.dumps(item) + '\n')
+
+ print(f"✓ GSM8K saved to {output_file}")
+ print(f" Total samples: {len(dataset)}")
+
+except Exception as e:
+ print(f"✗ GSM8K download failed: {e}")
+
+print("\n" + "=" * 60)
+print("下载 HumanEval 数据集")
+print("=" * 60)
+
+try:
+ # 下载 HumanEval
+ humaneval_dir = os.path.join(DATA_DIR, "humaneval")
+ os.makedirs(humaneval_dir, exist_ok=True)
+
+ print("Loading HumanEval from HuggingFace...")
+ dataset = load_dataset("openai_humaneval", split="test")
+
+ # 保存为 jsonl
+ output_file = os.path.join(humaneval_dir, "test.jsonl")
+ with open(output_file, 'w') as f:
+ for item in dataset:
+ f.write(json.dumps(item) + '\n')
+
+ print(f"✓ HumanEval saved to {output_file}")
+ print(f" Total samples: {len(dataset)}")
+
+except Exception as e:
+ print(f"✗ HumanEval download failed: {e}")
+
+print("\n" + "=" * 60)
+print("下载完成")
+print("=" * 60)
+print(f"数据保存在: {DATA_DIR}")
diff --git a/SpecForge-ext/download_mtbench.sh b/SpecForge-ext/download_mtbench.sh
new file mode 100644
index 0000000000000000000000000000000000000000..20a8b392d6803f618528d6852baaca6777e04bdb
--- /dev/null
+++ b/SpecForge-ext/download_mtbench.sh
@@ -0,0 +1,23 @@
+#!/bin/bash
+
+# 下载 mtbench 数据文件
+# 如果无法访问 GitHub,需要手动下载或使用镜像
+
+CACHE_DIR="$HOME/.cache/sglang"
+mkdir -p "$CACHE_DIR"
+
+echo "Downloading mtbench data..."
+
+# 方法1:尝试使用代理下载
+https_proxy=http://10.1.2.1:7890 http_proxy=http://10.1.2.1:7890 \
+curl -L "https://raw.githubusercontent.com/lm-sys/FastChat/main/fastchat/llm_judge/data/mt_bench/question.jsonl" \
+ -o "$CACHE_DIR/mtbench.jsonl"
+
+if [ $? -eq 0 ]; then
+ echo "Downloaded to $CACHE_DIR/mtbench.jsonl"
+ ls -lh "$CACHE_DIR/mtbench.jsonl"
+else
+ echo "Download failed. Please manually download the file from:"
+ echo "https://raw.githubusercontent.com/lm-sys/FastChat/main/fastchat/llm_judge/data/mt_bench/question.jsonl"
+ echo "And save it to: $CACHE_DIR/mtbench.jsonl"
+fi
diff --git a/SpecForge-ext/download_mtbench_data.py b/SpecForge-ext/download_mtbench_data.py
new file mode 100644
index 0000000000000000000000000000000000000000..d42096c3d3d4ea9b9244b15109a518b91a7ac121
--- /dev/null
+++ b/SpecForge-ext/download_mtbench_data.py
@@ -0,0 +1,51 @@
+#!/usr/bin/env python3
+"""
+下载并转换 MT-Bench 数据到本地目录
+"""
+import json
+import os
+import requests
+
+# 目标目录
+DATA_DIR = "/workspace/hanrui/datasets/mtbench"
+os.makedirs(DATA_DIR, exist_ok=True)
+
+# 下载 MT-Bench 问题数据
+url = "https://raw.githubusercontent.com/lm-sys/FastChat/main/fastchat/llm_judge/data/mt_bench/question.jsonl"
+output_file = os.path.join(DATA_DIR, "question.jsonl")
+
+print(f"Downloading MT-Bench questions from {url}")
+print(f"Saving to {output_file}")
+
+try:
+ # 使用代理下载
+ proxies = {
+ 'http': 'http://10.1.2.1:7890',
+ 'https': 'http://10.1.2.1:7890',
+ }
+
+ response = requests.get(url, proxies=proxies, timeout=30)
+ response.raise_for_status()
+
+ with open(output_file, 'wb') as f:
+ f.write(response.content)
+
+ print(f"✓ Downloaded successfully")
+
+ # 验证数据
+ with open(output_file, 'r') as f:
+ lines = f.readlines()
+
+ print(f"✓ Total questions: {len(lines)}")
+
+ # 显示第一个问题
+ first_question = json.loads(lines[0])
+ print(f"\nFirst question:")
+ print(json.dumps(first_question, indent=2))
+
+except Exception as e:
+ print(f"✗ Download failed: {e}")
+ print(f"\nPlease manually download from:")
+ print(f" {url}")
+ print(f"And save to:")
+ print(f" {output_file}")
diff --git a/SpecForge-ext/mtbench_sample.json b/SpecForge-ext/mtbench_sample.json
new file mode 100644
index 0000000000000000000000000000000000000000..fa64e47eaa8c491c2ce1be35c98ba420fea79c83
--- /dev/null
+++ b/SpecForge-ext/mtbench_sample.json
@@ -0,0 +1,26 @@
+[
+ {
+ "question_id": 1,
+ "category": "writing",
+ "turns": [
+ "Compose an engaging travel blog post about a recent trip to Hawaii, highlighting cultural experiences and must-see attractions.",
+ "Rewrite your previous response. Start every sentence with the letter A."
+ ]
+ },
+ {
+ "question_id": 2,
+ "category": "roleplay",
+ "turns": [
+ "Imagine you are writing a blog post comparing two popular smartphone models. Develop an outline for the blog post, including key points and subheadings to effectively compare and contrast the features, performance, and user experience of the two models. Please answer in fewer than 200 words.",
+ "Take your previous response and rephrase it as a limerick."
+ ]
+ },
+ {
+ "question_id": 3,
+ "category": "reasoning",
+ "turns": [
+ "Describe a vivid and unique character, using strong imagery and creative language. Please answer in fewer than two paragraphs.",
+ "Revise your previous response and incorporate an allusion to a famous work of literature or historical event in each sentence."
+ ]
+ }
+]
diff --git a/SpecForge-ext/pyproject.toml b/SpecForge-ext/pyproject.toml
new file mode 100644
index 0000000000000000000000000000000000000000..507c79dfa15f72be10ca723a5a784bb5fc586657
--- /dev/null
+++ b/SpecForge-ext/pyproject.toml
@@ -0,0 +1,44 @@
+[build-system]
+requires = ["setuptools>=61.0", "wheel"]
+build-backend = "setuptools.build_meta"
+
+[project]
+name = "specforge"
+dynamic = ["version", "description"]
+readme = "README.md"
+requires-python = ">=3.11"
+dependencies = [
+ "pre-commit",
+ "torch==2.9.1",
+ "torchaudio==2.9.1",
+ "torchvision==0.24.1",
+ "transformers==4.57.1",
+ "qwen-vl-utils==0.0.11",
+ "datasets",
+ "setuptools",
+ "tqdm",
+ "wandb",
+ "psutil",
+ "numpy",
+ "accelerate",
+ "pydantic",
+ "sglang==0.5.6",
+ "openai-harmony",
+ "ninja",
+ "packaging",
+ "yunchang",
+]
+
+[tool.setuptools]
+packages = ["specforge"]
+
+[project.optional-dependencies]
+dev = [
+ "pre-commit",
+ "unittest"
+]
+fa = ["flash-attn"]
+
+[tool.setuptools.dynamic]
+version = {file = "version.txt"}
+description = {file = "README.md"}
diff --git a/SpecForge-ext/requirements.txt b/SpecForge-ext/requirements.txt
new file mode 100644
index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391
diff --git a/SpecForge-ext/setup.py b/SpecForge-ext/setup.py
new file mode 100644
index 0000000000000000000000000000000000000000..08acbafb080791b91b26c5789b5e992740d49557
--- /dev/null
+++ b/SpecForge-ext/setup.py
@@ -0,0 +1,33 @@
+import tomllib
+from pathlib import Path
+
+from setuptools import find_packages, setup
+
+
+def read_readme():
+ with open("README.md", "r") as f:
+ return f.read()
+
+
+def read_version():
+ with open("version.txt", "r") as f:
+ return f.read().strip()
+
+
+def read_dependencies():
+ pyproject_path = Path(__file__).parent / "pyproject.toml"
+ with open(pyproject_path, "rb") as f:
+ pyproject = tomllib.load(f)
+ return pyproject.get("project", {}).get("dependencies", [])
+
+
+setup(  # package metadata; several fields are loaded from sibling files by the helpers above
+ name="specforge",
+ packages=find_packages(exclude=["configs", "scripts", "tests"]),  # skip configs/scripts/tests
+ version=read_version(),  # contents of version.txt
+ install_requires=read_dependencies(),  # [project].dependencies from pyproject.toml
+ long_description=read_readme(),  # contents of README.md
+ long_description_content_type="text/markdown",
+ author="SGLang Team",
+ url="https://github.com/sgl-project/SpecForge",
+)
diff --git a/SpecForge-ext/test_accept_length.md b/SpecForge-ext/test_accept_length.md
new file mode 100644
index 0000000000000000000000000000000000000000..9ab9f71f180b654f1dc013acfed678bf0c0f0915
--- /dev/null
+++ b/SpecForge-ext/test_accept_length.md
@@ -0,0 +1,300 @@
+# Accept Length 测试指南
+
+## 0. 准备工作
+
+### 创建目录
+```bash
+cd /workspace/hanrui/SpecForge-ext
+mkdir -p logs results
+```
+
+### 下载数据集(首次运行)
+```bash
+cd /workspace/hanrui/SpecForge-ext
+python download_datasets.py
+```
+
+数据保存位置:
+- MT-Bench: `/workspace/hanrui/datasets/mtbench/question.jsonl`(`download_datasets.py` 不会下载该文件,需另外运行 `python download_mtbench_data.py`)
+- GSM8K: `/workspace/hanrui/datasets/gsm8k/test.jsonl`
+- HumanEval: `/workspace/hanrui/datasets/humaneval/test.jsonl`
+
+---
+
+## 1. 测试 Baseline 模型
+
+### 启动服务器(终端1)
+```bash
+cd /workspace/hanrui/SpecForge-ext
+
+# 设置环境变量
+export NO_PROXY="localhost,127.0.0.1,::1,10.0.0.0/8,172.16.0.0/12,192.168.0.0/16"
+export no_proxy="localhost,127.0.0.1,::1,10.0.0.0/8,172.16.0.0/12,192.168.0.0/16"
+
+# 启动 baseline 服务器
+python3 -m sglang.launch_server \
+ --model /workspace/Qwen3-8B \
+ --speculative-algorithm EAGLE3 \
+ --speculative-draft-model-path /workspace/qwen3_8b_eagle3 \
+ --speculative-num-steps 3 \
+ --speculative-eagle-topk 1 \
+ --speculative-num-draft-tokens 4 \
+ --mem-fraction-static 0.75 \
+ --cuda-graph-max-bs 1 \
+ --tp 1 \
+ --trust-remote-code \
+ --host 0.0.0.0 \
+ --port 30000 \
+ --dtype bfloat16 \
+ --skip-server-warmup
+```
+
+等待看到 `Application startup complete` 后,继续下一步。
+
+### 运行三个 Benchmark(终端2)
+```bash
+cd /workspace/hanrui/SpecForge-ext
+conda activate /workspace/Hanrui/
+
+# 设置环境变量
+export NO_PROXY="localhost,127.0.0.1,::1,10.0.0.0/8,172.16.0.0/12,192.168.0.0/16"
+export no_proxy="localhost,127.0.0.1,::1,10.0.0.0/8,172.16.0.0/12,192.168.0.0/16"
+
+# 1. MT-Bench
+echo "=== Running MT-Bench (Baseline) ==="
+python benchmarks/bench_eagle3.py \
+ --model-path /workspace/Qwen3-8B \
+ --host 10.1.1.31 \
+ --port 30000 \
+ --config-list 1,3,1,4 \
+ --benchmark-list mtbench:80 \
+ --dtype bfloat16 \
+ --skip-launch-server \
+ --name baseline_mtbench \
+ --output-dir ./results \
+ 2>&1 | tee logs/baseline_mtbench_$(date +%Y%m%d_%H%M%S).log
+
+# 2. GSM8K
+echo "=== Running GSM8K (Baseline) ==="
+python benchmarks/bench_eagle3.py \
+ --model-path /workspace/Qwen3-8B \
+ --host 10.1.1.31 \
+ --port 30000 \
+ --config-list 1,3,1,4 \
+ --benchmark-list gsm8k:100 \
+ --dtype bfloat16 \
+ --skip-launch-server \
+ --name baseline_gsm8k \
+ --output-dir ./results \
+ 2>&1 | tee logs/baseline_gsm8k_$(date +%Y%m%d_%H%M%S).log
+
+# 3. HumanEval
+echo "=== Running HumanEval (Baseline) ==="
+python benchmarks/bench_eagle3.py \
+ --model-path /workspace/Qwen3-8B \
+ --host 10.1.1.31 \
+ --port 30000 \
+ --config-list 1,3,1,4 \
+ --benchmark-list humaneval:164 \
+ --dtype bfloat16 \
+ --skip-launch-server \
+ --name baseline_humaneval \
+ --output-dir ./results \
+ 2>&1 | tee logs/baseline_humaneval_$(date +%Y%m%d_%H%M%S).log
+
+echo "=== Baseline 测试完成 ==="
+```
+
+---
+
+## 2. 测试训练后的模型
+
+### 停止 Baseline 服务器并启动训练后的服务器(终端1)
+```bash
+cd /workspace/hanrui/SpecForge-ext
+
+# 停止旧服务器
+pkill -f "sglang.launch_server"
+sleep 5
+
+# 设置环境变量
+export NO_PROXY="localhost,127.0.0.1,::1,10.0.0.0/8,172.16.0.0/12,192.168.0.0/16"
+export no_proxy="localhost,127.0.0.1,::1,10.0.0.0/8,172.16.0.0/12,192.168.0.0/16"
+
+# 启动训练后的服务器
+python3 -m sglang.launch_server \
+ --model /workspace/Qwen3-8B \
+ --speculative-algorithm EAGLE3 \
+ --speculative-draft-model-path /workspace/hanrui/SpecForge-ext/outputs/qwen3-8b-qwen3eagle-5layer/epoch_9_step_12310 \
+ --speculative-num-steps 3 \
+ --speculative-eagle-topk 1 \
+ --speculative-num-draft-tokens 4 \
+ --mem-fraction-static 0.75 \
+ --cuda-graph-max-bs 1 \
+ --tp 1 \
+ --trust-remote-code \
+ --host 0.0.0.0 \
+ --port 30000 \
+ --dtype bfloat16 \
+ --skip-server-warmup
+```
+
+等待看到 `Application startup complete` 后,继续下一步。
+
+### 运行三个 Benchmark(终端2)
+```bash
+cd /workspace/hanrui/SpecForge-ext
+conda activate /workspace/Hanrui/
+
+# 设置环境变量
+export NO_PROXY="localhost,127.0.0.1,::1,10.0.0.0/8,172.16.0.0/12,192.168.0.0/16"
+export no_proxy="localhost,127.0.0.1,::1,10.0.0.0/8,172.16.0.0/12,192.168.0.0/16"
+
+# 1. MT-Bench
+echo "=== Running MT-Bench (Trained) ==="
+python benchmarks/bench_eagle3.py \
+ --model-path /workspace/Qwen3-8B \
+ --host 10.1.1.31 \
+ --port 30000 \
+ --config-list 1,3,1,4 \
+ --benchmark-list mtbench:80 \
+ --dtype bfloat16 \
+ --skip-launch-server \
+ --name trained_mtbench \
+ --output-dir ./results \
+ 2>&1 | tee logs/trained_mtbench_$(date +%Y%m%d_%H%M%S).log
+
+# 2. GSM8K
+echo "=== Running GSM8K (Trained) ==="
+python benchmarks/bench_eagle3.py \
+ --model-path /workspace/Qwen3-8B \
+ --host 10.1.1.31 \
+ --port 30000 \
+ --config-list 1,3,1,4 \
+ --benchmark-list gsm8k:100 \
+ --dtype bfloat16 \
+ --skip-launch-server \
+ --name trained_gsm8k \
+ --output-dir ./results \
+ 2>&1 | tee logs/trained_gsm8k_$(date +%Y%m%d_%H%M%S).log
+
+# 3. HumanEval
+echo "=== Running HumanEval (Trained) ==="
+python benchmarks/bench_eagle3.py \
+ --model-path /workspace/Qwen3-8B \
+ --host 10.1.1.31 \
+ --port 30000 \
+ --config-list 1,3,1,4 \
+ --benchmark-list humaneval:164 \
+ --dtype bfloat16 \
+ --skip-launch-server \
+ --name trained_humaneval \
+ --output-dir ./results \
+ 2>&1 | tee logs/trained_humaneval_$(date +%Y%m%d_%H%M%S).log
+
+echo "=== Trained 测试完成 ==="
+```
+
+---
+
+## 3. 查看结果
+
+### 日志文件位置
+所有日志保存在:`/workspace/hanrui/SpecForge-ext/logs/`
+- `baseline_mtbench_*.log`
+- `baseline_gsm8k_*.log`
+- `baseline_humaneval_*.log`
+- `trained_mtbench_*.log`
+- `trained_gsm8k_*.log`
+- `trained_humaneval_*.log`
+
+所有结果保存在:`/workspace/hanrui/SpecForge-ext/results/`
+- `baseline_mtbench_*.jsonl`
+- `baseline_gsm8k_*.jsonl`
+- `baseline_humaneval_*.jsonl`
+- `trained_mtbench_*.jsonl`
+- `trained_gsm8k_*.jsonl`
+- `trained_humaneval_*.jsonl`
+
+### 生成对比报告
+```bash
+cd /workspace/hanrui/SpecForge-ext
+
+python3 << 'EOF'
+import json
+import glob
+
+print("=" * 80)
+print("Accept Length 对比报告")
+print("=" * 80)
+
+datasets = ['mtbench', 'gsm8k', 'humaneval']
+
+for dataset in datasets:
+ print(f"\n{'=' * 80}")
+ print(f"{dataset.upper()} 结果对比")
+ print('=' * 80)
+
+ baseline_files = sorted(glob.glob(f'results/baseline_{dataset}_*.jsonl'))
+ trained_files = sorted(glob.glob(f'results/trained_{dataset}_*.jsonl'))
+
+ if not baseline_files or not trained_files:
+ print(f" 未找到 {dataset} 的结果文件")
+ continue
+
+ with open(baseline_files[-1], 'r') as f:
+ baseline = json.load(f)
+
+ with open(trained_files[-1], 'r') as f:
+ trained = json.load(f)
+
+ baseline_metrics = baseline[dataset][0]['metrics'][0]
+ trained_metrics = trained[dataset][0]['metrics'][0]
+
+ print(f"\nBaseline:")
+ print(f" Accept Length: {baseline_metrics['accept_length']:.4f}")
+ print(f" Output Throughput: {baseline_metrics['output_throughput']:.2f} tokens/s")
+ if 'accuracy' in baseline_metrics and baseline_metrics['accuracy'] is not None:
+ print(f" Accuracy: {baseline_metrics['accuracy']:.2%}")
+
+ print(f"\nTrained:")
+ print(f" Accept Length: {trained_metrics['accept_length']:.4f}")
+ print(f" Output Throughput: {trained_metrics['output_throughput']:.2f} tokens/s")
+ if 'accuracy' in trained_metrics and trained_metrics['accuracy'] is not None:
+ print(f" Accuracy: {trained_metrics['accuracy']:.2%}")
+
+ accept_diff = trained_metrics['accept_length'] - baseline_metrics['accept_length']
+ accept_pct = (accept_diff / baseline_metrics['accept_length']) * 100
+
+ throughput_diff = trained_metrics['output_throughput'] - baseline_metrics['output_throughput']
+ throughput_pct = (throughput_diff / baseline_metrics['output_throughput']) * 100
+
+ print(f"\n差异:")
+ print(f" Accept Length: {accept_diff:+.4f} ({accept_pct:+.2f}%)")
+ print(f" Throughput: {throughput_diff:+.2f} tokens/s ({throughput_pct:+.2f}%)")
+
+ if 'accuracy' in baseline_metrics and baseline_metrics['accuracy'] is not None:
+ acc_diff = trained_metrics['accuracy'] - baseline_metrics['accuracy']
+ acc_pct = acc_diff * 100
+ print(f" Accuracy: {acc_pct:+.2f} percentage points")
+
+print("\n" + "=" * 80)
+EOF
+```
+
+---
+
+## 4. 快速查看单个结果
+```bash
+cd /workspace/hanrui/SpecForge-ext
+
+# 查看 baseline 的 accept_length
+cat results/baseline_mtbench_*.jsonl | jq '.mtbench[0].metrics[0].accept_length'
+cat results/baseline_gsm8k_*.jsonl | jq '.gsm8k[0].metrics[0].accept_length'
+cat results/baseline_humaneval_*.jsonl | jq '.humaneval[0].metrics[0].accept_length'
+
+# 查看 trained 的 accept_length
+cat results/trained_mtbench_*.jsonl | jq '.mtbench[0].metrics[0].accept_length'
+cat results/trained_gsm8k_*.jsonl | jq '.gsm8k[0].metrics[0].accept_length'
+cat results/trained_humaneval_*.jsonl | jq '.humaneval[0].metrics[0].accept_length'
+```
diff --git a/SpecForge/.editorconfig b/SpecForge/.editorconfig
new file mode 100644
index 0000000000000000000000000000000000000000..030a7293dcb6294d1ac26f262c761a9ac0a91052
--- /dev/null
+++ b/SpecForge/.editorconfig
@@ -0,0 +1,25 @@
+# https://editorconfig.org/
+
+root = true
+
+[*]
+charset = utf-8
+end_of_line = lf
+indent_style = space
+indent_size = 4
+trim_trailing_whitespace = true
+insert_final_newline = true
+
+[*.{json,yaml,yml}]
+indent_size = 2
+
+[*.md]
+indent_size = 2
+x-soft-wrap-text = true
+
+[*.rst]
+indent_size = 4
+x-soft-wrap-text = true
+
+[Makefile]
+indent_style = tab
diff --git a/SpecForge/.isort.cfg b/SpecForge/.isort.cfg
new file mode 100644
index 0000000000000000000000000000000000000000..82a27d81c14cfbef583d39fe8a51bb635437b35e
--- /dev/null
+++ b/SpecForge/.isort.cfg
@@ -0,0 +1,3 @@
+[settings]
+profile=black
+known_first_party=sgl-eagle
diff --git a/SpecForge/.pre-commit-config.yaml b/SpecForge/.pre-commit-config.yaml
new file mode 100644
index 0000000000000000000000000000000000000000..8191551a215425aa3884516a770175af784bd097
--- /dev/null
+++ b/SpecForge/.pre-commit-config.yaml
@@ -0,0 +1,53 @@
+default_stages: [pre-commit, pre-push, manual]
+
+repos:
+ - repo: https://github.com/PyCQA/autoflake
+ rev: v2.3.1
+ hooks:
+ - id: autoflake
+ args: [--remove-all-unused-imports, --in-place]
+ - repo: https://github.com/pre-commit/pre-commit-hooks
+ rev: v5.0.0
+ hooks:
+ - id: check-symlinks
+ - id: destroyed-symlinks
+ - id: trailing-whitespace
+ - id: end-of-file-fixer
+ - id: check-yaml
+ args: [--allow-multiple-documents]
+ - id: check-toml
+ - id: check-ast
+ - id: check-added-large-files
+ - id: check-merge-conflict
+ - id: check-shebang-scripts-are-executable
+ - id: detect-private-key
+ - id: debug-statements
+ - id: no-commit-to-branch
+ - repo: https://github.com/PyCQA/isort
+ rev: 5.13.2
+ hooks:
+ - id: isort
+ - repo: https://github.com/astral-sh/ruff-pre-commit
+ rev: v0.11.10
+ hooks:
+ - id: ruff
+ args: [--select=F401, --fixable=F401]
+ files: ^(benchmark/|docs/|examples/)
+ exclude: \.ipynb$
+ - repo: https://github.com/psf/black
+ rev: 24.10.0
+ hooks:
+ - id: black-jupyter
+ - repo: https://github.com/pre-commit/mirrors-clang-format
+ rev: v18.1.8
+ hooks:
+ - id: clang-format
+ types_or: [c++, cuda]
+ args: [--style=file, --verbose]
+ - repo: https://github.com/kynan/nbstripout
+ rev: 0.8.1
+ hooks:
+ - id: nbstripout
+ args:
+ - '--keep-output'
+ - '--extra-keys=metadata.kernelspec metadata.language_info.version'
diff --git a/SpecForge/LICENSE b/SpecForge/LICENSE
new file mode 100644
index 0000000000000000000000000000000000000000..909b8ff34ce3ff391ec5ecd1d2388d0c5b1cd4b3
--- /dev/null
+++ b/SpecForge/LICENSE
@@ -0,0 +1,21 @@
+MIT License
+
+Copyright (c) 2025 sgl-project
+
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.
diff --git a/SpecForge/MANIFEST.in b/SpecForge/MANIFEST.in
new file mode 100644
index 0000000000000000000000000000000000000000..7e3c8f05614505dc88691fa12babee86f8d1995e
--- /dev/null
+++ b/SpecForge/MANIFEST.in
@@ -0,0 +1,2 @@
+include requirements.txt
+include version.txt
diff --git a/SpecForge/README.md b/SpecForge/README.md
new file mode 100644
index 0000000000000000000000000000000000000000..141963e25880130165ca60532f9f0b4292adea41
--- /dev/null
+++ b/SpecForge/README.md
@@ -0,0 +1,70 @@
+
+

+
+[](https://docs.sglang.ai/SpecForge/)
+[](https://huggingface.co/collections/lmsys/specbundle)
+[](https://deepwiki.com/sgl-project/SpecForge)
+
+[](https://lmsys.org/blog/2025-07-25-spec-forge/)
+[](https://sgl-fru7574.slack.com/archives/C09784E3EN6)
+[](./LICENSE)
+
+
+
+## 📍 Overview
+
+SpecForge is an ecosystem project developed by the SGLang team. It is a framework for training speculative decoding models so that you can smoothly port them over to the SGLang serving framework to speed up your inference.
+
+We have seen many open-source projects for speculative decoding, but most of them are not well-maintained or not directly compatible with SGLang. We prepared this project because we wish that the open-source community can enjoy a speculative decoding framework that is
+- regularly maintained by the SpecForge team: the code is runnable out of the box
+- directly compatible with SGLang: no additional effort is needed to port models to SGLang
+- performant in training: we provide online/offline/tensor-parallel/FSDP training to suit your needs
+
+
+Check out [**our documentation**](https://docs.sglang.ai/SpecForge/) to get started.
+
+
+## 🚀 Accelerate with SpecBundle
+
+SpecBundle is a collection of production-grade speculative decoding models released by the SpecForge team and our industry partners. They provide a higher acceptance rate than existing open-source checkpoints across a wide range of domains. Together with SGLang, you can experience up to 4x speedup for inference. Check out our resources below:
+
+
+| Item | Link |
+| --- | --- |
+| 📝 Documentation | [Link](https://docs.sglang.io/SpecForge/community_resources/specbundle.html) |
+| 📊 Performance Dashboard | [Link](https://docs.sglang.io/SpecForge/SpecBundle/index.html) |
+| 🤗 Hugging Face Collection | [Link](https://huggingface.co/collections/lmsys/specbundle) |
+
+
+## 🎉 News
+
+- [2025-12] 🎉 Released SpecBundle (phase 1) and SpecForge v0.2. Check out our blog at [LMSYS.org](https://lmsys.org/blog/2025-12-23-spec-bundle-phase-1/)
+- [2025-12] 🔔 Released the roadmap for 2026 Q1.
+- [2025-08] 🔔 SpecForge is listed as a [flagship project](https://lmsys.org/about/) in LMSYS. Congratulations to the SpecForge team!
+- [2025-08] 🔥 SpecForge powered the Eagle3 draft model for GPT-OSS. Check out the blog at [LMSYS.org](https://lmsys.org/blog/2025-08-27-gpt-oss/)
+- [2025-07] 🔥 SpecForge is released together with Llama4-Eagle3 checkpoints. Check out our blog at [LMSYS.org](https://lmsys.org/blog/2025-07-25-spec-forge/)
+
+## ✨ Acknowledgements
+
+
+
+We would like to express our sincere gratitude to the official EAGLE team, especially Hongyang Zhang and Yuhui Li, for their invaluable contributions and support. Our thanks also go to the NVIDIA team—particularly Avery H and Izzy Putterman—and to the Google team, especially Ying Wang, for their insightful discussions and generous assistance throughout the project.
+
+We are especially grateful to Meituan for their strong backing and meaningful contributions, which played a vital role in driving this project forward.
+
+This project has also been inspired by many outstanding open-source projects from the LLM community, including [EAGLE](https://github.com/SafeAILab/EAGLE), [BaldEagle](https://github.com/NickL77/BaldEagle), [TensorRT-Model-Optimizer](https://github.com/NVIDIA/TensorRT-Model-Optimizer), and others. Their contributions and shared knowledge have greatly benefited our work.
+
+## 💡 Special Thanks to Voltage Park
+
+We would like to extend our sincere thanks to [Voltage Park](https://www.voltagepark.com/), our official infrastructure partner. As part of a formal collaboration with the SGLang team, Voltage Park provided critical GPU resources that empowered us to train and evaluate large-scale speculative decoding models efficiently and reliably. This partnership was instrumental in making SpecForge possible. We deeply appreciate Voltage Park’s mission to make cutting-edge AI infrastructure more accessible, and we look forward to continued collaboration as we push the boundaries of open-source LLM serving and optimization.
+
+## 📃 Citation
+
+```bibtex
+@misc{specforge2025,
+ title={SpecForge: Train speculative decoding models effortlessly},
+ author={Shenggui Li and Yikai Zhu and Chao Wang and Fan Yin and Shuai Shi and Yubo Wang and Yi Zhang and Yingyi Huang and Haoshuai Zheng and Yineng Zhang},
+ year={2025},
+ publisher={GitHub},
+ howpublished={\url{https://github.com/sgl-project/specforge}},
+}
diff --git a/SpecForge/pyproject.toml b/SpecForge/pyproject.toml
new file mode 100644
index 0000000000000000000000000000000000000000..4698a5e811892b633345a09ba8c261fd67a1b10d
--- /dev/null
+++ b/SpecForge/pyproject.toml
@@ -0,0 +1,47 @@
+[build-system]
+requires = ["setuptools>=61.0", "wheel"]
+build-backend = "setuptools.build_meta"
+
+[project]
+name = "specforge"
+dynamic = ["version"]
+readme = "README.md"
+requires-python = ">=3.11"
+description = "SpecForge: Speculative Decoding Training Framework"
+authors = [{name = "SGLang Team"}]
+urls = {Homepage = "https://github.com/sgl-project/SpecForge"}
+dependencies = [
+ "pre-commit",
+ "torch==2.9.1",
+ "torchaudio==2.9.1",
+ "torchvision==0.24.1",
+ "transformers==4.57.1",
+ "qwen-vl-utils==0.0.11",
+ "datasets",
+ "setuptools",
+ "tqdm",
+ "wandb",
+ "psutil",
+ "numpy",
+ "accelerate",
+ "pydantic",
+ "sglang==0.5.9",
+ "openai-harmony",
+ "ninja",
+ "packaging",
+ "yunchang",
+ "tensorboard",
+]
+
+[tool.setuptools.packages.find]
+exclude = ["configs*", "scripts*", "tests*"]
+
+[project.optional-dependencies]
+dev = [
+ "pre-commit",
+ "unittest"
+]
+fa = ["flash-attn"]
+
+[tool.setuptools.dynamic]
+version = {file = "version.txt"}
diff --git a/SpecForge/requirements-rocm.txt b/SpecForge/requirements-rocm.txt
new file mode 100644
index 0000000000000000000000000000000000000000..a7c314563749906b77582bf1234da54c63746a0c
--- /dev/null
+++ b/SpecForge/requirements-rocm.txt
@@ -0,0 +1,20 @@
+# Use the PyTorch ROCm wheel index (choose the stream that matches your system)
+--extra-index-url https://download.pytorch.org/whl/rocm6.3
+
+pre-commit
+torch==2.8.0+rocm6.3
+torchaudio==2.8.0+rocm6.3
+torchvision==0.23.0+rocm6.3
+transformers==4.57.1
+qwen-vl-utils==0.0.11
+datasets
+setuptools
+tqdm
+wandb
+psutil
+numpy
+accelerate
+pydantic
+sglang[all]==0.5.4
+openai-harmony
+tensorboard
diff --git a/SpecForge/version.txt b/SpecForge/version.txt
new file mode 100644
index 0000000000000000000000000000000000000000..0ea3a944b399d25f7e1b8fe684d754eb8da9fe7f
--- /dev/null
+++ b/SpecForge/version.txt
@@ -0,0 +1 @@
+0.2.0
diff --git a/idea1/.editorconfig b/idea1/.editorconfig
new file mode 100644
index 0000000000000000000000000000000000000000..030a7293dcb6294d1ac26f262c761a9ac0a91052
--- /dev/null
+++ b/idea1/.editorconfig
@@ -0,0 +1,25 @@
+# https://editorconfig.org/
+
+root = true
+
+[*]
+charset = utf-8
+end_of_line = lf
+indent_style = space
+indent_size = 4
+trim_trailing_whitespace = true
+insert_final_newline = true
+
+[*.{json,yaml,yml}]
+indent_size = 2
+
+[*.md]
+indent_size = 2
+x-soft-wrap-text = true
+
+[*.rst]
+indent_size = 4
+x-soft-wrap-text = true
+
+[Makefile]
+indent_style = tab
diff --git a/idea1/.isort.cfg b/idea1/.isort.cfg
new file mode 100644
index 0000000000000000000000000000000000000000..82a27d81c14cfbef583d39fe8a51bb635437b35e
--- /dev/null
+++ b/idea1/.isort.cfg
@@ -0,0 +1,3 @@
+[settings]
+profile=black
+known_first_party=sgl-eagle
diff --git a/idea1/.pre-commit-config.yaml b/idea1/.pre-commit-config.yaml
new file mode 100644
index 0000000000000000000000000000000000000000..8191551a215425aa3884516a770175af784bd097
--- /dev/null
+++ b/idea1/.pre-commit-config.yaml
@@ -0,0 +1,53 @@
+default_stages: [pre-commit, pre-push, manual]
+
+repos:
+ - repo: https://github.com/PyCQA/autoflake
+ rev: v2.3.1
+ hooks:
+ - id: autoflake
+ args: [--remove-all-unused-imports, --in-place]
+ - repo: https://github.com/pre-commit/pre-commit-hooks
+ rev: v5.0.0
+ hooks:
+ - id: check-symlinks
+ - id: destroyed-symlinks
+ - id: trailing-whitespace
+ - id: end-of-file-fixer
+ - id: check-yaml
+ args: [--allow-multiple-documents]
+ - id: check-toml
+ - id: check-ast
+ - id: check-added-large-files
+ - id: check-merge-conflict
+ - id: check-shebang-scripts-are-executable
+ - id: detect-private-key
+ - id: debug-statements
+ - id: no-commit-to-branch
+ - repo: https://github.com/PyCQA/isort
+ rev: 5.13.2
+ hooks:
+ - id: isort
+ - repo: https://github.com/astral-sh/ruff-pre-commit
+ rev: v0.11.10
+ hooks:
+ - id: ruff
+ args: [--select=F401, --fixable=F401]
+ files: ^(benchmark/|docs/|examples/)
+ exclude: \.ipynb$
+ - repo: https://github.com/psf/black
+ rev: 24.10.0
+ hooks:
+ - id: black-jupyter
+ - repo: https://github.com/pre-commit/mirrors-clang-format
+ rev: v18.1.8
+ hooks:
+ - id: clang-format
+ types_or: [c++, cuda]
+ args: [--style=file, --verbose]
+ - repo: https://github.com/kynan/nbstripout
+ rev: 0.8.1
+ hooks:
+ - id: nbstripout
+ args:
+ - '--keep-output'
+ - '--extra-keys=metadata.kernelspec metadata.language_info.version'
diff --git a/idea1/LICENSE b/idea1/LICENSE
new file mode 100644
index 0000000000000000000000000000000000000000..909b8ff34ce3ff391ec5ecd1d2388d0c5b1cd4b3
--- /dev/null
+++ b/idea1/LICENSE
@@ -0,0 +1,21 @@
+MIT License
+
+Copyright (c) 2025 sgl-project
+
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.
diff --git a/idea1/requirements-rocm.txt b/idea1/requirements-rocm.txt
new file mode 100644
index 0000000000000000000000000000000000000000..a7c314563749906b77582bf1234da54c63746a0c
--- /dev/null
+++ b/idea1/requirements-rocm.txt
@@ -0,0 +1,20 @@
+# Use the PyTorch ROCm wheel index (choose the stream that matches your system)
+--extra-index-url https://download.pytorch.org/whl/rocm6.3
+
+pre-commit
+torch==2.8.0+rocm6.3
+torchaudio==2.8.0+rocm6.3
+torchvision==0.23.0+rocm6.3
+transformers==4.57.1
+qwen-vl-utils==0.0.11
+datasets
+setuptools
+tqdm
+wandb
+psutil
+numpy
+accelerate
+pydantic
+sglang[all]==0.5.4
+openai-harmony
+tensorboard
diff --git a/idea1/version.txt b/idea1/version.txt
new file mode 100644
index 0000000000000000000000000000000000000000..0ea3a944b399d25f7e1b8fe684d754eb8da9fe7f
--- /dev/null
+++ b/idea1/version.txt
@@ -0,0 +1 @@
+0.2.0
diff --git a/qwen3-8b_dflash_regen/.gitattributes b/qwen3-8b_dflash_regen/.gitattributes
new file mode 100644
index 0000000000000000000000000000000000000000..081686e03bf2eb3fac835595456cb5b2767629ba
--- /dev/null
+++ b/qwen3-8b_dflash_regen/.gitattributes
@@ -0,0 +1,36 @@
+*.7z filter=lfs diff=lfs merge=lfs -text
+*.arrow filter=lfs diff=lfs merge=lfs -text
+*.bin filter=lfs diff=lfs merge=lfs -text
+*.bz2 filter=lfs diff=lfs merge=lfs -text
+*.ckpt filter=lfs diff=lfs merge=lfs -text
+*.ftz filter=lfs diff=lfs merge=lfs -text
+*.gz filter=lfs diff=lfs merge=lfs -text
+*.h5 filter=lfs diff=lfs merge=lfs -text
+*.joblib filter=lfs diff=lfs merge=lfs -text
+*.lfs.* filter=lfs diff=lfs merge=lfs -text
+*.mlmodel filter=lfs diff=lfs merge=lfs -text
+*.model filter=lfs diff=lfs merge=lfs -text
+*.msgpack filter=lfs diff=lfs merge=lfs -text
+*.npy filter=lfs diff=lfs merge=lfs -text
+*.npz filter=lfs diff=lfs merge=lfs -text
+*.onnx filter=lfs diff=lfs merge=lfs -text
+*.ot filter=lfs diff=lfs merge=lfs -text
+*.parquet filter=lfs diff=lfs merge=lfs -text
+*.pb filter=lfs diff=lfs merge=lfs -text
+*.pickle filter=lfs diff=lfs merge=lfs -text
+*.pkl filter=lfs diff=lfs merge=lfs -text
+*.pt filter=lfs diff=lfs merge=lfs -text
+*.pth filter=lfs diff=lfs merge=lfs -text
+*.rar filter=lfs diff=lfs merge=lfs -text
+*.safetensors filter=lfs diff=lfs merge=lfs -text
+saved_model/**/* filter=lfs diff=lfs merge=lfs -text
+*.tar.* filter=lfs diff=lfs merge=lfs -text
+*.tar filter=lfs diff=lfs merge=lfs -text
+*.tflite filter=lfs diff=lfs merge=lfs -text
+*.tgz filter=lfs diff=lfs merge=lfs -text
+*.wasm filter=lfs diff=lfs merge=lfs -text
+*.xz filter=lfs diff=lfs merge=lfs -text
+*.zip filter=lfs diff=lfs merge=lfs -text
+*.zst filter=lfs diff=lfs merge=lfs -text
+*tfevents* filter=lfs diff=lfs merge=lfs -text
+sharegpt_train_regenerated.jsonl filter=lfs diff=lfs merge=lfs -text
diff --git a/syxin/backup.log b/syxin/backup.log
new file mode 100644
index 0000000000000000000000000000000000000000..666c89db56ad3169235f3d15e90984a1045430c7
--- /dev/null
+++ b/syxin/backup.log
@@ -0,0 +1,7662 @@
+nohup: ignoring input
+
+*****************************************
+Setting OMP_NUM_THREADS environment variable for each process to be 1 in default, to avoid your system being overloaded, please further tune the variable for optimal performance in your application as needed.
+*****************************************
+Set TORCH_CUDA_ARCH_LIST to 9.0
+Set TORCH_CUDA_ARCH_LIST to 9.0
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+Set TORCH_CUDA_ARCH_LIST to 9.0
+Set TORCH_CUDA_ARCH_LIST to 9.0
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+Set TORCH_CUDA_ARCH_LIST to 9.0
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+Set TORCH_CUDA_ARCH_LIST to 9.0
+Set TORCH_CUDA_ARCH_LIST to 9.0
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+Set TORCH_CUDA_ARCH_LIST to 9.0
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+`torch_dtype` is deprecated! Use `dtype` instead!
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+`torch_dtype` is deprecated! Use `dtype` instead!
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+
+Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
+Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]`torch_dtype` is deprecated! Use `dtype` instead!
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+`torch_dtype` is deprecated! Use `dtype` instead!
+`torch_dtype` is deprecated! Use `dtype` instead!
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+`torch_dtype` is deprecated! Use `dtype` instead!
+`torch_dtype` is deprecated! Use `dtype` instead!
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+`torch_dtype` is deprecated! Use `dtype` instead!
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+
+Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
+Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
+Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
+Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
+Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
+Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
+Loading checkpoint shards: 20%|██ | 1/5 [00:12<00:50, 12.57s/it]
+Loading checkpoint shards: 20%|██ | 1/5 [00:11<00:47, 11.97s/it]
+Loading checkpoint shards: 20%|██ | 1/5 [00:11<00:47, 11.98s/it]
+Loading checkpoint shards: 20%|██ | 1/5 [00:11<00:47, 11.97s/it]
+Loading checkpoint shards: 20%|██ | 1/5 [00:11<00:47, 11.98s/it]
+Loading checkpoint shards: 20%|██ | 1/5 [00:11<00:47, 12.00s/it]
+Loading checkpoint shards: 20%|██ | 1/5 [00:12<00:50, 12.59s/it]
+Loading checkpoint shards: 20%|██ | 1/5 [00:12<00:48, 12.05s/it]
+Loading checkpoint shards: 40%|████ | 2/5 [00:25<00:37, 12.63s/it]
+Loading checkpoint shards: 40%|████ | 2/5 [00:24<00:37, 12.43s/it]
+Loading checkpoint shards: 40%|████ | 2/5 [00:24<00:37, 12.42s/it]
+Loading checkpoint shards: 40%|████ | 2/5 [00:24<00:37, 12.42s/it]
+Loading checkpoint shards: 40%|████ | 2/5 [00:25<00:38, 12.67s/it]
+Loading checkpoint shards: 40%|████ | 2/5 [00:24<00:37, 12.42s/it]
+Loading checkpoint shards: 40%|████ | 2/5 [00:24<00:37, 12.45s/it]
+Loading checkpoint shards: 40%|████ | 2/5 [00:24<00:37, 12.42s/it]
+Loading checkpoint shards: 60%|██████ | 3/5 [00:38<00:25, 12.74s/it]
+Loading checkpoint shards: 60%|██████ | 3/5 [00:37<00:25, 12.61s/it]
+Loading checkpoint shards: 60%|██████ | 3/5 [00:37<00:25, 12.61s/it]
+Loading checkpoint shards: 60%|██████ | 3/5 [00:37<00:25, 12.62s/it]
+Loading checkpoint shards: 60%|██████ | 3/5 [00:37<00:25, 12.62s/it]
+Loading checkpoint shards: 60%|██████ | 3/5 [00:37<00:25, 12.61s/it]
+Loading checkpoint shards: 60%|██████ | 3/5 [00:38<00:25, 12.75s/it]
+Loading checkpoint shards: 60%|██████ | 3/5 [00:37<00:25, 12.63s/it]
+Loading checkpoint shards: 80%|████████ | 4/5 [00:48<00:11, 11.76s/it]
+Loading checkpoint shards: 80%|████████ | 4/5 [00:47<00:11, 11.70s/it]
+Loading checkpoint shards: 80%|████████ | 4/5 [00:47<00:11, 11.70s/it]
+Loading checkpoint shards: 80%|████████ | 4/5 [00:47<00:11, 11.70s/it]
+Loading checkpoint shards: 80%|████████ | 4/5 [00:47<00:11, 11.70s/it]
+Loading checkpoint shards: 80%|████████ | 4/5 [00:47<00:11, 11.69s/it]
+Loading checkpoint shards: 80%|████████ | 4/5 [00:48<00:11, 11.78s/it]
+Loading checkpoint shards: 80%|████████ | 4/5 [00:47<00:11, 11.70s/it]
+Loading checkpoint shards: 100%|██████████| 5/5 [00:51<00:00, 8.82s/it]
+Loading checkpoint shards: 100%|██████████| 5/5 [00:51<00:00, 10.31s/it]
+
+Loading checkpoint shards: 100%|██████████| 5/5 [00:52<00:00, 8.90s/it]
+Loading checkpoint shards: 100%|██████████| 5/5 [00:51<00:00, 8.84s/it]
+Loading checkpoint shards: 100%|██████████| 5/5 [00:51<00:00, 8.84s/it]
+Loading checkpoint shards: 100%|██████████| 5/5 [00:51<00:00, 8.84s/it]
+Loading checkpoint shards: 100%|██████████| 5/5 [00:52<00:00, 8.89s/it]
+Loading checkpoint shards: 100%|██████████| 5/5 [00:51<00:00, 8.84s/it]
+Loading checkpoint shards: 100%|██████████| 5/5 [00:52<00:00, 10.44s/it]
+Loading checkpoint shards: 100%|██████████| 5/5 [00:51<00:00, 8.84s/it]
+
+Loading checkpoint shards: 100%|██████████| 5/5 [00:51<00:00, 10.33s/it]
+
+Loading checkpoint shards: 100%|██████████| 5/5 [00:51<00:00, 10.32s/it]
+Loading checkpoint shards: 100%|██████████| 5/5 [00:51<00:00, 10.32s/it]
+
+
+Loading checkpoint shards: 100%|██████████| 5/5 [00:52<00:00, 10.44s/it]
+Loading checkpoint shards: 100%|██████████| 5/5 [00:51<00:00, 10.32s/it]
+
+
+Loading checkpoint shards: 100%|██████████| 5/5 [00:51<00:00, 10.32s/it]
+
+Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
+Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
+Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
+Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
+Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
+Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
+Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
+Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
+Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 136.62it/s]
+
+Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 139.20it/s]
+
+Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 139.74it/s]
+
+Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 141.23it/s]
+
+Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 139.49it/s]
+Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 138.47it/s]
+
+
+Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 139.71it/s]
+
+Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 139.10it/s]
+trainable params: 15,335,424 || all params: 8,206,070,784 || trainable%: 0.1869
+
+Generating train split: 0%| | 0/818627 [00:00, ? examples/s]trainable params: 15,335,424 || all params: 8,206,070,784 || trainable%: 0.1869
+
+Generating train split: 0%| | 0/818627 [00:00, ? examples/s]trainable params: 15,335,424 || all params: 8,206,070,784 || trainable%: 0.1869
+
+Generating train split: 3%|▎ | 21099/818627 [00:00<00:27, 28642.65 examples/s]
+Generating train split: 0%| | 0/818627 [00:00, ? examples/s]
+Generating train split: 3%|▎ | 21099/818627 [00:00<00:24, 32437.64 examples/s]
+Generating train split: 5%|▌ | 42198/818627 [00:01<00:17, 43203.50 examples/s]trainable params: 15,335,424 || all params: 8,206,070,784 || trainable%: 0.1869
+trainable params: 15,335,424 || all params: 8,206,070,784 || trainable%: 0.1869
+trainable params: 15,335,424 || all params: 8,206,070,784 || trainable%: 0.1869
+trainable params: 15,335,424 || all params: 8,206,070,784 || trainable%: 0.1869
+trainable params: 15,335,424 || all params: 8,206,070,784 || trainable%: 0.1869
+
+Generating train split: 5%|▌ | 42198/818627 [00:00<00:16, 46441.93 examples/s]
+Generating train split: 0%| | 0/818627 [00:00, ? examples/s]
+Generating train split: 0%| | 0/818627 [00:00, ? examples/s]
+Generating train split: 8%|▊ | 63297/818627 [00:01<00:14, 53420.62 examples/s]
+Generating train split: 3%|▎ | 21099/818627 [00:00<00:24, 32967.65 examples/s]
+Generating train split: 8%|▊ | 63297/818627 [00:01<00:13, 54634.76 examples/s]
+Generating train split: 10%|█ | 84396/818627 [00:01<00:11, 61997.69 examples/s]
+Generating train split: 5%|▌ | 42198/818627 [00:00<00:16, 46585.66 examples/s]
+Generating train split: 3%|▎ | 21099/818627 [00:00<00:23, 34048.65 examples/s]
+Generating train split: 10%|█ | 84396/818627 [00:01<00:12, 58304.23 examples/s]
+Generating train split: 3%|▎ | 21099/818627 [00:00<00:23, 33469.06 examples/s]
+Generating train split: 8%|▊ | 63297/818627 [00:01<00:15, 50220.06 examples/s]
+Generating train split: 5%|▌ | 42198/818627 [00:00<00:16, 47991.59 examples/s]
+Generating train split: 5%|▌ | 42198/818627 [00:00<00:16, 47153.91 examples/s]
+Generating train split: 10%|█ | 84396/818627 [00:01<00:11, 65480.25 examples/s]
+Generating train split: 15%|█▌ | 123428/818627 [00:02<00:11, 58219.77 examples/s]
+Generating train split: 8%|▊ | 63297/818627 [00:01<00:13, 57421.86 examples/s]
+Generating train split: 8%|▊ | 63297/818627 [00:01<00:13, 56721.10 examples/s]
+Generating train split: 15%|█▌ | 123428/818627 [00:02<00:12, 57511.89 examples/s]
+Generating train split: 18%|█▊ | 144527/818627 [00:02<00:11, 60887.68 examples/s]
+Generating train split: 10%|█ | 84396/818627 [00:01<00:11, 65458.92 examples/s]
+Generating train split: 10%|█ | 84396/818627 [00:01<00:11, 64788.09 examples/s]
+Generating train split: 18%|█▊ | 144527/818627 [00:02<00:11, 60142.43 examples/s]
+Generating train split: 20%|██ | 165626/818627 [00:02<00:10, 65280.53 examples/s]
+Generating train split: 15%|█▌ | 123428/818627 [00:02<00:11, 60388.39 examples/s]
+Generating train split: 20%|██ | 165626/818627 [00:02<00:10, 64449.78 examples/s]
+Generating train split: 23%|██▎ | 186725/818627 [00:03<00:09, 69990.38 examples/s]
+Generating train split: 18%|█▊ | 144527/818627 [00:02<00:10, 62317.24 examples/s]
+Generating train split: 23%|██▎ | 186725/818627 [00:03<00:09, 69284.97 examples/s]
+Generating train split: 15%|█▌ | 123428/818627 [00:02<00:11, 61077.88 examples/s]
+Generating train split: 15%|█▌ | 123428/818627 [00:02<00:11, 60902.56 examples/s]
+Generating train split: 20%|██ | 165626/818627 [00:02<00:09, 66154.30 examples/s]
+Generating train split: 18%|█▊ | 144527/818627 [00:02<00:10, 62352.23 examples/s]
+Generating train split: 18%|█▊ | 144527/818627 [00:02<00:10, 61839.93 examples/s]
+Generating train split: 23%|██▎ | 186725/818627 [00:03<00:09, 70077.32 examples/s]
+Generating train split: 28%|██▊ | 225757/818627 [00:03<00:09, 62858.04 examples/s]
+Generating train split: 20%|██ | 165626/818627 [00:02<00:09, 65583.41 examples/s]
+Generating train split: 20%|██ | 165626/818627 [00:02<00:09, 65417.41 examples/s]
+Generating train split: 28%|██▊ | 225757/818627 [00:03<00:09, 64225.82 examples/s]
+Generating train split: 30%|███ | 246856/818627 [00:04<00:08, 64561.88 examples/s]
+Generating train split: 23%|██▎ | 186725/818627 [00:03<00:09, 70142.51 examples/s]
+Generating train split: 23%|██▎ | 186725/818627 [00:03<00:09, 69176.42 examples/s]
+Generating train split: 30%|███ | 246856/818627 [00:04<00:08, 65555.50 examples/s]
+Generating train split: 33%|███▎ | 267955/818627 [00:04<00:08, 67305.53 examples/s]
+Generating train split: 28%|██▊ | 225757/818627 [00:03<00:09, 63233.89 examples/s]
+Generating train split: 33%|███▎ | 267955/818627 [00:04<00:08, 67916.81 examples/s]
+Generating train split: 35%|███▌ | 289054/818627 [00:04<00:07, 71473.59 examples/s]
+Generating train split: 30%|███ | 246856/818627 [00:04<00:09, 63162.25 examples/s]
+Generating train split: 35%|███▌ | 289054/818627 [00:04<00:07, 71802.17 examples/s]
+Generating train split: 28%|██▊ | 225757/818627 [00:03<00:09, 61825.74 examples/s]
+Generating train split: 28%|██▊ | 225757/818627 [00:03<00:09, 62065.21 examples/s]
+Generating train split: 33%|███▎ | 267955/818627 [00:04<00:08, 66650.43 examples/s]
+Generating train split: 30%|███ | 246856/818627 [00:04<00:08, 63897.98 examples/s]
+Generating train split: 30%|███ | 246856/818627 [00:04<00:09, 63256.35 examples/s]
+Generating train split: 35%|███▌ | 289054/818627 [00:04<00:07, 70639.47 examples/s]
+Generating train split: 40%|████ | 328086/818627 [00:05<00:08, 59694.45 examples/s]
+Generating train split: 33%|███▎ | 267955/818627 [00:04<00:08, 68049.17 examples/s]
+Generating train split: 33%|███▎ | 267955/818627 [00:04<00:08, 65996.26 examples/s]
+Generating train split: 40%|████ | 328086/818627 [00:05<00:07, 62818.26 examples/s]
+Generating train split: 43%|████▎ | 349185/818627 [00:05<00:07, 63665.21 examples/s]
+Generating train split: 35%|███▌ | 289054/818627 [00:04<00:07, 71375.43 examples/s]
+Generating train split: 35%|███▌ | 289054/818627 [00:04<00:07, 69846.46 examples/s]
+Generating train split: 43%|████▎ | 349185/818627 [00:05<00:07, 66522.73 examples/s]
+Generating train split: 45%|████▌ | 370284/818627 [00:05<00:06, 67158.43 examples/s]
+Generating train split: 40%|████ | 328086/818627 [00:05<00:07, 61663.76 examples/s]
+Generating train split: 45%|████▌ | 370284/818627 [00:05<00:06, 68730.74 examples/s]
+Generating train split: 48%|████▊ | 391383/818627 [00:06<00:05, 73462.06 examples/s]
+Generating train split: 48%|████▊ | 391383/818627 [00:06<00:05, 74959.35 examples/s]
+Generating train split: 43%|████▎ | 349185/818627 [00:05<00:07, 66194.82 examples/s]
+Generating train split: 40%|████ | 328086/818627 [00:05<00:07, 62600.86 examples/s]
+Generating train split: 40%|████ | 328086/818627 [00:05<00:07, 61679.84 examples/s]
+Generating train split: 45%|████▌ | 370284/818627 [00:05<00:06, 68990.65 examples/s]
+Generating train split: 43%|████▎ | 349185/818627 [00:05<00:07, 65230.62 examples/s]
+Generating train split: 43%|████▎ | 349185/818627 [00:05<00:07, 64356.24 examples/s]
+Generating train split: 48%|████▊ | 391383/818627 [00:06<00:05, 75442.35 examples/s]
+Generating train split: 53%|█████▎ | 430414/818627 [00:06<00:06, 64347.20 examples/s]
+Generating train split: 53%|█████▎ | 430414/818627 [00:06<00:05, 65975.14 examples/s]
+Generating train split: 45%|████▌ | 370284/818627 [00:05<00:06, 68253.89 examples/s]
+Generating train split: 45%|████▌ | 370284/818627 [00:05<00:06, 65411.70 examples/s]
+Generating train split: 55%|█████▌ | 451513/818627 [00:07<00:05, 67368.91 examples/s]
+Generating train split: 48%|████▊ | 391383/818627 [00:06<00:05, 74342.13 examples/s]
+Generating train split: 55%|█████▌ | 451513/818627 [00:07<00:05, 69951.65 examples/s]
+Generating train split: 48%|████▊ | 391383/818627 [00:06<00:05, 74030.92 examples/s]
+Generating train split: 53%|█████▎ | 430414/818627 [00:06<00:05, 66269.06 examples/s]
+Generating train split: 58%|█████▊ | 472612/818627 [00:07<00:05, 65268.41 examples/s]
+Generating train split: 58%|█████▊ | 472612/818627 [00:07<00:05, 68571.19 examples/s]
+Generating train split: 60%|██████ | 493711/818627 [00:07<00:04, 72470.35 examples/s]
+Generating train split: 55%|█████▌ | 451513/818627 [00:07<00:05, 68820.99 examples/s]
+Generating train split: 60%|██████ | 493711/818627 [00:07<00:04, 74376.12 examples/s]
+Generating train split: 53%|█████▎ | 430414/818627 [00:06<00:05, 67285.76 examples/s]
+Generating train split: 53%|█████▎ | 430414/818627 [00:06<00:05, 65022.08 examples/s]
+Generating train split: 58%|█████▊ | 472612/818627 [00:07<00:05, 68161.01 examples/s]
+Generating train split: 55%|█████▌ | 451513/818627 [00:07<00:05, 69687.27 examples/s]
+Generating train split: 55%|█████▌ | 451513/818627 [00:07<00:05, 66592.79 examples/s]
+Generating train split: 60%|██████ | 493711/818627 [00:07<00:04, 74738.44 examples/s]
+Generating train split: 65%|██████▌ | 532742/818627 [00:08<00:04, 68865.74 examples/s]
+Generating train split: 65%|██████▌ | 532742/818627 [00:08<00:04, 63855.43 examples/s]
+Generating train split: 58%|█████▊ | 472612/818627 [00:07<00:05, 69053.45 examples/s]
+Generating train split: 58%|█████▊ | 472612/818627 [00:07<00:05, 65398.38 examples/s]
+Generating train split: 68%|██████▊ | 553841/818627 [00:08<00:03, 67812.48 examples/s]
+Generating train split: 68%|██████▊ | 553841/818627 [00:08<00:03, 69431.76 examples/s]
+Generating train split: 60%|██████ | 493711/818627 [00:07<00:04, 75425.11 examples/s]
+Generating train split: 60%|██████ | 493711/818627 [00:07<00:04, 72044.62 examples/s]
+Generating train split: 65%|██████▌ | 532742/818627 [00:08<00:04, 66979.07 examples/s]
+Generating train split: 70%|███████ | 574940/818627 [00:09<00:03, 67149.75 examples/s]
+Generating train split: 70%|███████ | 574940/818627 [00:08<00:03, 67799.19 examples/s]
+Generating train split: 73%|███████▎ | 596039/818627 [00:09<00:03, 73073.72 examples/s]
+Generating train split: 68%|██████▊ | 553841/818627 [00:08<00:03, 68482.42 examples/s]
+Generating train split: 73%|███████▎ | 596039/818627 [00:09<00:02, 75254.67 examples/s]
+Generating train split: 65%|██████▌ | 532742/818627 [00:08<00:04, 68666.27 examples/s]
+Generating train split: 65%|██████▌ | 532742/818627 [00:08<00:04, 66100.74 examples/s]
+Generating train split: 70%|███████ | 574940/818627 [00:08<00:03, 68428.28 examples/s]
+Generating train split: 68%|██████▊ | 553841/818627 [00:08<00:03, 69708.44 examples/s]
+Generating train split: 68%|██████▊ | 553841/818627 [00:08<00:03, 67817.47 examples/s]
+Generating train split: 73%|███████▎ | 596039/818627 [00:09<00:03, 73935.12 examples/s]
+Generating train split: 78%|███████▊ | 635070/818627 [00:09<00:02, 66435.93 examples/s]
+Generating train split: 78%|███████▊ | 635070/818627 [00:09<00:02, 63198.23 examples/s]
+Generating train split: 70%|███████ | 574940/818627 [00:08<00:03, 68979.27 examples/s]
+Generating train split: 70%|███████ | 574940/818627 [00:08<00:03, 67898.57 examples/s]
+Generating train split: 73%|███████▎ | 596039/818627 [00:08<00:02, 74564.59 examples/s]
+Generating train split: 80%|████████ | 656169/818627 [00:09<00:02, 67734.98 examples/s]
+Generating train split: 80%|████████ | 656169/818627 [00:10<00:02, 64757.05 examples/s]
+Generating train split: 73%|███████▎ | 596039/818627 [00:09<00:03, 73537.98 examples/s]
+Generating train split: 78%|███████▊ | 635070/818627 [00:09<00:02, 66071.16 examples/s]
+Generating train split: 83%|████████▎ | 677268/818627 [00:10<00:02, 67273.26 examples/s]
+Generating train split: 83%|████████▎ | 677268/818627 [00:10<00:02, 65517.69 examples/s]
+Generating train split: 80%|████████ | 656169/818627 [00:10<00:02, 67574.19 examples/s]
+Generating train split: 85%|████████▌ | 698367/818627 [00:10<00:01, 73974.80 examples/s]
+Generating train split: 85%|████████▌ | 698367/818627 [00:10<00:01, 71451.04 examples/s]
+Generating train split: 78%|███████▊ | 635070/818627 [00:09<00:02, 65227.26 examples/s]
+Generating train split: 78%|███████▊ | 635070/818627 [00:09<00:02, 66176.70 examples/s]
+Generating train split: 83%|████████▎ | 677268/818627 [00:10<00:02, 67538.50 examples/s]
+Generating train split: 80%|████████ | 656169/818627 [00:09<00:02, 66999.00 examples/s]
+Generating train split: 80%|████████ | 656169/818627 [00:10<00:02, 67728.37 examples/s]
+Generating train split: 85%|████████▌ | 698367/818627 [00:10<00:01, 73787.22 examples/s]
+Generating train split: 83%|████████▎ | 677268/818627 [00:10<00:02, 66419.94 examples/s]
+Generating train split: 90%|█████████ | 737398/818627 [00:11<00:01, 61148.54 examples/s]
+Generating train split: 90%|█████████ | 737398/818627 [00:11<00:01, 59237.86 examples/s]
+Generating train split: 83%|████████▎ | 677268/818627 [00:10<00:02, 65089.41 examples/s]
+Generating train split: 85%|████████▌ | 698367/818627 [00:10<00:01, 72956.83 examples/s]
+Generating train split: 85%|████████▌ | 698367/818627 [00:10<00:01, 73634.14 examples/s]
+Generating train split: 93%|█████████▎| 758497/818627 [00:11<00:00, 62597.70 examples/s]
+Generating train split: 93%|█████████▎| 758497/818627 [00:11<00:00, 60156.95 examples/s]
+Generating train split: 90%|█████████ | 737398/818627 [00:11<00:01, 61719.31 examples/s]
+Generating train split: 95%|█████████▌| 779596/818627 [00:12<00:00, 65259.90 examples/s]
+Generating train split: 95%|█████████▌| 779596/818627 [00:11<00:00, 65268.26 examples/s]
+Generating train split: 98%|█████████▊| 800695/818627 [00:12<00:00, 71435.03 examples/s]
+Generating train split: 93%|█████████▎| 758497/818627 [00:11<00:00, 61901.09 examples/s]
+Generating train split: 98%|█████████▊| 800695/818627 [00:12<00:00, 71701.72 examples/s]
+Generating train split: 100%|██████████| 818627/818627 [00:12<00:00, 65796.35 examples/s]
+
+Generating train split: 100%|██████████| 818627/818627 [00:12<00:00, 67048.19 examples/s]
+
+Generating train split: 90%|█████████ | 737398/818627 [00:11<00:01, 59130.90 examples/s]
+Generating train split: 90%|█████████ | 737398/818627 [00:11<00:01, 58481.10 examples/s]
+Generating train split: 95%|█████████▌| 779596/818627 [00:11<00:00, 65481.24 examples/s]
+Generating train split: 93%|█████████▎| 758497/818627 [00:11<00:00, 62579.81 examples/s]
+Generating train split: 98%|█████████▊| 800695/818627 [00:12<00:00, 71556.83 examples/s]
+Generating train split: 100%|██████████| 818627/818627 [00:12<00:00, 67102.86 examples/s]
+
+Generating train split: 93%|█████████▎| 758497/818627 [00:11<00:01, 59661.08 examples/s]dataset is cached at /workspace/hanrui/syxin_old/Specforge/cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkl
+
+Generating train split: 95%|█████████▌| 779596/818627 [00:11<00:00, 65078.42 examples/s]
+Map (num_proc=16): 0%| | 0/818627 [00:00, ? examples/s]
+Generating train split: 95%|█████████▌| 779596/818627 [00:12<00:00, 63238.77 examples/s]
+Generating train split: 98%|█████████▊| 800695/818627 [00:12<00:00, 71441.42 examples/s]
+Generating train split: 100%|██████████| 818627/818627 [00:12<00:00, 67136.47 examples/s]
+
+Generating train split: 98%|█████████▊| 800695/818627 [00:12<00:00, 70302.75 examples/s]
+Generating train split: 100%|██████████| 818627/818627 [00:12<00:00, 66337.81 examples/s]
+/workspace/hanrui/syxin_old/Specforge/specforge/data/parse.py:84: UserWarning: The first message is from system, we will use the system prompt from the data and ignore the system prompt from the template
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/data/parse.py:84: UserWarning: The first message is from system, we will use the system prompt from the data and ignore the system prompt from the template
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/data/parse.py:84: UserWarning: The first message is from system, we will use the system prompt from the data and ignore the system prompt from the template
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/data/parse.py:84: UserWarning: The first message is from system, we will use the system prompt from the data and ignore the system prompt from the template
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/data/parse.py:84: UserWarning: The first message is from system, we will use the system prompt from the data and ignore the system prompt from the template
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/data/parse.py:84: UserWarning: The first message is from system, we will use the system prompt from the data and ignore the system prompt from the template
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/data/parse.py:84: UserWarning: The first message is from system, we will use the system prompt from the data and ignore the system prompt from the template
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/data/parse.py:84: UserWarning: The first message is from system, we will use the system prompt from the data and ignore the system prompt from the template
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/data/parse.py:84: UserWarning: The first message is from system, we will use the system prompt from the data and ignore the system prompt from the template
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/data/parse.py:84: UserWarning: The first message is from system, we will use the system prompt from the data and ignore the system prompt from the template
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/data/parse.py:84: UserWarning: The first message is from system, we will use the system prompt from the data and ignore the system prompt from the template
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/data/parse.py:84: UserWarning: The first message is from system, we will use the system prompt from the data and ignore the system prompt from the template
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/data/parse.py:84: UserWarning: The first message is from system, we will use the system prompt from the data and ignore the system prompt from the template
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/data/parse.py:84: UserWarning: The first message is from system, we will use the system prompt from the data and ignore the system prompt from the template
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/data/parse.py:84: UserWarning: The first message is from system, we will use the system prompt from the data and ignore the system prompt from the template
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/data/parse.py:84: UserWarning: The first message is from system, we will use the system prompt from the data and ignore the system prompt from the template
+ warnings.warn(
+
+Map (num_proc=16): 0%| | 1000/818627 [00:17<4:02:41, 56.15 examples/s]
+Map (num_proc=16): 0%| | 2000/818627 [00:18<1:41:43, 133.80 examples/s]
+Map (num_proc=16): 0%| | 3000/818627 [00:18<58:40, 231.69 examples/s]
+Map (num_proc=16): 0%| | 4000/818627 [00:18<36:10, 375.29 examples/s]
+Map (num_proc=16): 1%| | 5000/818627 [00:18<23:40, 572.86 examples/s]
+Map (num_proc=16): 1%| | 7000/818627 [00:19<12:32, 1077.90 examples/s]
+Map (num_proc=16): 1%| | 8000/818627 [00:19<10:12, 1322.78 examples/s]
+Map (num_proc=16): 1%| | 9000/818627 [00:19<07:53, 1708.97 examples/s]
+Map (num_proc=16): 1%|▏ | 12000/818627 [00:19<04:35, 2928.13 examples/s]
+Map (num_proc=16): 2%|▏ | 13000/818627 [00:20<03:55, 3416.73 examples/s]
+Map (num_proc=16): 2%|▏ | 14000/818627 [00:20<04:51, 2757.71 examples/s]
+Map (num_proc=16): 2%|▏ | 16000/818627 [00:21<04:27, 3005.49 examples/s]
+Map (num_proc=16): 2%|▏ | 17000/818627 [00:31<34:34, 386.42 examples/s]
+Map (num_proc=16): 2%|▏ | 18000/818627 [00:32<27:46, 480.32 examples/s]
+Map (num_proc=16): 2%|▏ | 19000/818627 [00:32<22:26, 593.88 examples/s]
+Map (num_proc=16): 2%|▏ | 20000/818627 [00:33<18:12, 731.00 examples/s]
+Map (num_proc=16): 3%|▎ | 21000/818627 [00:33<14:21, 925.68 examples/s]
+Map (num_proc=16): 3%|▎ | 23000/818627 [00:34<09:42, 1367.06 examples/s]
+Map (num_proc=16): 3%|▎ | 24000/818627 [00:34<07:46, 1704.61 examples/s]
+Map (num_proc=16): 3%|▎ | 25000/818627 [00:34<06:58, 1894.60 examples/s]
+Map (num_proc=16): 3%|▎ | 27000/818627 [00:35<04:55, 2682.49 examples/s]
+Map (num_proc=16): 4%|▎ | 29000/818627 [00:35<03:35, 3667.08 examples/s]
+Map (num_proc=16): 4%|▍ | 31000/818627 [00:35<02:44, 4796.72 examples/s]
+Map (num_proc=16): 4%|▍ | 32000/818627 [00:36<03:47, 3458.55 examples/s]
+Map (num_proc=16): 4%|▍ | 33000/818627 [00:46<32:39, 401.02 examples/s]
+Map (num_proc=16): 4%|▍ | 34000/818627 [00:46<25:33, 511.72 examples/s]
+Map (num_proc=16): 4%|▍ | 35000/818627 [00:47<23:21, 558.95 examples/s]
+Map (num_proc=16): 4%|▍ | 36000/818627 [00:48<18:57, 687.88 examples/s]
+Map (num_proc=16): 5%|▍ | 38000/818627 [00:48<11:33, 1124.84 examples/s]
+Map (num_proc=16): 5%|▍ | 39000/818627 [00:49<12:05, 1074.23 examples/s]
+Map (num_proc=16): 5%|▍ | 40000/818627 [00:49<09:27, 1372.76 examples/s]
+Map (num_proc=16): 5%|▌ | 42000/818627 [00:50<06:11, 2091.59 examples/s]
+Map (num_proc=16): 5%|▌ | 43000/818627 [00:50<05:11, 2487.70 examples/s]
+Map (num_proc=16): 5%|▌ | 45000/818627 [00:50<03:31, 3654.71 examples/s]
+Map (num_proc=16): 6%|▌ | 47000/818627 [00:50<03:29, 3691.29 examples/s]
+Map (num_proc=16): 6%|▌ | 48000/818627 [00:51<05:22, 2392.45 examples/s]
+Map (num_proc=16): 6%|▌ | 49000/818627 [01:00<29:29, 434.85 examples/s]
+Map (num_proc=16): 6%|▌ | 51000/818627 [01:02<21:37, 591.64 examples/s]
+Map (num_proc=16): 6%|▋ | 52000/818627 [01:03<19:20, 660.69 examples/s]
+Map (num_proc=16): 7%|▋ | 54000/818627 [01:03<12:07, 1051.60 examples/s]
+Map (num_proc=16): 7%|▋ | 55000/818627 [01:03<10:35, 1202.38 examples/s]
+Map (num_proc=16): 7%|▋ | 56000/818627 [01:04<11:08, 1140.34 examples/s]
+Map (num_proc=16): 7%|▋ | 57000/818627 [01:05<10:12, 1243.62 examples/s]
+Map (num_proc=16): 7%|▋ | 58000/818627 [01:05<08:10, 1550.11 examples/s]
+Map (num_proc=16): 7%|▋ | 60000/818627 [01:05<05:04, 2492.21 examples/s]
+Map (num_proc=16): 8%|▊ | 62000/818627 [01:05<03:56, 3204.50 examples/s]
+Map (num_proc=16): 8%|▊ | 63000/818627 [01:06<04:54, 2561.87 examples/s]
+Map (num_proc=16): 8%|▊ | 64000/818627 [01:07<06:28, 1944.15 examples/s]
+Map (num_proc=16): 8%|▊ | 65000/818627 [01:14<27:49, 451.48 examples/s]
+Map (num_proc=16): 8%|▊ | 66000/818627 [01:15<21:51, 574.03 examples/s]
+Map (num_proc=16): 8%|▊ | 67000/818627 [01:16<21:35, 580.33 examples/s]
+Map (num_proc=16): 8%|▊ | 68000/818627 [01:18<19:36, 637.88 examples/s]
+Map (num_proc=16): 9%|▊ | 70000/818627 [01:18<12:03, 1035.35 examples/s]
+Map (num_proc=16): 9%|▊ | 71000/818627 [01:18<10:18, 1208.95 examples/s]
+Map (num_proc=16): 9%|▉ | 72000/818627 [01:19<10:54, 1141.58 examples/s]
+Map (num_proc=16): 9%|▉ | 73000/818627 [01:20<09:29, 1309.57 examples/s]
+Map (num_proc=16): 9%|▉ | 74000/818627 [01:20<08:06, 1531.70 examples/s]
+Map (num_proc=16): 9%|▉ | 75000/818627 [01:21<08:27, 1464.27 examples/s]
+Map (num_proc=16): 9%|▉ | 77000/818627 [01:21<05:59, 2065.67 examples/s]
+Map (num_proc=16): 10%|▉ | 78000/818627 [01:22<04:50, 2551.98 examples/s]
+Map (num_proc=16): 10%|▉ | 79000/818627 [01:22<05:16, 2339.06 examples/s]
+Map (num_proc=16): 10%|▉ | 80000/818627 [01:23<07:43, 1595.27 examples/s]
+Map (num_proc=16): 10%|▉ | 81000/818627 [01:29<24:18, 505.67 examples/s]
+Map (num_proc=16): 10%|█ | 83000/818627 [01:30<17:59, 681.30 examples/s]
+Map (num_proc=16): 10%|█ | 84000/818627 [01:32<19:06, 640.96 examples/s]
+Map (num_proc=16): 10%|█ | 85000/818627 [01:32<14:39, 834.18 examples/s]
+Map (num_proc=16): 11%|█ | 86000/818627 [01:33<12:39, 965.22 examples/s]
+Map (num_proc=16): 11%|█ | 87000/818627 [01:34<11:33, 1054.80 examples/s]
+Map (num_proc=16): 11%|█ | 88000/818627 [01:34<09:07, 1333.65 examples/s]
+Map (num_proc=16): 11%|█ | 89000/818627 [01:35<08:39, 1403.66 examples/s]
+Map (num_proc=16): 11%|█ | 90000/818627 [01:35<08:35, 1412.32 examples/s]
+Map (num_proc=16): 11%|█ | 91000/818627 [01:37<10:43, 1130.37 examples/s]
+Map (num_proc=16): 11%|█ | 92000/818627 [01:37<09:02, 1338.53 examples/s]
+Map (num_proc=16): 11%|█▏ | 93000/818627 [01:37<07:05, 1705.25 examples/s]
+Map (num_proc=16): 11%|█▏ | 94000/818627 [01:38<06:34, 1835.89 examples/s]
+Map (num_proc=16): 12%|█▏ | 95000/818627 [01:39<09:01, 1336.71 examples/s]
+Map (num_proc=16): 12%|█▏ | 97000/818627 [01:43<17:14, 697.42 examples/s]
+Map (num_proc=16): 12%|█▏ | 98000/818627 [01:45<18:00, 667.07 examples/s]
+Map (num_proc=16): 12%|█▏ | 99000/818627 [01:46<15:53, 754.52 examples/s]
+Map (num_proc=16): 12%|█▏ | 100000/818627 [01:47<15:02, 796.42 examples/s]
+Map (num_proc=16): 12%|█▏ | 101000/818627 [01:48<14:37, 818.09 examples/s]
+Map (num_proc=16): 12%|█▏ | 102000/818627 [01:48<11:10, 1068.13 examples/s]
+Map (num_proc=16): 13%|█▎ | 103000/818627 [01:49<08:52, 1344.58 examples/s]
+Map (num_proc=16): 13%|█▎ | 104000/818627 [01:49<06:37, 1795.74 examples/s]
+Map (num_proc=16): 13%|█▎ | 105000/818627 [01:50<09:52, 1204.92 examples/s]
+Map (num_proc=16): 13%|█▎ | 106000/818627 [01:51<09:45, 1216.31 examples/s]
+Map (num_proc=16): 13%|█▎ | 107000/818627 [01:52<10:47, 1098.43 examples/s]
+Map (num_proc=16): 13%|█▎ | 108000/818627 [01:52<08:37, 1373.45 examples/s]
+Map (num_proc=16): 13%|█▎ | 109000/818627 [01:53<09:31, 1242.12 examples/s]
+Map (num_proc=16): 14%|█▎ | 111000/818627 [01:54<06:14, 1890.36 examples/s]
+Map (num_proc=16): 14%|█▎ | 112000/818627 [01:54<06:28, 1818.01 examples/s]
+Map (num_proc=16): 14%|█▍ | 113000/818627 [01:58<16:40, 705.60 examples/s]
+Map (num_proc=16): 14%|█▍ | 114000/818627 [02:00<16:21, 717.69 examples/s]
+Map (num_proc=16): 14%|█▍ | 115000/818627 [02:00<13:54, 843.29 examples/s]
+Map (num_proc=16): 14%|█▍ | 116000/818627 [02:01<13:02, 898.01 examples/s]
+Map (num_proc=16): 14%|█▍ | 117000/818627 [02:03<15:21, 761.56 examples/s]
+Map (num_proc=16): 14%|█▍ | 118000/818627 [02:04<13:07, 890.22 examples/s]
+Map (num_proc=16): 15%|█▍ | 120000/818627 [02:04<08:45, 1329.62 examples/s]
+Map (num_proc=16): 15%|█▍ | 121000/818627 [02:05<09:31, 1221.13 examples/s]
+Map (num_proc=16): 15%|█▍ | 122000/818627 [02:06<09:21, 1240.36 examples/s]
+Map (num_proc=16): 15%|█▌ | 123000/818627 [02:07<10:01, 1155.92 examples/s]
+Map (num_proc=16): 15%|█▌ | 124000/818627 [02:07<08:04, 1433.71 examples/s]
+Map (num_proc=16): 15%|█▌ | 125000/818627 [02:08<09:13, 1253.77 examples/s]
+Map (num_proc=16): 15%|█▌ | 126000/818627 [02:09<08:23, 1375.67 examples/s]
+Map (num_proc=16): 16%|█▌ | 127000/818627 [02:10<08:23, 1372.40 examples/s]
+Map (num_proc=16): 16%|█▌ | 128000/818627 [02:12<12:21, 931.06 examples/s]
+Map (num_proc=16): 16%|█▌ | 129000/818627 [02:13<14:44, 779.90 examples/s]
+Map (num_proc=16): 16%|█▌ | 130000/818627 [02:15<14:52, 771.59 examples/s]
+Map (num_proc=16): 16%|█▌ | 131000/818627 [02:15<13:08, 871.90 examples/s]
+Map (num_proc=16): 16%|█▌ | 133000/818627 [02:17<12:00, 951.83 examples/s]
+Map (num_proc=16): 16%|█▋ | 134000/818627 [02:18<11:38, 979.50 examples/s]
+Map (num_proc=16): 16%|█▋ | 135000/818627 [02:19<10:22, 1097.92 examples/s]
+Map (num_proc=16): 17%|█▋ | 136000/818627 [02:20<10:38, 1069.59 examples/s]
+Map (num_proc=16): 17%|█▋ | 137000/818627 [02:21<11:07, 1021.50 examples/s]
+Map (num_proc=16): 17%|█▋ | 138000/818627 [02:22<10:46, 1053.40 examples/s]
+Map (num_proc=16): 17%|█▋ | 139000/818627 [02:22<08:36, 1316.92 examples/s]
+Map (num_proc=16): 17%|█▋ | 140000/818627 [02:23<07:45, 1458.39 examples/s]
+Map (num_proc=16): 17%|█▋ | 141000/818627 [02:24<09:50, 1147.45 examples/s]
+Map (num_proc=16): 17%|█▋ | 142000/818627 [02:25<10:38, 1060.30 examples/s]
+Map (num_proc=16): 17%|█▋ | 143000/818627 [02:27<12:46, 881.48 examples/s]
+Map (num_proc=16): 18%|█▊ | 144000/818627 [02:27<09:20, 1202.89 examples/s]
+Map (num_proc=16): 18%|█▊ | 145000/818627 [02:29<15:08, 741.84 examples/s]
+Map (num_proc=16): 18%|█▊ | 146000/818627 [02:30<13:59, 801.57 examples/s]
+Map (num_proc=16): 18%|█▊ | 147000/818627 [02:31<11:45, 952.56 examples/s]
+Map (num_proc=16): 18%|█▊ | 148000/818627 [02:31<08:33, 1306.67 examples/s]
+Map (num_proc=16): 18%|█▊ | 149000/818627 [02:33<11:06, 1004.34 examples/s]
+Map (num_proc=16): 18%|█▊ | 150000/818627 [02:33<09:46, 1140.55 examples/s]
+Map (num_proc=16): 18%|█▊ | 151000/818627 [02:35<12:23, 898.17 examples/s]
+Map (num_proc=16): 19%|█▊ | 152000/818627 [02:35<10:39, 1042.77 examples/s]
+Map (num_proc=16): 19%|█▊ | 153000/818627 [02:36<09:53, 1121.10 examples/s]
+Map (num_proc=16): 19%|█▉ | 154000/818627 [02:37<11:12, 988.32 examples/s]
+Map (num_proc=16): 19%|█▉ | 155000/818627 [02:38<08:31, 1298.64 examples/s]
+Map (num_proc=16): 19%|█▉ | 156000/818627 [02:38<08:32, 1292.50 examples/s]
+Map (num_proc=16): 19%|█▉ | 157000/818627 [02:39<07:20, 1501.38 examples/s]
+Map (num_proc=16): 19%|█▉ | 158000/818627 [02:41<11:58, 919.69 examples/s]
+Map (num_proc=16): 19%|█▉ | 159000/818627 [02:42<12:46, 860.61 examples/s]
+Map (num_proc=16): 20%|█▉ | 160000/818627 [02:43<09:52, 1111.51 examples/s]
+Map (num_proc=16): 20%|█▉ | 161000/818627 [02:43<08:55, 1227.92 examples/s]
+Map (num_proc=16): 20%|█▉ | 162000/818627 [02:45<13:24, 816.64 examples/s]
+Map (num_proc=16): 20%|█▉ | 163000/818627 [02:46<11:22, 960.57 examples/s]
+Map (num_proc=16): 20%|██ | 165000/818627 [02:48<11:25, 953.59 examples/s]
+Map (num_proc=16): 20%|██ | 166000/818627 [02:48<09:01, 1205.07 examples/s]
+Map (num_proc=16): 20%|██ | 167000/818627 [02:50<10:52, 998.33 examples/s]
+Map (num_proc=16): 21%|██ | 168000/818627 [02:51<12:23, 874.57 examples/s]
+Map (num_proc=16): 21%|██ | 169000/818627 [02:52<11:15, 961.09 examples/s]
+Map (num_proc=16): 21%|██ | 170000/818627 [02:52<09:19, 1159.85 examples/s]
+Map (num_proc=16): 21%|██ | 171000/818627 [02:53<08:07, 1328.12 examples/s]
+Map (num_proc=16): 21%|██ | 172000/818627 [02:54<08:17, 1298.79 examples/s]
+Map (num_proc=16): 21%|██ | 173000/818627 [02:54<06:26, 1671.03 examples/s]
+Map (num_proc=16): 21%|██▏ | 174000/818627 [02:57<13:25, 799.84 examples/s]
+Map (num_proc=16): 21%|██▏ | 176000/818627 [02:57<07:44, 1382.00 examples/s]
+Map (num_proc=16): 22%|██▏ | 177000/818627 [02:58<07:56, 1346.98 examples/s]
+Map (num_proc=16): 22%|██▏ | 178000/818627 [03:00<13:31, 789.75 examples/s]
+Map (num_proc=16): 22%|██▏ | 180000/818627 [03:01<08:48, 1208.45 examples/s]
+Map (num_proc=16): 22%|██▏ | 181000/818627 [03:03<11:27, 927.72 examples/s]
+Map (num_proc=16): 22%|██▏ | 182000/818627 [03:03<09:21, 1133.62 examples/s]
+Map (num_proc=16): 22%|██▏ | 183000/818627 [03:04<09:42, 1091.88 examples/s]
+Map (num_proc=16): 22%|██▏ | 184000/818627 [03:07<14:20, 737.59 examples/s]
+Map (num_proc=16): 23%|██▎ | 185000/818627 [03:07<11:02, 956.08 examples/s]
+Map (num_proc=16): 23%|██▎ | 186000/818627 [03:07<09:24, 1120.67 examples/s]
+Map (num_proc=16): 23%|██▎ | 187000/818627 [03:09<09:57, 1056.83 examples/s]
+Map (num_proc=16): 23%|██▎ | 188000/818627 [03:09<08:04, 1301.18 examples/s]
+Map (num_proc=16): 23%|██▎ | 189000/818627 [03:09<06:16, 1670.81 examples/s]
+Map (num_proc=16): 23%|██▎ | 190000/818627 [03:11<10:53, 961.46 examples/s]
+Map (num_proc=16): 23%|██▎ | 192000/818627 [03:12<07:50, 1333.24 examples/s]
+Map (num_proc=16): 24%|██▎ | 193000/818627 [03:13<08:56, 1165.72 examples/s]
+Map (num_proc=16): 24%|██▎ | 194000/818627 [03:15<11:09, 933.23 examples/s]
+Map (num_proc=16): 24%|██▍ | 195000/818627 [03:16<11:04, 937.89 examples/s]
+Map (num_proc=16): 24%|██▍ | 197000/818627 [03:18<11:47, 878.37 examples/s]
+Map (num_proc=16): 24%|██▍ | 198000/818627 [03:19<10:31, 983.42 examples/s]
+Map (num_proc=16): 24%|██▍ | 199000/818627 [03:19<08:35, 1202.24 examples/s]
+Map (num_proc=16): 24%|██▍ | 200000/818627 [03:22<13:44, 750.74 examples/s]
+Map (num_proc=16): 25%|██▍ | 201000/818627 [03:22<10:32, 976.42 examples/s]
+Map (num_proc=16): 25%|██▍ | 202000/818627 [03:23<10:34, 971.40 examples/s]
+Map (num_proc=16): 25%|██▍ | 203000/818627 [03:23<08:14, 1245.54 examples/s]
+Map (num_proc=16): 25%|██▍ | 204000/818627 [03:24<06:53, 1484.84 examples/s]
+Map (num_proc=16): 25%|██▌ | 205000/818627 [03:24<05:19, 1918.84 examples/s]
+Map (num_proc=16): 25%|██▌ | 206000/818627 [03:26<08:53, 1148.47 examples/s]
+Map (num_proc=16): 25%|██▌ | 207000/818627 [03:26<07:22, 1381.00 examples/s]
+Map (num_proc=16): 25%|██▌ | 208000/818627 [03:27<07:52, 1291.99 examples/s]
+Map (num_proc=16): 26%|██▌ | 209000/818627 [03:28<09:40, 1049.39 examples/s]
+Map (num_proc=16): 26%|██▌ | 210000/818627 [03:29<10:06, 1003.60 examples/s]
+Map (num_proc=16): 26%|██▌ | 211000/818627 [03:30<09:19, 1086.67 examples/s]
+Map (num_proc=16): 26%|██▌ | 212000/818627 [03:32<10:59, 919.70 examples/s]
+Map (num_proc=16): 26%|██▌ | 213000/818627 [03:33<11:52, 850.54 examples/s]
+Map (num_proc=16): 26%|██▌ | 214000/818627 [03:34<11:06, 906.65 examples/s]
+Map (num_proc=16): 26%|██▋ | 215000/818627 [03:35<10:34, 951.36 examples/s]
+Map (num_proc=16): 26%|██▋ | 216000/818627 [03:37<13:13, 759.45 examples/s]
+Map (num_proc=16): 27%|██▋ | 217000/818627 [03:38<11:46, 851.49 examples/s]
+Map (num_proc=16): 27%|██▋ | 218000/818627 [03:38<10:20, 968.40 examples/s]
+Map (num_proc=16): 27%|██▋ | 219000/818627 [03:39<07:59, 1250.78 examples/s]
+Map (num_proc=16): 27%|██▋ | 220000/818627 [03:39<07:08, 1396.76 examples/s]
+Map (num_proc=16): 27%|██▋ | 221000/818627 [03:39<05:51, 1700.25 examples/s]
+Map (num_proc=16): 27%|██▋ | 222000/818627 [03:40<04:44, 2099.79 examples/s]
+Map (num_proc=16): 27%|██▋ | 223000/818627 [03:42<08:57, 1107.74 examples/s]
+Map (num_proc=16): 27%|██▋ | 224000/818627 [03:42<07:58, 1243.09 examples/s]
+Map (num_proc=16): 27%|██▋ | 225000/818627 [03:43<08:01, 1233.16 examples/s]
+Map (num_proc=16): 28%|██▊ | 226000/818627 [03:44<08:00, 1234.23 examples/s]
+Map (num_proc=16): 28%|██▊ | 227000/818627 [03:45<08:15, 1192.99 examples/s]
+Map (num_proc=16): 28%|██▊ | 228000/818627 [03:48<15:49, 621.99 examples/s]
+Map (num_proc=16): 28%|██▊ | 229000/818627 [03:49<12:46, 769.07 examples/s]
+Map (num_proc=16): 28%|██▊ | 230000/818627 [03:50<13:07, 747.62 examples/s]
+Map (num_proc=16): 28%|██▊ | 231000/818627 [03:50<09:56, 984.53 examples/s]
+Map (num_proc=16): 28%|██▊ | 232000/818627 [03:52<12:51, 760.58 examples/s]
+Map (num_proc=16): 28%|██▊ | 233000/818627 [03:53<11:06, 879.29 examples/s]
+Map (num_proc=16): 29%|██▊ | 234000/818627 [03:53<08:30, 1144.23 examples/s]
+Map (num_proc=16): 29%|██▊ | 235000/818627 [03:54<07:05, 1370.84 examples/s]
+Map (num_proc=16): 29%|██▉ | 236000/818627 [03:54<06:07, 1585.49 examples/s]
+Map (num_proc=16): 29%|██▉ | 237000/818627 [03:54<05:09, 1877.49 examples/s]
+Map (num_proc=16): 29%|██▉ | 238000/818627 [03:55<04:17, 2253.75 examples/s]
+Map (num_proc=16): 29%|██▉ | 239000/818627 [03:56<06:44, 1432.53 examples/s]
+Map (num_proc=16): 29%|██▉ | 240000/818627 [03:58<09:38, 999.64 examples/s]
+Map (num_proc=16): 29%|██▉ | 241000/818627 [03:58<07:36, 1264.69 examples/s]
+Map (num_proc=16): 30%|██▉ | 242000/818627 [04:00<12:10, 789.11 examples/s]
+Map (num_proc=16): 30%|██▉ | 243000/818627 [04:01<11:37, 825.25 examples/s]
+Map (num_proc=16): 30%|██▉ | 244000/818627 [04:03<12:29, 766.83 examples/s]
+Map (num_proc=16): 30%|██▉ | 245000/818627 [04:04<11:36, 824.03 examples/s]
+Map (num_proc=16): 30%|███ | 246000/818627 [04:06<13:46, 693.24 examples/s]
+Map (num_proc=16): 30%|███ | 247000/818627 [04:07<11:58, 795.85 examples/s]
+Map (num_proc=16): 30%|███ | 248000/818627 [04:07<08:57, 1061.89 examples/s]
+Map (num_proc=16): 30%|███ | 249000/818627 [04:08<08:49, 1074.97 examples/s]
+Map (num_proc=16): 31%|███ | 251000/818627 [04:08<06:04, 1557.39 examples/s]
+Map (num_proc=16): 31%|███ | 252000/818627 [04:09<05:24, 1746.30 examples/s]
+Map (num_proc=16): 31%|███ | 253000/818627 [04:09<04:58, 1894.25 examples/s]
+Map (num_proc=16): 31%|███ | 254000/818627 [04:10<05:55, 1590.48 examples/s]
+Map (num_proc=16): 31%|███ | 255000/818627 [04:10<04:52, 1924.70 examples/s]
+Map (num_proc=16): 31%|███▏ | 256000/818627 [04:13<09:21, 1002.66 examples/s]
+Map (num_proc=16): 31%|███▏ | 257000/818627 [04:13<07:57, 1176.34 examples/s]
+Map (num_proc=16): 32%|███▏ | 258000/818627 [04:15<11:33, 808.04 examples/s]
+Map (num_proc=16): 32%|███▏ | 259000/818627 [04:16<10:43, 869.86 examples/s]
+Map (num_proc=16): 32%|███▏ | 260000/818627 [04:17<09:06, 1021.50 examples/s]
+Map (num_proc=16): 32%|███▏ | 261000/818627 [04:19<12:29, 744.19 examples/s]
+Map (num_proc=16): 32%|███▏ | 262000/818627 [04:21<13:46, 673.33 examples/s]
+Map (num_proc=16): 32%|███▏ | 263000/818627 [04:22<13:58, 662.87 examples/s]
+Map (num_proc=16): 32%|███▏ | 264000/818627 [04:22<10:08, 912.03 examples/s]
+Map (num_proc=16): 32%|███▏ | 266000/818627 [04:24<07:42, 1193.88 examples/s]
+Map (num_proc=16): 33%|███▎ | 268000/818627 [04:24<04:51, 1892.08 examples/s]
+Map (num_proc=16): 33%|███▎ | 269000/818627 [04:24<05:01, 1824.22 examples/s]
+Map (num_proc=16): 33%|███▎ | 270000/818627 [04:26<06:50, 1337.69 examples/s]
+Map (num_proc=16): 33%|███▎ | 271000/818627 [04:26<05:19, 1711.73 examples/s]
+Map (num_proc=16): 33%|███▎ | 272000/818627 [04:27<07:37, 1195.83 examples/s]
+Map (num_proc=16): 33%|███▎ | 273000/818627 [04:29<08:55, 1019.53 examples/s]
+Map (num_proc=16): 33%|███▎ | 274000/818627 [04:30<09:45, 930.19 examples/s]
+Map (num_proc=16): 34%|███▎ | 275000/818627 [04:32<11:25, 792.84 examples/s]
+Map (num_proc=16): 34%|███▎ | 276000/818627 [04:32<08:32, 1059.07 examples/s]
+Map (num_proc=16): 34%|███▍ | 277000/818627 [04:34<12:24, 727.54 examples/s]
+Map (num_proc=16): 34%|███▍ | 278000/818627 [04:36<14:05, 639.61 examples/s]
+Map (num_proc=16): 34%|███▍ | 279000/818627 [04:37<12:33, 716.49 examples/s]
+Map (num_proc=16): 34%|███▍ | 280000/818627 [04:37<09:17, 966.94 examples/s]
+Map (num_proc=16): 34%|███▍ | 281000/818627 [04:38<08:21, 1071.26 examples/s]
+Map (num_proc=16): 34%|███▍ | 282000/818627 [04:38<06:27, 1384.03 examples/s]
+Map (num_proc=16): 35%|███▍ | 283000/818627 [04:39<06:18, 1415.54 examples/s]
+Map (num_proc=16): 35%|███▍ | 284000/818627 [04:39<05:00, 1779.66 examples/s]
+Map (num_proc=16): 35%|███▍ | 285000/818627 [04:40<04:43, 1880.00 examples/s]
+Map (num_proc=16): 35%|███▍ | 286000/818627 [04:40<04:22, 2032.23 examples/s]
+Map (num_proc=16): 35%|███▌ | 287000/818627 [04:41<04:12, 2102.95 examples/s]
+Map (num_proc=16): 35%|███▌ | 288000/818627 [04:43<08:43, 1013.96 examples/s]
+Map (num_proc=16): 35%|███▌ | 289000/818627 [04:44<09:18, 948.24 examples/s]
+Map (num_proc=16): 35%|███▌ | 290000/818627 [04:45<08:04, 1090.11 examples/s]
+Map (num_proc=16): 36%|███▌ | 291000/818627 [04:47<11:42, 751.40 examples/s]
+Map (num_proc=16): 36%|███▌ | 292000/818627 [04:47<09:13, 950.89 examples/s]
+Map (num_proc=16): 36%|███▌ | 293000/818627 [04:49<11:48, 741.96 examples/s]
+Map (num_proc=16): 36%|███▌ | 294000/818627 [04:51<12:52, 678.99 examples/s]
+Map (num_proc=16): 36%|███▌ | 295000/818627 [04:52<11:52, 735.38 examples/s]
+Map (num_proc=16): 36%|███▌ | 296000/818627 [04:52<08:54, 977.73 examples/s]
+Map (num_proc=16): 36%|███▋ | 297000/818627 [04:54<10:17, 845.36 examples/s]
+Map (num_proc=16): 36%|███▋ | 298000/818627 [04:54<07:29, 1158.58 examples/s]
+Map (num_proc=16): 37%|███▋ | 299000/818627 [04:54<05:32, 1564.05 examples/s]
+Map (num_proc=16): 37%|███▋ | 300000/818627 [04:54<04:25, 1954.98 examples/s]
+Map (num_proc=16): 37%|███▋ | 301000/818627 [04:55<04:50, 1780.34 examples/s]
+Map (num_proc=16): 37%|███▋ | 302000/818627 [04:55<04:24, 1953.87 examples/s]
+Map (num_proc=16): 37%|███▋ | 304000/818627 [04:57<05:32, 1545.56 examples/s]
+Map (num_proc=16): 37%|███▋ | 305000/818627 [04:58<07:02, 1215.94 examples/s]
+Map (num_proc=16): 37%|███▋ | 306000/818627 [04:59<05:58, 1431.13 examples/s]
+Map (num_proc=16): 38%|███▊ | 307000/818627 [05:02<10:48, 789.32 examples/s]
+Map (num_proc=16): 38%|███▊ | 308000/818627 [05:02<09:09, 929.98 examples/s]
+Map (num_proc=16): 38%|███▊ | 309000/818627 [05:04<10:09, 836.10 examples/s]
+Map (num_proc=16): 38%|███▊ | 310000/818627 [05:06<13:32, 626.04 examples/s]
+Map (num_proc=16): 38%|███▊ | 311000/818627 [05:07<10:39, 793.63 examples/s]
+Map (num_proc=16): 38%|███▊ | 312000/818627 [05:07<08:53, 950.17 examples/s]
+Map (num_proc=16): 38%|███▊ | 313000/818627 [05:09<09:50, 856.32 examples/s]
+Map (num_proc=16): 38%|███▊ | 314000/818627 [05:09<08:47, 956.11 examples/s]
+Map (num_proc=16): 38%|███▊ | 315000/818627 [05:10<07:57, 1054.15 examples/s]
+Map (num_proc=16): 39%|███▉ | 318000/818627 [05:10<03:58, 2095.74 examples/s]
+Map (num_proc=16): 39%|███▉ | 319000/818627 [05:11<04:00, 2077.23 examples/s]
+Map (num_proc=16): 39%|███▉ | 320000/818627 [05:12<04:34, 1819.39 examples/s]
+Map (num_proc=16): 39%|███▉ | 321000/818627 [05:13<06:44, 1231.69 examples/s]
+Map (num_proc=16): 39%|███▉ | 322000/818627 [05:14<05:28, 1513.03 examples/s]
+Map (num_proc=16): 39%|███▉ | 323000/818627 [05:16<08:33, 964.51 examples/s]
+Map (num_proc=16): 40%|███▉ | 324000/818627 [05:18<10:36, 777.26 examples/s]
+Map (num_proc=16): 40%|███▉ | 325000/818627 [05:18<09:38, 853.65 examples/s]
+Map (num_proc=16): 40%|███▉ | 326000/818627 [05:20<10:58, 748.64 examples/s]
+Map (num_proc=16): 40%|███▉ | 327000/818627 [05:21<09:34, 855.76 examples/s]
+Map (num_proc=16): 40%|████ | 328000/818627 [05:23<10:33, 774.31 examples/s]
+Map (num_proc=16): 40%|████ | 329000/818627 [05:23<09:35, 851.04 examples/s]
+Map (num_proc=16): 40%|████ | 331000/818627 [05:25<08:34, 947.44 examples/s]
+Map (num_proc=16): 41%|████ | 332000/818627 [05:26<07:39, 1058.06 examples/s]
+Map (num_proc=16): 41%|████ | 334000/818627 [05:26<04:50, 1665.71 examples/s]
+Map (num_proc=16): 41%|████ | 335000/818627 [05:26<04:06, 1961.53 examples/s]
+Map (num_proc=16): 41%|████ | 336000/818627 [05:27<04:11, 1918.54 examples/s]
+Map (num_proc=16): 41%|████ | 337000/818627 [05:28<04:32, 1765.83 examples/s]
+Map (num_proc=16): 41%|████▏ | 338000/818627 [05:28<05:20, 1501.74 examples/s]
+Map (num_proc=16): 41%|████▏ | 339000/818627 [05:30<08:02, 993.30 examples/s]
+Map (num_proc=16): 42%|████▏ | 340000/818627 [05:33<10:43, 743.49 examples/s]
+Map (num_proc=16): 42%|████▏ | 341000/818627 [05:33<09:23, 848.03 examples/s]
+Map (num_proc=16): 42%|████▏ | 342000/818627 [05:35<10:08, 783.78 examples/s]
+Map (num_proc=16): 42%|████▏ | 343000/818627 [05:36<10:53, 727.51 examples/s]
+Map (num_proc=16): 42%|████▏ | 344000/818627 [05:38<10:17, 769.25 examples/s]
+Map (num_proc=16): 42%|████▏ | 345000/818627 [05:38<08:50, 893.19 examples/s]
+Map (num_proc=16): 42%|████▏ | 347000/818627 [05:40<08:34, 916.99 examples/s]
+Map (num_proc=16): 43%|████▎ | 349000/818627 [05:41<05:55, 1320.61 examples/s]
+Map (num_proc=16): 43%|████▎ | 350000/818627 [05:41<04:55, 1585.02 examples/s]
+Map (num_proc=16): 43%|████▎ | 351000/818627 [05:41<03:56, 1978.79 examples/s]
+Map (num_proc=16): 43%|████▎ | 352000/818627 [05:42<04:18, 1807.17 examples/s]
+Map (num_proc=16): 43%|████▎ | 353000/818627 [05:42<03:58, 1950.66 examples/s]
+Map (num_proc=16): 43%|████▎ | 354000/818627 [05:44<05:41, 1360.36 examples/s]
+Map (num_proc=16): 43%|████▎ | 355000/818627 [05:44<05:32, 1393.47 examples/s]
+Map (num_proc=16): 43%|████▎ | 356000/818627 [05:48<12:40, 608.50 examples/s]
+Map (num_proc=16): 44%|████▎ | 357000/818627 [05:49<10:23, 739.92 examples/s]
+Map (num_proc=16): 44%|████▎ | 358000/818627 [05:49<07:34, 1012.82 examples/s]
+Map (num_proc=16): 44%|████▍ | 359000/818627 [05:51<09:37, 795.36 examples/s]
+Map (num_proc=16): 44%|████▍ | 360000/818627 [05:52<10:11, 749.48 examples/s]
+Map (num_proc=16): 44%|████▍ | 361000/818627 [05:53<08:17, 918.93 examples/s]
+Map (num_proc=16): 44%|████▍ | 362000/818627 [05:54<07:37, 998.64 examples/s]
+Map (num_proc=16): 44%|████▍ | 363000/818627 [05:56<10:06, 751.63 examples/s]
+Map (num_proc=16): 44%|████▍ | 364000/818627 [05:56<07:31, 1006.19 examples/s]
+Map (num_proc=16): 45%|████▍ | 366000/818627 [05:56<04:39, 1619.03 examples/s]
+Map (num_proc=16): 45%|████▍ | 367000/818627 [05:57<03:55, 1918.29 examples/s]
+Map (num_proc=16): 45%|████▍ | 368000/818627 [05:57<03:17, 2281.85 examples/s]
+Map (num_proc=16): 45%|████▌ | 369000/818627 [05:57<03:44, 1998.47 examples/s]
+Map (num_proc=16): 45%|████▌ | 370000/818627 [05:59<06:18, 1186.48 examples/s]
+Map (num_proc=16): 45%|████▌ | 371000/818627 [05:59<05:05, 1467.50 examples/s]
+Map (num_proc=16): 45%|████▌ | 372000/818627 [06:03<11:25, 651.30 examples/s]
+Map (num_proc=16): 46%|████▌ | 373000/818627 [06:04<09:46, 760.14 examples/s]
+Map (num_proc=16): 46%|████▌ | 374000/818627 [06:04<07:34, 977.88 examples/s]
+Map (num_proc=16): 46%|████▌ | 375000/818627 [06:06<08:21, 884.62 examples/s]
+Map (num_proc=16): 46%|████▌ | 376000/818627 [06:07<09:48, 752.56 examples/s]
+Map (num_proc=16): 46%|████▌ | 377000/818627 [06:08<07:43, 951.79 examples/s]
+Map (num_proc=16): 46%|████▌ | 378000/818627 [06:09<08:26, 869.59 examples/s]
+Map (num_proc=16): 46%|████▋ | 379000/818627 [06:11<09:40, 757.15 examples/s]
+Map (num_proc=16): 47%|████▋ | 381000/818627 [06:11<05:33, 1314.01 examples/s]
+Map (num_proc=16): 47%|████▋ | 382000/818627 [06:11<04:30, 1613.64 examples/s]
+Map (num_proc=16): 47%|████▋ | 383000/818627 [06:11<03:43, 1950.40 examples/s]
+Map (num_proc=16): 47%|████▋ | 385000/818627 [06:12<03:39, 1973.96 examples/s]
+Map (num_proc=16): 47%|████▋ | 386000/818627 [06:15<06:17, 1146.56 examples/s]
+Map (num_proc=16): 47%|████▋ | 388000/818627 [06:17<06:37, 1082.41 examples/s]
+Map (num_proc=16): 48%|████▊ | 389000/818627 [06:19<08:32, 838.30 examples/s]
+Map (num_proc=16): 48%|████▊ | 390000/818627 [06:19<07:29, 952.89 examples/s]
+Map (num_proc=16): 48%|████▊ | 391000/818627 [06:20<07:43, 922.72 examples/s]
+Map (num_proc=16): 48%|████▊ | 392000/818627 [06:22<08:39, 821.04 examples/s]
+Map (num_proc=16): 48%|████▊ | 393000/818627 [06:23<08:26, 840.29 examples/s]
+Map (num_proc=16): 48%|████▊ | 394000/818627 [06:25<09:36, 736.55 examples/s]
+Map (num_proc=16): 48%|████▊ | 395000/818627 [06:25<07:26, 949.77 examples/s]
+Map (num_proc=16): 48%|████▊ | 397000/818627 [06:26<05:30, 1275.58 examples/s]
+Map (num_proc=16): 49%|████▊ | 398000/818627 [06:26<04:33, 1539.19 examples/s]
+Map (num_proc=16): 49%|████▉ | 400000/818627 [06:28<05:22, 1298.84 examples/s]
+Map (num_proc=16): 49%|████▉ | 401000/818627 [06:29<04:54, 1418.24 examples/s]
+Map (num_proc=16): 49%|████▉ | 402000/818627 [06:29<04:41, 1480.88 examples/s]
+Map (num_proc=16): 49%|████▉ | 403000/818627 [06:30<04:46, 1451.77 examples/s]
+Map (num_proc=16): 49%|████▉ | 404000/818627 [06:31<05:45, 1201.38 examples/s]
+Map (num_proc=16): 49%|████▉ | 405000/818627 [06:34<09:48, 702.72 examples/s]
+Map (num_proc=16): 50%|████▉ | 406000/818627 [06:34<07:23, 930.67 examples/s]
+Map (num_proc=16): 50%|████▉ | 407000/818627 [06:35<07:01, 976.01 examples/s]
+Map (num_proc=16): 50%|████▉ | 408000/818627 [06:37<08:23, 815.27 examples/s]
+Map (num_proc=16): 50%|████▉ | 409000/818627 [06:38<07:04, 963.94 examples/s]
+Map (num_proc=16): 50%|█████ | 410000/818627 [06:40<09:24, 723.90 examples/s]
+Map (num_proc=16): 50%|█████ | 411000/818627 [06:40<07:29, 907.48 examples/s]
+Map (num_proc=16): 50%|█████ | 412000/818627 [06:41<06:26, 1052.26 examples/s]
+Map (num_proc=16): 50%|█████ | 413000/818627 [06:41<04:55, 1374.82 examples/s]
+Map (num_proc=16): 51%|█████ | 414000/818627 [06:41<03:45, 1793.25 examples/s]
+Map (num_proc=16): 51%|█████ | 416000/818627 [06:44<05:53, 1140.28 examples/s]
+Map (num_proc=16): 51%|█████ | 417000/818627 [06:44<04:48, 1394.10 examples/s]
+Map (num_proc=16): 51%|█████ | 418000/818627 [06:45<05:59, 1115.86 examples/s]
+Map (num_proc=16): 51%|█████ | 419000/818627 [06:46<05:36, 1187.32 examples/s]
+Map (num_proc=16): 51%|█████▏ | 420000/818627 [06:46<04:24, 1506.54 examples/s]
+Map (num_proc=16): 51%|█████▏ | 421000/818627 [06:49<08:24, 787.71 examples/s]
+Map (num_proc=16): 52%|█████▏ | 422000/818627 [06:50<07:20, 899.95 examples/s]
+Map (num_proc=16): 52%|█████▏ | 423000/818627 [06:51<08:03, 818.26 examples/s]
+Map (num_proc=16): 52%|█████▏ | 425000/818627 [06:52<05:42, 1149.36 examples/s]
+Map (num_proc=16): 52%|█████▏ | 426000/818627 [06:55<08:18, 786.99 examples/s]
+Map (num_proc=16): 52%|█████▏ | 428000/818627 [06:56<06:01, 1081.36 examples/s]
+Map (num_proc=16): 52%|█████▏ | 429000/818627 [06:56<05:59, 1082.95 examples/s]
+Map (num_proc=16): 53%|█████▎ | 431000/818627 [06:57<04:00, 1612.31 examples/s]
+Map (num_proc=16): 53%|█████▎ | 432000/818627 [06:58<05:24, 1193.00 examples/s]
+Map (num_proc=16): 53%|█████▎ | 433000/818627 [07:00<05:55, 1083.81 examples/s]
+Map (num_proc=16): 53%|█████▎ | 434000/818627 [07:00<04:41, 1367.79 examples/s]
+Map (num_proc=16): 53%|█████▎ | 435000/818627 [07:01<05:50, 1094.32 examples/s]
+Map (num_proc=16): 53%|█████▎ | 436000/818627 [07:03<06:42, 950.58 examples/s]
+Map (num_proc=16): 53%|█████▎ | 437000/818627 [07:04<06:47, 936.66 examples/s]
+Map (num_proc=16): 54%|█████▎ | 438000/818627 [07:05<06:48, 932.88 examples/s]
+Map (num_proc=16): 54%|█████▎ | 439000/818627 [07:06<06:38, 951.86 examples/s]
+Map (num_proc=16): 54%|█████▎ | 440000/818627 [07:06<05:12, 1213.14 examples/s]
+Map (num_proc=16): 54%|█████▍ | 441000/818627 [07:07<06:06, 1030.54 examples/s]
+Map (num_proc=16): 54%|█████▍ | 442000/818627 [07:09<06:56, 904.58 examples/s]
+Map (num_proc=16): 54%|█████▍ | 443000/818627 [07:10<06:21, 985.80 examples/s]
+Map (num_proc=16): 54%|█████▍ | 444000/818627 [07:11<06:58, 895.75 examples/s]
+Map (num_proc=16): 54%|█████▍ | 445000/818627 [07:12<06:03, 1029.23 examples/s]
+Map (num_proc=16): 54%|█████▍ | 446000/818627 [07:12<04:47, 1298.23 examples/s]
+Map (num_proc=16): 55%|█████▍ | 447000/818627 [07:13<04:50, 1277.62 examples/s]
+Map (num_proc=16): 55%|█████▍ | 448000/818627 [07:13<04:18, 1431.38 examples/s]
+Map (num_proc=16): 55%|█████▍ | 449000/818627 [07:14<05:11, 1184.72 examples/s]
+Map (num_proc=16): 55%|█████▍ | 450000/818627 [07:15<05:29, 1117.63 examples/s]
+Map (num_proc=16): 55%|█████▌ | 451000/818627 [07:16<05:07, 1195.68 examples/s]
+Map (num_proc=16): 55%|█████▌ | 452000/818627 [07:18<06:43, 907.74 examples/s]
+Map (num_proc=16): 55%|█████▌ | 453000/818627 [07:19<06:39, 914.07 examples/s]
+Map (num_proc=16): 55%|█████▌ | 454000/818627 [07:20<06:04, 999.62 examples/s]
+Map (num_proc=16): 56%|█████▌ | 455000/818627 [07:20<04:26, 1364.59 examples/s]
+Map (num_proc=16): 56%|█████▌ | 456000/818627 [07:21<05:05, 1185.42 examples/s]
+Map (num_proc=16): 56%|█████▌ | 457000/818627 [07:22<06:02, 996.61 examples/s]
+Map (num_proc=16): 56%|█████▌ | 458000/818627 [07:23<06:11, 970.23 examples/s]
+Map (num_proc=16): 56%|█████▌ | 459000/818627 [07:25<07:58, 752.20 examples/s]
+Map (num_proc=16): 56%|█████▌ | 460000/818627 [07:26<06:36, 904.14 examples/s]
+Map (num_proc=16): 56%|█████▋ | 461000/818627 [07:27<05:55, 1005.05 examples/s]
+Map (num_proc=16): 56%|█████▋ | 462000/818627 [07:27<04:39, 1278.04 examples/s]
+Map (num_proc=16): 57%|█████▋ | 463000/818627 [07:28<05:33, 1067.08 examples/s]
+Map (num_proc=16): 57%|█████▋ | 464000/818627 [07:29<04:24, 1341.11 examples/s]
+Map (num_proc=16): 57%|█████▋ | 466000/818627 [07:30<04:40, 1255.31 examples/s]
+Map (num_proc=16): 57%|█████▋ | 467000/818627 [07:31<04:03, 1444.64 examples/s]
+Map (num_proc=16): 57%|█████▋ | 468000/818627 [07:33<06:49, 855.25 examples/s]
+Map (num_proc=16): 57%|█████▋ | 469000/818627 [07:34<06:00, 968.63 examples/s]
+Map (num_proc=16): 57%|█████▋ | 470000/818627 [07:35<05:29, 1058.00 examples/s]
+Map (num_proc=16): 58%|█████▊ | 471000/818627 [07:35<04:33, 1269.67 examples/s]
+Map (num_proc=16): 58%|█████▊ | 472000/818627 [07:35<03:45, 1540.24 examples/s]
+Map (num_proc=16): 58%|█████▊ | 473000/818627 [07:37<04:57, 1160.93 examples/s]
+Map (num_proc=16): 58%|█████▊ | 474000/818627 [07:38<05:33, 1033.51 examples/s]
+Map (num_proc=16): 58%|█████▊ | 475000/818627 [07:40<07:56, 721.26 examples/s]
+Map (num_proc=16): 58%|█████▊ | 476000/818627 [07:41<06:18, 905.34 examples/s]
+Map (num_proc=16): 58%|█████▊ | 477000/818627 [07:42<06:15, 909.00 examples/s]
+Map (num_proc=16): 59%|█████▊ | 479000/818627 [07:43<04:23, 1290.66 examples/s]
+Map (num_proc=16): 59%|█████▊ | 480000/818627 [07:43<04:34, 1232.59 examples/s]
+Map (num_proc=16): 59%|█████▉ | 481000/818627 [07:44<04:04, 1382.80 examples/s]
+Map (num_proc=16): 59%|█████▉ | 482000/818627 [07:45<04:47, 1172.05 examples/s]
+Map (num_proc=16): 59%|█████▉ | 483000/818627 [07:45<03:53, 1439.95 examples/s]
+Map (num_proc=16): 59%|█████▉ | 484000/818627 [07:48<07:15, 769.22 examples/s]
+Map (num_proc=16): 59%|█████▉ | 485000/818627 [07:49<07:05, 784.58 examples/s]
+Map (num_proc=16): 59%|█████▉ | 486000/818627 [07:50<05:16, 1050.92 examples/s]
+Map (num_proc=16): 59%|█████▉ | 487000/818627 [07:50<04:23, 1256.36 examples/s]
+Map (num_proc=16): 60%|█████▉ | 488000/818627 [07:51<03:55, 1402.62 examples/s]
+Map (num_proc=16): 60%|█████▉ | 489000/818627 [07:51<04:01, 1366.81 examples/s]
+Map (num_proc=16): 60%|█████▉ | 490000/818627 [07:52<04:05, 1338.27 examples/s]
+Map (num_proc=16): 60%|█████▉ | 491000/818627 [07:56<08:44, 624.80 examples/s]
+Map (num_proc=16): 60%|██████ | 492000/818627 [07:56<06:17, 864.14 examples/s]
+Map (num_proc=16): 60%|██████ | 494000/818627 [07:57<04:45, 1135.83 examples/s]
+Map (num_proc=16): 60%|██████ | 495000/818627 [07:58<04:45, 1132.72 examples/s]
+Map (num_proc=16): 61%|██████ | 496000/818627 [07:59<05:04, 1060.03 examples/s]
+Map (num_proc=16): 61%|██████ | 497000/818627 [08:00<04:40, 1144.91 examples/s]
+Map (num_proc=16): 61%|██████ | 498000/818627 [08:00<04:13, 1265.54 examples/s]
+Map (num_proc=16): 61%|██████ | 500000/818627 [08:04<06:43, 789.55 examples/s]
+Map (num_proc=16): 61%|██████ | 501000/818627 [08:04<05:21, 986.98 examples/s]
+Map (num_proc=16): 61%|██████▏ | 502000/818627 [08:04<04:21, 1208.78 examples/s]
+Map (num_proc=16): 61%|██████▏ | 503000/818627 [08:05<03:52, 1358.89 examples/s]
+Map (num_proc=16): 62%|██████▏ | 504000/818627 [08:05<03:32, 1478.08 examples/s]
+Map (num_proc=16): 62%|██████▏ | 505000/818627 [08:07<04:26, 1178.36 examples/s]
+Map (num_proc=16): 62%|██████▏ | 506000/818627 [08:07<03:54, 1332.76 examples/s]
+Map (num_proc=16): 62%|██████▏ | 507000/818627 [08:10<06:40, 777.36 examples/s]
+Map (num_proc=16): 62%|██████▏ | 508000/818627 [08:11<06:06, 847.28 examples/s]
+Map (num_proc=16): 62%|██████▏ | 509000/818627 [08:11<04:44, 1089.14 examples/s]
+Map (num_proc=16): 62%|██████▏ | 510000/818627 [08:12<04:50, 1061.91 examples/s]
+Map (num_proc=16): 62%|██████▏ | 511000/818627 [08:12<03:52, 1324.58 examples/s]
+Map (num_proc=16): 63%|██████▎ | 512000/818627 [08:14<05:08, 994.68 examples/s]
+Map (num_proc=16): 63%|██████▎ | 513000/818627 [08:14<04:01, 1266.45 examples/s]
+Map (num_proc=16): 63%|██████▎ | 514000/818627 [08:15<04:02, 1255.04 examples/s]
+Map (num_proc=16): 63%|██████▎ | 515000/818627 [08:16<04:19, 1172.00 examples/s]
+Map (num_proc=16): 63%|██████▎ | 516000/818627 [08:19<07:53, 639.07 examples/s]
+Map (num_proc=16): 63%|██████▎ | 517000/818627 [08:19<05:44, 876.79 examples/s]
+Map (num_proc=16): 63%|██████▎ | 518000/818627 [08:20<04:28, 1118.78 examples/s]
+Map (num_proc=16): 63%|██████▎ | 519000/818627 [08:20<04:08, 1204.01 examples/s]
+Map (num_proc=16): 64%|██████▎ | 520000/818627 [08:21<03:38, 1368.22 examples/s]
+Map (num_proc=16): 64%|██████▎ | 521000/818627 [08:22<03:37, 1369.40 examples/s]
+Map (num_proc=16): 64%|██████▍ | 522000/818627 [08:22<03:33, 1388.72 examples/s]
+Map (num_proc=16): 64%|██████▍ | 523000/818627 [08:25<06:29, 758.14 examples/s]
+Map (num_proc=16): 64%|██████▍ | 524000/818627 [08:25<04:51, 1010.26 examples/s]
+Map (num_proc=16): 64%|██████▍ | 525000/818627 [08:27<06:14, 784.43 examples/s]
+Map (num_proc=16): 64%|██████▍ | 526000/818627 [08:27<04:43, 1032.20 examples/s]
+Map (num_proc=16): 64%|██████▍ | 528000/818627 [08:28<03:36, 1342.33 examples/s]
+Map (num_proc=16): 65%|██████▍ | 529000/818627 [08:30<04:09, 1160.98 examples/s]
+Map (num_proc=16): 65%|██████▍ | 530000/818627 [08:30<03:18, 1454.35 examples/s]
+Map (num_proc=16): 65%|██████▍ | 531000/818627 [08:31<03:50, 1247.84 examples/s]
+Map (num_proc=16): 65%|██████▍ | 532000/818627 [08:34<07:00, 681.52 examples/s]
+Map (num_proc=16): 65%|██████▌ | 533000/818627 [08:34<05:16, 902.76 examples/s]
+Map (num_proc=16): 65%|██████▌ | 534000/818627 [08:35<05:17, 897.33 examples/s]
+Map (num_proc=16): 65%|██████▌ | 536000/818627 [08:36<03:07, 1507.67 examples/s]
+Map (num_proc=16): 66%|██████▌ | 537000/818627 [08:37<04:04, 1151.65 examples/s]
+Map (num_proc=16): 66%|██████▌ | 538000/818627 [08:38<03:51, 1213.28 examples/s]
+Map (num_proc=16): 66%|██████▌ | 539000/818627 [08:39<04:20, 1074.07 examples/s]
+Map (num_proc=16): 66%|██████▌ | 540000/818627 [08:40<04:49, 963.14 examples/s]
+Map (num_proc=16): 66%|██████▌ | 541000/818627 [08:43<06:09, 751.93 examples/s]
+Map (num_proc=16): 66%|██████▋ | 543000/818627 [08:43<03:46, 1214.38 examples/s]
+Map (num_proc=16): 66%|██████▋ | 544000/818627 [08:44<03:54, 1172.15 examples/s]
+Map (num_proc=16): 67%|██████▋ | 545000/818627 [08:44<03:34, 1274.33 examples/s]
+Map (num_proc=16): 67%|██████▋ | 546000/818627 [08:45<03:10, 1429.02 examples/s]
+Map (num_proc=16): 67%|██████▋ | 547000/818627 [08:46<03:05, 1465.21 examples/s]
+Map (num_proc=16): 67%|██████▋ | 548000/818627 [08:49<06:15, 721.60 examples/s]
+Map (num_proc=16): 67%|██████▋ | 549000/818627 [08:49<05:20, 841.51 examples/s]
+Map (num_proc=16): 67%|██████▋ | 550000/818627 [08:51<05:15, 850.31 examples/s]
+Map (num_proc=16): 67%|██████▋ | 551000/818627 [08:51<03:57, 1125.70 examples/s]
+Map (num_proc=16): 67%|██████▋ | 552000/818627 [08:51<03:24, 1305.82 examples/s]
+Map (num_proc=16): 68%|██████▊ | 553000/818627 [08:52<02:46, 1598.26 examples/s]
+Map (num_proc=16): 68%|██████▊ | 554000/818627 [08:54<04:48, 916.16 examples/s]
+Map (num_proc=16): 68%|██████▊ | 556000/818627 [08:54<03:04, 1420.70 examples/s]
+Map (num_proc=16): 68%|██████▊ | 557000/818627 [08:58<06:33, 665.27 examples/s]
+Map (num_proc=16): 68%|██████▊ | 558000/818627 [08:58<04:56, 877.63 examples/s]
+Map (num_proc=16): 68%|██████▊ | 560000/818627 [09:00<04:14, 1015.15 examples/s]
+Map (num_proc=16): 69%|██████▊ | 561000/818627 [09:00<03:33, 1206.29 examples/s]
+Map (num_proc=16): 69%|██████▊ | 562000/818627 [09:00<02:48, 1523.92 examples/s]
+Map (num_proc=16): 69%|██████▉ | 563000/818627 [09:01<02:56, 1450.34 examples/s]
+Map (num_proc=16): 69%|██████▉ | 564000/818627 [09:03<03:59, 1064.13 examples/s]
+Map (num_proc=16): 69%|██████▉ | 565000/818627 [09:05<06:07, 689.94 examples/s]
+Map (num_proc=16): 69%|██████▉ | 567000/818627 [09:06<03:34, 1174.09 examples/s]
+Map (num_proc=16): 69%|██████▉ | 568000/818627 [09:06<03:02, 1374.46 examples/s]
+Map (num_proc=16): 70%|██████▉ | 569000/818627 [09:07<03:29, 1190.69 examples/s]
+Map (num_proc=16): 70%|██████▉ | 570000/818627 [09:08<03:58, 1042.35 examples/s]
+Map (num_proc=16): 70%|██████▉ | 571000/818627 [09:09<03:06, 1327.10 examples/s]
+Map (num_proc=16): 70%|██████▉ | 572000/818627 [09:09<02:35, 1588.55 examples/s]
+Map (num_proc=16): 70%|██████▉ | 573000/818627 [09:13<06:19, 647.92 examples/s]
+Map (num_proc=16): 70%|███████ | 574000/818627 [09:13<05:01, 811.36 examples/s]
+Map (num_proc=16): 70%|███████ | 575000/818627 [09:14<04:09, 978.30 examples/s]
+Map (num_proc=16): 70%|███████ | 576000/818627 [09:15<04:06, 984.79 examples/s]
+Map (num_proc=16): 70%|███████ | 577000/818627 [09:16<03:47, 1060.26 examples/s]
+Map (num_proc=16): 71%|███████ | 578000/818627 [09:16<02:46, 1443.56 examples/s]
+Map (num_proc=16): 71%|███████ | 579000/818627 [09:16<02:41, 1487.57 examples/s]
+Map (num_proc=16): 71%|███████ | 580000/818627 [09:18<03:30, 1132.50 examples/s]
+Map (num_proc=16): 71%|███████ | 581000/818627 [09:20<05:24, 732.44 examples/s]
+Map (num_proc=16): 71%|███████ | 582000/818627 [09:20<04:08, 953.24 examples/s]
+Map (num_proc=16): 71%|███████▏ | 584000/818627 [09:21<02:18, 1695.48 examples/s]
+Map (num_proc=16): 71%|███████▏ | 585000/818627 [09:23<03:44, 1041.06 examples/s]
+Map (num_proc=16): 72%|███████▏ | 586000/818627 [09:23<02:53, 1340.68 examples/s]
+Map (num_proc=16): 72%|███████▏ | 587000/818627 [09:23<02:36, 1479.79 examples/s]
+Map (num_proc=16): 72%|███████▏ | 588000/818627 [09:24<02:56, 1310.19 examples/s]
+Map (num_proc=16): 72%|███████▏ | 589000/818627 [09:27<05:23, 710.79 examples/s]
+Map (num_proc=16): 72%|███████▏ | 590000/818627 [09:28<04:07, 922.61 examples/s]
+Map (num_proc=16): 72%|███████▏ | 591000/818627 [09:28<03:52, 978.35 examples/s]
+Map (num_proc=16): 72%|███████▏ | 592000/818627 [09:30<04:24, 857.17 examples/s]
+Map (num_proc=16): 72%|███████▏ | 593000/818627 [09:31<04:11, 897.86 examples/s]
+Map (num_proc=16): 73%|███████▎ | 594000/818627 [09:31<03:18, 1131.97 examples/s]
+Map (num_proc=16): 73%|███████▎ | 596000/818627 [09:32<02:25, 1527.24 examples/s]
+Map (num_proc=16): 73%|███████▎ | 597000/818627 [09:35<04:45, 777.14 examples/s]
+Map (num_proc=16): 73%|███████▎ | 598000/818627 [09:36<03:52, 947.53 examples/s]
+Map (num_proc=16): 73%|███████▎ | 600000/818627 [09:36<02:45, 1318.00 examples/s]
+Map (num_proc=16): 73%|███████▎ | 601000/818627 [09:37<02:22, 1525.15 examples/s]
+Map (num_proc=16): 74%|███████▎ | 602000/818627 [09:37<02:28, 1460.93 examples/s]
+Map (num_proc=16): 74%|███████▎ | 603000/818627 [09:39<03:19, 1083.34 examples/s]
+Map (num_proc=16): 74%|███████▍ | 604000/818627 [09:40<03:34, 999.22 examples/s]
+Map (num_proc=16): 74%|███████▍ | 605000/818627 [09:42<04:19, 822.10 examples/s]
+Map (num_proc=16): 74%|███████▍ | 606000/818627 [09:42<03:31, 1004.52 examples/s]
+Map (num_proc=16): 74%|███████▍ | 607000/818627 [09:43<02:42, 1306.16 examples/s]
+Map (num_proc=16): 74%|███████▍ | 608000/818627 [09:45<04:20, 809.79 examples/s]
+Map (num_proc=16): 74%|███████▍ | 609000/818627 [09:46<04:05, 855.53 examples/s]
+Map (num_proc=16): 75%|███████▍ | 611000/818627 [09:47<02:50, 1215.19 examples/s]
+Map (num_proc=16): 75%|███████▍ | 612000/818627 [09:47<02:17, 1503.95 examples/s]
+Map (num_proc=16): 75%|███████▍ | 613000/818627 [09:50<03:59, 857.22 examples/s]
+Map (num_proc=16): 75%|███████▌ | 615000/818627 [09:51<02:54, 1163.60 examples/s]
+Map (num_proc=16): 75%|███████▌ | 616000/818627 [09:52<03:05, 1089.79 examples/s]
+Map (num_proc=16): 75%|███████▌ | 617000/818627 [09:52<02:27, 1366.01 examples/s]
+Map (num_proc=16): 76%|███████▌ | 619000/818627 [09:54<02:56, 1129.69 examples/s]
+Map (num_proc=16): 76%|███████▌ | 620000/818627 [09:56<03:23, 974.26 examples/s]
+Map (num_proc=16): 76%|███████▌ | 621000/818627 [09:56<02:58, 1107.57 examples/s]
+Map (num_proc=16): 76%|███████▌ | 622000/818627 [09:58<03:26, 951.24 examples/s]
+Map (num_proc=16): 76%|███████▌ | 623000/818627 [09:58<02:58, 1093.99 examples/s]
+Map (num_proc=16): 76%|███████▌ | 624000/818627 [10:00<03:28, 933.67 examples/s]
+Map (num_proc=16): 76%|███████▋ | 625000/818627 [10:01<03:35, 900.32 examples/s]
+Map (num_proc=16): 76%|███████▋ | 626000/818627 [10:01<02:59, 1075.55 examples/s]
+Map (num_proc=16): 77%|███████▋ | 627000/818627 [10:02<03:14, 987.66 examples/s]
+Map (num_proc=16): 77%|███████▋ | 629000/818627 [10:04<03:01, 1047.64 examples/s]
+Map (num_proc=16): 77%|███████▋ | 630000/818627 [10:06<03:16, 962.21 examples/s]
+Map (num_proc=16): 77%|███████▋ | 631000/818627 [10:06<02:51, 1094.06 examples/s]
+Map (num_proc=16): 77%|███████▋ | 632000/818627 [10:07<03:03, 1015.91 examples/s]
+Map (num_proc=16): 77%|███████▋ | 633000/818627 [10:08<02:42, 1145.68 examples/s]
+Map (num_proc=16): 77%|███████▋ | 634000/818627 [10:10<03:57, 776.76 examples/s]
+Map (num_proc=16): 78%|███████▊ | 635000/818627 [10:10<03:03, 1002.36 examples/s]
+Map (num_proc=16): 78%|███████▊ | 636000/818627 [10:11<02:50, 1068.15 examples/s]
+Map (num_proc=16): 78%|███████▊ | 638000/818627 [10:12<02:10, 1384.00 examples/s]
+Map (num_proc=16): 78%|███████▊ | 639000/818627 [10:13<02:29, 1199.16 examples/s]
+Map (num_proc=16): 78%|███████▊ | 640000/818627 [10:14<02:24, 1237.07 examples/s]
+Map (num_proc=16): 78%|███████▊ | 641000/818627 [10:15<02:36, 1137.29 examples/s]
+Map (num_proc=16): 78%|███████▊ | 642000/818627 [10:16<02:30, 1170.63 examples/s]
+Map (num_proc=16): 79%|███████▊ | 643000/818627 [10:17<02:57, 987.92 examples/s]
+Map (num_proc=16): 79%|███████▊ | 644000/818627 [10:18<02:15, 1290.40 examples/s]
+Map (num_proc=16): 79%|███████▉ | 645000/818627 [10:19<02:24, 1197.91 examples/s]
+Map (num_proc=16): 79%|███████▉ | 646000/818627 [10:20<02:49, 1021.34 examples/s]
+Map (num_proc=16): 79%|███████▉ | 647000/818627 [10:20<02:29, 1144.31 examples/s]
+Map (num_proc=16): 79%|███████▉ | 648000/818627 [10:23<03:33, 798.21 examples/s]
+Map (num_proc=16): 79%|███████▉ | 649000/818627 [10:24<03:31, 802.34 examples/s]
+Map (num_proc=16): 79%|███████▉ | 650000/818627 [10:25<03:46, 744.75 examples/s]
+Map (num_proc=16): 80%|███████▉ | 651000/818627 [10:26<02:50, 982.75 examples/s]
+Map (num_proc=16): 80%|███████▉ | 653000/818627 [10:26<01:37, 1705.66 examples/s]
+Map (num_proc=16): 80%|███████▉ | 654000/818627 [10:27<02:01, 1353.55 examples/s]
+Map (num_proc=16): 80%|████████ | 655000/818627 [10:29<02:42, 1009.32 examples/s]
+Map (num_proc=16): 80%|████████ | 656000/818627 [10:29<02:11, 1237.63 examples/s]
+Map (num_proc=16): 80%|████████ | 657000/818627 [10:30<02:11, 1231.91 examples/s]
+Map (num_proc=16): 80%|████████ | 658000/818627 [10:31<02:02, 1312.61 examples/s]
+Map (num_proc=16): 81%|████████ | 659000/818627 [10:33<03:04, 862.94 examples/s]
+Map (num_proc=16): 81%|████████ | 660000/818627 [10:33<02:14, 1176.46 examples/s]
+Map (num_proc=16): 81%|████████ | 661000/818627 [10:34<02:25, 1084.98 examples/s]
+Map (num_proc=16): 81%|████████ | 662000/818627 [10:35<02:14, 1164.74 examples/s]
+Map (num_proc=16): 81%|████████ | 664000/818627 [10:38<03:12, 802.45 examples/s]
+Map (num_proc=16): 81%|████████ | 665000/818627 [10:38<02:30, 1019.35 examples/s]
+Map (num_proc=16): 81%|████████▏ | 666000/818627 [10:40<03:23, 750.02 examples/s]
+Map (num_proc=16): 81%|████████▏ | 667000/818627 [10:41<02:35, 978.04 examples/s]
+Map (num_proc=16): 82%|████████▏ | 668000/818627 [10:41<02:14, 1118.60 examples/s]
+Map (num_proc=16): 82%|████████▏ | 670000/818627 [10:41<01:21, 1830.20 examples/s]
+Map (num_proc=16): 82%|████████▏ | 671000/818627 [10:43<01:55, 1276.04 examples/s]
+Map (num_proc=16): 82%|████████▏ | 672000/818627 [10:44<02:02, 1200.04 examples/s]
+Map (num_proc=16): 82%|████████▏ | 673000/818627 [10:45<01:51, 1302.63 examples/s]
+Map (num_proc=16): 82%|████████▏ | 674000/818627 [10:46<01:59, 1206.96 examples/s]
+Map (num_proc=16): 82%|████████▏ | 675000/818627 [10:48<02:48, 853.75 examples/s]
+Map (num_proc=16): 83%|████████▎ | 676000/818627 [10:49<02:43, 871.13 examples/s]
+Map (num_proc=16): 83%|████████▎ | 677000/818627 [10:49<02:14, 1049.10 examples/s]
+Map (num_proc=16): 83%|████████▎ | 678000/818627 [10:49<01:42, 1374.10 examples/s]
+Map (num_proc=16): 83%|████████▎ | 679000/818627 [10:50<01:29, 1564.67 examples/s]
+Map (num_proc=16): 83%|████████▎ | 680000/818627 [10:53<03:14, 714.47 examples/s]
+Map (num_proc=16): 83%|████████▎ | 681000/818627 [10:53<02:36, 880.82 examples/s]
+Map (num_proc=16): 83%|████████▎ | 682000/818627 [10:56<03:13, 705.30 examples/s]
+Map (num_proc=16): 84%|████████▎ | 684000/818627 [10:56<01:50, 1221.99 examples/s]
+Map (num_proc=16): 84%|████████▎ | 685000/818627 [10:56<01:40, 1331.78 examples/s]
+Map (num_proc=16): 84%|████████▍ | 686000/818627 [10:59<02:41, 822.53 examples/s]
+Map (num_proc=16): 84%|████████▍ | 687000/818627 [10:59<02:04, 1059.49 examples/s]
+Map (num_proc=16): 84%|████████▍ | 688000/818627 [11:00<01:45, 1234.30 examples/s]
+Map (num_proc=16): 84%|████████▍ | 689000/818627 [11:01<01:59, 1083.03 examples/s]
+Map (num_proc=16): 84%|████████▍ | 690000/818627 [11:03<02:35, 827.52 examples/s]
+Map (num_proc=16): 84%|████████▍ | 691000/818627 [11:04<02:21, 900.34 examples/s]
+Map (num_proc=16): 85%|████████▍ | 692000/818627 [11:04<01:47, 1172.82 examples/s]
+Map (num_proc=16): 85%|████████▍ | 693000/818627 [11:04<01:37, 1292.30 examples/s]
+Map (num_proc=16): 85%|████████▍ | 694000/818627 [11:06<01:59, 1040.82 examples/s]
+Map (num_proc=16): 85%|████████▍ | 695000/818627 [11:09<03:09, 651.03 examples/s]
+Map (num_proc=16): 85%|████████▌ | 696000/818627 [11:10<02:49, 725.18 examples/s]
+Map (num_proc=16): 85%|████████▌ | 697000/818627 [11:11<02:41, 755.03 examples/s]
+Map (num_proc=16): 85%|████████▌ | 699000/818627 [11:11<01:30, 1323.87 examples/s]
+Map (num_proc=16): 86%|████████▌ | 700000/818627 [11:11<01:19, 1494.38 examples/s]
+Map (num_proc=16): 86%|████████▌ | 702000/818627 [11:14<01:41, 1146.58 examples/s]
+Map (num_proc=16): 86%|████████▌ | 703000/818627 [11:14<01:25, 1354.24 examples/s]
+Map (num_proc=16): 86%|████████▌ | 704000/818627 [11:14<01:15, 1522.03 examples/s]
+Map (num_proc=16): 86%|████████▌ | 705000/818627 [11:16<01:33, 1220.24 examples/s]
+Map (num_proc=16): 86%|████████▌ | 706000/818627 [11:18<02:15, 830.63 examples/s]
+Map (num_proc=16): 86%|████████▋ | 707000/818627 [11:18<01:41, 1096.19 examples/s]
+Map (num_proc=16): 86%|████████▋ | 708000/818627 [11:21<02:34, 714.80 examples/s]
+Map (num_proc=16): 87%|████████▋ | 709000/818627 [11:21<02:07, 857.47 examples/s]
+Map (num_proc=16): 87%|████████▋ | 710000/818627 [11:24<02:40, 676.64 examples/s]
+Map (num_proc=16): 87%|████████▋ | 711000/818627 [11:24<02:14, 801.78 examples/s]
+Map (num_proc=16): 87%|████████▋ | 712000/818627 [11:24<01:40, 1065.44 examples/s]
+Map (num_proc=16): 87%|████████▋ | 713000/818627 [11:25<01:31, 1149.31 examples/s]
+Map (num_proc=16): 87%|████████▋ | 714000/818627 [11:26<01:15, 1379.03 examples/s]
+Map (num_proc=16): 87%|████████▋ | 715000/818627 [11:26<01:04, 1603.47 examples/s]
+Map (num_proc=16): 87%|████████▋ | 716000/818627 [11:27<01:06, 1552.88 examples/s]
+Map (num_proc=16): 88%|████████▊ | 718000/818627 [11:29<01:23, 1208.86 examples/s]
+Map (num_proc=16): 88%|████████▊ | 719000/818627 [11:29<01:10, 1419.17 examples/s]
+Map (num_proc=16): 88%|████████▊ | 721000/818627 [11:30<01:08, 1425.51 examples/s]
+Map (num_proc=16): 88%|████████▊ | 722000/818627 [11:32<01:37, 995.46 examples/s]
+Map (num_proc=16): 88%|████████▊ | 723000/818627 [11:33<01:28, 1081.08 examples/s]
+Map (num_proc=16): 88%|████████▊ | 724000/818627 [11:36<02:13, 708.14 examples/s]
+Map (num_proc=16): 89%|████████▊ | 725000/818627 [11:37<02:09, 725.20 examples/s]
+Map (num_proc=16): 89%|████████▊ | 726000/818627 [11:38<02:03, 752.37 examples/s]
+Map (num_proc=16): 89%|████████▉ | 727000/818627 [11:39<01:50, 830.20 examples/s]
+Map (num_proc=16): 89%|████████▉ | 728000/818627 [11:40<01:28, 1026.93 examples/s]
+Map (num_proc=16): 89%|████████▉ | 729000/818627 [11:40<01:04, 1387.57 examples/s]
+Map (num_proc=16): 89%|████████▉ | 730000/818627 [11:40<00:49, 1792.52 examples/s]
+Map (num_proc=16): 89%|████████▉ | 732000/818627 [11:41<00:50, 1703.27 examples/s]
+Map (num_proc=16): 90%|████████▉ | 733000/818627 [11:42<01:01, 1402.69 examples/s]
+Map (num_proc=16): 90%|████████▉ | 735000/818627 [11:45<01:12, 1150.53 examples/s]
+Map (num_proc=16): 90%|████████▉ | 736000/818627 [11:45<01:00, 1361.90 examples/s]
+Map (num_proc=16): 90%|█████████ | 737000/818627 [11:45<00:55, 1477.79 examples/s]
+Map (num_proc=16): 90%|█████████ | 738000/818627 [11:47<01:12, 1110.90 examples/s]
+Map (num_proc=16): 90%|█████████ | 739000/818627 [11:48<01:22, 970.80 examples/s]
+Map (num_proc=16): 90%|█████████ | 740000/818627 [11:51<02:08, 613.25 examples/s]
+Map (num_proc=16): 91%|█████████ | 741000/818627 [11:52<01:50, 703.35 examples/s]
+Map (num_proc=16): 91%|█████████ | 742000/818627 [11:53<01:30, 844.57 examples/s]
+Map (num_proc=16): 91%|█████████ | 743000/818627 [11:54<01:17, 976.38 examples/s]
+Map (num_proc=16): 91%|█████████ | 744000/818627 [11:54<01:06, 1125.81 examples/s]
+Map (num_proc=16): 91%|█████████ | 745000/818627 [11:54<00:50, 1446.02 examples/s]
+Map (num_proc=16): 91%|█████████ | 746000/818627 [11:55<00:39, 1826.98 examples/s]
+Map (num_proc=16): 91%|█████████▏| 747000/818627 [11:55<00:37, 1906.18 examples/s]
+Map (num_proc=16): 91%|█████████▏| 748000/818627 [11:56<00:40, 1734.57 examples/s]
+Map (num_proc=16): 91%|█████████▏| 749000/818627 [11:57<00:51, 1355.92 examples/s]
+Map (num_proc=16): 92%|█████████▏| 750000/818627 [11:58<00:56, 1220.22 examples/s]
+Map (num_proc=16): 92%|█████████▏| 751000/818627 [11:59<01:07, 1002.70 examples/s]
+Map (num_proc=16): 92%|█████████▏| 752000/818627 [12:01<01:12, 920.38 examples/s]
+Map (num_proc=16): 92%|█████████▏| 753000/818627 [12:01<00:59, 1108.20 examples/s]
+Map (num_proc=16): 92%|█████████▏| 755000/818627 [12:03<00:59, 1074.85 examples/s]
+Map (num_proc=16): 92%|█████████▏| 756000/818627 [12:07<01:40, 620.16 examples/s]
+Map (num_proc=16): 92%|█████████▏| 757000/818627 [12:07<01:17, 797.01 examples/s]
+Map (num_proc=16): 93%|█████████▎| 758000/818627 [12:08<01:15, 808.14 examples/s]
+Map (num_proc=16): 93%|█████████▎| 759000/818627 [12:08<00:59, 1010.35 examples/s]
+Map (num_proc=16): 93%|█████████▎| 760000/818627 [12:09<00:45, 1302.78 examples/s]
+Map (num_proc=16): 93%|█████████▎| 761000/818627 [12:09<00:37, 1522.63 examples/s]
+Map (num_proc=16): 93%|█████████▎| 762000/818627 [12:10<00:44, 1263.01 examples/s]
+Map (num_proc=16): 93%|█████████▎| 763000/818627 [12:10<00:34, 1612.67 examples/s]
+Map (num_proc=16): 93%|█████████▎| 764000/818627 [12:11<00:26, 2025.08 examples/s]
+Map (num_proc=16): 93%|█████████▎| 765000/818627 [12:12<00:39, 1375.03 examples/s]
+Map (num_proc=16): 94%|█████████▎| 766000/818627 [12:13<00:48, 1095.08 examples/s]
+Map (num_proc=16): 94%|█████████▎| 767000/818627 [12:14<00:46, 1107.18 examples/s]
+Map (num_proc=16): 94%|█████████▍| 768000/818627 [12:15<00:47, 1072.13 examples/s]
+Map (num_proc=16): 94%|█████████▍| 769000/818627 [12:15<00:35, 1395.37 examples/s]
+Map (num_proc=16): 94%|█████████▍| 770000/818627 [12:16<00:35, 1370.95 examples/s]
+Map (num_proc=16): 94%|█████████▍| 771000/818627 [12:18<00:54, 877.67 examples/s]
+Map (num_proc=16): 94%|█████████▍| 772000/818627 [12:21<01:19, 584.86 examples/s]
+Map (num_proc=16): 94%|█████████▍| 773000/818627 [12:22<01:07, 673.47 examples/s]
+Map (num_proc=16): 95%|█████████▍| 776000/818627 [12:23<00:36, 1162.08 examples/s]
+Map (num_proc=16): 95%|█████████▍| 776164/818627 [12:23<00:37, 1136.82 examples/s]
+Map (num_proc=16): 95%|█████████▍| 777164/818627 [12:24<00:28, 1444.26 examples/s]
+Map (num_proc=16): 95%|█████████▌| 778164/818627 [12:24<00:21, 1876.68 examples/s]
+Map (num_proc=16): 95%|█████████▌| 779164/818627 [12:25<00:28, 1386.15 examples/s]
+Map (num_proc=16): 95%|█████████▌| 780164/818627 [12:26<00:27, 1399.22 examples/s]
+Map (num_proc=16): 95%|█████████▌| 781164/818627 [12:26<00:23, 1593.33 examples/s]
+Map (num_proc=16): 96%|█████████▌| 782164/818627 [12:28<00:39, 926.12 examples/s]
+Map (num_proc=16): 96%|█████████▌| 783164/818627 [12:29<00:35, 989.30 examples/s]
+Map (num_proc=16): 96%|█████████▌| 784164/818627 [12:30<00:29, 1181.20 examples/s]
+Map (num_proc=16): 96%|█████████▌| 785164/818627 [12:30<00:21, 1542.42 examples/s]
+Map (num_proc=16): 96%|█████████▌| 786164/818627 [12:30<00:19, 1632.63 examples/s]
+Map (num_proc=16): 96%|█████████▌| 787328/818627 [12:33<00:39, 796.32 examples/s]
+Map (num_proc=16): 96%|█████████▋| 788328/818627 [12:35<00:41, 722.21 examples/s]
+Map (num_proc=16): 96%|█████████▋| 789328/818627 [12:36<00:37, 786.43 examples/s]
+Map (num_proc=16): 97%|█████████▋| 791328/818627 [12:37<00:23, 1139.16 examples/s]
+Map (num_proc=16): 97%|█████████▋| 793328/818627 [12:38<00:18, 1392.36 examples/s]
+Map (num_proc=16): 97%|█████████▋| 795328/818627 [12:39<00:14, 1633.19 examples/s]
+Map (num_proc=16): 97%|█████████▋| 795657/818627 [12:39<00:15, 1507.56 examples/s]
+Map (num_proc=16): 97%|█████████▋| 796657/818627 [12:39<00:12, 1760.30 examples/s]
+Map (num_proc=16): 97%|█████████▋| 797821/818627 [12:42<00:20, 1011.62 examples/s]
+Map (num_proc=16): 98%|█████████▊| 798821/818627 [12:42<00:17, 1116.67 examples/s]
+Map (num_proc=16): 98%|█████████▊| 799821/818627 [12:43<00:14, 1289.12 examples/s]
+Map (num_proc=16): 98%|█████████▊| 800821/818627 [12:43<00:11, 1561.67 examples/s]
+Map (num_proc=16): 98%|█████████▊| 801821/818627 [12:45<00:15, 1053.78 examples/s]
+Map (num_proc=16): 98%|█████████▊| 802821/818627 [12:45<00:13, 1144.93 examples/s]
+Map (num_proc=16): 98%|█████████▊| 803821/818627 [12:47<00:16, 878.23 examples/s]
+Map (num_proc=16): 98%|█████████▊| 804821/818627 [12:47<00:12, 1135.03 examples/s]
+Map (num_proc=16): 98%|█████████▊| 805821/818627 [12:48<00:08, 1450.78 examples/s]
+Map (num_proc=16): 99%|█████████▊| 806821/818627 [12:48<00:07, 1547.58 examples/s]
+Map (num_proc=16): 99%|█████████▊| 807149/818627 [12:49<00:10, 1120.98 examples/s]
+Map (num_proc=16): 99%|█████████▊| 808149/818627 [12:50<00:09, 1066.92 examples/s]
+Map (num_proc=16): 99%|█████████▉| 809149/818627 [12:51<00:09, 1007.08 examples/s]
+Map (num_proc=16): 99%|█████████▉| 809313/818627 [12:51<00:09, 993.20 examples/s]
+Map (num_proc=16): 99%|█████████▉| 810313/818627 [12:52<00:06, 1229.90 examples/s]
+Map (num_proc=16): 99%|█████████▉| 811313/818627 [12:52<00:04, 1723.80 examples/s]
+Map (num_proc=16): 99%|█████████▉| 812313/818627 [12:52<00:03, 2077.87 examples/s]
+Map (num_proc=16): 99%|█████████▉| 812641/818627 [12:53<00:04, 1377.02 examples/s]
+Map (num_proc=16): 99%|█████████▉| 812970/818627 [12:54<00:05, 1091.18 examples/s]
+Map (num_proc=16): 99%|█████████▉| 813970/818627 [12:54<00:03, 1535.19 examples/s]
+Map (num_proc=16): 100%|█████████▉| 814970/818627 [12:54<00:01, 2094.66 examples/s]
+Map (num_proc=16): 100%|█████████▉| 816134/818627 [12:56<00:02, 1039.33 examples/s]
+Map (num_proc=16): 100%|█████████▉| 817134/818627 [12:56<00:01, 1423.75 examples/s]
+Map (num_proc=16): 100%|█████████▉| 818463/818627 [13:01<00:00, 523.22 examples/s]
+Map (num_proc=16): 100%|██████████| 818627/818627 [13:03<00:00, 1044.55 examples/s]
+/workspace/miniconda3/envs/specforge/lib/python3.11/site-packages/torch/distributed/distributed_c10d.py:4876: UserWarning: barrier(): using the device under current context. You can specify `device_id` in `init_process_group` to mute this warning.
+ warnings.warn( # warn only once
+[rank0]:[W309 17:02:55.540602358 ProcessGroupNCCL.cpp:5072] Guessing device ID based on global rank. This can cause a hang if rank to GPU mapping is heterogeneous. You can specify device_id in init_process_group()
+
+Filter: 0%| | 0/818627 [00:00, ? examples/s]dataset is cached at /workspace/hanrui/syxin_old/Specforge/cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkl
+dataset is cached at /workspace/hanrui/syxin_old/Specforge/cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkl
+dataset is cached at /workspace/hanrui/syxin_old/Specforge/cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkl
+dataset is cached at /workspace/hanrui/syxin_old/Specforge/cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkl
+dataset is cached at /workspace/hanrui/syxin_old/Specforge/cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkl
+dataset is cached at /workspace/hanrui/syxin_old/Specforge/cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkl
+dataset is cached at /workspace/hanrui/syxin_old/Specforge/cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkl
+
+Filter: 0%| | 1000/818627 [00:00<02:11, 6233.11 examples/s]
+Filter: 0%| | 0/818627 [00:00, ? examples/s]
+Filter: 0%| | 2000/818627 [00:00<02:00, 6760.22 examples/s]
+Filter: 0%| | 0/818627 [00:00, ? examples/s]
+Filter: 0%| | 0/818627 [00:00, ? examples/s]
+Filter: 0%| | 0/818627 [00:00, ? examples/s]
+Filter: 0%| | 0/818627 [00:00, ? examples/s]
+Filter: 0%| | 0/818627 [00:00, ? examples/s]
+Filter: 0%| | 0/818627 [00:00, ? examples/s]
+Filter: 0%| | 2000/818627 [00:00<01:11, 11484.95 examples/s]
+Filter: 0%| | 3000/818627 [00:00<01:50, 7352.96 examples/s]
+Filter: 0%| | 2000/818627 [00:00<01:06, 12223.05 examples/s]
+Filter: 0%| | 2000/818627 [00:00<01:09, 11795.07 examples/s]
+Filter: 0%| | 2000/818627 [00:00<01:10, 11655.04 examples/s]
+Filter: 0%| | 2000/818627 [00:00<01:08, 11897.23 examples/s]
+Filter: 0%| | 2000/818627 [00:00<01:09, 11750.50 examples/s]
+Filter: 0%| | 2000/818627 [00:00<01:12, 11282.55 examples/s]
+Filter: 0%| | 4000/818627 [00:00<01:41, 8061.79 examples/s]
+Filter: 0%| | 4000/818627 [00:00<01:07, 12133.95 examples/s]
+Filter: 0%| | 4000/818627 [00:00<01:04, 12572.85 examples/s]
+Filter: 0%| | 4000/818627 [00:00<01:04, 12599.14 examples/s]
+Filter: 0%| | 4000/818627 [00:00<01:04, 12578.09 examples/s]
+Filter: 0%| | 4000/818627 [00:00<01:04, 12578.49 examples/s]
+Filter: 0%| | 4000/818627 [00:00<01:04, 12536.43 examples/s]
+Filter: 0%| | 4000/818627 [00:00<01:07, 12001.36 examples/s]
+Filter: 1%| | 6000/818627 [00:00<01:08, 11905.77 examples/s]
+Filter: 1%| | 6000/818627 [00:00<01:30, 8951.20 examples/s]
+Filter: 1%| | 6000/818627 [00:00<01:03, 12848.21 examples/s]
+Filter: 1%| | 6000/818627 [00:00<01:03, 12847.39 examples/s]
+Filter: 1%| | 6000/818627 [00:00<01:03, 12756.49 examples/s]
+Filter: 1%| | 6000/818627 [00:00<01:03, 12745.95 examples/s]
+Filter: 1%| | 6000/818627 [00:00<01:04, 12594.06 examples/s]
+Filter: 1%| | 6000/818627 [00:00<01:06, 12240.64 examples/s]
+Filter: 1%| | 7000/818627 [00:00<01:30, 9009.37 examples/s]
+Filter: 1%| | 8000/818627 [00:00<01:30, 8929.46 examples/s]
+Filter: 1%| | 8000/818627 [00:00<01:03, 12841.41 examples/s]
+Filter: 1%| | 8000/818627 [00:00<01:17, 10514.79 examples/s]
+Filter: 1%| | 8000/818627 [00:00<01:02, 12869.23 examples/s]
+Filter: 1%| | 8000/818627 [00:00<01:03, 12693.47 examples/s]
+Filter: 1%| | 8000/818627 [00:00<01:03, 12773.09 examples/s]
+Filter: 1%| | 8000/818627 [00:00<01:03, 12735.76 examples/s]
+Filter: 1%| | 8000/818627 [00:00<01:06, 12266.40 examples/s]
+Filter: 1%| | 9000/818627 [00:01<01:31, 8849.83 examples/s]
+Filter: 1%| | 10000/818627 [00:00<01:11, 11235.65 examples/s]
+Filter: 1%| | 10000/818627 [00:00<01:13, 11007.85 examples/s]
+Filter: 1%| | 10000/818627 [00:00<01:13, 10970.02 examples/s]
+Filter: 1%| | 10000/818627 [00:00<01:11, 11272.24 examples/s]
+Filter: 1%| | 10000/818627 [00:00<01:11, 11262.67 examples/s]
+Filter: 1%| | 10000/818627 [00:00<01:10, 11498.88 examples/s]
+Filter: 1%| | 10000/818627 [00:00<01:22, 9779.89 examples/s]
+Filter: 1%| | 10000/818627 [00:01<01:32, 8753.29 examples/s]
+Filter: 1%|▏ | 11000/818627 [00:01<01:32, 8763.52 examples/s]
+Filter: 1%|▏ | 12000/818627 [00:01<01:18, 10234.35 examples/s]
+Filter: 1%|▏ | 12000/818627 [00:01<01:19, 10088.88 examples/s]
+Filter: 1%|▏ | 12000/818627 [00:01<01:19, 10107.93 examples/s]
+Filter: 1%|▏ | 12000/818627 [00:01<01:25, 9394.76 examples/s]
+Filter: 1%|▏ | 12000/818627 [00:01<01:18, 10248.52 examples/s]
+Filter: 1%|▏ | 12000/818627 [00:01<01:17, 10374.35 examples/s]
+Filter: 1%|▏ | 12000/818627 [00:01<01:18, 10250.81 examples/s]
+Filter: 1%|▏ | 12000/818627 [00:01<01:31, 8780.16 examples/s]
+Filter: 2%|▏ | 13000/818627 [00:01<01:27, 9251.35 examples/s]
+Filter: 2%|▏ | 13000/818627 [00:01<01:31, 8760.15 examples/s]
+Filter: 2%|▏ | 14000/818627 [00:01<01:23, 9688.75 examples/s]
+Filter: 2%|▏ | 14000/818627 [00:01<01:23, 9599.59 examples/s]
+Filter: 2%|▏ | 14000/818627 [00:01<01:23, 9611.21 examples/s]
+Filter: 2%|▏ | 14000/818627 [00:01<01:22, 9702.35 examples/s]
+Filter: 2%|▏ | 14000/818627 [00:01<01:22, 9697.77 examples/s]
+Filter: 2%|▏ | 14000/818627 [00:01<01:28, 9137.10 examples/s]
+Filter: 2%|▏ | 14000/818627 [00:01<01:22, 9772.13 examples/s]
+Filter: 2%|▏ | 14000/818627 [00:01<01:31, 8758.22 examples/s]
+Filter: 2%|▏ | 15000/818627 [00:01<01:25, 9404.50 examples/s]
+Filter: 2%|▏ | 15000/818627 [00:01<01:24, 9470.56 examples/s]
+Filter: 2%|▏ | 15000/818627 [00:01<01:25, 9413.66 examples/s]
+Filter: 2%|▏ | 15000/818627 [00:01<01:24, 9483.24 examples/s]
+Filter: 2%|▏ | 15000/818627 [00:01<01:29, 9017.63 examples/s]
+Filter: 2%|▏ | 15000/818627 [00:01<01:32, 8728.51 examples/s]
+Filter: 2%|▏ | 15000/818627 [00:01<01:24, 9475.84 examples/s]
+Filter: 2%|▏ | 15000/818627 [00:01<01:24, 9535.39 examples/s]
+Filter: 2%|▏ | 16000/818627 [00:01<01:26, 9250.55 examples/s]
+Filter: 2%|▏ | 16000/818627 [00:01<01:26, 9300.03 examples/s]
+Filter: 2%|▏ | 16000/818627 [00:01<01:26, 9255.20 examples/s]
+Filter: 2%|▏ | 16000/818627 [00:01<01:26, 9307.91 examples/s]
+Filter: 2%|▏ | 16000/818627 [00:01<01:26, 9306.92 examples/s]
+Filter: 2%|▏ | 16000/818627 [00:01<01:29, 8936.18 examples/s]
+Filter: 2%|▏ | 16000/818627 [00:01<01:32, 8722.25 examples/s]
+Filter: 2%|▏ | 16000/818627 [00:01<01:25, 9347.06 examples/s]
+Filter: 2%|▏ | 17000/818627 [00:01<01:27, 9186.45 examples/s]
+Filter: 2%|▏ | 17000/818627 [00:01<01:27, 9148.09 examples/s]
+Filter: 2%|▏ | 17000/818627 [00:01<01:27, 9153.42 examples/s]
+Filter: 2%|▏ | 17000/818627 [00:01<01:29, 8910.61 examples/s]
+Filter: 2%|▏ | 17000/818627 [00:01<01:26, 9226.81 examples/s]
+Filter: 2%|▏ | 17000/818627 [00:01<01:27, 9189.12 examples/s]
+Filter: 2%|▏ | 17000/818627 [00:01<01:31, 8755.05 examples/s]
+Filter: 2%|▏ | 17000/818627 [00:01<01:27, 9187.86 examples/s]
+Filter: 2%|▏ | 18000/818627 [00:01<01:28, 9033.75 examples/s]
+Filter: 2%|▏ | 18000/818627 [00:01<01:28, 9038.34 examples/s]
+Filter: 2%|▏ | 18000/818627 [00:01<01:28, 9060.42 examples/s]
+Filter: 2%|▏ | 18000/818627 [00:01<01:30, 8851.67 examples/s]
+Filter: 2%|▏ | 18000/818627 [00:02<01:31, 8741.58 examples/s]
+Filter: 2%|▏ | 18000/818627 [00:01<01:28, 9062.12 examples/s]
+Filter: 2%|▏ | 18000/818627 [00:01<01:28, 9062.62 examples/s]
+Filter: 2%|▏ | 18000/818627 [00:01<01:28, 9086.39 examples/s]
+Filter: 2%|▏ | 19000/818627 [00:01<01:29, 8952.72 examples/s]
+Filter: 2%|▏ | 19000/818627 [00:01<01:29, 8954.15 examples/s]
+Filter: 2%|▏ | 19000/818627 [00:01<01:29, 8961.86 examples/s]
+Filter: 2%|▏ | 19000/818627 [00:01<01:30, 8816.23 examples/s]
+Filter: 2%|▏ | 19000/818627 [00:01<01:29, 8973.39 examples/s]
+Filter: 2%|▏ | 19000/818627 [00:01<01:29, 8972.12 examples/s]
+Filter: 2%|▏ | 19000/818627 [00:02<01:31, 8735.88 examples/s]
+Filter: 2%|▏ | 19000/818627 [00:01<01:28, 8987.48 examples/s]
+Filter: 2%|▏ | 20000/818627 [00:01<01:29, 8931.87 examples/s]
+Filter: 2%|▏ | 20000/818627 [00:01<01:29, 8912.91 examples/s]
+Filter: 2%|▏ | 20000/818627 [00:02<01:29, 8909.84 examples/s]
+Filter: 2%|▏ | 20000/818627 [00:01<01:29, 8934.17 examples/s]
+Filter: 2%|▏ | 20000/818627 [00:02<01:30, 8815.44 examples/s]
+Filter: 2%|▏ | 20000/818627 [00:01<01:29, 8945.05 examples/s]
+Filter: 2%|▏ | 20000/818627 [00:02<01:31, 8758.12 examples/s]
+Filter: 2%|▏ | 20000/818627 [00:01<01:29, 8920.05 examples/s]
+Filter: 3%|▎ | 21000/818627 [00:02<01:29, 8907.25 examples/s]
+Filter: 3%|▎ | 21000/818627 [00:02<01:29, 8891.90 examples/s]
+Filter: 3%|▎ | 21000/818627 [00:02<01:30, 8830.39 examples/s]
+Filter: 3%|▎ | 21000/818627 [00:02<01:30, 8790.58 examples/s]
+Filter: 3%|▎ | 21000/818627 [00:02<01:29, 8911.92 examples/s]
+Filter: 3%|▎ | 21000/818627 [00:02<01:29, 8882.25 examples/s]
+Filter: 3%|▎ | 21000/818627 [00:02<01:29, 8906.50 examples/s]
+Filter: 3%|▎ | 21000/818627 [00:02<01:29, 8916.49 examples/s]
+Filter: 3%|▎ | 22000/818627 [00:02<01:29, 8883.32 examples/s]
+Filter: 3%|▎ | 22000/818627 [00:02<01:29, 8887.41 examples/s]
+Filter: 3%|▎ | 22000/818627 [00:02<01:29, 8884.12 examples/s]
+Filter: 3%|▎ | 22000/818627 [00:02<01:30, 8806.74 examples/s]
+Filter: 3%|▎ | 22000/818627 [00:02<01:30, 8829.42 examples/s]
+Filter: 3%|▎ | 22000/818627 [00:02<01:29, 8890.95 examples/s]
+Filter: 3%|▎ | 22000/818627 [00:02<01:29, 8886.92 examples/s]
+Filter: 3%|▎ | 22000/818627 [00:02<01:29, 8893.97 examples/s]
+Filter: 3%|▎ | 23000/818627 [00:02<01:29, 8885.99 examples/s]
+Filter: 3%|▎ | 23000/818627 [00:02<01:29, 8890.03 examples/s]
+Filter: 3%|▎ | 23000/818627 [00:02<01:29, 8886.38 examples/s]
+Filter: 3%|▎ | 23000/818627 [00:02<01:29, 8847.73 examples/s]
+Filter: 3%|▎ | 23000/818627 [00:02<01:29, 8890.15 examples/s]
+Filter: 3%|▎ | 23000/818627 [00:02<01:29, 8888.33 examples/s]
+Filter: 3%|▎ | 23000/818627 [00:02<01:29, 8894.66 examples/s]
+Filter: 3%|▎ | 23000/818627 [00:02<01:30, 8758.87 examples/s]
+Filter: 3%|▎ | 24000/818627 [00:02<01:29, 8872.57 examples/s]
+Filter: 3%|▎ | 24000/818627 [00:02<01:29, 8865.86 examples/s]
+Filter: 3%|▎ | 24000/818627 [00:02<01:29, 8869.93 examples/s]
+Filter: 3%|▎ | 24000/818627 [00:02<01:29, 8843.48 examples/s]
+Filter: 3%|▎ | 24000/818627 [00:02<01:29, 8871.58 examples/s]
+Filter: 3%|▎ | 24000/818627 [00:02<01:29, 8848.63 examples/s]
+Filter: 3%|▎ | 24000/818627 [00:02<01:29, 8869.70 examples/s]
+Filter: 3%|▎ | 24000/818627 [00:02<01:29, 8872.39 examples/s]
+Filter: 3%|▎ | 25000/818627 [00:02<01:30, 8787.68 examples/s]
+Filter: 3%|▎ | 25000/818627 [00:02<01:30, 8790.03 examples/s]
+Filter: 3%|▎ | 25000/818627 [00:02<01:30, 8776.67 examples/s]
+Filter: 3%|▎ | 25000/818627 [00:02<01:30, 8769.85 examples/s]
+Filter: 3%|▎ | 25000/818627 [00:02<01:30, 8792.32 examples/s]
+Filter: 3%|▎ | 25000/818627 [00:02<01:30, 8790.92 examples/s]
+Filter: 3%|▎ | 25000/818627 [00:02<01:30, 8770.70 examples/s]
+Filter: 3%|▎ | 25000/818627 [00:02<01:30, 8792.66 examples/s]
+Filter: 3%|▎ | 26000/818627 [00:02<01:29, 8821.80 examples/s]
+Filter: 3%|▎ | 26000/818627 [00:02<01:29, 8823.12 examples/s]
+Filter: 3%|▎ | 26000/818627 [00:02<01:29, 8828.79 examples/s]
+Filter: 3%|▎ | 26000/818627 [00:02<01:29, 8825.36 examples/s]
+Filter: 3%|▎ | 26000/818627 [00:02<01:29, 8823.50 examples/s]
+Filter: 3%|▎ | 26000/818627 [00:02<01:30, 8801.53 examples/s]
+Filter: 3%|▎ | 26000/818627 [00:03<01:29, 8810.70 examples/s]
+Filter: 3%|▎ | 26000/818627 [00:02<01:29, 8826.14 examples/s]
+Filter: 3%|▎ | 27000/818627 [00:02<01:29, 8827.94 examples/s]
+Filter: 3%|▎ | 27000/818627 [00:02<01:29, 8821.99 examples/s]
+Filter: 3%|▎ | 27000/818627 [00:02<01:29, 8827.13 examples/s]
+Filter: 3%|▎ | 27000/818627 [00:03<01:29, 8822.93 examples/s]
+Filter: 3%|▎ | 27000/818627 [00:02<01:29, 8819.76 examples/s]
+Filter: 3%|▎ | 27000/818627 [00:02<01:29, 8822.71 examples/s]
+Filter: 3%|▎ | 27000/818627 [00:02<01:29, 8824.46 examples/s]
+Filter: 3%|▎ | 27000/818627 [00:02<01:31, 8677.57 examples/s]
+Filter: 3%|▎ | 28000/818627 [00:02<01:29, 8831.69 examples/s]
+Filter: 3%|▎ | 28000/818627 [00:02<01:29, 8830.60 examples/s]
+Filter: 3%|▎ | 28000/818627 [00:02<01:29, 8832.06 examples/s]
+Filter: 3%|▎ | 28000/818627 [00:03<01:29, 8823.71 examples/s]
+Filter: 3%|▎ | 28000/818627 [00:03<01:29, 8823.83 examples/s]
+Filter: 3%|▎ | 28000/818627 [00:02<01:29, 8829.63 examples/s]
+Filter: 3%|▎ | 28000/818627 [00:02<01:29, 8869.60 examples/s]
+Filter: 3%|▎ | 28000/818627 [00:02<01:29, 8828.99 examples/s]
+Filter: 4%|▎ | 29000/818627 [00:03<01:29, 8862.25 examples/s]
+Filter: 4%|▎ | 29000/818627 [00:03<01:29, 8864.51 examples/s]
+Filter: 4%|▎ | 29000/818627 [00:03<01:29, 8858.54 examples/s]
+Filter: 4%|▎ | 29000/818627 [00:03<01:29, 8858.43 examples/s]
+Filter: 4%|▎ | 29000/818627 [00:03<01:29, 8861.47 examples/s]
+Filter: 4%|▎ | 29000/818627 [00:03<01:29, 8853.00 examples/s]
+Filter: 4%|▎ | 29000/818627 [00:03<01:28, 8890.05 examples/s]
+Filter: 4%|▎ | 29000/818627 [00:03<01:29, 8861.25 examples/s]
+Filter: 4%|▎ | 30000/818627 [00:03<01:29, 8799.86 examples/s]
+Filter: 4%|▎ | 30000/818627 [00:03<01:29, 8802.14 examples/s]
+Filter: 4%|▎ | 30000/818627 [00:03<01:29, 8798.36 examples/s]
+Filter: 4%|▎ | 30000/818627 [00:03<01:29, 8797.61 examples/s]
+Filter: 4%|▎ | 30000/818627 [00:03<01:29, 8797.42 examples/s]
+Filter: 4%|▎ | 30000/818627 [00:03<01:29, 8824.52 examples/s]
+Filter: 4%|▎ | 30000/818627 [00:03<01:29, 8800.82 examples/s]
+Filter: 4%|▎ | 30000/818627 [00:03<01:29, 8802.39 examples/s]
+Filter: 4%|▍ | 31000/818627 [00:03<01:29, 8794.40 examples/s]
+Filter: 4%|▍ | 31000/818627 [00:03<01:29, 8795.83 examples/s]
+Filter: 4%|▍ | 31000/818627 [00:03<01:29, 8793.21 examples/s]
+Filter: 4%|▍ | 31000/818627 [00:03<01:29, 8791.98 examples/s]
+Filter: 4%|▍ | 31000/818627 [00:03<01:29, 8791.46 examples/s]
+Filter: 4%|▍ | 31000/818627 [00:03<01:29, 8794.30 examples/s]
+Filter: 4%|▍ | 31000/818627 [00:03<01:29, 8797.83 examples/s]
+Filter: 4%|▍ | 31000/818627 [00:03<01:29, 8807.39 examples/s]
+Filter: 4%|▍ | 32000/818627 [00:03<01:29, 8811.58 examples/s]
+Filter: 4%|▍ | 32000/818627 [00:03<01:29, 8806.59 examples/s]
+Filter: 4%|▍ | 32000/818627 [00:03<01:29, 8805.83 examples/s]
+Filter: 4%|▍ | 32000/818627 [00:03<01:29, 8808.50 examples/s]
+Filter: 4%|▍ | 32000/818627 [00:03<01:29, 8812.92 examples/s]
+Filter: 4%|▍ | 32000/818627 [00:03<01:29, 8809.28 examples/s]
+Filter: 4%|▍ | 32000/818627 [00:03<01:29, 8819.97 examples/s]
+Filter: 4%|▍ | 32000/818627 [00:03<01:29, 8803.94 examples/s]
+Filter: 4%|▍ | 33000/818627 [00:03<01:29, 8775.72 examples/s]
+Filter: 4%|▍ | 33000/818627 [00:03<01:29, 8775.34 examples/s]
+Filter: 4%|▍ | 33000/818627 [00:03<01:29, 8771.80 examples/s]
+Filter: 4%|▍ | 33000/818627 [00:03<01:29, 8776.25 examples/s]
+Filter: 4%|▍ | 33000/818627 [00:03<01:29, 8773.53 examples/s]
+Filter: 4%|▍ | 33000/818627 [00:03<01:29, 8788.04 examples/s]
+Filter: 4%|▍ | 33000/818627 [00:03<01:29, 8775.05 examples/s]
+Filter: 4%|▍ | 33000/818627 [00:03<01:29, 8775.51 examples/s]
+Filter: 4%|▍ | 34000/818627 [00:03<01:29, 8788.34 examples/s]
+Filter: 4%|▍ | 34000/818627 [00:03<01:29, 8788.07 examples/s]
+Filter: 4%|▍ | 34000/818627 [00:03<01:29, 8780.93 examples/s]
+Filter: 4%|▍ | 34000/818627 [00:03<01:29, 8787.39 examples/s]
+Filter: 4%|▍ | 34000/818627 [00:03<01:29, 8794.54 examples/s]
+Filter: 4%|▍ | 34000/818627 [00:03<01:29, 8787.09 examples/s]
+Filter: 4%|▍ | 34000/818627 [00:03<01:29, 8786.69 examples/s]
+Filter: 4%|▍ | 34000/818627 [00:03<01:29, 8787.06 examples/s]
+Filter: 4%|▍ | 35000/818627 [00:03<01:29, 8767.56 examples/s]
+Filter: 4%|▍ | 35000/818627 [00:03<01:29, 8769.57 examples/s]
+Filter: 4%|▍ | 35000/818627 [00:03<01:29, 8764.32 examples/s]
+Filter: 4%|▍ | 35000/818627 [00:04<01:29, 8764.60 examples/s]
+Filter: 4%|▍ | 35000/818627 [00:03<01:29, 8765.65 examples/s]
+Filter: 4%|▍ | 35000/818627 [00:03<01:29, 8766.09 examples/s]
+Filter: 4%|▍ | 35000/818627 [00:03<01:29, 8764.32 examples/s]
+Filter: 4%|▍ | 35000/818627 [00:03<01:29, 8763.02 examples/s]
+Filter: 4%|▍ | 36000/818627 [00:03<01:29, 8783.38 examples/s]
+Filter: 4%|▍ | 36000/818627 [00:03<01:29, 8783.84 examples/s]
+Filter: 4%|▍ | 36000/818627 [00:03<01:29, 8781.08 examples/s]
+Filter: 4%|▍ | 36000/818627 [00:03<01:29, 8783.46 examples/s]
+Filter: 4%|▍ | 36000/818627 [00:04<01:29, 8781.86 examples/s]
+Filter: 4%|▍ | 36000/818627 [00:03<01:29, 8787.56 examples/s]
+Filter: 4%|▍ | 36000/818627 [00:03<01:29, 8782.00 examples/s]
+Filter: 4%|▍ | 36000/818627 [00:03<01:29, 8780.81 examples/s]
+Filter: 5%|▍ | 37000/818627 [00:03<01:29, 8772.12 examples/s]
+Filter: 5%|▍ | 37000/818627 [00:03<01:29, 8770.92 examples/s]
+Filter: 5%|▍ | 37000/818627 [00:03<01:29, 8768.89 examples/s]
+Filter: 5%|▍ | 37000/818627 [00:04<01:29, 8770.54 examples/s]
+Filter: 5%|▍ | 37000/818627 [00:03<01:29, 8775.50 examples/s]
+Filter: 5%|▍ | 37000/818627 [00:04<01:29, 8770.42 examples/s]
+Filter: 5%|▍ | 37000/818627 [00:03<01:29, 8772.21 examples/s]
+Filter: 5%|▍ | 37000/818627 [00:03<01:29, 8769.50 examples/s]
+Filter: 5%|▍ | 38000/818627 [00:04<01:28, 8802.72 examples/s]
+Filter: 5%|▍ | 38000/818627 [00:04<01:28, 8802.03 examples/s]
+Filter: 5%|▍ | 38000/818627 [00:04<01:28, 8798.30 examples/s]
+Filter: 5%|▍ | 38000/818627 [00:04<01:28, 8800.69 examples/s]
+Filter: 5%|▍ | 38000/818627 [00:04<01:28, 8800.15 examples/s]
+Filter: 5%|▍ | 38000/818627 [00:04<01:28, 8800.73 examples/s]
+Filter: 5%|▍ | 38000/818627 [00:04<01:28, 8793.99 examples/s]
+Filter: 5%|▍ | 38000/818627 [00:04<01:28, 8798.58 examples/s]
+Filter: 5%|▍ | 39000/818627 [00:04<01:28, 8818.63 examples/s]
+Filter: 5%|▍ | 39000/818627 [00:04<01:28, 8816.29 examples/s]
+Filter: 5%|▍ | 39000/818627 [00:04<01:28, 8819.62 examples/s]
+Filter: 5%|▍ | 39000/818627 [00:04<01:28, 8815.12 examples/s]
+Filter: 5%|▍ | 39000/818627 [00:04<01:28, 8814.08 examples/s]
+Filter: 5%|▍ | 39000/818627 [00:04<01:28, 8815.08 examples/s]
+Filter: 5%|▍ | 39000/818627 [00:04<01:28, 8809.59 examples/s]
+Filter: 5%|▍ | 39000/818627 [00:04<01:30, 8649.47 examples/s]
+Filter: 5%|▍ | 40000/818627 [00:04<01:28, 8840.73 examples/s]
+Filter: 5%|▍ | 40000/818627 [00:04<01:28, 8842.02 examples/s]
+Filter: 5%|▍ | 40000/818627 [00:04<01:27, 8890.15 examples/s]
+Filter: 5%|▍ | 40000/818627 [00:04<01:28, 8842.79 examples/s]
+Filter: 5%|▍ | 40000/818627 [00:04<01:28, 8845.42 examples/s]
+Filter: 5%|▍ | 40000/818627 [00:04<01:28, 8844.84 examples/s]
+Filter: 5%|▍ | 40000/818627 [00:04<01:28, 8844.66 examples/s]
+Filter: 5%|▍ | 40000/818627 [00:04<01:28, 8813.65 examples/s]
+Filter: 5%|▌ | 41000/818627 [00:04<01:28, 8833.21 examples/s]
+Filter: 5%|▌ | 41000/818627 [00:04<01:28, 8801.33 examples/s]
+Filter: 5%|▌ | 41000/818627 [00:04<01:28, 8801.35 examples/s]
+Filter: 5%|▌ | 41000/818627 [00:04<01:28, 8797.23 examples/s]
+Filter: 5%|▌ | 41000/818627 [00:04<01:28, 8804.43 examples/s]
+Filter: 5%|▌ | 41000/818627 [00:04<01:28, 8796.94 examples/s]
+Filter: 5%|▌ | 41000/818627 [00:04<01:29, 8657.26 examples/s]
+Filter: 5%|▌ | 41000/818627 [00:04<01:30, 8585.76 examples/s]
+Filter: 5%|▌ | 42000/818627 [00:04<01:28, 8793.97 examples/s]
+Filter: 5%|▌ | 42000/818627 [00:04<01:28, 8811.37 examples/s]
+Filter: 5%|▌ | 42000/818627 [00:04<01:27, 8831.08 examples/s]
+Filter: 5%|▌ | 42000/818627 [00:04<01:28, 8771.08 examples/s]
+Filter: 5%|▌ | 42000/818627 [00:04<01:28, 8770.53 examples/s]
+Filter: 5%|▌ | 42000/818627 [00:04<01:28, 8767.26 examples/s]
+Filter: 5%|▌ | 42000/818627 [00:04<01:28, 8771.05 examples/s]
+Filter: 5%|▌ | 42000/818627 [00:04<01:29, 8700.06 examples/s]
+Filter: 5%|▌ | 43000/818627 [00:04<01:28, 8801.93 examples/s]
+Filter: 5%|▌ | 43000/818627 [00:04<01:28, 8787.16 examples/s]
+Filter: 5%|▌ | 43000/818627 [00:04<01:28, 8773.96 examples/s]
+Filter: 5%|▌ | 43000/818627 [00:04<01:28, 8755.84 examples/s]
+Filter: 5%|▌ | 43000/818627 [00:04<01:28, 8756.19 examples/s]
+Filter: 5%|▌ | 43000/818627 [00:04<01:28, 8754.60 examples/s]
+Filter: 5%|▌ | 43000/818627 [00:04<01:28, 8757.74 examples/s]
+Filter: 5%|▌ | 43000/818627 [00:04<01:30, 8592.05 examples/s]
+Filter: 5%|▌ | 44000/818627 [00:04<01:28, 8800.63 examples/s]
+Filter: 5%|▌ | 44000/818627 [00:04<01:27, 8807.83 examples/s]
+Filter: 5%|▌ | 44000/818627 [00:04<01:27, 8812.84 examples/s]
+Filter: 5%|▌ | 44000/818627 [00:04<01:28, 8783.79 examples/s]
+Filter: 5%|▌ | 44000/818627 [00:04<01:28, 8781.32 examples/s]
+Filter: 5%|▌ | 44000/818627 [00:04<01:28, 8786.04 examples/s]
+Filter: 5%|▌ | 44000/818627 [00:04<01:27, 8832.03 examples/s]
+Filter: 5%|▌ | 44000/818627 [00:05<01:28, 8795.64 examples/s]
+Filter: 5%|▌ | 45000/818627 [00:04<01:28, 8761.90 examples/s]
+Filter: 5%|▌ | 45000/818627 [00:04<01:28, 8777.47 examples/s]
+Filter: 5%|▌ | 45000/818627 [00:04<01:28, 8764.09 examples/s]
+Filter: 5%|▌ | 45000/818627 [00:04<01:28, 8753.60 examples/s]
+Filter: 5%|▌ | 45000/818627 [00:04<01:28, 8752.06 examples/s]
+Filter: 5%|▌ | 45000/818627 [00:04<01:30, 8594.61 examples/s]
+Filter: 5%|▌ | 45000/818627 [00:04<01:29, 8618.72 examples/s]
+Filter: 5%|▌ | 45000/818627 [00:05<01:30, 8585.09 examples/s]
+Filter: 6%|▌ | 46000/818627 [00:04<01:28, 8778.02 examples/s]
+Filter: 6%|▌ | 46000/818627 [00:04<01:28, 8766.83 examples/s]
+Filter: 6%|▌ | 46000/818627 [00:04<01:28, 8771.99 examples/s]
+Filter: 6%|▌ | 46000/818627 [00:04<01:28, 8762.95 examples/s]
+Filter: 6%|▌ | 46000/818627 [00:04<01:28, 8763.03 examples/s]
+Filter: 6%|▌ | 46000/818627 [00:05<01:27, 8831.70 examples/s]
+Filter: 6%|▌ | 46000/818627 [00:05<01:29, 8642.05 examples/s]
+Filter: 6%|▌ | 46000/818627 [00:04<01:29, 8662.19 examples/s]
+Filter: 6%|▌ | 47000/818627 [00:05<01:27, 8773.23 examples/s]
+Filter: 6%|▌ | 47000/818627 [00:05<01:27, 8772.92 examples/s]
+Filter: 6%|▌ | 47000/818627 [00:05<01:28, 8741.05 examples/s]
+Filter: 6%|▌ | 47000/818627 [00:05<01:27, 8823.84 examples/s]
+Filter: 6%|▌ | 47000/818627 [00:05<01:28, 8710.78 examples/s]
+Filter: 6%|▌ | 47000/818627 [00:05<01:27, 8777.96 examples/s]
+Filter: 6%|▌ | 47000/818627 [00:05<01:28, 8674.72 examples/s]
+Filter: 6%|▌ | 47000/818627 [00:05<01:28, 8727.47 examples/s]
+Filter: 6%|▌ | 48000/818627 [00:05<01:27, 8825.36 examples/s]
+Filter: 6%|▌ | 48000/818627 [00:05<01:27, 8817.06 examples/s]
+Filter: 6%|▌ | 48000/818627 [00:05<01:27, 8808.99 examples/s]
+Filter: 6%|▌ | 48000/818627 [00:05<01:26, 8893.79 examples/s]
+Filter: 6%|▌ | 48000/818627 [00:05<01:27, 8835.14 examples/s]
+Filter: 6%|▌ | 48000/818627 [00:05<01:26, 8897.21 examples/s]
+Filter: 6%|▌ | 48000/818627 [00:05<01:27, 8824.31 examples/s]
+Filter: 6%|▌ | 48000/818627 [00:05<01:27, 8811.51 examples/s]
+Filter: 6%|▌ | 49000/818627 [00:05<01:27, 8767.49 examples/s]
+Filter: 6%|▌ | 49000/818627 [00:05<01:27, 8774.50 examples/s]
+Filter: 6%|▌ | 49000/818627 [00:05<01:27, 8768.03 examples/s]
+Filter: 6%|▌ | 49000/818627 [00:05<01:27, 8825.14 examples/s]
+Filter: 6%|▌ | 49000/818627 [00:05<01:27, 8831.21 examples/s]
+Filter: 6%|▌ | 49000/818627 [00:05<01:27, 8785.22 examples/s]
+Filter: 6%|▌ | 49000/818627 [00:05<01:27, 8776.88 examples/s]
+Filter: 6%|▌ | 49000/818627 [00:05<01:27, 8823.39 examples/s]
+Filter: 6%|▌ | 50000/818627 [00:05<01:27, 8752.16 examples/s]
+Filter: 6%|▌ | 50000/818627 [00:05<01:27, 8748.77 examples/s]
+Filter: 6%|▌ | 50000/818627 [00:05<01:27, 8740.48 examples/s]
+Filter: 6%|▌ | 50000/818627 [00:05<01:27, 8788.17 examples/s]
+Filter: 6%|▌ | 50000/818627 [00:05<01:27, 8792.04 examples/s]
+Filter: 6%|▌ | 50000/818627 [00:05<01:27, 8758.13 examples/s]
+Filter: 6%|▌ | 50000/818627 [00:05<01:27, 8756.31 examples/s]
+Filter: 6%|▌ | 50000/818627 [00:05<01:27, 8792.01 examples/s]
+Filter: 6%|▌ | 51000/818627 [00:05<01:28, 8686.69 examples/s]
+Filter: 6%|▌ | 51000/818627 [00:05<01:28, 8690.46 examples/s]
+Filter: 6%|▌ | 51000/818627 [00:05<01:28, 8686.23 examples/s]
+Filter: 6%|▌ | 51000/818627 [00:05<01:28, 8716.16 examples/s]
+Filter: 6%|▌ | 51000/818627 [00:05<01:28, 8719.25 examples/s]
+Filter: 6%|▌ | 51000/818627 [00:05<01:28, 8694.15 examples/s]
+Filter: 6%|▌ | 51000/818627 [00:05<01:28, 8690.31 examples/s]
+Filter: 6%|▌ | 51000/818627 [00:05<01:28, 8677.52 examples/s]
+Filter: 6%|▋ | 52000/818627 [00:05<01:27, 8741.91 examples/s]
+Filter: 6%|▋ | 52000/818627 [00:05<01:27, 8740.86 examples/s]
+Filter: 6%|▋ | 52000/818627 [00:05<01:27, 8736.48 examples/s]
+Filter: 6%|▋ | 52000/818627 [00:05<01:27, 8759.88 examples/s]
+Filter: 6%|▋ | 52000/818627 [00:05<01:27, 8749.49 examples/s]
+Filter: 6%|▋ | 52000/818627 [00:05<01:27, 8747.85 examples/s]
+Filter: 6%|▋ | 52000/818627 [00:05<01:27, 8779.95 examples/s]
+Filter: 6%|▋ | 52000/818627 [00:05<01:27, 8757.04 examples/s]
+Filter: 6%|▋ | 53000/818627 [00:05<01:30, 8500.92 examples/s]
+Filter: 6%|▋ | 53000/818627 [00:05<01:30, 8496.08 examples/s]
+Filter: 6%|▋ | 53000/818627 [00:05<01:30, 8493.42 examples/s]
+Filter: 6%|▋ | 53000/818627 [00:06<01:29, 8526.08 examples/s]
+Filter: 6%|▋ | 53000/818627 [00:05<01:29, 8513.08 examples/s]
+Filter: 6%|▋ | 53000/818627 [00:05<01:30, 8501.23 examples/s]
+Filter: 6%|▋ | 53000/818627 [00:05<01:30, 8502.89 examples/s]
+Filter: 6%|▋ | 53000/818627 [00:05<01:30, 8495.85 examples/s]
+Filter: 7%|▋ | 54000/818627 [00:05<01:31, 8351.77 examples/s]
+Filter: 7%|▋ | 54000/818627 [00:05<01:31, 8350.03 examples/s]
+Filter: 7%|▋ | 54000/818627 [00:05<01:31, 8346.54 examples/s]
+Filter: 7%|▋ | 54000/818627 [00:05<01:31, 8359.55 examples/s]
+Filter: 7%|▋ | 54000/818627 [00:05<01:31, 8358.19 examples/s]
+Filter: 7%|▋ | 54000/818627 [00:05<01:31, 8350.46 examples/s]
+Filter: 7%|▋ | 54000/818627 [00:05<01:31, 8350.07 examples/s]
+Filter: 7%|▋ | 54000/818627 [00:06<01:31, 8358.64 examples/s]
+Filter: 7%|▋ | 55000/818627 [00:05<01:28, 8630.94 examples/s]
+Filter: 7%|▋ | 55000/818627 [00:05<01:28, 8630.57 examples/s]
+Filter: 7%|▋ | 55000/818627 [00:06<01:28, 8628.87 examples/s]
+Filter: 7%|▋ | 55000/818627 [00:06<01:28, 8648.24 examples/s]
+Filter: 7%|▋ | 55000/818627 [00:06<01:28, 8637.36 examples/s]
+Filter: 7%|▋ | 55000/818627 [00:05<01:28, 8636.35 examples/s]
+Filter: 7%|▋ | 55000/818627 [00:05<01:28, 8629.42 examples/s]
+Filter: 7%|▋ | 55000/818627 [00:05<01:28, 8629.61 examples/s]
+Filter: 7%|▋ | 56000/818627 [00:06<01:28, 8646.26 examples/s]
+Filter: 7%|▋ | 56000/818627 [00:06<01:28, 8639.83 examples/s]
+Filter: 7%|▋ | 56000/818627 [00:06<01:28, 8655.74 examples/s]
+Filter: 7%|▋ | 56000/818627 [00:06<01:28, 8648.07 examples/s]
+Filter: 7%|▋ | 56000/818627 [00:06<01:28, 8645.62 examples/s]
+Filter: 7%|▋ | 56000/818627 [00:06<01:28, 8643.99 examples/s]
+Filter: 7%|▋ | 56000/818627 [00:06<01:28, 8641.98 examples/s]
+Filter: 7%|▋ | 56000/818627 [00:06<01:28, 8622.91 examples/s]
+Filter: 7%|▋ | 57000/818627 [00:06<01:24, 8965.21 examples/s]
+Filter: 7%|▋ | 57000/818627 [00:06<01:24, 8969.50 examples/s]
+Filter: 7%|▋ | 57000/818627 [00:06<01:24, 8961.08 examples/s]
+Filter: 7%|▋ | 57000/818627 [00:06<01:24, 8971.05 examples/s]
+Filter: 7%|▋ | 57000/818627 [00:06<01:24, 8969.30 examples/s]
+Filter: 7%|▋ | 57000/818627 [00:06<01:24, 8965.52 examples/s]
+Filter: 7%|▋ | 57000/818627 [00:06<01:24, 8965.09 examples/s]
+Filter: 7%|▋ | 57000/818627 [00:06<01:26, 8850.92 examples/s]
+Filter: 7%|▋ | 58000/818627 [00:06<01:24, 8993.53 examples/s]
+Filter: 7%|▋ | 58000/818627 [00:06<01:24, 8985.14 examples/s]
+Filter: 7%|▋ | 58000/818627 [00:06<01:24, 8982.88 examples/s]
+Filter: 7%|▋ | 58000/818627 [00:06<01:24, 9029.54 examples/s]
+Filter: 7%|▋ | 58000/818627 [00:06<01:24, 8986.46 examples/s]
+Filter: 7%|▋ | 58000/818627 [00:06<01:24, 8986.56 examples/s]
+Filter: 7%|▋ | 58000/818627 [00:06<01:24, 8986.51 examples/s]
+Filter: 7%|▋ | 58000/818627 [00:06<01:24, 8982.27 examples/s]
+Filter: 7%|▋ | 59000/818627 [00:06<01:25, 8833.95 examples/s]
+Filter: 7%|▋ | 59000/818627 [00:06<01:25, 8833.47 examples/s]
+Filter: 7%|▋ | 59000/818627 [00:06<01:25, 8833.18 examples/s]
+Filter: 7%|▋ | 59000/818627 [00:06<01:25, 8837.56 examples/s]
+Filter: 7%|▋ | 59000/818627 [00:06<01:25, 8837.18 examples/s]
+Filter: 7%|▋ | 59000/818627 [00:06<01:25, 8834.76 examples/s]
+Filter: 7%|▋ | 59000/818627 [00:06<01:25, 8834.87 examples/s]
+Filter: 7%|▋ | 59000/818627 [00:06<01:25, 8855.40 examples/s]
+Filter: 7%|▋ | 60000/818627 [00:06<01:26, 8747.76 examples/s]
+Filter: 7%|▋ | 60000/818627 [00:06<01:26, 8746.96 examples/s]
+Filter: 7%|▋ | 60000/818627 [00:06<01:26, 8743.55 examples/s]
+Filter: 7%|▋ | 60000/818627 [00:06<01:26, 8772.14 examples/s]
+Filter: 7%|▋ | 60000/818627 [00:06<01:26, 8745.96 examples/s]
+Filter: 7%|▋ | 60000/818627 [00:06<01:26, 8745.78 examples/s]
+Filter: 7%|▋ | 60000/818627 [00:06<01:26, 8745.19 examples/s]
+Filter: 7%|▋ | 60000/818627 [00:06<01:26, 8745.40 examples/s]
+Filter: 7%|▋ | 61000/818627 [00:06<01:26, 8725.33 examples/s]
+Filter: 7%|▋ | 61000/818627 [00:06<01:26, 8721.95 examples/s]
+Filter: 7%|▋ | 61000/818627 [00:06<01:26, 8721.57 examples/s]
+Filter: 7%|▋ | 61000/818627 [00:06<01:26, 8720.30 examples/s]
+Filter: 7%|▋ | 61000/818627 [00:06<01:26, 8721.36 examples/s]
+Filter: 7%|▋ | 61000/818627 [00:07<01:26, 8723.45 examples/s]
+Filter: 7%|▋ | 61000/818627 [00:06<01:27, 8692.47 examples/s]
+Filter: 7%|▋ | 61000/818627 [00:06<01:27, 8665.37 examples/s]
+Filter: 8%|▊ | 62000/818627 [00:06<01:25, 8863.03 examples/s]
+Filter: 8%|▊ | 62000/818627 [00:06<01:25, 8856.56 examples/s]
+Filter: 8%|▊ | 62000/818627 [00:06<01:25, 8842.13 examples/s]
+Filter: 8%|▊ | 62000/818627 [00:06<01:25, 8847.74 examples/s]
+Filter: 8%|▊ | 62000/818627 [00:07<01:25, 8856.59 examples/s]
+Filter: 8%|▊ | 62000/818627 [00:06<01:25, 8846.74 examples/s]
+Filter: 8%|▊ | 62000/818627 [00:06<01:25, 8847.00 examples/s]
+Filter: 8%|▊ | 62000/818627 [00:06<01:25, 8847.28 examples/s]
+Filter: 8%|▊ | 63000/818627 [00:06<01:23, 9043.81 examples/s]
+Filter: 8%|▊ | 63000/818627 [00:06<01:23, 9046.14 examples/s]
+Filter: 8%|▊ | 63000/818627 [00:06<01:23, 9035.77 examples/s]
+Filter: 8%|▊ | 63000/818627 [00:07<01:23, 9052.23 examples/s]
+Filter: 8%|▊ | 63000/818627 [00:06<01:23, 9036.85 examples/s]
+Filter: 8%|▊ | 63000/818627 [00:06<01:23, 9032.51 examples/s]
+Filter: 8%|▊ | 63000/818627 [00:06<01:23, 9032.89 examples/s]
+Filter: 8%|▊ | 63000/818627 [00:06<01:23, 9002.20 examples/s]
+Filter: 8%|▊ | 64000/818627 [00:07<01:24, 8894.45 examples/s]
+Filter: 8%|▊ | 64000/818627 [00:07<01:24, 8887.63 examples/s]
+Filter: 8%|▊ | 64000/818627 [00:07<01:24, 8886.22 examples/s]
+Filter: 8%|▊ | 64000/818627 [00:07<01:24, 8883.84 examples/s]
+Filter: 8%|▊ | 64000/818627 [00:07<01:24, 8885.77 examples/s]
+Filter: 8%|▊ | 64000/818627 [00:07<01:24, 8886.60 examples/s]
+Filter: 8%|▊ | 64000/818627 [00:07<01:24, 8891.72 examples/s]
+Filter: 8%|▊ | 64000/818627 [00:07<01:24, 8882.51 examples/s]
+Filter: 8%|▊ | 65000/818627 [00:07<01:25, 8783.67 examples/s]
+Filter: 8%|▊ | 65000/818627 [00:07<01:25, 8778.28 examples/s]
+Filter: 8%|▊ | 65000/818627 [00:07<01:25, 8790.69 examples/s]
+Filter: 8%|▊ | 65000/818627 [00:07<01:25, 8787.86 examples/s]
+Filter: 8%|▊ | 65000/818627 [00:07<01:25, 8795.91 examples/s]
+Filter: 8%|▊ | 65000/818627 [00:07<01:25, 8789.67 examples/s]
+Filter: 8%|▊ | 65000/818627 [00:07<01:25, 8782.17 examples/s]
+Filter: 8%|▊ | 65000/818627 [00:07<01:25, 8769.38 examples/s]
+Filter: 8%|▊ | 66000/818627 [00:07<01:26, 8689.09 examples/s]
+Filter: 8%|▊ | 66000/818627 [00:07<01:26, 8690.44 examples/s]
+Filter: 8%|▊ | 66000/818627 [00:07<01:26, 8690.89 examples/s]
+Filter: 8%|▊ | 66000/818627 [00:07<01:26, 8683.92 examples/s]
+Filter: 8%|▊ | 66000/818627 [00:07<01:26, 8683.58 examples/s]
+Filter: 8%|▊ | 66000/818627 [00:07<01:26, 8688.47 examples/s]
+Filter: 8%|▊ | 66000/818627 [00:07<01:26, 8683.49 examples/s]
+Filter: 8%|▊ | 66000/818627 [00:07<01:30, 8289.15 examples/s]
+Filter: 8%|▊ | 67000/818627 [00:07<01:26, 8691.19 examples/s]
+Filter: 8%|▊ | 67000/818627 [00:07<01:26, 8681.52 examples/s]
+Filter: 8%|▊ | 67000/818627 [00:07<01:26, 8676.16 examples/s]
+Filter: 8%|▊ | 67000/818627 [00:07<01:26, 8678.61 examples/s]
+Filter: 8%|▊ | 67000/818627 [00:07<01:26, 8680.21 examples/s]
+Filter: 8%|▊ | 67000/818627 [00:07<01:26, 8682.95 examples/s]
+Filter: 8%|▊ | 67000/818627 [00:07<01:26, 8680.35 examples/s]
+Filter: 8%|▊ | 68000/818627 [00:07<01:27, 8625.73 examples/s]
+Filter: 8%|▊ | 68000/818627 [00:07<01:27, 8626.53 examples/s]
+Filter: 8%|▊ | 68000/818627 [00:07<01:27, 8618.78 examples/s]
+Filter: 8%|▊ | 68000/818627 [00:07<01:27, 8619.44 examples/s]
+Filter: 8%|▊ | 68000/818627 [00:07<01:27, 8620.29 examples/s]
+Filter: 8%|▊ | 68000/818627 [00:07<01:27, 8614.62 examples/s]
+Filter: 8%|▊ | 68000/818627 [00:07<01:27, 8613.71 examples/s]
+Filter: 8%|▊ | 68000/818627 [00:07<01:26, 8714.18 examples/s]
+Filter: 8%|▊ | 69000/818627 [00:07<01:26, 8655.98 examples/s]
+Filter: 8%|▊ | 69000/818627 [00:07<01:26, 8655.76 examples/s]
+Filter: 8%|▊ | 69000/818627 [00:07<01:26, 8659.84 examples/s]
+Filter: 8%|▊ | 69000/818627 [00:07<01:26, 8654.86 examples/s]
+Filter: 8%|▊ | 69000/818627 [00:07<01:26, 8652.89 examples/s]
+Filter: 8%|▊ | 69000/818627 [00:07<01:26, 8653.64 examples/s]
+Filter: 8%|▊ | 69000/818627 [00:07<01:25, 8730.58 examples/s]
+Filter: 8%|▊ | 69000/818627 [00:07<01:27, 8578.70 examples/s]
+Filter: 9%|▊ | 70000/818627 [00:07<01:23, 8925.54 examples/s]
+Filter: 9%|▊ | 70000/818627 [00:07<01:23, 8942.10 examples/s]
+Filter: 9%|▊ | 70000/818627 [00:07<01:23, 8927.75 examples/s]
+Filter: 9%|▊ | 70000/818627 [00:07<01:23, 8927.01 examples/s]
+Filter: 9%|▊ | 70000/818627 [00:08<01:23, 8957.81 examples/s]
+Filter: 9%|▊ | 70000/818627 [00:07<01:23, 8928.98 examples/s]
+Filter: 9%|▊ | 70000/818627 [00:07<01:23, 8918.71 examples/s]
+Filter: 9%|▊ | 70000/818627 [00:07<01:23, 8924.79 examples/s]
+Filter: 9%|▊ | 71000/818627 [00:07<01:21, 9126.11 examples/s]
+Filter: 9%|▊ | 71000/818627 [00:07<01:21, 9145.42 examples/s]
+Filter: 9%|▊ | 71000/818627 [00:07<01:21, 9130.70 examples/s]
+Filter: 9%|▊ | 71000/818627 [00:07<01:21, 9122.79 examples/s]
+Filter: 9%|▊ | 71000/818627 [00:07<01:21, 9124.74 examples/s]
+Filter: 9%|▊ | 71000/818627 [00:07<01:21, 9122.60 examples/s]
+Filter: 9%|▊ | 71000/818627 [00:07<01:21, 9122.48 examples/s]
+Filter: 9%|▊ | 71000/818627 [00:08<01:22, 9093.10 examples/s]
+Filter: 9%|▉ | 72000/818627 [00:07<01:22, 8995.60 examples/s]
+Filter: 9%|▉ | 72000/818627 [00:07<01:22, 9007.69 examples/s]
+Filter: 9%|▉ | 72000/818627 [00:07<01:22, 8999.53 examples/s]
+Filter: 9%|▉ | 72000/818627 [00:08<01:22, 9019.63 examples/s]
+Filter: 9%|▉ | 72000/818627 [00:07<01:22, 8997.82 examples/s]
+Filter: 9%|▉ | 72000/818627 [00:08<01:22, 8995.62 examples/s]
+Filter: 9%|▉ | 72000/818627 [00:07<01:23, 8994.37 examples/s]
+Filter: 9%|▉ | 72000/818627 [00:07<01:23, 8994.76 examples/s]
+Filter: 9%|▉ | 73000/818627 [00:08<01:24, 8870.14 examples/s]
+Filter: 9%|▉ | 73000/818627 [00:08<01:24, 8870.06 examples/s]
+Filter: 9%|▉ | 73000/818627 [00:08<01:24, 8874.85 examples/s]
+Filter: 9%|▉ | 73000/818627 [00:08<01:23, 8893.04 examples/s]
+Filter: 9%|▉ | 73000/818627 [00:08<01:24, 8870.27 examples/s]
+Filter: 9%|▉ | 73000/818627 [00:08<01:24, 8868.91 examples/s]
+Filter: 9%|▉ | 73000/818627 [00:08<01:24, 8867.52 examples/s]
+Filter: 9%|▉ | 73000/818627 [00:08<01:24, 8862.91 examples/s]
+Filter: 9%|▉ | 74000/818627 [00:08<01:24, 8786.94 examples/s]
+Filter: 9%|▉ | 74000/818627 [00:08<01:24, 8782.02 examples/s]
+Filter: 9%|▉ | 74000/818627 [00:08<01:24, 8772.11 examples/s]
+Filter: 9%|▉ | 74000/818627 [00:08<01:24, 8780.61 examples/s]
+Filter: 9%|▉ | 74000/818627 [00:08<01:24, 8777.02 examples/s]
+Filter: 9%|▉ | 74000/818627 [00:08<01:24, 8777.60 examples/s]
+Filter: 9%|▉ | 74000/818627 [00:08<01:24, 8780.06 examples/s]
+Filter: 9%|▉ | 74000/818627 [00:08<01:24, 8789.67 examples/s]
+Filter: 9%|▉ | 75000/818627 [00:08<01:25, 8689.35 examples/s]
+Filter: 9%|▉ | 75000/818627 [00:08<01:25, 8684.15 examples/s]
+Filter: 9%|▉ | 75000/818627 [00:08<01:25, 8686.66 examples/s]
+Filter: 9%|▉ | 75000/818627 [00:08<01:25, 8686.17 examples/s]
+Filter: 9%|▉ | 75000/818627 [00:08<01:25, 8700.95 examples/s]
+Filter: 9%|▉ | 75000/818627 [00:08<01:25, 8685.80 examples/s]
+Filter: 9%|▉ | 75000/818627 [00:08<01:25, 8683.53 examples/s]
+Filter: 9%|▉ | 75000/818627 [00:08<01:25, 8680.32 examples/s]
+Filter: 9%|▉ | 76000/818627 [00:08<01:25, 8646.23 examples/s]
+Filter: 9%|▉ | 76000/818627 [00:08<01:25, 8643.01 examples/s]
+Filter: 9%|▉ | 76000/818627 [00:08<01:25, 8635.29 examples/s]
+Filter: 9%|▉ | 76000/818627 [00:08<01:25, 8656.58 examples/s]
+Filter: 9%|▉ | 76000/818627 [00:08<01:25, 8644.42 examples/s]
+Filter: 9%|▉ | 76000/818627 [00:08<01:25, 8644.25 examples/s]
+Filter: 9%|▉ | 76000/818627 [00:08<01:25, 8642.91 examples/s]
+Filter: 9%|▉ | 76000/818627 [00:08<01:25, 8644.70 examples/s]
+Filter: 9%|▉ | 77000/818627 [00:08<01:23, 8898.89 examples/s]
+Filter: 9%|▉ | 77000/818627 [00:08<01:23, 8902.75 examples/s]
+Filter: 9%|▉ | 77000/818627 [00:08<01:23, 8900.17 examples/s]
+Filter: 9%|▉ | 77000/818627 [00:08<01:23, 8896.80 examples/s]
+Filter: 9%|▉ | 77000/818627 [00:08<01:23, 8893.22 examples/s]
+Filter: 9%|▉ | 77000/818627 [00:08<01:23, 8897.14 examples/s]
+Filter: 9%|▉ | 77000/818627 [00:08<01:23, 8889.36 examples/s]
+Filter: 9%|▉ | 77000/818627 [00:08<01:23, 8852.70 examples/s]
+Filter: 10%|▉ | 78000/818627 [00:08<01:21, 9128.72 examples/s]
+Filter: 10%|▉ | 78000/818627 [00:08<01:21, 9129.65 examples/s]
+Filter: 10%|▉ | 78000/818627 [00:08<01:21, 9128.91 examples/s]
+Filter: 10%|▉ | 78000/818627 [00:08<01:21, 9128.77 examples/s]
+Filter: 10%|▉ | 78000/818627 [00:08<01:20, 9144.98 examples/s]
+Filter: 10%|▉ | 78000/818627 [00:08<01:21, 9127.95 examples/s]
+Filter: 10%|▉ | 78000/818627 [00:08<01:21, 9126.40 examples/s]
+Filter: 10%|▉ | 78000/818627 [00:08<01:21, 9127.75 examples/s]
+Filter: 10%|▉ | 79000/818627 [00:08<01:22, 8983.70 examples/s]
+Filter: 10%|▉ | 79000/818627 [00:08<01:22, 8968.64 examples/s]
+Filter: 10%|▉ | 79000/818627 [00:09<01:22, 8992.73 examples/s]
+Filter: 10%|▉ | 79000/818627 [00:08<01:22, 8975.90 examples/s]
+Filter: 10%|▉ | 79000/818627 [00:08<01:22, 8979.11 examples/s]
+Filter: 10%|▉ | 79000/818627 [00:08<01:22, 8976.80 examples/s]
+Filter: 10%|▉ | 79000/818627 [00:08<01:22, 8969.99 examples/s]
+Filter: 10%|▉ | 79000/818627 [00:08<01:23, 8839.81 examples/s]
+Filter: 10%|▉ | 80000/818627 [00:08<01:22, 8917.39 examples/s]
+Filter: 10%|▉ | 80000/818627 [00:08<01:22, 8918.96 examples/s]
+Filter: 10%|▉ | 80000/818627 [00:08<01:22, 8952.51 examples/s]
+Filter: 10%|▉ | 80000/818627 [00:09<01:22, 8924.70 examples/s]
+Filter: 10%|▉ | 80000/818627 [00:08<01:22, 8919.82 examples/s]
+Filter: 10%|▉ | 80000/818627 [00:08<01:22, 8913.72 examples/s]
+Filter: 10%|▉ | 80000/818627 [00:08<01:22, 8914.09 examples/s]
+Filter: 10%|▉ | 80000/818627 [00:08<01:22, 8915.53 examples/s]
+Filter: 10%|▉ | 81000/818627 [00:08<01:23, 8824.48 examples/s]
+Filter: 10%|▉ | 81000/818627 [00:08<01:23, 8855.14 examples/s]
+Filter: 10%|▉ | 81000/818627 [00:08<01:23, 8814.86 examples/s]
+Filter: 10%|▉ | 81000/818627 [00:09<01:23, 8828.95 examples/s]
+Filter: 10%|▉ | 81000/818627 [00:09<01:23, 8824.03 examples/s]
+Filter: 10%|▉ | 81000/818627 [00:08<01:23, 8827.02 examples/s]
+Filter: 10%|▉ | 81000/818627 [00:08<01:23, 8822.66 examples/s]
+Filter: 10%|▉ | 81000/818627 [00:08<01:23, 8824.84 examples/s]
+Filter: 10%|█ | 82000/818627 [00:09<01:24, 8766.57 examples/s]
+Filter: 10%|█ | 82000/818627 [00:09<01:24, 8763.85 examples/s]
+Filter: 10%|█ | 82000/818627 [00:09<01:23, 8779.08 examples/s]
+Filter: 10%|█ | 82000/818627 [00:09<01:23, 8771.48 examples/s]
+Filter: 10%|█ | 82000/818627 [00:09<01:24, 8762.84 examples/s]
+Filter: 10%|█ | 82000/818627 [00:09<01:24, 8765.85 examples/s]
+Filter: 10%|█ | 82000/818627 [00:09<01:24, 8762.12 examples/s]
+Filter: 10%|█ | 82000/818627 [00:09<01:24, 8761.80 examples/s]
+Filter: 10%|█ | 83000/818627 [00:09<01:24, 8726.96 examples/s]
+Filter: 10%|█ | 83000/818627 [00:09<01:24, 8742.20 examples/s]
+Filter: 10%|█ | 83000/818627 [00:09<01:24, 8725.33 examples/s]
+Filter: 10%|█ | 83000/818627 [00:09<01:24, 8726.68 examples/s]
+Filter: 10%|█ | 83000/818627 [00:09<01:24, 8726.75 examples/s]
+Filter: 10%|█ | 83000/818627 [00:09<01:24, 8721.21 examples/s]
+Filter: 10%|█ | 83000/818627 [00:09<01:26, 8547.55 examples/s]
+Filter: 10%|█ | 83000/818627 [00:09<01:26, 8511.72 examples/s]
+Filter: 10%|█ | 84000/818627 [00:09<01:21, 8969.05 examples/s]
+Filter: 10%|█ | 84000/818627 [00:09<01:21, 8973.42 examples/s]
+Filter: 10%|█ | 84000/818627 [00:09<01:21, 8983.50 examples/s]
+Filter: 10%|█ | 84000/818627 [00:09<01:21, 8977.01 examples/s]
+Filter: 10%|█ | 84000/818627 [00:09<01:21, 8972.99 examples/s]
+Filter: 10%|█ | 84000/818627 [00:09<01:21, 8970.57 examples/s]
+Filter: 10%|█ | 84000/818627 [00:09<01:23, 8832.44 examples/s]
+Filter: 10%|█ | 85000/818627 [00:09<01:19, 9236.26 examples/s]
+Filter: 10%|█ | 85000/818627 [00:09<01:19, 9230.83 examples/s]
+Filter: 10%|█ | 85000/818627 [00:09<01:19, 9229.65 examples/s]
+Filter: 10%|█ | 85000/818627 [00:09<01:19, 9229.58 examples/s]
+Filter: 10%|█ | 85000/818627 [00:09<01:19, 9202.63 examples/s]
+Filter: 10%|█ | 85000/818627 [00:09<01:20, 9163.31 examples/s]
+Filter: 10%|█ | 85000/818627 [00:09<01:20, 9060.76 examples/s]
+Filter: 11%|█ | 86000/818627 [00:09<01:19, 9185.11 examples/s]
+Filter: 11%|█ | 86000/818627 [00:09<01:20, 9147.41 examples/s]
+Filter: 11%|█ | 86000/818627 [00:09<01:20, 9138.66 examples/s]
+Filter: 11%|█ | 86000/818627 [00:09<01:20, 9133.49 examples/s]
+Filter: 11%|█ | 86000/818627 [00:09<01:20, 9142.26 examples/s]
+Filter: 11%|█ | 86000/818627 [00:09<01:19, 9244.05 examples/s]
+Filter: 11%|█ | 86000/818627 [00:09<01:20, 9128.47 examples/s]
+Filter: 11%|█ | 86000/818627 [00:09<01:20, 9088.02 examples/s]
+Filter: 11%|█ | 87000/818627 [00:09<01:20, 9040.75 examples/s]
+Filter: 11%|█ | 87000/818627 [00:09<01:20, 9042.57 examples/s]
+Filter: 11%|█ | 87000/818627 [00:09<01:20, 9065.84 examples/s]
+Filter: 11%|█ | 87000/818627 [00:09<01:20, 9054.59 examples/s]
+Filter: 11%|█ | 87000/818627 [00:09<01:20, 9045.33 examples/s]
+Filter: 11%|█ | 87000/818627 [00:09<01:21, 9031.68 examples/s]
+Filter: 11%|█ | 87000/818627 [00:09<01:20, 9130.63 examples/s]
+Filter: 11%|█ | 88000/818627 [00:09<01:20, 9024.22 examples/s]
+Filter: 11%|█ | 88000/818627 [00:09<01:20, 9036.75 examples/s]
+Filter: 11%|█ | 88000/818627 [00:09<01:20, 9029.13 examples/s]
+Filter: 11%|█ | 89000/818627 [00:09<01:20, 9009.17 examples/s]
+Filter: 11%|█ | 89000/818627 [00:09<01:21, 9003.62 examples/s]
+Filter: 11%|█ | 89000/818627 [00:09<01:21, 8987.12 examples/s]
+Filter: 11%|█ | 90000/818627 [00:09<01:20, 9099.93 examples/s]
+Filter: 11%|█ | 90000/818627 [00:09<01:20, 9101.21 examples/s]
+Filter: 11%|█ | 87000/818627 [00:10<02:47, 4361.42 examples/s]
+Filter: 11%|█ | 88000/818627 [00:09<02:24, 5060.90 examples/s]
+Filter: 11%|█ | 91000/818627 [00:10<01:18, 9258.34 examples/s]
+Filter: 11%|█ | 91000/818627 [00:10<01:18, 9250.82 examples/s]
+Filter: 11%|█ | 88000/818627 [00:10<02:33, 4770.04 examples/s]
+Filter: 11%|█ | 88000/818627 [00:10<02:37, 4652.70 examples/s]
+Filter: 11%|█ | 88000/818627 [00:10<02:26, 4973.73 examples/s]
+Filter: 11%|█ | 92000/818627 [00:10<01:17, 9366.57 examples/s]
+Filter: 11%|█ | 92000/818627 [00:10<01:18, 9199.44 examples/s]
+Filter: 11%|█ | 89000/818627 [00:10<01:56, 6247.95 examples/s]
+Filter: 11%|█ | 90000/818627 [00:10<01:43, 7031.33 examples/s]
+Filter: 11%|█ | 90000/818627 [00:10<01:48, 6743.06 examples/s]
+Filter: 11%|█ | 90000/818627 [00:10<01:50, 6580.63 examples/s]
+Filter: 11%|█ | 90000/818627 [00:10<01:49, 6668.96 examples/s]
+Filter: 11%|█ | 90000/818627 [00:10<02:32, 4793.22 examples/s]
+Filter: 11%|█ | 92000/818627 [00:10<01:24, 8649.95 examples/s]
+Filter: 11%|█ | 91000/818627 [00:10<01:32, 7852.10 examples/s]
+Filter: 11%|█ | 92000/818627 [00:10<01:26, 8363.21 examples/s]
+Filter: 11%|█ | 92000/818627 [00:10<01:29, 8103.05 examples/s]
+Filter: 11%|█ | 92000/818627 [00:10<01:30, 8061.89 examples/s]
+Filter: 11%|█ | 92000/818627 [00:10<01:49, 6663.57 examples/s]
+Filter: 11%|█▏ | 93000/818627 [00:10<01:19, 9153.86 examples/s]
+Filter: 11%|█▏ | 94000/818627 [00:10<01:16, 9423.51 examples/s]
+Filter: 11%|█▏ | 94000/818627 [00:10<01:14, 9667.16 examples/s]
+Filter: 11%|█▏ | 94000/818627 [00:10<01:17, 9307.75 examples/s]
+Filter: 11%|█▏ | 94000/818627 [00:10<01:18, 9177.82 examples/s]
+Filter: 11%|█▏ | 93000/818627 [00:10<02:23, 5039.45 examples/s]
+Filter: 11%|█▏ | 93000/818627 [00:10<02:27, 4934.68 examples/s]
+Filter: 11%|█▏ | 94000/818627 [00:10<01:27, 8239.23 examples/s]
+Filter: 12%|█▏ | 95000/818627 [00:10<01:11, 10157.06 examples/s]
+Filter: 12%|█▏ | 96000/818627 [00:10<01:14, 9671.51 examples/s]
+Filter: 12%|█▏ | 96000/818627 [00:10<01:12, 10015.56 examples/s]
+Filter: 12%|█▏ | 96000/818627 [00:10<01:10, 10286.15 examples/s]
+Filter: 12%|█▏ | 95000/818627 [00:10<01:43, 7015.01 examples/s]
+Filter: 12%|█▏ | 96000/818627 [00:10<01:11, 10056.43 examples/s]
+Filter: 12%|█▏ | 95000/818627 [00:10<01:45, 6872.29 examples/s]
+Filter: 12%|█▏ | 96000/818627 [00:10<01:16, 9505.91 examples/s]
+Filter: 12%|█▏ | 97000/818627 [00:11<01:07, 10683.86 examples/s]
+Filter: 12%|█▏ | 97000/818627 [00:10<01:23, 8600.31 examples/s]
+Filter: 12%|█▏ | 97000/818627 [00:10<01:25, 8468.21 examples/s]
+Filter: 12%|█▏ | 98000/818627 [00:10<01:14, 9632.68 examples/s]
+Filter: 12%|█▏ | 98000/818627 [00:10<01:12, 9876.92 examples/s]
+Filter: 12%|█▏ | 98000/818627 [00:10<01:08, 10481.09 examples/s]
+Filter: 12%|█▏ | 98000/818627 [00:10<01:10, 10155.52 examples/s]
+Filter: 12%|█▏ | 98000/818627 [00:10<01:09, 10342.53 examples/s]
+Filter: 12%|█▏ | 99000/818627 [00:11<01:09, 10358.42 examples/s]
+Filter: 12%|█▏ | 99000/818627 [00:11<01:12, 9902.11 examples/s]
+Filter: 12%|█▏ | 99000/818627 [00:11<01:13, 9727.07 examples/s]
+Filter: 12%|█▏ | 100000/818627 [00:11<01:15, 9552.48 examples/s]
+Filter: 12%|█▏ | 100000/818627 [00:11<01:13, 9717.58 examples/s]
+Filter: 12%|█▏ | 100000/818627 [00:11<01:11, 10094.46 examples/s]
+Filter: 12%|█▏ | 100000/818627 [00:11<01:11, 10020.43 examples/s]
+Filter: 12%|█▏ | 100000/818627 [00:11<01:12, 9894.84 examples/s]
+Filter: 12%|█▏ | 101000/818627 [00:11<01:16, 9359.75 examples/s]
+Filter: 12%|█▏ | 101000/818627 [00:11<01:13, 9723.60 examples/s]
+Filter: 12%|█▏ | 101000/818627 [00:11<01:13, 9801.66 examples/s]
+Filter: 12%|█▏ | 101000/818627 [00:11<01:12, 9924.17 examples/s]
+Filter: 12%|█▏ | 102000/818627 [00:11<01:17, 9200.39 examples/s]
+Filter: 12%|█▏ | 102000/818627 [00:11<01:16, 9346.80 examples/s]
+Filter: 12%|█▏ | 102000/818627 [00:11<01:15, 9461.41 examples/s]
+Filter: 12%|█▏ | 102000/818627 [00:11<01:14, 9574.83 examples/s]
+Filter: 12%|█▏ | 102000/818627 [00:11<01:16, 9423.53 examples/s]
+Filter: 13%|█▎ | 103000/818627 [00:11<01:18, 9075.58 examples/s]
+Filter: 13%|█▎ | 103000/818627 [00:11<01:17, 9216.44 examples/s]
+Filter: 13%|█▎ | 103000/818627 [00:11<01:16, 9351.59 examples/s]
+Filter: 13%|█▎ | 103000/818627 [00:11<01:16, 9415.00 examples/s]
+Filter: 13%|█▎ | 103000/818627 [00:11<01:15, 9468.64 examples/s]
+Filter: 13%|█▎ | 103000/818627 [00:11<01:16, 9303.74 examples/s]
+Filter: 13%|█▎ | 103000/818627 [00:11<01:16, 9405.25 examples/s]
+Filter: 13%|█▎ | 104000/818627 [00:11<01:19, 8946.28 examples/s]
+Filter: 13%|█▎ | 104000/818627 [00:11<01:18, 9072.12 examples/s]
+Filter: 13%|█▎ | 104000/818627 [00:11<01:17, 9259.87 examples/s]
+Filter: 13%|█▎ | 104000/818627 [00:11<01:17, 9252.11 examples/s]
+Filter: 13%|█▎ | 104000/818627 [00:11<01:18, 9144.57 examples/s]
+Filter: 13%|█▎ | 104000/818627 [00:11<01:17, 9224.66 examples/s]
+Filter: 13%|█▎ | 105000/818627 [00:11<01:18, 9120.66 examples/s]
+Filter: 13%|█▎ | 105000/818627 [00:11<01:20, 8891.60 examples/s]
+Filter: 13%|█▎ | 105000/818627 [00:11<01:19, 8999.01 examples/s]
+Filter: 13%|█▎ | 105000/818627 [00:12<01:18, 9147.57 examples/s]
+Filter: 13%|█▎ | 105000/818627 [00:11<01:17, 9160.19 examples/s]
+Filter: 13%|█▎ | 105000/818627 [00:11<01:17, 9197.77 examples/s]
+Filter: 13%|█▎ | 105000/818627 [00:11<01:18, 9053.21 examples/s]
+Filter: 13%|█▎ | 105000/818627 [00:11<01:18, 9114.57 examples/s]
+Filter: 13%|█▎ | 106000/818627 [00:11<01:18, 9046.22 examples/s]
+Filter: 13%|█▎ | 106000/818627 [00:11<01:17, 9182.16 examples/s]
+Filter: 13%|█▎ | 106000/818627 [00:11<01:18, 9109.78 examples/s]
+Filter: 13%|█▎ | 106000/818627 [00:11<01:17, 9225.70 examples/s]
+Filter: 13%|█▎ | 106000/818627 [00:12<01:17, 9219.14 examples/s]
+Filter: 13%|█▎ | 106000/818627 [00:11<01:17, 9248.69 examples/s]
+Filter: 13%|█▎ | 106000/818627 [00:11<01:17, 9151.24 examples/s]
+Filter: 13%|█▎ | 106000/818627 [00:11<01:17, 9200.71 examples/s]
+Filter: 13%|█▎ | 107000/818627 [00:11<01:16, 9243.28 examples/s]
+Filter: 13%|█▎ | 107000/818627 [00:11<01:16, 9300.89 examples/s]
+Filter: 13%|█▎ | 107000/818627 [00:11<01:16, 9273.48 examples/s]
+Filter: 13%|█▎ | 107000/818627 [00:11<01:16, 9347.79 examples/s]
+Filter: 13%|█▎ | 107000/818627 [00:12<01:16, 9351.49 examples/s]
+Filter: 13%|█▎ | 107000/818627 [00:11<01:16, 9312.47 examples/s]
+Filter: 13%|█▎ | 107000/818627 [00:11<01:16, 9355.62 examples/s]
+Filter: 13%|█▎ | 107000/818627 [00:11<01:16, 9347.33 examples/s]
+Filter: 13%|█▎ | 108000/818627 [00:11<01:15, 9438.85 examples/s]
+Filter: 13%|█▎ | 108000/818627 [00:11<01:15, 9449.89 examples/s]
+Filter: 13%|█▎ | 108000/818627 [00:11<01:15, 9457.54 examples/s]
+Filter: 13%|█▎ | 108000/818627 [00:11<01:14, 9492.38 examples/s]
+Filter: 13%|█▎ | 108000/818627 [00:11<01:14, 9483.13 examples/s]
+Filter: 13%|█▎ | 108000/818627 [00:12<01:14, 9491.27 examples/s]
+Filter: 13%|█▎ | 108000/818627 [00:11<01:14, 9510.55 examples/s]
+Filter: 13%|█▎ | 108000/818627 [00:12<01:18, 9047.01 examples/s]
+Filter: 13%|█▎ | 109000/818627 [00:12<01:15, 9361.34 examples/s]
+Filter: 13%|█▎ | 109000/818627 [00:12<01:15, 9381.30 examples/s]
+Filter: 13%|█▎ | 109000/818627 [00:12<01:15, 9376.10 examples/s]
+Filter: 13%|█▎ | 109000/818627 [00:12<01:15, 9395.77 examples/s]
+Filter: 13%|█▎ | 109000/818627 [00:12<01:15, 9405.46 examples/s]
+Filter: 13%|█▎ | 109000/818627 [00:12<01:15, 9414.28 examples/s]
+Filter: 13%|█▎ | 109000/818627 [00:12<01:15, 9404.97 examples/s]
+Filter: 13%|█▎ | 110000/818627 [00:12<01:17, 9141.35 examples/s]
+Filter: 13%|█▎ | 110000/818627 [00:12<01:17, 9157.06 examples/s]
+Filter: 13%|█▎ | 110000/818627 [00:12<01:17, 9178.44 examples/s]
+Filter: 13%|█▎ | 110000/818627 [00:12<01:15, 9358.97 examples/s]
+Filter: 13%|█▎ | 110000/818627 [00:12<01:17, 9169.98 examples/s]
+Filter: 13%|█▎ | 110000/818627 [00:12<01:17, 9190.39 examples/s]
+Filter: 13%|█▎ | 110000/818627 [00:12<01:17, 9198.70 examples/s]
+Filter: 13%|█▎ | 110000/818627 [00:12<01:17, 9179.70 examples/s]
+Filter: 14%|█▎ | 111000/818627 [00:12<01:18, 9015.33 examples/s]
+Filter: 14%|█▎ | 111000/818627 [00:12<01:16, 9189.98 examples/s]
+Filter: 14%|█▎ | 111000/818627 [00:12<01:18, 9043.54 examples/s]
+Filter: 14%|█▎ | 111000/818627 [00:12<01:18, 9020.15 examples/s]
+Filter: 14%|█▎ | 111000/818627 [00:12<01:18, 9031.15 examples/s]
+Filter: 14%|█▎ | 111000/818627 [00:12<01:18, 8972.48 examples/s]
+Filter: 14%|█▎ | 111000/818627 [00:12<01:19, 8868.35 examples/s]
+Filter: 14%|█▎ | 111000/818627 [00:12<01:19, 8894.38 examples/s]
+Filter: 14%|█▎ | 112000/818627 [00:12<01:18, 8994.03 examples/s]
+Filter: 14%|█▎ | 112000/818627 [00:12<01:18, 9004.59 examples/s]
+Filter: 14%|█▎ | 112000/818627 [00:12<01:17, 9099.61 examples/s]
+Filter: 14%|█▎ | 112000/818627 [00:12<01:18, 8986.45 examples/s]
+Filter: 14%|█▎ | 112000/818627 [00:12<01:18, 8969.94 examples/s]
+Filter: 14%|█▎ | 112000/818627 [00:12<01:18, 9043.72 examples/s]
+Filter: 14%|█▎ | 112000/818627 [00:12<01:18, 8977.97 examples/s]
+Filter: 14%|█▎ | 112000/818627 [00:12<01:19, 8904.76 examples/s]
+Filter: 14%|█▍ | 113000/818627 [00:12<01:17, 9122.96 examples/s]
+Filter: 14%|█▍ | 113000/818627 [00:12<01:17, 9119.17 examples/s]
+Filter: 14%|█▍ | 113000/818627 [00:12<01:17, 9123.87 examples/s]
+Filter: 14%|█▍ | 113000/818627 [00:12<01:16, 9189.69 examples/s]
+Filter: 14%|█▍ | 113000/818627 [00:12<01:17, 9115.75 examples/s]
+Filter: 14%|█▍ | 113000/818627 [00:12<01:17, 9104.06 examples/s]
+Filter: 14%|█▍ | 113000/818627 [00:12<01:17, 9154.26 examples/s]
+Filter: 14%|█▍ | 113000/818627 [00:12<01:17, 9107.09 examples/s]
+Filter: 14%|█▍ | 114000/818627 [00:12<01:15, 9282.46 examples/s]
+Filter: 14%|█▍ | 114000/818627 [00:12<01:15, 9281.34 examples/s]
+Filter: 14%|█▍ | 114000/818627 [00:12<01:15, 9277.27 examples/s]
+Filter: 14%|█▍ | 114000/818627 [00:12<01:15, 9317.81 examples/s]
+Filter: 14%|█▍ | 114000/818627 [00:12<01:16, 9270.32 examples/s]
+Filter: 14%|█▍ | 114000/818627 [00:12<01:15, 9300.97 examples/s]
+Filter: 14%|█▍ | 114000/818627 [00:12<01:16, 9266.45 examples/s]
+Filter: 14%|█▍ | 114000/818627 [00:12<01:16, 9270.54 examples/s]
+Filter: 14%|█▍ | 116000/818627 [00:12<01:14, 9449.32 examples/s]
+Filter: 14%|█▍ | 116000/818627 [00:12<01:14, 9449.23 examples/s]
+Filter: 14%|█▍ | 116000/818627 [00:13<01:14, 9470.60 examples/s]
+Filter: 14%|█▍ | 116000/818627 [00:12<01:14, 9448.25 examples/s]
+Filter: 14%|█▍ | 116000/818627 [00:12<01:14, 9464.14 examples/s]
+Filter: 14%|█▍ | 116000/818627 [00:12<01:14, 9443.68 examples/s]
+Filter: 14%|█▍ | 116000/818627 [00:12<01:14, 9445.48 examples/s]
+Filter: 14%|█▍ | 116000/818627 [00:12<01:14, 9376.88 examples/s]
+Filter: 14%|█▍ | 117000/818627 [00:12<01:15, 9266.60 examples/s]
+Filter: 14%|█▍ | 117000/818627 [00:12<01:15, 9266.30 examples/s]
+Filter: 14%|█▍ | 117000/818627 [00:12<01:15, 9273.80 examples/s]
+Filter: 14%|█▍ | 117000/818627 [00:13<01:15, 9282.89 examples/s]
+Filter: 14%|█▍ | 117000/818627 [00:12<01:15, 9261.30 examples/s]
+Filter: 14%|█▍ | 117000/818627 [00:12<01:15, 9260.96 examples/s]
+Filter: 14%|█▍ | 117000/818627 [00:13<01:15, 9254.59 examples/s]
+Filter: 14%|█▍ | 117000/818627 [00:12<01:16, 9218.14 examples/s]
+Filter: 14%|█▍ | 118000/818627 [00:13<01:16, 9116.91 examples/s]
+Filter: 14%|█▍ | 118000/818627 [00:13<01:16, 9133.00 examples/s]
+Filter: 14%|█▍ | 118000/818627 [00:13<01:16, 9118.47 examples/s]
+Filter: 14%|█▍ | 118000/818627 [00:13<01:16, 9141.42 examples/s]
+Filter: 14%|█▍ | 118000/818627 [00:13<01:16, 9130.23 examples/s]
+Filter: 14%|█▍ | 118000/818627 [00:13<01:16, 9122.79 examples/s]
+Filter: 14%|█▍ | 118000/818627 [00:13<01:16, 9112.63 examples/s]
+Filter: 14%|█▍ | 118000/818627 [00:13<01:16, 9114.56 examples/s]
+Filter: 15%|█▍ | 119000/818627 [00:13<01:17, 8997.12 examples/s]
+Filter: 15%|█▍ | 119000/818627 [00:13<01:17, 8985.25 examples/s]
+Filter: 15%|█▍ | 119000/818627 [00:13<01:17, 8984.41 examples/s]
+Filter: 15%|█▍ | 119000/818627 [00:13<01:17, 9003.50 examples/s]
+Filter: 15%|█▍ | 119000/818627 [00:13<01:17, 8993.87 examples/s]
+Filter: 15%|█▍ | 119000/818627 [00:13<01:17, 8981.59 examples/s]
+Filter: 15%|█▍ | 119000/818627 [00:13<01:17, 8987.88 examples/s]
+Filter: 15%|█▍ | 119000/818627 [00:13<01:17, 8982.95 examples/s]
+Filter: 15%|█▍ | 120000/818627 [00:13<01:18, 8877.32 examples/s]
+Filter: 15%|█▍ | 120000/818627 [00:13<01:18, 8884.71 examples/s]
+Filter: 15%|█▍ | 120000/818627 [00:13<01:18, 8893.72 examples/s]
+Filter: 15%|█▍ | 120000/818627 [00:13<01:18, 8872.39 examples/s]
+Filter: 15%|█▍ | 120000/818627 [00:13<01:18, 8882.12 examples/s]
+Filter: 15%|█▍ | 120000/818627 [00:13<01:18, 8876.05 examples/s]
+Filter: 15%|█▍ | 120000/818627 [00:13<01:18, 8883.60 examples/s]
+Filter: 15%|█▍ | 120000/818627 [00:13<01:18, 8875.66 examples/s]
+Filter: 15%|█▍ | 121000/818627 [00:13<01:19, 8819.10 examples/s]
+Filter: 15%|█▍ | 121000/818627 [00:13<01:19, 8823.44 examples/s]
+Filter: 15%|█▍ | 121000/818627 [00:13<01:19, 8830.52 examples/s]
+Filter: 15%|█▍ | 121000/818627 [00:13<01:19, 8815.60 examples/s]
+Filter: 15%|█▍ | 121000/818627 [00:13<01:19, 8816.80 examples/s]
+Filter: 15%|█▍ | 121000/818627 [00:13<01:19, 8817.29 examples/s]
+Filter: 15%|█▍ | 121000/818627 [00:13<01:19, 8817.34 examples/s]
+Filter: 15%|█▍ | 121000/818627 [00:13<01:19, 8815.71 examples/s]
+Filter: 15%|█▍ | 122000/818627 [00:13<01:19, 8780.09 examples/s]
+Filter: 15%|█▍ | 122000/818627 [00:13<01:19, 8783.11 examples/s]
+Filter: 15%|█▍ | 122000/818627 [00:13<01:19, 8782.43 examples/s]
+Filter: 15%|█▍ | 122000/818627 [00:13<01:19, 8782.77 examples/s]
+Filter: 15%|█▍ | 122000/818627 [00:13<01:19, 8776.14 examples/s]
+Filter: 15%|█▍ | 122000/818627 [00:13<01:19, 8781.45 examples/s]
+Filter: 15%|█▍ | 122000/818627 [00:13<01:19, 8776.42 examples/s]
+Filter: 15%|█▍ | 122000/818627 [00:13<01:19, 8773.41 examples/s]
+Filter: 15%|█▌ | 123000/818627 [00:13<01:19, 8748.65 examples/s]
+Filter: 15%|█▌ | 123000/818627 [00:13<01:19, 8746.85 examples/s]
+Filter: 15%|█▌ | 123000/818627 [00:13<01:19, 8748.15 examples/s]
+Filter: 15%|█▌ | 123000/818627 [00:13<01:19, 8758.44 examples/s]
+Filter: 15%|█▌ | 123000/818627 [00:13<01:19, 8753.78 examples/s]
+Filter: 15%|█▌ | 123000/818627 [00:13<01:19, 8748.85 examples/s]
+Filter: 15%|█▌ | 123000/818627 [00:13<01:19, 8745.08 examples/s]
+Filter: 15%|█▌ | 123000/818627 [00:13<01:19, 8747.91 examples/s]
+Filter: 15%|█▌ | 124000/818627 [00:13<01:19, 8699.92 examples/s]
+Filter: 15%|█▌ | 124000/818627 [00:13<01:19, 8700.13 examples/s]
+Filter: 15%|█▌ | 124000/818627 [00:13<01:19, 8700.36 examples/s]
+Filter: 15%|█▌ | 124000/818627 [00:14<01:19, 8705.78 examples/s]
+Filter: 15%|█▌ | 124000/818627 [00:13<01:19, 8702.82 examples/s]
+Filter: 15%|█▌ | 124000/818627 [00:13<01:19, 8701.36 examples/s]
+Filter: 15%|█▌ | 124000/818627 [00:13<01:19, 8697.56 examples/s]
+Filter: 15%|█▌ | 124000/818627 [00:13<01:19, 8697.23 examples/s]
+Filter: 15%|█▌ | 125000/818627 [00:13<01:19, 8698.07 examples/s]
+Filter: 15%|█▌ | 125000/818627 [00:13<01:19, 8700.81 examples/s]
+Filter: 15%|█▌ | 125000/818627 [00:13<01:19, 8699.05 examples/s]
+Filter: 15%|█▌ | 125000/818627 [00:14<01:19, 8704.75 examples/s]
+Filter: 15%|█▌ | 125000/818627 [00:13<01:19, 8702.13 examples/s]
+Filter: 15%|█▌ | 125000/818627 [00:13<01:19, 8700.65 examples/s]
+Filter: 15%|█▌ | 125000/818627 [00:13<01:19, 8699.28 examples/s]
+Filter: 15%|█▌ | 125000/818627 [00:13<01:19, 8700.15 examples/s]
+Filter: 15%|█▌ | 126000/818627 [00:14<01:20, 8650.18 examples/s]
+Filter: 15%|█▌ | 126000/818627 [00:14<01:20, 8650.80 examples/s]
+Filter: 15%|█▌ | 126000/818627 [00:14<01:20, 8648.39 examples/s]
+Filter: 15%|█▌ | 126000/818627 [00:14<01:20, 8649.11 examples/s]
+Filter: 15%|█▌ | 126000/818627 [00:14<01:20, 8652.15 examples/s]
+Filter: 15%|█▌ | 126000/818627 [00:14<01:20, 8651.50 examples/s]
+Filter: 15%|█▌ | 126000/818627 [00:14<01:20, 8649.91 examples/s]
+Filter: 15%|█▌ | 126000/818627 [00:14<01:20, 8650.35 examples/s]
+Filter: 16%|█▌ | 127000/818627 [00:14<01:17, 8935.45 examples/s]
+Filter: 16%|█▌ | 127000/818627 [00:14<01:17, 8933.81 examples/s]
+Filter: 16%|█▌ | 127000/818627 [00:14<01:17, 8931.62 examples/s]
+Filter: 16%|█▌ | 127000/818627 [00:14<01:17, 8937.07 examples/s]
+Filter: 16%|█▌ | 127000/818627 [00:14<01:17, 8936.17 examples/s]
+Filter: 16%|█▌ | 127000/818627 [00:14<01:17, 8933.16 examples/s]
+Filter: 16%|█▌ | 127000/818627 [00:14<01:17, 8936.16 examples/s]
+Filter: 16%|█▌ | 127000/818627 [00:14<01:20, 8582.26 examples/s]
+Filter: 16%|█▌ | 128000/818627 [00:14<01:15, 9162.99 examples/s]
+Filter: 16%|█▌ | 128000/818627 [00:14<01:15, 9172.06 examples/s]
+Filter: 16%|█▌ | 128000/818627 [00:14<01:15, 9159.19 examples/s]
+Filter: 16%|█▌ | 128000/818627 [00:14<01:15, 9168.40 examples/s]
+Filter: 16%|█▌ | 128000/818627 [00:14<01:15, 9168.33 examples/s]
+Filter: 16%|█▌ | 128000/818627 [00:14<01:15, 9163.60 examples/s]
+Filter: 16%|█▌ | 128000/818627 [00:14<01:15, 9163.13 examples/s]
+Filter: 16%|█▌ | 129000/818627 [00:14<01:16, 8997.77 examples/s]
+Filter: 16%|█▌ | 129000/818627 [00:14<01:16, 9000.52 examples/s]
+Filter: 16%|█▌ | 129000/818627 [00:14<01:16, 8995.30 examples/s]
+Filter: 16%|█▌ | 129000/818627 [00:14<01:16, 8995.25 examples/s]
+Filter: 16%|█▌ | 129000/818627 [00:14<01:15, 9117.50 examples/s]
+Filter: 16%|█▌ | 129000/818627 [00:14<01:16, 8995.43 examples/s]
+Filter: 16%|█▌ | 129000/818627 [00:14<01:16, 8992.00 examples/s]
+Filter: 16%|█▌ | 129000/818627 [00:14<01:16, 8993.26 examples/s]
+Filter: 16%|█▌ | 130000/818627 [00:14<01:17, 8885.44 examples/s]
+Filter: 16%|█▌ | 130000/818627 [00:14<01:17, 8871.36 examples/s]
+Filter: 16%|█▌ | 130000/818627 [00:14<01:16, 8994.78 examples/s]
+Filter: 16%|█▌ | 130000/818627 [00:14<01:17, 8880.84 examples/s]
+Filter: 16%|█▌ | 130000/818627 [00:14<01:17, 8880.10 examples/s]
+Filter: 16%|█▌ | 130000/818627 [00:14<01:17, 8881.26 examples/s]
+Filter: 16%|█▌ | 130000/818627 [00:14<01:17, 8880.98 examples/s]
+Filter: 16%|█▌ | 130000/818627 [00:14<01:18, 8751.10 examples/s]
+Filter: 16%|█▌ | 131000/818627 [00:14<01:17, 8849.86 examples/s]
+Filter: 16%|█▌ | 131000/818627 [00:14<01:17, 8849.15 examples/s]
+Filter: 16%|█▌ | 131000/818627 [00:14<01:17, 8886.99 examples/s]
+Filter: 16%|█▌ | 131000/818627 [00:14<01:16, 8935.36 examples/s]
+Filter: 16%|█▌ | 131000/818627 [00:14<01:17, 8849.76 examples/s]
+Filter: 16%|█▌ | 131000/818627 [00:14<01:17, 8846.77 examples/s]
+Filter: 16%|█▌ | 131000/818627 [00:14<01:17, 8845.83 examples/s]
+Filter: 16%|█▌ | 131000/818627 [00:14<01:17, 8847.62 examples/s]
+Filter: 16%|█▌ | 132000/818627 [00:14<01:18, 8798.37 examples/s]
+Filter: 16%|█▌ | 132000/818627 [00:14<01:18, 8797.91 examples/s]
+Filter: 16%|█▌ | 132000/818627 [00:14<01:17, 8826.62 examples/s]
+Filter: 16%|█▌ | 132000/818627 [00:15<01:17, 8866.28 examples/s]
+Filter: 16%|█▌ | 132000/818627 [00:14<01:18, 8799.43 examples/s]
+Filter: 16%|█▌ | 132000/818627 [00:14<01:18, 8796.40 examples/s]
+Filter: 16%|█▌ | 132000/818627 [00:14<01:18, 8795.99 examples/s]
+Filter: 16%|█▌ | 132000/818627 [00:14<01:18, 8760.87 examples/s]
+Filter: 16%|█▌ | 133000/818627 [00:14<01:18, 8778.28 examples/s]
+Filter: 16%|█▌ | 133000/818627 [00:14<01:18, 8777.64 examples/s]
+Filter: 16%|█▌ | 133000/818627 [00:14<01:17, 8794.23 examples/s]
+Filter: 16%|█▌ | 133000/818627 [00:15<01:17, 8824.69 examples/s]
+Filter: 16%|█▌ | 133000/818627 [00:14<01:18, 8787.63 examples/s]
+Filter: 16%|█▌ | 133000/818627 [00:14<01:18, 8775.22 examples/s]
+Filter: 16%|█▌ | 133000/818627 [00:14<01:18, 8773.62 examples/s]
+Filter: 16%|█▌ | 133000/818627 [00:14<01:18, 8778.46 examples/s]
+Filter: 16%|█▋ | 134000/818627 [00:14<01:18, 8777.24 examples/s]
+Filter: 16%|█▋ | 134000/818627 [00:14<01:17, 8796.02 examples/s]
+Filter: 16%|█▋ | 134000/818627 [00:14<01:18, 8774.60 examples/s]
+Filter: 16%|█▋ | 134000/818627 [00:15<01:17, 8810.61 examples/s]
+Filter: 16%|█▋ | 134000/818627 [00:15<01:17, 8777.81 examples/s]
+Filter: 16%|█▋ | 134000/818627 [00:14<01:17, 8785.33 examples/s]
+Filter: 16%|█▋ | 134000/818627 [00:14<01:18, 8774.51 examples/s]
+Filter: 16%|█▋ | 134000/818627 [00:14<01:18, 8777.02 examples/s]
+Filter: 16%|█▋ | 135000/818627 [00:15<01:15, 9105.41 examples/s]
+Filter: 16%|█▋ | 135000/818627 [00:15<01:15, 9103.89 examples/s]
+Filter: 16%|█▋ | 135000/818627 [00:15<01:14, 9122.73 examples/s]
+Filter: 16%|█▋ | 135000/818627 [00:15<01:15, 9106.77 examples/s]
+Filter: 16%|█▋ | 135000/818627 [00:14<01:15, 9107.70 examples/s]
+Filter: 16%|█▋ | 135000/818627 [00:15<01:15, 9102.45 examples/s]
+Filter: 16%|█▋ | 135000/818627 [00:14<01:15, 9111.20 examples/s]
+Filter: 16%|█▋ | 135000/818627 [00:15<01:15, 9097.69 examples/s]
+Filter: 17%|█▋ | 136000/818627 [00:15<01:14, 9136.12 examples/s]
+Filter: 17%|█▋ | 136000/818627 [00:15<01:14, 9132.00 examples/s]
+Filter: 17%|█▋ | 136000/818627 [00:15<01:14, 9149.83 examples/s]
+Filter: 17%|█▋ | 136000/818627 [00:15<01:14, 9138.70 examples/s]
+Filter: 17%|█▋ | 136000/818627 [00:15<01:14, 9131.13 examples/s]
+Filter: 17%|█▋ | 136000/818627 [00:15<01:14, 9136.23 examples/s]
+Filter: 17%|█▋ | 136000/818627 [00:15<01:14, 9132.14 examples/s]
+Filter: 17%|█▋ | 136000/818627 [00:15<01:14, 9136.37 examples/s]
+Filter: 17%|█▋ | 137000/818627 [00:15<01:15, 9013.07 examples/s]
+Filter: 17%|█▋ | 137000/818627 [00:15<01:15, 9011.88 examples/s]
+Filter: 17%|█▋ | 137000/818627 [00:15<01:15, 9018.33 examples/s]
+Filter: 17%|█▋ | 137000/818627 [00:15<01:15, 9011.61 examples/s]
+Filter: 17%|█▋ | 137000/818627 [00:15<01:15, 9013.84 examples/s]
+Filter: 17%|█▋ | 137000/818627 [00:15<01:15, 9011.18 examples/s]
+Filter: 17%|█▋ | 137000/818627 [00:15<01:15, 9012.79 examples/s]
+Filter: 17%|█▋ | 137000/818627 [00:15<01:15, 9005.70 examples/s]
+Filter: 17%|█▋ | 138000/818627 [00:15<01:16, 8924.53 examples/s]
+Filter: 17%|█▋ | 138000/818627 [00:15<01:16, 8923.39 examples/s]
+Filter: 17%|█▋ | 138000/818627 [00:15<01:16, 8930.97 examples/s]
+Filter: 17%|█▋ | 138000/818627 [00:15<01:16, 8931.87 examples/s]
+Filter: 17%|█▋ | 138000/818627 [00:15<01:16, 8927.19 examples/s]
+Filter: 17%|█▋ | 138000/818627 [00:15<01:16, 8932.47 examples/s]
+Filter: 17%|█▋ | 138000/818627 [00:15<01:16, 8929.16 examples/s]
+Filter: 17%|█▋ | 138000/818627 [00:15<01:16, 8928.21 examples/s]
+Filter: 17%|█▋ | 139000/818627 [00:15<01:16, 8831.87 examples/s]
+Filter: 17%|█▋ | 139000/818627 [00:15<01:16, 8833.04 examples/s]
+Filter: 17%|█▋ | 139000/818627 [00:15<01:16, 8840.30 examples/s]
+Filter: 17%|█▋ | 139000/818627 [00:15<01:16, 8833.78 examples/s]
+Filter: 17%|█▋ | 139000/818627 [00:15<01:16, 8833.07 examples/s]
+Filter: 17%|█▋ | 139000/818627 [00:15<01:16, 8831.87 examples/s]
+Filter: 17%|█▋ | 139000/818627 [00:15<01:16, 8831.86 examples/s]
+Filter: 17%|█▋ | 139000/818627 [00:15<01:17, 8825.91 examples/s]
+Filter: 17%|█▋ | 140000/818627 [00:15<01:17, 8789.34 examples/s]
+Filter: 17%|█▋ | 140000/818627 [00:15<01:17, 8790.16 examples/s]
+Filter: 17%|█▋ | 140000/818627 [00:15<01:17, 8795.17 examples/s]
+Filter: 17%|█▋ | 140000/818627 [00:15<01:17, 8804.79 examples/s]
+Filter: 17%|█▋ | 140000/818627 [00:15<01:17, 8792.21 examples/s]
+Filter: 17%|█▋ | 140000/818627 [00:15<01:17, 8792.36 examples/s]
+Filter: 17%|█▋ | 140000/818627 [00:15<01:17, 8788.67 examples/s]
+Filter: 17%|█▋ | 140000/818627 [00:15<01:17, 8790.91 examples/s]
+Filter: 17%|█▋ | 141000/818627 [00:15<01:17, 8795.61 examples/s]
+Filter: 17%|█▋ | 141000/818627 [00:16<01:17, 8799.39 examples/s]
+Filter: 17%|█▋ | 141000/818627 [00:15<01:17, 8795.42 examples/s]
+Filter: 17%|█▋ | 141000/818627 [00:15<01:17, 8794.35 examples/s]
+Filter: 17%|█▋ | 141000/818627 [00:15<01:17, 8797.67 examples/s]
+Filter: 17%|█▋ | 141000/818627 [00:15<01:17, 8785.82 examples/s]
+Filter: 17%|█▋ | 141000/818627 [00:15<01:17, 8794.09 examples/s]
+Filter: 17%|█▋ | 141000/818627 [00:15<01:17, 8769.50 examples/s]
+Filter: 17%|█▋ | 143000/818627 [00:15<01:14, 9115.21 examples/s]
+Filter: 17%|█▋ | 143000/818627 [00:15<01:14, 9119.84 examples/s]
+Filter: 17%|█▋ | 143000/818627 [00:15<01:14, 9116.01 examples/s]
+Filter: 17%|█▋ | 143000/818627 [00:16<01:14, 9113.59 examples/s]
+Filter: 17%|█▋ | 143000/818627 [00:15<01:14, 9113.73 examples/s]
+Filter: 17%|█▋ | 143000/818627 [00:15<01:14, 9115.07 examples/s]
+Filter: 17%|█▋ | 143000/818627 [00:15<01:14, 9106.60 examples/s]
+Filter: 17%|█▋ | 143000/818627 [00:16<01:14, 9013.40 examples/s]
+Filter: 18%|█▊ | 144000/818627 [00:16<01:14, 9016.98 examples/s]
+Filter: 18%|█▊ | 144000/818627 [00:16<01:14, 9009.52 examples/s]
+Filter: 18%|█▊ | 144000/818627 [00:16<01:14, 9013.00 examples/s]
+Filter: 18%|█▊ | 144000/818627 [00:16<01:14, 9045.27 examples/s]
+Filter: 18%|█▊ | 144000/818627 [00:16<01:14, 9011.32 examples/s]
+Filter: 18%|█▊ | 144000/818627 [00:16<01:14, 9012.60 examples/s]
+Filter: 18%|█▊ | 144000/818627 [00:16<01:14, 9012.58 examples/s]
+Filter: 18%|█▊ | 144000/818627 [00:16<01:14, 9013.51 examples/s]
+Filter: 18%|█▊ | 145000/818627 [00:16<01:15, 8874.85 examples/s]
+Filter: 18%|█▊ | 145000/818627 [00:16<01:15, 8871.08 examples/s]
+Filter: 18%|█▊ | 145000/818627 [00:16<01:15, 8867.47 examples/s]
+Filter: 18%|█▊ | 145000/818627 [00:16<01:15, 8893.67 examples/s]
+Filter: 18%|█▊ | 145000/818627 [00:16<01:15, 8872.24 examples/s]
+Filter: 18%|█▊ | 145000/818627 [00:16<01:15, 8871.52 examples/s]
+Filter: 18%|█▊ | 145000/818627 [00:16<01:15, 8868.80 examples/s]
+Filter: 18%|█▊ | 145000/818627 [00:16<01:15, 8872.39 examples/s]
+Filter: 18%|█▊ | 146000/818627 [00:16<01:16, 8833.54 examples/s]
+Filter: 18%|█▊ | 146000/818627 [00:16<01:16, 8831.57 examples/s]
+Filter: 18%|█▊ | 146000/818627 [00:16<01:16, 8829.53 examples/s]
+Filter: 18%|█▊ | 146000/818627 [00:16<01:16, 8849.43 examples/s]
+Filter: 18%|█▊ | 146000/818627 [00:16<01:16, 8831.92 examples/s]
+Filter: 18%|█▊ | 146000/818627 [00:16<01:16, 8832.39 examples/s]
+Filter: 18%|█▊ | 146000/818627 [00:16<01:16, 8830.75 examples/s]
+Filter: 18%|█▊ | 146000/818627 [00:16<01:16, 8832.33 examples/s]
+Filter: 18%|█▊ | 147000/818627 [00:16<01:16, 8789.22 examples/s]
+Filter: 18%|█▊ | 147000/818627 [00:16<01:16, 8782.01 examples/s]
+Filter: 18%|█▊ | 147000/818627 [00:16<01:16, 8789.77 examples/s]
+Filter: 18%|█▊ | 147000/818627 [00:16<01:16, 8787.09 examples/s]
+Filter: 18%|█▊ | 147000/818627 [00:16<01:16, 8799.15 examples/s]
+Filter: 18%|█▊ | 147000/818627 [00:16<01:16, 8787.87 examples/s]
+Filter: 18%|█▊ | 147000/818627 [00:16<01:16, 8780.06 examples/s]
+Filter: 18%|█▊ | 147000/818627 [00:16<01:16, 8788.09 examples/s]
+Filter: 18%|█▊ | 148000/818627 [00:16<01:14, 8982.92 examples/s]
+Filter: 18%|█▊ | 148000/818627 [00:16<01:14, 8987.12 examples/s]
+Filter: 18%|█▊ | 148000/818627 [00:16<01:14, 8988.13 examples/s]
+Filter: 18%|█▊ | 148000/818627 [00:16<01:14, 8984.28 examples/s]
+Filter: 18%|█▊ | 148000/818627 [00:16<01:14, 8983.73 examples/s]
+Filter: 18%|█▊ | 148000/818627 [00:16<01:14, 8982.04 examples/s]
+Filter: 18%|█▊ | 148000/818627 [00:16<01:14, 8989.41 examples/s]
+Filter: 18%|█▊ | 148000/818627 [00:16<01:14, 8981.95 examples/s]
+Filter: 18%|█▊ | 149000/818627 [00:16<01:13, 9163.35 examples/s]
+Filter: 18%|█▊ | 149000/818627 [00:16<01:13, 9166.67 examples/s]
+Filter: 18%|█▊ | 149000/818627 [00:16<01:13, 9166.82 examples/s]
+Filter: 18%|█▊ | 149000/818627 [00:16<01:12, 9175.51 examples/s]
+Filter: 18%|█▊ | 149000/818627 [00:16<01:13, 9166.77 examples/s]
+Filter: 18%|█▊ | 149000/818627 [00:16<01:13, 9165.45 examples/s]
+Filter: 18%|█▊ | 149000/818627 [00:16<01:13, 9161.53 examples/s]
+Filter: 18%|█▊ | 149000/818627 [00:16<01:13, 9160.75 examples/s]
+Filter: 18%|█▊ | 150000/818627 [00:16<01:14, 9035.45 examples/s]
+Filter: 18%|█▊ | 150000/818627 [00:16<01:14, 9031.70 examples/s]
+Filter: 18%|█▊ | 150000/818627 [00:16<01:14, 9033.54 examples/s]
+Filter: 18%|█▊ | 150000/818627 [00:17<01:13, 9042.02 examples/s]
+Filter: 18%|█▊ | 150000/818627 [00:16<01:14, 9034.28 examples/s]
+Filter: 18%|█▊ | 150000/818627 [00:16<01:14, 9031.02 examples/s]
+Filter: 18%|█▊ | 150000/818627 [00:16<01:14, 9029.97 examples/s]
+Filter: 18%|█▊ | 150000/818627 [00:16<01:14, 9029.96 examples/s]
+Filter: 18%|█▊ | 151000/818627 [00:16<01:14, 8954.81 examples/s]
+Filter: 18%|█▊ | 151000/818627 [00:16<01:14, 8955.44 examples/s]
+Filter: 18%|█▊ | 151000/818627 [00:16<01:14, 8958.76 examples/s]
+Filter: 18%|█▊ | 151000/818627 [00:16<01:14, 8953.88 examples/s]
+Filter: 18%|█▊ | 151000/818627 [00:16<01:14, 8954.13 examples/s]
+Filter: 18%|█▊ | 151000/818627 [00:16<01:14, 8954.31 examples/s]
+Filter: 18%|█▊ | 151000/818627 [00:16<01:14, 8953.16 examples/s]
+Filter: 18%|█▊ | 151000/818627 [00:17<01:15, 8792.00 examples/s]
+Filter: 19%|█▊ | 152000/818627 [00:16<01:14, 8924.63 examples/s]
+Filter: 19%|█▊ | 152000/818627 [00:16<01:14, 8921.53 examples/s]
+Filter: 19%|█▊ | 152000/818627 [00:16<01:14, 8929.01 examples/s]
+Filter: 19%|█▊ | 152000/818627 [00:17<01:14, 8985.94 examples/s]
+Filter: 19%|█▊ | 152000/818627 [00:17<01:14, 8927.20 examples/s]
+Filter: 19%|█▊ | 152000/818627 [00:16<01:14, 8923.76 examples/s]
+Filter: 19%|█▊ | 152000/818627 [00:16<01:14, 8922.08 examples/s]
+Filter: 19%|█▊ | 152000/818627 [00:16<01:14, 8922.20 examples/s]
+Filter: 19%|█▊ | 153000/818627 [00:17<01:15, 8823.62 examples/s]
+Filter: 19%|█▊ | 153000/818627 [00:17<01:15, 8862.35 examples/s]
+Filter: 19%|█▊ | 153000/818627 [00:17<01:15, 8816.67 examples/s]
+Filter: 19%|█▊ | 153000/818627 [00:17<01:15, 8824.11 examples/s]
+Filter: 19%|█▊ | 153000/818627 [00:17<01:15, 8821.11 examples/s]
+Filter: 19%|█▊ | 153000/818627 [00:17<01:15, 8821.86 examples/s]
+Filter: 19%|█▊ | 153000/818627 [00:17<01:15, 8790.06 examples/s]
+Filter: 19%|█▊ | 153000/818627 [00:17<01:15, 8782.58 examples/s]
+Filter: 19%|█▉ | 154000/818627 [00:17<01:17, 8541.30 examples/s]
+Filter: 19%|█▉ | 154000/818627 [00:17<01:17, 8545.65 examples/s]
+Filter: 19%|█▉ | 154000/818627 [00:17<01:17, 8563.12 examples/s]
+Filter: 19%|█▉ | 154000/818627 [00:17<01:17, 8550.45 examples/s]
+Filter: 19%|█▉ | 154000/818627 [00:17<01:17, 8540.53 examples/s]
+Filter: 19%|█▉ | 154000/818627 [00:17<01:17, 8540.88 examples/s]
+Filter: 19%|█▉ | 154000/818627 [00:17<01:17, 8535.52 examples/s]
+Filter: 19%|█▉ | 154000/818627 [00:17<01:18, 8502.77 examples/s]
+Filter: 19%|█▉ | 155000/818627 [00:17<01:17, 8564.50 examples/s]
+Filter: 19%|█▉ | 155000/818627 [00:17<01:17, 8555.99 examples/s]
+Filter: 19%|█▉ | 155000/818627 [00:17<01:17, 8568.64 examples/s]
+Filter: 19%|█▉ | 155000/818627 [00:17<01:17, 8575.87 examples/s]
+Filter: 19%|█▉ | 155000/818627 [00:17<01:17, 8557.09 examples/s]
+Filter: 19%|█▉ | 155000/818627 [00:17<01:17, 8564.60 examples/s]
+Filter: 19%|█▉ | 155000/818627 [00:17<01:17, 8557.11 examples/s]
+Filter: 19%|█▉ | 155000/818627 [00:17<01:17, 8555.94 examples/s]
+Filter: 19%|█▉ | 156000/818627 [00:17<01:17, 8566.39 examples/s]
+Filter: 19%|█▉ | 156000/818627 [00:17<01:17, 8560.96 examples/s]
+Filter: 19%|█▉ | 156000/818627 [00:17<01:17, 8568.45 examples/s]
+Filter: 19%|█▉ | 156000/818627 [00:17<01:17, 8566.75 examples/s]
+Filter: 19%|█▉ | 156000/818627 [00:17<01:17, 8560.73 examples/s]
+Filter: 19%|█▉ | 156000/818627 [00:17<01:17, 8558.98 examples/s]
+Filter: 19%|█▉ | 156000/818627 [00:17<01:17, 8559.33 examples/s]
+Filter: 19%|█▉ | 156000/818627 [00:17<01:17, 8544.09 examples/s]
+Filter: 19%|█▉ | 157000/818627 [00:17<01:16, 8632.21 examples/s]
+Filter: 19%|█▉ | 157000/818627 [00:17<01:16, 8629.09 examples/s]
+Filter: 19%|█▉ | 157000/818627 [00:17<01:16, 8643.77 examples/s]
+Filter: 19%|█▉ | 157000/818627 [00:17<01:16, 8628.27 examples/s]
+Filter: 19%|█▉ | 157000/818627 [00:17<01:16, 8631.29 examples/s]
+Filter: 19%|█▉ | 157000/818627 [00:17<01:16, 8625.39 examples/s]
+Filter: 19%|█▉ | 157000/818627 [00:17<01:16, 8628.94 examples/s]
+Filter: 19%|█▉ | 157000/818627 [00:17<01:16, 8629.13 examples/s]
+Filter: 19%|█▉ | 158000/818627 [00:17<01:13, 9000.84 examples/s]
+Filter: 19%|█▉ | 158000/818627 [00:17<01:13, 9009.71 examples/s]
+Filter: 19%|█▉ | 158000/818627 [00:17<01:13, 8998.18 examples/s]
+Filter: 19%|█▉ | 159000/818627 [00:17<01:13, 9002.16 examples/s]
+Filter: 19%|█▉ | 159000/818627 [00:17<01:13, 8999.97 examples/s]
+Filter: 19%|█▉ | 159000/818627 [00:17<01:13, 9003.35 examples/s]
+Filter: 19%|█▉ | 159000/818627 [00:17<01:13, 9000.01 examples/s]
+Filter: 19%|█▉ | 159000/818627 [00:17<01:13, 9002.32 examples/s]
+Filter: 19%|█▉ | 159000/818627 [00:17<01:13, 8999.35 examples/s]
+Filter: 19%|█▉ | 159000/818627 [00:17<01:13, 8997.37 examples/s]
+Filter: 19%|█▉ | 159000/818627 [00:18<01:13, 8993.70 examples/s]
+Filter: 20%|█▉ | 160000/818627 [00:17<01:13, 8913.03 examples/s]
+Filter: 20%|█▉ | 160000/818627 [00:17<01:14, 8888.75 examples/s]
+Filter: 20%|█▉ | 160000/818627 [00:17<01:13, 8911.74 examples/s]
+Filter: 20%|█▉ | 160000/818627 [00:18<01:13, 8903.27 examples/s]
+Filter: 20%|█▉ | 160000/818627 [00:17<01:14, 8896.02 examples/s]
+Filter: 20%|█▉ | 160000/818627 [00:17<01:13, 8915.66 examples/s]
+Filter: 20%|█▉ | 160000/818627 [00:17<01:13, 8912.65 examples/s]
+Filter: 20%|█▉ | 160000/818627 [00:17<01:13, 8913.84 examples/s]
+Filter: 20%|█▉ | 161000/818627 [00:17<01:14, 8828.90 examples/s]
+Filter: 20%|█▉ | 161000/818627 [00:17<01:14, 8843.94 examples/s]
+Filter: 20%|█▉ | 161000/818627 [00:17<01:14, 8850.48 examples/s]
+Filter: 20%|█▉ | 161000/818627 [00:18<01:14, 8835.26 examples/s]
+Filter: 20%|█▉ | 161000/818627 [00:18<01:14, 8850.37 examples/s]
+Filter: 20%|█▉ | 161000/818627 [00:17<01:14, 8850.53 examples/s]
+Filter: 20%|█▉ | 161000/818627 [00:17<01:14, 8825.65 examples/s]
+Filter: 20%|█▉ | 161000/818627 [00:17<01:14, 8845.74 examples/s]
+Filter: 20%|█▉ | 162000/818627 [00:18<01:14, 8773.16 examples/s]
+Filter: 20%|█▉ | 162000/818627 [00:18<01:14, 8790.39 examples/s]
+Filter: 20%|█▉ | 162000/818627 [00:18<01:14, 8795.45 examples/s]
+Filter: 20%|█▉ | 162000/818627 [00:18<01:14, 8790.82 examples/s]
+Filter: 20%|█▉ | 162000/818627 [00:18<01:14, 8766.85 examples/s]
+Filter: 20%|█▉ | 162000/818627 [00:18<01:14, 8787.79 examples/s]
+Filter: 20%|█▉ | 162000/818627 [00:18<01:14, 8789.73 examples/s]
+Filter: 20%|█▉ | 162000/818627 [00:18<01:17, 8526.45 examples/s]
+Filter: 20%|█▉ | 163000/818627 [00:18<01:14, 8750.02 examples/s]
+Filter: 20%|█▉ | 163000/818627 [00:18<01:14, 8761.76 examples/s]
+Filter: 20%|█▉ | 163000/818627 [00:18<01:14, 8765.61 examples/s]
+Filter: 20%|█▉ | 163000/818627 [00:18<01:14, 8765.94 examples/s]
+Filter: 20%|█▉ | 163000/818627 [00:18<01:14, 8748.34 examples/s]
+Filter: 20%|█▉ | 163000/818627 [00:18<01:14, 8765.61 examples/s]
+Filter: 20%|█▉ | 163000/818627 [00:18<01:14, 8767.15 examples/s]
+Filter: 20%|█▉ | 163000/818627 [00:18<01:14, 8817.59 examples/s]
+Filter: 20%|██ | 164000/818627 [00:18<01:13, 8965.17 examples/s]
+Filter: 20%|██ | 164000/818627 [00:18<01:12, 8968.25 examples/s]
+Filter: 20%|██ | 164000/818627 [00:18<01:13, 8961.36 examples/s]
+Filter: 20%|██ | 164000/818627 [00:18<01:12, 8969.82 examples/s]
+Filter: 20%|██ | 164000/818627 [00:18<01:12, 8968.15 examples/s]
+Filter: 20%|██ | 164000/818627 [00:18<01:13, 8964.31 examples/s]
+Filter: 20%|██ | 164000/818627 [00:18<01:12, 9016.64 examples/s]
+Filter: 20%|██ | 164000/818627 [00:18<01:13, 8964.36 examples/s]
+Filter: 20%|██ | 165000/818627 [00:18<01:10, 9237.08 examples/s]
+Filter: 20%|██ | 165000/818627 [00:18<01:10, 9226.55 examples/s]
+Filter: 20%|██ | 165000/818627 [00:18<01:10, 9226.59 examples/s]
+Filter: 20%|██ | 165000/818627 [00:18<01:10, 9283.48 examples/s]
+Filter: 20%|██ | 165000/818627 [00:18<01:10, 9228.00 examples/s]
+Filter: 20%|██ | 165000/818627 [00:18<01:10, 9234.87 examples/s]
+Filter: 20%|██ | 165000/818627 [00:18<01:10, 9224.27 examples/s]
+Filter: 20%|██ | 165000/818627 [00:18<01:10, 9226.38 examples/s]
+Filter: 20%|██ | 166000/818627 [00:18<01:10, 9220.39 examples/s]
+Filter: 20%|██ | 166000/818627 [00:18<01:10, 9215.31 examples/s]
+Filter: 20%|██ | 166000/818627 [00:18<01:10, 9253.98 examples/s]
+Filter: 20%|██ | 166000/818627 [00:18<01:10, 9211.88 examples/s]
+Filter: 20%|██ | 166000/818627 [00:18<01:10, 9216.13 examples/s]
+Filter: 20%|██ | 166000/818627 [00:18<01:10, 9210.26 examples/s]
+Filter: 20%|██ | 166000/818627 [00:18<01:10, 9210.62 examples/s]
+Filter: 20%|██ | 166000/818627 [00:18<01:10, 9195.14 examples/s]
+Filter: 20%|██ | 167000/818627 [00:18<01:12, 9048.15 examples/s]
+Filter: 20%|██ | 167000/818627 [00:18<01:12, 9048.35 examples/s]
+Filter: 20%|██ | 167000/818627 [00:18<01:11, 9054.50 examples/s]
+Filter: 20%|██ | 167000/818627 [00:18<01:11, 9051.10 examples/s]
+Filter: 20%|██ | 167000/818627 [00:18<01:12, 9048.10 examples/s]
+Filter: 20%|██ | 167000/818627 [00:18<01:12, 9045.60 examples/s]
+Filter: 20%|██ | 167000/818627 [00:18<01:12, 9047.58 examples/s]
+Filter: 20%|██ | 167000/818627 [00:18<01:11, 9054.21 examples/s]
+Filter: 21%|██ | 168000/818627 [00:18<01:13, 8905.30 examples/s]
+Filter: 21%|██ | 168000/818627 [00:18<01:13, 8911.50 examples/s]
+Filter: 21%|██ | 168000/818627 [00:18<01:13, 8908.03 examples/s]
+Filter: 21%|██ | 168000/818627 [00:18<01:13, 8906.51 examples/s]
+Filter: 21%|██ | 168000/818627 [00:18<01:13, 8907.81 examples/s]
+Filter: 21%|██ | 168000/818627 [00:19<01:12, 8915.63 examples/s]
+Filter: 21%|██ | 168000/818627 [00:18<01:13, 8908.66 examples/s]
+Filter: 21%|██ | 168000/818627 [00:18<01:14, 8755.65 examples/s]
+Filter: 21%|██ | 169000/818627 [00:18<01:13, 8826.69 examples/s]
+Filter: 21%|██ | 169000/818627 [00:18<01:13, 8824.79 examples/s]
+Filter: 21%|██ | 169000/818627 [00:18<01:13, 8865.34 examples/s]
+Filter: 21%|██ | 169000/818627 [00:18<01:13, 8825.16 examples/s]
+Filter: 21%|██ | 169000/818627 [00:18<01:13, 8824.56 examples/s]
+Filter: 21%|██ | 169000/818627 [00:18<01:13, 8825.45 examples/s]
+Filter: 21%|██ | 169000/818627 [00:18<01:13, 8827.36 examples/s]
+Filter: 21%|██ | 169000/818627 [00:19<01:13, 8831.49 examples/s]
+Filter: 21%|██ | 170000/818627 [00:18<01:12, 8951.54 examples/s]
+Filter: 21%|██ | 170000/818627 [00:18<01:12, 8953.50 examples/s]
+Filter: 21%|██ | 170000/818627 [00:18<01:12, 8979.15 examples/s]
+Filter: 21%|██ | 170000/818627 [00:18<01:12, 8954.04 examples/s]
+Filter: 21%|██ | 170000/818627 [00:18<01:12, 8950.28 examples/s]
+Filter: 21%|██ | 170000/818627 [00:19<01:12, 8949.51 examples/s]
+Filter: 21%|██ | 170000/818627 [00:18<01:12, 8951.40 examples/s]
+Filter: 21%|██ | 170000/818627 [00:19<01:12, 8954.03 examples/s]
+Filter: 21%|██ | 171000/818627 [00:19<01:10, 9166.00 examples/s]
+Filter: 21%|██ | 171000/818627 [00:19<01:10, 9193.16 examples/s]
+Filter: 21%|██ | 171000/818627 [00:19<01:10, 9166.37 examples/s]
+Filter: 21%|██ | 171000/818627 [00:19<01:10, 9165.74 examples/s]
+Filter: 21%|██ | 171000/818627 [00:19<01:10, 9173.23 examples/s]
+Filter: 21%|██ | 171000/818627 [00:19<01:10, 9166.78 examples/s]
+Filter: 21%|██ | 171000/818627 [00:19<01:10, 9162.71 examples/s]
+Filter: 21%|██ | 171000/818627 [00:19<01:10, 9158.86 examples/s]
+Filter: 21%|██ | 172000/818627 [00:19<01:08, 9395.52 examples/s]
+Filter: 21%|██ | 172000/818627 [00:19<01:08, 9398.86 examples/s]
+Filter: 21%|██ | 172000/818627 [00:19<01:08, 9415.51 examples/s]
+Filter: 21%|██ | 172000/818627 [00:19<01:08, 9396.97 examples/s]
+Filter: 21%|██ | 172000/818627 [00:19<01:08, 9395.97 examples/s]
+Filter: 21%|██ | 173000/818627 [00:19<01:09, 9346.67 examples/s]
+Filter: 21%|██ | 173000/818627 [00:19<01:09, 9351.23 examples/s]
+Filter: 21%|██ | 173000/818627 [00:19<01:08, 9362.20 examples/s]
+Filter: 21%|██ | 173000/818627 [00:19<01:08, 9366.16 examples/s]
+Filter: 21%|██ | 173000/818627 [00:19<01:09, 9344.07 examples/s]
+Filter: 21%|██ | 173000/818627 [00:19<01:08, 9357.15 examples/s]
+Filter: 21%|██ | 173000/818627 [00:19<01:09, 9356.89 examples/s]
+Filter: 21%|██ | 173000/818627 [00:19<01:09, 9345.76 examples/s]
+Filter: 21%|██▏ | 174000/818627 [00:19<01:10, 9149.78 examples/s]
+Filter: 21%|██▏ | 174000/818627 [00:19<01:10, 9136.40 examples/s]
+Filter: 21%|██▏ | 174000/818627 [00:19<01:10, 9133.92 examples/s]
+Filter: 21%|██▏ | 174000/818627 [00:19<01:10, 9183.04 examples/s]
+Filter: 21%|██▏ | 174000/818627 [00:19<01:10, 9137.80 examples/s]
+Filter: 21%|██▏ | 174000/818627 [00:19<01:10, 9181.44 examples/s]
+Filter: 21%|██▏ | 174000/818627 [00:19<01:10, 9135.50 examples/s]
+Filter: 21%|██▏ | 174000/818627 [00:19<01:11, 9077.42 examples/s]
+Filter: 21%|██▏ | 175000/818627 [00:19<01:11, 9034.15 examples/s]
+Filter: 21%|██▏ | 175000/818627 [00:19<01:11, 9035.12 examples/s]
+Filter: 21%|██▏ | 175000/818627 [00:19<01:11, 9038.38 examples/s]
+Filter: 21%|██▏ | 175000/818627 [00:19<01:10, 9083.08 examples/s]
+Filter: 21%|██▏ | 175000/818627 [00:19<01:11, 9035.80 examples/s]
+Filter: 21%|██▏ | 175000/818627 [00:19<01:10, 9081.81 examples/s]
+Filter: 21%|██▏ | 175000/818627 [00:19<01:11, 9035.78 examples/s]
+Filter: 21%|██▏ | 175000/818627 [00:19<01:10, 9104.65 examples/s]
+Filter: 21%|██▏ | 176000/818627 [00:19<01:12, 8887.03 examples/s]
+Filter: 21%|██▏ | 176000/818627 [00:19<01:12, 8875.05 examples/s]
+Filter: 21%|██▏ | 176000/818627 [00:19<01:12, 8879.93 examples/s]
+Filter: 21%|██▏ | 176000/818627 [00:19<01:12, 8887.67 examples/s]
+Filter: 21%|██▏ | 176000/818627 [00:19<01:11, 8960.28 examples/s]
+Filter: 21%|██▏ | 176000/818627 [00:19<01:11, 8930.95 examples/s]
+Filter: 21%|██▏ | 176000/818627 [00:19<01:11, 8927.59 examples/s]
+Filter: 21%|██▏ | 176000/818627 [00:19<01:12, 8881.40 examples/s]
+Filter: 22%|██▏ | 177000/818627 [00:19<01:12, 8852.61 examples/s]
+Filter: 22%|██▏ | 177000/818627 [00:19<01:12, 8851.09 examples/s]
+Filter: 22%|██▏ | 177000/818627 [00:19<01:12, 8851.75 examples/s]
+Filter: 22%|██▏ | 177000/818627 [00:19<01:12, 8881.89 examples/s]
+Filter: 22%|██▏ | 177000/818627 [00:19<01:12, 8882.76 examples/s]
+Filter: 22%|██▏ | 177000/818627 [00:19<01:12, 8845.79 examples/s]
+Filter: 22%|██▏ | 177000/818627 [00:19<01:12, 8845.99 examples/s]
+Filter: 22%|██▏ | 177000/818627 [00:20<01:12, 8893.06 examples/s]
+Filter: 22%|██▏ | 178000/818627 [00:19<01:12, 8793.88 examples/s]
+Filter: 22%|██▏ | 178000/818627 [00:19<01:12, 8798.28 examples/s]
+Filter: 22%|██▏ | 178000/818627 [00:19<01:12, 8791.86 examples/s]
+Filter: 22%|██▏ | 178000/818627 [00:20<01:12, 8838.18 examples/s]
+Filter: 22%|██▏ | 178000/818627 [00:19<01:12, 8820.24 examples/s]
+Filter: 22%|██▏ | 178000/818627 [00:19<01:12, 8792.28 examples/s]
+Filter: 22%|██▏ | 178000/818627 [00:19<01:12, 8820.15 examples/s]
+Filter: 22%|██▏ | 178000/818627 [00:19<01:12, 8796.23 examples/s]
+Filter: 22%|██▏ | 179000/818627 [00:19<01:11, 8884.12 examples/s]
+Filter: 22%|██▏ | 179000/818627 [00:19<01:11, 8888.20 examples/s]
+Filter: 22%|██▏ | 179000/818627 [00:19<01:12, 8882.90 examples/s]
+Filter: 22%|██▏ | 179000/818627 [00:20<01:11, 8914.85 examples/s]
+Filter: 22%|██▏ | 179000/818627 [00:20<01:11, 8885.70 examples/s]
+Filter: 22%|██▏ | 179000/818627 [00:19<01:11, 8900.39 examples/s]
+Filter: 22%|██▏ | 179000/818627 [00:19<01:11, 8898.96 examples/s]
+Filter: 22%|██▏ | 179000/818627 [00:19<01:11, 8883.75 examples/s]
+Filter: 22%|██▏ | 180000/818627 [00:20<01:12, 8803.29 examples/s]
+Filter: 22%|██▏ | 180000/818627 [00:20<01:12, 8804.68 examples/s]
+Filter: 22%|██▏ | 180000/818627 [00:20<01:12, 8801.64 examples/s]
+Filter: 22%|██▏ | 180000/818627 [00:20<01:12, 8825.19 examples/s]
+Filter: 22%|██▏ | 180000/818627 [00:20<01:12, 8815.26 examples/s]
+Filter: 22%|██▏ | 180000/818627 [00:20<01:12, 8814.52 examples/s]
+Filter: 22%|██▏ | 180000/818627 [00:20<01:12, 8798.61 examples/s]
+Filter: 22%|██▏ | 180000/818627 [00:20<01:12, 8798.99 examples/s]
+Filter: 22%|██▏ | 181000/818627 [00:20<01:12, 8741.48 examples/s]
+Filter: 22%|██▏ | 181000/818627 [00:20<01:12, 8743.80 examples/s]
+Filter: 22%|██▏ | 181000/818627 [00:20<01:13, 8733.90 examples/s]
+Filter: 22%|██▏ | 181000/818627 [00:20<01:12, 8756.08 examples/s]
+Filter: 22%|██▏ | 181000/818627 [00:20<01:12, 8751.72 examples/s]
+Filter: 22%|██▏ | 181000/818627 [00:20<01:12, 8746.72 examples/s]
+Filter: 22%|██▏ | 181000/818627 [00:20<01:12, 8739.99 examples/s]
+Filter: 22%|██▏ | 181000/818627 [00:20<01:13, 8708.09 examples/s]
+Filter: 22%|██▏ | 182000/818627 [00:20<01:13, 8692.70 examples/s]
+Filter: 22%|██▏ | 182000/818627 [00:20<01:13, 8691.91 examples/s]
+Filter: 22%|██▏ | 182000/818627 [00:20<01:13, 8708.35 examples/s]
+Filter: 22%|██▏ | 182000/818627 [00:20<01:13, 8701.30 examples/s]
+Filter: 22%|██▏ | 182000/818627 [00:20<01:13, 8701.99 examples/s]
+Filter: 22%|██▏ | 182000/818627 [00:20<01:13, 8678.44 examples/s]
+Filter: 22%|██▏ | 182000/818627 [00:20<01:13, 8691.65 examples/s]
+Filter: 22%|██▏ | 182000/818627 [00:20<01:13, 8695.69 examples/s]
+Filter: 22%|██▏ | 183000/818627 [00:20<01:13, 8636.43 examples/s]
+Filter: 22%|██▏ | 183000/818627 [00:20<01:13, 8633.30 examples/s]
+Filter: 22%|██▏ | 183000/818627 [00:20<01:13, 8638.40 examples/s]
+Filter: 22%|██▏ | 183000/818627 [00:20<01:13, 8647.07 examples/s]
+Filter: 22%|██▏ | 183000/818627 [00:20<01:13, 8638.07 examples/s]
+Filter: 22%|██▏ | 183000/818627 [00:20<01:13, 8632.20 examples/s]
+Filter: 22%|██▏ | 183000/818627 [00:20<01:13, 8614.22 examples/s]
+Filter: 22%|██▏ | 183000/818627 [00:20<01:13, 8612.77 examples/s]
+Filter: 22%|██▏ | 184000/818627 [00:20<01:13, 8678.90 examples/s]
+Filter: 22%|██▏ | 184000/818627 [00:20<01:13, 8682.39 examples/s]
+Filter: 22%|██▏ | 184000/818627 [00:20<01:13, 8688.44 examples/s]
+Filter: 22%|██▏ | 184000/818627 [00:20<01:13, 8673.45 examples/s]
+Filter: 22%|██▏ | 184000/818627 [00:20<01:13, 8682.99 examples/s]
+Filter: 22%|██▏ | 184000/818627 [00:20<01:13, 8690.39 examples/s]
+Filter: 22%|██▏ | 184000/818627 [00:20<01:13, 8687.27 examples/s]
+Filter: 22%|██▏ | 184000/818627 [00:20<01:13, 8676.76 examples/s]
+Filter: 23%|██▎ | 185000/818627 [00:20<01:10, 8964.50 examples/s]
+Filter: 23%|██▎ | 185000/818627 [00:20<01:10, 8968.36 examples/s]
+Filter: 23%|██▎ | 185000/818627 [00:20<01:10, 8963.99 examples/s]
+Filter: 23%|██▎ | 185000/818627 [00:20<01:10, 8967.07 examples/s]
+Filter: 23%|██▎ | 185000/818627 [00:20<01:10, 8979.19 examples/s]
+Filter: 23%|██▎ | 185000/818627 [00:20<01:10, 8970.53 examples/s]
+Filter: 23%|██▎ | 185000/818627 [00:20<01:10, 8967.78 examples/s]
+Filter: 23%|██▎ | 185000/818627 [00:20<01:10, 8973.81 examples/s]
+Filter: 23%|██▎ | 186000/818627 [00:20<01:08, 9215.69 examples/s]
+Filter: 23%|██▎ | 186000/818627 [00:20<01:08, 9218.38 examples/s]
+Filter: 23%|██▎ | 186000/818627 [00:20<01:08, 9215.70 examples/s]
+Filter: 23%|██▎ | 186000/818627 [00:21<01:08, 9220.12 examples/s]
+Filter: 23%|██▎ | 186000/818627 [00:20<01:08, 9222.31 examples/s]
+Filter: 23%|██▎ | 186000/818627 [00:20<01:08, 9218.32 examples/s]
+Filter: 23%|██▎ | 186000/818627 [00:20<01:08, 9220.23 examples/s]
+Filter: 23%|██▎ | 186000/818627 [00:20<01:08, 9216.11 examples/s]
+Filter: 23%|██▎ | 187000/818627 [00:20<01:08, 9186.68 examples/s]
+Filter: 23%|██▎ | 187000/818627 [00:20<01:08, 9190.89 examples/s]
+Filter: 23%|██▎ | 187000/818627 [00:20<01:08, 9185.91 examples/s]
+Filter: 23%|██▎ | 187000/818627 [00:21<01:08, 9186.90 examples/s]
+Filter: 23%|██▎ | 187000/818627 [00:20<01:08, 9185.49 examples/s]
+Filter: 23%|██▎ | 187000/818627 [00:20<01:08, 9186.43 examples/s]
+Filter: 23%|██▎ | 187000/818627 [00:20<01:08, 9185.56 examples/s]
+Filter: 23%|██▎ | 187000/818627 [00:20<01:08, 9181.93 examples/s]
+Filter: 23%|██▎ | 188000/818627 [00:20<01:10, 9006.68 examples/s]
+Filter: 23%|██▎ | 188000/818627 [00:20<01:09, 9014.13 examples/s]
+Filter: 23%|██▎ | 188000/818627 [00:20<01:09, 9010.00 examples/s]
+Filter: 23%|██▎ | 188000/818627 [00:21<01:09, 9016.40 examples/s]
+Filter: 23%|██▎ | 188000/818627 [00:21<01:09, 9013.29 examples/s]
+Filter: 23%|██▎ | 188000/818627 [00:20<01:09, 9012.88 examples/s]
+Filter: 23%|██▎ | 188000/818627 [00:20<01:09, 9009.26 examples/s]
+Filter: 23%|██▎ | 188000/818627 [00:20<01:10, 9007.40 examples/s]
+Filter: 23%|██▎ | 189000/818627 [00:21<01:10, 8928.47 examples/s]
+Filter: 23%|██▎ | 189000/818627 [00:21<01:10, 8925.12 examples/s]
+Filter: 23%|██▎ | 189000/818627 [00:21<01:10, 8923.34 examples/s]
+Filter: 23%|██▎ | 189000/818627 [00:21<01:10, 8932.31 examples/s]
+Filter: 23%|██▎ | 189000/818627 [00:21<01:10, 8930.53 examples/s]
+Filter: 23%|██▎ | 189000/818627 [00:21<01:10, 8931.12 examples/s]
+Filter: 23%|██▎ | 189000/818627 [00:21<01:10, 8926.00 examples/s]
+Filter: 23%|██▎ | 189000/818627 [00:21<01:10, 8884.42 examples/s]
+Filter: 23%|██▎ | 190000/818627 [00:21<01:11, 8848.70 examples/s]
+Filter: 23%|██▎ | 190000/818627 [00:21<01:11, 8849.25 examples/s]
+Filter: 23%|██▎ | 190000/818627 [00:21<01:11, 8849.37 examples/s]
+Filter: 23%|██▎ | 190000/818627 [00:21<01:10, 8862.22 examples/s]
+Filter: 23%|██▎ | 190000/818627 [00:21<01:11, 8846.85 examples/s]
+Filter: 23%|██▎ | 190000/818627 [00:21<01:11, 8846.12 examples/s]
+Filter: 23%|██▎ | 190000/818627 [00:21<01:11, 8844.65 examples/s]
+Filter: 23%|██▎ | 190000/818627 [00:21<01:11, 8816.38 examples/s]
+Filter: 23%|██▎ | 191000/818627 [00:21<01:09, 9077.65 examples/s]
+Filter: 23%|██▎ | 191000/818627 [00:21<01:09, 9075.32 examples/s]
+Filter: 23%|██▎ | 191000/818627 [00:21<01:09, 9077.32 examples/s]
+Filter: 23%|██▎ | 191000/818627 [00:21<01:09, 9084.86 examples/s]
+Filter: 23%|██▎ | 191000/818627 [00:21<01:09, 9082.11 examples/s]
+Filter: 23%|██▎ | 191000/818627 [00:21<01:09, 9080.48 examples/s]
+Filter: 23%|██▎ | 191000/818627 [00:21<01:09, 9088.85 examples/s]
+Filter: 23%|██▎ | 191000/818627 [00:21<01:09, 9079.72 examples/s]
+Filter: 24%|██▎ | 193000/818627 [00:21<01:07, 9301.11 examples/s]
+Filter: 24%|██▎ | 193000/818627 [00:21<01:07, 9303.07 examples/s]
+Filter: 24%|██▎ | 193000/818627 [00:21<01:07, 9298.95 examples/s]
+Filter: 24%|██▎ | 193000/818627 [00:21<01:07, 9304.66 examples/s]
+Filter: 24%|██▎ | 193000/818627 [00:21<01:07, 9311.63 examples/s]
+Filter: 24%|██▎ | 193000/818627 [00:21<01:07, 9301.02 examples/s]
+Filter: 24%|██▎ | 193000/818627 [00:21<01:07, 9302.49 examples/s]
+Filter: 24%|██▎ | 193000/818627 [00:21<01:07, 9215.58 examples/s]
+Filter: 24%|██▎ | 194000/818627 [00:21<01:08, 9144.62 examples/s]
+Filter: 24%|██▎ | 194000/818627 [00:21<01:08, 9146.24 examples/s]
+Filter: 24%|██▎ | 194000/818627 [00:21<01:08, 9149.86 examples/s]
+Filter: 24%|██▎ | 194000/818627 [00:21<01:08, 9149.77 examples/s]
+Filter: 24%|██▎ | 194000/818627 [00:21<01:08, 9146.03 examples/s]
+Filter: 24%|██▎ | 194000/818627 [00:21<01:08, 9169.08 examples/s]
+Filter: 24%|██▎ | 194000/818627 [00:21<01:08, 9142.03 examples/s]
+Filter: 24%|██▎ | 194000/818627 [00:21<01:08, 9109.64 examples/s]
+Filter: 24%|██▍ | 195000/818627 [00:21<01:09, 8972.21 examples/s]
+Filter: 24%|██▍ | 195000/818627 [00:21<01:09, 8973.08 examples/s]
+Filter: 24%|██▍ | 195000/818627 [00:21<01:09, 8977.49 examples/s]
+Filter: 24%|██▍ | 195000/818627 [00:22<01:09, 8976.35 examples/s]
+Filter: 24%|██▍ | 195000/818627 [00:21<01:09, 8973.97 examples/s]
+Filter: 24%|██▍ | 195000/818627 [00:21<01:09, 8970.68 examples/s]
+Filter: 24%|██▍ | 195000/818627 [00:21<01:09, 8987.61 examples/s]
+Filter: 24%|██▍ | 195000/818627 [00:21<01:09, 8968.52 examples/s]
+Filter: 24%|██▍ | 196000/818627 [00:21<01:09, 8911.35 examples/s]
+Filter: 24%|██▍ | 196000/818627 [00:21<01:09, 8904.65 examples/s]
+Filter: 24%|██▍ | 196000/818627 [00:21<01:09, 8906.27 examples/s]
+Filter: 24%|██▍ | 196000/818627 [00:22<01:09, 8907.22 examples/s]
+Filter: 24%|██▍ | 196000/818627 [00:21<01:09, 8903.49 examples/s]
+Filter: 24%|██▍ | 196000/818627 [00:21<01:09, 8919.37 examples/s]
+Filter: 24%|██▍ | 196000/818627 [00:21<01:09, 8904.27 examples/s]
+Filter: 24%|██▍ | 196000/818627 [00:21<01:09, 8903.35 examples/s]
+Filter: 24%|██▍ | 197000/818627 [00:21<01:10, 8837.83 examples/s]
+Filter: 24%|██▍ | 197000/818627 [00:21<01:10, 8833.32 examples/s]
+Filter: 24%|██▍ | 197000/818627 [00:21<01:10, 8829.19 examples/s]
+Filter: 24%|██▍ | 197000/818627 [00:22<01:10, 8833.17 examples/s]
+Filter: 24%|██▍ | 197000/818627 [00:21<01:10, 8843.68 examples/s]
+Filter: 24%|██▍ | 197000/818627 [00:21<01:10, 8831.79 examples/s]
+Filter: 24%|██▍ | 197000/818627 [00:21<01:10, 8833.20 examples/s]
+Filter: 24%|██▍ | 197000/818627 [00:22<01:10, 8790.03 examples/s]
+Filter: 24%|██▍ | 198000/818627 [00:22<01:08, 9033.31 examples/s]
+Filter: 24%|██▍ | 198000/818627 [00:22<01:08, 9030.93 examples/s]
+Filter: 24%|██▍ | 198000/818627 [00:22<01:08, 9031.72 examples/s]
+Filter: 24%|██▍ | 198000/818627 [00:22<01:08, 9042.02 examples/s]
+Filter: 24%|██▍ | 198000/818627 [00:22<01:08, 9040.90 examples/s]
+Filter: 24%|██▍ | 198000/818627 [00:22<01:08, 9031.66 examples/s]
+Filter: 24%|██▍ | 198000/818627 [00:22<01:08, 9033.04 examples/s]
+Filter: 24%|██▍ | 198000/818627 [00:22<01:08, 9032.56 examples/s]
+Filter: 24%|██▍ | 199000/818627 [00:22<01:09, 8910.62 examples/s]
+Filter: 24%|██▍ | 199000/818627 [00:22<01:09, 8908.80 examples/s]
+Filter: 24%|██▍ | 199000/818627 [00:22<01:09, 8909.79 examples/s]
+Filter: 24%|██▍ | 199000/818627 [00:22<01:09, 8911.10 examples/s]
+Filter: 24%|██▍ | 199000/818627 [00:22<01:09, 8913.58 examples/s]
+Filter: 24%|██▍ | 199000/818627 [00:22<01:09, 8907.65 examples/s]
+Filter: 24%|██▍ | 199000/818627 [00:22<01:09, 8911.20 examples/s]
+Filter: 24%|██▍ | 199000/818627 [00:22<01:09, 8906.78 examples/s]
+Filter: 24%|██▍ | 200000/818627 [00:22<01:09, 8947.39 examples/s]
+Filter: 24%|██▍ | 200000/818627 [00:22<01:09, 8943.10 examples/s]
+Filter: 24%|██▍ | 200000/818627 [00:22<01:09, 8943.85 examples/s]
+Filter: 24%|██▍ | 200000/818627 [00:22<01:09, 8952.07 examples/s]
+Filter: 24%|██▍ | 200000/818627 [00:22<01:09, 8946.38 examples/s]
+Filter: 24%|██▍ | 200000/818627 [00:22<01:09, 8950.42 examples/s]
+Filter: 24%|██▍ | 200000/818627 [00:22<01:09, 8942.57 examples/s]
+Filter: 24%|██▍ | 200000/818627 [00:22<01:09, 8942.60 examples/s]
+Filter: 25%|██▍ | 201000/818627 [00:22<01:09, 8903.09 examples/s]
+Filter: 25%|██▍ | 201000/818627 [00:22<01:09, 8903.31 examples/s]
+Filter: 25%|██▍ | 201000/818627 [00:22<01:09, 8899.69 examples/s]
+Filter: 25%|██▍ | 201000/818627 [00:22<01:09, 8907.27 examples/s]
+Filter: 25%|██▍ | 201000/818627 [00:22<01:09, 8904.86 examples/s]
+Filter: 25%|██▍ | 201000/818627 [00:22<01:09, 8900.53 examples/s]
+Filter: 25%|██▍ | 201000/818627 [00:22<01:09, 8901.87 examples/s]
+Filter: 25%|██▍ | 201000/818627 [00:22<01:09, 8902.24 examples/s]
+Filter: 25%|██▍ | 202000/818627 [00:22<01:09, 8823.48 examples/s]
+Filter: 25%|██▍ | 202000/818627 [00:22<01:09, 8821.95 examples/s]
+Filter: 25%|██▍ | 202000/818627 [00:22<01:09, 8822.04 examples/s]
+Filter: 25%|██▍ | 202000/818627 [00:22<01:09, 8823.11 examples/s]
+Filter: 25%|██▍ | 202000/818627 [00:22<01:09, 8821.93 examples/s]
+Filter: 25%|██▍ | 202000/818627 [00:22<01:09, 8821.51 examples/s]
+Filter: 25%|██▍ | 202000/818627 [00:22<01:09, 8811.52 examples/s]
+Filter: 25%|██▍ | 202000/818627 [00:22<01:10, 8771.30 examples/s]
+Filter: 25%|██▍ | 203000/818627 [00:22<01:09, 8847.38 examples/s]
+Filter: 25%|██▍ | 203000/818627 [00:22<01:09, 8832.58 examples/s]
+Filter: 25%|██▍ | 203000/818627 [00:22<01:09, 8828.37 examples/s]
+Filter: 25%|██▍ | 203000/818627 [00:22<01:09, 8835.98 examples/s]
+Filter: 25%|██▍ | 203000/818627 [00:22<01:09, 8834.24 examples/s]
+Filter: 25%|██▍ | 203000/818627 [00:22<01:09, 8832.82 examples/s]
+Filter: 25%|██▍ | 203000/818627 [00:22<01:09, 8833.22 examples/s]
+Filter: 25%|██▍ | 203000/818627 [00:22<01:09, 8834.26 examples/s]
+Filter: 25%|██▍ | 204000/818627 [00:22<01:09, 8833.65 examples/s]
+Filter: 25%|██▍ | 204000/818627 [00:22<01:09, 8838.28 examples/s]
+Filter: 25%|██▍ | 204000/818627 [00:22<01:09, 8828.17 examples/s]
+Filter: 25%|██▍ | 204000/818627 [00:23<01:09, 8830.52 examples/s]
+Filter: 25%|██▍ | 204000/818627 [00:22<01:09, 8830.20 examples/s]
+Filter: 25%|██▍ | 204000/818627 [00:22<01:09, 8831.05 examples/s]
+Filter: 25%|██▍ | 204000/818627 [00:22<01:09, 8828.47 examples/s]
+Filter: 25%|██▍ | 204000/818627 [00:22<01:09, 8830.57 examples/s]
+Filter: 25%|██▌ | 205000/818627 [00:22<01:12, 8509.38 examples/s]
+Filter: 25%|██▌ | 205000/818627 [00:22<01:12, 8511.06 examples/s]
+Filter: 25%|██▌ | 205000/818627 [00:22<01:12, 8503.36 examples/s]
+Filter: 25%|██▌ | 205000/818627 [00:22<01:12, 8509.55 examples/s]
+Filter: 25%|██▌ | 205000/818627 [00:23<01:12, 8506.11 examples/s]
+Filter: 25%|██▌ | 205000/818627 [00:22<01:12, 8505.29 examples/s]
+Filter: 25%|██▌ | 205000/818627 [00:22<01:12, 8508.22 examples/s]
+Filter: 25%|██▌ | 205000/818627 [00:22<01:12, 8505.42 examples/s]
+Filter: 25%|██▌ | 206000/818627 [00:22<01:12, 8494.70 examples/s]
+Filter: 25%|██▌ | 206000/818627 [00:22<01:12, 8496.06 examples/s]
+Filter: 25%|██▌ | 206000/818627 [00:22<01:12, 8490.82 examples/s]
+Filter: 25%|██▌ | 206000/818627 [00:22<01:12, 8497.38 examples/s]
+Filter: 25%|██▌ | 206000/818627 [00:23<01:12, 8496.13 examples/s]
+Filter: 25%|██▌ | 206000/818627 [00:23<01:12, 8494.02 examples/s]
+Filter: 25%|██▌ | 206000/818627 [00:22<01:12, 8495.19 examples/s]
+Filter: 25%|██▌ | 206000/818627 [00:22<01:12, 8493.05 examples/s]
+Filter: 25%|██▌ | 207000/818627 [00:23<01:11, 8540.82 examples/s]
+Filter: 25%|██▌ | 207000/818627 [00:23<01:11, 8539.86 examples/s]
+Filter: 25%|██▌ | 207000/818627 [00:23<01:11, 8540.38 examples/s]
+Filter: 25%|██▌ | 207000/818627 [00:23<01:11, 8539.34 examples/s]
+Filter: 25%|██▌ | 207000/818627 [00:23<01:11, 8540.20 examples/s]
+Filter: 25%|██▌ | 207000/818627 [00:23<01:11, 8539.07 examples/s]
+Filter: 25%|██▌ | 207000/818627 [00:23<01:11, 8540.96 examples/s]
+Filter: 25%|██▌ | 207000/818627 [00:23<01:13, 8329.91 examples/s]
+Filter: 25%|██▌ | 208000/818627 [00:23<01:10, 8649.70 examples/s]
+Filter: 25%|██▌ | 208000/818627 [00:23<01:10, 8641.81 examples/s]
+Filter: 25%|██▌ | 208000/818627 [00:23<01:10, 8643.88 examples/s]
+Filter: 25%|██▌ | 208000/818627 [00:23<01:10, 8711.86 examples/s]
+Filter: 25%|██▌ | 208000/818627 [00:23<01:10, 8643.04 examples/s]
+Filter: 25%|██▌ | 208000/818627 [00:23<01:10, 8642.08 examples/s]
+Filter: 25%|██▌ | 208000/818627 [00:23<01:10, 8641.42 examples/s]
+Filter: 25%|██▌ | 208000/818627 [00:23<01:10, 8642.09 examples/s]
+Filter: 26%|██▌ | 209000/818627 [00:23<01:07, 9010.34 examples/s]
+Filter: 26%|██▌ | 209000/818627 [00:23<01:07, 9005.89 examples/s]
+Filter: 26%|██▌ | 209000/818627 [00:23<01:07, 8985.48 examples/s]
+Filter: 26%|██▌ | 209000/818627 [00:23<01:07, 8985.13 examples/s]
+Filter: 26%|██▌ | 209000/818627 [00:23<01:07, 8984.21 examples/s]
+Filter: 26%|██▌ | 209000/818627 [00:23<01:08, 8957.67 examples/s]
+Filter: 26%|██▌ | 209000/818627 [00:23<01:07, 8968.18 examples/s]
+Filter: 26%|██▌ | 210000/818627 [00:23<01:07, 9028.57 examples/s]
+Filter: 26%|██▌ | 210000/818627 [00:23<01:07, 9038.55 examples/s]
+Filter: 26%|██▌ | 210000/818627 [00:23<01:07, 9067.62 examples/s]
+Filter: 26%|██▌ | 210000/818627 [00:23<01:07, 9023.72 examples/s]
+Filter: 26%|██▌ | 210000/818627 [00:23<01:07, 9029.17 examples/s]
+Filter: 26%|██▌ | 210000/818627 [00:23<01:07, 9035.88 examples/s]
+Filter: 26%|██▌ | 210000/818627 [00:23<01:07, 9029.08 examples/s]
+Filter: 26%|██▌ | 210000/818627 [00:23<01:07, 9029.37 examples/s]
+Filter: 26%|██▌ | 211000/818627 [00:23<01:08, 8913.75 examples/s]
+Filter: 26%|██▌ | 211000/818627 [00:23<01:08, 8905.56 examples/s]
+Filter: 26%|██▌ | 211000/818627 [00:23<01:08, 8900.12 examples/s]
+Filter: 26%|██▌ | 211000/818627 [00:23<01:08, 8913.78 examples/s]
+Filter: 26%|██▌ | 211000/818627 [00:23<01:08, 8908.80 examples/s]
+Filter: 26%|██▌ | 211000/818627 [00:23<01:08, 8908.05 examples/s]
+Filter: 26%|██▌ | 211000/818627 [00:23<01:07, 8943.54 examples/s]
+Filter: 26%|██▌ | 211000/818627 [00:23<01:08, 8907.34 examples/s]
+Filter: 26%|██▌ | 212000/818627 [00:23<01:08, 8816.74 examples/s]
+Filter: 26%|██▌ | 212000/818627 [00:23<01:08, 8814.01 examples/s]
+Filter: 26%|██▌ | 212000/818627 [00:23<01:08, 8864.97 examples/s]
+Filter: 26%|██▌ | 212000/818627 [00:23<01:08, 8810.79 examples/s]
+Filter: 26%|██▌ | 212000/818627 [00:23<01:08, 8816.22 examples/s]
+Filter: 26%|██▌ | 212000/818627 [00:23<01:08, 8815.15 examples/s]
+Filter: 26%|██▌ | 212000/818627 [00:23<01:08, 8813.70 examples/s]
+Filter: 26%|██▌ | 212000/818627 [00:23<01:08, 8812.70 examples/s]
+Filter: 26%|██▌ | 213000/818627 [00:23<01:09, 8731.87 examples/s]
+Filter: 26%|██▌ | 213000/818627 [00:23<01:09, 8728.14 examples/s]
+Filter: 26%|██▌ | 213000/818627 [00:23<01:09, 8725.48 examples/s]
+Filter: 26%|██▌ | 213000/818627 [00:24<01:09, 8769.47 examples/s]
+Filter: 26%|██▌ | 213000/818627 [00:23<01:09, 8725.72 examples/s]
+Filter: 26%|██▌ | 213000/818627 [00:23<01:09, 8728.48 examples/s]
+Filter: 26%|██▌ | 213000/818627 [00:23<01:09, 8724.78 examples/s]
+Filter: 26%|██▌ | 213000/818627 [00:23<01:09, 8726.92 examples/s]
+Filter: 26%|██▌ | 214000/818627 [00:23<01:09, 8718.13 examples/s]
+Filter: 26%|██▌ | 214000/818627 [00:23<01:09, 8717.19 examples/s]
+Filter: 26%|██▌ | 214000/818627 [00:24<01:09, 8749.34 examples/s]
+Filter: 26%|██▌ | 214000/818627 [00:23<01:09, 8714.69 examples/s]
+Filter: 26%|██▌ | 214000/818627 [00:23<01:09, 8717.36 examples/s]
+Filter: 26%|██▌ | 214000/818627 [00:23<01:09, 8719.17 examples/s]
+Filter: 26%|██▌ | 214000/818627 [00:23<01:09, 8719.47 examples/s]
+Filter: 26%|██▌ | 214000/818627 [00:23<01:09, 8697.16 examples/s]
+Filter: 26%|██▋ | 215000/818627 [00:24<01:09, 8743.29 examples/s]
+Filter: 26%|██▋ | 215000/818627 [00:24<01:09, 8742.35 examples/s]
+Filter: 26%|██▋ | 215000/818627 [00:24<01:08, 8764.02 examples/s]
+Filter: 26%|██▋ | 215000/818627 [00:24<01:08, 8749.54 examples/s]
+Filter: 26%|██▋ | 215000/818627 [00:23<01:09, 8744.20 examples/s]
+Filter: 26%|██▋ | 215000/818627 [00:24<01:09, 8744.15 examples/s]
+Filter: 26%|██▋ | 215000/818627 [00:23<01:09, 8738.13 examples/s]
+Filter: 26%|██▋ | 215000/818627 [00:24<01:09, 8700.96 examples/s]
+Filter: 26%|██▋ | 216000/818627 [00:24<01:09, 8733.31 examples/s]
+Filter: 26%|██▋ | 216000/818627 [00:24<01:09, 8731.34 examples/s]
+Filter: 26%|██▋ | 216000/818627 [00:24<01:08, 8739.18 examples/s]
+Filter: 26%|██▋ | 216000/818627 [00:24<01:08, 8738.08 examples/s]
+Filter: 26%|██▋ | 216000/818627 [00:24<01:08, 8733.91 examples/s]
+Filter: 26%|██▋ | 216000/818627 [00:24<01:09, 8732.56 examples/s]
+Filter: 26%|██▋ | 216000/818627 [00:24<01:08, 8735.33 examples/s]
+Filter: 26%|██▋ | 216000/818627 [00:24<01:09, 8731.57 examples/s]
+Filter: 27%|██▋ | 217000/818627 [00:24<01:08, 8726.10 examples/s]
+Filter: 27%|██▋ | 217000/818627 [00:24<01:08, 8725.64 examples/s]
+Filter: 27%|██▋ | 217000/818627 [00:24<01:08, 8735.35 examples/s]
+Filter: 27%|██▋ | 217000/818627 [00:24<01:08, 8728.33 examples/s]
+Filter: 27%|██▋ | 217000/818627 [00:24<01:08, 8727.80 examples/s]
+Filter: 27%|██▋ | 217000/818627 [00:24<01:08, 8727.01 examples/s]
+Filter: 27%|██▋ | 217000/818627 [00:24<01:08, 8728.46 examples/s]
+Filter: 27%|██▋ | 217000/818627 [00:24<01:08, 8721.98 examples/s]
+Filter: 27%|██▋ | 218000/818627 [00:24<01:08, 8705.44 examples/s]
+Filter: 27%|██▋ | 218000/818627 [00:24<01:08, 8705.32 examples/s]
+Filter: 27%|██▋ | 218000/818627 [00:24<01:08, 8710.23 examples/s]
+Filter: 27%|██▋ | 218000/818627 [00:24<01:08, 8711.67 examples/s]
+Filter: 27%|██▋ | 218000/818627 [00:24<01:08, 8708.23 examples/s]
+Filter: 27%|██▋ | 218000/818627 [00:24<01:08, 8705.11 examples/s]
+Filter: 27%|██▋ | 218000/818627 [00:24<01:08, 8705.79 examples/s]
+Filter: 27%|██▋ | 218000/818627 [00:24<01:09, 8703.50 examples/s]
+Filter: 27%|██▋ | 219000/818627 [00:24<01:09, 8664.48 examples/s]
+Filter: 27%|██▋ | 219000/818627 [00:24<01:09, 8662.92 examples/s]
+Filter: 27%|██▋ | 219000/818627 [00:24<01:09, 8669.06 examples/s]
+Filter: 27%|██▋ | 219000/818627 [00:24<01:09, 8669.41 examples/s]
+Filter: 27%|██▋ | 219000/818627 [00:24<01:09, 8662.32 examples/s]
+Filter: 27%|██▋ | 219000/818627 [00:24<01:09, 8663.34 examples/s]
+Filter: 27%|██▋ | 219000/818627 [00:24<01:09, 8662.45 examples/s]
+Filter: 27%|██▋ | 219000/818627 [00:24<01:09, 8660.87 examples/s]
+Filter: 27%|██▋ | 220000/818627 [00:24<01:09, 8661.10 examples/s]
+Filter: 27%|██▋ | 220000/818627 [00:24<01:09, 8668.64 examples/s]
+Filter: 27%|██▋ | 220000/818627 [00:24<01:09, 8667.50 examples/s]
+Filter: 27%|██▋ | 220000/818627 [00:24<01:09, 8653.71 examples/s]
+Filter: 27%|██▋ | 220000/818627 [00:24<01:09, 8665.01 examples/s]
+Filter: 27%|██▋ | 220000/818627 [00:24<01:09, 8663.71 examples/s]
+Filter: 27%|██▋ | 220000/818627 [00:24<01:09, 8662.10 examples/s]
+Filter: 27%|██▋ | 220000/818627 [00:24<01:09, 8660.21 examples/s]
+Filter: 27%|██▋ | 221000/818627 [00:24<01:08, 8690.31 examples/s]
+Filter: 27%|██▋ | 221000/818627 [00:24<01:08, 8684.98 examples/s]
+Filter: 27%|██▋ | 221000/818627 [00:25<01:08, 8688.37 examples/s]
+Filter: 27%|██▋ | 221000/818627 [00:24<01:08, 8677.43 examples/s]
+Filter: 27%|██▋ | 221000/818627 [00:24<01:08, 8687.99 examples/s]
+Filter: 27%|██▋ | 221000/818627 [00:24<01:08, 8686.52 examples/s]
+Filter: 27%|██▋ | 221000/818627 [00:24<01:08, 8686.32 examples/s]
+Filter: 27%|██▋ | 221000/818627 [00:24<01:08, 8686.24 examples/s]
+Filter: 27%|██▋ | 222000/818627 [00:24<01:06, 9014.77 examples/s]
+Filter: 27%|██▋ | 222000/818627 [00:24<01:06, 9012.75 examples/s]
+Filter: 27%|██▋ | 222000/818627 [00:24<01:06, 9012.42 examples/s]
+Filter: 27%|██▋ | 222000/818627 [00:24<01:06, 9012.25 examples/s]
+Filter: 27%|██▋ | 222000/818627 [00:24<01:06, 9012.55 examples/s]
+Filter: 27%|██▋ | 222000/818627 [00:24<01:06, 9010.56 examples/s]
+Filter: 27%|██▋ | 222000/818627 [00:25<01:06, 9002.59 examples/s]
+Filter: 27%|██▋ | 222000/818627 [00:24<01:06, 9012.19 examples/s]
+Filter: 27%|██▋ | 223000/818627 [00:24<01:05, 9041.11 examples/s]
+Filter: 27%|██▋ | 223000/818627 [00:24<01:05, 9038.30 examples/s]
+Filter: 27%|██▋ | 223000/818627 [00:24<01:05, 9034.86 examples/s]
+Filter: 27%|██▋ | 223000/818627 [00:25<01:05, 9040.68 examples/s]
+Filter: 27%|██▋ | 223000/818627 [00:24<01:05, 9039.83 examples/s]
+Filter: 27%|██▋ | 223000/818627 [00:25<01:05, 9033.16 examples/s]
+Filter: 27%|██▋ | 223000/818627 [00:24<01:05, 9035.67 examples/s]
+Filter: 27%|██▋ | 223000/818627 [00:24<01:05, 9036.08 examples/s]
+Filter: 27%|██▋ | 224000/818627 [00:25<01:05, 9088.66 examples/s]
+Filter: 27%|██▋ | 224000/818627 [00:25<01:05, 9094.59 examples/s]
+Filter: 27%|██▋ | 224000/818627 [00:25<01:05, 9082.18 examples/s]
+Filter: 27%|██▋ | 224000/818627 [00:25<01:05, 9090.61 examples/s]
+Filter: 27%|██▋ | 224000/818627 [00:25<01:05, 9086.23 examples/s]
+Filter: 27%|██▋ | 224000/818627 [00:25<01:05, 9065.05 examples/s]
+Filter: 27%|██▋ | 224000/818627 [00:25<01:05, 9079.64 examples/s]
+Filter: 27%|██▋ | 224000/818627 [00:25<01:05, 9066.36 examples/s]
+Filter: 27%|██▋ | 225000/818627 [00:25<01:06, 8918.03 examples/s]
+Filter: 27%|██▋ | 225000/818627 [00:25<01:06, 8920.03 examples/s]
+Filter: 27%|██▋ | 225000/818627 [00:25<01:06, 8920.07 examples/s]
+Filter: 27%|██▋ | 225000/818627 [00:25<01:06, 8920.12 examples/s]
+Filter: 27%|██▋ | 225000/818627 [00:25<01:06, 8912.60 examples/s]
+Filter: 27%|██▋ | 225000/818627 [00:25<01:06, 8918.94 examples/s]
+Filter: 27%|██▋ | 225000/818627 [00:25<01:06, 8912.68 examples/s]
+Filter: 27%|██▋ | 225000/818627 [00:25<01:06, 8916.15 examples/s]
+Filter: 28%|██▊ | 226000/818627 [00:25<01:07, 8798.09 examples/s]
+Filter: 28%|██▊ | 226000/818627 [00:25<01:07, 8802.42 examples/s]
+Filter: 28%|██▊ | 226000/818627 [00:25<01:07, 8798.74 examples/s]
+Filter: 28%|██▊ | 226000/818627 [00:25<01:07, 8798.94 examples/s]
+Filter: 28%|██▊ | 226000/818627 [00:25<01:07, 8797.06 examples/s]
+Filter: 28%|██▊ | 226000/818627 [00:25<01:07, 8792.90 examples/s]
+Filter: 28%|██▊ | 226000/818627 [00:25<01:07, 8790.40 examples/s]
+Filter: 28%|██▊ | 226000/818627 [00:25<01:07, 8793.30 examples/s]
+Filter: 28%|██▊ | 227000/818627 [00:25<01:08, 8695.49 examples/s]
+Filter: 28%|██▊ | 227000/818627 [00:25<01:08, 8688.96 examples/s]
+Filter: 28%|██▊ | 227000/818627 [00:25<01:08, 8691.77 examples/s]
+Filter: 28%|██▊ | 227000/818627 [00:25<01:08, 8693.54 examples/s]
+Filter: 28%|██▊ | 227000/818627 [00:25<01:08, 8687.83 examples/s]
+Filter: 28%|██▊ | 227000/818627 [00:25<01:08, 8687.43 examples/s]
+Filter: 28%|██▊ | 227000/818627 [00:25<01:08, 8688.87 examples/s]
+Filter: 28%|██▊ | 227000/818627 [00:25<01:08, 8690.32 examples/s]
+Filter: 28%|██▊ | 228000/818627 [00:25<01:07, 8695.41 examples/s]
+Filter: 28%|██▊ | 228000/818627 [00:25<01:07, 8696.79 examples/s]
+Filter: 28%|██▊ | 228000/818627 [00:25<01:07, 8693.02 examples/s]
+Filter: 28%|██▊ | 228000/818627 [00:25<01:07, 8696.15 examples/s]
+Filter: 28%|██▊ | 228000/818627 [00:25<01:07, 8692.17 examples/s]
+Filter: 28%|██▊ | 228000/818627 [00:25<01:07, 8694.19 examples/s]
+Filter: 28%|██▊ | 228000/818627 [00:25<01:07, 8691.72 examples/s]
+Filter: 28%|██▊ | 228000/818627 [00:25<01:07, 8693.16 examples/s]
+Filter: 28%|██▊ | 229000/818627 [00:25<01:07, 8687.92 examples/s]
+Filter: 28%|██▊ | 229000/818627 [00:25<01:07, 8685.97 examples/s]
+Filter: 28%|██▊ | 229000/818627 [00:25<01:07, 8682.54 examples/s]
+Filter: 28%|██▊ | 229000/818627 [00:25<01:07, 8687.13 examples/s]
+Filter: 28%|██▊ | 229000/818627 [00:25<01:07, 8687.15 examples/s]
+Filter: 28%|██▊ | 229000/818627 [00:25<01:07, 8682.56 examples/s]
+Filter: 28%|██▊ | 229000/818627 [00:25<01:07, 8681.87 examples/s]
+Filter: 28%|██▊ | 229000/818627 [00:25<01:08, 8640.40 examples/s]
+Filter: 28%|██▊ | 230000/818627 [00:25<01:08, 8647.98 examples/s]
+Filter: 28%|██▊ | 230000/818627 [00:25<01:08, 8648.25 examples/s]
+Filter: 28%|██▊ | 230000/818627 [00:25<01:08, 8648.26 examples/s]
+Filter: 28%|██▊ | 230000/818627 [00:26<01:07, 8658.54 examples/s]
+Filter: 28%|██▊ | 230000/818627 [00:25<01:08, 8650.42 examples/s]
+Filter: 28%|██▊ | 230000/818627 [00:25<01:08, 8649.71 examples/s]
+Filter: 28%|██▊ | 230000/818627 [00:25<01:08, 8648.51 examples/s]
+Filter: 28%|██▊ | 230000/818627 [00:25<01:08, 8650.41 examples/s]
+Filter: 28%|██▊ | 231000/818627 [00:25<01:07, 8646.41 examples/s]
+Filter: 28%|██▊ | 231000/818627 [00:25<01:07, 8649.18 examples/s]
+Filter: 28%|██▊ | 231000/818627 [00:25<01:08, 8637.17 examples/s]
+Filter: 28%|██▊ | 231000/818627 [00:26<01:07, 8653.23 examples/s]
+Filter: 28%|██▊ | 231000/818627 [00:25<01:07, 8650.76 examples/s]
+Filter: 28%|██▊ | 231000/818627 [00:25<01:07, 8650.18 examples/s]
+Filter: 28%|██▊ | 231000/818627 [00:25<01:07, 8649.54 examples/s]
+Filter: 28%|██▊ | 231000/818627 [00:25<01:07, 8647.84 examples/s]
+Filter: 28%|██▊ | 232000/818627 [00:25<01:07, 8663.34 examples/s]
+Filter: 28%|██▊ | 232000/818627 [00:25<01:07, 8663.95 examples/s]
+Filter: 28%|██▊ | 232000/818627 [00:25<01:07, 8658.79 examples/s]
+Filter: 28%|██▊ | 232000/818627 [00:26<01:07, 8668.09 examples/s]
+Filter: 28%|██▊ | 232000/818627 [00:25<01:07, 8665.55 examples/s]
+Filter: 28%|██▊ | 232000/818627 [00:25<01:07, 8663.57 examples/s]
+Filter: 28%|██▊ | 232000/818627 [00:26<01:07, 8662.58 examples/s]
+Filter: 28%|██▊ | 232000/818627 [00:25<01:07, 8663.42 examples/s]
+Filter: 28%|██▊ | 233000/818627 [00:26<01:07, 8614.02 examples/s]
+Filter: 28%|██▊ | 233000/818627 [00:26<01:08, 8611.85 examples/s]
+Filter: 28%|██▊ | 233000/818627 [00:26<01:07, 8619.78 examples/s]
+Filter: 28%|██▊ | 233000/818627 [00:26<01:08, 8608.29 examples/s]
+Filter: 28%|██▊ | 233000/818627 [00:26<01:07, 8618.02 examples/s]
+Filter: 28%|██▊ | 233000/818627 [00:26<01:07, 8615.43 examples/s]
+Filter: 28%|██▊ | 233000/818627 [00:26<01:07, 8614.78 examples/s]
+Filter: 28%|██▊ | 233000/818627 [00:26<01:07, 8615.48 examples/s]
+Filter: 29%|██▊ | 234000/818627 [00:26<01:08, 8572.55 examples/s]
+Filter: 29%|██▊ | 234000/818627 [00:26<01:08, 8572.25 examples/s]
+Filter: 29%|██▊ | 234000/818627 [00:26<01:08, 8567.76 examples/s]
+Filter: 29%|██▊ | 234000/818627 [00:26<01:08, 8573.20 examples/s]
+Filter: 29%|██▊ | 234000/818627 [00:26<01:08, 8573.75 examples/s]
+Filter: 29%|██▊ | 234000/818627 [00:26<01:08, 8571.04 examples/s]
+Filter: 29%|██▊ | 234000/818627 [00:26<01:08, 8570.12 examples/s]
+Filter: 29%|██▊ | 234000/818627 [00:26<01:08, 8570.43 examples/s]
+Filter: 29%|██▊ | 235000/818627 [00:26<01:07, 8597.75 examples/s]
+Filter: 29%|██▊ | 235000/818627 [00:26<01:07, 8597.85 examples/s]
+Filter: 29%|██▊ | 235000/818627 [00:26<01:07, 8595.76 examples/s]
+Filter: 29%|██▊ | 235000/818627 [00:26<01:07, 8596.97 examples/s]
+Filter: 29%|██▊ | 235000/818627 [00:26<01:07, 8596.86 examples/s]
+Filter: 29%|██▊ | 235000/818627 [00:26<01:07, 8594.15 examples/s]
+Filter: 29%|██▊ | 235000/818627 [00:26<01:07, 8589.09 examples/s]
+Filter: 29%|██▊ | 235000/818627 [00:26<01:07, 8590.77 examples/s]
+Filter: 29%|██▉ | 236000/818627 [00:26<01:05, 8954.11 examples/s]
+Filter: 29%|██▉ | 236000/818627 [00:26<01:05, 8954.99 examples/s]
+Filter: 29%|██▉ | 236000/818627 [00:26<01:05, 8956.80 examples/s]
+Filter: 29%|██▉ | 236000/818627 [00:26<01:05, 8961.96 examples/s]
+Filter: 29%|██▉ | 236000/818627 [00:26<01:05, 8957.72 examples/s]
+Filter: 29%|██▉ | 236000/818627 [00:26<01:05, 8960.14 examples/s]
+Filter: 29%|██▉ | 236000/818627 [00:26<01:05, 8954.00 examples/s]
+Filter: 29%|██▉ | 236000/818627 [00:26<01:05, 8955.79 examples/s]
+Filter: 29%|██▉ | 237000/818627 [00:26<01:04, 9024.27 examples/s]
+Filter: 29%|██▉ | 237000/818627 [00:26<01:04, 9027.01 examples/s]
+Filter: 29%|██▉ | 237000/818627 [00:26<01:04, 9022.95 examples/s]
+Filter: 29%|██▉ | 237000/818627 [00:26<01:04, 9027.59 examples/s]
+Filter: 29%|██▉ | 237000/818627 [00:26<01:04, 9023.76 examples/s]
+Filter: 29%|██▉ | 237000/818627 [00:26<01:04, 9024.41 examples/s]
+Filter: 29%|██▉ | 237000/818627 [00:26<01:04, 9025.15 examples/s]
+Filter: 29%|██▉ | 237000/818627 [00:26<01:04, 9026.89 examples/s]
+Filter: 29%|██▉ | 238000/818627 [00:26<01:05, 8823.37 examples/s]
+Filter: 29%|██▉ | 238000/818627 [00:26<01:05, 8822.30 examples/s]
+Filter: 29%|██▉ | 238000/818627 [00:26<01:05, 8821.20 examples/s]
+Filter: 29%|██▉ | 238000/818627 [00:26<01:05, 8822.16 examples/s]
+Filter: 29%|██▉ | 238000/818627 [00:26<01:05, 8819.86 examples/s]
+Filter: 29%|██▉ | 238000/818627 [00:26<01:05, 8821.61 examples/s]
+Filter: 29%|██▉ | 238000/818627 [00:26<01:05, 8822.61 examples/s]
+Filter: 29%|██▉ | 238000/818627 [00:26<01:05, 8821.69 examples/s]
+Filter: 29%|██▉ | 239000/818627 [00:26<01:06, 8727.37 examples/s]
+Filter: 29%|██▉ | 239000/818627 [00:26<01:06, 8727.91 examples/s]
+Filter: 29%|██▉ | 239000/818627 [00:26<01:06, 8727.94 examples/s]
+Filter: 29%|██▉ | 239000/818627 [00:27<01:06, 8726.45 examples/s]
+Filter: 29%|██▉ | 239000/818627 [00:26<01:06, 8726.81 examples/s]
+Filter: 29%|██▉ | 239000/818627 [00:26<01:06, 8724.82 examples/s]
+Filter: 29%|██▉ | 239000/818627 [00:26<01:06, 8727.66 examples/s]
+Filter: 29%|██▉ | 239000/818627 [00:26<01:06, 8728.02 examples/s]
+Filter: 29%|██▉ | 240000/818627 [00:26<01:06, 8695.23 examples/s]
+Filter: 29%|██▉ | 240000/818627 [00:26<01:06, 8696.08 examples/s]
+Filter: 29%|██▉ | 240000/818627 [00:26<01:06, 8696.25 examples/s]
+Filter: 29%|██▉ | 240000/818627 [00:27<01:06, 8696.21 examples/s]
+Filter: 29%|██▉ | 240000/818627 [00:26<01:06, 8696.23 examples/s]
+Filter: 29%|██▉ | 240000/818627 [00:26<01:06, 8693.43 examples/s]
+Filter: 29%|██▉ | 240000/818627 [00:26<01:06, 8693.64 examples/s]
+Filter: 29%|██▉ | 240000/818627 [00:26<01:06, 8692.92 examples/s]
+Filter: 29%|██▉ | 241000/818627 [00:26<01:06, 8641.75 examples/s]
+Filter: 29%|██▉ | 241000/818627 [00:26<01:06, 8640.34 examples/s]
+Filter: 29%|██▉ | 241000/818627 [00:26<01:06, 8637.37 examples/s]
+Filter: 29%|██▉ | 241000/818627 [00:26<01:06, 8642.32 examples/s]
+Filter: 29%|██▉ | 241000/818627 [00:27<01:06, 8635.94 examples/s]
+Filter: 29%|██▉ | 241000/818627 [00:27<01:06, 8636.39 examples/s]
+Filter: 29%|██▉ | 241000/818627 [00:26<01:06, 8640.04 examples/s]
+Filter: 29%|██▉ | 241000/818627 [00:26<01:07, 8569.58 examples/s]
+Filter: 30%|██▉ | 242000/818627 [00:27<01:06, 8626.08 examples/s]
+Filter: 30%|██▉ | 242000/818627 [00:27<01:06, 8622.37 examples/s]
+Filter: 30%|██▉ | 242000/818627 [00:27<01:06, 8627.76 examples/s]
+Filter: 30%|██▉ | 242000/818627 [00:27<01:06, 8625.46 examples/s]
+Filter: 30%|██▉ | 242000/818627 [00:27<01:06, 8624.97 examples/s]
+Filter: 30%|██▉ | 242000/818627 [00:27<01:06, 8644.21 examples/s]
+Filter: 30%|██▉ | 242000/818627 [00:27<01:06, 8625.41 examples/s]
+Filter: 30%|██▉ | 242000/818627 [00:27<01:07, 8603.79 examples/s]
+Filter: 30%|██▉ | 243000/818627 [00:27<01:07, 8573.66 examples/s]
+Filter: 30%|██▉ | 243000/818627 [00:27<01:07, 8566.43 examples/s]
+Filter: 30%|██▉ | 243000/818627 [00:27<01:07, 8570.82 examples/s]
+Filter: 30%|██▉ | 243000/818627 [00:27<01:07, 8551.92 examples/s]
+Filter: 30%|██▉ | 243000/818627 [00:27<01:07, 8567.69 examples/s]
+Filter: 30%|██▉ | 243000/818627 [00:27<01:07, 8580.89 examples/s]
+Filter: 30%|██▉ | 243000/818627 [00:27<01:07, 8566.47 examples/s]
+Filter: 30%|██▉ | 243000/818627 [00:27<01:07, 8567.57 examples/s]
+Filter: 30%|██▉ | 244000/818627 [00:27<01:07, 8553.63 examples/s]
+Filter: 30%|██▉ | 244000/818627 [00:27<01:07, 8546.81 examples/s]
+Filter: 30%|██▉ | 244000/818627 [00:27<01:07, 8549.38 examples/s]
+Filter: 30%|██▉ | 244000/818627 [00:27<01:07, 8544.27 examples/s]
+Filter: 30%|██▉ | 244000/818627 [00:27<01:07, 8556.20 examples/s]
+Filter: 30%|██▉ | 244000/818627 [00:27<01:07, 8545.53 examples/s]
+Filter: 30%|██▉ | 244000/818627 [00:27<01:07, 8543.29 examples/s]
+Filter: 30%|██▉ | 244000/818627 [00:27<01:07, 8544.66 examples/s]
+Filter: 30%|██▉ | 245000/818627 [00:27<01:05, 8707.79 examples/s]
+Filter: 30%|██▉ | 245000/818627 [00:27<01:05, 8705.30 examples/s]
+Filter: 30%|██▉ | 245000/818627 [00:27<01:05, 8704.86 examples/s]
+Filter: 30%|██▉ | 245000/818627 [00:27<01:05, 8705.60 examples/s]
+Filter: 30%|██▉ | 245000/818627 [00:27<01:05, 8707.82 examples/s]
+Filter: 30%|██▉ | 245000/818627 [00:27<01:05, 8704.13 examples/s]
+Filter: 30%|██▉ | 245000/818627 [00:27<01:05, 8699.33 examples/s]
+Filter: 30%|██▉ | 245000/818627 [00:27<01:05, 8698.39 examples/s]
+Filter: 30%|███ | 246000/818627 [00:27<01:05, 8688.22 examples/s]
+Filter: 30%|███ | 246000/818627 [00:27<01:05, 8686.73 examples/s]
+Filter: 30%|███ | 246000/818627 [00:27<01:05, 8683.87 examples/s]
+Filter: 30%|███ | 246000/818627 [00:27<01:05, 8685.27 examples/s]
+Filter: 30%|███ | 246000/818627 [00:27<01:05, 8687.81 examples/s]
+Filter: 30%|███ | 246000/818627 [00:27<01:05, 8685.75 examples/s]
+Filter: 30%|███ | 246000/818627 [00:27<01:05, 8689.11 examples/s]
+Filter: 30%|███ | 246000/818627 [00:27<01:05, 8686.11 examples/s]
+Filter: 30%|███ | 247000/818627 [00:27<01:06, 8606.08 examples/s]
+Filter: 30%|███ | 247000/818627 [00:27<01:06, 8605.15 examples/s]
+Filter: 30%|███ | 247000/818627 [00:27<01:06, 8603.79 examples/s]
+Filter: 30%|███ | 247000/818627 [00:28<01:06, 8601.21 examples/s]
+Filter: 30%|███ | 247000/818627 [00:27<01:06, 8606.31 examples/s]
+Filter: 30%|███ | 247000/818627 [00:27<01:06, 8604.77 examples/s]
+Filter: 30%|███ | 247000/818627 [00:27<01:06, 8608.24 examples/s]
+Filter: 30%|███ | 247000/818627 [00:27<01:06, 8601.00 examples/s]
+Filter: 30%|███ | 248000/818627 [00:27<01:06, 8604.79 examples/s]
+Filter: 30%|███ | 248000/818627 [00:27<01:06, 8607.08 examples/s]
+Filter: 30%|███ | 248000/818627 [00:27<01:06, 8601.60 examples/s]
+Filter: 30%|███ | 248000/818627 [00:28<01:06, 8606.90 examples/s]
+Filter: 30%|███ | 248000/818627 [00:27<01:06, 8609.30 examples/s]
+Filter: 30%|███ | 248000/818627 [00:27<01:06, 8607.65 examples/s]
+Filter: 30%|███ | 248000/818627 [00:27<01:06, 8601.23 examples/s]
+Filter: 30%|███ | 248000/818627 [00:27<01:06, 8603.40 examples/s]
+Filter: 30%|███ | 249000/818627 [00:27<01:06, 8549.37 examples/s]
+Filter: 30%|███ | 249000/818627 [00:27<01:06, 8548.82 examples/s]
+Filter: 30%|███ | 249000/818627 [00:27<01:06, 8549.51 examples/s]
+Filter: 30%|███ | 249000/818627 [00:28<01:06, 8548.96 examples/s]
+Filter: 30%|███ | 249000/818627 [00:27<01:06, 8550.35 examples/s]
+Filter: 30%|███ | 249000/818627 [00:27<01:06, 8547.80 examples/s]
+Filter: 30%|███ | 249000/818627 [00:27<01:06, 8547.55 examples/s]
+Filter: 30%|███ | 249000/818627 [00:28<01:06, 8541.39 examples/s]
+Filter: 31%|███ | 250000/818627 [00:28<01:03, 8899.04 examples/s]
+Filter: 31%|███ | 250000/818627 [00:28<01:03, 8898.64 examples/s]
+Filter: 31%|███ | 250000/818627 [00:28<01:03, 8897.14 examples/s]
+Filter: 31%|███ | 250000/818627 [00:28<01:03, 8898.97 examples/s]
+Filter: 31%|███ | 250000/818627 [00:28<01:03, 8899.86 examples/s]
+Filter: 31%|███ | 250000/818627 [00:28<01:03, 8899.84 examples/s]
+Filter: 31%|███ | 250000/818627 [00:28<01:03, 8898.86 examples/s]
+Filter: 31%|███ | 250000/818627 [00:28<01:03, 8899.43 examples/s]
+Filter: 31%|███ | 251000/818627 [00:28<01:03, 8924.77 examples/s]
+Filter: 31%|███ | 251000/818627 [00:28<01:03, 8920.09 examples/s]
+Filter: 31%|███ | 251000/818627 [00:28<01:03, 8924.21 examples/s]
+Filter: 31%|███ | 251000/818627 [00:28<01:03, 8923.26 examples/s]
+Filter: 31%|███ | 251000/818627 [00:28<01:03, 8925.17 examples/s]
+Filter: 31%|███ | 251000/818627 [00:28<01:03, 8926.30 examples/s]
+Filter: 31%|███ | 251000/818627 [00:28<01:03, 8925.70 examples/s]
+Filter: 31%|███ | 251000/818627 [00:28<01:03, 8924.70 examples/s]
+Filter: 31%|███ | 252000/818627 [00:28<01:04, 8783.67 examples/s]
+Filter: 31%|███ | 252000/818627 [00:28<01:04, 8783.66 examples/s]
+Filter: 31%|███ | 252000/818627 [00:28<01:04, 8785.77 examples/s]
+Filter: 31%|███ | 252000/818627 [00:28<01:04, 8775.48 examples/s]
+Filter: 31%|███ | 252000/818627 [00:28<01:04, 8783.76 examples/s]
+Filter: 31%|███ | 252000/818627 [00:28<01:04, 8781.03 examples/s]
+Filter: 31%|███ | 252000/818627 [00:28<01:04, 8784.94 examples/s]
+Filter: 31%|███ | 252000/818627 [00:28<01:04, 8780.59 examples/s]
+Filter: 31%|███ | 253000/818627 [00:28<01:04, 8746.02 examples/s]
+Filter: 31%|███ | 253000/818627 [00:28<01:04, 8741.01 examples/s]
+Filter: 31%|███ | 253000/818627 [00:28<01:04, 8734.45 examples/s]
+Filter: 31%|███ | 253000/818627 [00:28<01:04, 8737.41 examples/s]
+Filter: 31%|███ | 253000/818627 [00:28<01:04, 8738.61 examples/s]
+Filter: 31%|███ | 253000/818627 [00:28<01:04, 8739.98 examples/s]
+Filter: 31%|███ | 253000/818627 [00:28<01:04, 8736.89 examples/s]
+Filter: 31%|███ | 253000/818627 [00:28<01:04, 8737.75 examples/s]
+Filter: 31%|███ | 254000/818627 [00:28<01:04, 8721.22 examples/s]
+Filter: 31%|███ | 254000/818627 [00:28<01:04, 8719.34 examples/s]
+Filter: 31%|███ | 254000/818627 [00:28<01:04, 8719.12 examples/s]
+Filter: 31%|███ | 254000/818627 [00:28<01:04, 8713.33 examples/s]
+Filter: 31%|███ | 254000/818627 [00:28<01:04, 8710.95 examples/s]
+Filter: 31%|███ | 254000/818627 [00:28<01:04, 8711.04 examples/s]
+Filter: 31%|███ | 254000/818627 [00:28<01:04, 8707.66 examples/s]
+Filter: 31%|███ | 254000/818627 [00:28<01:05, 8559.31 examples/s]
+Filter: 31%|███ | 255000/818627 [00:28<01:04, 8766.26 examples/s]
+Filter: 31%|███ | 255000/818627 [00:28<01:04, 8674.55 examples/s]
+Filter: 31%|███ | 255000/818627 [00:28<01:04, 8692.88 examples/s]
+Filter: 31%|███ | 255000/818627 [00:28<01:04, 8690.93 examples/s]
+Filter: 31%|███ | 255000/818627 [00:28<01:05, 8671.14 examples/s]
+Filter: 31%|███ | 255000/818627 [00:28<01:05, 8651.18 examples/s]
+Filter: 31%|███ | 255000/818627 [00:28<01:05, 8665.25 examples/s]
+Filter: 31%|███ | 255000/818627 [00:28<01:05, 8644.35 examples/s]
+Filter: 31%|███▏ | 256000/818627 [00:28<01:06, 8460.40 examples/s]
+Filter: 31%|███▏ | 256000/818627 [00:28<01:06, 8466.24 examples/s]
+Filter: 31%|███▏ | 256000/818627 [00:28<01:06, 8480.28 examples/s]
+Filter: 31%|███▏ | 256000/818627 [00:28<01:06, 8459.17 examples/s]
+Filter: 31%|███▏ | 256000/818627 [00:28<01:06, 8467.73 examples/s]
+Filter: 31%|███▏ | 256000/818627 [00:28<01:06, 8453.84 examples/s]
+Filter: 31%|███▏ | 256000/818627 [00:28<01:06, 8463.22 examples/s]
+Filter: 31%|███▏ | 256000/818627 [00:29<01:06, 8423.59 examples/s]
+Filter: 31%|███▏ | 257000/818627 [00:28<01:05, 8535.01 examples/s]
+Filter: 31%|███▏ | 257000/818627 [00:28<01:05, 8526.79 examples/s]
+Filter: 31%|███▏ | 257000/818627 [00:28<01:05, 8542.81 examples/s]
+Filter: 31%|███▏ | 257000/818627 [00:29<01:05, 8539.62 examples/s]
+Filter: 31%|███▏ | 257000/818627 [00:28<01:05, 8539.51 examples/s]
+Filter: 31%|███▏ | 257000/818627 [00:28<01:05, 8525.79 examples/s]
+Filter: 31%|███▏ | 257000/818627 [00:28<01:05, 8528.32 examples/s]
+Filter: 31%|███▏ | 257000/818627 [00:28<01:05, 8531.42 examples/s]
+Filter: 32%|███▏ | 258000/818627 [00:28<01:05, 8551.19 examples/s]
+Filter: 32%|███▏ | 258000/818627 [00:28<01:05, 8545.11 examples/s]
+Filter: 32%|███▏ | 258000/818627 [00:28<01:05, 8555.88 examples/s]
+Filter: 32%|███▏ | 258000/818627 [00:29<01:05, 8553.51 examples/s]
+Filter: 32%|███▏ | 258000/818627 [00:29<01:05, 8546.46 examples/s]
+Filter: 32%|███▏ | 258000/818627 [00:28<01:05, 8547.33 examples/s]
+Filter: 32%|███▏ | 258000/818627 [00:28<01:05, 8549.96 examples/s]
+Filter: 32%|███▏ | 258000/818627 [00:28<01:05, 8548.12 examples/s]
+Filter: 32%|███▏ | 259000/818627 [00:29<01:02, 8923.54 examples/s]
+Filter: 32%|███▏ | 259000/818627 [00:29<01:02, 8919.05 examples/s]
+Filter: 32%|███▏ | 259000/818627 [00:29<01:02, 8926.68 examples/s]
+Filter: 32%|███▏ | 259000/818627 [00:29<01:02, 8922.51 examples/s]
+Filter: 32%|███▏ | 259000/818627 [00:29<01:02, 8927.71 examples/s]
+Filter: 32%|███▏ | 259000/818627 [00:29<01:02, 8920.95 examples/s]
+Filter: 32%|███▏ | 259000/818627 [00:29<01:02, 8918.15 examples/s]
+Filter: 32%|███▏ | 259000/818627 [00:29<01:02, 8923.30 examples/s]
+Filter: 32%|███▏ | 260000/818627 [00:29<01:02, 8932.79 examples/s]
+Filter: 32%|███▏ | 260000/818627 [00:29<01:02, 8930.12 examples/s]
+Filter: 32%|███▏ | 260000/818627 [00:29<01:02, 8936.51 examples/s]
+Filter: 32%|███▏ | 260000/818627 [00:29<01:02, 8935.69 examples/s]
+Filter: 32%|███▏ | 260000/818627 [00:29<01:02, 8934.17 examples/s]
+Filter: 32%|███▏ | 260000/818627 [00:29<01:02, 8932.09 examples/s]
+Filter: 32%|███▏ | 260000/818627 [00:29<01:02, 8930.75 examples/s]
+Filter: 32%|███▏ | 260000/818627 [00:29<01:02, 8927.97 examples/s]
+Filter: 32%|███▏ | 261000/818627 [00:29<01:01, 9016.58 examples/s]
+Filter: 32%|███▏ | 261000/818627 [00:29<01:01, 9012.06 examples/s]
+Filter: 32%|███▏ | 261000/818627 [00:29<01:01, 9015.87 examples/s]
+Filter: 32%|███▏ | 261000/818627 [00:29<01:01, 9010.03 examples/s]
+Filter: 32%|███▏ | 261000/818627 [00:29<01:01, 9010.93 examples/s]
+Filter: 32%|███▏ | 261000/818627 [00:29<01:01, 9014.68 examples/s]
+Filter: 32%|███▏ | 261000/818627 [00:29<01:01, 9010.15 examples/s]
+Filter: 32%|███▏ | 261000/818627 [00:29<01:01, 9014.35 examples/s]
+Filter: 32%|███▏ | 262000/818627 [00:29<01:02, 8886.32 examples/s]
+Filter: 32%|███▏ | 262000/818627 [00:29<01:02, 8884.50 examples/s]
+Filter: 32%|███▏ | 262000/818627 [00:29<01:02, 8888.46 examples/s]
+Filter: 32%|███▏ | 262000/818627 [00:29<01:02, 8887.20 examples/s]
+Filter: 32%|███▏ | 262000/818627 [00:29<01:02, 8885.17 examples/s]
+Filter: 32%|███▏ | 262000/818627 [00:29<01:02, 8884.50 examples/s]
+Filter: 32%|███▏ | 262000/818627 [00:29<01:02, 8885.93 examples/s]
+Filter: 32%|███▏ | 262000/818627 [00:29<01:02, 8887.80 examples/s]
+Filter: 32%|███▏ | 263000/818627 [00:29<01:03, 8817.91 examples/s]
+Filter: 32%|███▏ | 263000/818627 [00:29<01:02, 8821.78 examples/s]
+Filter: 32%|███▏ | 263000/818627 [00:29<01:03, 8812.22 examples/s]
+Filter: 32%|███▏ | 263000/818627 [00:29<01:03, 8819.05 examples/s]
+Filter: 32%|███▏ | 263000/818627 [00:29<01:03, 8812.63 examples/s]
+Filter: 32%|███▏ | 263000/818627 [00:29<01:02, 8820.06 examples/s]
+Filter: 32%|███▏ | 263000/818627 [00:29<01:03, 8816.91 examples/s]
+Filter: 32%|███▏ | 263000/818627 [00:29<01:03, 8819.21 examples/s]
+Filter: 32%|███▏ | 264000/818627 [00:29<01:02, 8825.22 examples/s]
+Filter: 32%|███▏ | 264000/818627 [00:29<01:02, 8827.98 examples/s]
+Filter: 32%|███▏ | 264000/818627 [00:29<01:02, 8827.41 examples/s]
+Filter: 32%|███▏ | 264000/818627 [00:29<01:02, 8828.92 examples/s]
+Filter: 32%|███▏ | 264000/818627 [00:29<01:02, 8825.22 examples/s]
+Filter: 32%|███▏ | 264000/818627 [00:29<01:02, 8824.39 examples/s]
+Filter: 32%|███▏ | 264000/818627 [00:29<01:02, 8825.13 examples/s]
+Filter: 32%|███▏ | 264000/818627 [00:29<01:02, 8825.66 examples/s]
+Filter: 32%|███▏ | 265000/818627 [00:29<01:02, 8790.17 examples/s]
+Filter: 32%|███▏ | 265000/818627 [00:29<01:02, 8792.15 examples/s]
+Filter: 32%|███▏ | 265000/818627 [00:30<01:02, 8795.19 examples/s]
+Filter: 32%|███▏ | 265000/818627 [00:29<01:03, 8783.53 examples/s]
+Filter: 32%|███▏ | 265000/818627 [00:29<01:02, 8791.66 examples/s]
+Filter: 32%|███▏ | 265000/818627 [00:29<01:02, 8788.47 examples/s]
+Filter: 32%|███▏ | 265000/818627 [00:29<01:02, 8788.09 examples/s]
+Filter: 32%|███▏ | 265000/818627 [00:29<01:02, 8790.65 examples/s]
+Filter: 32%|███▏ | 266000/818627 [00:29<01:00, 9114.12 examples/s]
+Filter: 32%|███▏ | 266000/818627 [00:29<01:00, 9116.56 examples/s]
+Filter: 32%|███▏ | 266000/818627 [00:30<01:00, 9115.89 examples/s]
+Filter: 32%|███▏ | 266000/818627 [00:29<01:00, 9115.16 examples/s]
+Filter: 32%|███▏ | 266000/818627 [00:29<01:00, 9115.31 examples/s]
+Filter: 32%|███▏ | 266000/818627 [00:29<01:00, 9114.61 examples/s]
+Filter: 32%|███▏ | 266000/818627 [00:29<01:00, 9112.44 examples/s]
+Filter: 33%|███▎ | 267000/818627 [00:29<01:00, 9119.21 examples/s]
+Filter: 33%|███▎ | 267000/818627 [00:29<01:00, 9114.56 examples/s]
+Filter: 33%|███▎ | 267000/818627 [00:29<01:00, 9118.66 examples/s]
+Filter: 33%|███▎ | 267000/818627 [00:30<01:00, 9115.20 examples/s]
+Filter: 33%|███▎ | 267000/818627 [00:30<01:00, 9116.36 examples/s]
+Filter: 33%|███▎ | 267000/818627 [00:29<01:00, 9114.97 examples/s]
+Filter: 33%|███▎ | 267000/818627 [00:29<01:00, 9116.32 examples/s]
+Filter: 33%|███▎ | 267000/818627 [00:29<01:00, 9107.55 examples/s]
+Filter: 33%|███▎ | 268000/818627 [00:30<01:01, 8947.56 examples/s]
+Filter: 33%|███▎ | 268000/818627 [00:30<01:01, 8947.44 examples/s]
+Filter: 33%|███▎ | 268000/818627 [00:30<01:01, 8978.62 examples/s]
+Filter: 33%|███▎ | 268000/818627 [00:30<01:01, 8948.16 examples/s]
+Filter: 33%|███▎ | 268000/818627 [00:30<01:01, 8945.82 examples/s]
+Filter: 33%|███▎ | 268000/818627 [00:30<01:01, 8944.38 examples/s]
+Filter: 33%|███▎ | 268000/818627 [00:30<01:01, 8946.71 examples/s]
+Filter: 33%|███▎ | 268000/818627 [00:30<01:01, 8942.98 examples/s]
+Filter: 33%|███▎ | 269000/818627 [00:30<01:02, 8860.39 examples/s]
+Filter: 33%|███▎ | 269000/818627 [00:30<01:02, 8860.57 examples/s]
+Filter: 33%|███▎ | 269000/818627 [00:30<01:02, 8864.14 examples/s]
+Filter: 33%|███▎ | 269000/818627 [00:30<01:01, 8894.13 examples/s]
+Filter: 33%|███▎ | 269000/818627 [00:30<01:02, 8857.07 examples/s]
+Filter: 33%|███▎ | 269000/818627 [00:30<01:02, 8860.42 examples/s]
+Filter: 33%|███▎ | 269000/818627 [00:30<01:02, 8855.37 examples/s]
+Filter: 33%|███▎ | 269000/818627 [00:30<01:02, 8796.91 examples/s]
+Filter: 33%|███▎ | 270000/818627 [00:30<01:02, 8814.03 examples/s]
+Filter: 33%|███▎ | 270000/818627 [00:30<01:02, 8812.47 examples/s]
+Filter: 33%|███▎ | 270000/818627 [00:30<01:02, 8814.43 examples/s]
+Filter: 33%|███▎ | 270000/818627 [00:30<01:02, 8792.17 examples/s]
+Filter: 33%|███▎ | 270000/818627 [00:30<01:02, 8822.94 examples/s]
+Filter: 33%|███▎ | 270000/818627 [00:30<01:02, 8792.80 examples/s]
+Filter: 33%|███▎ | 270000/818627 [00:30<01:02, 8824.47 examples/s]
+Filter: 33%|███▎ | 270000/818627 [00:30<01:02, 8801.16 examples/s]
+Filter: 33%|███▎ | 271000/818627 [00:30<01:02, 8771.76 examples/s]
+Filter: 33%|███▎ | 271000/818627 [00:30<01:02, 8778.27 examples/s]
+Filter: 33%|███▎ | 271000/818627 [00:30<01:02, 8798.88 examples/s]
+Filter: 33%|███▎ | 271000/818627 [00:30<01:02, 8790.96 examples/s]
+Filter: 33%|███▎ | 271000/818627 [00:30<01:02, 8769.17 examples/s]
+Filter: 33%|███▎ | 271000/818627 [00:30<01:02, 8771.34 examples/s]
+Filter: 33%|███▎ | 271000/818627 [00:30<01:02, 8763.41 examples/s]
+Filter: 33%|███▎ | 271000/818627 [00:30<01:02, 8740.42 examples/s]
+Filter: 33%|███▎ | 272000/818627 [00:30<01:02, 8714.43 examples/s]
+Filter: 33%|███▎ | 272000/818627 [00:30<01:02, 8723.62 examples/s]
+Filter: 33%|███▎ | 272000/818627 [00:30<01:02, 8712.79 examples/s]
+Filter: 33%|███▎ | 272000/818627 [00:30<01:02, 8694.08 examples/s]
+Filter: 33%|███▎ | 272000/818627 [00:30<01:02, 8711.16 examples/s]
+Filter: 33%|███▎ | 272000/818627 [00:30<01:02, 8718.48 examples/s]
+Filter: 33%|███▎ | 272000/818627 [00:30<01:02, 8682.28 examples/s]
+Filter: 33%|███▎ | 272000/818627 [00:30<01:03, 8666.75 examples/s]
+Filter: 33%|███▎ | 273000/818627 [00:30<01:00, 9034.98 examples/s]
+Filter: 33%|███▎ | 273000/818627 [00:30<01:00, 9029.95 examples/s]
+Filter: 33%|███▎ | 273000/818627 [00:30<01:00, 9039.63 examples/s]
+Filter: 33%|███▎ | 273000/818627 [00:30<01:00, 9037.23 examples/s]
+Filter: 33%|███▎ | 273000/818627 [00:30<01:00, 9030.48 examples/s]
+Filter: 33%|███▎ | 273000/818627 [00:30<01:00, 9027.29 examples/s]
+Filter: 33%|███▎ | 274000/818627 [00:30<01:00, 9020.61 examples/s]
+Filter: 33%|███▎ | 274000/818627 [00:30<01:00, 9019.86 examples/s]
+Filter: 33%|███▎ | 274000/818627 [00:30<01:00, 9024.98 examples/s]
+Filter: 33%|███▎ | 274000/818627 [00:31<01:00, 9019.77 examples/s]
+Filter: 33%|███▎ | 274000/818627 [00:30<01:00, 9018.49 examples/s]
+Filter: 33%|███▎ | 274000/818627 [00:30<01:00, 9037.03 examples/s]
+Filter: 33%|███▎ | 274000/818627 [00:30<01:00, 9036.98 examples/s]
+Filter: 33%|███▎ | 274000/818627 [00:30<01:00, 9014.61 examples/s]
+Filter: 34%|███▎ | 275000/818627 [00:30<01:01, 8874.33 examples/s]
+Filter: 34%|███▎ | 275000/818627 [00:30<01:01, 8878.21 examples/s]
+Filter: 34%|███▎ | 275000/818627 [00:31<01:01, 8875.72 examples/s]
+Filter: 34%|███▎ | 275000/818627 [00:30<01:01, 8862.54 examples/s]
+Filter: 34%|███▎ | 275000/818627 [00:30<01:01, 8909.84 examples/s]
+Filter: 34%|███▎ | 275000/818627 [00:30<01:01, 8867.93 examples/s]
+Filter: 34%|███▎ | 275000/818627 [00:30<01:01, 8909.09 examples/s]
+Filter: 34%|███▎ | 275000/818627 [00:30<01:01, 8869.89 examples/s]
+Filter: 34%|███▎ | 276000/818627 [00:30<01:01, 8804.83 examples/s]
+Filter: 34%|███▎ | 276000/818627 [00:30<01:01, 8800.24 examples/s]
+Filter: 34%|███▎ | 276000/818627 [00:31<01:01, 8805.01 examples/s]
+Filter: 34%|███▎ | 276000/818627 [00:30<01:01, 8800.08 examples/s]
+Filter: 34%|███▎ | 276000/818627 [00:31<01:01, 8800.85 examples/s]
+Filter: 34%|███▎ | 276000/818627 [00:30<01:01, 8838.96 examples/s]
+Filter: 34%|███▎ | 276000/818627 [00:30<01:01, 8804.47 examples/s]
+Filter: 34%|███▎ | 276000/818627 [00:30<01:01, 8836.23 examples/s]
+Filter: 34%|███▍ | 277000/818627 [00:31<01:01, 8762.77 examples/s]
+Filter: 34%|███▍ | 277000/818627 [00:31<01:01, 8759.43 examples/s]
+Filter: 34%|███▍ | 277000/818627 [00:31<01:01, 8760.97 examples/s]
+Filter: 34%|███▍ | 277000/818627 [00:31<01:01, 8761.89 examples/s]
+Filter: 34%|███▍ | 277000/818627 [00:31<01:01, 8792.72 examples/s]
+Filter: 34%|███▍ | 277000/818627 [00:31<01:01, 8761.84 examples/s]
+Filter: 34%|███▍ | 277000/818627 [00:31<01:01, 8786.41 examples/s]
+Filter: 34%|███▍ | 277000/818627 [00:31<01:01, 8753.81 examples/s]
+Filter: 34%|███▍ | 278000/818627 [00:31<01:02, 8698.59 examples/s]
+Filter: 34%|███▍ | 278000/818627 [00:31<01:02, 8695.24 examples/s]
+Filter: 34%|███▍ | 278000/818627 [00:31<01:02, 8703.04 examples/s]
+Filter: 34%|███▍ | 278000/818627 [00:31<01:02, 8697.22 examples/s]
+Filter: 34%|███▍ | 278000/818627 [00:31<01:01, 8727.12 examples/s]
+Filter: 34%|███▍ | 278000/818627 [00:31<01:02, 8698.12 examples/s]
+Filter: 34%|███▍ | 278000/818627 [00:31<01:01, 8721.75 examples/s]
+Filter: 34%|███▍ | 278000/818627 [00:31<01:02, 8695.76 examples/s]
+Filter: 34%|███▍ | 279000/818627 [00:31<01:02, 8699.01 examples/s]
+Filter: 34%|███▍ | 279000/818627 [00:31<01:02, 8699.80 examples/s]
+Filter: 34%|███▍ | 279000/818627 [00:31<01:02, 8692.04 examples/s]
+Filter: 34%|███▍ | 279000/818627 [00:31<01:02, 8696.55 examples/s]
+Filter: 34%|███▍ | 279000/818627 [00:31<01:02, 8702.56 examples/s]
+Filter: 34%|███▍ | 279000/818627 [00:31<01:01, 8718.45 examples/s]
+Filter: 34%|███▍ | 279000/818627 [00:31<01:01, 8717.05 examples/s]
+Filter: 34%|███▍ | 279000/818627 [00:31<01:02, 8701.17 examples/s]
+Filter: 34%|███▍ | 280000/818627 [00:31<01:01, 8791.23 examples/s]
+Filter: 34%|███▍ | 280000/818627 [00:31<01:01, 8788.21 examples/s]
+Filter: 34%|███▍ | 280000/818627 [00:31<01:01, 8788.52 examples/s]
+Filter: 34%|███▍ | 280000/818627 [00:31<01:01, 8791.21 examples/s]
+Filter: 34%|███▍ | 280000/818627 [00:31<01:01, 8801.61 examples/s]
+Filter: 34%|███▍ | 280000/818627 [00:31<01:01, 8799.87 examples/s]
+Filter: 34%|███▍ | 280000/818627 [00:31<01:01, 8787.98 examples/s]
+Filter: 34%|███▍ | 280000/818627 [00:31<01:01, 8773.85 examples/s]
+Filter: 34%|███▍ | 281000/818627 [00:31<01:00, 8932.25 examples/s]
+Filter: 34%|███▍ | 281000/818627 [00:31<01:00, 8927.25 examples/s]
+Filter: 34%|███▍ | 281000/818627 [00:31<01:00, 8929.41 examples/s]
+Filter: 34%|███▍ | 281000/818627 [00:31<01:00, 8932.29 examples/s]
+Filter: 34%|███▍ | 281000/818627 [00:31<01:00, 8929.56 examples/s]
+Filter: 34%|███▍ | 281000/818627 [00:31<01:00, 8928.98 examples/s]
+Filter: 34%|███▍ | 281000/818627 [00:31<01:00, 8923.60 examples/s]
+Filter: 34%|███▍ | 281000/818627 [00:31<01:00, 8923.75 examples/s]
+Filter: 34%|███▍ | 282000/818627 [00:31<01:00, 8870.36 examples/s]
+Filter: 34%|███▍ | 282000/818627 [00:31<01:00, 8867.09 examples/s]
+Filter: 34%|███▍ | 282000/818627 [00:31<01:00, 8871.27 examples/s]
+Filter: 34%|███▍ | 282000/818627 [00:31<01:00, 8873.13 examples/s]
+Filter: 34%|███▍ | 282000/818627 [00:31<01:00, 8875.04 examples/s]
+Filter: 34%|███▍ | 282000/818627 [00:31<01:00, 8872.78 examples/s]
+Filter: 34%|███▍ | 282000/818627 [00:31<01:00, 8867.82 examples/s]
+Filter: 34%|███▍ | 282000/818627 [00:31<01:00, 8866.96 examples/s]
+Filter: 35%|███▍ | 283000/818627 [00:31<01:00, 8849.32 examples/s]
+Filter: 35%|███▍ | 283000/818627 [00:31<01:00, 8848.69 examples/s]
+Filter: 35%|███▍ | 283000/818627 [00:31<01:00, 8851.96 examples/s]
+Filter: 35%|███▍ | 283000/818627 [00:32<01:00, 8849.46 examples/s]
+Filter: 35%|███▍ | 283000/818627 [00:31<01:00, 8852.49 examples/s]
+Filter: 35%|███▍ | 283000/818627 [00:31<01:00, 8853.52 examples/s]
+Filter: 35%|███▍ | 283000/818627 [00:31<01:00, 8850.97 examples/s]
+Filter: 35%|███▍ | 283000/818627 [00:31<01:00, 8848.68 examples/s]
+Filter: 35%|███▍ | 284000/818627 [00:31<01:01, 8756.30 examples/s]
+Filter: 35%|███▍ | 284000/818627 [00:31<01:01, 8762.20 examples/s]
+Filter: 35%|███▍ | 284000/818627 [00:31<01:01, 8757.29 examples/s]
+Filter: 35%|███▍ | 284000/818627 [00:32<01:00, 8765.75 examples/s]
+Filter: 35%|███▍ | 284000/818627 [00:31<01:01, 8763.24 examples/s]
+Filter: 35%|███▍ | 284000/818627 [00:31<01:01, 8758.82 examples/s]
+Filter: 35%|███▍ | 284000/818627 [00:31<01:01, 8757.71 examples/s]
+Filter: 35%|███▍ | 284000/818627 [00:31<01:01, 8661.50 examples/s]
+Filter: 35%|███▍ | 285000/818627 [00:31<01:00, 8767.25 examples/s]
+Filter: 35%|███▍ | 285000/818627 [00:31<01:00, 8765.71 examples/s]
+Filter: 35%|███▍ | 285000/818627 [00:31<01:00, 8766.91 examples/s]
+Filter: 35%|███▍ | 285000/818627 [00:32<01:00, 8765.64 examples/s]
+Filter: 35%|███▍ | 285000/818627 [00:31<01:00, 8771.27 examples/s]
+Filter: 35%|███▍ | 285000/818627 [00:31<01:00, 8768.17 examples/s]
+Filter: 35%|███▍ | 285000/818627 [00:32<01:00, 8792.89 examples/s]
+Filter: 35%|███▍ | 285000/818627 [00:31<01:00, 8764.34 examples/s]
+Filter: 35%|███▍ | 286000/818627 [00:32<01:00, 8778.19 examples/s]
+Filter: 35%|███▍ | 286000/818627 [00:32<01:00, 8777.37 examples/s]
+Filter: 35%|███▍ | 286000/818627 [00:32<01:00, 8779.59 examples/s]
+Filter: 35%|███▍ | 286000/818627 [00:32<01:00, 8778.22 examples/s]
+Filter: 35%|███▍ | 286000/818627 [00:32<01:00, 8801.69 examples/s]
+Filter: 35%|███▍ | 286000/818627 [00:32<01:00, 8781.10 examples/s]
+Filter: 35%|███▍ | 286000/818627 [00:32<01:00, 8779.15 examples/s]
+Filter: 35%|███▍ | 286000/818627 [00:32<01:00, 8779.43 examples/s]
+Filter: 35%|███▌ | 287000/818627 [00:32<01:00, 8769.80 examples/s]
+Filter: 35%|███▌ | 287000/818627 [00:32<01:00, 8769.98 examples/s]
+Filter: 35%|███▌ | 287000/818627 [00:32<01:00, 8770.64 examples/s]
+Filter: 35%|███▌ | 287000/818627 [00:32<01:00, 8768.47 examples/s]
+Filter: 35%|███▌ | 287000/818627 [00:32<01:00, 8784.28 examples/s]
+Filter: 35%|███▌ | 287000/818627 [00:32<01:00, 8768.22 examples/s]
+Filter: 35%|███▌ | 287000/818627 [00:32<01:00, 8768.45 examples/s]
+Filter: 35%|███▌ | 287000/818627 [00:32<01:00, 8769.72 examples/s]
+Filter: 35%|███▌ | 288000/818627 [00:32<00:59, 8852.84 examples/s]
+Filter: 35%|███▌ | 288000/818627 [00:32<00:59, 8851.55 examples/s]
+Filter: 35%|███▌ | 288000/818627 [00:32<00:59, 8847.20 examples/s]
+Filter: 35%|███▌ | 288000/818627 [00:32<00:59, 8849.90 examples/s]
+Filter: 35%|███▌ | 288000/818627 [00:32<00:59, 8851.59 examples/s]
+Filter: 35%|███▌ | 288000/818627 [00:32<00:59, 8860.37 examples/s]
+Filter: 35%|███▌ | 288000/818627 [00:32<00:59, 8850.36 examples/s]
+Filter: 35%|███▌ | 288000/818627 [00:32<00:59, 8850.57 examples/s]
+Filter: 35%|███▌ | 289000/818627 [00:32<00:59, 8870.00 examples/s]
+Filter: 35%|███▌ | 289000/818627 [00:32<00:59, 8861.27 examples/s]
+Filter: 35%|███▌ | 289000/818627 [00:32<00:59, 8871.24 examples/s]
+Filter: 35%|███▌ | 289000/818627 [00:32<00:59, 8867.19 examples/s]
+Filter: 35%|███▌ | 289000/818627 [00:32<00:59, 8865.49 examples/s]
+Filter: 35%|███▌ | 289000/818627 [00:32<00:59, 8870.71 examples/s]
+Filter: 35%|███▌ | 289000/818627 [00:32<01:00, 8736.60 examples/s]
+Filter: 35%|███▌ | 289000/818627 [00:32<01:01, 8568.70 examples/s]
+Filter: 35%|███▌ | 290000/818627 [00:32<00:59, 8905.48 examples/s]
+Filter: 35%|███▌ | 290000/818627 [00:32<00:59, 8943.91 examples/s]
+Filter: 35%|███▌ | 290000/818627 [00:32<00:59, 8904.40 examples/s]
+Filter: 35%|███▌ | 290000/818627 [00:32<00:59, 8904.33 examples/s]
+Filter: 35%|███▌ | 290000/818627 [00:32<00:59, 8908.90 examples/s]
+Filter: 35%|███▌ | 290000/818627 [00:32<00:59, 8903.33 examples/s]
+Filter: 35%|███▌ | 290000/818627 [00:32<00:59, 8900.50 examples/s]
+Filter: 36%|███▌ | 291000/818627 [00:32<00:59, 8873.97 examples/s]
+Filter: 36%|███▌ | 291000/818627 [00:32<00:59, 8877.46 examples/s]
+Filter: 36%|███▌ | 291000/818627 [00:32<00:59, 8900.33 examples/s]
+Filter: 36%|███▌ | 291000/818627 [00:32<00:58, 8953.00 examples/s]
+Filter: 36%|███▌ | 291000/818627 [00:32<00:59, 8879.86 examples/s]
+Filter: 36%|███▌ | 291000/818627 [00:32<00:59, 8874.83 examples/s]
+Filter: 36%|███▌ | 291000/818627 [00:32<00:59, 8876.40 examples/s]
+Filter: 36%|███▌ | 291000/818627 [00:32<00:59, 8872.65 examples/s]
+Filter: 36%|███▌ | 292000/818627 [00:32<00:59, 8808.41 examples/s]
+Filter: 36%|███▌ | 292000/818627 [00:32<00:59, 8809.46 examples/s]
+Filter: 36%|███▌ | 292000/818627 [00:32<00:59, 8823.22 examples/s]
+Filter: 36%|███▌ | 292000/818627 [00:33<00:59, 8877.29 examples/s]
+Filter: 36%|███▌ | 292000/818627 [00:32<00:59, 8810.11 examples/s]
+Filter: 36%|███▌ | 292000/818627 [00:32<00:59, 8811.31 examples/s]
+Filter: 36%|███▌ | 292000/818627 [00:32<00:59, 8808.65 examples/s]
+Filter: 36%|███▌ | 292000/818627 [00:32<00:59, 8806.78 examples/s]
+Filter: 36%|███▌ | 293000/818627 [00:32<01:00, 8756.49 examples/s]
+Filter: 36%|███▌ | 293000/818627 [00:32<01:00, 8756.65 examples/s]
+Filter: 36%|███▌ | 293000/818627 [00:32<00:59, 8768.06 examples/s]
+Filter: 36%|███▌ | 293000/818627 [00:33<00:59, 8816.83 examples/s]
+Filter: 36%|███▌ | 293000/818627 [00:32<01:00, 8757.46 examples/s]
+Filter: 36%|███▌ | 293000/818627 [00:32<01:00, 8755.27 examples/s]
+Filter: 36%|███▌ | 293000/818627 [00:32<01:00, 8754.50 examples/s]
+Filter: 36%|███▌ | 293000/818627 [00:32<01:00, 8754.21 examples/s]
+Filter: 36%|███▌ | 294000/818627 [00:33<00:59, 8832.26 examples/s]
+Filter: 36%|███▌ | 294000/818627 [00:32<00:59, 8817.74 examples/s]
+Filter: 36%|███▌ | 294000/818627 [00:33<00:59, 8819.19 examples/s]
+Filter: 36%|███▌ | 294000/818627 [00:33<00:59, 8857.61 examples/s]
+Filter: 36%|███▌ | 294000/818627 [00:32<00:59, 8818.57 examples/s]
+Filter: 36%|███▌ | 294000/818627 [00:33<00:59, 8819.93 examples/s]
+Filter: 36%|███▌ | 294000/818627 [00:32<00:59, 8816.66 examples/s]
+Filter: 36%|███▌ | 294000/818627 [00:33<00:59, 8818.89 examples/s]
+Filter: 36%|███▌ | 295000/818627 [00:33<00:58, 8894.74 examples/s]
+Filter: 36%|███▌ | 295000/818627 [00:33<00:58, 8901.35 examples/s]
+Filter: 36%|███▌ | 295000/818627 [00:33<00:58, 8894.53 examples/s]
+Filter: 36%|███▌ | 295000/818627 [00:33<00:58, 8914.30 examples/s]
+Filter: 36%|███▌ | 295000/818627 [00:33<00:58, 8894.04 examples/s]
+Filter: 36%|███▌ | 295000/818627 [00:33<00:58, 8894.95 examples/s]
+Filter: 36%|███▌ | 295000/818627 [00:33<00:58, 8894.40 examples/s]
+Filter: 36%|███▌ | 295000/818627 [00:33<00:58, 8896.01 examples/s]
+Filter: 36%|███▌ | 296000/818627 [00:33<00:59, 8823.40 examples/s]
+Filter: 36%|███▌ | 296000/818627 [00:33<00:59, 8819.08 examples/s]
+Filter: 36%|███▌ | 296000/818627 [00:33<00:59, 8825.03 examples/s]
+Filter: 36%|███▌ | 296000/818627 [00:33<00:59, 8844.76 examples/s]
+Filter: 36%|███▌ | 296000/818627 [00:33<00:59, 8825.26 examples/s]
+Filter: 36%|███▌ | 296000/818627 [00:33<00:59, 8823.34 examples/s]
+Filter: 36%|███▌ | 296000/818627 [00:33<00:59, 8822.84 examples/s]
+Filter: 36%|███▌ | 296000/818627 [00:33<00:59, 8817.10 examples/s]
+Filter: 36%|███▋ | 297000/818627 [00:33<00:59, 8815.83 examples/s]
+Filter: 36%|███▋ | 297000/818627 [00:33<00:59, 8819.88 examples/s]
+Filter: 36%|███▋ | 297000/818627 [00:33<00:59, 8834.13 examples/s]
+Filter: 36%|███▋ | 297000/818627 [00:33<00:59, 8814.74 examples/s]
+Filter: 36%|███▋ | 297000/818627 [00:33<00:59, 8817.84 examples/s]
+Filter: 36%|███▋ | 297000/818627 [00:33<00:59, 8815.00 examples/s]
+Filter: 36%|███▋ | 297000/818627 [00:33<00:59, 8813.94 examples/s]
+Filter: 36%|███▋ | 297000/818627 [00:33<00:59, 8817.83 examples/s]
+Filter: 36%|███▋ | 298000/818627 [00:33<00:59, 8765.82 examples/s]
+Filter: 36%|███▋ | 298000/818627 [00:33<00:59, 8761.61 examples/s]
+Filter: 36%|███▋ | 298000/818627 [00:33<00:59, 8757.47 examples/s]
+Filter: 36%|███▋ | 298000/818627 [00:33<00:59, 8765.11 examples/s]
+Filter: 36%|███▋ | 298000/818627 [00:33<00:59, 8763.03 examples/s]
+Filter: 36%|███▋ | 298000/818627 [00:33<00:59, 8762.56 examples/s]
+Filter: 36%|███▋ | 298000/818627 [00:33<00:59, 8761.90 examples/s]
+Filter: 36%|███▋ | 298000/818627 [00:33<01:00, 8606.38 examples/s]
+Filter: 37%|███▋ | 299000/818627 [00:33<00:59, 8728.66 examples/s]
+Filter: 37%|███▋ | 299000/818627 [00:33<00:59, 8725.48 examples/s]
+Filter: 37%|███▋ | 299000/818627 [00:33<00:59, 8724.65 examples/s]
+Filter: 37%|███▋ | 299000/818627 [00:33<00:59, 8732.74 examples/s]
+Filter: 37%|███▋ | 299000/818627 [00:33<00:59, 8726.82 examples/s]
+Filter: 37%|███▋ | 299000/818627 [00:33<00:59, 8772.84 examples/s]
+Filter: 37%|███▋ | 299000/818627 [00:33<00:59, 8725.77 examples/s]
+Filter: 37%|███▋ | 299000/818627 [00:33<00:59, 8728.26 examples/s]
+Filter: 37%|███▋ | 300000/818627 [00:33<00:59, 8740.11 examples/s]
+Filter: 37%|███▋ | 300000/818627 [00:33<00:59, 8743.44 examples/s]
+Filter: 37%|███▋ | 300000/818627 [00:33<00:59, 8739.93 examples/s]
+Filter: 37%|███▋ | 300000/818627 [00:34<00:59, 8749.27 examples/s]
+Filter: 37%|███▋ | 300000/818627 [00:33<00:59, 8742.43 examples/s]
+Filter: 37%|███▋ | 300000/818627 [00:33<00:59, 8741.53 examples/s]
+Filter: 37%|███▋ | 300000/818627 [00:33<00:59, 8774.52 examples/s]
+Filter: 37%|███▋ | 300000/818627 [00:33<00:59, 8739.91 examples/s]
+Filter: 37%|███▋ | 301000/818627 [00:33<00:57, 9065.88 examples/s]
+Filter: 37%|███▋ | 301000/818627 [00:34<00:57, 9069.19 examples/s]
+Filter: 37%|███▋ | 301000/818627 [00:33<00:57, 9058.76 examples/s]
+Filter: 37%|███▋ | 301000/818627 [00:33<00:56, 9086.94 examples/s]
+Filter: 37%|███▋ | 301000/818627 [00:33<00:57, 9061.87 examples/s]
+Filter: 37%|███▋ | 301000/818627 [00:33<00:57, 9056.23 examples/s]
+Filter: 37%|███▋ | 301000/818627 [00:33<00:57, 9060.13 examples/s]
+Filter: 37%|███▋ | 301000/818627 [00:33<00:58, 8899.62 examples/s]
+Filter: 37%|███▋ | 302000/818627 [00:33<00:56, 9108.72 examples/s]
+Filter: 37%|███▋ | 302000/818627 [00:34<00:56, 9064.25 examples/s]
+Filter: 37%|███▋ | 302000/818627 [00:33<00:57, 9057.68 examples/s]
+Filter: 37%|███▋ | 302000/818627 [00:34<00:56, 9064.20 examples/s]
+Filter: 37%|███▋ | 302000/818627 [00:33<00:56, 9080.09 examples/s]
+Filter: 37%|███▋ | 302000/818627 [00:33<00:57, 9060.07 examples/s]
+Filter: 37%|███▋ | 302000/818627 [00:33<00:56, 9063.97 examples/s]
+Filter: 37%|███▋ | 302000/818627 [00:33<00:57, 8995.48 examples/s]
+Filter: 37%|███▋ | 303000/818627 [00:34<00:57, 8988.27 examples/s]
+Filter: 37%|███▋ | 303000/818627 [00:34<00:57, 8960.06 examples/s]
+Filter: 37%|███▋ | 303000/818627 [00:34<00:57, 8958.88 examples/s]
+Filter: 37%|███▋ | 303000/818627 [00:34<00:57, 8974.46 examples/s]
+Filter: 37%|███▋ | 303000/818627 [00:34<00:57, 8968.13 examples/s]
+Filter: 37%|███▋ | 303000/818627 [00:34<00:57, 8954.09 examples/s]
+Filter: 37%|███▋ | 303000/818627 [00:34<00:57, 8954.55 examples/s]
+Filter: 37%|███▋ | 303000/818627 [00:34<00:57, 8956.26 examples/s]
+Filter: 37%|███▋ | 304000/818627 [00:34<00:57, 8921.82 examples/s]
+Filter: 37%|███▋ | 304000/818627 [00:34<00:57, 8898.43 examples/s]
+Filter: 37%|███▋ | 304000/818627 [00:34<00:57, 8911.52 examples/s]
+Filter: 37%|███▋ | 304000/818627 [00:34<00:57, 8898.41 examples/s]
+Filter: 37%|███▋ | 304000/818627 [00:34<00:57, 8899.67 examples/s]
+Filter: 37%|███▋ | 304000/818627 [00:34<00:57, 8905.51 examples/s]
+Filter: 37%|███▋ | 304000/818627 [00:34<00:57, 8897.20 examples/s]
+Filter: 37%|███▋ | 304000/818627 [00:34<00:57, 8897.77 examples/s]
+Filter: 37%|███▋ | 305000/818627 [00:34<00:57, 8864.64 examples/s]
+Filter: 37%|███▋ | 305000/818627 [00:34<00:58, 8850.33 examples/s]
+Filter: 37%|███▋ | 305000/818627 [00:34<00:57, 8858.82 examples/s]
+Filter: 37%|███▋ | 305000/818627 [00:34<00:58, 8849.15 examples/s]
+Filter: 37%|███▋ | 305000/818627 [00:34<00:58, 8846.92 examples/s]
+Filter: 37%|███▋ | 305000/818627 [00:34<00:58, 8846.87 examples/s]
+Filter: 37%|███▋ | 305000/818627 [00:34<00:58, 8851.03 examples/s]
+Filter: 37%|███▋ | 305000/818627 [00:34<00:58, 8847.15 examples/s]
+Filter: 37%|███▋ | 306000/818627 [00:34<00:58, 8828.14 examples/s]
+Filter: 37%|███▋ | 306000/818627 [00:34<00:58, 8820.51 examples/s]
+Filter: 37%|███▋ | 306000/818627 [00:34<00:58, 8826.38 examples/s]
+Filter: 37%|███▋ | 306000/818627 [00:34<00:58, 8817.88 examples/s]
+Filter: 37%|███▋ | 306000/818627 [00:34<00:58, 8820.48 examples/s]
+Filter: 37%|███▋ | 306000/818627 [00:34<00:58, 8818.19 examples/s]
+Filter: 37%|███▋ | 306000/818627 [00:34<00:59, 8640.58 examples/s]
+Filter: 37%|███▋ | 306000/818627 [00:34<00:59, 8627.72 examples/s]
+Filter: 38%|███▊ | 307000/818627 [00:34<00:59, 8530.50 examples/s]
+Filter: 38%|███▊ | 307000/818627 [00:34<00:59, 8529.68 examples/s]
+Filter: 38%|███▊ | 307000/818627 [00:34<01:00, 8523.61 examples/s]
+Filter: 38%|███▊ | 307000/818627 [00:34<00:59, 8580.06 examples/s]
+Filter: 38%|███▊ | 307000/818627 [00:34<00:59, 8577.09 examples/s]
+Filter: 38%|███▊ | 307000/818627 [00:34<01:00, 8520.70 examples/s]
+Filter: 38%|███▊ | 307000/818627 [00:34<01:00, 8519.88 examples/s]
+Filter: 38%|███▊ | 307000/818627 [00:34<01:00, 8506.17 examples/s]
+Filter: 38%|███▊ | 308000/818627 [00:34<00:59, 8572.88 examples/s]
+Filter: 38%|███▊ | 308000/818627 [00:34<00:59, 8571.42 examples/s]
+Filter: 38%|███▊ | 308000/818627 [00:34<00:59, 8566.85 examples/s]
+Filter: 38%|███▊ | 308000/818627 [00:34<00:59, 8609.77 examples/s]
+Filter: 38%|███▊ | 308000/818627 [00:34<00:59, 8566.89 examples/s]
+Filter: 38%|███▊ | 308000/818627 [00:34<00:59, 8604.27 examples/s]
+Filter: 38%|███▊ | 308000/818627 [00:34<00:59, 8564.24 examples/s]
+Filter: 38%|███▊ | 308000/818627 [00:34<00:59, 8566.74 examples/s]
+Filter: 38%|███▊ | 309000/818627 [00:34<00:59, 8607.29 examples/s]
+Filter: 38%|███▊ | 309000/818627 [00:34<00:59, 8603.56 examples/s]
+Filter: 38%|███▊ | 309000/818627 [00:34<00:59, 8601.14 examples/s]
+Filter: 38%|███▊ | 309000/818627 [00:34<00:59, 8631.68 examples/s]
+Filter: 38%|███▊ | 309000/818627 [00:35<00:59, 8599.42 examples/s]
+Filter: 38%|███▊ | 309000/818627 [00:34<00:59, 8628.40 examples/s]
+Filter: 38%|███▊ | 309000/818627 [00:34<00:59, 8603.81 examples/s]
+Filter: 38%|███▊ | 309000/818627 [00:34<00:59, 8604.04 examples/s]
+Filter: 38%|███▊ | 310000/818627 [00:34<00:58, 8697.69 examples/s]
+Filter: 38%|███▊ | 310000/818627 [00:34<00:58, 8696.85 examples/s]
+Filter: 38%|███▊ | 310000/818627 [00:34<00:58, 8693.63 examples/s]
+Filter: 38%|███▊ | 310000/818627 [00:34<00:58, 8714.53 examples/s]
+Filter: 38%|███▊ | 310000/818627 [00:35<00:58, 8692.01 examples/s]
+Filter: 38%|███▊ | 310000/818627 [00:34<00:58, 8695.79 examples/s]
+Filter: 38%|███▊ | 310000/818627 [00:34<00:58, 8711.96 examples/s]
+Filter: 38%|███▊ | 310000/818627 [00:34<00:58, 8696.00 examples/s]
+Filter: 38%|███▊ | 311000/818627 [00:34<00:58, 8718.60 examples/s]
+Filter: 38%|███▊ | 311000/818627 [00:34<00:58, 8719.78 examples/s]
+Filter: 38%|███▊ | 311000/818627 [00:34<00:58, 8718.73 examples/s]
+Filter: 38%|███▊ | 311000/818627 [00:35<00:58, 8720.58 examples/s]
+Filter: 38%|███▊ | 311000/818627 [00:35<00:58, 8734.11 examples/s]
+Filter: 38%|███▊ | 311000/818627 [00:34<00:58, 8732.77 examples/s]
+Filter: 38%|███▊ | 311000/818627 [00:34<00:58, 8719.39 examples/s]
+Filter: 38%|███▊ | 311000/818627 [00:34<00:58, 8719.78 examples/s]
+Filter: 38%|███▊ | 312000/818627 [00:35<00:56, 8912.60 examples/s]
+Filter: 38%|███▊ | 312000/818627 [00:35<00:56, 8911.72 examples/s]
+Filter: 38%|███▊ | 312000/818627 [00:35<00:56, 8910.56 examples/s]
+Filter: 38%|███▊ | 312000/818627 [00:35<00:56, 8912.75 examples/s]
+Filter: 38%|███▊ | 312000/818627 [00:35<00:56, 8919.84 examples/s]
+Filter: 38%|███▊ | 312000/818627 [00:35<00:56, 8920.28 examples/s]
+Filter: 38%|███▊ | 312000/818627 [00:35<00:56, 8910.41 examples/s]
+Filter: 38%|███▊ | 312000/818627 [00:35<00:56, 8909.89 examples/s]
+Filter: 38%|███▊ | 313000/818627 [00:35<00:57, 8785.23 examples/s]
+Filter: 38%|███▊ | 313000/818627 [00:35<00:57, 8785.16 examples/s]
+Filter: 38%|███▊ | 313000/818627 [00:35<00:57, 8780.73 examples/s]
+Filter: 38%|███▊ | 313000/818627 [00:35<00:57, 8783.94 examples/s]
+Filter: 38%|███▊ | 313000/818627 [00:35<00:57, 8783.80 examples/s]
+Filter: 38%|███▊ | 313000/818627 [00:35<00:57, 8787.35 examples/s]
+Filter: 38%|███▊ | 313000/818627 [00:35<00:57, 8786.79 examples/s]
+Filter: 38%|███▊ | 313000/818627 [00:35<00:57, 8781.54 examples/s]
+Filter: 38%|███▊ | 314000/818627 [00:35<00:57, 8705.15 examples/s]
+Filter: 38%|███▊ | 314000/818627 [00:35<00:57, 8704.34 examples/s]
+Filter: 38%|███▊ | 314000/818627 [00:35<00:58, 8699.70 examples/s]
+Filter: 38%|███▊ | 314000/818627 [00:35<00:57, 8705.25 examples/s]
+Filter: 38%|███▊ | 314000/818627 [00:35<00:57, 8709.31 examples/s]
+Filter: 38%|███▊ | 314000/818627 [00:35<00:57, 8702.34 examples/s]
+Filter: 38%|███▊ | 314000/818627 [00:35<00:57, 8705.69 examples/s]
+Filter: 38%|███▊ | 314000/818627 [00:35<00:57, 8702.94 examples/s]
+Filter: 38%|███▊ | 315000/818627 [00:35<00:57, 8724.49 examples/s]
+Filter: 38%|███▊ | 315000/818627 [00:35<00:57, 8718.64 examples/s]
+Filter: 38%|███▊ | 315000/818627 [00:35<00:57, 8726.20 examples/s]
+Filter: 38%|███▊ | 315000/818627 [00:35<00:57, 8717.12 examples/s]
+Filter: 38%|███▊ | 315000/818627 [00:35<00:57, 8724.80 examples/s]
+Filter: 38%|███▊ | 315000/818627 [00:35<00:57, 8728.80 examples/s]
+Filter: 38%|███▊ | 315000/818627 [00:35<00:57, 8726.96 examples/s]
+Filter: 38%|███▊ | 315000/818627 [00:35<00:57, 8724.62 examples/s]
+Filter: 39%|███▊ | 316000/818627 [00:35<00:57, 8741.16 examples/s]
+Filter: 39%|███▊ | 316000/818627 [00:35<00:57, 8739.86 examples/s]
+Filter: 39%|███▊ | 316000/818627 [00:35<00:57, 8739.28 examples/s]
+Filter: 39%|███▊ | 316000/818627 [00:35<00:57, 8738.59 examples/s]
+Filter: 39%|███▊ | 316000/818627 [00:35<00:57, 8743.50 examples/s]
+Filter: 39%|███▊ | 316000/818627 [00:35<00:57, 8742.37 examples/s]
+Filter: 39%|███▊ | 316000/818627 [00:35<00:57, 8739.50 examples/s]
+Filter: 39%|███▊ | 316000/818627 [00:35<00:57, 8740.52 examples/s]
+Filter: 39%|███▊ | 317000/818627 [00:35<00:57, 8711.63 examples/s]
+Filter: 39%|███▊ | 317000/818627 [00:35<00:57, 8710.87 examples/s]
+Filter: 39%|███▊ | 317000/818627 [00:35<00:57, 8705.10 examples/s]
+Filter: 39%|███▊ | 317000/818627 [00:35<00:57, 8714.64 examples/s]
+Filter: 39%|███▊ | 317000/818627 [00:35<00:57, 8711.52 examples/s]
+Filter: 39%|███▊ | 317000/818627 [00:35<00:57, 8710.18 examples/s]
+Filter: 39%|███▊ | 317000/818627 [00:35<00:57, 8702.45 examples/s]
+Filter: 39%|███▊ | 317000/818627 [00:35<00:57, 8707.97 examples/s]
+Filter: 39%|███▉ | 318000/818627 [00:35<00:56, 8847.84 examples/s]
+Filter: 39%|███▉ | 318000/818627 [00:35<00:56, 8847.37 examples/s]
+Filter: 39%|███▉ | 318000/818627 [00:35<00:56, 8844.29 examples/s]
+Filter: 39%|███▉ | 318000/818627 [00:35<00:56, 8850.93 examples/s]
+Filter: 39%|███▉ | 318000/818627 [00:36<00:56, 8848.57 examples/s]
+Filter: 39%|███▉ | 318000/818627 [00:35<00:56, 8849.36 examples/s]
+Filter: 39%|███▉ | 318000/818627 [00:35<00:56, 8848.82 examples/s]
+Filter: 39%|███▉ | 318000/818627 [00:35<00:56, 8849.30 examples/s]
+Filter: 39%|███▉ | 319000/818627 [00:35<00:55, 9021.02 examples/s]
+Filter: 39%|███▉ | 319000/818627 [00:35<00:55, 9025.36 examples/s]
+Filter: 39%|███▉ | 319000/818627 [00:35<00:55, 9023.05 examples/s]
+Filter: 39%|███▉ | 319000/818627 [00:36<00:55, 9019.71 examples/s]
+Filter: 39%|███▉ | 319000/818627 [00:35<00:55, 9020.16 examples/s]
+Filter: 39%|███▉ | 319000/818627 [00:35<00:55, 9020.59 examples/s]
+Filter: 39%|███▉ | 319000/818627 [00:35<00:55, 9023.27 examples/s]
+Filter: 39%|███▉ | 319000/818627 [00:35<00:55, 9016.30 examples/s]
+Filter: 39%|███▉ | 320000/818627 [00:35<00:55, 8987.23 examples/s]
+Filter: 39%|███▉ | 320000/818627 [00:35<00:55, 8989.82 examples/s]
+Filter: 39%|███▉ | 320000/818627 [00:35<00:55, 8987.88 examples/s]
+Filter: 39%|███▉ | 320000/818627 [00:35<00:55, 8990.07 examples/s]
+Filter: 39%|███▉ | 320000/818627 [00:36<00:55, 8992.90 examples/s]
+Filter: 39%|███▉ | 320000/818627 [00:35<00:55, 8984.96 examples/s]
+Filter: 39%|███▉ | 320000/818627 [00:35<00:55, 8984.71 examples/s]
+Filter: 39%|███▉ | 321000/818627 [00:36<00:55, 8937.25 examples/s]
+Filter: 39%|███▉ | 321000/818627 [00:36<00:55, 8930.63 examples/s]
+Filter: 39%|███▉ | 321000/818627 [00:36<00:55, 8931.33 examples/s]
+Filter: 39%|███▉ | 322000/818627 [00:36<00:55, 9000.47 examples/s]
+Filter: 39%|███▉ | 322000/818627 [00:36<00:55, 9005.82 examples/s]
+Filter: 39%|███▉ | 322000/818627 [00:36<00:55, 9004.76 examples/s]
+Filter: 39%|███▉ | 320000/818627 [00:36<01:40, 4983.61 examples/s]
+Filter: 39%|███▉ | 323000/818627 [00:36<00:55, 9006.10 examples/s]
+Filter: 39%|███▉ | 323000/818627 [00:36<00:55, 9007.27 examples/s]
+Filter: 39%|███▉ | 323000/818627 [00:36<00:55, 9004.30 examples/s]
+Filter: 39%|███▉ | 321000/818627 [00:36<01:35, 5220.60 examples/s]
+Filter: 39%|███▉ | 321000/818627 [00:36<01:36, 5175.71 examples/s]
+Filter: 39%|███▉ | 321000/818627 [00:36<01:37, 5097.53 examples/s]
+Filter: 39%|███▉ | 321000/818627 [00:36<01:39, 4997.36 examples/s]
+Filter: 40%|███▉ | 324000/818627 [00:36<00:54, 9029.31 examples/s]
+Filter: 40%|███▉ | 324000/818627 [00:36<00:54, 9029.26 examples/s]
+Filter: 40%|███▉ | 324000/818627 [00:36<00:54, 9026.61 examples/s]
+Filter: 39%|███▉ | 322000/818627 [00:36<01:11, 6907.88 examples/s]
+Filter: 39%|███▉ | 323000/818627 [00:36<01:09, 7178.58 examples/s]
+Filter: 39%|███▉ | 323000/818627 [00:36<01:09, 7137.80 examples/s]
+Filter: 39%|███▉ | 323000/818627 [00:36<01:09, 7091.48 examples/s]
+Filter: 40%|███▉ | 325000/818627 [00:36<00:54, 9096.91 examples/s]
+Filter: 40%|███▉ | 325000/818627 [00:36<00:54, 9091.64 examples/s]
+Filter: 40%|███▉ | 325000/818627 [00:36<00:54, 9094.89 examples/s]
+Filter: 39%|███▉ | 323000/818627 [00:36<01:10, 7003.47 examples/s]
+Filter: 40%|███▉ | 324000/818627 [00:36<00:58, 8457.63 examples/s]
+Filter: 40%|███▉ | 325000/818627 [00:36<00:56, 8707.87 examples/s]
+Filter: 40%|███▉ | 325000/818627 [00:36<00:56, 8767.80 examples/s]
+Filter: 40%|███▉ | 325000/818627 [00:36<00:57, 8571.91 examples/s]
+Filter: 40%|███▉ | 325000/818627 [00:36<00:57, 8629.07 examples/s]
+Filter: 40%|███▉ | 326000/818627 [00:37<00:53, 9266.75 examples/s]
+Filter: 40%|███▉ | 327000/818627 [00:36<00:54, 9060.14 examples/s]
+Filter: 40%|███▉ | 327000/818627 [00:36<00:53, 9214.61 examples/s]
+Filter: 40%|███▉ | 327000/818627 [00:36<00:54, 9088.52 examples/s]
+Filter: 40%|███▉ | 327000/818627 [00:36<00:54, 8988.94 examples/s]
+Filter: 40%|███▉ | 326000/818627 [00:36<01:38, 5004.08 examples/s]
+Filter: 40%|███▉ | 326000/818627 [00:37<01:40, 4898.87 examples/s]
+Filter: 40%|███▉ | 326000/818627 [00:36<01:40, 4878.76 examples/s]
+Filter: 40%|████ | 328000/818627 [00:37<00:53, 9179.62 examples/s]
+Filter: 40%|████ | 328000/818627 [00:36<00:54, 8945.51 examples/s]
+Filter: 40%|████ | 328000/818627 [00:36<00:54, 9022.59 examples/s]
+Filter: 40%|████ | 328000/818627 [00:37<01:10, 6979.44 examples/s]
+Filter: 40%|████ | 329000/818627 [00:37<00:54, 8983.92 examples/s]
+Filter: 40%|████ | 329000/818627 [00:37<00:53, 9082.32 examples/s]
+Filter: 40%|████ | 329000/818627 [00:37<00:53, 9125.39 examples/s]
+Filter: 40%|████ | 329000/818627 [00:37<00:54, 8939.89 examples/s]
+Filter: 40%|████ | 329000/818627 [00:37<00:54, 8997.18 examples/s]
+Filter: 40%|████ | 328000/818627 [00:37<01:11, 6871.30 examples/s]
+Filter: 40%|████ | 328000/818627 [00:37<01:11, 6867.56 examples/s]
+Filter: 40%|████ | 330000/818627 [00:37<00:54, 8973.62 examples/s]
+Filter: 40%|████ | 330000/818627 [00:37<00:53, 9052.78 examples/s]
+Filter: 40%|████ | 330000/818627 [00:37<00:53, 9081.59 examples/s]
+Filter: 40%|████ | 330000/818627 [00:37<00:54, 8938.99 examples/s]
+Filter: 40%|████ | 330000/818627 [00:37<00:54, 8983.85 examples/s]
+Filter: 40%|████ | 330000/818627 [00:37<00:56, 8599.87 examples/s]
+Filter: 40%|████ | 330000/818627 [00:37<00:57, 8498.73 examples/s]
+Filter: 40%|████ | 330000/818627 [00:37<00:57, 8482.79 examples/s]
+Filter: 40%|████ | 331000/818627 [00:37<00:54, 8990.06 examples/s]
+Filter: 40%|████ | 331000/818627 [00:37<00:53, 9046.65 examples/s]
+Filter: 40%|████ | 331000/818627 [00:37<00:54, 8965.61 examples/s]
+Filter: 40%|████ | 331000/818627 [00:37<00:54, 8999.28 examples/s]
+Filter: 40%|████ | 331000/818627 [00:37<00:53, 9064.09 examples/s]
+Filter: 41%|████ | 332000/818627 [00:37<00:53, 9034.00 examples/s]
+Filter: 41%|████ | 332000/818627 [00:37<00:53, 9084.38 examples/s]
+Filter: 41%|████ | 332000/818627 [00:37<00:52, 9182.42 examples/s]
+Filter: 41%|████ | 332000/818627 [00:37<00:53, 9104.73 examples/s]
+Filter: 41%|████ | 332000/818627 [00:37<00:52, 9346.05 examples/s]
+Filter: 41%|████ | 332000/818627 [00:37<00:52, 9336.26 examples/s]
+Filter: 41%|████ | 332000/818627 [00:37<00:53, 9021.59 examples/s]
+Filter: 41%|████ | 332000/818627 [00:37<00:53, 9044.03 examples/s]
+Filter: 41%|████ | 333000/818627 [00:37<00:53, 9085.10 examples/s]
+Filter: 41%|████ | 333000/818627 [00:37<00:53, 9123.54 examples/s]
+Filter: 41%|████ | 333000/818627 [00:37<00:53, 9139.47 examples/s]
+Filter: 41%|████ | 333000/818627 [00:37<00:53, 9085.48 examples/s]
+Filter: 41%|████ | 333000/818627 [00:37<00:53, 9100.14 examples/s]
+Filter: 41%|████ | 334000/818627 [00:37<00:54, 8964.23 examples/s]
+Filter: 41%|████ | 334000/818627 [00:37<00:53, 9098.11 examples/s]
+Filter: 41%|████ | 334000/818627 [00:37<00:53, 8992.22 examples/s]
+Filter: 41%|████ | 334000/818627 [00:37<00:53, 8999.86 examples/s]
+Filter: 41%|████ | 334000/818627 [00:37<00:52, 9199.94 examples/s]
+Filter: 41%|████ | 334000/818627 [00:37<00:52, 9195.25 examples/s]
+Filter: 41%|████ | 334000/818627 [00:37<00:54, 8955.86 examples/s]
+Filter: 41%|████ | 334000/818627 [00:37<00:54, 8967.83 examples/s]
+Filter: 41%|████ | 335000/818627 [00:37<00:54, 8887.80 examples/s]
+Filter: 41%|████ | 335000/818627 [00:37<00:53, 9014.78 examples/s]
+Filter: 41%|████ | 335000/818627 [00:37<00:54, 8905.38 examples/s]
+Filter: 41%|████ | 335000/818627 [00:38<00:54, 8907.28 examples/s]
+Filter: 41%|████ | 335000/818627 [00:37<00:54, 8876.84 examples/s]
+Filter: 41%|████ | 335000/818627 [00:37<00:54, 8886.35 examples/s]
+Filter: 41%|████ | 336000/818627 [00:37<00:54, 8852.12 examples/s]
+Filter: 41%|████ | 336000/818627 [00:37<00:54, 8865.57 examples/s]
+Filter: 41%|████ | 336000/818627 [00:37<00:53, 8956.62 examples/s]
+Filter: 41%|████ | 336000/818627 [00:37<00:53, 9040.54 examples/s]
+Filter: 41%|████ | 336000/818627 [00:37<00:53, 9036.77 examples/s]
+Filter: 41%|████ | 336000/818627 [00:37<00:54, 8846.36 examples/s]
+Filter: 41%|████ | 336000/818627 [00:37<00:54, 8853.26 examples/s]
+Filter: 41%|████ | 336000/818627 [00:38<00:54, 8860.84 examples/s]
+Filter: 41%|████ | 337000/818627 [00:37<00:54, 8905.46 examples/s]
+Filter: 41%|████ | 337000/818627 [00:37<00:54, 8814.34 examples/s]
+Filter: 41%|████ | 337000/818627 [00:37<00:54, 8825.42 examples/s]
+Filter: 41%|████ | 337000/818627 [00:37<00:53, 8981.41 examples/s]
+Filter: 41%|████ | 337000/818627 [00:38<00:53, 8978.42 examples/s]
+Filter: 41%|████ | 337000/818627 [00:38<00:54, 8825.63 examples/s]
+Filter: 41%|████ | 337000/818627 [00:37<00:54, 8809.21 examples/s]
+Filter: 41%|████ | 337000/818627 [00:37<00:54, 8814.32 examples/s]
+Filter: 41%|████▏ | 338000/818627 [00:38<00:54, 8891.55 examples/s]
+Filter: 41%|████▏ | 338000/818627 [00:38<00:54, 8838.14 examples/s]
+Filter: 41%|████▏ | 338000/818627 [00:38<00:54, 8822.23 examples/s]
+Filter: 41%|████▏ | 338000/818627 [00:38<00:54, 8838.45 examples/s]
+Filter: 41%|████▏ | 338000/818627 [00:38<00:53, 8952.18 examples/s]
+Filter: 41%|████▏ | 338000/818627 [00:38<00:54, 8823.68 examples/s]
+Filter: 41%|████▏ | 338000/818627 [00:38<00:53, 8948.53 examples/s]
+Filter: 41%|████▏ | 338000/818627 [00:38<00:54, 8826.22 examples/s]
+Filter: 41%|████▏ | 339000/818627 [00:38<00:53, 8927.30 examples/s]
+Filter: 41%|████▏ | 339000/818627 [00:38<00:53, 8962.96 examples/s]
+Filter: 41%|████▏ | 339000/818627 [00:38<00:53, 8930.59 examples/s]
+Filter: 41%|████▏ | 339000/818627 [00:38<00:53, 8932.74 examples/s]
+Filter: 41%|████▏ | 339000/818627 [00:38<00:53, 9000.02 examples/s]
+Filter: 41%|████▏ | 339000/818627 [00:38<00:53, 8999.93 examples/s]
+Filter: 41%|████▏ | 339000/818627 [00:38<00:53, 8923.63 examples/s]
+Filter: 41%|████▏ | 339000/818627 [00:38<00:53, 8924.11 examples/s]
+Filter: 42%|████▏ | 340000/818627 [00:38<00:54, 8830.40 examples/s]
+Filter: 42%|████▏ | 340000/818627 [00:38<00:54, 8862.83 examples/s]
+Filter: 42%|████▏ | 340000/818627 [00:38<00:54, 8834.16 examples/s]
+Filter: 42%|████▏ | 340000/818627 [00:38<00:54, 8833.71 examples/s]
+Filter: 42%|████▏ | 340000/818627 [00:38<00:54, 8827.00 examples/s]
+Filter: 42%|████▏ | 340000/818627 [00:38<00:53, 8897.57 examples/s]
+Filter: 42%|████▏ | 340000/818627 [00:38<00:53, 8897.65 examples/s]
+Filter: 42%|████▏ | 340000/818627 [00:38<00:54, 8827.14 examples/s]
+Filter: 42%|████▏ | 341000/818627 [00:38<00:54, 8738.18 examples/s]
+Filter: 42%|████▏ | 341000/818627 [00:38<00:54, 8741.34 examples/s]
+Filter: 42%|████▏ | 341000/818627 [00:38<00:54, 8759.94 examples/s]
+Filter: 42%|████▏ | 341000/818627 [00:38<00:54, 8738.90 examples/s]
+Filter: 42%|████▏ | 341000/818627 [00:38<00:54, 8796.47 examples/s]
+Filter: 42%|████▏ | 341000/818627 [00:38<00:54, 8795.35 examples/s]
+Filter: 42%|████▏ | 341000/818627 [00:38<00:54, 8733.17 examples/s]
+Filter: 42%|████▏ | 341000/818627 [00:38<00:54, 8734.51 examples/s]
+Filter: 42%|████▏ | 342000/818627 [00:38<00:54, 8722.00 examples/s]
+Filter: 42%|████▏ | 342000/818627 [00:38<00:54, 8721.75 examples/s]
+Filter: 42%|████▏ | 342000/818627 [00:38<00:54, 8736.80 examples/s]
+Filter: 42%|████▏ | 342000/818627 [00:38<00:54, 8723.17 examples/s]
+Filter: 42%|████▏ | 342000/818627 [00:38<00:54, 8720.02 examples/s]
+Filter: 42%|████▏ | 342000/818627 [00:38<00:54, 8763.54 examples/s]
+Filter: 42%|████▏ | 342000/818627 [00:38<00:54, 8762.57 examples/s]
+Filter: 42%|████▏ | 342000/818627 [00:38<00:54, 8720.28 examples/s]
+Filter: 42%|████▏ | 343000/818627 [00:38<00:54, 8709.68 examples/s]
+Filter: 42%|████▏ | 343000/818627 [00:38<00:54, 8712.27 examples/s]
+Filter: 42%|████▏ | 343000/818627 [00:38<00:54, 8726.40 examples/s]
+Filter: 42%|████▏ | 343000/818627 [00:38<00:54, 8713.51 examples/s]
+Filter: 42%|████▏ | 343000/818627 [00:38<00:54, 8744.17 examples/s]
+Filter: 42%|████▏ | 343000/818627 [00:38<00:54, 8743.80 examples/s]
+Filter: 42%|████▏ | 343000/818627 [00:38<00:54, 8707.21 examples/s]
+Filter: 42%|████▏ | 343000/818627 [00:38<00:54, 8710.52 examples/s]
+Filter: 42%|████▏ | 344000/818627 [00:38<00:54, 8681.39 examples/s]
+Filter: 42%|████▏ | 344000/818627 [00:38<00:54, 8695.48 examples/s]
+Filter: 42%|████▏ | 344000/818627 [00:39<00:54, 8682.10 examples/s]
+Filter: 42%|████▏ | 344000/818627 [00:38<00:54, 8684.52 examples/s]
+Filter: 42%|████▏ | 344000/818627 [00:38<00:54, 8707.99 examples/s]
+Filter: 42%|████▏ | 344000/818627 [00:38<00:54, 8707.27 examples/s]
+Filter: 42%|████▏ | 344000/818627 [00:38<00:54, 8682.78 examples/s]
+Filter: 42%|████▏ | 344000/818627 [00:38<00:55, 8600.29 examples/s]
+Filter: 42%|████▏ | 345000/818627 [00:38<00:54, 8716.66 examples/s]
+Filter: 42%|████▏ | 345000/818627 [00:38<00:54, 8724.21 examples/s]
+Filter: 42%|████▏ | 345000/818627 [00:38<00:54, 8741.43 examples/s]
+Filter: 42%|████▏ | 345000/818627 [00:39<00:54, 8718.29 examples/s]
+Filter: 42%|████▏ | 345000/818627 [00:38<00:54, 8718.00 examples/s]
+Filter: 42%|████▏ | 345000/818627 [00:38<00:54, 8734.78 examples/s]
+Filter: 42%|████▏ | 345000/818627 [00:38<00:54, 8734.29 examples/s]
+Filter: 42%|████▏ | 345000/818627 [00:38<00:54, 8718.24 examples/s]
+Filter: 42%|████▏ | 346000/818627 [00:39<00:54, 8696.35 examples/s]
+Filter: 42%|████▏ | 346000/818627 [00:39<00:54, 8702.04 examples/s]
+Filter: 42%|████▏ | 346000/818627 [00:39<00:54, 8711.65 examples/s]
+Filter: 42%|████▏ | 346000/818627 [00:39<00:54, 8696.82 examples/s]
+Filter: 42%|████▏ | 346000/818627 [00:39<00:54, 8709.23 examples/s]
+Filter: 42%|████▏ | 346000/818627 [00:39<00:54, 8706.69 examples/s]
+Filter: 42%|████▏ | 346000/818627 [00:39<00:54, 8693.12 examples/s]
+Filter: 42%|████▏ | 346000/818627 [00:39<00:54, 8696.48 examples/s]
+Filter: 42%|████▏ | 347000/818627 [00:39<00:53, 8863.35 examples/s]
+Filter: 42%|████▏ | 347000/818627 [00:39<00:53, 8866.30 examples/s]
+Filter: 42%|████▏ | 347000/818627 [00:39<00:53, 8875.02 examples/s]
+Filter: 42%|████▏ | 347000/818627 [00:39<00:53, 8870.05 examples/s]
+Filter: 42%|████▏ | 347000/818627 [00:39<00:53, 8862.50 examples/s]
+Filter: 42%|████▏ | 347000/818627 [00:39<00:53, 8867.45 examples/s]
+Filter: 42%|████▏ | 347000/818627 [00:39<00:53, 8862.19 examples/s]
+Filter: 42%|████▏ | 347000/818627 [00:39<00:53, 8835.79 examples/s]
+Filter: 43%|████▎ | 348000/818627 [00:39<00:53, 8805.68 examples/s]
+Filter: 43%|████▎ | 348000/818627 [00:39<00:53, 8793.59 examples/s]
+Filter: 43%|████▎ | 348000/818627 [00:39<00:53, 8794.32 examples/s]
+Filter: 43%|████▎ | 348000/818627 [00:39<00:53, 8797.58 examples/s]
+Filter: 43%|████▎ | 348000/818627 [00:39<00:53, 8797.55 examples/s]
+Filter: 43%|████▎ | 348000/818627 [00:39<00:53, 8795.85 examples/s]
+Filter: 43%|████▎ | 348000/818627 [00:39<00:53, 8790.39 examples/s]
+Filter: 43%|████▎ | 348000/818627 [00:39<00:53, 8791.01 examples/s]
+Filter: 43%|████▎ | 349000/818627 [00:39<00:53, 8748.79 examples/s]
+Filter: 43%|████▎ | 349000/818627 [00:39<00:53, 8752.91 examples/s]
+Filter: 43%|████▎ | 349000/818627 [00:39<00:53, 8755.53 examples/s]
+Filter: 43%|████▎ | 349000/818627 [00:39<00:53, 8758.87 examples/s]
+Filter: 43%|████▎ | 349000/818627 [00:39<00:53, 8756.47 examples/s]
+Filter: 43%|████▎ | 349000/818627 [00:39<00:53, 8751.07 examples/s]
+Filter: 43%|████▎ | 349000/818627 [00:39<00:53, 8754.71 examples/s]
+Filter: 43%|████▎ | 349000/818627 [00:39<00:53, 8746.88 examples/s]
+Filter: 43%|████▎ | 350000/818627 [00:39<00:53, 8721.96 examples/s]
+Filter: 43%|████▎ | 350000/818627 [00:39<00:53, 8725.39 examples/s]
+Filter: 43%|████▎ | 350000/818627 [00:39<00:53, 8726.27 examples/s]
+Filter: 43%|████▎ | 350000/818627 [00:39<00:53, 8726.66 examples/s]
+Filter: 43%|████▎ | 350000/818627 [00:39<00:53, 8725.78 examples/s]
+Filter: 43%|████▎ | 350000/818627 [00:39<00:53, 8724.20 examples/s]
+Filter: 43%|████▎ | 350000/818627 [00:39<00:53, 8722.45 examples/s]
+Filter: 43%|████▎ | 350000/818627 [00:39<00:53, 8722.08 examples/s]
+Filter: 43%|████▎ | 351000/818627 [00:39<00:53, 8727.29 examples/s]
+Filter: 43%|████▎ | 351000/818627 [00:39<00:53, 8725.90 examples/s]
+Filter: 43%|████▎ | 351000/818627 [00:39<00:53, 8727.27 examples/s]
+Filter: 43%|████▎ | 351000/818627 [00:39<00:53, 8726.77 examples/s]
+Filter: 43%|████▎ | 351000/818627 [00:39<00:53, 8730.06 examples/s]
+Filter: 43%|████▎ | 351000/818627 [00:39<00:53, 8726.79 examples/s]
+Filter: 43%|████▎ | 351000/818627 [00:39<00:53, 8726.25 examples/s]
+Filter: 43%|████▎ | 351000/818627 [00:39<00:53, 8716.96 examples/s]
+Filter: 43%|████▎ | 352000/818627 [00:39<00:53, 8712.65 examples/s]
+Filter: 43%|████▎ | 352000/818627 [00:39<00:53, 8712.36 examples/s]
+Filter: 43%|████▎ | 352000/818627 [00:39<00:53, 8709.07 examples/s]
+Filter: 43%|████▎ | 352000/818627 [00:40<00:53, 8713.38 examples/s]
+Filter: 43%|████▎ | 352000/818627 [00:39<00:53, 8713.17 examples/s]
+Filter: 43%|████▎ | 352000/818627 [00:39<00:53, 8713.17 examples/s]
+Filter: 43%|████▎ | 352000/818627 [00:39<00:53, 8717.28 examples/s]
+Filter: 43%|████▎ | 352000/818627 [00:39<00:53, 8712.19 examples/s]
+Filter: 43%|████▎ | 353000/818627 [00:39<00:52, 8847.63 examples/s]
+Filter: 43%|████▎ | 353000/818627 [00:39<00:52, 8848.35 examples/s]
+Filter: 43%|████▎ | 353000/818627 [00:40<00:52, 8848.76 examples/s]
+Filter: 43%|████▎ | 353000/818627 [00:39<00:52, 8851.37 examples/s]
+Filter: 43%|████▎ | 353000/818627 [00:39<00:52, 8850.46 examples/s]
+Filter: 43%|████▎ | 353000/818627 [00:39<00:52, 8846.60 examples/s]
+Filter: 43%|████▎ | 353000/818627 [00:39<00:52, 8848.66 examples/s]
+Filter: 43%|████▎ | 353000/818627 [00:39<00:52, 8792.67 examples/s]
+Filter: 43%|████▎ | 354000/818627 [00:39<00:51, 9012.45 examples/s]
+Filter: 43%|████▎ | 354000/818627 [00:39<00:51, 8995.77 examples/s]
+Filter: 43%|████▎ | 354000/818627 [00:39<00:51, 8988.01 examples/s]
+Filter: 43%|████▎ | 354000/818627 [00:40<00:51, 8993.91 examples/s]
+Filter: 43%|████▎ | 354000/818627 [00:39<00:51, 8995.43 examples/s]
+Filter: 43%|████▎ | 354000/818627 [00:39<00:51, 8988.16 examples/s]
+Filter: 43%|████▎ | 354000/818627 [00:39<00:51, 8993.73 examples/s]
+Filter: 43%|████▎ | 354000/818627 [00:40<00:51, 8989.19 examples/s]
+Filter: 43%|████▎ | 355000/818627 [00:40<00:50, 9173.11 examples/s]
+Filter: 43%|████▎ | 355000/818627 [00:40<00:50, 9161.67 examples/s]
+Filter: 43%|████▎ | 355000/818627 [00:40<00:50, 9158.98 examples/s]
+Filter: 43%|████▎ | 355000/818627 [00:40<00:50, 9157.55 examples/s]
+Filter: 43%|████▎ | 355000/818627 [00:40<00:50, 9162.79 examples/s]
+Filter: 43%|████▎ | 355000/818627 [00:40<00:50, 9157.14 examples/s]
+Filter: 43%|████▎ | 355000/818627 [00:40<00:50, 9157.74 examples/s]
+Filter: 43%|████▎ | 355000/818627 [00:40<00:50, 9147.07 examples/s]
+Filter: 43%|████▎ | 356000/818627 [00:40<00:51, 8992.21 examples/s]
+Filter: 43%|████▎ | 356000/818627 [00:40<00:51, 8986.74 examples/s]
+Filter: 43%|████▎ | 356000/818627 [00:40<00:51, 8987.28 examples/s]
+Filter: 43%|████▎ | 356000/818627 [00:40<00:51, 8986.87 examples/s]
+Filter: 43%|████▎ | 356000/818627 [00:40<00:51, 8985.33 examples/s]
+Filter: 43%|████▎ | 356000/818627 [00:40<00:51, 8986.40 examples/s]
+Filter: 43%|████▎ | 356000/818627 [00:40<00:51, 8986.90 examples/s]
+Filter: 43%|████▎ | 356000/818627 [00:40<00:51, 8984.47 examples/s]
+Filter: 44%|████▎ | 357000/818627 [00:40<00:51, 8905.88 examples/s]
+Filter: 44%|████▎ | 357000/818627 [00:40<00:51, 8903.41 examples/s]
+Filter: 44%|████▎ | 357000/818627 [00:40<00:51, 8901.78 examples/s]
+Filter: 44%|████▎ | 357000/818627 [00:40<00:51, 8898.66 examples/s]
+Filter: 44%|████▎ | 357000/818627 [00:40<00:51, 8896.33 examples/s]
+Filter: 44%|████▎ | 357000/818627 [00:40<00:51, 8898.68 examples/s]
+Filter: 44%|████▎ | 357000/818627 [00:40<00:51, 8893.96 examples/s]
+Filter: 44%|████▎ | 357000/818627 [00:40<00:52, 8870.46 examples/s]
+Filter: 44%|████▎ | 358000/818627 [00:40<00:51, 8907.76 examples/s]
+Filter: 44%|████▎ | 358000/818627 [00:40<00:51, 8916.77 examples/s]
+Filter: 44%|████▎ | 358000/818627 [00:40<00:51, 8904.32 examples/s]
+Filter: 44%|████▎ | 358000/818627 [00:40<00:51, 8903.11 examples/s]
+Filter: 44%|████▎ | 358000/818627 [00:40<00:51, 8901.25 examples/s]
+Filter: 44%|████▎ | 358000/818627 [00:40<00:51, 8900.52 examples/s]
+Filter: 44%|████▎ | 358000/818627 [00:40<00:51, 8862.34 examples/s]
+Filter: 44%|████▎ | 358000/818627 [00:40<00:52, 8851.51 examples/s]
+Filter: 44%|████▍ | 359000/818627 [00:40<00:51, 8926.36 examples/s]
+Filter: 44%|████▍ | 359000/818627 [00:40<00:51, 8930.91 examples/s]
+Filter: 44%|████▍ | 359000/818627 [00:40<00:51, 8923.85 examples/s]
+Filter: 44%|████▍ | 359000/818627 [00:40<00:51, 8941.34 examples/s]
+Filter: 44%|████▍ | 359000/818627 [00:40<00:51, 8923.02 examples/s]
+Filter: 44%|████▍ | 359000/818627 [00:40<00:51, 8924.18 examples/s]
+Filter: 44%|████▍ | 359000/818627 [00:40<00:51, 8933.76 examples/s]
+Filter: 44%|████▍ | 359000/818627 [00:40<00:51, 8921.58 examples/s]
+Filter: 44%|████▍ | 360000/818627 [00:40<00:53, 8538.55 examples/s]
+Filter: 44%|████▍ | 360000/818627 [00:40<00:53, 8540.56 examples/s]
+Filter: 44%|████▍ | 360000/818627 [00:40<00:53, 8535.36 examples/s]
+Filter: 44%|████▍ | 360000/818627 [00:40<00:53, 8544.33 examples/s]
+Filter: 44%|████▍ | 360000/818627 [00:40<00:53, 8535.36 examples/s]
+Filter: 44%|████▍ | 360000/818627 [00:40<00:53, 8543.37 examples/s]
+Filter: 44%|████▍ | 360000/818627 [00:40<00:53, 8533.74 examples/s]
+Filter: 44%|████▍ | 360000/818627 [00:40<00:53, 8534.91 examples/s]
+Filter: 44%|████▍ | 361000/818627 [00:40<00:55, 8196.95 examples/s]
+Filter: 44%|████▍ | 361000/818627 [00:40<00:55, 8192.38 examples/s]
+Filter: 44%|████▍ | 361000/818627 [00:40<00:55, 8190.96 examples/s]
+Filter: 44%|████▍ | 361000/818627 [00:41<00:55, 8202.23 examples/s]
+Filter: 44%|████▍ | 361000/818627 [00:40<00:55, 8196.42 examples/s]
+Filter: 44%|████▍ | 361000/818627 [00:40<00:55, 8193.27 examples/s]
+Filter: 44%|████▍ | 361000/818627 [00:40<00:55, 8197.34 examples/s]
+Filter: 44%|████▍ | 361000/818627 [00:40<00:55, 8194.56 examples/s]
+Filter: 44%|████▍ | 362000/818627 [00:40<00:54, 8304.34 examples/s]
+Filter: 44%|████▍ | 362000/818627 [00:40<00:54, 8304.72 examples/s]
+Filter: 44%|████▍ | 362000/818627 [00:40<00:55, 8300.77 examples/s]
+Filter: 44%|████▍ | 362000/818627 [00:41<00:54, 8305.11 examples/s]
+Filter: 44%|████▍ | 362000/818627 [00:40<00:54, 8307.27 examples/s]
+Filter: 44%|████▍ | 362000/818627 [00:40<00:55, 8302.17 examples/s]
+Filter: 44%|████▍ | 362000/818627 [00:40<00:54, 8306.33 examples/s]
+Filter: 44%|████▍ | 362000/818627 [00:40<00:54, 8303.68 examples/s]
+Filter: 44%|████▍ | 363000/818627 [00:40<00:52, 8634.11 examples/s]
+Filter: 44%|████▍ | 363000/818627 [00:40<00:52, 8631.23 examples/s]
+Filter: 44%|████▍ | 363000/818627 [00:40<00:52, 8628.51 examples/s]
+Filter: 44%|████▍ | 363000/818627 [00:41<00:52, 8632.85 examples/s]
+Filter: 44%|████▍ | 363000/818627 [00:40<00:52, 8633.61 examples/s]
+Filter: 44%|████▍ | 363000/818627 [00:40<00:52, 8636.78 examples/s]
+Filter: 44%|████▍ | 363000/818627 [00:40<00:52, 8636.35 examples/s]
+Filter: 44%|████▍ | 363000/818627 [00:41<00:52, 8631.40 examples/s]
+Filter: 44%|████▍ | 364000/818627 [00:41<00:51, 8908.34 examples/s]
+Filter: 44%|████▍ | 364000/818627 [00:41<00:51, 8909.21 examples/s]
+Filter: 44%|████▍ | 364000/818627 [00:41<00:51, 8905.93 examples/s]
+Filter: 44%|████▍ | 364000/818627 [00:41<00:51, 8911.26 examples/s]
+Filter: 44%|████▍ | 364000/818627 [00:41<00:51, 8905.21 examples/s]
+Filter: 44%|████▍ | 364000/818627 [00:41<00:51, 8906.79 examples/s]
+Filter: 44%|████▍ | 364000/818627 [00:41<00:51, 8907.99 examples/s]
+Filter: 44%|████▍ | 364000/818627 [00:41<00:51, 8849.18 examples/s]
+Filter: 45%|████▍ | 365000/818627 [00:41<00:49, 9182.11 examples/s]
+Filter: 45%|████▍ | 365000/818627 [00:41<00:49, 9173.74 examples/s]
+Filter: 45%|████▍ | 365000/818627 [00:41<00:49, 9178.21 examples/s]
+Filter: 45%|████▍ | 365000/818627 [00:41<00:49, 9183.48 examples/s]
+Filter: 45%|████▍ | 365000/818627 [00:41<00:49, 9181.40 examples/s]
+Filter: 45%|████▍ | 365000/818627 [00:41<00:49, 9178.64 examples/s]
+Filter: 45%|████▍ | 365000/818627 [00:41<00:49, 9078.28 examples/s]
+Filter: 45%|████▍ | 366000/818627 [00:41<00:49, 9149.49 examples/s]
+Filter: 45%|████▍ | 366000/818627 [00:41<00:49, 9148.93 examples/s]
+Filter: 45%|████▍ | 366000/818627 [00:41<00:49, 9146.93 examples/s]
+Filter: 45%|████▍ | 366000/818627 [00:41<00:49, 9152.42 examples/s]
+Filter: 45%|████▍ | 366000/818627 [00:41<00:49, 9154.70 examples/s]
+Filter: 45%|████▍ | 366000/818627 [00:41<00:49, 9172.17 examples/s]
+Filter: 45%|████▍ | 366000/818627 [00:41<00:49, 9177.08 examples/s]
+Filter: 45%|████▍ | 366000/818627 [00:41<00:49, 9146.62 examples/s]
+Filter: 45%|████▍ | 367000/818627 [00:41<00:50, 8965.65 examples/s]
+Filter: 45%|████▍ | 367000/818627 [00:41<00:50, 8968.91 examples/s]
+Filter: 45%|████▍ | 367000/818627 [00:41<00:50, 8967.71 examples/s]
+Filter: 45%|████▍ | 367000/818627 [00:41<00:50, 8965.94 examples/s]
+Filter: 45%|████▍ | 367000/818627 [00:41<00:50, 8967.70 examples/s]
+Filter: 45%|████▍ | 367000/818627 [00:41<00:50, 8968.41 examples/s]
+Filter: 45%|████▍ | 367000/818627 [00:41<00:50, 8984.40 examples/s]
+Filter: 45%|████▍ | 367000/818627 [00:41<00:50, 9011.63 examples/s]
+Filter: 45%|████▍ | 368000/818627 [00:41<00:50, 8907.10 examples/s]
+Filter: 45%|████▍ | 368000/818627 [00:41<00:50, 8906.70 examples/s]
+Filter: 45%|████▍ | 368000/818627 [00:41<00:50, 8902.03 examples/s]
+Filter: 45%|████▍ | 368000/818627 [00:41<00:50, 8903.87 examples/s]
+Filter: 45%|████▍ | 368000/818627 [00:41<00:50, 8910.54 examples/s]
+Filter: 45%|████▍ | 368000/818627 [00:41<00:50, 8922.59 examples/s]
+Filter: 45%|████▍ | 368000/818627 [00:41<00:50, 8908.39 examples/s]
+Filter: 45%|████▍ | 368000/818627 [00:41<00:50, 8950.32 examples/s]
+Filter: 45%|████▌ | 369000/818627 [00:41<00:50, 8842.43 examples/s]
+Filter: 45%|████▌ | 369000/818627 [00:41<00:50, 8840.17 examples/s]
+Filter: 45%|████▌ | 369000/818627 [00:41<00:50, 8840.36 examples/s]
+Filter: 45%|████▌ | 369000/818627 [00:41<00:50, 8852.37 examples/s]
+Filter: 45%|████▌ | 369000/818627 [00:41<00:50, 8841.57 examples/s]
+Filter: 45%|████▌ | 369000/818627 [00:41<00:50, 8839.68 examples/s]
+Filter: 45%|████▌ | 369000/818627 [00:41<00:50, 8875.32 examples/s]
+Filter: 45%|████▌ | 369000/818627 [00:41<00:51, 8764.29 examples/s]
+Filter: 45%|████▌ | 370000/818627 [00:41<00:49, 9024.31 examples/s]
+Filter: 45%|████▌ | 370000/818627 [00:41<00:49, 9004.05 examples/s]
+Filter: 45%|████▌ | 370000/818627 [00:41<00:49, 9016.41 examples/s]
+Filter: 45%|████▌ | 370000/818627 [00:41<00:49, 8980.68 examples/s]
+Filter: 45%|████▌ | 370000/818627 [00:41<00:49, 8992.90 examples/s]
+Filter: 45%|████▌ | 370000/818627 [00:41<00:49, 8993.16 examples/s]
+Filter: 45%|████▌ | 370000/818627 [00:42<00:49, 8977.74 examples/s]
+Filter: 45%|████▌ | 370000/818627 [00:41<00:49, 8982.16 examples/s]
+Filter: 45%|████▌ | 371000/818627 [00:41<00:48, 9180.80 examples/s]
+Filter: 45%|████▌ | 371000/818627 [00:41<00:48, 9194.56 examples/s]
+Filter: 45%|████▌ | 371000/818627 [00:41<00:48, 9185.32 examples/s]
+Filter: 45%|████▌ | 371000/818627 [00:41<00:48, 9181.45 examples/s]
+Filter: 45%|████▌ | 371000/818627 [00:41<00:48, 9186.40 examples/s]
+Filter: 45%|████▌ | 371000/818627 [00:41<00:48, 9180.79 examples/s]
+Filter: 45%|████▌ | 371000/818627 [00:41<00:48, 9179.53 examples/s]
+Filter: 45%|████▌ | 371000/818627 [00:42<00:48, 9143.46 examples/s]
+Filter: 45%|████▌ | 372000/818627 [00:41<00:47, 9417.78 examples/s]
+Filter: 45%|████▌ | 372000/818627 [00:41<00:47, 9404.52 examples/s]
+Filter: 45%|████▌ | 372000/818627 [00:41<00:47, 9408.09 examples/s]
+Filter: 45%|████▌ | 372000/818627 [00:42<00:47, 9407.47 examples/s]
+Filter: 45%|████▌ | 372000/818627 [00:41<00:47, 9409.66 examples/s]
+Filter: 45%|████▌ | 372000/818627 [00:41<00:47, 9399.81 examples/s]
+Filter: 45%|████▌ | 372000/818627 [00:41<00:47, 9408.48 examples/s]
+Filter: 46%|████▌ | 373000/818627 [00:42<00:47, 9284.38 examples/s]
+Filter: 46%|████▌ | 373000/818627 [00:42<00:48, 9276.48 examples/s]
+Filter: 46%|████▌ | 373000/818627 [00:42<00:48, 9279.70 examples/s]
+Filter: 46%|████▌ | 373000/818627 [00:42<00:47, 9325.02 examples/s]
+Filter: 46%|████▌ | 373000/818627 [00:42<00:47, 9285.36 examples/s]
+Filter: 46%|████▌ | 373000/818627 [00:42<00:47, 9288.45 examples/s]
+Filter: 46%|████▌ | 373000/818627 [00:42<00:48, 9278.79 examples/s]
+Filter: 46%|████▌ | 373000/818627 [00:42<00:48, 9274.98 examples/s]
+Filter: 46%|████▌ | 374000/818627 [00:42<00:49, 9037.02 examples/s]
+Filter: 46%|████▌ | 374000/818627 [00:42<00:49, 9028.98 examples/s]
+Filter: 46%|████▌ | 374000/818627 [00:42<00:49, 9030.15 examples/s]
+Filter: 46%|████▌ | 374000/818627 [00:42<00:48, 9102.74 examples/s]
+Filter: 46%|████▌ | 374000/818627 [00:42<00:49, 9036.05 examples/s]
+Filter: 46%|████▌ | 374000/818627 [00:42<00:49, 9031.22 examples/s]
+Filter: 46%|████▌ | 374000/818627 [00:42<00:49, 9034.17 examples/s]
+Filter: 46%|████▌ | 374000/818627 [00:42<00:49, 9034.03 examples/s]
+Filter: 46%|████▌ | 375000/818627 [00:42<00:49, 8894.36 examples/s]
+Filter: 46%|████▌ | 375000/818627 [00:42<00:49, 8887.95 examples/s]
+Filter: 46%|████▌ | 375000/818627 [00:42<00:49, 8956.59 examples/s]
+Filter: 46%|████▌ | 375000/818627 [00:42<00:49, 8892.00 examples/s]
+Filter: 46%|████▌ | 375000/818627 [00:42<00:49, 8894.48 examples/s]
+Filter: 46%|████▌ | 375000/818627 [00:42<00:49, 8891.21 examples/s]
+Filter: 46%|████▌ | 375000/818627 [00:42<00:49, 8873.79 examples/s]
+Filter: 46%|████▌ | 375000/818627 [00:42<00:49, 8893.73 examples/s]
+Filter: 46%|████▌ | 376000/818627 [00:42<00:49, 8861.81 examples/s]
+Filter: 46%|████▌ | 376000/818627 [00:42<00:49, 8858.58 examples/s]
+Filter: 46%|████▌ | 376000/818627 [00:42<00:49, 8858.21 examples/s]
+Filter: 46%|████▌ | 376000/818627 [00:42<00:49, 8864.18 examples/s]
+Filter: 46%|████▌ | 376000/818627 [00:42<00:49, 8908.73 examples/s]
+Filter: 46%|████▌ | 376000/818627 [00:42<00:49, 8859.50 examples/s]
+Filter: 46%|████▌ | 376000/818627 [00:42<00:49, 8857.28 examples/s]
+Filter: 46%|████▌ | 376000/818627 [00:42<00:49, 8861.58 examples/s]
+Filter: 46%|████▌ | 377000/818627 [00:42<00:50, 8765.96 examples/s]
+Filter: 46%|████▌ | 377000/818627 [00:42<00:50, 8765.83 examples/s]
+Filter: 46%|████▌ | 377000/818627 [00:42<00:50, 8762.11 examples/s]
+Filter: 46%|████▌ | 377000/818627 [00:42<00:50, 8807.32 examples/s]
+Filter: 46%|████▌ | 377000/818627 [00:42<00:50, 8763.42 examples/s]
+Filter: 46%|████▌ | 377000/818627 [00:42<00:50, 8762.41 examples/s]
+Filter: 46%|████▌ | 377000/818627 [00:42<00:50, 8762.83 examples/s]
+Filter: 46%|████▌ | 377000/818627 [00:42<00:50, 8765.23 examples/s]
+Filter: 46%|████▌ | 378000/818627 [00:42<00:50, 8738.86 examples/s]
+Filter: 46%|████▌ | 378000/818627 [00:42<00:50, 8744.69 examples/s]
+Filter: 46%|████▌ | 378000/818627 [00:42<00:50, 8736.59 examples/s]
+Filter: 46%|████▌ | 378000/818627 [00:42<00:50, 8775.44 examples/s]
+Filter: 46%|████▌ | 378000/818627 [00:42<00:50, 8741.38 examples/s]
+Filter: 46%|████▌ | 378000/818627 [00:42<00:50, 8735.13 examples/s]
+Filter: 46%|████▌ | 378000/818627 [00:42<00:50, 8742.00 examples/s]
+Filter: 46%|████▌ | 378000/818627 [00:42<00:50, 8735.33 examples/s]
+Filter: 46%|████▋ | 379000/818627 [00:42<00:48, 9083.17 examples/s]
+Filter: 46%|████▋ | 379000/818627 [00:42<00:48, 9077.51 examples/s]
+Filter: 46%|████▋ | 379000/818627 [00:42<00:48, 9079.28 examples/s]
+Filter: 46%|████▋ | 379000/818627 [00:43<00:48, 9091.22 examples/s]
+Filter: 46%|████▋ | 379000/818627 [00:42<00:48, 9077.62 examples/s]
+Filter: 46%|████▋ | 379000/818627 [00:42<00:48, 9077.21 examples/s]
+Filter: 46%|████▋ | 379000/818627 [00:42<00:48, 9077.14 examples/s]
+Filter: 46%|████▋ | 379000/818627 [00:42<00:48, 9076.46 examples/s]
+Filter: 46%|████▋ | 380000/818627 [00:42<00:48, 9086.19 examples/s]
+Filter: 46%|████▋ | 380000/818627 [00:42<00:48, 9089.30 examples/s]
+Filter: 46%|████▋ | 380000/818627 [00:42<00:48, 9085.75 examples/s]
+Filter: 46%|████▋ | 380000/818627 [00:43<00:48, 9096.40 examples/s]
+Filter: 46%|████▋ | 380000/818627 [00:42<00:48, 9085.43 examples/s]
+Filter: 46%|████▋ | 380000/818627 [00:42<00:48, 9085.77 examples/s]
+Filter: 46%|████▋ | 380000/818627 [00:42<00:48, 9084.41 examples/s]
+Filter: 46%|████▋ | 380000/818627 [00:42<00:48, 9083.86 examples/s]
+Filter: 47%|████▋ | 381000/818627 [00:42<00:48, 8934.89 examples/s]
+Filter: 47%|████▋ | 381000/818627 [00:42<00:48, 8936.32 examples/s]
+Filter: 47%|████▋ | 381000/818627 [00:42<00:48, 8933.70 examples/s]
+Filter: 47%|████▋ | 381000/818627 [00:43<00:48, 8943.36 examples/s]
+Filter: 47%|████▋ | 381000/818627 [00:42<00:48, 8935.16 examples/s]
+Filter: 47%|████▋ | 381000/818627 [00:43<00:48, 8934.94 examples/s]
+Filter: 47%|████▋ | 381000/818627 [00:42<00:48, 8938.54 examples/s]
+Filter: 47%|████▋ | 381000/818627 [00:42<00:48, 8933.94 examples/s]
+Filter: 47%|████▋ | 382000/818627 [00:43<00:49, 8845.23 examples/s]
+Filter: 47%|████▋ | 382000/818627 [00:43<00:49, 8847.52 examples/s]
+Filter: 47%|████▋ | 382000/818627 [00:43<00:49, 8845.15 examples/s]
+Filter: 47%|████▋ | 382000/818627 [00:43<00:49, 8850.40 examples/s]
+Filter: 47%|████▋ | 382000/818627 [00:43<00:49, 8848.53 examples/s]
+Filter: 47%|████▋ | 382000/818627 [00:43<00:49, 8847.75 examples/s]
+Filter: 47%|████▋ | 382000/818627 [00:43<00:49, 8843.71 examples/s]
+Filter: 47%|████▋ | 382000/818627 [00:43<00:49, 8845.44 examples/s]
+Filter: 47%|████▋ | 383000/818627 [00:43<00:49, 8790.47 examples/s]
+Filter: 47%|████▋ | 383000/818627 [00:43<00:49, 8790.57 examples/s]
+Filter: 47%|████▋ | 383000/818627 [00:43<00:49, 8788.17 examples/s]
+Filter: 47%|████▋ | 383000/818627 [00:43<00:49, 8797.03 examples/s]
+Filter: 47%|████▋ | 383000/818627 [00:43<00:49, 8794.38 examples/s]
+Filter: 47%|████▋ | 383000/818627 [00:43<00:49, 8791.49 examples/s]
+Filter: 47%|████▋ | 383000/818627 [00:43<00:49, 8791.27 examples/s]
+Filter: 47%|████▋ | 383000/818627 [00:43<00:49, 8790.08 examples/s]
+Filter: 47%|████▋ | 384000/818627 [00:43<00:48, 8965.96 examples/s]
+Filter: 47%|████▋ | 384000/818627 [00:43<00:48, 8965.69 examples/s]
+Filter: 47%|████▋ | 384000/818627 [00:43<00:48, 8963.48 examples/s]
+Filter: 47%|████▋ | 384000/818627 [00:43<00:48, 8962.62 examples/s]
+Filter: 47%|████▋ | 384000/818627 [00:43<00:48, 8964.02 examples/s]
+Filter: 47%|████▋ | 384000/818627 [00:43<00:48, 8960.16 examples/s]
+Filter: 47%|████▋ | 384000/818627 [00:43<00:48, 8962.64 examples/s]
+Filter: 47%|████▋ | 384000/818627 [00:43<00:51, 8380.72 examples/s]
+Filter: 47%|████▋ | 385000/818627 [00:43<00:48, 8891.46 examples/s]
+Filter: 47%|████▋ | 385000/818627 [00:43<00:48, 8890.18 examples/s]
+Filter: 47%|████▋ | 385000/818627 [00:43<00:48, 8886.25 examples/s]
+Filter: 47%|████▋ | 385000/818627 [00:43<00:48, 8890.71 examples/s]
+Filter: 47%|████▋ | 385000/818627 [00:43<00:48, 8890.81 examples/s]
+Filter: 47%|████▋ | 385000/818627 [00:43<00:48, 8888.32 examples/s]
+Filter: 47%|████▋ | 385000/818627 [00:43<00:48, 8888.82 examples/s]
+Filter: 47%|████▋ | 386000/818627 [00:43<00:48, 8882.96 examples/s]
+Filter: 47%|████▋ | 386000/818627 [00:43<00:48, 8878.65 examples/s]
+Filter: 47%|████▋ | 386000/818627 [00:43<00:47, 9031.73 examples/s]
+Filter: 47%|████▋ | 386000/818627 [00:43<00:48, 8876.85 examples/s]
+Filter: 47%|████▋ | 386000/818627 [00:43<00:48, 8878.88 examples/s]
+Filter: 47%|████▋ | 386000/818627 [00:43<00:48, 8879.27 examples/s]
+Filter: 47%|████▋ | 386000/818627 [00:43<00:48, 8877.95 examples/s]
+Filter: 47%|████▋ | 386000/818627 [00:43<00:48, 8877.58 examples/s]
+Filter: 47%|████▋ | 387000/818627 [00:43<00:48, 8841.74 examples/s]
+Filter: 47%|████▋ | 387000/818627 [00:43<00:48, 8840.06 examples/s]
+Filter: 47%|████▋ | 387000/818627 [00:43<00:48, 8960.19 examples/s]
+Filter: 47%|████▋ | 387000/818627 [00:43<00:48, 8837.43 examples/s]
+Filter: 47%|████▋ | 387000/818627 [00:43<00:48, 8838.96 examples/s]
+Filter: 47%|████▋ | 387000/818627 [00:43<00:48, 8836.40 examples/s]
+Filter: 47%|████▋ | 387000/818627 [00:43<00:48, 8837.47 examples/s]
+Filter: 47%|████▋ | 387000/818627 [00:43<00:48, 8839.09 examples/s]
+Filter: 47%|████▋ | 388000/818627 [00:43<00:48, 8796.74 examples/s]
+Filter: 47%|████▋ | 388000/818627 [00:43<00:48, 8795.05 examples/s]
+Filter: 47%|████▋ | 388000/818627 [00:43<00:48, 8795.57 examples/s]
+Filter: 47%|████▋ | 388000/818627 [00:44<00:48, 8888.96 examples/s]
+Filter: 47%|████▋ | 388000/818627 [00:43<00:48, 8798.21 examples/s]
+Filter: 47%|████▋ | 388000/818627 [00:43<00:48, 8796.35 examples/s]
+Filter: 47%|████▋ | 388000/818627 [00:43<00:48, 8795.11 examples/s]
+Filter: 47%|████▋ | 388000/818627 [00:43<00:48, 8795.79 examples/s]
+Filter: 48%|████▊ | 389000/818627 [00:43<00:49, 8740.71 examples/s]
+Filter: 48%|████▊ | 389000/818627 [00:43<00:49, 8739.14 examples/s]
+Filter: 48%|████▊ | 389000/818627 [00:44<00:48, 8814.52 examples/s]
+Filter: 48%|████▊ | 389000/818627 [00:43<00:49, 8738.98 examples/s]
+Filter: 48%|████▊ | 389000/818627 [00:43<00:49, 8741.06 examples/s]
+Filter: 48%|████▊ | 389000/818627 [00:43<00:49, 8741.28 examples/s]
+Filter: 48%|████▊ | 389000/818627 [00:43<00:49, 8739.03 examples/s]
+Filter: 48%|████▊ | 389000/818627 [00:43<00:49, 8740.98 examples/s]
+Filter: 48%|████▊ | 390000/818627 [00:43<00:49, 8739.49 examples/s]
+Filter: 48%|████▊ | 390000/818627 [00:43<00:49, 8739.39 examples/s]
+Filter: 48%|████▊ | 390000/818627 [00:44<00:48, 8792.89 examples/s]
+Filter: 48%|████▊ | 390000/818627 [00:43<00:49, 8735.83 examples/s]
+Filter: 48%|████▊ | 390000/818627 [00:43<00:49, 8738.59 examples/s]
+Filter: 48%|████▊ | 390000/818627 [00:43<00:49, 8742.91 examples/s]
+Filter: 48%|████▊ | 390000/818627 [00:43<00:49, 8738.48 examples/s]
+Filter: 48%|████▊ | 390000/818627 [00:44<00:49, 8735.89 examples/s]
+Filter: 48%|████▊ | 391000/818627 [00:44<00:49, 8679.60 examples/s]
+Filter: 48%|████▊ | 391000/818627 [00:44<00:49, 8718.54 examples/s]
+Filter: 48%|████▊ | 391000/818627 [00:44<00:49, 8680.18 examples/s]
+Filter: 48%|████▊ | 391000/818627 [00:44<00:49, 8671.89 examples/s]
+Filter: 48%|████▊ | 391000/818627 [00:44<00:49, 8680.53 examples/s]
+Filter: 48%|████▊ | 391000/818627 [00:44<00:49, 8679.65 examples/s]
+Filter: 48%|████▊ | 391000/818627 [00:44<00:49, 8679.40 examples/s]
+Filter: 48%|████▊ | 391000/818627 [00:44<00:49, 8678.73 examples/s]
+Filter: 48%|████▊ | 392000/818627 [00:44<00:47, 9006.19 examples/s]
+Filter: 48%|████▊ | 392000/818627 [00:44<00:47, 9008.05 examples/s]
+Filter: 48%|████▊ | 392000/818627 [00:44<00:47, 9023.78 examples/s]
+Filter: 48%|████▊ | 392000/818627 [00:44<00:47, 9006.50 examples/s]
+Filter: 48%|████▊ | 392000/818627 [00:44<00:47, 9010.34 examples/s]
+Filter: 48%|████▊ | 392000/818627 [00:44<00:47, 9006.66 examples/s]
+Filter: 48%|████▊ | 392000/818627 [00:44<00:47, 9004.23 examples/s]
+Filter: 48%|████▊ | 392000/818627 [00:44<00:47, 8995.13 examples/s]
+Filter: 48%|████▊ | 393000/818627 [00:44<00:47, 8891.68 examples/s]
+Filter: 48%|████▊ | 393000/818627 [00:44<00:47, 8888.17 examples/s]
+Filter: 48%|████▊ | 393000/818627 [00:44<00:47, 8897.79 examples/s]
+Filter: 48%|████▊ | 393000/818627 [00:44<00:47, 8880.95 examples/s]
+Filter: 48%|████▊ | 393000/818627 [00:44<00:47, 8891.23 examples/s]
+Filter: 48%|████▊ | 393000/818627 [00:44<00:47, 8890.11 examples/s]
+Filter: 48%|████▊ | 393000/818627 [00:44<00:47, 8888.79 examples/s]
+Filter: 48%|████▊ | 393000/818627 [00:44<00:47, 8885.51 examples/s]
+Filter: 48%|████▊ | 394000/818627 [00:44<00:48, 8843.43 examples/s]
+Filter: 48%|████▊ | 394000/818627 [00:44<00:48, 8842.35 examples/s]
+Filter: 48%|████▊ | 394000/818627 [00:44<00:47, 8855.34 examples/s]
+Filter: 48%|████▊ | 394000/818627 [00:44<00:48, 8839.42 examples/s]
+Filter: 48%|████▊ | 394000/818627 [00:44<00:48, 8845.68 examples/s]
+Filter: 48%|████▊ | 394000/818627 [00:44<00:48, 8842.18 examples/s]
+Filter: 48%|████▊ | 394000/818627 [00:44<00:48, 8840.92 examples/s]
+Filter: 48%|████▊ | 394000/818627 [00:44<00:48, 8837.20 examples/s]
+Filter: 48%|████▊ | 395000/818627 [00:44<00:48, 8755.81 examples/s]
+Filter: 48%|████▊ | 395000/818627 [00:44<00:48, 8758.24 examples/s]
+Filter: 48%|████▊ | 395000/818627 [00:44<00:48, 8766.24 examples/s]
+Filter: 48%|████▊ | 395000/818627 [00:44<00:48, 8757.79 examples/s]
+Filter: 48%|████▊ | 395000/818627 [00:44<00:48, 8757.96 examples/s]
+Filter: 48%|████▊ | 395000/818627 [00:44<00:48, 8755.16 examples/s]
+Filter: 48%|████▊ | 395000/818627 [00:44<00:48, 8753.70 examples/s]
+Filter: 48%|████▊ | 395000/818627 [00:44<00:48, 8754.09 examples/s]
+Filter: 48%|████▊ | 396000/818627 [00:44<00:48, 8753.12 examples/s]
+Filter: 48%|████▊ | 396000/818627 [00:44<00:48, 8755.50 examples/s]
+Filter: 48%|████▊ | 396000/818627 [00:44<00:48, 8758.53 examples/s]
+Filter: 48%|████▊ | 396000/818627 [00:44<00:48, 8752.24 examples/s]
+Filter: 48%|████▊ | 396000/818627 [00:44<00:48, 8753.10 examples/s]
+Filter: 48%|████▊ | 396000/818627 [00:44<00:48, 8752.68 examples/s]
+Filter: 48%|████▊ | 396000/818627 [00:44<00:48, 8749.29 examples/s]
+Filter: 48%|████▊ | 396000/818627 [00:44<00:48, 8699.45 examples/s]
+Filter: 48%|████▊ | 397000/818627 [00:44<00:48, 8692.11 examples/s]
+Filter: 48%|████▊ | 397000/818627 [00:44<00:48, 8678.94 examples/s]
+Filter: 48%|████▊ | 397000/818627 [00:44<00:48, 8682.84 examples/s]
+Filter: 48%|████▊ | 397000/818627 [00:44<00:48, 8681.41 examples/s]
+Filter: 48%|████▊ | 397000/818627 [00:44<00:48, 8683.31 examples/s]
+Filter: 48%|████▊ | 397000/818627 [00:44<00:48, 8677.51 examples/s]
+Filter: 48%|████▊ | 397000/818627 [00:45<00:48, 8671.79 examples/s]
+Filter: 48%|████▊ | 397000/818627 [00:44<00:48, 8675.31 examples/s]
+Filter: 49%|████▊ | 398000/818627 [00:44<00:48, 8679.16 examples/s]
+Filter: 49%|████▊ | 398000/818627 [00:44<00:48, 8666.48 examples/s]
+Filter: 49%|████▊ | 398000/818627 [00:45<00:48, 8674.28 examples/s]
+Filter: 49%|████▊ | 398000/818627 [00:44<00:48, 8666.96 examples/s]
+Filter: 49%|████▊ | 398000/818627 [00:44<00:48, 8668.20 examples/s]
+Filter: 49%|████▊ | 398000/818627 [00:44<00:48, 8664.81 examples/s]
+Filter: 49%|████▊ | 398000/818627 [00:44<00:48, 8667.69 examples/s]
+Filter: 49%|████▊ | 398000/818627 [00:44<00:48, 8667.16 examples/s]
+Filter: 49%|████▊ | 399000/818627 [00:44<00:46, 8958.42 examples/s]
+Filter: 49%|████▊ | 399000/818627 [00:45<00:46, 8959.47 examples/s]
+Filter: 49%|████▊ | 399000/818627 [00:44<00:46, 8951.37 examples/s]
+Filter: 49%|████▊ | 399000/818627 [00:44<00:46, 8950.52 examples/s]
+Filter: 49%|████▊ | 399000/818627 [00:44<00:46, 8949.30 examples/s]
+Filter: 49%|████▊ | 399000/818627 [00:45<00:46, 8948.64 examples/s]
+Filter: 49%|████▊ | 399000/818627 [00:44<00:46, 8949.54 examples/s]
+Filter: 49%|████▊ | 399000/818627 [00:44<00:46, 8949.49 examples/s]
+Filter: 49%|████▉ | 400000/818627 [00:45<00:47, 8873.56 examples/s]
+Filter: 49%|████▉ | 400000/818627 [00:45<00:47, 8875.64 examples/s]
+Filter: 49%|████▉ | 400000/818627 [00:45<00:47, 8873.66 examples/s]
+Filter: 49%|████▉ | 400000/818627 [00:45<00:47, 8872.63 examples/s]
+Filter: 49%|████▉ | 400000/818627 [00:45<00:47, 8874.99 examples/s]
+Filter: 49%|████▉ | 400000/818627 [00:45<00:47, 8872.27 examples/s]
+Filter: 49%|████▉ | 400000/818627 [00:45<00:47, 8862.31 examples/s]
+Filter: 49%|████▉ | 400000/818627 [00:45<00:47, 8871.27 examples/s]
+Filter: 49%|████▉ | 401000/818627 [00:45<00:47, 8830.74 examples/s]
+Filter: 49%|████▉ | 401000/818627 [00:45<00:47, 8828.08 examples/s]
+Filter: 49%|████▉ | 401000/818627 [00:45<00:47, 8823.69 examples/s]
+Filter: 49%|████▉ | 401000/818627 [00:45<00:47, 8824.44 examples/s]
+Filter: 49%|████▉ | 401000/818627 [00:45<00:47, 8822.81 examples/s]
+Filter: 49%|████▉ | 401000/818627 [00:45<00:47, 8823.10 examples/s]
+Filter: 49%|████▉ | 401000/818627 [00:45<00:47, 8822.61 examples/s]
+Filter: 49%|████▉ | 401000/818627 [00:45<00:47, 8824.79 examples/s]
+Filter: 49%|████▉ | 402000/818627 [00:45<00:47, 8792.85 examples/s]
+Filter: 49%|████▉ | 402000/818627 [00:45<00:47, 8797.03 examples/s]
+Filter: 49%|████▉ | 402000/818627 [00:45<00:47, 8791.24 examples/s]
+Filter: 49%|████▉ | 402000/818627 [00:45<00:47, 8786.64 examples/s]
+Filter: 49%|████▉ | 402000/818627 [00:45<00:47, 8789.43 examples/s]
+Filter: 49%|████▉ | 402000/818627 [00:45<00:47, 8784.93 examples/s]
+Filter: 49%|████▉ | 402000/818627 [00:45<00:47, 8780.06 examples/s]
+Filter: 49%|████▉ | 402000/818627 [00:45<00:47, 8792.34 examples/s]
+Filter: 49%|████▉ | 403000/818627 [00:45<00:47, 8706.55 examples/s]
+Filter: 49%|████▉ | 403000/818627 [00:45<00:47, 8702.63 examples/s]
+Filter: 49%|████▉ | 403000/818627 [00:45<00:47, 8698.56 examples/s]
+Filter: 49%|████▉ | 403000/818627 [00:45<00:47, 8702.36 examples/s]
+Filter: 49%|████▉ | 403000/818627 [00:45<00:47, 8702.90 examples/s]
+Filter: 49%|████▉ | 403000/818627 [00:45<00:47, 8701.29 examples/s]
+Filter: 49%|████▉ | 403000/818627 [00:45<00:47, 8698.53 examples/s]
+Filter: 49%|████▉ | 403000/818627 [00:45<00:47, 8698.92 examples/s]
+Filter: 49%|████▉ | 404000/818627 [00:45<00:47, 8685.18 examples/s]
+Filter: 49%|████▉ | 404000/818627 [00:45<00:47, 8682.82 examples/s]
+Filter: 49%|████▉ | 404000/818627 [00:45<00:47, 8682.29 examples/s]
+Filter: 49%|████▉ | 404000/818627 [00:45<00:47, 8677.78 examples/s]
+Filter: 49%|████▉ | 404000/818627 [00:45<00:47, 8684.58 examples/s]
+Filter: 49%|████▉ | 404000/818627 [00:45<00:47, 8684.59 examples/s]
+Filter: 49%|████▉ | 404000/818627 [00:45<00:47, 8680.91 examples/s]
+Filter: 49%|████▉ | 404000/818627 [00:45<00:47, 8684.26 examples/s]
+Filter: 49%|████▉ | 405000/818627 [00:45<00:47, 8667.47 examples/s]
+Filter: 49%|████▉ | 405000/818627 [00:45<00:47, 8666.01 examples/s]
+Filter: 49%|████▉ | 405000/818627 [00:45<00:47, 8667.02 examples/s]
+Filter: 49%|████▉ | 405000/818627 [00:46<00:47, 8663.70 examples/s]
+Filter: 49%|████▉ | 405000/818627 [00:45<00:47, 8664.74 examples/s]
+Filter: 49%|████▉ | 405000/818627 [00:45<00:47, 8663.55 examples/s]
+Filter: 49%|████▉ | 405000/818627 [00:45<00:47, 8664.20 examples/s]
+Filter: 49%|████▉ | 405000/818627 [00:45<00:47, 8660.48 examples/s]
+Filter: 50%|████▉ | 406000/818627 [00:45<00:47, 8645.22 examples/s]
+Filter: 50%|████▉ | 406000/818627 [00:45<00:47, 8643.62 examples/s]
+Filter: 50%|████▉ | 406000/818627 [00:46<00:47, 8643.34 examples/s]
+Filter: 50%|████▉ | 406000/818627 [00:45<00:47, 8644.89 examples/s]
+Filter: 50%|████▉ | 406000/818627 [00:45<00:47, 8643.58 examples/s]
+Filter: 50%|████▉ | 406000/818627 [00:45<00:47, 8643.65 examples/s]
+Filter: 50%|████▉ | 406000/818627 [00:45<00:47, 8643.23 examples/s]
+Filter: 50%|████▉ | 406000/818627 [00:45<00:47, 8642.34 examples/s]
+Filter: 50%|████▉ | 407000/818627 [00:45<00:47, 8661.16 examples/s]
+Filter: 50%|████▉ | 407000/818627 [00:46<00:47, 8664.04 examples/s]
+Filter: 50%|████▉ | 407000/818627 [00:45<00:47, 8658.94 examples/s]
+Filter: 50%|████▉ | 407000/818627 [00:45<00:47, 8662.40 examples/s]
+Filter: 50%|████▉ | 407000/818627 [00:45<00:47, 8661.99 examples/s]
+Filter: 50%|████▉ | 407000/818627 [00:46<00:47, 8661.01 examples/s]
+Filter: 50%|████▉ | 407000/818627 [00:45<00:47, 8660.03 examples/s]
+Filter: 50%|████▉ | 407000/818627 [00:45<00:47, 8661.08 examples/s]
+Filter: 50%|████▉ | 408000/818627 [00:46<00:47, 8646.93 examples/s]
+Filter: 50%|████▉ | 408000/818627 [00:46<00:47, 8647.01 examples/s]
+Filter: 50%|████▉ | 408000/818627 [00:46<00:47, 8644.33 examples/s]
+Filter: 50%|████▉ | 408000/818627 [00:46<00:47, 8645.74 examples/s]
+Filter: 50%|████▉ | 408000/818627 [00:46<00:47, 8647.42 examples/s]
+Filter: 50%|████▉ | 408000/818627 [00:46<00:47, 8645.91 examples/s]
+Filter: 50%|████▉ | 408000/818627 [00:46<00:47, 8645.10 examples/s]
+Filter: 50%|████▉ | 408000/818627 [00:46<00:47, 8648.95 examples/s]
+Filter: 50%|████▉ | 409000/818627 [00:46<00:47, 8655.95 examples/s]
+Filter: 50%|████▉ | 409000/818627 [00:46<00:47, 8656.17 examples/s]
+Filter: 50%|████▉ | 409000/818627 [00:46<00:47, 8650.03 examples/s]
+Filter: 50%|████▉ | 409000/818627 [00:46<00:47, 8658.83 examples/s]
+Filter: 50%|████▉ | 409000/818627 [00:46<00:47, 8643.33 examples/s]
+Filter: 50%|████▉ | 409000/818627 [00:46<00:47, 8654.94 examples/s]
+Filter: 50%|████▉ | 409000/818627 [00:46<00:47, 8652.10 examples/s]
+Filter: 50%|████▉ | 409000/818627 [00:46<00:47, 8647.46 examples/s]
+Filter: 50%|█████ | 410000/818627 [00:46<00:47, 8644.37 examples/s]
+Filter: 50%|█████ | 410000/818627 [00:46<00:47, 8647.24 examples/s]
+Filter: 50%|█████ | 410000/818627 [00:46<00:47, 8642.48 examples/s]
+Filter: 50%|█████ | 410000/818627 [00:46<00:47, 8636.69 examples/s]
+Filter: 50%|█████ | 410000/818627 [00:46<00:47, 8643.16 examples/s]
+Filter: 50%|█████ | 410000/818627 [00:46<00:47, 8642.90 examples/s]
+Filter: 50%|█████ | 410000/818627 [00:46<00:47, 8644.47 examples/s]
+Filter: 50%|█████ | 410000/818627 [00:46<00:47, 8643.62 examples/s]
+Filter: 50%|█████ | 411000/818627 [00:46<00:48, 8481.05 examples/s]
+Filter: 50%|█████ | 411000/818627 [00:46<00:48, 8482.39 examples/s]
+Filter: 50%|█████ | 411000/818627 [00:46<00:48, 8478.22 examples/s]
+Filter: 50%|█████ | 411000/818627 [00:46<00:48, 8476.96 examples/s]
+Filter: 50%|█████ | 411000/818627 [00:46<00:48, 8484.07 examples/s]
+Filter: 50%|█████ | 411000/818627 [00:46<00:48, 8481.64 examples/s]
+Filter: 50%|█████ | 411000/818627 [00:46<00:48, 8480.02 examples/s]
+Filter: 50%|█████ | 411000/818627 [00:46<00:48, 8482.38 examples/s]
+Filter: 50%|█████ | 412000/818627 [00:46<00:48, 8347.86 examples/s]
+Filter: 50%|█████ | 412000/818627 [00:46<00:48, 8344.88 examples/s]
+Filter: 50%|█████ | 412000/818627 [00:46<00:48, 8347.23 examples/s]
+Filter: 50%|█████ | 412000/818627 [00:46<00:48, 8349.55 examples/s]
+Filter: 50%|█████ | 412000/818627 [00:46<00:48, 8340.68 examples/s]
+Filter: 50%|█████ | 412000/818627 [00:46<00:48, 8344.32 examples/s]
+Filter: 50%|█████ | 412000/818627 [00:46<00:48, 8345.81 examples/s]
+Filter: 50%|█████ | 412000/818627 [00:46<00:48, 8347.84 examples/s]
+Filter: 50%|█████ | 413000/818627 [00:46<00:46, 8659.13 examples/s]
+Filter: 50%|█████ | 413000/818627 [00:46<00:46, 8661.08 examples/s]
+Filter: 50%|█████ | 413000/818627 [00:46<00:46, 8660.70 examples/s]
+Filter: 50%|█████ | 413000/818627 [00:46<00:46, 8660.86 examples/s]
+Filter: 50%|█████ | 413000/818627 [00:46<00:46, 8659.56 examples/s]
+Filter: 50%|█████ | 413000/818627 [00:46<00:46, 8659.77 examples/s]
+Filter: 50%|█████ | 413000/818627 [00:46<00:46, 8659.69 examples/s]
+Filter: 50%|█████ | 413000/818627 [00:46<00:46, 8661.02 examples/s]
+Filter: 51%|█████ | 414000/818627 [00:46<00:46, 8657.13 examples/s]
+Filter: 51%|█████ | 414000/818627 [00:46<00:46, 8656.62 examples/s]
+Filter: 51%|█████ | 414000/818627 [00:47<00:46, 8659.55 examples/s]
+Filter: 51%|█████ | 414000/818627 [00:46<00:46, 8657.79 examples/s]
+Filter: 51%|█████ | 414000/818627 [00:46<00:46, 8659.10 examples/s]
+Filter: 51%|█████ | 414000/818627 [00:46<00:46, 8652.57 examples/s]
+Filter: 51%|█████ | 414000/818627 [00:46<00:46, 8652.12 examples/s]
+Filter: 51%|█████ | 414000/818627 [00:46<00:46, 8657.34 examples/s]
+Filter: 51%|█████ | 415000/818627 [00:46<00:44, 9007.00 examples/s]
+Filter: 51%|█████ | 415000/818627 [00:46<00:44, 9006.30 examples/s]
+Filter: 51%|█████ | 415000/818627 [00:47<00:44, 9006.96 examples/s]
+Filter: 51%|█████ | 415000/818627 [00:46<00:44, 9006.41 examples/s]
+Filter: 51%|█████ | 415000/818627 [00:46<00:44, 9004.89 examples/s]
+Filter: 51%|█████ | 415000/818627 [00:46<00:44, 9005.32 examples/s]
+Filter: 51%|█████ | 415000/818627 [00:46<00:44, 9004.51 examples/s]
+Filter: 51%|█████ | 415000/818627 [00:46<00:44, 8998.65 examples/s]
+Filter: 51%|█████ | 416000/818627 [00:47<00:44, 9049.11 examples/s]
+Filter: 51%|█████ | 416000/818627 [00:46<00:44, 9044.11 examples/s]
+Filter: 51%|█████ | 416000/818627 [00:46<00:44, 9046.20 examples/s]
+Filter: 51%|█████ | 416000/818627 [00:46<00:44, 9034.37 examples/s]
+Filter: 51%|█████ | 416000/818627 [00:47<00:44, 9048.50 examples/s]
+Filter: 51%|█████ | 416000/818627 [00:46<00:44, 9043.61 examples/s]
+Filter: 51%|█████ | 416000/818627 [00:46<00:44, 9041.21 examples/s]
+Filter: 51%|█████ | 416000/818627 [00:46<00:44, 9047.30 examples/s]
+Filter: 51%|█████ | 417000/818627 [00:47<00:44, 8965.26 examples/s]
+Filter: 51%|█████ | 417000/818627 [00:47<00:44, 8963.27 examples/s]
+Filter: 51%|█████ | 417000/818627 [00:47<00:44, 8961.31 examples/s]
+Filter: 51%|█████ | 417000/818627 [00:47<00:44, 8961.93 examples/s]
+Filter: 51%|█████ | 417000/818627 [00:47<00:44, 8964.38 examples/s]
+Filter: 51%|█████ | 417000/818627 [00:47<00:44, 8963.89 examples/s]
+Filter: 51%|█████ | 417000/818627 [00:47<00:44, 8964.23 examples/s]
+Filter: 51%|█████ | 417000/818627 [00:47<00:44, 8965.14 examples/s]
+Filter: 51%|█████ | 418000/818627 [00:47<00:45, 8886.85 examples/s]
+Filter: 51%|█████ | 418000/818627 [00:47<00:45, 8885.27 examples/s]
+Filter: 51%|█████ | 418000/818627 [00:47<00:45, 8884.22 examples/s]
+Filter: 51%|█████ | 418000/818627 [00:47<00:45, 8885.29 examples/s]
+Filter: 51%|█████ | 418000/818627 [00:47<00:45, 8885.47 examples/s]
+Filter: 51%|█████ | 418000/818627 [00:47<00:45, 8885.08 examples/s]
+Filter: 51%|█████ | 418000/818627 [00:47<00:45, 8883.63 examples/s]
+Filter: 51%|█████ | 418000/818627 [00:47<00:45, 8885.17 examples/s]
+Filter: 51%|█████ | 419000/818627 [00:47<00:45, 8801.58 examples/s]
+Filter: 51%|█████ | 419000/818627 [00:47<00:45, 8801.30 examples/s]
+Filter: 51%|█████ | 419000/818627 [00:47<00:45, 8800.95 examples/s]
+Filter: 51%|█████ | 419000/818627 [00:47<00:45, 8801.32 examples/s]
+Filter: 51%|█████ | 419000/818627 [00:47<00:45, 8801.27 examples/s]
+Filter: 51%|█████ | 419000/818627 [00:47<00:45, 8799.17 examples/s]
+Filter: 51%|█████ | 419000/818627 [00:47<00:45, 8798.15 examples/s]
+Filter: 51%|█████ | 419000/818627 [00:47<00:45, 8800.39 examples/s]
+Filter: 51%|█████▏ | 420000/818627 [00:47<00:45, 8718.16 examples/s]
+Filter: 51%|█████▏ | 420000/818627 [00:47<00:45, 8715.14 examples/s]
+Filter: 51%|█████▏ | 420000/818627 [00:47<00:45, 8718.11 examples/s]
+Filter: 51%|█████▏ | 420000/818627 [00:47<00:45, 8712.23 examples/s]
+Filter: 51%|█████▏ | 420000/818627 [00:47<00:45, 8716.46 examples/s]
+Filter: 51%|█████▏ | 420000/818627 [00:47<00:45, 8714.61 examples/s]
+Filter: 51%|█████▏ | 420000/818627 [00:47<00:45, 8711.77 examples/s]
+Filter: 51%|█████▏ | 420000/818627 [00:47<00:45, 8717.14 examples/s]
+Filter: 51%|█████▏ | 421000/818627 [00:47<00:45, 8665.34 examples/s]
+Filter: 51%|█████▏ | 421000/818627 [00:47<00:45, 8666.11 examples/s]
+Filter: 51%|█████▏ | 421000/818627 [00:47<00:45, 8661.46 examples/s]
+Filter: 51%|█████▏ | 421000/818627 [00:47<00:45, 8660.68 examples/s]
+Filter: 51%|█████▏ | 421000/818627 [00:47<00:45, 8668.08 examples/s]
+Filter: 51%|█████▏ | 421000/818627 [00:47<00:45, 8663.25 examples/s]
+Filter: 51%|█████▏ | 421000/818627 [00:47<00:45, 8662.82 examples/s]
+Filter: 51%|█████▏ | 421000/818627 [00:47<00:45, 8657.87 examples/s]
+Filter: 52%|█████▏ | 422000/818627 [00:47<00:45, 8666.12 examples/s]
+Filter: 52%|█████▏ | 422000/818627 [00:47<00:45, 8664.47 examples/s]
+Filter: 52%|█████▏ | 422000/818627 [00:47<00:45, 8665.65 examples/s]
+Filter: 52%|█████▏ | 422000/818627 [00:47<00:45, 8664.77 examples/s]
+Filter: 52%|█████▏ | 422000/818627 [00:47<00:45, 8665.71 examples/s]
+Filter: 52%|█████▏ | 422000/818627 [00:47<00:45, 8664.41 examples/s]
+Filter: 52%|█████▏ | 422000/818627 [00:47<00:45, 8658.85 examples/s]
+Filter: 52%|█████▏ | 422000/818627 [00:47<00:46, 8554.41 examples/s]
+Filter: 52%|█████▏ | 423000/818627 [00:47<00:45, 8689.62 examples/s]
+Filter: 52%|█████▏ | 423000/818627 [00:47<00:45, 8687.31 examples/s]
+Filter: 52%|█████▏ | 423000/818627 [00:48<00:45, 8688.04 examples/s]
+Filter: 52%|█████▏ | 423000/818627 [00:47<00:45, 8684.15 examples/s]
+Filter: 52%|█████▏ | 423000/818627 [00:47<00:45, 8689.19 examples/s]
+Filter: 52%|█████▏ | 423000/818627 [00:47<00:45, 8688.35 examples/s]
+Filter: 52%|█████▏ | 423000/818627 [00:47<00:45, 8685.90 examples/s]
+Filter: 52%|█████▏ | 423000/818627 [00:47<00:45, 8722.59 examples/s]
+Filter: 52%|█████▏ | 424000/818627 [00:48<00:45, 8653.57 examples/s]
+Filter: 52%|█████▏ | 424000/818627 [00:47<00:45, 8652.13 examples/s]
+Filter: 52%|█████▏ | 424000/818627 [00:47<00:45, 8650.95 examples/s]
+Filter: 52%|█████▏ | 424000/818627 [00:47<00:45, 8652.50 examples/s]
+Filter: 52%|█████▏ | 424000/818627 [00:47<00:45, 8655.13 examples/s]
+Filter: 52%|█████▏ | 424000/818627 [00:47<00:45, 8653.81 examples/s]
+Filter: 52%|█████▏ | 424000/818627 [00:47<00:45, 8651.60 examples/s]
+Filter: 52%|█████▏ | 424000/818627 [00:47<00:45, 8677.16 examples/s]
+Filter: 52%|█████▏ | 425000/818627 [00:47<00:45, 8623.12 examples/s]
+Filter: 52%|█████▏ | 425000/818627 [00:47<00:45, 8622.73 examples/s]
+Filter: 52%|█████▏ | 425000/818627 [00:47<00:45, 8622.94 examples/s]
+Filter: 52%|█████▏ | 425000/818627 [00:48<00:45, 8619.42 examples/s]
+Filter: 52%|█████▏ | 425000/818627 [00:47<00:45, 8620.28 examples/s]
+Filter: 52%|█████▏ | 425000/818627 [00:48<00:45, 8619.18 examples/s]
+Filter: 52%|█████▏ | 425000/818627 [00:47<00:45, 8619.15 examples/s]
+Filter: 52%|█████▏ | 425000/818627 [00:47<00:45, 8635.84 examples/s]
+Filter: 52%|█████▏ | 426000/818627 [00:48<00:45, 8616.06 examples/s]
+Filter: 52%|█████▏ | 426000/818627 [00:48<00:45, 8613.97 examples/s]
+Filter: 52%|█████▏ | 426000/818627 [00:48<00:45, 8611.96 examples/s]
+Filter: 52%|█████▏ | 426000/818627 [00:48<00:45, 8612.76 examples/s]
+Filter: 52%|█████▏ | 426000/818627 [00:48<00:45, 8614.58 examples/s]
+Filter: 52%|█████▏ | 426000/818627 [00:48<00:45, 8611.85 examples/s]
+Filter: 52%|█████▏ | 426000/818627 [00:48<00:45, 8611.36 examples/s]
+Filter: 52%|█████▏ | 426000/818627 [00:48<00:45, 8630.68 examples/s]
+Filter: 52%|█████▏ | 427000/818627 [00:48<00:45, 8612.28 examples/s]
+Filter: 52%|█████▏ | 427000/818627 [00:48<00:45, 8610.78 examples/s]
+Filter: 52%|█████▏ | 427000/818627 [00:48<00:45, 8612.98 examples/s]
+Filter: 52%|█████▏ | 427000/818627 [00:48<00:45, 8612.11 examples/s]
+Filter: 52%|█████▏ | 427000/818627 [00:48<00:45, 8612.31 examples/s]
+Filter: 52%|█████▏ | 427000/818627 [00:48<00:45, 8609.73 examples/s]
+Filter: 52%|█████▏ | 427000/818627 [00:48<00:45, 8618.39 examples/s]
+Filter: 52%|█████▏ | 427000/818627 [00:48<00:45, 8538.40 examples/s]
+Filter: 52%|█████▏ | 428000/818627 [00:48<00:45, 8627.30 examples/s]
+Filter: 52%|█████▏ | 428000/818627 [00:48<00:45, 8627.48 examples/s]
+Filter: 52%|█████▏ | 428000/818627 [00:48<00:45, 8625.18 examples/s]
+Filter: 52%|█████▏ | 428000/818627 [00:48<00:45, 8627.30 examples/s]
+Filter: 52%|█████▏ | 428000/818627 [00:48<00:45, 8626.80 examples/s]
+Filter: 52%|█████▏ | 428000/818627 [00:48<00:45, 8648.50 examples/s]
+Filter: 52%|█████▏ | 428000/818627 [00:48<00:45, 8634.14 examples/s]
+Filter: 52%|█████▏ | 428000/818627 [00:48<00:46, 8489.26 examples/s]
+Filter: 52%|█████▏ | 429000/818627 [00:48<00:45, 8652.88 examples/s]
+Filter: 52%|█████▏ | 429000/818627 [00:48<00:44, 8693.17 examples/s]
+Filter: 52%|█████▏ | 429000/818627 [00:48<00:45, 8652.04 examples/s]
+Filter: 52%|█████▏ | 429000/818627 [00:48<00:45, 8654.33 examples/s]
+Filter: 52%|█████▏ | 429000/818627 [00:48<00:45, 8653.21 examples/s]
+Filter: 52%|█████▏ | 429000/818627 [00:48<00:45, 8650.45 examples/s]
+Filter: 52%|█████▏ | 429000/818627 [00:48<00:44, 8666.31 examples/s]
+Filter: 52%|█████▏ | 429000/818627 [00:48<00:45, 8655.96 examples/s]
+Filter: 53%|█████▎ | 430000/818627 [00:48<00:44, 8657.17 examples/s]
+Filter: 53%|█████▎ | 430000/818627 [00:48<00:44, 8683.28 examples/s]
+Filter: 53%|█████▎ | 430000/818627 [00:48<00:44, 8651.52 examples/s]
+Filter: 53%|█████▎ | 430000/818627 [00:48<00:44, 8648.36 examples/s]
+Filter: 53%|█████▎ | 430000/818627 [00:48<00:44, 8669.58 examples/s]
+Filter: 53%|█████▎ | 430000/818627 [00:48<00:44, 8657.10 examples/s]
+Filter: 53%|█████▎ | 430000/818627 [00:48<00:44, 8656.19 examples/s]
+Filter: 53%|█████▎ | 430000/818627 [00:48<00:44, 8660.02 examples/s]
+Filter: 53%|█████▎ | 431000/818627 [00:48<00:44, 8662.54 examples/s]
+Filter: 53%|█████▎ | 431000/818627 [00:48<00:44, 8683.26 examples/s]
+Filter: 53%|█████▎ | 431000/818627 [00:48<00:44, 8661.38 examples/s]
+Filter: 53%|█████▎ | 431000/818627 [00:48<00:44, 8662.51 examples/s]
+Filter: 53%|█████▎ | 431000/818627 [00:48<00:44, 8667.43 examples/s]
+Filter: 53%|█████▎ | 431000/818627 [00:48<00:44, 8673.77 examples/s]
+Filter: 53%|█████▎ | 431000/818627 [00:48<00:44, 8664.93 examples/s]
+Filter: 53%|█████▎ | 431000/818627 [00:48<00:44, 8663.27 examples/s]
+Filter: 53%|█████▎ | 432000/818627 [00:48<00:44, 8639.33 examples/s]
+Filter: 53%|█████▎ | 432000/818627 [00:48<00:44, 8651.57 examples/s]
+Filter: 53%|█████▎ | 432000/818627 [00:48<00:44, 8640.33 examples/s]
+Filter: 53%|█████▎ | 432000/818627 [00:49<00:44, 8635.17 examples/s]
+Filter: 53%|█████▎ | 432000/818627 [00:48<00:44, 8640.38 examples/s]
+Filter: 53%|█████▎ | 432000/818627 [00:48<00:44, 8645.80 examples/s]
+Filter: 53%|█████▎ | 432000/818627 [00:48<00:44, 8638.77 examples/s]
+Filter: 53%|█████▎ | 432000/818627 [00:48<00:44, 8639.66 examples/s]
+Filter: 53%|█████▎ | 433000/818627 [00:49<00:44, 8626.01 examples/s]
+Filter: 53%|█████▎ | 433000/818627 [00:48<00:44, 8625.73 examples/s]
+Filter: 53%|█████▎ | 433000/818627 [00:48<00:44, 8618.25 examples/s]
+Filter: 53%|█████▎ | 433000/818627 [00:48<00:44, 8627.62 examples/s]
+Filter: 53%|█████▎ | 433000/818627 [00:49<00:44, 8627.71 examples/s]
+Filter: 53%|█████▎ | 433000/818627 [00:48<00:44, 8623.35 examples/s]
+Filter: 53%|█████▎ | 433000/818627 [00:48<00:44, 8619.36 examples/s]
+Filter: 53%|█████▎ | 433000/818627 [00:48<00:44, 8621.91 examples/s]
+Filter: 53%|█████▎ | 434000/818627 [00:49<00:44, 8612.69 examples/s]
+Filter: 53%|█████▎ | 434000/818627 [00:49<00:44, 8605.49 examples/s]
+Filter: 53%|█████▎ | 434000/818627 [00:49<00:44, 8605.95 examples/s]
+Filter: 53%|█████▎ | 434000/818627 [00:49<00:44, 8596.73 examples/s]
+Filter: 53%|█████▎ | 434000/818627 [00:49<00:44, 8606.89 examples/s]
+Filter: 53%|█████▎ | 434000/818627 [00:49<00:44, 8604.67 examples/s]
+Filter: 53%|█████▎ | 434000/818627 [00:49<00:44, 8606.78 examples/s]
+Filter: 53%|█████▎ | 434000/818627 [00:49<00:44, 8607.06 examples/s]
+Filter: 53%|█████▎ | 435000/818627 [00:49<00:44, 8648.91 examples/s]
+Filter: 53%|█████▎ | 435000/818627 [00:49<00:44, 8651.89 examples/s]
+Filter: 53%|█████▎ | 435000/818627 [00:49<00:44, 8646.53 examples/s]
+Filter: 53%|█████▎ | 435000/818627 [00:49<00:44, 8645.75 examples/s]
+Filter: 53%|█████▎ | 435000/818627 [00:49<00:44, 8646.22 examples/s]
+Filter: 53%|█████▎ | 435000/818627 [00:49<00:44, 8647.76 examples/s]
+Filter: 53%|█████▎ | 435000/818627 [00:49<00:44, 8646.81 examples/s]
+Filter: 53%|█████▎ | 435000/818627 [00:49<00:44, 8649.06 examples/s]
+Filter: 53%|█████▎ | 436000/818627 [00:49<00:44, 8642.56 examples/s]
+Filter: 53%|█████▎ | 436000/818627 [00:49<00:44, 8637.55 examples/s]
+Filter: 53%|█████▎ | 436000/818627 [00:49<00:44, 8638.43 examples/s]
+Filter: 53%|█████▎ | 436000/818627 [00:49<00:44, 8636.26 examples/s]
+Filter: 53%|█████▎ | 436000/818627 [00:49<00:44, 8638.24 examples/s]
+Filter: 53%|█████▎ | 436000/818627 [00:49<00:44, 8635.37 examples/s]
+Filter: 53%|█████▎ | 436000/818627 [00:49<00:44, 8636.50 examples/s]
+Filter: 53%|█████▎ | 436000/818627 [00:49<00:44, 8637.54 examples/s]
+Filter: 53%|█████▎ | 437000/818627 [00:49<00:44, 8611.21 examples/s]
+Filter: 53%|█████▎ | 437000/818627 [00:49<00:44, 8613.84 examples/s]
+Filter: 53%|█████▎ | 437000/818627 [00:49<00:44, 8611.47 examples/s]
+Filter: 53%|█████▎ | 437000/818627 [00:49<00:44, 8609.07 examples/s]
+Filter: 53%|█████▎ | 437000/818627 [00:49<00:44, 8609.65 examples/s]
+Filter: 53%|█████▎ | 437000/818627 [00:49<00:44, 8609.48 examples/s]
+Filter: 53%|█████▎ | 437000/818627 [00:49<00:44, 8610.19 examples/s]
+Filter: 53%|█████▎ | 437000/818627 [00:49<00:44, 8609.79 examples/s]
+Filter: 54%|█████▎ | 438000/818627 [00:49<00:43, 8651.70 examples/s]
+Filter: 54%|█████▎ | 438000/818627 [00:49<00:43, 8651.04 examples/s]
+Filter: 54%|█████▎ | 438000/818627 [00:49<00:43, 8651.12 examples/s]
+Filter: 54%|█████▎ | 438000/818627 [00:49<00:44, 8645.48 examples/s]
+Filter: 54%|█████▎ | 438000/818627 [00:49<00:44, 8650.03 examples/s]
+Filter: 54%|█████▎ | 438000/818627 [00:49<00:44, 8647.76 examples/s]
+Filter: 54%|█████▎ | 438000/818627 [00:49<00:44, 8642.87 examples/s]
+Filter: 54%|█████▎ | 438000/818627 [00:49<00:44, 8649.71 examples/s]
+Filter: 54%|█████▎ | 439000/818627 [00:49<00:43, 8633.76 examples/s]
+Filter: 54%|█████▎ | 439000/818627 [00:49<00:43, 8635.62 examples/s]
+Filter: 54%|█████▎ | 439000/818627 [00:49<00:43, 8634.37 examples/s]
+Filter: 54%|█████▎ | 439000/818627 [00:49<00:43, 8635.71 examples/s]
+Filter: 54%|█████▎ | 439000/818627 [00:49<00:43, 8636.36 examples/s]
+Filter: 54%|█████▎ | 439000/818627 [00:49<00:43, 8635.03 examples/s]
+Filter: 54%|█████▎ | 439000/818627 [00:49<00:43, 8636.54 examples/s]
+Filter: 54%|█████▎ | 439000/818627 [00:49<00:43, 8634.00 examples/s]
+Filter: 54%|█████▎ | 440000/818627 [00:49<00:43, 8632.88 examples/s]
+Filter: 54%|█████▎ | 440000/818627 [00:49<00:43, 8631.52 examples/s]
+Filter: 54%|█████▎ | 440000/818627 [00:50<00:43, 8630.61 examples/s]
+Filter: 54%|█████▎ | 440000/818627 [00:49<00:43, 8632.54 examples/s]
+Filter: 54%|█████▎ | 440000/818627 [00:49<00:43, 8633.13 examples/s]
+Filter: 54%|█████▎ | 440000/818627 [00:49<00:43, 8633.99 examples/s]
+Filter: 54%|█████▎ | 440000/818627 [00:49<00:43, 8629.53 examples/s]
+Filter: 54%|█████▎ | 440000/818627 [00:49<00:43, 8630.31 examples/s]
+Filter: 54%|█████▍ | 441000/818627 [00:49<00:42, 8913.04 examples/s]
+Filter: 54%|█████▍ | 441000/818627 [00:49<00:42, 8913.56 examples/s]
+Filter: 54%|█████▍ | 441000/818627 [00:49<00:42, 8913.48 examples/s]
+Filter: 54%|█████▍ | 441000/818627 [00:49<00:42, 8910.78 examples/s]
+Filter: 54%|█████▍ | 441000/818627 [00:49<00:42, 8910.95 examples/s]
+Filter: 54%|█████▍ | 441000/818627 [00:49<00:42, 8908.41 examples/s]
+Filter: 54%|█████▍ | 441000/818627 [00:50<00:42, 8844.52 examples/s]
+Filter: 54%|█████▍ | 441000/818627 [00:49<00:43, 8750.07 examples/s]
+Filter: 54%|█████▍ | 442000/818627 [00:49<00:40, 9206.67 examples/s]
+Filter: 54%|█████▍ | 442000/818627 [00:49<00:40, 9203.17 examples/s]
+Filter: 54%|█████▍ | 442000/818627 [00:49<00:40, 9205.71 examples/s]
+Filter: 54%|█████▍ | 442000/818627 [00:50<00:40, 9203.96 examples/s]
+Filter: 54%|█████▍ | 442000/818627 [00:49<00:40, 9202.99 examples/s]
+Filter: 54%|█████▍ | 442000/818627 [00:49<00:40, 9206.00 examples/s]
+Filter: 54%|█████▍ | 443000/818627 [00:50<00:41, 9144.51 examples/s]
+Filter: 54%|█████▍ | 443000/818627 [00:50<00:41, 9140.55 examples/s]
+Filter: 54%|█████▍ | 443000/818627 [00:50<00:40, 9197.59 examples/s]
+Filter: 54%|█████▍ | 443000/818627 [00:50<00:40, 9171.39 examples/s]
+Filter: 54%|█████▍ | 443000/818627 [00:50<00:41, 9143.09 examples/s]
+Filter: 54%|█████▍ | 443000/818627 [00:50<00:41, 9139.55 examples/s]
+Filter: 54%|█████▍ | 443000/818627 [00:50<00:41, 9141.23 examples/s]
+Filter: 54%|█████▍ | 443000/818627 [00:50<00:41, 9140.18 examples/s]
+Filter: 54%|█████▍ | 444000/818627 [00:50<00:41, 8992.81 examples/s]
+Filter: 54%|█████▍ | 444000/818627 [00:50<00:41, 8993.48 examples/s]
+Filter: 54%|█████▍ | 444000/818627 [00:50<00:41, 9056.89 examples/s]
+Filter: 54%|█████▍ | 444000/818627 [00:50<00:41, 9037.76 examples/s]
+Filter: 54%|█████▍ | 444000/818627 [00:50<00:41, 8995.10 examples/s]
+Filter: 54%|█████▍ | 444000/818627 [00:50<00:41, 8990.82 examples/s]
+Filter: 54%|█████▍ | 444000/818627 [00:50<00:41, 8989.34 examples/s]
+Filter: 54%|█████▍ | 444000/818627 [00:50<00:41, 8992.18 examples/s]
+Filter: 54%|█████▍ | 445000/818627 [00:50<00:41, 8969.15 examples/s]
+Filter: 54%|█████▍ | 445000/818627 [00:50<00:41, 8956.15 examples/s]
+Filter: 54%|█████▍ | 445000/818627 [00:50<00:41, 8904.32 examples/s]
+Filter: 54%|█████▍ | 445000/818627 [00:50<00:41, 8904.67 examples/s]
+Filter: 54%|█████▍ | 445000/818627 [00:50<00:41, 8907.60 examples/s]
+Filter: 54%|█████▍ | 445000/818627 [00:50<00:41, 8908.44 examples/s]
+Filter: 54%|█████▍ | 445000/818627 [00:50<00:41, 8904.11 examples/s]
+Filter: 54%|█████▍ | 445000/818627 [00:50<00:41, 8907.91 examples/s]
+Filter: 54%|█████▍ | 446000/818627 [00:50<00:42, 8802.50 examples/s]
+Filter: 54%|█████▍ | 446000/818627 [00:50<00:42, 8853.43 examples/s]
+Filter: 54%|█████▍ | 446000/818627 [00:50<00:42, 8844.30 examples/s]
+Filter: 54%|█████▍ | 446000/818627 [00:50<00:42, 8797.27 examples/s]
+Filter: 54%|█████▍ | 446000/818627 [00:50<00:42, 8805.63 examples/s]
+Filter: 54%|█████▍ | 446000/818627 [00:50<00:42, 8799.72 examples/s]
+Filter: 54%|█████▍ | 446000/818627 [00:50<00:42, 8801.45 examples/s]
+Filter: 54%|█████▍ | 446000/818627 [00:50<00:42, 8800.78 examples/s]
+Filter: 55%|█████▍ | 447000/818627 [00:50<00:41, 9026.70 examples/s]
+Filter: 55%|█████▍ | 447000/818627 [00:50<00:41, 9043.65 examples/s]
+Filter: 55%|█████▍ | 447000/818627 [00:50<00:41, 9049.79 examples/s]
+Filter: 55%|█████▍ | 447000/818627 [00:50<00:41, 9019.12 examples/s]
+Filter: 55%|█████▍ | 447000/818627 [00:50<00:41, 9026.27 examples/s]
+Filter: 55%|█████▍ | 447000/818627 [00:50<00:41, 9026.98 examples/s]
+Filter: 55%|█████▍ | 447000/818627 [00:50<00:41, 9024.52 examples/s]
+Filter: 55%|█████▍ | 447000/818627 [00:50<00:41, 9026.61 examples/s]
+Filter: 55%|█████▍ | 448000/818627 [00:50<00:40, 9194.98 examples/s]
+Filter: 55%|█████▍ | 448000/818627 [00:50<00:40, 9200.70 examples/s]
+Filter: 55%|█████▍ | 448000/818627 [00:50<00:40, 9204.84 examples/s]
+Filter: 55%|█████▍ | 448000/818627 [00:50<00:40, 9195.59 examples/s]
+Filter: 55%|█████▍ | 448000/818627 [00:50<00:40, 9192.57 examples/s]
+Filter: 55%|█████▍ | 448000/818627 [00:50<00:40, 9193.41 examples/s]
+Filter: 55%|█████▍ | 448000/818627 [00:50<00:40, 9191.64 examples/s]
+Filter: 55%|█████▍ | 448000/818627 [00:50<00:40, 9189.40 examples/s]
+Filter: 55%|█████▍ | 449000/818627 [00:50<00:40, 9017.70 examples/s]
+Filter: 55%|█████▍ | 449000/818627 [00:50<00:40, 9016.94 examples/s]
+Filter: 55%|█████▍ | 449000/818627 [00:51<00:40, 9020.80 examples/s]
+Filter: 55%|█████▍ | 449000/818627 [00:50<00:40, 9020.59 examples/s]
+Filter: 55%|█████▍ | 449000/818627 [00:50<00:40, 9017.62 examples/s]
+Filter: 55%|█████▍ | 449000/818627 [00:50<00:40, 9016.81 examples/s]
+Filter: 55%|█████▍ | 449000/818627 [00:50<00:40, 9015.74 examples/s]
+Filter: 55%|█████▍ | 449000/818627 [00:50<00:40, 9016.63 examples/s]
+Filter: 55%|█████▍ | 450000/818627 [00:50<00:41, 8903.44 examples/s]
+Filter: 55%|█████▍ | 450000/818627 [00:50<00:41, 8906.99 examples/s]
+Filter: 55%|█████▍ | 450000/818627 [00:51<00:41, 8911.16 examples/s]
+Filter: 55%|█████▍ | 450000/818627 [00:50<00:41, 8905.06 examples/s]
+Filter: 55%|█████▍ | 450000/818627 [00:50<00:41, 8902.95 examples/s]
+Filter: 55%|█████▍ | 450000/818627 [00:50<00:41, 8899.28 examples/s]
+Filter: 55%|█████▍ | 450000/818627 [00:50<00:41, 8897.56 examples/s]
+Filter: 55%|█████▍ | 450000/818627 [00:50<00:41, 8902.12 examples/s]
+Filter: 55%|█████▌ | 451000/818627 [00:50<00:41, 8778.39 examples/s]
+Filter: 55%|█████▌ | 451000/818627 [00:50<00:41, 8778.68 examples/s]
+Filter: 55%|█████▌ | 451000/818627 [00:51<00:41, 8788.92 examples/s]
+Filter: 55%|█████▌ | 451000/818627 [00:50<00:41, 8791.24 examples/s]
+Filter: 55%|█████▌ | 451000/818627 [00:50<00:41, 8779.76 examples/s]
+Filter: 55%|█████▌ | 451000/818627 [00:50<00:41, 8779.68 examples/s]
+Filter: 55%|█████▌ | 451000/818627 [00:51<00:41, 8779.91 examples/s]
+Filter: 55%|█████▌ | 451000/818627 [00:50<00:41, 8781.01 examples/s]
+Filter: 55%|█████▌ | 452000/818627 [00:51<00:41, 8729.28 examples/s]
+Filter: 55%|█████▌ | 452000/818627 [00:51<00:41, 8736.84 examples/s]
+Filter: 55%|█████▌ | 452000/818627 [00:51<00:42, 8727.99 examples/s]
+Filter: 55%|█████▌ | 452000/818627 [00:51<00:41, 8737.88 examples/s]
+Filter: 55%|█████▌ | 452000/818627 [00:51<00:41, 8729.47 examples/s]
+Filter: 55%|█████▌ | 452000/818627 [00:51<00:41, 8730.29 examples/s]
+Filter: 55%|█████▌ | 452000/818627 [00:51<00:41, 8730.99 examples/s]
+Filter: 55%|█████▌ | 452000/818627 [00:51<00:42, 8720.16 examples/s]
+Filter: 55%|█████▌ | 453000/818627 [00:51<00:42, 8702.84 examples/s]
+Filter: 55%|█████▌ | 453000/818627 [00:51<00:41, 8706.83 examples/s]
+Filter: 55%|█████▌ | 453000/818627 [00:51<00:41, 8707.55 examples/s]
+Filter: 55%|█████▌ | 453000/818627 [00:51<00:42, 8699.85 examples/s]
+Filter: 55%|█████▌ | 453000/818627 [00:51<00:42, 8704.43 examples/s]
+Filter: 55%|█████▌ | 453000/818627 [00:51<00:42, 8699.11 examples/s]
+Filter: 55%|█████▌ | 453000/818627 [00:51<00:42, 8701.79 examples/s]
+Filter: 55%|█████▌ | 453000/818627 [00:51<00:42, 8609.83 examples/s]
+Filter: 55%|█████▌ | 454000/818627 [00:51<00:42, 8667.65 examples/s]
+Filter: 55%|█████▌ | 454000/818627 [00:51<00:42, 8640.90 examples/s]
+Filter: 55%|█████▌ | 454000/818627 [00:51<00:42, 8643.28 examples/s]
+Filter: 55%|█████▌ | 454000/818627 [00:51<00:42, 8643.11 examples/s]
+Filter: 55%|█████▌ | 454000/818627 [00:51<00:42, 8641.34 examples/s]
+Filter: 55%|█████▌ | 454000/818627 [00:51<00:42, 8644.08 examples/s]
+Filter: 55%|█████▌ | 454000/818627 [00:51<00:42, 8638.78 examples/s]
+Filter: 55%|█████▌ | 454000/818627 [00:51<00:42, 8638.97 examples/s]
+Filter: 56%|█████▌ | 455000/818627 [00:51<00:40, 8990.39 examples/s]
+Filter: 56%|█████▌ | 455000/818627 [00:51<00:40, 9006.18 examples/s]
+Filter: 56%|█████▌ | 455000/818627 [00:51<00:40, 8987.73 examples/s]
+Filter: 56%|█████▌ | 455000/818627 [00:51<00:40, 8989.49 examples/s]
+Filter: 56%|█████▌ | 455000/818627 [00:51<00:40, 8989.18 examples/s]
+Filter: 56%|█████▌ | 455000/818627 [00:51<00:40, 8990.61 examples/s]
+Filter: 56%|█████▌ | 455000/818627 [00:51<00:40, 8986.82 examples/s]
+Filter: 56%|█████▌ | 455000/818627 [00:51<00:40, 8986.88 examples/s]
+Filter: 56%|█████▌ | 456000/818627 [00:51<00:40, 8978.51 examples/s]
+Filter: 56%|█████▌ | 456000/818627 [00:51<00:40, 8990.84 examples/s]
+Filter: 56%|█████▌ | 456000/818627 [00:51<00:40, 8978.51 examples/s]
+Filter: 56%|█████▌ | 456000/818627 [00:51<00:40, 8974.79 examples/s]
+Filter: 56%|█████▌ | 456000/818627 [00:51<00:40, 8979.20 examples/s]
+Filter: 56%|█████▌ | 456000/818627 [00:51<00:40, 8978.18 examples/s]
+Filter: 56%|█████▌ | 456000/818627 [00:51<00:40, 8979.22 examples/s]
+Filter: 56%|█████▌ | 456000/818627 [00:51<00:40, 8980.52 examples/s]
+Filter: 56%|█████▌ | 457000/818627 [00:51<00:40, 8867.97 examples/s]
+Filter: 56%|█████▌ | 457000/818627 [00:51<00:40, 8875.01 examples/s]
+Filter: 56%|█████▌ | 457000/818627 [00:51<00:40, 8877.17 examples/s]
+Filter: 56%|█████▌ | 457000/818627 [00:51<00:40, 8872.23 examples/s]
+Filter: 56%|█████▌ | 457000/818627 [00:51<00:40, 8874.17 examples/s]
+Filter: 56%|█████▌ | 457000/818627 [00:51<00:40, 8871.93 examples/s]
+Filter: 56%|█████▌ | 457000/818627 [00:51<00:40, 8867.38 examples/s]
+Filter: 56%|█████▌ | 457000/818627 [00:51<00:40, 8867.45 examples/s]
+Filter: 56%|█████▌ | 458000/818627 [00:51<00:41, 8782.26 examples/s]
+Filter: 56%|█████▌ | 458000/818627 [00:51<00:41, 8787.89 examples/s]
+Filter: 56%|█████▌ | 458000/818627 [00:52<00:41, 8785.36 examples/s]
+Filter: 56%|█████▌ | 458000/818627 [00:51<00:41, 8783.03 examples/s]
+Filter: 56%|█████▌ | 458000/818627 [00:51<00:41, 8784.39 examples/s]
+Filter: 56%|█████▌ | 458000/818627 [00:51<00:41, 8784.20 examples/s]
+Filter: 56%|█████▌ | 458000/818627 [00:51<00:41, 8784.08 examples/s]
+Filter: 56%|█████▌ | 458000/818627 [00:51<00:41, 8784.20 examples/s]
+Filter: 56%|█████▌ | 459000/818627 [00:51<00:41, 8754.24 examples/s]
+Filter: 56%|█████▌ | 459000/818627 [00:51<00:41, 8748.78 examples/s]
+Filter: 56%|█████▌ | 459000/818627 [00:52<00:41, 8750.51 examples/s]
+Filter: 56%|█████▌ | 459000/818627 [00:51<00:41, 8749.41 examples/s]
+Filter: 56%|█████▌ | 459000/818627 [00:51<00:41, 8752.47 examples/s]
+Filter: 56%|█████▌ | 459000/818627 [00:51<00:41, 8748.17 examples/s]
+Filter: 56%|█████▌ | 459000/818627 [00:51<00:41, 8747.24 examples/s]
+Filter: 56%|█████▌ | 459000/818627 [00:51<00:41, 8750.42 examples/s]
+Filter: 56%|█████▌ | 460000/818627 [00:51<00:41, 8728.13 examples/s]
+Filter: 56%|█████▌ | 460000/818627 [00:51<00:41, 8730.48 examples/s]
+Filter: 56%|█████▌ | 460000/818627 [00:52<00:41, 8726.69 examples/s]
+Filter: 56%|█████▌ | 460000/818627 [00:51<00:41, 8724.22 examples/s]
+Filter: 56%|█████▌ | 460000/818627 [00:51<00:41, 8724.90 examples/s]
+Filter: 56%|█████▌ | 460000/818627 [00:51<00:41, 8727.58 examples/s]
+Filter: 56%|█████▌ | 460000/818627 [00:52<00:41, 8727.08 examples/s]
+Filter: 56%|█████▌ | 460000/818627 [00:51<00:41, 8725.72 examples/s]
+Filter: 56%|█████▋ | 461000/818627 [00:52<00:42, 8465.27 examples/s]
+Filter: 56%|█████▋ | 461000/818627 [00:52<00:42, 8463.48 examples/s]
+Filter: 56%|█████▋ | 461000/818627 [00:52<00:42, 8459.70 examples/s]
+Filter: 56%|█████▋ | 461000/818627 [00:52<00:42, 8462.14 examples/s]
+Filter: 56%|█████▋ | 461000/818627 [00:52<00:42, 8463.81 examples/s]
+Filter: 56%|█████▋ | 461000/818627 [00:52<00:42, 8459.34 examples/s]
+Filter: 56%|█████▋ | 461000/818627 [00:52<00:42, 8458.82 examples/s]
+Filter: 56%|█████▋ | 461000/818627 [00:52<00:42, 8464.63 examples/s]
+Filter: 56%|█████▋ | 462000/818627 [00:52<00:41, 8516.97 examples/s]
+Filter: 56%|█████▋ | 462000/818627 [00:52<00:41, 8512.72 examples/s]
+Filter: 56%|█████▋ | 462000/818627 [00:52<00:41, 8513.97 examples/s]
+Filter: 56%|█████▋ | 462000/818627 [00:52<00:41, 8510.72 examples/s]
+Filter: 56%|█████▋ | 462000/818627 [00:52<00:41, 8516.13 examples/s]
+Filter: 56%|█████▋ | 462000/818627 [00:52<00:41, 8512.77 examples/s]
+Filter: 56%|█████▋ | 462000/818627 [00:52<00:41, 8510.99 examples/s]
+Filter: 56%|█████▋ | 462000/818627 [00:52<00:42, 8346.79 examples/s]
+Filter: 57%|█████▋ | 463000/818627 [00:52<00:41, 8544.85 examples/s]
+Filter: 57%|█████▋ | 463000/818627 [00:52<00:41, 8542.24 examples/s]
+Filter: 57%|█████▋ | 463000/818627 [00:52<00:41, 8542.20 examples/s]
+Filter: 57%|█████▋ | 463000/818627 [00:52<00:41, 8542.72 examples/s]
+Filter: 57%|█████▋ | 463000/818627 [00:52<00:41, 8544.03 examples/s]
+Filter: 57%|█████▋ | 463000/818627 [00:52<00:41, 8541.59 examples/s]
+Filter: 57%|█████▋ | 463000/818627 [00:52<00:41, 8541.97 examples/s]
+Filter: 57%|█████▋ | 463000/818627 [00:52<00:41, 8587.71 examples/s]
+Filter: 57%|█████▋ | 464000/818627 [00:52<00:40, 8838.73 examples/s]
+Filter: 57%|█████▋ | 464000/818627 [00:52<00:40, 8838.90 examples/s]
+Filter: 57%|█████▋ | 464000/818627 [00:52<00:40, 8838.38 examples/s]
+Filter: 57%|█████▋ | 464000/818627 [00:52<00:40, 8838.31 examples/s]
+Filter: 57%|█████▋ | 464000/818627 [00:52<00:40, 8839.32 examples/s]
+Filter: 57%|█████▋ | 464000/818627 [00:52<00:40, 8837.72 examples/s]
+Filter: 57%|█████▋ | 464000/818627 [00:52<00:40, 8838.15 examples/s]
+Filter: 57%|█████▋ | 464000/818627 [00:52<00:39, 8883.74 examples/s]
+Filter: 57%|█████▋ | 465000/818627 [00:52<00:40, 8791.24 examples/s]
+Filter: 57%|█████▋ | 465000/818627 [00:52<00:40, 8791.47 examples/s]
+Filter: 57%|█████▋ | 465000/818627 [00:52<00:40, 8793.84 examples/s]
+Filter: 57%|█████▋ | 465000/818627 [00:52<00:40, 8792.15 examples/s]
+Filter: 57%|█████▋ | 465000/818627 [00:52<00:40, 8791.22 examples/s]
+Filter: 57%|█████▋ | 465000/818627 [00:52<00:40, 8774.25 examples/s]
+Filter: 57%|█████▋ | 465000/818627 [00:52<00:40, 8814.84 examples/s]
+Filter: 57%|█████▋ | 465000/818627 [00:52<00:40, 8731.30 examples/s]
+Filter: 57%|█████▋ | 466000/818627 [00:52<00:39, 8859.13 examples/s]
+Filter: 57%|█████▋ | 466000/818627 [00:52<00:39, 8860.46 examples/s]
+Filter: 57%|█████▋ | 466000/818627 [00:52<00:39, 8864.13 examples/s]
+Filter: 57%|█████▋ | 466000/818627 [00:52<00:39, 8860.99 examples/s]
+Filter: 57%|█████▋ | 466000/818627 [00:52<00:39, 8858.57 examples/s]
+Filter: 57%|█████▋ | 466000/818627 [00:52<00:39, 8876.57 examples/s]
+Filter: 57%|█████▋ | 466000/818627 [00:52<00:39, 8857.91 examples/s]
+Filter: 57%|█████▋ | 466000/818627 [00:52<00:39, 8878.22 examples/s]
+Filter: 57%|█████▋ | 467000/818627 [00:52<00:40, 8751.08 examples/s]
+Filter: 57%|█████▋ | 467000/818627 [00:52<00:40, 8755.20 examples/s]
+Filter: 57%|█████▋ | 467000/818627 [00:52<00:40, 8753.30 examples/s]
+Filter: 57%|█████▋ | 467000/818627 [00:53<00:40, 8749.74 examples/s]
+Filter: 57%|█████▋ | 467000/818627 [00:52<00:40, 8764.63 examples/s]
+Filter: 57%|█████▋ | 467000/818627 [00:52<00:40, 8751.98 examples/s]
+Filter: 57%|█████▋ | 467000/818627 [00:52<00:40, 8751.38 examples/s]
+Filter: 57%|█████▋ | 467000/818627 [00:52<00:40, 8770.46 examples/s]
+Filter: 57%|█████▋ | 468000/818627 [00:52<00:40, 8714.71 examples/s]
+Filter: 57%|█████▋ | 468000/818627 [00:52<00:40, 8715.00 examples/s]
+Filter: 57%|█████▋ | 468000/818627 [00:52<00:40, 8705.54 examples/s]
+Filter: 57%|█████▋ | 468000/818627 [00:52<00:40, 8714.98 examples/s]
+Filter: 57%|█████▋ | 468000/818627 [00:53<00:40, 8702.48 examples/s]
+Filter: 57%|█████▋ | 468000/818627 [00:52<00:40, 8722.77 examples/s]
+Filter: 57%|█████▋ | 468000/818627 [00:52<00:40, 8711.65 examples/s]
+Filter: 57%|█████▋ | 468000/818627 [00:52<00:40, 8629.46 examples/s]
+Filter: 57%|█████▋ | 469000/818627 [00:52<00:40, 8672.94 examples/s]
+Filter: 57%|█████▋ | 469000/818627 [00:53<00:40, 8678.73 examples/s]
+Filter: 57%|█████▋ | 469000/818627 [00:53<00:40, 8673.00 examples/s]
+Filter: 57%|█████▋ | 469000/818627 [00:52<00:40, 8673.09 examples/s]
+Filter: 57%|█████▋ | 469000/818627 [00:52<00:40, 8681.54 examples/s]
+Filter: 57%|█████▋ | 469000/818627 [00:53<00:40, 8672.46 examples/s]
+Filter: 57%|█████▋ | 469000/818627 [00:52<00:40, 8673.15 examples/s]
+Filter: 57%|█████▋ | 469000/818627 [00:52<00:40, 8707.65 examples/s]
+Filter: 57%|█████▋ | 470000/818627 [00:53<00:40, 8660.12 examples/s]
+Filter: 57%|█████▋ | 470000/818627 [00:53<00:40, 8662.75 examples/s]
+Filter: 57%|█████▋ | 470000/818627 [00:53<00:40, 8662.38 examples/s]
+Filter: 57%|█████▋ | 470000/818627 [00:53<00:40, 8662.17 examples/s]
+Filter: 57%|█████▋ | 470000/818627 [00:53<00:40, 8662.08 examples/s]
+Filter: 57%|█████▋ | 470000/818627 [00:53<00:40, 8660.48 examples/s]
+Filter: 57%|█████▋ | 470000/818627 [00:53<00:40, 8663.70 examples/s]
+Filter: 57%|█████▋ | 470000/818627 [00:53<00:40, 8688.77 examples/s]
+Filter: 58%|█████▊ | 471000/818627 [00:53<00:40, 8665.58 examples/s]
+Filter: 58%|█████▊ | 471000/818627 [00:53<00:40, 8664.78 examples/s]
+Filter: 58%|█████▊ | 471000/818627 [00:53<00:40, 8663.37 examples/s]
+Filter: 58%|█████▊ | 471000/818627 [00:53<00:40, 8665.07 examples/s]
+Filter: 58%|█████▊ | 471000/818627 [00:53<00:40, 8667.46 examples/s]
+Filter: 58%|█████▊ | 471000/818627 [00:53<00:40, 8665.08 examples/s]
+Filter: 58%|█████▊ | 471000/818627 [00:53<00:40, 8667.20 examples/s]
+Filter: 58%|█████▊ | 471000/818627 [00:53<00:40, 8685.68 examples/s]
+Filter: 58%|█████▊ | 472000/818627 [00:53<00:38, 9006.36 examples/s]
+Filter: 58%|█████▊ | 472000/818627 [00:53<00:38, 9000.53 examples/s]
+Filter: 58%|█████▊ | 472000/818627 [00:53<00:38, 9004.38 examples/s]
+Filter: 58%|█████▊ | 472000/818627 [00:53<00:38, 8996.01 examples/s]
+Filter: 58%|█████▊ | 472000/818627 [00:53<00:38, 9005.74 examples/s]
+Filter: 58%|█████▊ | 472000/818627 [00:53<00:38, 9003.33 examples/s]
+Filter: 58%|█████▊ | 472000/818627 [00:53<00:38, 9002.92 examples/s]
+Filter: 58%|█████▊ | 472000/818627 [00:53<00:38, 9000.44 examples/s]
+Filter: 58%|█████▊ | 473000/818627 [00:53<00:38, 9010.80 examples/s]
+Filter: 58%|█████▊ | 473000/818627 [00:53<00:38, 9010.73 examples/s]
+Filter: 58%|█████▊ | 473000/818627 [00:53<00:38, 9010.37 examples/s]
+Filter: 58%|█████▊ | 473000/818627 [00:53<00:38, 9009.52 examples/s]
+Filter: 58%|█████▊ | 473000/818627 [00:53<00:38, 9012.22 examples/s]
+Filter: 58%|█████▊ | 473000/818627 [00:53<00:38, 9008.75 examples/s]
+Filter: 58%|█████▊ | 473000/818627 [00:53<00:38, 9024.23 examples/s]
+Filter: 58%|█████▊ | 473000/818627 [00:53<00:38, 9002.07 examples/s]
+Filter: 58%|█████▊ | 474000/818627 [00:53<00:38, 8885.99 examples/s]
+Filter: 58%|█████▊ | 474000/818627 [00:53<00:38, 8885.06 examples/s]
+Filter: 58%|█████▊ | 474000/818627 [00:53<00:38, 8885.01 examples/s]
+Filter: 58%|█████▊ | 474000/818627 [00:53<00:38, 8878.84 examples/s]
+Filter: 58%|█████▊ | 474000/818627 [00:53<00:38, 8884.98 examples/s]
+Filter: 58%|█████▊ | 474000/818627 [00:53<00:38, 8881.04 examples/s]
+Filter: 58%|█████▊ | 474000/818627 [00:53<00:38, 8878.05 examples/s]
+Filter: 58%|█████▊ | 474000/818627 [00:53<00:38, 8887.94 examples/s]
+Filter: 58%|█████▊ | 475000/818627 [00:53<00:39, 8771.26 examples/s]
+Filter: 58%|█████▊ | 475000/818627 [00:53<00:39, 8768.36 examples/s]
+Filter: 58%|█████▊ | 475000/818627 [00:54<00:39, 8769.81 examples/s]
+Filter: 58%|█████▊ | 475000/818627 [00:53<00:39, 8770.21 examples/s]
+Filter: 58%|█████▊ | 475000/818627 [00:53<00:39, 8769.75 examples/s]
+Filter: 58%|█████▊ | 475000/818627 [00:53<00:39, 8768.45 examples/s]
+Filter: 58%|█████▊ | 475000/818627 [00:53<00:39, 8766.90 examples/s]
+Filter: 58%|█████▊ | 475000/818627 [00:53<00:39, 8777.37 examples/s]
+Filter: 58%|█████▊ | 476000/818627 [00:53<00:39, 8732.67 examples/s]
+Filter: 58%|█████▊ | 476000/818627 [00:53<00:39, 8729.29 examples/s]
+Filter: 58%|█████▊ | 476000/818627 [00:54<00:39, 8733.51 examples/s]
+Filter: 58%|█████▊ | 476000/818627 [00:53<00:39, 8733.14 examples/s]
+Filter: 58%|█████▊ | 476000/818627 [00:53<00:39, 8732.46 examples/s]
+Filter: 58%|█████▊ | 476000/818627 [00:53<00:39, 8732.69 examples/s]
+Filter: 58%|█████▊ | 476000/818627 [00:53<00:39, 8731.07 examples/s]
+Filter: 58%|█████▊ | 476000/818627 [00:53<00:39, 8734.98 examples/s]
+Filter: 58%|█████▊ | 477000/818627 [00:53<00:39, 8669.01 examples/s]
+Filter: 58%|█████▊ | 477000/818627 [00:53<00:39, 8665.78 examples/s]
+Filter: 58%|█████▊ | 477000/818627 [00:54<00:39, 8669.07 examples/s]
+Filter: 58%|█████▊ | 477000/818627 [00:53<00:39, 8670.21 examples/s]
+Filter: 58%|█████▊ | 477000/818627 [00:53<00:39, 8668.86 examples/s]
+Filter: 58%|█████▊ | 477000/818627 [00:54<00:39, 8667.84 examples/s]
+Filter: 58%|█████▊ | 477000/818627 [00:53<00:39, 8666.05 examples/s]
+Filter: 58%|█████▊ | 477000/818627 [00:53<00:39, 8672.22 examples/s]
+Filter: 58%|█████▊ | 478000/818627 [00:54<00:39, 8677.19 examples/s]
+Filter: 58%|█████▊ | 478000/818627 [00:54<00:39, 8674.08 examples/s]
+Filter: 58%|█████▊ | 478000/818627 [00:54<00:39, 8677.84 examples/s]
+Filter: 58%|█████▊ | 478000/818627 [00:54<00:39, 8674.53 examples/s]
+Filter: 58%|█████▊ | 478000/818627 [00:54<00:39, 8676.55 examples/s]
+Filter: 58%|█████▊ | 478000/818627 [00:54<00:39, 8676.24 examples/s]
+Filter: 58%|█████▊ | 478000/818627 [00:54<00:39, 8675.53 examples/s]
+Filter: 58%|█████▊ | 478000/818627 [00:54<00:39, 8606.82 examples/s]
+Filter: 59%|█████▊ | 479000/818627 [00:54<00:39, 8702.60 examples/s]
+Filter: 59%|█████▊ | 479000/818627 [00:54<00:39, 8701.63 examples/s]
+Filter: 59%|█████▊ | 479000/818627 [00:54<00:39, 8703.47 examples/s]
+Filter: 59%|█████▊ | 479000/818627 [00:54<00:39, 8697.81 examples/s]
+Filter: 59%|█████▊ | 479000/818627 [00:54<00:39, 8703.95 examples/s]
+Filter: 59%|█████▊ | 479000/818627 [00:54<00:39, 8703.43 examples/s]
+Filter: 59%|█████▊ | 479000/818627 [00:54<00:39, 8701.54 examples/s]
+Filter: 59%|█████▊ | 479000/818627 [00:54<00:38, 8724.61 examples/s]
+Filter: 59%|█████▊ | 480000/818627 [00:54<00:38, 8696.50 examples/s]
+Filter: 59%|█████▊ | 480000/818627 [00:54<00:38, 8696.40 examples/s]
+Filter: 59%|█████▊ | 480000/818627 [00:54<00:38, 8699.30 examples/s]
+Filter: 59%|█████▊ | 480000/818627 [00:54<00:38, 8690.50 examples/s]
+Filter: 59%|█████▊ | 480000/818627 [00:54<00:38, 8697.75 examples/s]
+Filter: 59%|█████▊ | 480000/818627 [00:54<00:38, 8696.62 examples/s]
+Filter: 59%|█████▊ | 480000/818627 [00:54<00:38, 8698.33 examples/s]
+Filter: 59%|█████▊ | 480000/818627 [00:54<00:38, 8710.20 examples/s]
+Filter: 59%|█████▉ | 481000/818627 [00:54<00:38, 8682.18 examples/s]
+Filter: 59%|█████▉ | 481000/818627 [00:54<00:38, 8685.01 examples/s]
+Filter: 59%|█████▉ | 481000/818627 [00:54<00:38, 8678.69 examples/s]
+Filter: 59%|█████▉ | 481000/818627 [00:54<00:38, 8684.54 examples/s]
+Filter: 59%|█████▉ | 481000/818627 [00:54<00:38, 8685.77 examples/s]
+Filter: 59%|█████▉ | 481000/818627 [00:54<00:38, 8684.20 examples/s]
+Filter: 59%|█████▉ | 481000/818627 [00:54<00:38, 8681.57 examples/s]
+Filter: 59%|█████▉ | 481000/818627 [00:54<00:38, 8695.44 examples/s]
+Filter: 59%|█████▉ | 482000/818627 [00:54<00:38, 8690.92 examples/s]
+Filter: 59%|█████▉ | 482000/818627 [00:54<00:38, 8694.37 examples/s]
+Filter: 59%|█████▉ | 482000/818627 [00:54<00:38, 8688.55 examples/s]
+Filter: 59%|█████▉ | 482000/818627 [00:54<00:38, 8691.20 examples/s]
+Filter: 59%|█████▉ | 482000/818627 [00:54<00:38, 8694.29 examples/s]
+Filter: 59%|█████▉ | 482000/818627 [00:54<00:38, 8690.69 examples/s]
+Filter: 59%|█████▉ | 482000/818627 [00:54<00:38, 8690.48 examples/s]
+Filter: 59%|█████▉ | 482000/818627 [00:54<00:38, 8697.77 examples/s]
+Filter: 59%|█████▉ | 483000/818627 [00:54<00:38, 8682.32 examples/s]
+Filter: 59%|█████▉ | 483000/818627 [00:54<00:38, 8681.16 examples/s]
+Filter: 59%|█████▉ | 483000/818627 [00:54<00:38, 8680.02 examples/s]
+Filter: 59%|█████▉ | 483000/818627 [00:54<00:38, 8680.61 examples/s]
+Filter: 59%|█████▉ | 483000/818627 [00:54<00:38, 8683.40 examples/s]
+Filter: 59%|█████▉ | 483000/818627 [00:54<00:38, 8680.82 examples/s]
+Filter: 59%|█████▉ | 483000/818627 [00:54<00:38, 8678.28 examples/s]
+Filter: 59%|█████▉ | 483000/818627 [00:54<00:38, 8688.12 examples/s]
+Filter: 59%|█████▉ | 484000/818627 [00:54<00:38, 8634.04 examples/s]
+Filter: 59%|█████▉ | 484000/818627 [00:54<00:38, 8636.49 examples/s]
+Filter: 59%|█████▉ | 484000/818627 [00:54<00:38, 8630.71 examples/s]
+Filter: 59%|█████▉ | 484000/818627 [00:55<00:38, 8632.48 examples/s]
+Filter: 59%|█████▉ | 484000/818627 [00:54<00:38, 8631.68 examples/s]
+Filter: 59%|█████▉ | 484000/818627 [00:54<00:38, 8629.12 examples/s]
+Filter: 59%|█████▉ | 484000/818627 [00:54<00:38, 8630.24 examples/s]
+Filter: 59%|█████▉ | 484000/818627 [00:54<00:38, 8632.90 examples/s]
+Filter: 59%|█████▉ | 485000/818627 [00:54<00:37, 8895.74 examples/s]
+Filter: 59%|█████▉ | 485000/818627 [00:55<00:37, 8897.63 examples/s]
+Filter: 59%|█████▉ | 485000/818627 [00:54<00:37, 8892.97 examples/s]
+Filter: 59%|█████▉ | 485000/818627 [00:54<00:37, 8893.76 examples/s]
+Filter: 59%|█████▉ | 485000/818627 [00:54<00:37, 8895.96 examples/s]
+Filter: 59%|█████▉ | 485000/818627 [00:54<00:37, 8892.41 examples/s]
+Filter: 59%|█████▉ | 485000/818627 [00:54<00:37, 8892.69 examples/s]
+Filter: 59%|█████▉ | 485000/818627 [00:54<00:37, 8900.61 examples/s]
+Filter: 59%|█████▉ | 486000/818627 [00:54<00:36, 9171.85 examples/s]
+Filter: 59%|█████▉ | 486000/818627 [00:54<00:36, 9166.62 examples/s]
+Filter: 59%|█████▉ | 486000/818627 [00:55<00:36, 9165.60 examples/s]
+Filter: 59%|█████▉ | 486000/818627 [00:54<00:36, 9161.63 examples/s]
+Filter: 59%|█████▉ | 486000/818627 [00:54<00:36, 9167.38 examples/s]
+Filter: 59%|█████▉ | 486000/818627 [00:54<00:36, 9159.38 examples/s]
+Filter: 59%|█████▉ | 486000/818627 [00:55<00:36, 9158.73 examples/s]
+Filter: 59%|█████▉ | 486000/818627 [00:54<00:36, 8998.42 examples/s]
+Filter: 59%|█████▉ | 487000/818627 [00:55<00:36, 9128.13 examples/s]
+Filter: 59%|█████▉ | 487000/818627 [00:55<00:36, 9128.11 examples/s]
+Filter: 59%|█████▉ | 487000/818627 [00:55<00:36, 9123.71 examples/s]
+Filter: 59%|█████▉ | 487000/818627 [00:55<00:36, 9121.78 examples/s]
+Filter: 59%|█████▉ | 487000/818627 [00:55<00:36, 9127.08 examples/s]
+Filter: 59%|█████▉ | 487000/818627 [00:55<00:36, 9127.97 examples/s]
+Filter: 59%|█████▉ | 487000/818627 [00:55<00:36, 9181.99 examples/s]
+Filter: 59%|█████▉ | 487000/818627 [00:55<00:36, 9122.52 examples/s]
+Filter: 60%|█████▉ | 488000/818627 [00:55<00:37, 8930.64 examples/s]
+Filter: 60%|█████▉ | 488000/818627 [00:55<00:37, 8928.44 examples/s]
+Filter: 60%|█████▉ | 488000/818627 [00:55<00:37, 8931.36 examples/s]
+Filter: 60%|█████▉ | 488000/818627 [00:55<00:37, 8929.94 examples/s]
+Filter: 60%|█████▉ | 488000/818627 [00:55<00:37, 8928.09 examples/s]
+Filter: 60%|█████▉ | 488000/818627 [00:55<00:37, 8928.97 examples/s]
+Filter: 60%|█████▉ | 488000/818627 [00:55<00:37, 8925.28 examples/s]
+Filter: 60%|█████▉ | 488000/818627 [00:55<00:36, 8958.86 examples/s]
+Filter: 60%|█████▉ | 489000/818627 [00:55<00:37, 8848.49 examples/s]
+Filter: 60%|█████▉ | 489000/818627 [00:55<00:37, 8849.34 examples/s]
+Filter: 60%|█████▉ | 489000/818627 [00:55<00:37, 8850.55 examples/s]
+Filter: 60%|█████▉ | 489000/818627 [00:55<00:37, 8849.97 examples/s]
+Filter: 60%|█████▉ | 489000/818627 [00:55<00:37, 8847.72 examples/s]
+Filter: 60%|█████▉ | 489000/818627 [00:55<00:37, 8844.87 examples/s]
+Filter: 60%|█████▉ | 489000/818627 [00:55<00:37, 8843.56 examples/s]
+Filter: 60%|█████▉ | 489000/818627 [00:55<00:37, 8871.48 examples/s]
+Filter: 60%|█████▉ | 490000/818627 [00:55<00:37, 8769.56 examples/s]
+Filter: 60%|█████▉ | 490000/818627 [00:55<00:37, 8773.31 examples/s]
+Filter: 60%|█████▉ | 490000/818627 [00:55<00:37, 8771.78 examples/s]
+Filter: 60%|█████▉ | 490000/818627 [00:55<00:37, 8760.20 examples/s]
+Filter: 60%|█████▉ | 490000/818627 [00:55<00:37, 8770.45 examples/s]
+Filter: 60%|█████▉ | 490000/818627 [00:55<00:37, 8767.35 examples/s]
+Filter: 60%|█████▉ | 490000/818627 [00:55<00:37, 8766.72 examples/s]
+Filter: 60%|█████▉ | 490000/818627 [00:55<00:37, 8786.04 examples/s]
+Filter: 60%|█████▉ | 491000/818627 [00:55<00:37, 8701.41 examples/s]
+Filter: 60%|█████▉ | 491000/818627 [00:55<00:37, 8699.54 examples/s]
+Filter: 60%|█████▉ | 491000/818627 [00:55<00:37, 8698.37 examples/s]
+Filter: 60%|█████▉ | 491000/818627 [00:55<00:37, 8698.21 examples/s]
+Filter: 60%|█████▉ | 491000/818627 [00:55<00:37, 8701.15 examples/s]
+Filter: 60%|█████▉ | 491000/818627 [00:55<00:37, 8699.74 examples/s]
+Filter: 60%|█████▉ | 491000/818627 [00:55<00:37, 8699.27 examples/s]
+Filter: 60%|█████▉ | 491000/818627 [00:55<00:37, 8705.65 examples/s]
+Filter: 60%|██████ | 492000/818627 [00:55<00:37, 8675.15 examples/s]
+Filter: 60%|██████ | 492000/818627 [00:55<00:37, 8672.92 examples/s]
+Filter: 60%|██████ | 492000/818627 [00:55<00:37, 8672.47 examples/s]
+Filter: 60%|██████ | 492000/818627 [00:55<00:37, 8665.85 examples/s]
+Filter: 60%|██████ | 492000/818627 [00:55<00:37, 8679.45 examples/s]
+Filter: 60%|██████ | 492000/818627 [00:55<00:37, 8677.04 examples/s]
+Filter: 60%|██████ | 492000/818627 [00:55<00:37, 8676.43 examples/s]
+Filter: 60%|██████ | 492000/818627 [00:55<00:37, 8685.77 examples/s]
+Filter: 60%|██████ | 493000/818627 [00:56<00:37, 8696.90 examples/s]
+Filter: 60%|██████ | 493000/818627 [00:55<00:37, 8690.29 examples/s]
+Filter: 60%|██████ | 493000/818627 [00:55<00:37, 8689.82 examples/s]
+Filter: 60%|██████ | 493000/818627 [00:55<00:37, 8693.92 examples/s]
+Filter: 60%|██████ | 493000/818627 [00:55<00:37, 8696.48 examples/s]
+Filter: 60%|██████ | 493000/818627 [00:55<00:37, 8694.85 examples/s]
+Filter: 60%|██████ | 493000/818627 [00:55<00:37, 8692.14 examples/s]
+Filter: 60%|██████ | 493000/818627 [00:55<00:37, 8691.07 examples/s]
+Filter: 60%|██████ | 494000/818627 [00:55<00:37, 8654.51 examples/s]
+Filter: 60%|██████ | 494000/818627 [00:55<00:37, 8652.80 examples/s]
+Filter: 60%|██████ | 494000/818627 [00:56<00:37, 8654.34 examples/s]
+Filter: 60%|██████ | 494000/818627 [00:55<00:37, 8651.86 examples/s]
+Filter: 60%|██████ | 494000/818627 [00:55<00:37, 8654.79 examples/s]
+Filter: 60%|██████ | 494000/818627 [00:55<00:37, 8653.19 examples/s]
+Filter: 60%|██████ | 494000/818627 [00:55<00:37, 8655.16 examples/s]
+Filter: 60%|██████ | 494000/818627 [00:55<00:37, 8664.97 examples/s]
+Filter: 60%|██████ | 495000/818627 [00:55<00:37, 8656.61 examples/s]
+Filter: 60%|██████ | 495000/818627 [00:56<00:37, 8657.60 examples/s]
+Filter: 60%|██████ | 495000/818627 [00:55<00:37, 8654.76 examples/s]
+Filter: 60%|██████ | 495000/818627 [00:55<00:37, 8655.34 examples/s]
+Filter: 60%|██████ | 495000/818627 [00:55<00:37, 8657.25 examples/s]
+Filter: 60%|██████ | 495000/818627 [00:55<00:37, 8656.37 examples/s]
+Filter: 60%|██████ | 495000/818627 [00:56<00:37, 8653.88 examples/s]
+Filter: 60%|██████ | 495000/818627 [00:55<00:37, 8662.50 examples/s]
+Filter: 61%|██████ | 496000/818627 [00:56<00:37, 8672.65 examples/s]
+Filter: 61%|██████ | 496000/818627 [00:56<00:37, 8672.49 examples/s]
+Filter: 61%|██████ | 496000/818627 [00:56<00:37, 8673.05 examples/s]
+Filter: 61%|██████ | 496000/818627 [00:56<00:37, 8670.61 examples/s]
+Filter: 61%|██████ | 496000/818627 [00:56<00:37, 8673.22 examples/s]
+Filter: 61%|██████ | 496000/818627 [00:56<00:37, 8674.31 examples/s]
+Filter: 61%|██████ | 496000/818627 [00:56<00:37, 8672.01 examples/s]
+Filter: 61%|██████ | 496000/818627 [00:56<00:37, 8503.63 examples/s]
+Filter: 61%|██████ | 497000/818627 [00:56<00:37, 8672.56 examples/s]
+Filter: 61%|██████ | 497000/818627 [00:56<00:37, 8666.32 examples/s]
+Filter: 61%|██████ | 497000/818627 [00:56<00:37, 8668.25 examples/s]
+Filter: 61%|██████ | 497000/818627 [00:56<00:37, 8670.07 examples/s]
+Filter: 61%|██████ | 497000/818627 [00:56<00:37, 8669.57 examples/s]
+Filter: 61%|██████ | 497000/818627 [00:56<00:37, 8671.75 examples/s]
+Filter: 61%|██████ | 497000/818627 [00:56<00:37, 8668.46 examples/s]
+Filter: 61%|██████ | 497000/818627 [00:56<00:36, 8720.66 examples/s]
+Filter: 61%|██████ | 498000/818627 [00:56<00:36, 8699.33 examples/s]
+Filter: 61%|██████ | 498000/818627 [00:56<00:36, 8701.90 examples/s]
+Filter: 61%|██████ | 498000/818627 [00:56<00:36, 8698.94 examples/s]
+Filter: 61%|██████ | 498000/818627 [00:56<00:36, 8696.62 examples/s]
+Filter: 61%|██████ | 498000/818627 [00:56<00:36, 8702.26 examples/s]
+Filter: 61%|██████ | 498000/818627 [00:56<00:36, 8697.47 examples/s]
+Filter: 61%|██████ | 498000/818627 [00:56<00:36, 8697.81 examples/s]
+Filter: 61%|██████ | 498000/818627 [00:56<00:36, 8742.27 examples/s]
+Filter: 61%|██████ | 499000/818627 [00:56<00:37, 8628.82 examples/s]
+Filter: 61%|██████ | 499000/818627 [00:56<00:37, 8629.20 examples/s]
+Filter: 61%|██████ | 499000/818627 [00:56<00:37, 8628.03 examples/s]
+Filter: 61%|██████ | 499000/818627 [00:56<00:37, 8631.08 examples/s]
+Filter: 61%|██████ | 499000/818627 [00:56<00:37, 8630.30 examples/s]
+Filter: 61%|██████ | 499000/818627 [00:56<00:37, 8629.29 examples/s]
+Filter: 61%|██████ | 499000/818627 [00:56<00:37, 8630.05 examples/s]
+Filter: 61%|██████ | 499000/818627 [00:56<00:36, 8654.35 examples/s]
+Filter: 61%|██████ | 500000/818627 [00:56<00:36, 8640.71 examples/s]
+Filter: 61%|██████ | 500000/818627 [00:56<00:36, 8640.12 examples/s]
+Filter: 61%|██████ | 500000/818627 [00:56<00:36, 8638.62 examples/s]
+Filter: 61%|██████ | 500000/818627 [00:56<00:36, 8640.26 examples/s]
+Filter: 61%|██████ | 500000/818627 [00:56<00:36, 8640.24 examples/s]
+Filter: 61%|██████ | 500000/818627 [00:56<00:36, 8639.07 examples/s]
+Filter: 61%|██████ | 500000/818627 [00:56<00:36, 8637.55 examples/s]
+Filter: 61%|██████ | 500000/818627 [00:56<00:36, 8658.71 examples/s]
+Filter: 61%|██████ | 501000/818627 [00:56<00:36, 8627.95 examples/s]
+Filter: 61%|██████ | 501000/818627 [00:56<00:36, 8627.65 examples/s]
+Filter: 61%|██████ | 501000/818627 [00:56<00:36, 8627.61 examples/s]
+Filter: 61%|██████ | 501000/818627 [00:56<00:36, 8628.06 examples/s]
+Filter: 61%|██████ | 501000/818627 [00:56<00:36, 8628.65 examples/s]
+Filter: 61%|██████ | 501000/818627 [00:56<00:36, 8629.84 examples/s]
+Filter: 61%|██████ | 501000/818627 [00:56<00:36, 8629.22 examples/s]
+Filter: 61%|██████ | 501000/818627 [00:56<00:36, 8640.67 examples/s]
+Filter: 61%|██████▏ | 502000/818627 [00:56<00:36, 8637.04 examples/s]
+Filter: 61%|██████▏ | 502000/818627 [00:56<00:36, 8637.12 examples/s]
+Filter: 61%|██████▏ | 502000/818627 [00:57<00:36, 8638.25 examples/s]
+Filter: 61%|██████▏ | 502000/818627 [00:56<00:36, 8636.93 examples/s]
+Filter: 61%|██████▏ | 502000/818627 [00:56<00:36, 8638.78 examples/s]
+Filter: 61%|██████▏ | 502000/818627 [00:56<00:36, 8637.00 examples/s]
+Filter: 61%|██████▏ | 502000/818627 [00:56<00:36, 8645.36 examples/s]
+Filter: 61%|██████▏ | 502000/818627 [00:56<00:36, 8623.21 examples/s]
+Filter: 61%|██████▏ | 503000/818627 [00:56<00:36, 8619.74 examples/s]
+Filter: 61%|██████▏ | 503000/818627 [00:56<00:36, 8617.80 examples/s]
+Filter: 61%|██████▏ | 503000/818627 [00:57<00:36, 8617.13 examples/s]
+Filter: 61%|██████▏ | 503000/818627 [00:56<00:36, 8618.03 examples/s]
+Filter: 61%|██████▏ | 503000/818627 [00:56<00:36, 8614.75 examples/s]
+Filter: 61%|██████▏ | 503000/818627 [00:56<00:36, 8614.17 examples/s]
+Filter: 61%|██████▏ | 503000/818627 [00:56<00:36, 8618.90 examples/s]
+Filter: 61%|██████▏ | 503000/818627 [00:56<00:36, 8623.15 examples/s]
+Filter: 62%|██████▏ | 504000/818627 [00:56<00:36, 8591.18 examples/s]
+Filter: 62%|██████▏ | 504000/818627 [00:57<00:36, 8584.62 examples/s]
+Filter: 62%|██████▏ | 504000/818627 [00:57<00:36, 8587.03 examples/s]
+Filter: 62%|██████▏ | 504000/818627 [00:56<00:36, 8591.64 examples/s]
+Filter: 62%|██████▏ | 504000/818627 [00:56<00:36, 8590.19 examples/s]
+Filter: 62%|██████▏ | 504000/818627 [00:57<00:36, 8591.99 examples/s]
+Filter: 62%|██████▏ | 504000/818627 [00:57<00:36, 8596.84 examples/s]
+Filter: 62%|██████▏ | 504000/818627 [00:57<00:37, 8456.97 examples/s]
+Filter: 62%|██████▏ | 505000/818627 [00:57<00:36, 8668.49 examples/s]
+Filter: 62%|██████▏ | 505000/818627 [00:57<00:36, 8662.40 examples/s]
+Filter: 62%|██████▏ | 505000/818627 [00:57<00:36, 8667.21 examples/s]
+Filter: 62%|██████▏ | 505000/818627 [00:57<00:36, 8699.75 examples/s]
+Filter: 62%|██████▏ | 505000/818627 [00:57<00:36, 8668.25 examples/s]
+Filter: 62%|██████▏ | 505000/818627 [00:57<00:36, 8670.09 examples/s]
+Filter: 62%|██████▏ | 505000/818627 [00:57<00:36, 8664.22 examples/s]
+Filter: 62%|██████▏ | 505000/818627 [00:57<00:36, 8664.83 examples/s]
+Filter: 62%|██████▏ | 506000/818627 [00:57<00:36, 8634.52 examples/s]
+Filter: 62%|██████▏ | 506000/818627 [00:57<00:36, 8659.46 examples/s]
+Filter: 62%|██████▏ | 506000/818627 [00:57<00:36, 8628.80 examples/s]
+Filter: 62%|██████▏ | 506000/818627 [00:57<00:36, 8626.91 examples/s]
+Filter: 62%|██████▏ | 506000/818627 [00:57<00:36, 8635.49 examples/s]
+Filter: 62%|██████▏ | 506000/818627 [00:57<00:36, 8632.65 examples/s]
+Filter: 62%|██████▏ | 506000/818627 [00:57<00:36, 8631.98 examples/s]
+Filter: 62%|██████▏ | 506000/818627 [00:57<00:36, 8635.95 examples/s]
+Filter: 62%|██████▏ | 507000/818627 [00:57<00:34, 8989.07 examples/s]
+Filter: 62%|██████▏ | 507000/818627 [00:57<00:34, 9011.76 examples/s]
+Filter: 62%|██████▏ | 507000/818627 [00:57<00:34, 8989.27 examples/s]
+Filter: 62%|██████▏ | 507000/818627 [00:57<00:34, 8986.77 examples/s]
+Filter: 62%|██████▏ | 507000/818627 [00:57<00:34, 8992.88 examples/s]
+Filter: 62%|██████▏ | 507000/818627 [00:57<00:34, 8987.61 examples/s]
+Filter: 62%|██████▏ | 507000/818627 [00:57<00:34, 8988.10 examples/s]
+Filter: 62%|██████▏ | 507000/818627 [00:57<00:34, 8985.33 examples/s]
+Filter: 62%|██████▏ | 508000/818627 [00:57<00:34, 9044.40 examples/s]
+Filter: 62%|██████▏ | 508000/818627 [00:57<00:34, 9026.16 examples/s]
+Filter: 62%|██████▏ | 508000/818627 [00:57<00:34, 9029.71 examples/s]
+Filter: 62%|██████▏ | 508000/818627 [00:57<00:34, 9028.99 examples/s]
+Filter: 62%|██████▏ | 508000/818627 [00:57<00:34, 9025.93 examples/s]
+Filter: 62%|██████▏ | 508000/818627 [00:57<00:34, 9026.00 examples/s]
+Filter: 62%|██████▏ | 508000/818627 [00:57<00:34, 9031.89 examples/s]
+Filter: 62%|██████▏ | 508000/818627 [00:57<00:34, 9019.64 examples/s]
+Filter: 62%|██████▏ | 509000/818627 [00:57<00:34, 8880.41 examples/s]
+Filter: 62%|██████▏ | 509000/818627 [00:57<00:34, 8867.91 examples/s]
+Filter: 62%|██████▏ | 509000/818627 [00:57<00:34, 8870.40 examples/s]
+Filter: 62%|██████▏ | 509000/818627 [00:57<00:34, 8857.60 examples/s]
+Filter: 62%|██████▏ | 509000/818627 [00:57<00:34, 8868.07 examples/s]
+Filter: 62%|██████▏ | 509000/818627 [00:57<00:34, 8867.45 examples/s]
+Filter: 62%|██████▏ | 509000/818627 [00:57<00:34, 8864.74 examples/s]
+Filter: 62%|██████▏ | 509000/818627 [00:57<00:35, 8746.97 examples/s]
+Filter: 62%|██████▏ | 510000/818627 [00:57<00:34, 8832.51 examples/s]
+Filter: 62%|██████▏ | 510000/818627 [00:57<00:34, 8835.84 examples/s]
+Filter: 62%|██████▏ | 510000/818627 [00:58<00:34, 8829.64 examples/s]
+Filter: 62%|██████▏ | 510000/818627 [00:57<00:34, 8824.59 examples/s]
+Filter: 62%|██████▏ | 510000/818627 [00:57<00:34, 8829.90 examples/s]
+Filter: 62%|██████▏ | 510000/818627 [00:57<00:34, 8828.91 examples/s]
+Filter: 62%|██████▏ | 510000/818627 [00:57<00:34, 8825.67 examples/s]
+Filter: 62%|██████▏ | 510000/818627 [00:57<00:34, 8866.89 examples/s]
+Filter: 62%|██████▏ | 511000/818627 [00:57<00:35, 8735.24 examples/s]
+Filter: 62%|██████▏ | 511000/818627 [00:57<00:35, 8737.76 examples/s]
+Filter: 62%|██████▏ | 511000/818627 [00:57<00:35, 8732.48 examples/s]
+Filter: 62%|██████▏ | 511000/818627 [00:57<00:35, 8734.00 examples/s]
+Filter: 62%|██████▏ | 511000/818627 [00:57<00:35, 8734.21 examples/s]
+Filter: 62%|██████▏ | 511000/818627 [00:57<00:35, 8732.55 examples/s]
+Filter: 62%|██████▏ | 511000/818627 [00:57<00:35, 8757.69 examples/s]
+Filter: 62%|██████▏ | 511000/818627 [00:58<00:35, 8670.06 examples/s]
+Filter: 63%|██████▎ | 512000/818627 [00:57<00:36, 8477.74 examples/s]
+Filter: 63%|██████▎ | 512000/818627 [00:58<00:36, 8495.27 examples/s]
+Filter: 63%|██████▎ | 512000/818627 [00:57<00:36, 8478.01 examples/s]
+Filter: 63%|██████▎ | 512000/818627 [00:57<00:36, 8478.14 examples/s]
+Filter: 63%|██████▎ | 512000/818627 [00:57<00:36, 8478.17 examples/s]
+Filter: 63%|██████▎ | 512000/818627 [00:57<00:36, 8478.48 examples/s]
+Filter: 63%|██████▎ | 512000/818627 [00:58<00:36, 8476.47 examples/s]
+Filter: 63%|██████▎ | 512000/818627 [00:57<00:36, 8495.91 examples/s]
+Filter: 63%|██████▎ | 513000/818627 [00:58<00:35, 8504.89 examples/s]
+Filter: 63%|██████▎ | 513000/818627 [00:58<00:35, 8516.58 examples/s]
+Filter: 63%|██████▎ | 513000/818627 [00:58<00:35, 8504.28 examples/s]
+Filter: 63%|██████▎ | 513000/818627 [00:58<00:35, 8504.64 examples/s]
+Filter: 63%|██████▎ | 513000/818627 [00:58<00:35, 8505.58 examples/s]
+Filter: 63%|██████▎ | 513000/818627 [00:58<00:35, 8504.74 examples/s]
+Filter: 63%|██████▎ | 513000/818627 [00:58<00:35, 8503.47 examples/s]
+Filter: 63%|██████▎ | 513000/818627 [00:58<00:35, 8512.63 examples/s]
+Filter: 63%|██████▎ | 514000/818627 [00:58<00:35, 8544.81 examples/s]
+Filter: 63%|██████▎ | 514000/818627 [00:58<00:35, 8545.04 examples/s]
+Filter: 63%|██████▎ | 514000/818627 [00:58<00:35, 8552.84 examples/s]
+Filter: 63%|██████▎ | 514000/818627 [00:58<00:35, 8543.31 examples/s]
+Filter: 63%|██████▎ | 514000/818627 [00:58<00:35, 8544.40 examples/s]
+Filter: 63%|██████▎ | 514000/818627 [00:58<00:35, 8542.88 examples/s]
+Filter: 63%|██████▎ | 514000/818627 [00:58<00:35, 8542.77 examples/s]
+Filter: 63%|██████▎ | 514000/818627 [00:58<00:35, 8552.58 examples/s]
+Filter: 63%|██████▎ | 515000/818627 [00:58<00:35, 8591.53 examples/s]
+Filter: 63%|██████▎ | 515000/818627 [00:58<00:35, 8592.59 examples/s]
+Filter: 63%|██████▎ | 515000/818627 [00:58<00:35, 8592.31 examples/s]
+Filter: 63%|██████▎ | 515000/818627 [00:58<00:35, 8596.32 examples/s]
+Filter: 63%|██████▎ | 515000/818627 [00:58<00:35, 8593.62 examples/s]
+Filter: 63%|██████▎ | 515000/818627 [00:58<00:35, 8592.27 examples/s]
+Filter: 63%|██████▎ | 515000/818627 [00:58<00:36, 8433.64 examples/s]
+Filter: 63%|██████▎ | 515000/818627 [00:58<00:36, 8390.98 examples/s]
+Filter: 63%|██████▎ | 516000/818627 [00:58<00:35, 8584.28 examples/s]
+Filter: 63%|██████▎ | 516000/818627 [00:58<00:35, 8584.14 examples/s]
+Filter: 63%|██████▎ | 516000/818627 [00:58<00:35, 8587.06 examples/s]
+Filter: 63%|██████▎ | 516000/818627 [00:58<00:35, 8584.39 examples/s]
+Filter: 63%|██████▎ | 516000/818627 [00:58<00:35, 8585.15 examples/s]
+Filter: 63%|██████▎ | 516000/818627 [00:58<00:35, 8583.53 examples/s]
+Filter: 63%|██████▎ | 516000/818627 [00:58<00:35, 8496.70 examples/s]
+Filter: 63%|██████▎ | 516000/818627 [00:58<00:35, 8473.84 examples/s]
+Filter: 63%|██████▎ | 517000/818627 [00:58<00:34, 8753.51 examples/s]
+Filter: 63%|██████▎ | 517000/818627 [00:58<00:34, 8760.14 examples/s]
+Filter: 63%|██████▎ | 517000/818627 [00:58<00:34, 8757.07 examples/s]
+Filter: 63%|██████▎ | 517000/818627 [00:58<00:34, 8753.82 examples/s]
+Filter: 63%|██████▎ | 517000/818627 [00:58<00:34, 8754.34 examples/s]
+Filter: 63%|██████▎ | 517000/818627 [00:58<00:34, 8832.01 examples/s]
+Filter: 63%|██████▎ | 517000/818627 [00:58<00:34, 8753.42 examples/s]
+Filter: 63%|██████▎ | 517000/818627 [00:58<00:34, 8860.83 examples/s]
+Filter: 63%|██████▎ | 518000/818627 [00:58<00:34, 8758.84 examples/s]
+Filter: 63%|██████▎ | 518000/818627 [00:58<00:34, 8761.17 examples/s]
+Filter: 63%|██████▎ | 518000/818627 [00:58<00:34, 8759.02 examples/s]
+Filter: 63%|██████▎ | 518000/818627 [00:58<00:34, 8758.54 examples/s]
+Filter: 63%|██████▎ | 518000/818627 [00:58<00:34, 8757.19 examples/s]
+Filter: 63%|██████▎ | 518000/818627 [00:58<00:34, 8810.37 examples/s]
+Filter: 63%|██████▎ | 518000/818627 [00:58<00:34, 8830.68 examples/s]
+Filter: 63%|██████▎ | 518000/818627 [00:58<00:34, 8731.20 examples/s]
+Filter: 63%|██████▎ | 519000/818627 [00:58<00:34, 8738.90 examples/s]
+Filter: 63%|██████▎ | 519000/818627 [00:58<00:34, 8738.18 examples/s]
+Filter: 63%|██████▎ | 519000/818627 [00:59<00:34, 8740.27 examples/s]
+Filter: 63%|██████▎ | 519000/818627 [00:58<00:34, 8744.72 examples/s]
+Filter: 63%|██████▎ | 519000/818627 [00:58<00:34, 8737.60 examples/s]
+Filter: 63%|██████▎ | 519000/818627 [00:58<00:34, 8736.96 examples/s]
+Filter: 63%|██████▎ | 519000/818627 [00:58<00:34, 8794.75 examples/s]
+Filter: 63%|██████▎ | 519000/818627 [00:58<00:34, 8775.78 examples/s]
+Filter: 64%|██████▎ | 520000/818627 [00:58<00:34, 8772.05 examples/s]
+Filter: 64%|██████▎ | 520000/818627 [00:58<00:34, 8772.34 examples/s]
+Filter: 64%|██████▎ | 520000/818627 [00:59<00:34, 8775.10 examples/s]
+Filter: 64%|██████▎ | 520000/818627 [00:58<00:34, 8777.59 examples/s]
+Filter: 64%|██████▎ | 520000/818627 [00:58<00:34, 8773.73 examples/s]
+Filter: 64%|██████▎ | 520000/818627 [00:58<00:34, 8771.66 examples/s]
+Filter: 64%|██████▎ | 520000/818627 [00:58<00:33, 8798.24 examples/s]
+Filter: 64%|██████▎ | 520000/818627 [00:58<00:33, 8804.78 examples/s]
+Filter: 64%|██████▎ | 521000/818627 [00:58<00:33, 8766.84 examples/s]
+Filter: 64%|██████▎ | 521000/818627 [00:58<00:33, 8766.97 examples/s]
+Filter: 64%|██████▎ | 521000/818627 [00:59<00:33, 8767.40 examples/s]
+Filter: 64%|██████▎ | 521000/818627 [00:58<00:33, 8770.89 examples/s]
+Filter: 64%|██████▎ | 521000/818627 [00:58<00:33, 8767.51 examples/s]
+Filter: 64%|██████▎ | 521000/818627 [00:58<00:33, 8795.43 examples/s]
+Filter: 64%|██████▎ | 521000/818627 [00:58<00:33, 8783.09 examples/s]
+Filter: 64%|██████▎ | 521000/818627 [00:59<00:33, 8758.95 examples/s]
+Filter: 64%|██████▍ | 522000/818627 [00:59<00:34, 8723.45 examples/s]
+Filter: 64%|██████▍ | 522000/818627 [00:59<00:33, 8725.73 examples/s]
+Filter: 64%|██████▍ | 522000/818627 [00:59<00:33, 8724.64 examples/s]
+Filter: 64%|██████▍ | 522000/818627 [00:59<00:34, 8720.71 examples/s]
+Filter: 64%|██████▍ | 522000/818627 [00:59<00:33, 8735.61 examples/s]
+Filter: 64%|██████▍ | 522000/818627 [00:59<00:33, 8740.65 examples/s]
+Filter: 64%|██████▍ | 522000/818627 [00:59<00:34, 8719.63 examples/s]
+Filter: 64%|██████▍ | 522000/818627 [00:59<00:34, 8715.97 examples/s]
+Filter: 64%|██████▍ | 523000/818627 [00:59<00:34, 8671.71 examples/s]
+Filter: 64%|██████▍ | 523000/818627 [00:59<00:34, 8669.42 examples/s]
+Filter: 64%|██████▍ | 523000/818627 [00:59<00:34, 8670.18 examples/s]
+Filter: 64%|██████▍ | 523000/818627 [00:59<00:34, 8675.37 examples/s]
+Filter: 64%|██████▍ | 523000/818627 [00:59<00:34, 8673.38 examples/s]
+Filter: 64%|██████▍ | 523000/818627 [00:59<00:34, 8670.46 examples/s]
+Filter: 64%|██████▍ | 523000/818627 [00:59<00:34, 8679.57 examples/s]
+Filter: 64%|██████▍ | 523000/818627 [00:59<00:34, 8684.17 examples/s]
+Filter: 64%|██████▍ | 524000/818627 [00:59<00:33, 8838.85 examples/s]
+Filter: 64%|██████▍ | 524000/818627 [00:59<00:33, 8819.63 examples/s]
+Filter: 64%|██████▍ | 524000/818627 [00:59<00:33, 8811.93 examples/s]
+Filter: 64%|██████▍ | 524000/818627 [00:59<00:33, 8802.94 examples/s]
+Filter: 64%|██████▍ | 524000/818627 [00:59<00:33, 8815.09 examples/s]
+Filter: 64%|██████▍ | 524000/818627 [00:59<00:33, 8820.00 examples/s]
+Filter: 64%|██████▍ | 524000/818627 [00:59<00:33, 8793.68 examples/s]
+Filter: 64%|██████▍ | 524000/818627 [00:59<00:34, 8646.12 examples/s]
+Filter: 64%|██████▍ | 525000/818627 [00:59<00:33, 8766.43 examples/s]
+Filter: 64%|██████▍ | 525000/818627 [00:59<00:33, 8758.86 examples/s]
+Filter: 64%|██████▍ | 525000/818627 [00:59<00:33, 8765.71 examples/s]
+Filter: 64%|██████▍ | 525000/818627 [00:59<00:33, 8742.72 examples/s]
+Filter: 64%|██████▍ | 525000/818627 [00:59<00:33, 8751.07 examples/s]
+Filter: 64%|██████▍ | 525000/818627 [00:59<00:33, 8813.58 examples/s]
+Filter: 64%|██████▍ | 525000/818627 [00:59<00:33, 8727.24 examples/s]
+Filter: 64%|██████▍ | 525000/818627 [00:59<00:33, 8729.70 examples/s]
+Filter: 64%|██████▍ | 526000/818627 [00:59<00:33, 8735.63 examples/s]
+Filter: 64%|██████▍ | 526000/818627 [00:59<00:33, 8732.05 examples/s]
+Filter: 64%|██████▍ | 526000/818627 [00:59<00:33, 8718.27 examples/s]
+Filter: 64%|██████▍ | 526000/818627 [00:59<00:33, 8714.34 examples/s]
+Filter: 64%|██████▍ | 526000/818627 [00:59<00:33, 8729.97 examples/s]
+Filter: 64%|██████▍ | 526000/818627 [00:59<00:33, 8741.25 examples/s]
+Filter: 64%|██████▍ | 526000/818627 [00:59<00:33, 8729.70 examples/s]
+Filter: 64%|██████▍ | 526000/818627 [00:59<00:33, 8767.56 examples/s]
+Filter: 64%|██████▍ | 527000/818627 [00:59<00:33, 8732.28 examples/s]
+Filter: 64%|██████▍ | 527000/818627 [00:59<00:33, 8731.31 examples/s]
+Filter: 64%|██████▍ | 527000/818627 [00:59<00:33, 8726.93 examples/s]
+Filter: 64%|██████▍ | 527000/818627 [00:59<00:33, 8723.73 examples/s]
+Filter: 64%|██████▍ | 527000/818627 [00:59<00:33, 8742.47 examples/s]
+Filter: 64%|██████▍ | 527000/818627 [00:59<00:33, 8736.59 examples/s]
+Filter: 64%|██████▍ | 527000/818627 [00:59<00:33, 8729.62 examples/s]
+Filter: 64%|██████▍ | 527000/818627 [00:59<00:33, 8760.40 examples/s]
+Filter: 64%|██████▍ | 528000/818627 [00:59<00:33, 8778.57 examples/s]
+Filter: 64%|██████▍ | 528000/818627 [00:59<00:33, 8777.34 examples/s]
+Filter: 64%|██████▍ | 528000/818627 [00:59<00:33, 8772.82 examples/s]
+Filter: 64%|██████▍ | 528000/818627 [01:00<00:33, 8771.60 examples/s]
+Filter: 64%|██████▍ | 528000/818627 [00:59<00:33, 8780.67 examples/s]
+Filter: 64%|██████▍ | 528000/818627 [00:59<00:33, 8778.44 examples/s]
+Filter: 64%|██████▍ | 528000/818627 [00:59<00:33, 8781.24 examples/s]
+Filter: 64%|██████▍ | 528000/818627 [00:59<00:33, 8792.09 examples/s]
+Filter: 65%|██████▍ | 529000/818627 [00:59<00:31, 9101.54 examples/s]
+Filter: 65%|██████▍ | 529000/818627 [01:00<00:31, 9105.31 examples/s]
+Filter: 65%|██████▍ | 529000/818627 [00:59<00:31, 9102.53 examples/s]
+Filter: 65%|██████▍ | 529000/818627 [00:59<00:31, 9102.41 examples/s]
+Filter: 65%|██████▍ | 529000/818627 [00:59<00:31, 9106.46 examples/s]
+Filter: 65%|██████▍ | 529000/818627 [00:59<00:31, 9102.13 examples/s]
+Filter: 65%|██████▍ | 529000/818627 [00:59<00:31, 9101.86 examples/s]
+Filter: 65%|██████▍ | 529000/818627 [00:59<00:31, 9108.93 examples/s]
+Filter: 65%|██████▍ | 530000/818627 [00:59<00:31, 9059.17 examples/s]
+Filter: 65%|██████▍ | 530000/818627 [00:59<00:31, 9060.02 examples/s]
+Filter: 65%|██████▍ | 530000/818627 [00:59<00:31, 9059.03 examples/s]
+Filter: 65%|██████▍ | 530000/818627 [01:00<00:31, 9051.17 examples/s]
+Filter: 65%|██████▍ | 530000/818627 [00:59<00:31, 9058.33 examples/s]
+Filter: 65%|██████▍ | 530000/818627 [01:00<00:31, 9056.08 examples/s]
+Filter: 65%|██████▍ | 530000/818627 [00:59<00:31, 9058.15 examples/s]
+Filter: 65%|██████▍ | 530000/818627 [00:59<00:31, 9072.74 examples/s]
+Filter: 65%|██████▍ | 531000/818627 [01:00<00:31, 9116.89 examples/s]
+Filter: 65%|██████▍ | 531000/818627 [01:00<00:31, 9118.02 examples/s]
+Filter: 65%|██████▍ | 531000/818627 [01:00<00:31, 9117.92 examples/s]
+Filter: 65%|██████▍ | 531000/818627 [01:00<00:31, 9114.71 examples/s]
+Filter: 65%|██████▍ | 531000/818627 [01:00<00:31, 9117.68 examples/s]
+Filter: 65%|██████▍ | 531000/818627 [01:00<00:31, 9118.03 examples/s]
+Filter: 65%|██████▍ | 531000/818627 [01:00<00:31, 9116.38 examples/s]
+Filter: 65%|██████▍ | 531000/818627 [01:00<00:31, 9125.71 examples/s]
+Filter: 65%|██████▍ | 532000/818627 [01:00<00:31, 8984.36 examples/s]
+Filter: 65%|██████▍ | 532000/818627 [01:00<00:31, 8984.47 examples/s]
+Filter: 65%|██████▍ | 532000/818627 [01:00<00:31, 8982.65 examples/s]
+Filter: 65%|██████▍ | 532000/818627 [01:00<00:31, 8982.96 examples/s]
+Filter: 65%|██████▍ | 532000/818627 [01:00<00:31, 8983.07 examples/s]
+Filter: 65%|██████▍ | 532000/818627 [01:00<00:31, 8984.52 examples/s]
+Filter: 65%|██████▍ | 532000/818627 [01:00<00:31, 8981.02 examples/s]
+Filter: 65%|██████▍ | 532000/818627 [01:00<00:31, 8989.67 examples/s]
+Filter: 65%|██████▌ | 533000/818627 [01:00<00:32, 8879.52 examples/s]
+Filter: 65%|██████▌ | 533000/818627 [01:00<00:32, 8881.70 examples/s]
+Filter: 65%|██████▌ | 533000/818627 [01:00<00:32, 8879.01 examples/s]
+Filter: 65%|██████▌ | 533000/818627 [01:00<00:32, 8876.61 examples/s]
+Filter: 65%|██████▌ | 533000/818627 [01:00<00:32, 8878.30 examples/s]
+Filter: 65%|██████▌ | 533000/818627 [01:00<00:32, 8879.71 examples/s]
+Filter: 65%|██████▌ | 533000/818627 [01:00<00:32, 8879.57 examples/s]
+Filter: 65%|██████▌ | 533000/818627 [01:00<00:32, 8878.31 examples/s]
+Filter: 65%|██████▌ | 534000/818627 [01:00<00:32, 8824.72 examples/s]
+Filter: 65%|██████▌ | 534000/818627 [01:00<00:32, 8825.65 examples/s]
+Filter: 65%|██████▌ | 534000/818627 [01:00<00:32, 8815.58 examples/s]
+Filter: 65%|██████▌ | 534000/818627 [01:00<00:32, 8825.42 examples/s]
+Filter: 65%|██████▌ | 534000/818627 [01:00<00:32, 8827.06 examples/s]
+Filter: 65%|██████▌ | 534000/818627 [01:00<00:32, 8799.64 examples/s]
+Filter: 65%|██████▌ | 534000/818627 [01:00<00:32, 8791.95 examples/s]
+Filter: 65%|██████▌ | 534000/818627 [01:00<00:32, 8761.25 examples/s]
+Filter: 65%|██████▌ | 535000/818627 [01:00<00:32, 8808.16 examples/s]
+Filter: 65%|██████▌ | 535000/818627 [01:00<00:32, 8809.70 examples/s]
+Filter: 65%|██████▌ | 535000/818627 [01:00<00:32, 8813.64 examples/s]
+Filter: 65%|██████▌ | 535000/818627 [01:00<00:32, 8806.01 examples/s]
+Filter: 65%|██████▌ | 535000/818627 [01:00<00:32, 8817.32 examples/s]
+Filter: 65%|██████▌ | 535000/818627 [01:00<00:32, 8807.72 examples/s]
+Filter: 65%|██████▌ | 535000/818627 [01:00<00:32, 8812.98 examples/s]
+Filter: 65%|██████▌ | 535000/818627 [01:00<00:32, 8823.44 examples/s]
+Filter: 65%|██████▌ | 536000/818627 [01:00<00:31, 9099.11 examples/s]
+Filter: 65%|██████▌ | 536000/818627 [01:00<00:31, 9076.72 examples/s]
+Filter: 65%|██████▌ | 536000/818627 [01:00<00:31, 9049.75 examples/s]
+Filter: 65%|██████▌ | 536000/818627 [01:00<00:31, 9055.05 examples/s]
+Filter: 65%|██████▌ | 536000/818627 [01:00<00:31, 9054.23 examples/s]
+Filter: 65%|██████▌ | 536000/818627 [01:00<00:31, 9068.08 examples/s]
+Filter: 65%|██████▌ | 536000/818627 [01:00<00:31, 9053.76 examples/s]
+Filter: 65%|██████▌ | 536000/818627 [01:00<00:31, 9030.88 examples/s]
+Filter: 66%|██████▌ | 537000/818627 [01:00<00:31, 9064.63 examples/s]
+Filter: 66%|██████▌ | 537000/818627 [01:00<00:30, 9085.14 examples/s]
+Filter: 66%|██████▌ | 537000/818627 [01:00<00:31, 9063.19 examples/s]
+Filter: 66%|██████▌ | 537000/818627 [01:00<00:31, 9051.48 examples/s]
+Filter: 66%|██████▌ | 537000/818627 [01:01<00:31, 9050.57 examples/s]
+Filter: 66%|██████▌ | 537000/818627 [01:00<00:31, 9036.89 examples/s]
+Filter: 66%|██████▌ | 537000/818627 [01:00<00:31, 9036.68 examples/s]
+Filter: 66%|██████▌ | 537000/818627 [01:00<00:31, 9037.05 examples/s]
+Filter: 66%|██████▌ | 538000/818627 [01:00<00:30, 9095.74 examples/s]
+Filter: 66%|██████▌ | 538000/818627 [01:00<00:30, 9097.32 examples/s]
+Filter: 66%|██████▌ | 538000/818627 [01:01<00:30, 9098.09 examples/s]
+Filter: 66%|██████▌ | 538000/818627 [01:00<00:30, 9090.17 examples/s]
+Filter: 66%|██████▌ | 538000/818627 [01:00<00:30, 9099.30 examples/s]
+Filter: 66%|██████▌ | 538000/818627 [01:00<00:30, 9087.74 examples/s]
+Filter: 66%|██████▌ | 538000/818627 [01:00<00:30, 9086.27 examples/s]
+Filter: 66%|██████▌ | 538000/818627 [01:00<00:30, 9068.92 examples/s]
+Filter: 66%|██████▌ | 539000/818627 [01:00<00:31, 8965.95 examples/s]
+Filter: 66%|██████▌ | 539000/818627 [01:00<00:31, 8967.68 examples/s]
+Filter: 66%|██████▌ | 539000/818627 [01:01<00:31, 8969.36 examples/s]
+Filter: 66%|██████▌ | 539000/818627 [01:00<00:31, 8964.17 examples/s]
+Filter: 66%|██████▌ | 539000/818627 [01:00<00:31, 8969.30 examples/s]
+Filter: 66%|██████▌ | 539000/818627 [01:00<00:31, 8969.51 examples/s]
+Filter: 66%|██████▌ | 539000/818627 [01:01<00:31, 8961.78 examples/s]
+Filter: 66%|██████▌ | 539000/818627 [01:00<00:31, 8953.35 examples/s]
+Filter: 66%|██████▌ | 540000/818627 [01:01<00:31, 8873.86 examples/s]
+Filter: 66%|██████▌ | 540000/818627 [01:01<00:31, 8871.60 examples/s]
+Filter: 66%|██████▌ | 540000/818627 [01:01<00:31, 8869.04 examples/s]
+Filter: 66%|██████▌ | 540000/818627 [01:01<00:31, 8868.37 examples/s]
+Filter: 66%|██████▌ | 540000/818627 [01:01<00:31, 8879.70 examples/s]
+Filter: 66%|██████▌ | 540000/818627 [01:01<00:31, 8876.02 examples/s]
+Filter: 66%|██████▌ | 540000/818627 [01:01<00:31, 8863.59 examples/s]
+Filter: 66%|██████▌ | 540000/818627 [01:01<00:31, 8740.63 examples/s]
+Filter: 66%|██████▌ | 541000/818627 [01:01<00:31, 8839.25 examples/s]
+Filter: 66%|██████▌ | 541000/818627 [01:01<00:31, 8834.69 examples/s]
+Filter: 66%|██████▌ | 541000/818627 [01:01<00:31, 8842.09 examples/s]
+Filter: 66%|██████▌ | 541000/818627 [01:01<00:31, 8829.65 examples/s]
+Filter: 66%|██████▌ | 541000/818627 [01:01<00:31, 8840.64 examples/s]
+Filter: 66%|██████▌ | 541000/818627 [01:01<00:31, 8876.85 examples/s]
+Filter: 66%|██████▌ | 541000/818627 [01:01<00:31, 8835.35 examples/s]
+Filter: 66%|██████▌ | 541000/818627 [01:01<00:31, 8830.13 examples/s]
+Filter: 66%|██████▌ | 542000/818627 [01:01<00:31, 8778.90 examples/s]
+Filter: 66%|██████▌ | 542000/818627 [01:01<00:31, 8774.30 examples/s]
+Filter: 66%|██████▌ | 542000/818627 [01:01<00:31, 8778.52 examples/s]
+Filter: 66%|██████▌ | 542000/818627 [01:01<00:31, 8774.39 examples/s]
+Filter: 66%|██████▌ | 542000/818627 [01:01<00:31, 8780.26 examples/s]
+Filter: 66%|██████▌ | 542000/818627 [01:01<00:31, 8806.85 examples/s]
+Filter: 66%|██████▌ | 542000/818627 [01:01<00:31, 8780.37 examples/s]
+Filter: 66%|██████▌ | 542000/818627 [01:01<00:31, 8777.92 examples/s]
+Filter: 66%|██████▋ | 543000/818627 [01:01<00:30, 9097.95 examples/s]
+Filter: 66%|██████▋ | 543000/818627 [01:01<00:30, 9098.54 examples/s]
+Filter: 66%|██████▋ | 543000/818627 [01:01<00:30, 9093.03 examples/s]
+Filter: 66%|██████▋ | 543000/818627 [01:01<00:30, 9097.19 examples/s]
+Filter: 66%|██████▋ | 543000/818627 [01:01<00:30, 9116.82 examples/s]
+Filter: 66%|██████▋ | 543000/818627 [01:01<00:30, 9097.27 examples/s]
+Filter: 66%|██████▋ | 543000/818627 [01:01<00:30, 9079.66 examples/s]
+Filter: 66%|██████▋ | 543000/818627 [01:01<00:30, 8999.13 examples/s]
+Filter: 66%|██████▋ | 544000/818627 [01:01<00:30, 9114.52 examples/s]
+Filter: 66%|██████▋ | 544000/818627 [01:01<00:30, 9120.41 examples/s]
+Filter: 66%|██████▋ | 544000/818627 [01:01<00:30, 9114.21 examples/s]
+Filter: 66%|██████▋ | 544000/818627 [01:01<00:30, 9113.65 examples/s]
+Filter: 66%|██████▋ | 544000/818627 [01:01<00:30, 9116.37 examples/s]
+Filter: 66%|██████▋ | 544000/818627 [01:01<00:30, 9116.73 examples/s]
+Filter: 66%|██████▋ | 544000/818627 [01:01<00:30, 9129.28 examples/s]
+Filter: 66%|██████▋ | 544000/818627 [01:01<00:30, 9140.86 examples/s]
+Filter: 67%|██████▋ | 545000/818627 [01:01<00:29, 9148.66 examples/s]
+Filter: 67%|██████▋ | 545000/818627 [01:01<00:29, 9152.79 examples/s]
+Filter: 67%|██████▋ | 545000/818627 [01:01<00:29, 9149.56 examples/s]
+Filter: 67%|██████▋ | 545000/818627 [01:01<00:29, 9144.94 examples/s]
+Filter: 67%|██████▋ | 545000/818627 [01:01<00:29, 9152.54 examples/s]
+Filter: 67%|██████▋ | 545000/818627 [01:01<00:29, 9160.47 examples/s]
+Filter: 67%|██████▋ | 545000/818627 [01:01<00:29, 9171.71 examples/s]
+Filter: 67%|██████▋ | 545000/818627 [01:01<00:30, 8980.03 examples/s]
+Filter: 67%|██████▋ | 546000/818627 [01:01<00:30, 9019.19 examples/s]
+Filter: 67%|██████▋ | 546000/818627 [01:02<00:30, 9014.29 examples/s]
+Filter: 67%|██████▋ | 546000/818627 [01:01<00:30, 9008.10 examples/s]
+Filter: 67%|██████▋ | 546000/818627 [01:01<00:30, 9018.34 examples/s]
+Filter: 67%|██████▋ | 546000/818627 [01:01<00:30, 9022.42 examples/s]
+Filter: 67%|██████▋ | 546000/818627 [01:01<00:30, 9031.12 examples/s]
+Filter: 67%|██████▋ | 546000/818627 [01:01<00:30, 9063.82 examples/s]
+Filter: 67%|██████▋ | 546000/818627 [01:01<00:30, 8964.97 examples/s]
+Filter: 67%|██████▋ | 547000/818627 [01:01<00:30, 8932.93 examples/s]
+Filter: 67%|██████▋ | 547000/818627 [01:01<00:30, 8943.74 examples/s]
+Filter: 67%|██████▋ | 547000/818627 [01:01<00:30, 8935.04 examples/s]
+Filter: 67%|██████▋ | 547000/818627 [01:02<00:30, 8930.12 examples/s]
+Filter: 67%|██████▋ | 547000/818627 [01:01<00:30, 8936.93 examples/s]
+Filter: 67%|██████▋ | 547000/818627 [01:01<00:30, 8965.83 examples/s]
+Filter: 67%|██████▋ | 547000/818627 [01:01<00:30, 8928.31 examples/s]
+Filter: 67%|██████▋ | 547000/818627 [01:01<00:30, 8938.58 examples/s]
+Filter: 67%|██████▋ | 548000/818627 [01:01<00:30, 8894.47 examples/s]
+Filter: 67%|██████▋ | 548000/818627 [01:01<00:30, 8884.48 examples/s]
+Filter: 67%|██████▋ | 548000/818627 [01:02<00:30, 8886.15 examples/s]
+Filter: 67%|██████▋ | 548000/818627 [01:01<00:30, 8876.35 examples/s]
+Filter: 67%|██████▋ | 548000/818627 [01:01<00:30, 8882.63 examples/s]
+Filter: 67%|██████▋ | 548000/818627 [01:01<00:30, 8901.00 examples/s]
+Filter: 67%|██████▋ | 548000/818627 [01:01<00:30, 8886.32 examples/s]
+Filter: 67%|██████▋ | 548000/818627 [01:02<00:30, 8877.57 examples/s]
+Filter: 67%|██████▋ | 549000/818627 [01:02<00:30, 8787.40 examples/s]
+Filter: 67%|██████▋ | 549000/818627 [01:02<00:30, 8780.08 examples/s]
+Filter: 67%|██████▋ | 549000/818627 [01:02<00:30, 8780.80 examples/s]
+Filter: 67%|██████▋ | 549000/818627 [01:02<00:30, 8782.23 examples/s]
+Filter: 67%|██████▋ | 549000/818627 [01:02<00:30, 8784.69 examples/s]
+Filter: 67%|██████▋ | 549000/818627 [01:02<00:30, 8779.37 examples/s]
+Filter: 67%|██████▋ | 549000/818627 [01:02<00:30, 8797.01 examples/s]
+Filter: 67%|██████▋ | 549000/818627 [01:02<00:30, 8783.42 examples/s]
+Filter: 67%|██████▋ | 550000/818627 [01:02<00:30, 8803.27 examples/s]
+Filter: 67%|██████▋ | 550000/818627 [01:02<00:30, 8795.15 examples/s]
+Filter: 67%|██████▋ | 550000/818627 [01:02<00:30, 8798.56 examples/s]
+Filter: 67%|██████▋ | 550000/818627 [01:02<00:30, 8789.93 examples/s]
+Filter: 67%|██████▋ | 550000/818627 [01:02<00:30, 8811.45 examples/s]
+Filter: 67%|██████▋ | 550000/818627 [01:02<00:30, 8793.52 examples/s]
+Filter: 67%|██████▋ | 550000/818627 [01:02<00:30, 8800.07 examples/s]
+Filter: 67%|██████▋ | 550000/818627 [01:02<00:30, 8798.65 examples/s]
+Filter: 67%|██████▋ | 551000/818627 [01:02<00:30, 8745.29 examples/s]
+Filter: 67%|██████▋ | 551000/818627 [01:02<00:30, 8745.09 examples/s]
+Filter: 67%|██████▋ | 551000/818627 [01:02<00:30, 8739.78 examples/s]
+Filter: 67%|██████▋ | 551000/818627 [01:02<00:30, 8745.26 examples/s]
+Filter: 67%|██████▋ | 551000/818627 [01:02<00:30, 8748.67 examples/s]
+Filter: 67%|██████▋ | 551000/818627 [01:02<00:30, 8752.42 examples/s]
+Filter: 67%|██████▋ | 551000/818627 [01:02<00:30, 8748.61 examples/s]
+Filter: 67%|██████▋ | 551000/818627 [01:02<00:30, 8686.03 examples/s]
+Filter: 67%|██████▋ | 552000/818627 [01:02<00:30, 8755.14 examples/s]
+Filter: 67%|██████▋ | 552000/818627 [01:02<00:30, 8754.02 examples/s]
+Filter: 67%|██████▋ | 552000/818627 [01:02<00:30, 8756.02 examples/s]
+Filter: 67%|██████▋ | 552000/818627 [01:02<00:30, 8742.93 examples/s]
+Filter: 67%|██████▋ | 552000/818627 [01:02<00:30, 8758.86 examples/s]
+Filter: 67%|██████▋ | 552000/818627 [01:02<00:30, 8756.39 examples/s]
+Filter: 67%|██████▋ | 552000/818627 [01:02<00:30, 8751.40 examples/s]
+Filter: 67%|██████▋ | 552000/818627 [01:02<00:30, 8768.56 examples/s]
+Filter: 68%|██████▊ | 553000/818627 [01:02<00:30, 8748.46 examples/s]
+Filter: 68%|██████▊ | 553000/818627 [01:02<00:30, 8747.52 examples/s]
+Filter: 68%|██████▊ | 553000/818627 [01:02<00:30, 8750.58 examples/s]
+Filter: 68%|██████▊ | 553000/818627 [01:02<00:30, 8757.98 examples/s]
+Filter: 68%|██████▊ | 553000/818627 [01:02<00:30, 8751.69 examples/s]
+Filter: 68%|██████▊ | 553000/818627 [01:02<00:30, 8762.04 examples/s]
+Filter: 68%|██████▊ | 553000/818627 [01:02<00:30, 8741.87 examples/s]
+Filter: 68%|██████▊ | 554000/818627 [01:02<00:29, 8824.51 examples/s]
+Filter: 68%|██████▊ | 554000/818627 [01:02<00:29, 8822.52 examples/s]
+Filter: 68%|██████▊ | 554000/818627 [01:02<00:29, 8822.27 examples/s]
+Filter: 68%|██████▊ | 555000/818627 [01:02<00:29, 8869.88 examples/s]
+Filter: 68%|██████▊ | 555000/818627 [01:02<00:29, 8864.51 examples/s]
+Filter: 68%|██████▊ | 555000/818627 [01:02<00:29, 8861.14 examples/s]
+Filter: 68%|██████▊ | 556000/818627 [01:02<00:28, 9172.03 examples/s]
+Filter: 68%|██████▊ | 556000/818627 [01:02<00:28, 9171.45 examples/s]
+Filter: 68%|██████▊ | 556000/818627 [01:02<00:28, 9170.03 examples/s]
+Filter: 68%|██████▊ | 554000/818627 [01:02<00:52, 5073.48 examples/s]
+Filter: 68%|██████▊ | 553000/818627 [01:03<01:02, 4239.17 examples/s]
+Filter: 68%|██████▊ | 554000/818627 [01:02<00:53, 4950.08 examples/s]
+Filter: 68%|██████▊ | 557000/818627 [01:02<00:28, 9213.86 examples/s]
+Filter: 68%|██████▊ | 557000/818627 [01:02<00:28, 9227.43 examples/s]
+Filter: 68%|██████▊ | 557000/818627 [01:03<00:28, 9225.79 examples/s]
+Filter: 68%|██████▊ | 554000/818627 [01:02<00:55, 4753.83 examples/s]
+Filter: 68%|██████▊ | 554000/818627 [01:02<00:56, 4703.89 examples/s]
+Filter: 68%|██████▊ | 558000/818627 [01:03<00:28, 9107.46 examples/s]
+Filter: 68%|██████▊ | 558000/818627 [01:03<00:28, 9108.37 examples/s]
+Filter: 68%|██████▊ | 558000/818627 [01:03<00:28, 9107.50 examples/s]
+Filter: 68%|██████▊ | 556000/818627 [01:03<00:37, 7055.13 examples/s]
+Filter: 68%|██████▊ | 556000/818627 [01:03<00:37, 6946.09 examples/s]
+Filter: 68%|██████▊ | 555000/818627 [01:03<00:42, 6154.39 examples/s]
+Filter: 68%|██████▊ | 556000/818627 [01:03<00:39, 6712.35 examples/s]
+Filter: 68%|██████▊ | 556000/818627 [01:03<00:39, 6570.82 examples/s]
+Filter: 68%|██████▊ | 558000/818627 [01:03<00:30, 8662.95 examples/s]
+Filter: 68%|██████▊ | 558000/818627 [01:03<00:30, 8585.86 examples/s]
+Filter: 68%|██████▊ | 557000/818627 [01:03<00:33, 7820.23 examples/s]
+Filter: 68%|██████▊ | 558000/818627 [01:03<00:31, 8257.09 examples/s]
+Filter: 68%|██████▊ | 558000/818627 [01:03<00:32, 8092.80 examples/s]
+Filter: 68%|██████▊ | 559000/818627 [01:03<00:28, 9171.70 examples/s]
+Filter: 68%|██████▊ | 560000/818627 [01:03<00:28, 9172.15 examples/s]
+Filter: 68%|██████▊ | 560000/818627 [01:03<00:27, 9317.47 examples/s]
+Filter: 68%|██████▊ | 560000/818627 [01:03<00:27, 9449.16 examples/s]
+Filter: 68%|██████▊ | 560000/818627 [01:03<00:28, 9145.89 examples/s]
+Filter: 68%|██████▊ | 559000/818627 [01:03<00:51, 5029.88 examples/s]
+Filter: 68%|██████▊ | 559000/818627 [01:03<00:53, 4822.28 examples/s]
+Filter: 68%|██████▊ | 559000/818627 [01:03<00:54, 4788.57 examples/s]
+Filter: 69%|██████▊ | 561000/818627 [01:03<00:25, 10226.85 examples/s]
+Filter: 69%|██████▊ | 561000/818627 [01:03<00:36, 7026.87 examples/s]
+Filter: 69%|██████▊ | 562000/818627 [01:03<00:27, 9251.31 examples/s]
+Filter: 69%|██████▊ | 562000/818627 [01:03<00:28, 9155.04 examples/s]
+Filter: 69%|██████▊ | 562000/818627 [01:03<00:26, 9547.48 examples/s]
+Filter: 69%|██████▊ | 562000/818627 [01:03<00:26, 9677.92 examples/s]
+Filter: 69%|██████▊ | 561000/818627 [01:03<00:38, 6775.02 examples/s]
+Filter: 69%|██████▊ | 561000/818627 [01:03<00:38, 6764.59 examples/s]
+Filter: 69%|██████▉ | 563000/818627 [01:03<00:28, 8950.22 examples/s]
+Filter: 69%|██████▉ | 563000/818627 [01:04<00:25, 9840.46 examples/s]
+Filter: 69%|██████▉ | 563000/818627 [01:03<00:29, 8661.31 examples/s]
+Filter: 69%|██████▉ | 563000/818627 [01:03<00:30, 8403.18 examples/s]
+Filter: 69%|██████▉ | 563000/818627 [01:03<00:30, 8400.12 examples/s]
+Filter: 69%|██████▉ | 564000/818627 [01:03<00:28, 8882.88 examples/s]
+Filter: 69%|██████▉ | 564000/818627 [01:03<00:28, 8955.03 examples/s]
+Filter: 69%|██████▉ | 564000/818627 [01:03<00:27, 9142.65 examples/s]
+Filter: 69%|██████▉ | 564000/818627 [01:03<00:27, 9327.38 examples/s]
+Filter: 69%|██████▉ | 565000/818627 [01:04<00:28, 8853.11 examples/s]
+Filter: 69%|██████▉ | 565000/818627 [01:04<00:28, 8944.76 examples/s]
+Filter: 69%|██████▉ | 565000/818627 [01:04<00:28, 8916.93 examples/s]
+Filter: 69%|██████▉ | 565000/818627 [01:04<00:27, 9290.19 examples/s]
+Filter: 69%|██████▉ | 565000/818627 [01:04<00:26, 9445.30 examples/s]
+Filter: 69%|██████▉ | 565000/818627 [01:04<00:27, 9260.41 examples/s]
+Filter: 69%|██████▉ | 565000/818627 [01:04<00:27, 9067.70 examples/s]
+Filter: 69%|██████▉ | 565000/818627 [01:04<00:27, 9213.68 examples/s]
+Filter: 69%|██████▉ | 566000/818627 [01:04<00:27, 9101.85 examples/s]
+Filter: 69%|██████▉ | 566000/818627 [01:04<00:27, 9118.37 examples/s]
+Filter: 69%|██████▉ | 566000/818627 [01:04<00:27, 9237.23 examples/s]
+Filter: 69%|██████▉ | 566000/818627 [01:04<00:26, 9357.24 examples/s]
+Filter: 69%|██████▉ | 567000/818627 [01:04<00:27, 9091.76 examples/s]
+Filter: 69%|██████▉ | 567000/818627 [01:04<00:27, 9073.20 examples/s]
+Filter: 69%|██████▉ | 567000/818627 [01:04<00:27, 9108.67 examples/s]
+Filter: 69%|██████▉ | 567000/818627 [01:04<00:26, 9444.99 examples/s]
+Filter: 69%|██████▉ | 567000/818627 [01:04<00:26, 9337.90 examples/s]
+Filter: 69%|██████▉ | 567000/818627 [01:04<00:27, 9182.23 examples/s]
+Filter: 69%|██████▉ | 567000/818627 [01:04<00:27, 9317.81 examples/s]
+Filter: 69%|██████▉ | 567000/818627 [01:04<00:27, 9272.59 examples/s]
+Filter: 69%|██████▉ | 568000/818627 [01:04<00:28, 8905.09 examples/s]
+Filter: 69%|██████▉ | 568000/818627 [01:04<00:27, 8983.03 examples/s]
+Filter: 69%|██████▉ | 568000/818627 [01:04<00:28, 8929.63 examples/s]
+Filter: 69%|██████▉ | 568000/818627 [01:04<00:27, 9255.05 examples/s]
+Filter: 69%|██████▉ | 568000/818627 [01:04<00:27, 8998.76 examples/s]
+Filter: 69%|██████▉ | 568000/818627 [01:04<00:27, 9015.70 examples/s]
+Filter: 70%|██████▉ | 569000/818627 [01:04<00:28, 8803.65 examples/s]
+Filter: 70%|██████▉ | 569000/818627 [01:04<00:28, 8830.91 examples/s]
+Filter: 70%|██████▉ | 569000/818627 [01:04<00:28, 8881.73 examples/s]
+Filter: 70%|██████▉ | 569000/818627 [01:04<00:27, 9042.94 examples/s]
+Filter: 70%|██████▉ | 569000/818627 [01:04<00:27, 9054.14 examples/s]
+Filter: 70%|██████▉ | 569000/818627 [01:04<00:27, 9095.33 examples/s]
+Filter: 70%|██████▉ | 569000/818627 [01:04<00:28, 8876.78 examples/s]
+Filter: 70%|██████▉ | 569000/818627 [01:04<00:27, 8934.31 examples/s]
+Filter: 70%|██████▉ | 570000/818627 [01:04<00:28, 8675.57 examples/s]
+Filter: 70%|██████▉ | 570000/818627 [01:04<00:28, 8702.17 examples/s]
+Filter: 70%|██████▉ | 570000/818627 [01:04<00:28, 8760.21 examples/s]
+Filter: 70%|██████▉ | 570000/818627 [01:04<00:27, 8929.96 examples/s]
+Filter: 70%|██████▉ | 570000/818627 [01:04<00:27, 8910.32 examples/s]
+Filter: 70%|██████▉ | 570000/818627 [01:04<00:27, 8918.83 examples/s]
+Filter: 70%|██████▉ | 570000/818627 [01:04<00:28, 8737.93 examples/s]
+Filter: 70%|██████▉ | 570000/818627 [01:04<00:28, 8776.08 examples/s]
+Filter: 70%|██████▉ | 571000/818627 [01:04<00:28, 8586.23 examples/s]
+Filter: 70%|██████▉ | 571000/818627 [01:04<00:28, 8605.61 examples/s]
+Filter: 70%|██████▉ | 571000/818627 [01:04<00:28, 8656.29 examples/s]
+Filter: 70%|██████▉ | 571000/818627 [01:05<00:28, 8783.05 examples/s]
+Filter: 70%|██████▉ | 571000/818627 [01:04<00:28, 8794.77 examples/s]
+Filter: 70%|██████▉ | 571000/818627 [01:04<00:28, 8629.89 examples/s]
+Filter: 70%|██████▉ | 571000/818627 [01:04<00:28, 8786.47 examples/s]
+Filter: 70%|██████▉ | 571000/818627 [01:04<00:28, 8659.76 examples/s]
+Filter: 70%|██████▉ | 572000/818627 [01:04<00:28, 8603.95 examples/s]
+Filter: 70%|██████▉ | 572000/818627 [01:04<00:28, 8620.10 examples/s]
+Filter: 70%|██████▉ | 572000/818627 [01:04<00:28, 8654.12 examples/s]
+Filter: 70%|██████▉ | 572000/818627 [01:05<00:28, 8747.05 examples/s]
+Filter: 70%|██████▉ | 572000/818627 [01:04<00:28, 8760.10 examples/s]
+Filter: 70%|██████▉ | 572000/818627 [01:04<00:28, 8754.68 examples/s]
+Filter: 70%|██████▉ | 572000/818627 [01:04<00:28, 8633.83 examples/s]
+Filter: 70%|██████▉ | 572000/818627 [01:04<00:28, 8658.77 examples/s]
+Filter: 70%|██████▉ | 573000/818627 [01:04<00:28, 8615.23 examples/s]
+Filter: 70%|██████▉ | 573000/818627 [01:04<00:28, 8625.67 examples/s]
+Filter: 70%|██████▉ | 573000/818627 [01:04<00:28, 8650.87 examples/s]
+Filter: 70%|██████▉ | 573000/818627 [01:05<00:28, 8717.17 examples/s]
+Filter: 70%|██████▉ | 573000/818627 [01:04<00:28, 8727.11 examples/s]
+Filter: 70%|██████▉ | 573000/818627 [01:05<00:28, 8730.68 examples/s]
+Filter: 70%|██████▉ | 573000/818627 [01:04<00:28, 8638.54 examples/s]
+Filter: 70%|██████▉ | 573000/818627 [01:04<00:28, 8652.41 examples/s]
+Filter: 70%|███████ | 574000/818627 [01:05<00:28, 8617.20 examples/s]
+Filter: 70%|███████ | 574000/818627 [01:05<00:28, 8685.44 examples/s]
+Filter: 70%|███████ | 574000/818627 [01:05<00:28, 8693.49 examples/s]
+Filter: 70%|███████ | 574000/818627 [01:05<00:28, 8593.86 examples/s]
+Filter: 70%|███████ | 574000/818627 [01:05<00:28, 8608.37 examples/s]
+Filter: 70%|███████ | 574000/818627 [01:05<00:28, 8602.04 examples/s]
+Filter: 70%|███████ | 574000/818627 [01:05<00:28, 8656.10 examples/s]
+Filter: 70%|███████ | 574000/818627 [01:05<00:28, 8591.81 examples/s]
+Filter: 70%|███████ | 575000/818627 [01:05<00:27, 8848.64 examples/s]
+Filter: 70%|███████ | 575000/818627 [01:05<00:27, 8845.36 examples/s]
+Filter: 70%|███████ | 575000/818627 [01:05<00:27, 8856.43 examples/s]
+Filter: 70%|███████ | 575000/818627 [01:05<00:27, 8885.64 examples/s]
+Filter: 70%|███████ | 575000/818627 [01:05<00:27, 8857.08 examples/s]
+Filter: 70%|███████ | 575000/818627 [01:05<00:27, 8883.76 examples/s]
+Filter: 70%|███████ | 575000/818627 [01:05<00:27, 8872.73 examples/s]
+Filter: 70%|███████ | 575000/818627 [01:05<00:27, 8890.61 examples/s]
+Filter: 70%|███████ | 576000/818627 [01:05<00:27, 8723.51 examples/s]
+Filter: 70%|███████ | 576000/818627 [01:05<00:27, 8721.85 examples/s]
+Filter: 70%|███████ | 576000/818627 [01:05<00:27, 8738.77 examples/s]
+Filter: 70%|███████ | 576000/818627 [01:05<00:27, 8755.55 examples/s]
+Filter: 70%|███████ | 576000/818627 [01:05<00:27, 8768.20 examples/s]
+Filter: 70%|███████ | 576000/818627 [01:05<00:27, 8733.89 examples/s]
+Filter: 70%|███████ | 576000/818627 [01:05<00:27, 8742.40 examples/s]
+Filter: 70%|███████ | 576000/818627 [01:05<00:27, 8751.49 examples/s]
+Filter: 70%|███████ | 577000/818627 [01:05<00:27, 8674.01 examples/s]
+Filter: 70%|███████ | 577000/818627 [01:05<00:27, 8675.07 examples/s]
+Filter: 70%|███████ | 577000/818627 [01:05<00:27, 8685.29 examples/s]
+Filter: 70%|███████ | 577000/818627 [01:05<00:27, 8696.20 examples/s]
+Filter: 70%|███████ | 577000/818627 [01:05<00:27, 8681.74 examples/s]
+Filter: 70%|███████ | 577000/818627 [01:05<00:27, 8706.23 examples/s]
+Filter: 70%|███████ | 577000/818627 [01:05<00:27, 8688.87 examples/s]
+Filter: 70%|███████ | 577000/818627 [01:05<00:27, 8700.37 examples/s]
+Filter: 71%|███████ | 578000/818627 [01:05<00:27, 8696.15 examples/s]
+Filter: 71%|███████ | 578000/818627 [01:05<00:27, 8693.34 examples/s]
+Filter: 71%|███████ | 578000/818627 [01:05<00:27, 8703.25 examples/s]
+Filter: 71%|███████ | 578000/818627 [01:05<00:27, 8713.06 examples/s]
+Filter: 71%|███████ | 578000/818627 [01:05<00:27, 8718.07 examples/s]
+Filter: 71%|███████ | 578000/818627 [01:05<00:27, 8717.89 examples/s]
+Filter: 71%|███████ | 578000/818627 [01:05<00:27, 8706.86 examples/s]
+Filter: 71%|███████ | 578000/818627 [01:05<00:27, 8698.38 examples/s]
+Filter: 71%|███████ | 579000/818627 [01:05<00:27, 8706.79 examples/s]
+Filter: 71%|███████ | 579000/818627 [01:05<00:27, 8714.86 examples/s]
+Filter: 71%|███████ | 579000/818627 [01:05<00:27, 8706.37 examples/s]
+Filter: 71%|███████ | 579000/818627 [01:05<00:27, 8717.09 examples/s]
+Filter: 71%|███████ | 579000/818627 [01:05<00:27, 8722.80 examples/s]
+Filter: 71%|███████ | 579000/818627 [01:05<00:27, 8720.83 examples/s]
+Filter: 71%|███████ | 579000/818627 [01:05<00:27, 8709.45 examples/s]
+Filter: 71%|███████ | 579000/818627 [01:05<00:27, 8711.14 examples/s]
+Filter: 71%|███████ | 580000/818627 [01:05<00:26, 9029.22 examples/s]
+Filter: 71%|███████ | 580000/818627 [01:05<00:26, 9027.78 examples/s]
+Filter: 71%|███████ | 580000/818627 [01:06<00:26, 9034.10 examples/s]
+Filter: 71%|███████ | 580000/818627 [01:05<00:26, 9030.82 examples/s]
+Filter: 71%|███████ | 580000/818627 [01:05<00:26, 9034.49 examples/s]
+Filter: 71%|███████ | 580000/818627 [01:05<00:26, 9031.13 examples/s]
+Filter: 71%|███████ | 580000/818627 [01:05<00:26, 9014.86 examples/s]
+Filter: 71%|███████ | 580000/818627 [01:05<00:26, 8965.21 examples/s]
+Filter: 71%|███████ | 581000/818627 [01:05<00:26, 9106.58 examples/s]
+Filter: 71%|███████ | 581000/818627 [01:05<00:26, 9086.96 examples/s]
+Filter: 71%|███████ | 581000/818627 [01:05<00:26, 9088.19 examples/s]
+Filter: 71%|███████ | 581000/818627 [01:05<00:26, 9093.38 examples/s]
+Filter: 71%|███████ | 581000/818627 [01:05<00:26, 9090.50 examples/s]
+Filter: 71%|███████ | 581000/818627 [01:05<00:26, 9090.24 examples/s]
+Filter: 71%|███████ | 581000/818627 [01:05<00:26, 9088.29 examples/s]
+Filter: 71%|███████ | 581000/818627 [01:06<00:26, 9025.25 examples/s]
+Filter: 71%|███████ | 582000/818627 [01:05<00:26, 8944.93 examples/s]
+Filter: 71%|███████ | 582000/818627 [01:05<00:26, 8936.87 examples/s]
+Filter: 71%|███████ | 582000/818627 [01:05<00:26, 8929.02 examples/s]
+Filter: 71%|███████ | 582000/818627 [01:06<00:26, 8956.64 examples/s]
+Filter: 71%|███████ | 582000/818627 [01:05<00:26, 8939.62 examples/s]
+Filter: 71%|███████ | 582000/818627 [01:06<00:26, 8938.21 examples/s]
+Filter: 71%|███████ | 582000/818627 [01:05<00:26, 8931.76 examples/s]
+Filter: 71%|███████ | 582000/818627 [01:05<00:26, 8942.44 examples/s]
+Filter: 71%|███████ | 583000/818627 [01:06<00:26, 8798.41 examples/s]
+Filter: 71%|███████ | 583000/818627 [01:06<00:26, 8787.76 examples/s]
+Filter: 71%|███████ | 583000/818627 [01:06<00:26, 8783.98 examples/s]
+Filter: 71%|███████ | 583000/818627 [01:06<00:26, 8792.26 examples/s]
+Filter: 71%|███████ | 583000/818627 [01:06<00:26, 8792.57 examples/s]
+Filter: 71%|███████ | 583000/818627 [01:06<00:26, 8798.15 examples/s]
+Filter: 71%|███████ | 583000/818627 [01:06<00:26, 8796.89 examples/s]
+Filter: 71%|███████ | 583000/818627 [01:06<00:26, 8789.20 examples/s]
+Filter: 71%|███████▏ | 584000/818627 [01:06<00:27, 8676.57 examples/s]
+Filter: 71%|███████▏ | 584000/818627 [01:06<00:27, 8669.63 examples/s]
+Filter: 71%|███████▏ | 584000/818627 [01:06<00:27, 8667.71 examples/s]
+Filter: 71%|███████▏ | 584000/818627 [01:06<00:27, 8680.84 examples/s]
+Filter: 71%|███████▏ | 584000/818627 [01:06<00:27, 8672.49 examples/s]
+Filter: 71%|███████▏ | 584000/818627 [01:06<00:27, 8671.58 examples/s]
+Filter: 71%|███████▏ | 584000/818627 [01:06<00:27, 8672.98 examples/s]
+Filter: 71%|███████▏ | 584000/818627 [01:06<00:27, 8674.26 examples/s]
+Filter: 71%|███████▏ | 585000/818627 [01:06<00:26, 8655.06 examples/s]
+Filter: 71%|███████▏ | 585000/818627 [01:06<00:27, 8650.12 examples/s]
+Filter: 71%|███████▏ | 585000/818627 [01:06<00:26, 8653.04 examples/s]
+Filter: 71%|███████▏ | 585000/818627 [01:06<00:26, 8659.07 examples/s]
+Filter: 71%|███████▏ | 585000/818627 [01:06<00:26, 8653.48 examples/s]
+Filter: 71%|███████▏ | 585000/818627 [01:06<00:27, 8652.45 examples/s]
+Filter: 71%|███████▏ | 585000/818627 [01:06<00:27, 8648.92 examples/s]
+Filter: 71%|███████▏ | 585000/818627 [01:06<00:27, 8651.34 examples/s]
+Filter: 72%|███████▏ | 586000/818627 [01:06<00:26, 8712.20 examples/s]
+Filter: 72%|███████▏ | 586000/818627 [01:06<00:26, 8709.21 examples/s]
+Filter: 72%|███████▏ | 586000/818627 [01:06<00:26, 8710.73 examples/s]
+Filter: 72%|███████▏ | 586000/818627 [01:06<00:26, 8714.87 examples/s]
+Filter: 72%|███████▏ | 586000/818627 [01:06<00:26, 8708.01 examples/s]
+Filter: 72%|███████▏ | 586000/818627 [01:06<00:26, 8706.06 examples/s]
+Filter: 72%|███████▏ | 586000/818627 [01:06<00:26, 8709.29 examples/s]
+Filter: 72%|███████▏ | 586000/818627 [01:06<00:26, 8704.17 examples/s]
+Filter: 72%|███████▏ | 587000/818627 [01:06<00:26, 8753.42 examples/s]
+Filter: 72%|███████▏ | 587000/818627 [01:06<00:26, 8754.52 examples/s]
+Filter: 72%|███████▏ | 587000/818627 [01:06<00:26, 8749.09 examples/s]
+Filter: 72%|███████▏ | 587000/818627 [01:06<00:26, 8755.00 examples/s]
+Filter: 72%|███████▏ | 587000/818627 [01:06<00:26, 8753.93 examples/s]
+Filter: 72%|███████▏ | 587000/818627 [01:06<00:26, 8753.94 examples/s]
+Filter: 72%|███████▏ | 587000/818627 [01:06<00:26, 8748.52 examples/s]
+Filter: 72%|███████▏ | 587000/818627 [01:06<00:26, 8748.08 examples/s]
+Filter: 72%|███████▏ | 588000/818627 [01:06<00:26, 8854.11 examples/s]
+Filter: 72%|███████▏ | 588000/818627 [01:06<00:26, 8854.10 examples/s]
+Filter: 72%|███████▏ | 588000/818627 [01:06<00:26, 8855.46 examples/s]
+Filter: 72%|███████▏ | 588000/818627 [01:06<00:26, 8854.87 examples/s]
+Filter: 72%|███████▏ | 588000/818627 [01:06<00:26, 8854.54 examples/s]
+Filter: 72%|███████▏ | 588000/818627 [01:06<00:26, 8855.36 examples/s]
+Filter: 72%|███████▏ | 588000/818627 [01:06<00:26, 8853.34 examples/s]
+Filter: 72%|███████▏ | 588000/818627 [01:06<00:26, 8851.01 examples/s]
+Filter: 72%|███████▏ | 589000/818627 [01:06<00:26, 8779.23 examples/s]
+Filter: 72%|███████▏ | 589000/818627 [01:06<00:26, 8778.72 examples/s]
+Filter: 72%|███████▏ | 589000/818627 [01:06<00:26, 8773.30 examples/s]
+Filter: 72%|███████▏ | 589000/818627 [01:07<00:26, 8778.75 examples/s]
+Filter: 72%|███████▏ | 589000/818627 [01:06<00:26, 8779.39 examples/s]
+Filter: 72%|███████▏ | 589000/818627 [01:06<00:26, 8778.56 examples/s]
+Filter: 72%|███████▏ | 589000/818627 [01:06<00:26, 8776.77 examples/s]
+Filter: 72%|███████▏ | 589000/818627 [01:06<00:26, 8717.22 examples/s]
+Filter: 72%|███████▏ | 590000/818627 [01:06<00:26, 8712.57 examples/s]
+Filter: 72%|███████▏ | 590000/818627 [01:06<00:26, 8712.61 examples/s]
+Filter: 72%|███████▏ | 590000/818627 [01:06<00:26, 8716.98 examples/s]
+Filter: 72%|███████▏ | 590000/818627 [01:07<00:26, 8714.78 examples/s]
+Filter: 72%|███████▏ | 590000/818627 [01:06<00:26, 8713.34 examples/s]
+Filter: 72%|███████▏ | 590000/818627 [01:06<00:26, 8713.88 examples/s]
+Filter: 72%|███████▏ | 590000/818627 [01:06<00:26, 8711.76 examples/s]
+Filter: 72%|███████▏ | 590000/818627 [01:06<00:26, 8730.17 examples/s]
+Filter: 72%|███████▏ | 591000/818627 [01:06<00:26, 8652.09 examples/s]
+Filter: 72%|███████▏ | 591000/818627 [01:06<00:26, 8649.37 examples/s]
+Filter: 72%|███████▏ | 591000/818627 [01:06<00:26, 8650.89 examples/s]
+Filter: 72%|███████▏ | 591000/818627 [01:07<00:26, 8651.76 examples/s]
+Filter: 72%|███████▏ | 591000/818627 [01:06<00:26, 8650.62 examples/s]
+Filter: 72%|███████▏ | 591000/818627 [01:06<00:26, 8648.06 examples/s]
+Filter: 72%|███████▏ | 591000/818627 [01:07<00:26, 8649.51 examples/s]
+Filter: 72%|███████▏ | 591000/818627 [01:06<00:26, 8663.01 examples/s]
+Filter: 72%|███████▏ | 592000/818627 [01:07<00:26, 8629.93 examples/s]
+Filter: 72%|███████▏ | 592000/818627 [01:07<00:26, 8628.04 examples/s]
+Filter: 72%|███████▏ | 592000/818627 [01:07<00:26, 8628.71 examples/s]
+Filter: 72%|███████▏ | 592000/818627 [01:07<00:26, 8629.08 examples/s]
+Filter: 72%|███████▏ | 592000/818627 [01:07<00:26, 8629.59 examples/s]
+Filter: 72%|███████▏ | 592000/818627 [01:07<00:26, 8628.09 examples/s]
+Filter: 72%|███████▏ | 592000/818627 [01:07<00:26, 8629.37 examples/s]
+Filter: 72%|███████▏ | 592000/818627 [01:07<00:26, 8636.31 examples/s]
+Filter: 72%|███████▏ | 593000/818627 [01:07<00:26, 8677.14 examples/s]
+Filter: 72%|███████▏ | 593000/818627 [01:07<00:25, 8680.48 examples/s]
+Filter: 72%|███████▏ | 593000/818627 [01:07<00:26, 8677.63 examples/s]
+Filter: 72%|███████▏ | 593000/818627 [01:07<00:25, 8680.75 examples/s]
+Filter: 72%|███████▏ | 593000/818627 [01:07<00:25, 8679.25 examples/s]
+Filter: 72%|███████▏ | 593000/818627 [01:07<00:25, 8687.26 examples/s]
+Filter: 72%|███████▏ | 593000/818627 [01:07<00:25, 8678.18 examples/s]
+Filter: 72%|███████▏ | 593000/818627 [01:07<00:26, 8628.92 examples/s]
+Filter: 73%|███████▎ | 594000/818627 [01:07<00:25, 8657.33 examples/s]
+Filter: 73%|███████▎ | 594000/818627 [01:07<00:25, 8673.07 examples/s]
+Filter: 73%|███████▎ | 594000/818627 [01:07<00:25, 8660.71 examples/s]
+Filter: 73%|███████▎ | 594000/818627 [01:07<00:25, 8664.53 examples/s]
+Filter: 73%|███████▎ | 594000/818627 [01:07<00:25, 8663.44 examples/s]
+Filter: 73%|███████▎ | 594000/818627 [01:07<00:25, 8665.37 examples/s]
+Filter: 73%|███████▎ | 594000/818627 [01:07<00:25, 8658.95 examples/s]
+Filter: 73%|███████▎ | 594000/818627 [01:07<00:25, 8661.93 examples/s]
+Filter: 73%|███████▎ | 595000/818627 [01:07<00:25, 8794.31 examples/s]
+Filter: 73%|███████▎ | 595000/818627 [01:07<00:25, 8805.39 examples/s]
+Filter: 73%|███████▎ | 595000/818627 [01:07<00:25, 8793.77 examples/s]
+Filter: 73%|███████▎ | 595000/818627 [01:07<00:25, 8795.08 examples/s]
+Filter: 73%|███████▎ | 595000/818627 [01:07<00:25, 8794.31 examples/s]
+Filter: 73%|███████▎ | 595000/818627 [01:07<00:25, 8795.17 examples/s]
+Filter: 73%|███████▎ | 595000/818627 [01:07<00:25, 8792.06 examples/s]
+Filter: 73%|███████▎ | 595000/818627 [01:07<00:25, 8794.23 examples/s]
+Filter: 73%|███████▎ | 596000/818627 [01:07<00:25, 8688.37 examples/s]
+Filter: 73%|███████▎ | 596000/818627 [01:07<00:25, 8697.18 examples/s]
+Filter: 73%|███████▎ | 596000/818627 [01:07<00:25, 8687.24 examples/s]
+Filter: 73%|███████▎ | 596000/818627 [01:07<00:25, 8687.58 examples/s]
+Filter: 73%|███████▎ | 596000/818627 [01:07<00:25, 8689.93 examples/s]
+Filter: 73%|███████▎ | 596000/818627 [01:07<00:25, 8689.03 examples/s]
+Filter: 73%|███████▎ | 596000/818627 [01:07<00:25, 8685.56 examples/s]
+Filter: 73%|███████▎ | 596000/818627 [01:07<00:25, 8687.33 examples/s]
+Filter: 73%|███████▎ | 597000/818627 [01:07<00:25, 8647.06 examples/s]
+Filter: 73%|███████▎ | 597000/818627 [01:07<00:25, 8651.65 examples/s]
+Filter: 73%|███████▎ | 597000/818627 [01:07<00:25, 8648.88 examples/s]
+Filter: 73%|███████▎ | 597000/818627 [01:07<00:25, 8646.38 examples/s]
+Filter: 73%|███████▎ | 597000/818627 [01:07<00:25, 8651.26 examples/s]
+Filter: 73%|███████▎ | 597000/818627 [01:07<00:25, 8646.99 examples/s]
+Filter: 73%|███████▎ | 597000/818627 [01:07<00:25, 8645.38 examples/s]
+Filter: 73%|███████▎ | 597000/818627 [01:07<00:25, 8650.33 examples/s]
+Filter: 73%|███████▎ | 598000/818627 [01:07<00:25, 8577.29 examples/s]
+Filter: 73%|███████▎ | 598000/818627 [01:07<00:25, 8579.76 examples/s]
+Filter: 73%|███████▎ | 598000/818627 [01:07<00:25, 8576.14 examples/s]
+Filter: 73%|███████▎ | 598000/818627 [01:07<00:25, 8576.75 examples/s]
+Filter: 73%|███████▎ | 598000/818627 [01:07<00:25, 8575.38 examples/s]
+Filter: 73%|███████▎ | 598000/818627 [01:07<00:25, 8577.58 examples/s]
+Filter: 73%|███████▎ | 598000/818627 [01:07<00:25, 8571.24 examples/s]
+Filter: 73%|███████▎ | 598000/818627 [01:08<00:26, 8454.88 examples/s]
+Filter: 73%|███████▎ | 599000/818627 [01:07<00:25, 8565.49 examples/s]
+Filter: 73%|███████▎ | 599000/818627 [01:07<00:25, 8560.61 examples/s]
+Filter: 73%|███████▎ | 599000/818627 [01:08<00:25, 8601.29 examples/s]
+Filter: 73%|███████▎ | 599000/818627 [01:07<00:25, 8555.57 examples/s]
+Filter: 73%|███████▎ | 599000/818627 [01:07<00:25, 8564.04 examples/s]
+Filter: 73%|███████▎ | 599000/818627 [01:07<00:25, 8561.72 examples/s]
+Filter: 73%|███████▎ | 599000/818627 [01:07<00:25, 8566.02 examples/s]
+Filter: 73%|███████▎ | 599000/818627 [01:08<00:25, 8560.08 examples/s]
+Filter: 73%|███████▎ | 600000/818627 [01:08<00:25, 8641.53 examples/s]
+Filter: 73%|███████▎ | 600000/818627 [01:08<00:25, 8640.97 examples/s]
+Filter: 73%|███████▎ | 600000/818627 [01:08<00:25, 8639.66 examples/s]
+Filter: 73%|███████▎ | 600000/818627 [01:08<00:25, 8664.20 examples/s]
+Filter: 73%|███████▎ | 600000/818627 [01:08<00:25, 8640.06 examples/s]
+Filter: 73%|███████▎ | 600000/818627 [01:08<00:25, 8638.80 examples/s]
+Filter: 73%|███████▎ | 600000/818627 [01:08<00:25, 8638.76 examples/s]
+Filter: 73%|███████▎ | 600000/818627 [01:08<00:25, 8641.37 examples/s]
+Filter: 73%|███████▎ | 601000/818627 [01:08<00:24, 8999.80 examples/s]
+Filter: 73%|███████▎ | 601000/818627 [01:08<00:24, 8998.16 examples/s]
+Filter: 73%|███████▎ | 601000/818627 [01:08<00:24, 8995.68 examples/s]
+Filter: 73%|███████▎ | 601000/818627 [01:08<00:24, 9015.54 examples/s]
+Filter: 73%|███████▎ | 601000/818627 [01:08<00:24, 8997.81 examples/s]
+Filter: 73%|███████▎ | 601000/818627 [01:08<00:24, 8997.27 examples/s]
+Filter: 73%|███████▎ | 601000/818627 [01:08<00:24, 8994.86 examples/s]
+Filter: 73%|███████▎ | 601000/818627 [01:08<00:24, 8997.21 examples/s]
+Filter: 74%|███████▎ | 602000/818627 [01:08<00:23, 9051.26 examples/s]
+Filter: 74%|███████▎ | 602000/818627 [01:08<00:23, 9048.87 examples/s]
+Filter: 74%|███████▎ | 602000/818627 [01:08<00:23, 9042.85 examples/s]
+Filter: 74%|███████▎ | 602000/818627 [01:08<00:23, 9059.08 examples/s]
+Filter: 74%|███████▎ | 602000/818627 [01:08<00:23, 9051.28 examples/s]
+Filter: 74%|███████▎ | 602000/818627 [01:08<00:23, 9050.82 examples/s]
+Filter: 74%|███████▎ | 602000/818627 [01:08<00:23, 9051.02 examples/s]
+Filter: 74%|███████▎ | 602000/818627 [01:08<00:23, 9048.65 examples/s]
+Filter: 74%|███████▎ | 603000/818627 [01:08<00:24, 8913.63 examples/s]
+Filter: 74%|███████▎ | 603000/818627 [01:08<00:24, 8914.81 examples/s]
+Filter: 74%|███████▎ | 603000/818627 [01:08<00:24, 8912.06 examples/s]
+Filter: 74%|███████▎ | 603000/818627 [01:08<00:24, 8923.04 examples/s]
+Filter: 74%|███████▎ | 603000/818627 [01:08<00:24, 8913.70 examples/s]
+Filter: 74%|███████▎ | 603000/818627 [01:08<00:24, 8915.05 examples/s]
+Filter: 74%|███████▎ | 603000/818627 [01:08<00:24, 8913.29 examples/s]
+Filter: 74%|███████▎ | 603000/818627 [01:08<00:24, 8905.87 examples/s]
+Filter: 74%|███████▍ | 604000/818627 [01:08<00:24, 8816.95 examples/s]
+Filter: 74%|███████▍ | 604000/818627 [01:08<00:24, 8814.05 examples/s]
+Filter: 74%|███████▍ | 604000/818627 [01:08<00:24, 8814.17 examples/s]
+Filter: 74%|███████▍ | 604000/818627 [01:08<00:24, 8816.63 examples/s]
+Filter: 74%|███████▍ | 604000/818627 [01:08<00:24, 8819.11 examples/s]
+Filter: 74%|███████▍ | 604000/818627 [01:08<00:24, 8816.99 examples/s]
+Filter: 74%|███████▍ | 604000/818627 [01:08<00:24, 8816.02 examples/s]
+Filter: 74%|███████▍ | 604000/818627 [01:08<00:24, 8818.51 examples/s]
+Filter: 74%|███████▍ | 605000/818627 [01:08<00:24, 8738.61 examples/s]
+Filter: 74%|███████▍ | 605000/818627 [01:08<00:24, 8739.33 examples/s]
+Filter: 74%|███████▍ | 605000/818627 [01:08<00:24, 8739.99 examples/s]
+Filter: 74%|███████▍ | 605000/818627 [01:08<00:24, 8741.11 examples/s]
+Filter: 74%|███████▍ | 605000/818627 [01:08<00:24, 8740.07 examples/s]
+Filter: 74%|███████▍ | 605000/818627 [01:08<00:24, 8738.64 examples/s]
+Filter: 74%|███████▍ | 605000/818627 [01:08<00:24, 8738.49 examples/s]
+Filter: 74%|███████▍ | 605000/818627 [01:08<00:24, 8741.00 examples/s]
+Filter: 74%|███████▍ | 606000/818627 [01:08<00:24, 8733.73 examples/s]
+Filter: 74%|███████▍ | 606000/818627 [01:08<00:24, 8732.63 examples/s]
+Filter: 74%|███████▍ | 606000/818627 [01:09<00:24, 8744.01 examples/s]
+Filter: 74%|███████▍ | 606000/818627 [01:08<00:24, 8738.49 examples/s]
+Filter: 74%|███████▍ | 606000/818627 [01:08<00:24, 8737.04 examples/s]
+Filter: 74%|███████▍ | 606000/818627 [01:08<00:24, 8732.45 examples/s]
+Filter: 74%|███████▍ | 606000/818627 [01:08<00:24, 8734.96 examples/s]
+Filter: 74%|███████▍ | 606000/818627 [01:08<00:24, 8654.21 examples/s]
+Filter: 74%|███████▍ | 607000/818627 [01:08<00:23, 9040.63 examples/s]
+Filter: 74%|███████▍ | 607000/818627 [01:08<00:23, 9041.44 examples/s]
+Filter: 74%|███████▍ | 607000/818627 [01:09<00:23, 9043.71 examples/s]
+Filter: 74%|███████▍ | 607000/818627 [01:08<00:23, 9038.41 examples/s]
+Filter: 74%|███████▍ | 607000/818627 [01:08<00:23, 9039.56 examples/s]
+Filter: 74%|███████▍ | 607000/818627 [01:08<00:23, 9039.89 examples/s]
+Filter: 74%|███████▍ | 607000/818627 [01:08<00:23, 8978.64 examples/s]
+Filter: 74%|███████▍ | 608000/818627 [01:08<00:23, 9043.76 examples/s]
+Filter: 74%|███████▍ | 608000/818627 [01:08<00:23, 9045.50 examples/s]
+Filter: 74%|███████▍ | 608000/818627 [01:08<00:23, 9063.40 examples/s]
+Filter: 74%|███████▍ | 608000/818627 [01:09<00:23, 9042.22 examples/s]
+Filter: 74%|███████▍ | 608000/818627 [01:09<00:23, 9042.85 examples/s]
+Filter: 74%|███████▍ | 608000/818627 [01:08<00:23, 9040.94 examples/s]
+Filter: 74%|███████▍ | 608000/818627 [01:08<00:23, 9061.20 examples/s]
+Filter: 74%|███████▍ | 608000/818627 [01:08<00:23, 9042.71 examples/s]
+Filter: 74%|███████▍ | 609000/818627 [01:09<00:23, 9086.29 examples/s]
+Filter: 74%|███████▍ | 609000/818627 [01:09<00:23, 9086.94 examples/s]
+Filter: 74%|███████▍ | 609000/818627 [01:09<00:23, 9095.35 examples/s]
+Filter: 74%|███████▍ | 609000/818627 [01:09<00:23, 9091.10 examples/s]
+Filter: 74%|███████▍ | 609000/818627 [01:09<00:23, 9090.66 examples/s]
+Filter: 74%|███████▍ | 609000/818627 [01:09<00:23, 9101.47 examples/s]
+Filter: 74%|███████▍ | 609000/818627 [01:09<00:23, 9086.36 examples/s]
+Filter: 74%|███████▍ | 609000/818627 [01:09<00:23, 9086.62 examples/s]
+Filter: 75%|███████▍ | 610000/818627 [01:09<00:23, 8931.26 examples/s]
+Filter: 75%|███████▍ | 610000/818627 [01:09<00:23, 8956.56 examples/s]
+Filter: 75%|███████▍ | 610000/818627 [01:09<00:23, 8935.09 examples/s]
+Filter: 75%|███████▍ | 610000/818627 [01:09<00:23, 8931.88 examples/s]
+Filter: 75%|███████▍ | 610000/818627 [01:09<00:23, 8938.93 examples/s]
+Filter: 75%|███████▍ | 610000/818627 [01:09<00:23, 8931.20 examples/s]
+Filter: 75%|███████▍ | 610000/818627 [01:09<00:23, 8905.99 examples/s]
+Filter: 75%|███████▍ | 610000/818627 [01:09<00:23, 8828.83 examples/s]
+Filter: 75%|███████▍ | 611000/818627 [01:09<00:23, 8827.67 examples/s]
+Filter: 75%|███████▍ | 611000/818627 [01:09<00:23, 8836.66 examples/s]
+Filter: 75%|███████▍ | 611000/818627 [01:09<00:23, 8852.69 examples/s]
+Filter: 75%|███████▍ | 611000/818627 [01:09<00:23, 8829.36 examples/s]
+Filter: 75%|███████▍ | 611000/818627 [01:09<00:23, 8835.35 examples/s]
+Filter: 75%|███████▍ | 611000/818627 [01:09<00:23, 8825.03 examples/s]
+Filter: 75%|███████▍ | 611000/818627 [01:09<00:23, 8829.50 examples/s]
+Filter: 75%|███████▍ | 611000/818627 [01:09<00:23, 8851.83 examples/s]
+Filter: 75%|███████▍ | 612000/818627 [01:09<00:23, 8769.76 examples/s]
+Filter: 75%|███████▍ | 612000/818627 [01:09<00:23, 8775.44 examples/s]
+Filter: 75%|███████▍ | 612000/818627 [01:09<00:23, 8794.98 examples/s]
+Filter: 75%|███████▍ | 612000/818627 [01:09<00:23, 8768.32 examples/s]
+Filter: 75%|███████▍ | 612000/818627 [01:09<00:23, 8770.80 examples/s]
+Filter: 75%|███████▍ | 612000/818627 [01:09<00:23, 8793.09 examples/s]
+Filter: 75%|███████▍ | 612000/818627 [01:09<00:23, 8774.61 examples/s]
+Filter: 75%|███████▍ | 612000/818627 [01:09<00:23, 8764.69 examples/s]
+Filter: 75%|███████▍ | 613000/818627 [01:09<00:23, 8740.31 examples/s]
+Filter: 75%|███████▍ | 613000/818627 [01:09<00:23, 8732.62 examples/s]
+Filter: 75%|███████▍ | 613000/818627 [01:09<00:23, 8754.06 examples/s]
+Filter: 75%|███████▍ | 613000/818627 [01:09<00:23, 8736.19 examples/s]
+Filter: 75%|███████▍ | 613000/818627 [01:09<00:23, 8735.05 examples/s]
+Filter: 75%|███████▍ | 613000/818627 [01:09<00:23, 8736.30 examples/s]
+Filter: 75%|███████▍ | 613000/818627 [01:09<00:23, 8747.94 examples/s]
+Filter: 75%|███████▍ | 613000/818627 [01:09<00:23, 8734.83 examples/s]
+Filter: 75%|███████▌ | 614000/818627 [01:09<00:24, 8432.68 examples/s]
+Filter: 75%|███████▌ | 614000/818627 [01:09<00:24, 8431.43 examples/s]
+Filter: 75%|███████▌ | 614000/818627 [01:09<00:24, 8454.32 examples/s]
+Filter: 75%|███████▌ | 614000/818627 [01:09<00:24, 8431.80 examples/s]
+Filter: 75%|███████▌ | 614000/818627 [01:09<00:24, 8443.53 examples/s]
+Filter: 75%|███████▌ | 614000/818627 [01:09<00:24, 8431.29 examples/s]
+Filter: 75%|███████▌ | 614000/818627 [01:09<00:24, 8431.81 examples/s]
+Filter: 75%|███████▌ | 614000/818627 [01:09<00:24, 8433.35 examples/s]
+Filter: 75%|███████▌ | 615000/818627 [01:09<00:24, 8464.28 examples/s]
+Filter: 75%|███████▌ | 615000/818627 [01:09<00:24, 8459.98 examples/s]
+Filter: 75%|███████▌ | 615000/818627 [01:09<00:24, 8477.39 examples/s]
+Filter: 75%|███████▌ | 615000/818627 [01:10<00:24, 8464.28 examples/s]
+Filter: 75%|███████▌ | 615000/818627 [01:09<00:24, 8470.73 examples/s]
+Filter: 75%|███████▌ | 615000/818627 [01:09<00:24, 8463.55 examples/s]
+Filter: 75%|███████▌ | 615000/818627 [01:09<00:24, 8459.80 examples/s]
+Filter: 75%|███████▌ | 615000/818627 [01:09<00:24, 8463.52 examples/s]
+Filter: 75%|███████▌ | 616000/818627 [01:09<00:23, 8509.52 examples/s]
+Filter: 75%|███████▌ | 616000/818627 [01:09<00:23, 8509.82 examples/s]
+Filter: 75%|███████▌ | 616000/818627 [01:09<00:23, 8519.29 examples/s]
+Filter: 75%|███████▌ | 616000/818627 [01:09<00:23, 8514.52 examples/s]
+Filter: 75%|███████▌ | 616000/818627 [01:10<00:23, 8503.94 examples/s]
+Filter: 75%|███████▌ | 616000/818627 [01:09<00:23, 8509.48 examples/s]
+Filter: 75%|███████▌ | 616000/818627 [01:09<00:23, 8507.93 examples/s]
+Filter: 75%|███████▌ | 616000/818627 [01:09<00:23, 8509.73 examples/s]
+Filter: 75%|███████▌ | 617000/818627 [01:09<00:23, 8635.35 examples/s]
+Filter: 75%|███████▌ | 617000/818627 [01:09<00:23, 8632.47 examples/s]
+Filter: 75%|███████▌ | 617000/818627 [01:09<00:23, 8640.53 examples/s]
+Filter: 75%|███████▌ | 617000/818627 [01:10<00:23, 8632.02 examples/s]
+Filter: 75%|███████▌ | 617000/818627 [01:09<00:23, 8632.13 examples/s]
+Filter: 75%|███████▌ | 617000/818627 [01:10<00:23, 8632.53 examples/s]
+Filter: 75%|███████▌ | 617000/818627 [01:09<00:23, 8630.75 examples/s]
+Filter: 75%|███████▌ | 617000/818627 [01:09<00:23, 8632.75 examples/s]
+Filter: 75%|███████▌ | 618000/818627 [01:10<00:22, 8818.33 examples/s]
+Filter: 75%|███████▌ | 618000/818627 [01:10<00:22, 8823.72 examples/s]
+Filter: 75%|███████▌ | 618000/818627 [01:10<00:22, 8816.59 examples/s]
+Filter: 75%|███████▌ | 618000/818627 [01:10<00:22, 8821.19 examples/s]
+Filter: 75%|███████▌ | 618000/818627 [01:10<00:22, 8823.45 examples/s]
+Filter: 75%|███████▌ | 618000/818627 [01:10<00:22, 8820.75 examples/s]
+Filter: 75%|███████▌ | 618000/818627 [01:10<00:22, 8817.56 examples/s]
+Filter: 75%|███████▌ | 618000/818627 [01:10<00:22, 8817.78 examples/s]
+Filter: 76%|███████▌ | 619000/818627 [01:10<00:22, 8986.55 examples/s]
+Filter: 76%|███████▌ | 619000/818627 [01:10<00:22, 8986.09 examples/s]
+Filter: 76%|███████▌ | 619000/818627 [01:10<00:22, 8986.34 examples/s]
+Filter: 76%|███████▌ | 619000/818627 [01:10<00:22, 8988.42 examples/s]
+Filter: 76%|███████▌ | 619000/818627 [01:10<00:22, 8986.40 examples/s]
+Filter: 76%|███████▌ | 619000/818627 [01:10<00:22, 8988.89 examples/s]
+Filter: 76%|███████▌ | 619000/818627 [01:10<00:22, 8986.57 examples/s]
+Filter: 76%|███████▌ | 619000/818627 [01:10<00:22, 8985.77 examples/s]
+Filter: 76%|███████▌ | 620000/818627 [01:10<00:22, 8865.97 examples/s]
+Filter: 76%|███████▌ | 620000/818627 [01:10<00:22, 8865.19 examples/s]
+Filter: 76%|███████▌ | 620000/818627 [01:10<00:22, 8863.02 examples/s]
+Filter: 76%|███████▌ | 620000/818627 [01:10<00:22, 8866.00 examples/s]
+Filter: 76%|███████▌ | 620000/818627 [01:10<00:22, 8859.12 examples/s]
+Filter: 76%|███████▌ | 620000/818627 [01:10<00:22, 8863.29 examples/s]
+Filter: 76%|███████▌ | 620000/818627 [01:10<00:22, 8860.73 examples/s]
+Filter: 76%|███████▌ | 620000/818627 [01:10<00:22, 8862.99 examples/s]
+Filter: 76%|███████▌ | 621000/818627 [01:10<00:22, 8763.26 examples/s]
+Filter: 76%|███████▌ | 621000/818627 [01:10<00:22, 8754.65 examples/s]
+Filter: 76%|███████▌ | 621000/818627 [01:10<00:22, 8760.12 examples/s]
+Filter: 76%|███████▌ | 621000/818627 [01:10<00:22, 8753.35 examples/s]
+Filter: 76%|███████▌ | 621000/818627 [01:10<00:22, 8755.65 examples/s]
+Filter: 76%|███████▌ | 621000/818627 [01:10<00:22, 8740.11 examples/s]
+Filter: 76%|███████▌ | 621000/818627 [01:10<00:22, 8743.50 examples/s]
+Filter: 76%|███████▌ | 621000/818627 [01:10<00:22, 8719.51 examples/s]
+Filter: 76%|███████▌ | 622000/818627 [01:10<00:21, 9088.29 examples/s]
+Filter: 76%|███████▌ | 622000/818627 [01:10<00:21, 9090.08 examples/s]
+Filter: 76%|███████▌ | 622000/818627 [01:10<00:21, 9089.14 examples/s]
+Filter: 76%|███████▌ | 622000/818627 [01:10<00:21, 9086.48 examples/s]
+Filter: 76%|███████▌ | 622000/818627 [01:10<00:21, 9084.84 examples/s]
+Filter: 76%|███████▌ | 623000/818627 [01:10<00:21, 9006.84 examples/s]
+Filter: 76%|███████▌ | 623000/818627 [01:10<00:21, 9010.81 examples/s]
+Filter: 76%|███████▌ | 623000/818627 [01:10<00:21, 9031.34 examples/s]
+Filter: 76%|███████▌ | 623000/818627 [01:10<00:21, 9006.51 examples/s]
+Filter: 76%|███████▌ | 623000/818627 [01:10<00:21, 9034.90 examples/s]
+Filter: 76%|███████▌ | 623000/818627 [01:10<00:21, 9002.79 examples/s]
+Filter: 76%|███████▌ | 623000/818627 [01:10<00:21, 9000.29 examples/s]
+Filter: 76%|███████▌ | 623000/818627 [01:10<00:21, 8977.84 examples/s]
+Filter: 76%|███████▌ | 624000/818627 [01:10<00:21, 8858.47 examples/s]
+Filter: 76%|███████▌ | 624000/818627 [01:10<00:21, 8852.87 examples/s]
+Filter: 76%|███████▌ | 624000/818627 [01:10<00:21, 8858.79 examples/s]
+Filter: 76%|███████▌ | 624000/818627 [01:10<00:21, 8857.56 examples/s]
+Filter: 76%|███████▌ | 624000/818627 [01:11<00:21, 8892.31 examples/s]
+Filter: 76%|███████▌ | 624000/818627 [01:10<00:21, 8902.52 examples/s]
+Filter: 76%|███████▌ | 624000/818627 [01:10<00:21, 8902.68 examples/s]
+Filter: 76%|███████▌ | 624000/818627 [01:10<00:21, 8849.32 examples/s]
+Filter: 76%|███████▋ | 625000/818627 [01:10<00:22, 8767.24 examples/s]
+Filter: 76%|███████▋ | 625000/818627 [01:10<00:22, 8767.14 examples/s]
+Filter: 76%|███████▋ | 625000/818627 [01:10<00:21, 8826.64 examples/s]
+Filter: 76%|███████▋ | 625000/818627 [01:11<00:21, 8813.17 examples/s]
+Filter: 76%|███████▋ | 625000/818627 [01:10<00:22, 8772.62 examples/s]
+Filter: 76%|███████▋ | 625000/818627 [01:10<00:22, 8774.29 examples/s]
+Filter: 76%|███████▋ | 625000/818627 [01:10<00:22, 8770.77 examples/s]
+Filter: 76%|███████▋ | 625000/818627 [01:10<00:21, 8815.59 examples/s]
+Filter: 76%|███████▋ | 626000/818627 [01:10<00:21, 8964.05 examples/s]
+Filter: 76%|███████▋ | 626000/818627 [01:10<00:21, 8963.91 examples/s]
+Filter: 76%|███████▋ | 626000/818627 [01:10<00:21, 8988.62 examples/s]
+Filter: 76%|███████▋ | 626000/818627 [01:11<00:21, 8979.39 examples/s]
+Filter: 76%|███████▋ | 626000/818627 [01:11<00:21, 8968.68 examples/s]
+Filter: 76%|███████▋ | 626000/818627 [01:10<00:21, 8968.29 examples/s]
+Filter: 76%|███████▋ | 626000/818627 [01:10<00:21, 8966.12 examples/s]
+Filter: 76%|███████▋ | 626000/818627 [01:10<00:21, 8980.22 examples/s]
+Filter: 77%|███████▋ | 627000/818627 [01:11<00:21, 8827.45 examples/s]
+Filter: 77%|███████▋ | 627000/818627 [01:11<00:21, 8828.09 examples/s]
+Filter: 77%|███████▋ | 627000/818627 [01:11<00:21, 8852.50 examples/s]
+Filter: 77%|███████▋ | 627000/818627 [01:11<00:21, 8846.13 examples/s]
+Filter: 77%|███████▋ | 627000/818627 [01:11<00:21, 8828.55 examples/s]
+Filter: 77%|███████▋ | 627000/818627 [01:11<00:21, 8824.37 examples/s]
+Filter: 77%|███████▋ | 627000/818627 [01:11<00:21, 8846.07 examples/s]
+Filter: 77%|███████▋ | 627000/818627 [01:11<00:21, 8816.66 examples/s]
+Filter: 77%|███████▋ | 628000/818627 [01:11<00:21, 8697.90 examples/s]
+Filter: 77%|███████▋ | 628000/818627 [01:11<00:21, 8696.77 examples/s]
+Filter: 77%|███████▋ | 628000/818627 [01:11<00:21, 8724.47 examples/s]
+Filter: 77%|███████▋ | 628000/818627 [01:11<00:21, 8720.62 examples/s]
+Filter: 77%|███████▋ | 628000/818627 [01:11<00:21, 8702.76 examples/s]
+Filter: 77%|███████▋ | 628000/818627 [01:11<00:21, 8704.24 examples/s]
+Filter: 77%|███████▋ | 628000/818627 [01:11<00:21, 8700.76 examples/s]
+Filter: 77%|███████▋ | 628000/818627 [01:11<00:21, 8719.48 examples/s]
+Filter: 77%|███████▋ | 629000/818627 [01:11<00:21, 8639.24 examples/s]
+Filter: 77%|███████▋ | 629000/818627 [01:11<00:21, 8641.86 examples/s]
+Filter: 77%|███████▋ | 629000/818627 [01:11<00:21, 8658.71 examples/s]
+Filter: 77%|███████▋ | 629000/818627 [01:11<00:21, 8651.43 examples/s]
+Filter: 77%|███████▋ | 629000/818627 [01:11<00:21, 8639.39 examples/s]
+Filter: 77%|███████▋ | 629000/818627 [01:11<00:21, 8638.59 examples/s]
+Filter: 77%|███████▋ | 629000/818627 [01:11<00:21, 8639.42 examples/s]
+Filter: 77%|███████▋ | 629000/818627 [01:11<00:21, 8647.51 examples/s]
+Filter: 77%|███████▋ | 630000/818627 [01:11<00:21, 8631.85 examples/s]
+Filter: 77%|███████▋ | 630000/818627 [01:11<00:21, 8632.26 examples/s]
+Filter: 77%|███████▋ | 630000/818627 [01:11<00:21, 8649.40 examples/s]
+Filter: 77%|███████▋ | 630000/818627 [01:11<00:21, 8648.71 examples/s]
+Filter: 77%|███████▋ | 630000/818627 [01:11<00:21, 8636.97 examples/s]
+Filter: 77%|███████▋ | 630000/818627 [01:11<00:21, 8637.67 examples/s]
+Filter: 77%|███████▋ | 630000/818627 [01:11<00:21, 8633.17 examples/s]
+Filter: 77%|███████▋ | 630000/818627 [01:11<00:21, 8642.87 examples/s]
+Filter: 77%|███████▋ | 631000/818627 [01:11<00:21, 8733.02 examples/s]
+Filter: 77%|███████▋ | 631000/818627 [01:11<00:21, 8742.23 examples/s]
+Filter: 77%|███████▋ | 631000/818627 [01:11<00:21, 8738.20 examples/s]
+Filter: 77%|███████▋ | 631000/818627 [01:11<00:21, 8733.23 examples/s]
+Filter: 77%|███████▋ | 631000/818627 [01:11<00:21, 8736.00 examples/s]
+Filter: 77%|███████▋ | 631000/818627 [01:11<00:21, 8745.29 examples/s]
+Filter: 77%|███████▋ | 631000/818627 [01:11<00:21, 8672.28 examples/s]
+Filter: 77%|███████▋ | 631000/818627 [01:11<00:21, 8610.41 examples/s]
+Filter: 77%|███████▋ | 632000/818627 [01:11<00:21, 8741.15 examples/s]
+Filter: 77%|███████▋ | 632000/818627 [01:11<00:21, 8725.23 examples/s]
+Filter: 77%|███████▋ | 632000/818627 [01:11<00:21, 8729.18 examples/s]
+Filter: 77%|███████▋ | 632000/818627 [01:11<00:21, 8725.25 examples/s]
+Filter: 77%|███████▋ | 632000/818627 [01:11<00:21, 8724.42 examples/s]
+Filter: 77%|███████▋ | 632000/818627 [01:11<00:21, 8723.25 examples/s]
+Filter: 77%|███████▋ | 632000/818627 [01:11<00:21, 8759.66 examples/s]
+Filter: 77%|███████▋ | 632000/818627 [01:11<00:21, 8728.39 examples/s]
+Filter: 77%|███████▋ | 633000/818627 [01:11<00:21, 8684.36 examples/s]
+Filter: 77%|███████▋ | 633000/818627 [01:11<00:21, 8671.08 examples/s]
+Filter: 77%|███████▋ | 633000/818627 [01:11<00:21, 8677.41 examples/s]
+Filter: 77%|███████▋ | 633000/818627 [01:12<00:21, 8674.72 examples/s]
+Filter: 77%|███████▋ | 633000/818627 [01:11<00:21, 8674.04 examples/s]
+Filter: 77%|███████▋ | 633000/818627 [01:11<00:21, 8699.90 examples/s]
+Filter: 77%|███████▋ | 633000/818627 [01:11<00:21, 8672.60 examples/s]
+Filter: 77%|███████▋ | 633000/818627 [01:11<00:21, 8679.53 examples/s]
+Filter: 77%|███████▋ | 634000/818627 [01:11<00:21, 8674.50 examples/s]
+Filter: 77%|███████▋ | 634000/818627 [01:11<00:21, 8680.39 examples/s]
+Filter: 77%|███████▋ | 634000/818627 [01:11<00:21, 8676.81 examples/s]
+Filter: 77%|███████▋ | 634000/818627 [01:12<00:21, 8674.69 examples/s]
+Filter: 77%|███████▋ | 634000/818627 [01:11<00:21, 8675.66 examples/s]
+Filter: 77%|███████▋ | 634000/818627 [01:11<00:21, 8692.10 examples/s]
+Filter: 77%|███████▋ | 634000/818627 [01:11<00:21, 8673.21 examples/s]
+Filter: 77%|███████▋ | 634000/818627 [01:11<00:21, 8675.73 examples/s]
+Filter: 78%|███████▊ | 635000/818627 [01:12<00:21, 8647.56 examples/s]
+Filter: 78%|███████▊ | 635000/818627 [01:11<00:21, 8651.50 examples/s]
+Filter: 78%|███████▊ | 635000/818627 [01:11<00:21, 8643.14 examples/s]
+Filter: 78%|███████▊ | 635000/818627 [01:12<00:21, 8647.43 examples/s]
+Filter: 78%|███████▊ | 635000/818627 [01:11<00:21, 8645.27 examples/s]
+Filter: 78%|███████▊ | 635000/818627 [01:11<00:21, 8648.50 examples/s]
+Filter: 78%|███████▊ | 635000/818627 [01:11<00:21, 8654.39 examples/s]
+Filter: 78%|███████▊ | 635000/818627 [01:12<00:21, 8641.68 examples/s]
+Filter: 78%|███████▊ | 636000/818627 [01:12<00:21, 8666.35 examples/s]
+Filter: 78%|███████▊ | 636000/818627 [01:12<00:21, 8660.10 examples/s]
+Filter: 78%|███████▊ | 636000/818627 [01:12<00:21, 8665.80 examples/s]
+Filter: 78%|███████▊ | 636000/818627 [01:12<00:21, 8665.75 examples/s]
+Filter: 78%|███████▊ | 636000/818627 [01:12<00:21, 8663.42 examples/s]
+Filter: 78%|███████▊ | 636000/818627 [01:12<00:21, 8664.07 examples/s]
+Filter: 78%|███████▊ | 636000/818627 [01:12<00:21, 8671.14 examples/s]
+Filter: 78%|███████▊ | 636000/818627 [01:12<00:21, 8663.80 examples/s]
+Filter: 78%|███████▊ | 637000/818627 [01:12<00:21, 8629.94 examples/s]
+Filter: 78%|███████▊ | 637000/818627 [01:12<00:21, 8631.40 examples/s]
+Filter: 78%|███████▊ | 637000/818627 [01:12<00:21, 8624.32 examples/s]
+Filter: 78%|███████▊ | 637000/818627 [01:12<00:21, 8628.14 examples/s]
+Filter: 78%|███████▊ | 637000/818627 [01:12<00:21, 8627.91 examples/s]
+Filter: 78%|███████▊ | 637000/818627 [01:12<00:21, 8632.70 examples/s]
+Filter: 78%|███████▊ | 637000/818627 [01:12<00:21, 8624.75 examples/s]
+Filter: 78%|███████▊ | 637000/818627 [01:12<00:21, 8627.87 examples/s]
+Filter: 78%|███████▊ | 638000/818627 [01:12<00:20, 8629.86 examples/s]
+Filter: 78%|███████▊ | 638000/818627 [01:12<00:20, 8627.13 examples/s]
+Filter: 78%|███████▊ | 638000/818627 [01:12<00:20, 8627.10 examples/s]
+Filter: 78%|███████▊ | 638000/818627 [01:12<00:20, 8626.80 examples/s]
+Filter: 78%|███████▊ | 638000/818627 [01:12<00:20, 8633.06 examples/s]
+Filter: 78%|███████▊ | 638000/818627 [01:12<00:20, 8627.84 examples/s]
+Filter: 78%|███████▊ | 638000/818627 [01:12<00:20, 8626.03 examples/s]
+Filter: 78%|███████▊ | 638000/818627 [01:12<00:20, 8620.67 examples/s]
+Filter: 78%|███████▊ | 639000/818627 [01:12<00:20, 8590.87 examples/s]
+Filter: 78%|███████▊ | 639000/818627 [01:12<00:20, 8585.42 examples/s]
+Filter: 78%|███████▊ | 639000/818627 [01:12<00:20, 8583.29 examples/s]
+Filter: 78%|███████▊ | 639000/818627 [01:12<00:20, 8593.65 examples/s]
+Filter: 78%|███████▊ | 639000/818627 [01:12<00:20, 8589.24 examples/s]
+Filter: 78%|███████▊ | 639000/818627 [01:12<00:20, 8583.17 examples/s]
+Filter: 78%|███████▊ | 639000/818627 [01:12<00:20, 8590.89 examples/s]
+Filter: 78%|███████▊ | 639000/818627 [01:12<00:21, 8543.50 examples/s]
+Filter: 78%|███████▊ | 640000/818627 [01:12<00:20, 8819.69 examples/s]
+Filter: 78%|███████▊ | 640000/818627 [01:12<00:20, 8815.99 examples/s]
+Filter: 78%|███████▊ | 640000/818627 [01:12<00:20, 8813.18 examples/s]
+Filter: 78%|███████▊ | 640000/818627 [01:12<00:20, 8816.30 examples/s]
+Filter: 78%|███████▊ | 640000/818627 [01:12<00:20, 8820.49 examples/s]
+Filter: 78%|███████▊ | 640000/818627 [01:12<00:20, 8833.37 examples/s]
+Filter: 78%|███████▊ | 640000/818627 [01:12<00:20, 8817.77 examples/s]
+Filter: 78%|███████▊ | 640000/818627 [01:12<00:20, 8817.47 examples/s]
+Filter: 78%|███████▊ | 641000/818627 [01:12<00:20, 8745.38 examples/s]
+Filter: 78%|███████▊ | 641000/818627 [01:12<00:20, 8740.81 examples/s]
+Filter: 78%|███████▊ | 641000/818627 [01:12<00:20, 8743.85 examples/s]
+Filter: 78%|███████▊ | 641000/818627 [01:13<00:20, 8739.55 examples/s]
+Filter: 78%|███████▊ | 641000/818627 [01:12<00:20, 8749.96 examples/s]
+Filter: 78%|███████▊ | 641000/818627 [01:12<00:20, 8740.62 examples/s]
+Filter: 78%|███████▊ | 641000/818627 [01:12<00:20, 8738.80 examples/s]
+Filter: 78%|███████▊ | 641000/818627 [01:12<00:20, 8743.19 examples/s]
+Filter: 78%|███████▊ | 642000/818627 [01:12<00:20, 8717.53 examples/s]
+Filter: 78%|███████▊ | 642000/818627 [01:12<00:20, 8715.71 examples/s]
+Filter: 78%|███████▊ | 642000/818627 [01:12<00:20, 8721.65 examples/s]
+Filter: 78%|███████▊ | 642000/818627 [01:13<00:20, 8723.49 examples/s]
+Filter: 78%|███████▊ | 642000/818627 [01:12<00:20, 8720.63 examples/s]
+Filter: 78%|███████▊ | 642000/818627 [01:12<00:20, 8718.82 examples/s]
+Filter: 78%|███████▊ | 642000/818627 [01:12<00:20, 8719.81 examples/s]
+Filter: 78%|███████▊ | 642000/818627 [01:12<00:20, 8714.00 examples/s]
+Filter: 79%|███████▊ | 643000/818627 [01:12<00:20, 8676.49 examples/s]
+Filter: 79%|███████▊ | 643000/818627 [01:12<00:20, 8675.19 examples/s]
+Filter: 79%|███████▊ | 643000/818627 [01:12<00:20, 8675.37 examples/s]
+Filter: 79%|███████▊ | 643000/818627 [01:12<00:20, 8683.40 examples/s]
+Filter: 79%|███████▊ | 643000/818627 [01:13<00:20, 8672.47 examples/s]
+Filter: 79%|███████▊ | 643000/818627 [01:12<00:20, 8673.89 examples/s]
+Filter: 79%|███████▊ | 643000/818627 [01:13<00:20, 8673.01 examples/s]
+Filter: 79%|███████▊ | 643000/818627 [01:12<00:20, 8678.54 examples/s]
+Filter: 79%|███████▊ | 644000/818627 [01:13<00:20, 8681.55 examples/s]
+Filter: 79%|███████▊ | 644000/818627 [01:13<00:20, 8681.54 examples/s]
+Filter: 79%|███████▊ | 644000/818627 [01:13<00:20, 8681.94 examples/s]
+Filter: 79%|███████▊ | 644000/818627 [01:13<00:20, 8681.40 examples/s]
+Filter: 79%|███████▊ | 644000/818627 [01:13<00:20, 8683.14 examples/s]
+Filter: 79%|███████▊ | 644000/818627 [01:13<00:20, 8685.06 examples/s]
+Filter: 79%|███████▊ | 644000/818627 [01:13<00:20, 8680.40 examples/s]
+Filter: 79%|███████▊ | 644000/818627 [01:13<00:20, 8682.88 examples/s]
+Filter: 79%|███████▉ | 645000/818627 [01:13<00:19, 8722.14 examples/s]
+Filter: 79%|███████▉ | 645000/818627 [01:13<00:19, 8723.49 examples/s]
+Filter: 79%|███████▉ | 645000/818627 [01:13<00:19, 8715.88 examples/s]
+Filter: 79%|███████▉ | 645000/818627 [01:13<00:19, 8721.46 examples/s]
+Filter: 79%|███████▉ | 645000/818627 [01:13<00:19, 8721.66 examples/s]
+Filter: 79%|███████▉ | 645000/818627 [01:13<00:19, 8719.56 examples/s]
+Filter: 79%|███████▉ | 645000/818627 [01:13<00:19, 8720.91 examples/s]
+Filter: 79%|███████▉ | 645000/818627 [01:13<00:19, 8719.38 examples/s]
+Filter: 79%|███████▉ | 646000/818627 [01:13<00:19, 8857.88 examples/s]
+Filter: 79%|███████▉ | 646000/818627 [01:13<00:19, 8860.65 examples/s]
+Filter: 79%|███████▉ | 646000/818627 [01:13<00:19, 8859.26 examples/s]
+Filter: 79%|███████▉ | 646000/818627 [01:13<00:19, 8860.38 examples/s]
+Filter: 79%|███████▉ | 646000/818627 [01:13<00:19, 8859.53 examples/s]
+Filter: 79%|███████▉ | 646000/818627 [01:13<00:19, 8857.80 examples/s]
+Filter: 79%|███████▉ | 646000/818627 [01:13<00:19, 8858.40 examples/s]
+Filter: 79%|███████▉ | 646000/818627 [01:13<00:19, 8860.39 examples/s]
+Filter: 79%|███████▉ | 647000/818627 [01:13<00:18, 9044.95 examples/s]
+Filter: 79%|███████▉ | 647000/818627 [01:13<00:18, 9047.63 examples/s]
+Filter: 79%|███████▉ | 647000/818627 [01:13<00:18, 9041.94 examples/s]
+Filter: 79%|███████▉ | 647000/818627 [01:13<00:18, 9045.81 examples/s]
+Filter: 79%|███████▉ | 647000/818627 [01:13<00:18, 9049.18 examples/s]
+Filter: 79%|███████▉ | 647000/818627 [01:13<00:18, 9046.51 examples/s]
+Filter: 79%|███████▉ | 647000/818627 [01:13<00:18, 9043.03 examples/s]
+Filter: 79%|███████▉ | 647000/818627 [01:13<00:18, 9041.32 examples/s]
+Filter: 79%|███████▉ | 648000/818627 [01:13<00:19, 8877.67 examples/s]
+Filter: 79%|███████▉ | 648000/818627 [01:13<00:19, 8874.33 examples/s]
+Filter: 79%|███████▉ | 648000/818627 [01:13<00:19, 8875.22 examples/s]
+Filter: 79%|███████▉ | 648000/818627 [01:13<00:19, 8875.37 examples/s]
+Filter: 79%|███████▉ | 648000/818627 [01:13<00:19, 8878.25 examples/s]
+Filter: 79%|███████▉ | 648000/818627 [01:13<00:19, 8871.31 examples/s]
+Filter: 79%|███████▉ | 648000/818627 [01:13<00:19, 8873.67 examples/s]
+Filter: 79%|███████▉ | 648000/818627 [01:13<00:19, 8869.21 examples/s]
+Filter: 79%|███████▉ | 649000/818627 [01:13<00:19, 8806.38 examples/s]
+Filter: 79%|███████▉ | 649000/818627 [01:13<00:19, 8806.04 examples/s]
+Filter: 79%|███████▉ | 649000/818627 [01:13<00:19, 8807.05 examples/s]
+Filter: 79%|███████▉ | 649000/818627 [01:13<00:19, 8804.04 examples/s]
+Filter: 79%|███████▉ | 649000/818627 [01:13<00:19, 8804.06 examples/s]
+Filter: 79%|███████▉ | 649000/818627 [01:13<00:19, 8803.65 examples/s]
+Filter: 79%|███████▉ | 649000/818627 [01:13<00:19, 8803.21 examples/s]
+Filter: 79%|███████▉ | 649000/818627 [01:13<00:19, 8803.66 examples/s]
+Filter: 79%|███████▉ | 650000/818627 [01:13<00:19, 8789.25 examples/s]
+Filter: 79%|███████▉ | 650000/818627 [01:13<00:19, 8788.46 examples/s]
+Filter: 79%|███████▉ | 650000/818627 [01:13<00:19, 8789.27 examples/s]
+Filter: 79%|███████▉ | 650000/818627 [01:14<00:19, 8788.99 examples/s]
+Filter: 79%|███████▉ | 650000/818627 [01:13<00:19, 8789.54 examples/s]
+Filter: 79%|███████▉ | 650000/818627 [01:13<00:19, 8790.66 examples/s]
+Filter: 79%|███████▉ | 650000/818627 [01:13<00:19, 8789.42 examples/s]
+Filter: 79%|███████▉ | 650000/818627 [01:13<00:19, 8788.00 examples/s]
+Filter: 80%|███████▉ | 651000/818627 [01:13<00:19, 8766.63 examples/s]
+Filter: 80%|███████▉ | 651000/818627 [01:13<00:19, 8763.37 examples/s]
+Filter: 80%|███████▉ | 651000/818627 [01:13<00:19, 8765.16 examples/s]
+Filter: 80%|███████▉ | 651000/818627 [01:14<00:19, 8771.94 examples/s]
+Filter: 80%|███████▉ | 651000/818627 [01:13<00:19, 8767.93 examples/s]
+Filter: 80%|███████▉ | 651000/818627 [01:13<00:19, 8768.16 examples/s]
+Filter: 80%|███████▉ | 651000/818627 [01:13<00:19, 8767.88 examples/s]
+Filter: 80%|███████▉ | 651000/818627 [01:13<00:19, 8766.65 examples/s]
+Filter: 80%|███████▉ | 652000/818627 [01:13<00:18, 8877.19 examples/s]
+Filter: 80%|███████▉ | 652000/818627 [01:13<00:18, 8880.19 examples/s]
+Filter: 80%|███████▉ | 652000/818627 [01:13<00:18, 8878.54 examples/s]
+Filter: 80%|███████▉ | 652000/818627 [01:14<00:18, 8881.30 examples/s]
+Filter: 80%|███████▉ | 652000/818627 [01:13<00:18, 8883.99 examples/s]
+Filter: 80%|███████▉ | 652000/818627 [01:14<00:18, 8881.88 examples/s]
+Filter: 80%|███████▉ | 652000/818627 [01:13<00:18, 8880.06 examples/s]
+Filter: 80%|███████▉ | 652000/818627 [01:13<00:18, 8878.45 examples/s]
+Filter: 80%|███████▉ | 653000/818627 [01:14<00:18, 8766.36 examples/s]
+Filter: 80%|███████▉ | 653000/818627 [01:14<00:18, 8765.94 examples/s]
+Filter: 80%|███████▉ | 653000/818627 [01:14<00:18, 8763.66 examples/s]
+Filter: 80%|███████▉ | 653000/818627 [01:14<00:18, 8764.31 examples/s]
+Filter: 80%|███████▉ | 653000/818627 [01:14<00:18, 8764.81 examples/s]
+Filter: 80%|███████▉ | 653000/818627 [01:14<00:18, 8764.25 examples/s]
+Filter: 80%|███████▉ | 653000/818627 [01:14<00:18, 8764.42 examples/s]
+Filter: 80%|███████▉ | 653000/818627 [01:14<00:18, 8763.68 examples/s]
+Filter: 80%|███████▉ | 654000/818627 [01:14<00:18, 8724.60 examples/s]
+Filter: 80%|███████▉ | 654000/818627 [01:14<00:18, 8723.86 examples/s]
+Filter: 80%|███████▉ | 654000/818627 [01:14<00:18, 8727.32 examples/s]
+Filter: 80%|███████▉ | 654000/818627 [01:14<00:18, 8730.20 examples/s]
+Filter: 80%|███████▉ | 654000/818627 [01:14<00:18, 8728.01 examples/s]
+Filter: 80%|███████▉ | 654000/818627 [01:14<00:18, 8725.55 examples/s]
+Filter: 80%|███████▉ | 654000/818627 [01:14<00:18, 8729.76 examples/s]
+Filter: 80%|███████▉ | 654000/818627 [01:14<00:18, 8724.73 examples/s]
+Filter: 80%|████████ | 655000/818627 [01:14<00:18, 8707.14 examples/s]
+Filter: 80%|████████ | 655000/818627 [01:14<00:18, 8707.47 examples/s]
+Filter: 80%|████████ | 655000/818627 [01:14<00:18, 8708.14 examples/s]
+Filter: 80%|████████ | 655000/818627 [01:14<00:18, 8708.59 examples/s]
+Filter: 80%|████████ | 655000/818627 [01:14<00:18, 8708.36 examples/s]
+Filter: 80%|████████ | 655000/818627 [01:14<00:18, 8707.28 examples/s]
+Filter: 80%|████████ | 655000/818627 [01:14<00:18, 8709.93 examples/s]
+Filter: 80%|████████ | 655000/818627 [01:14<00:19, 8595.48 examples/s]
+Filter: 80%|████████ | 656000/818627 [01:14<00:18, 8729.45 examples/s]
+Filter: 80%|████████ | 656000/818627 [01:14<00:18, 8731.63 examples/s]
+Filter: 80%|████████ | 656000/818627 [01:14<00:18, 8729.98 examples/s]
+Filter: 80%|████████ | 656000/818627 [01:14<00:18, 8731.13 examples/s]
+Filter: 80%|████████ | 656000/818627 [01:14<00:18, 8728.84 examples/s]
+Filter: 80%|████████ | 656000/818627 [01:14<00:18, 8762.43 examples/s]
+Filter: 80%|████████ | 656000/818627 [01:14<00:18, 8728.92 examples/s]
+Filter: 80%|████████ | 656000/818627 [01:14<00:18, 8725.02 examples/s]
+Filter: 80%|████████ | 657000/818627 [01:14<00:18, 8720.39 examples/s]
+Filter: 80%|████████ | 657000/818627 [01:14<00:18, 8718.92 examples/s]
+Filter: 80%|████████ | 657000/818627 [01:14<00:18, 8720.59 examples/s]
+Filter: 80%|████████ | 657000/818627 [01:14<00:18, 8720.62 examples/s]
+Filter: 80%|████████ | 657000/818627 [01:14<00:18, 8722.15 examples/s]
+Filter: 80%|████████ | 657000/818627 [01:14<00:18, 8721.01 examples/s]
+Filter: 80%|████████ | 657000/818627 [01:14<00:18, 8743.36 examples/s]
+Filter: 80%|████████ | 657000/818627 [01:14<00:18, 8718.19 examples/s]
+Filter: 80%|████████ | 658000/818627 [01:14<00:18, 8776.43 examples/s]
+Filter: 80%|████████ | 658000/818627 [01:14<00:18, 8768.69 examples/s]
+Filter: 80%|████████ | 658000/818627 [01:14<00:18, 8768.92 examples/s]
+Filter: 80%|████████ | 658000/818627 [01:14<00:18, 8776.03 examples/s]
+Filter: 80%|████████ | 658000/818627 [01:14<00:18, 8773.85 examples/s]
+Filter: 80%|████████ | 658000/818627 [01:14<00:18, 8790.81 examples/s]
+Filter: 80%|████████ | 658000/818627 [01:14<00:18, 8755.97 examples/s]
+Filter: 80%|████████ | 658000/818627 [01:14<00:18, 8626.36 examples/s]
+Filter: 81%|████████ | 659000/818627 [01:14<00:17, 8883.39 examples/s]
+Filter: 81%|████████ | 659000/818627 [01:14<00:17, 8884.93 examples/s]
+Filter: 81%|████████ | 659000/818627 [01:15<00:17, 8882.88 examples/s]
+Filter: 81%|████████ | 659000/818627 [01:14<00:17, 8878.82 examples/s]
+Filter: 81%|████████ | 659000/818627 [01:14<00:17, 8897.38 examples/s]
+Filter: 81%|████████ | 659000/818627 [01:14<00:17, 8877.85 examples/s]
+Filter: 81%|████████ | 659000/818627 [01:14<00:17, 8875.59 examples/s]
+Filter: 81%|████████ | 659000/818627 [01:14<00:17, 8925.87 examples/s]
+Filter: 81%|████████ | 660000/818627 [01:14<00:17, 9025.50 examples/s]
+Filter: 81%|████████ | 660000/818627 [01:14<00:17, 9023.97 examples/s]
+Filter: 81%|████████ | 660000/818627 [01:15<00:17, 9029.10 examples/s]
+Filter: 81%|████████ | 660000/818627 [01:14<00:17, 9030.34 examples/s]
+Filter: 81%|████████ | 660000/818627 [01:14<00:17, 9025.49 examples/s]
+Filter: 81%|████████ | 660000/818627 [01:14<00:17, 9025.87 examples/s]
+Filter: 81%|████████ | 660000/818627 [01:14<00:17, 9032.19 examples/s]
+Filter: 81%|████████ | 660000/818627 [01:14<00:17, 9058.31 examples/s]
+Filter: 81%|████████ | 661000/818627 [01:14<00:17, 8876.10 examples/s]
+Filter: 81%|████████ | 661000/818627 [01:14<00:17, 8877.35 examples/s]
+Filter: 81%|████████ | 661000/818627 [01:14<00:17, 8877.82 examples/s]
+Filter: 81%|████████ | 661000/818627 [01:15<00:17, 8875.26 examples/s]
+Filter: 81%|████████ | 661000/818627 [01:14<00:17, 8880.04 examples/s]
+Filter: 81%|████████ | 661000/818627 [01:14<00:17, 8874.02 examples/s]
+Filter: 81%|████████ | 661000/818627 [01:14<00:17, 8898.91 examples/s]
+Filter: 81%|████████ | 661000/818627 [01:15<00:17, 8866.26 examples/s]
+Filter: 81%|████████ | 662000/818627 [01:15<00:17, 8823.97 examples/s]
+Filter: 81%|████████ | 662000/818627 [01:15<00:17, 8818.31 examples/s]
+Filter: 81%|████████ | 662000/818627 [01:15<00:17, 8821.67 examples/s]
+Filter: 81%|████████ | 662000/818627 [01:15<00:17, 8822.21 examples/s]
+Filter: 81%|████████ | 662000/818627 [01:15<00:17, 8825.40 examples/s]
+Filter: 81%|████████ | 662000/818627 [01:15<00:17, 8826.27 examples/s]
+Filter: 81%|████████ | 662000/818627 [01:15<00:17, 8840.12 examples/s]
+Filter: 81%|████████ | 662000/818627 [01:15<00:17, 8821.22 examples/s]
+Filter: 81%|████████ | 663000/818627 [01:15<00:17, 8784.21 examples/s]
+Filter: 81%|████████ | 663000/818627 [01:15<00:17, 8786.22 examples/s]
+Filter: 81%|████████ | 663000/818627 [01:15<00:17, 8789.00 examples/s]
+Filter: 81%|████████ | 663000/818627 [01:15<00:17, 8787.41 examples/s]
+Filter: 81%|████████ | 663000/818627 [01:15<00:17, 8789.19 examples/s]
+Filter: 81%|████████ | 663000/818627 [01:15<00:17, 8787.85 examples/s]
+Filter: 81%|████████ | 663000/818627 [01:15<00:17, 8785.80 examples/s]
+Filter: 81%|████████ | 663000/818627 [01:15<00:17, 8795.67 examples/s]
+Filter: 81%|████████ | 664000/818627 [01:15<00:17, 8748.57 examples/s]
+Filter: 81%|████████ | 664000/818627 [01:15<00:17, 8748.48 examples/s]
+Filter: 81%|████████ | 664000/818627 [01:15<00:17, 8750.61 examples/s]
+Filter: 81%|████████ | 664000/818627 [01:15<00:17, 8748.90 examples/s]
+Filter: 81%|████████ | 664000/818627 [01:15<00:17, 8747.52 examples/s]
+Filter: 81%|████████ | 664000/818627 [01:15<00:17, 8746.21 examples/s]
+Filter: 81%|████████ | 664000/818627 [01:15<00:17, 8754.15 examples/s]
+Filter: 81%|████████ | 664000/818627 [01:15<00:17, 8739.62 examples/s]
+Filter: 81%|████████ | 665000/818627 [01:15<00:17, 8714.07 examples/s]
+Filter: 81%|████████ | 665000/818627 [01:15<00:17, 8713.10 examples/s]
+Filter: 81%|████████ | 665000/818627 [01:15<00:17, 8715.36 examples/s]
+Filter: 81%|████████ | 665000/818627 [01:15<00:17, 8705.16 examples/s]
+Filter: 81%|████████ | 665000/818627 [01:15<00:17, 8714.80 examples/s]
+Filter: 81%|████████ | 665000/818627 [01:15<00:17, 8713.55 examples/s]
+Filter: 81%|████████ | 665000/818627 [01:15<00:17, 8713.73 examples/s]
+Filter: 81%|████████ | 665000/818627 [01:15<00:17, 8714.58 examples/s]
+Filter: 81%|████████▏ | 666000/818627 [01:15<00:17, 8773.96 examples/s]
+Filter: 81%|████████▏ | 666000/818627 [01:15<00:17, 8779.71 examples/s]
+Filter: 81%|████████▏ | 666000/818627 [01:15<00:17, 8781.47 examples/s]
+Filter: 81%|████████▏ | 666000/818627 [01:15<00:17, 8773.89 examples/s]
+Filter: 81%|████████▏ | 666000/818627 [01:15<00:17, 8780.91 examples/s]
+Filter: 81%|████████▏ | 666000/818627 [01:15<00:17, 8781.85 examples/s]
+Filter: 81%|████████▏ | 666000/818627 [01:15<00:17, 8777.11 examples/s]
+Filter: 81%|████████▏ | 666000/818627 [01:15<00:17, 8778.10 examples/s]
+Filter: 81%|████████▏ | 667000/818627 [01:15<00:17, 8516.07 examples/s]
+Filter: 81%|████████▏ | 667000/818627 [01:15<00:17, 8517.89 examples/s]
+Filter: 81%|████████▏ | 667000/818627 [01:15<00:17, 8515.39 examples/s]
+Filter: 81%|████████▏ | 667000/818627 [01:15<00:17, 8512.92 examples/s]
+Filter: 81%|████████▏ | 667000/818627 [01:15<00:17, 8518.68 examples/s]
+Filter: 81%|████████▏ | 667000/818627 [01:15<00:17, 8517.96 examples/s]
+Filter: 81%|████████▏ | 667000/818627 [01:15<00:17, 8515.81 examples/s]
+Filter: 81%|████████▏ | 667000/818627 [01:15<00:17, 8519.82 examples/s]
+Filter: 82%|████████▏ | 668000/818627 [01:15<00:18, 8303.50 examples/s]
+Filter: 82%|████████▏ | 668000/818627 [01:15<00:18, 8304.13 examples/s]
+Filter: 82%|████████▏ | 668000/818627 [01:16<00:18, 8304.28 examples/s]
+Filter: 82%|████████▏ | 668000/818627 [01:15<00:18, 8301.40 examples/s]
+Filter: 82%|████████▏ | 668000/818627 [01:15<00:18, 8303.69 examples/s]
+Filter: 82%|████████▏ | 668000/818627 [01:15<00:18, 8301.84 examples/s]
+Filter: 82%|████████▏ | 668000/818627 [01:15<00:18, 8302.40 examples/s]
+Filter: 82%|████████▏ | 668000/818627 [01:15<00:18, 8305.72 examples/s]
+Filter: 82%|████████▏ | 669000/818627 [01:15<00:17, 8586.67 examples/s]
+Filter: 82%|████████▏ | 669000/818627 [01:15<00:17, 8587.67 examples/s]
+Filter: 82%|████████▏ | 669000/818627 [01:16<00:17, 8584.31 examples/s]
+Filter: 82%|████████▏ | 669000/818627 [01:15<00:17, 8580.52 examples/s]
+Filter: 82%|████████▏ | 669000/818627 [01:15<00:17, 8588.61 examples/s]
+Filter: 82%|████████▏ | 669000/818627 [01:15<00:17, 8587.59 examples/s]
+Filter: 82%|████████▏ | 669000/818627 [01:15<00:17, 8584.43 examples/s]
+Filter: 82%|████████▏ | 669000/818627 [01:15<00:17, 8581.63 examples/s]
+Filter: 82%|████████▏ | 670000/818627 [01:15<00:16, 8865.29 examples/s]
+Filter: 82%|████████▏ | 670000/818627 [01:15<00:16, 8867.85 examples/s]
+Filter: 82%|████████▏ | 670000/818627 [01:16<00:16, 8868.15 examples/s]
+Filter: 82%|████████▏ | 670000/818627 [01:15<00:16, 8864.37 examples/s]
+Filter: 82%|████████▏ | 670000/818627 [01:16<00:16, 8867.26 examples/s]
+Filter: 82%|████████▏ | 670000/818627 [01:15<00:16, 8866.43 examples/s]
+Filter: 82%|████████▏ | 670000/818627 [01:15<00:16, 8864.58 examples/s]
+Filter: 82%|████████▏ | 670000/818627 [01:15<00:16, 8869.64 examples/s]
+Filter: 82%|████████▏ | 671000/818627 [01:16<00:16, 9175.52 examples/s]
+Filter: 82%|████████▏ | 671000/818627 [01:16<00:16, 9178.86 examples/s]
+Filter: 82%|████████▏ | 671000/818627 [01:16<00:16, 9180.12 examples/s]
+Filter: 82%|████████▏ | 672000/818627 [01:16<00:15, 9170.78 examples/s]
+Filter: 82%|████████▏ | 672000/818627 [01:16<00:15, 9173.01 examples/s]
+Filter: 82%|████████▏ | 672000/818627 [01:16<00:15, 9166.44 examples/s]
+Filter: 82%|████████▏ | 672000/818627 [01:16<00:15, 9170.77 examples/s]
+Filter: 82%|████████▏ | 672000/818627 [01:16<00:15, 9172.95 examples/s]
+Filter: 82%|████████▏ | 672000/818627 [01:16<00:15, 9166.12 examples/s]
+Filter: 82%|████████▏ | 672000/818627 [01:16<00:15, 9169.79 examples/s]
+Filter: 82%|████████▏ | 672000/818627 [01:16<00:15, 9168.26 examples/s]
+Filter: 82%|████████▏ | 673000/818627 [01:16<00:16, 9016.93 examples/s]
+Filter: 82%|████████▏ | 673000/818627 [01:16<00:16, 9019.65 examples/s]
+Filter: 82%|████████▏ | 673000/818627 [01:16<00:16, 9017.57 examples/s]
+Filter: 82%|████████▏ | 673000/818627 [01:16<00:16, 8979.54 examples/s]
+Filter: 82%|████████▏ | 673000/818627 [01:16<00:16, 9017.97 examples/s]
+Filter: 82%|████████▏ | 673000/818627 [01:16<00:16, 9017.68 examples/s]
+Filter: 82%|████████▏ | 673000/818627 [01:16<00:16, 8981.71 examples/s]
+Filter: 82%|████████▏ | 673000/818627 [01:16<00:16, 8984.81 examples/s]
+Filter: 82%|████████▏ | 674000/818627 [01:16<00:16, 8913.38 examples/s]
+Filter: 82%|████████▏ | 674000/818627 [01:16<00:16, 8914.91 examples/s]
+Filter: 82%|████████▏ | 674000/818627 [01:16<00:16, 8880.18 examples/s]
+Filter: 82%|████████▏ | 674000/818627 [01:16<00:16, 8911.88 examples/s]
+Filter: 82%|████████▏ | 674000/818627 [01:16<00:16, 8878.88 examples/s]
+Filter: 82%|████████▏ | 674000/818627 [01:16<00:16, 8913.81 examples/s]
+Filter: 82%|████████▏ | 674000/818627 [01:16<00:16, 8915.11 examples/s]
+Filter: 82%|████████▏ | 674000/818627 [01:16<00:16, 8874.93 examples/s]
+Filter: 82%|████████▏ | 675000/818627 [01:16<00:16, 8872.33 examples/s]
+Filter: 82%|████████▏ | 675000/818627 [01:16<00:16, 8841.47 examples/s]
+Filter: 82%|████████▏ | 675000/818627 [01:16<00:16, 8870.62 examples/s]
+Filter: 82%|████████▏ | 675000/818627 [01:16<00:16, 8874.53 examples/s]
+Filter: 82%|████████▏ | 675000/818627 [01:16<00:16, 8841.85 examples/s]
+Filter: 82%|████████▏ | 675000/818627 [01:16<00:16, 8870.28 examples/s]
+Filter: 82%|████████▏ | 675000/818627 [01:16<00:16, 8843.77 examples/s]
+Filter: 82%|████████▏ | 675000/818627 [01:16<00:16, 8720.17 examples/s]
+Filter: 83%|████████▎ | 676000/818627 [01:16<00:15, 9061.02 examples/s]
+Filter: 83%|████████▎ | 676000/818627 [01:16<00:15, 9054.54 examples/s]
+Filter: 83%|████████▎ | 676000/818627 [01:16<00:15, 9061.34 examples/s]
+Filter: 83%|████████▎ | 676000/818627 [01:16<00:15, 9064.59 examples/s]
+Filter: 83%|████████▎ | 676000/818627 [01:16<00:15, 9062.95 examples/s]
+Filter: 83%|████████▎ | 676000/818627 [01:16<00:15, 9052.06 examples/s]
+Filter: 83%|████████▎ | 676000/818627 [01:16<00:15, 9053.77 examples/s]
+Filter: 83%|████████▎ | 677000/818627 [01:16<00:15, 9227.43 examples/s]
+Filter: 83%|████████▎ | 677000/818627 [01:16<00:15, 9229.49 examples/s]
+Filter: 83%|████████▎ | 677000/818627 [01:16<00:15, 9229.34 examples/s]
+Filter: 83%|████████▎ | 677000/818627 [01:17<00:15, 9225.21 examples/s]
+Filter: 83%|████████▎ | 677000/818627 [01:16<00:15, 9231.92 examples/s]
+Filter: 83%|████████▎ | 677000/818627 [01:16<00:15, 9228.67 examples/s]
+Filter: 83%|████████▎ | 677000/818627 [01:16<00:15, 9225.86 examples/s]
+Filter: 83%|████████▎ | 677000/818627 [01:16<00:15, 9228.19 examples/s]
+Filter: 83%|████████▎ | 678000/818627 [01:16<00:15, 8998.41 examples/s]
+Filter: 83%|████████▎ | 678000/818627 [01:16<00:15, 8996.23 examples/s]
+Filter: 83%|████████▎ | 678000/818627 [01:17<00:15, 9003.33 examples/s]
+Filter: 83%|████████▎ | 678000/818627 [01:16<00:15, 9035.23 examples/s]
+Filter: 83%|████████▎ | 678000/818627 [01:16<00:15, 8992.13 examples/s]
+Filter: 83%|████████▎ | 678000/818627 [01:16<00:15, 8997.05 examples/s]
+Filter: 83%|████████▎ | 678000/818627 [01:16<00:15, 8997.59 examples/s]
+Filter: 83%|████████▎ | 678000/818627 [01:16<00:15, 8991.80 examples/s]
+Filter: 83%|████████▎ | 679000/818627 [01:16<00:15, 8914.79 examples/s]
+Filter: 83%|████████▎ | 679000/818627 [01:16<00:15, 8860.25 examples/s]
+Filter: 83%|████████▎ | 679000/818627 [01:17<00:15, 8863.77 examples/s]
+Filter: 83%|████████▎ | 679000/818627 [01:16<00:15, 8852.16 examples/s]
+Filter: 83%|████████▎ | 679000/818627 [01:17<00:15, 8858.96 examples/s]
+Filter: 83%|████████▎ | 679000/818627 [01:16<00:15, 8867.07 examples/s]
+Filter: 83%|████████▎ | 679000/818627 [01:16<00:15, 8864.07 examples/s]
+Filter: 83%|████████▎ | 679000/818627 [01:16<00:15, 8855.17 examples/s]
+Filter: 83%|████████▎ | 680000/818627 [01:17<00:15, 8807.46 examples/s]
+Filter: 83%|████████▎ | 680000/818627 [01:17<00:15, 8843.62 examples/s]
+Filter: 83%|████████▎ | 680000/818627 [01:17<00:15, 8797.77 examples/s]
+Filter: 83%|████████▎ | 680000/818627 [01:17<00:15, 8804.44 examples/s]
+Filter: 83%|████████▎ | 680000/818627 [01:17<00:15, 8796.08 examples/s]
+Filter: 83%|████████▎ | 680000/818627 [01:17<00:15, 8803.22 examples/s]
+Filter: 83%|████████▎ | 680000/818627 [01:17<00:15, 8799.23 examples/s]
+Filter: 83%|████████▎ | 680000/818627 [01:17<00:15, 8781.90 examples/s]
+Filter: 83%|████████▎ | 681000/818627 [01:17<00:15, 8717.98 examples/s]
+Filter: 83%|████████▎ | 681000/818627 [01:17<00:15, 8750.28 examples/s]
+Filter: 83%|████████▎ | 681000/818627 [01:17<00:15, 8724.63 examples/s]
+Filter: 83%|████████▎ | 681000/818627 [01:17<00:15, 8711.61 examples/s]
+Filter: 83%|████████▎ | 681000/818627 [01:17<00:15, 8716.07 examples/s]
+Filter: 83%|████████▎ | 681000/818627 [01:17<00:15, 8709.31 examples/s]
+Filter: 83%|████████▎ | 681000/818627 [01:17<00:15, 8715.07 examples/s]
+Filter: 83%|████████▎ | 681000/818627 [01:17<00:15, 8712.24 examples/s]
+Filter: 83%|████████▎ | 682000/818627 [01:17<00:15, 8636.90 examples/s]
+Filter: 83%|████████▎ | 682000/818627 [01:17<00:15, 8665.01 examples/s]
+Filter: 83%|████████▎ | 682000/818627 [01:17<00:15, 8642.13 examples/s]
+Filter: 83%|████████▎ | 682000/818627 [01:17<00:15, 8633.25 examples/s]
+Filter: 83%|████████▎ | 682000/818627 [01:17<00:15, 8636.35 examples/s]
+Filter: 83%|████████▎ | 682000/818627 [01:17<00:15, 8631.79 examples/s]
+Filter: 83%|████████▎ | 682000/818627 [01:17<00:15, 8635.13 examples/s]
+Filter: 83%|████████▎ | 682000/818627 [01:17<00:15, 8632.84 examples/s]
+Filter: 83%|████████▎ | 683000/818627 [01:17<00:15, 8815.97 examples/s]
+Filter: 83%|████████▎ | 683000/818627 [01:17<00:15, 8832.48 examples/s]
+Filter: 83%|████████▎ | 683000/818627 [01:17<00:15, 8820.59 examples/s]
+Filter: 83%|████████▎ | 683000/818627 [01:17<00:15, 8811.02 examples/s]
+Filter: 83%|████████▎ | 683000/818627 [01:17<00:15, 8815.23 examples/s]
+Filter: 83%|████████▎ | 683000/818627 [01:17<00:15, 8812.61 examples/s]
+Filter: 83%|████████▎ | 683000/818627 [01:17<00:15, 8808.51 examples/s]
+Filter: 83%|████████▎ | 683000/818627 [01:17<00:15, 8812.83 examples/s]
+Filter: 84%|████████▎ | 684000/818627 [01:17<00:15, 8747.74 examples/s]
+Filter: 84%|████████▎ | 684000/818627 [01:17<00:15, 8760.28 examples/s]
+Filter: 84%|████████▎ | 684000/818627 [01:17<00:15, 8746.70 examples/s]
+Filter: 84%|████████▎ | 684000/818627 [01:17<00:15, 8747.18 examples/s]
+Filter: 84%|████████▎ | 684000/818627 [01:17<00:15, 8746.97 examples/s]
+Filter: 84%|████████▎ | 684000/818627 [01:17<00:15, 8747.51 examples/s]
+Filter: 84%|████████▎ | 684000/818627 [01:17<00:15, 8747.96 examples/s]
+Filter: 84%|████████▎ | 684000/818627 [01:17<00:15, 8745.84 examples/s]
+Filter: 84%|████████▎ | 685000/818627 [01:17<00:15, 8702.65 examples/s]
+Filter: 84%|████████▎ | 685000/818627 [01:17<00:15, 8689.92 examples/s]
+Filter: 84%|████████▎ | 685000/818627 [01:18<00:15, 8693.36 examples/s]
+Filter: 84%|████████▎ | 685000/818627 [01:17<00:15, 8690.86 examples/s]
+Filter: 84%|████████▎ | 685000/818627 [01:17<00:15, 8693.63 examples/s]
+Filter: 84%|████████▎ | 685000/818627 [01:17<00:15, 8693.96 examples/s]
+Filter: 84%|████████▎ | 685000/818627 [01:17<00:15, 8689.74 examples/s]
+Filter: 84%|████████▎ | 685000/818627 [01:17<00:15, 8690.37 examples/s]
+Filter: 84%|████████▍ | 686000/818627 [01:17<00:15, 8647.49 examples/s]
+Filter: 84%|████████▍ | 686000/818627 [01:17<00:15, 8654.95 examples/s]
+Filter: 84%|████████▍ | 686000/818627 [01:18<00:15, 8648.94 examples/s]
+Filter: 84%|████████▍ | 686000/818627 [01:17<00:15, 8646.39 examples/s]
+Filter: 84%|████████▍ | 686000/818627 [01:17<00:15, 8649.41 examples/s]
+Filter: 84%|████████▍ | 686000/818627 [01:17<00:15, 8648.13 examples/s]
+Filter: 84%|████████▍ | 686000/818627 [01:17<00:15, 8647.01 examples/s]
+Filter: 84%|████████▍ | 686000/818627 [01:17<00:15, 8644.79 examples/s]
+Filter: 84%|████████▍ | 687000/818627 [01:17<00:15, 8643.98 examples/s]
+Filter: 84%|████████▍ | 687000/818627 [01:17<00:15, 8647.29 examples/s]
+Filter: 84%|████████▍ | 687000/818627 [01:18<00:15, 8644.50 examples/s]
+Filter: 84%|████████▍ | 687000/818627 [01:17<00:15, 8642.66 examples/s]
+Filter: 84%|████████▍ | 687000/818627 [01:17<00:15, 8644.17 examples/s]
+Filter: 84%|████████▍ | 687000/818627 [01:17<00:15, 8641.00 examples/s]
+Filter: 84%|████████▍ | 687000/818627 [01:18<00:15, 8641.07 examples/s]
+Filter: 84%|████████▍ | 687000/818627 [01:17<00:15, 8642.39 examples/s]
+Filter: 84%|████████▍ | 688000/818627 [01:18<00:15, 8661.63 examples/s]
+Filter: 84%|████████▍ | 688000/818627 [01:18<00:15, 8666.31 examples/s]
+Filter: 84%|████████▍ | 688000/818627 [01:18<00:15, 8661.75 examples/s]
+Filter: 84%|████████▍ | 688000/818627 [01:18<00:15, 8664.02 examples/s]
+Filter: 84%|████████▍ | 688000/818627 [01:18<00:15, 8662.45 examples/s]
+Filter: 84%|████████▍ | 688000/818627 [01:18<00:15, 8660.36 examples/s]
+Filter: 84%|████████▍ | 688000/818627 [01:18<00:15, 8662.46 examples/s]
+Filter: 84%|████████▍ | 688000/818627 [01:18<00:15, 8640.83 examples/s]
+Filter: 84%|████████▍ | 689000/818627 [01:18<00:14, 8659.56 examples/s]
+Filter: 84%|████████▍ | 689000/818627 [01:18<00:14, 8657.40 examples/s]
+Filter: 84%|████████▍ | 689000/818627 [01:18<00:14, 8663.25 examples/s]
+Filter: 84%|████████▍ | 689000/818627 [01:18<00:14, 8654.92 examples/s]
+Filter: 84%|████████▍ | 689000/818627 [01:18<00:14, 8659.14 examples/s]
+Filter: 84%|████████▍ | 689000/818627 [01:18<00:14, 8659.90 examples/s]
+Filter: 84%|████████▍ | 689000/818627 [01:18<00:14, 8657.99 examples/s]
+Filter: 84%|████████▍ | 689000/818627 [01:18<00:14, 8658.52 examples/s]
+Filter: 84%|████████▍ | 690000/818627 [01:18<00:14, 8625.38 examples/s]
+Filter: 84%|████████▍ | 690000/818627 [01:18<00:14, 8635.79 examples/s]
+Filter: 84%|████████▍ | 690000/818627 [01:18<00:14, 8629.30 examples/s]
+Filter: 84%|████████▍ | 690000/818627 [01:18<00:14, 8631.81 examples/s]
+Filter: 84%|████████▍ | 690000/818627 [01:18<00:14, 8628.22 examples/s]
+Filter: 84%|████████▍ | 690000/818627 [01:18<00:14, 8625.18 examples/s]
+Filter: 84%|████████▍ | 690000/818627 [01:18<00:14, 8611.37 examples/s]
+Filter: 84%|████████▍ | 690000/818627 [01:18<00:14, 8625.16 examples/s]
+Filter: 84%|████████▍ | 691000/818627 [01:18<00:14, 8904.85 examples/s]
+Filter: 84%|████████▍ | 691000/818627 [01:18<00:14, 8912.24 examples/s]
+Filter: 84%|████████▍ | 691000/818627 [01:18<00:14, 8904.62 examples/s]
+Filter: 84%|████████▍ | 691000/818627 [01:18<00:14, 8905.94 examples/s]
+Filter: 84%|████████▍ | 691000/818627 [01:18<00:14, 8905.42 examples/s]
+Filter: 84%|████████▍ | 691000/818627 [01:18<00:14, 8906.54 examples/s]
+Filter: 84%|████████▍ | 691000/818627 [01:18<00:14, 8904.57 examples/s]
+Filter: 84%|████████▍ | 691000/818627 [01:18<00:14, 8846.56 examples/s]
+Filter: 85%|████████▍ | 692000/818627 [01:18<00:14, 8873.83 examples/s]
+Filter: 85%|████████▍ | 692000/818627 [01:18<00:14, 8867.22 examples/s]
+Filter: 85%|████████▍ | 692000/818627 [01:18<00:14, 8869.99 examples/s]
+Filter: 85%|████████▍ | 692000/818627 [01:18<00:14, 8869.62 examples/s]
+Filter: 85%|████████▍ | 692000/818627 [01:18<00:14, 8871.59 examples/s]
+Filter: 85%|████████▍ | 692000/818627 [01:18<00:14, 8885.22 examples/s]
+Filter: 85%|████████▍ | 692000/818627 [01:18<00:14, 8868.01 examples/s]
+Filter: 85%|████████▍ | 692000/818627 [01:18<00:14, 8865.53 examples/s]
+Filter: 85%|████████▍ | 693000/818627 [01:18<00:14, 8763.39 examples/s]
+Filter: 85%|████████▍ | 693000/818627 [01:18<00:14, 8764.74 examples/s]
+Filter: 85%|████████▍ | 693000/818627 [01:18<00:14, 8765.10 examples/s]
+Filter: 85%|████████▍ | 693000/818627 [01:18<00:14, 8761.99 examples/s]
+Filter: 85%|████████▍ | 693000/818627 [01:18<00:14, 8774.99 examples/s]
+Filter: 85%|████████▍ | 693000/818627 [01:18<00:14, 8763.12 examples/s]
+Filter: 85%|████████▍ | 693000/818627 [01:18<00:14, 8766.81 examples/s]
+Filter: 85%|████████▍ | 693000/818627 [01:18<00:14, 8760.71 examples/s]
+Filter: 85%|████████▍ | 694000/818627 [01:18<00:14, 8705.14 examples/s]
+Filter: 85%|████████▍ | 694000/818627 [01:18<00:14, 8700.63 examples/s]
+Filter: 85%|████████▍ | 694000/818627 [01:18<00:14, 8704.89 examples/s]
+Filter: 85%|████████▍ | 694000/818627 [01:19<00:14, 8701.10 examples/s]
+Filter: 85%|████████▍ | 694000/818627 [01:18<00:14, 8703.37 examples/s]
+Filter: 85%|████████▍ | 694000/818627 [01:18<00:14, 8710.48 examples/s]
+Filter: 85%|████████▍ | 694000/818627 [01:18<00:14, 8702.75 examples/s]
+Filter: 85%|████████▍ | 694000/818627 [01:18<00:14, 8648.61 examples/s]
+Filter: 85%|████████▍ | 695000/818627 [01:18<00:14, 8658.60 examples/s]
+Filter: 85%|████████▍ | 695000/818627 [01:18<00:14, 8660.65 examples/s]
+Filter: 85%|████████▍ | 695000/818627 [01:19<00:14, 8661.69 examples/s]
+Filter: 85%|████████▍ | 695000/818627 [01:18<00:14, 8654.71 examples/s]
+Filter: 85%|████████▍ | 695000/818627 [01:18<00:14, 8660.07 examples/s]
+Filter: 85%|████████▍ | 695000/818627 [01:18<00:14, 8662.30 examples/s]
+Filter: 85%|████████▍ | 695000/818627 [01:18<00:14, 8661.28 examples/s]
+Filter: 85%|████████▍ | 695000/818627 [01:18<00:14, 8670.68 examples/s]
+Filter: 85%|████████▌ | 696000/818627 [01:18<00:14, 8676.54 examples/s]
+Filter: 85%|████████▌ | 696000/818627 [01:18<00:14, 8675.76 examples/s]
+Filter: 85%|████████▌ | 696000/818627 [01:18<00:14, 8676.35 examples/s]
+Filter: 85%|████████▌ | 696000/818627 [01:19<00:14, 8674.18 examples/s]
+Filter: 85%|████████▌ | 696000/818627 [01:18<00:14, 8674.71 examples/s]
+Filter: 85%|████████▌ | 696000/818627 [01:19<00:14, 8679.79 examples/s]
+Filter: 85%|████████▌ | 696000/818627 [01:18<00:14, 8687.10 examples/s]
+Filter: 85%|████████▌ | 696000/818627 [01:18<00:14, 8673.74 examples/s]
+Filter: 85%|████████▌ | 697000/818627 [01:19<00:13, 8848.95 examples/s]
+Filter: 85%|████████▌ | 697000/818627 [01:19<00:13, 8846.64 examples/s]
+Filter: 85%|████████▌ | 697000/818627 [01:19<00:13, 8843.42 examples/s]
+Filter: 85%|████████▌ | 697000/818627 [01:19<00:13, 8846.10 examples/s]
+Filter: 85%|████████▌ | 697000/818627 [01:19<00:13, 8851.00 examples/s]
+Filter: 85%|████████▌ | 697000/818627 [01:19<00:13, 8856.15 examples/s]
+Filter: 85%|████████▌ | 697000/818627 [01:19<00:13, 8846.73 examples/s]
+Filter: 85%|████████▌ | 697000/818627 [01:19<00:13, 8848.68 examples/s]
+Filter: 85%|████████▌ | 698000/818627 [01:19<00:13, 9097.98 examples/s]
+Filter: 85%|████████▌ | 698000/818627 [01:19<00:13, 9096.88 examples/s]
+Filter: 85%|████████▌ | 698000/818627 [01:19<00:13, 9096.62 examples/s]
+Filter: 85%|████████▌ | 698000/818627 [01:19<00:13, 9093.53 examples/s]
+Filter: 85%|████████▌ | 698000/818627 [01:19<00:13, 9108.41 examples/s]
+Filter: 85%|████████▌ | 698000/818627 [01:19<00:13, 9102.25 examples/s]
+Filter: 85%|████████▌ | 698000/818627 [01:19<00:13, 9098.14 examples/s]
+Filter: 85%|████████▌ | 698000/818627 [01:19<00:13, 9098.93 examples/s]
+Filter: 85%|████████▌ | 699000/818627 [01:19<00:13, 8928.48 examples/s]
+Filter: 85%|████████▌ | 699000/818627 [01:19<00:13, 8930.53 examples/s]
+Filter: 85%|████████▌ | 699000/818627 [01:19<00:13, 8927.42 examples/s]
+Filter: 85%|████████▌ | 699000/818627 [01:19<00:13, 8927.37 examples/s]
+Filter: 85%|████████▌ | 699000/818627 [01:19<00:13, 8928.19 examples/s]
+Filter: 85%|████████▌ | 699000/818627 [01:19<00:13, 8925.40 examples/s]
+Filter: 85%|████████▌ | 699000/818627 [01:19<00:13, 8926.93 examples/s]
+Filter: 85%|████████▌ | 699000/818627 [01:19<00:13, 8922.49 examples/s]
+Filter: 86%|████████▌ | 700000/818627 [01:19<00:13, 8836.37 examples/s]
+Filter: 86%|████████▌ | 700000/818627 [01:19<00:13, 8838.39 examples/s]
+Filter: 86%|████████▌ | 700000/818627 [01:19<00:13, 8839.60 examples/s]
+Filter: 86%|████████▌ | 700000/818627 [01:19<00:13, 8837.40 examples/s]
+Filter: 86%|████████▌ | 700000/818627 [01:19<00:13, 8840.74 examples/s]
+Filter: 86%|████████▌ | 700000/818627 [01:19<00:13, 8841.42 examples/s]
+Filter: 86%|████████▌ | 700000/818627 [01:19<00:13, 8836.28 examples/s]
+Filter: 86%|████████▌ | 700000/818627 [01:19<00:13, 8839.31 examples/s]
+Filter: 86%|████████▌ | 701000/818627 [01:19<00:13, 8752.47 examples/s]
+Filter: 86%|████████▌ | 701000/818627 [01:19<00:13, 8753.06 examples/s]
+Filter: 86%|████████▌ | 701000/818627 [01:19<00:13, 8752.89 examples/s]
+Filter: 86%|████████▌ | 701000/818627 [01:19<00:13, 8748.72 examples/s]
+Filter: 86%|████████▌ | 701000/818627 [01:19<00:13, 8755.00 examples/s]
+Filter: 86%|████████▌ | 701000/818627 [01:19<00:13, 8752.12 examples/s]
+Filter: 86%|████████▌ | 701000/818627 [01:19<00:13, 8751.75 examples/s]
+Filter: 86%|████████▌ | 701000/818627 [01:19<00:13, 8753.98 examples/s]
+Filter: 86%|████████▌ | 702000/818627 [01:19<00:13, 8681.07 examples/s]
+Filter: 86%|████████▌ | 702000/818627 [01:19<00:13, 8687.56 examples/s]
+Filter: 86%|████████▌ | 702000/818627 [01:19<00:13, 8680.69 examples/s]
+Filter: 86%|████████▌ | 702000/818627 [01:19<00:13, 8685.55 examples/s]
+Filter: 86%|████████▌ | 702000/818627 [01:19<00:13, 8686.61 examples/s]
+Filter: 86%|████████▌ | 702000/818627 [01:19<00:13, 8682.51 examples/s]
+Filter: 86%|████████▌ | 702000/818627 [01:19<00:13, 8680.12 examples/s]
+Filter: 86%|████████▌ | 702000/818627 [01:19<00:13, 8668.47 examples/s]
+Filter: 86%|████████▌ | 703000/818627 [01:19<00:13, 8619.88 examples/s]
+Filter: 86%|████████▌ | 703000/818627 [01:19<00:13, 8618.49 examples/s]
+Filter: 86%|████████▌ | 703000/818627 [01:20<00:13, 8618.48 examples/s]
+Filter: 86%|████████▌ | 703000/818627 [01:19<00:13, 8622.54 examples/s]
+Filter: 86%|████████▌ | 703000/818627 [01:19<00:13, 8620.28 examples/s]
+Filter: 86%|████████▌ | 703000/818627 [01:19<00:13, 8616.67 examples/s]
+Filter: 86%|████████▌ | 703000/818627 [01:19<00:13, 8617.64 examples/s]
+Filter: 86%|████████▌ | 703000/818627 [01:19<00:13, 8618.76 examples/s]
+Filter: 86%|████████▌ | 704000/818627 [01:19<00:12, 8834.58 examples/s]
+Filter: 86%|████████▌ | 704000/818627 [01:19<00:12, 8830.65 examples/s]
+Filter: 86%|████████▌ | 704000/818627 [01:20<00:12, 8830.86 examples/s]
+Filter: 86%|████████▌ | 704000/818627 [01:19<00:12, 8836.24 examples/s]
+Filter: 86%|████████▌ | 704000/818627 [01:19<00:12, 8832.89 examples/s]
+Filter: 86%|████████▌ | 704000/818627 [01:19<00:12, 8831.38 examples/s]
+Filter: 86%|████████▌ | 704000/818627 [01:19<00:12, 8825.91 examples/s]
+Filter: 86%|████████▌ | 704000/818627 [01:19<00:13, 8705.35 examples/s]
+Filter: 86%|████████▌ | 705000/818627 [01:19<00:12, 8761.91 examples/s]
+Filter: 86%|████████▌ | 705000/818627 [01:19<00:12, 8761.85 examples/s]
+Filter: 86%|████████▌ | 705000/818627 [01:20<00:12, 8759.90 examples/s]
+Filter: 86%|████████▌ | 705000/818627 [01:19<00:12, 8763.13 examples/s]
+Filter: 86%|████████▌ | 705000/818627 [01:19<00:12, 8761.02 examples/s]
+Filter: 86%|████████▌ | 705000/818627 [01:20<00:12, 8759.99 examples/s]
+Filter: 86%|████████▌ | 705000/818627 [01:19<00:12, 8762.00 examples/s]
+Filter: 86%|████████▌ | 705000/818627 [01:19<00:12, 8797.09 examples/s]
+Filter: 86%|████████▌ | 706000/818627 [01:20<00:12, 8681.72 examples/s]
+Filter: 86%|████████▌ | 706000/818627 [01:20<00:12, 8686.49 examples/s]
+Filter: 86%|████████▌ | 706000/818627 [01:20<00:12, 8681.65 examples/s]
+Filter: 86%|████████▌ | 706000/818627 [01:20<00:12, 8674.38 examples/s]
+Filter: 86%|████████▌ | 706000/818627 [01:20<00:12, 8684.48 examples/s]
+Filter: 86%|████████▌ | 706000/818627 [01:20<00:12, 8678.95 examples/s]
+Filter: 86%|████████▌ | 706000/818627 [01:20<00:12, 8706.11 examples/s]
+Filter: 86%|████████▌ | 706000/818627 [01:20<00:12, 8673.44 examples/s]
+Filter: 86%|████████▋ | 707000/818627 [01:20<00:12, 8701.74 examples/s]
+Filter: 86%|████████▋ | 707000/818627 [01:20<00:12, 8704.08 examples/s]
+Filter: 86%|████████▋ | 707000/818627 [01:20<00:12, 8699.75 examples/s]
+Filter: 86%|████████▋ | 707000/818627 [01:20<00:12, 8697.11 examples/s]
+Filter: 86%|████████▋ | 707000/818627 [01:20<00:12, 8700.58 examples/s]
+Filter: 86%|████████▋ | 707000/818627 [01:20<00:12, 8699.16 examples/s]
+Filter: 86%|████████▋ | 707000/818627 [01:20<00:12, 8697.77 examples/s]
+Filter: 86%|████████▋ | 707000/818627 [01:20<00:12, 8718.74 examples/s]
+Filter: 86%|████████▋ | 708000/818627 [01:20<00:12, 8605.63 examples/s]
+Filter: 86%|████████▋ | 708000/818627 [01:20<00:12, 8610.53 examples/s]
+Filter: 86%|████████▋ | 708000/818627 [01:20<00:12, 8603.97 examples/s]
+Filter: 86%|████████▋ | 708000/818627 [01:20<00:12, 8608.31 examples/s]
+Filter: 86%|████████▋ | 708000/818627 [01:20<00:12, 8608.82 examples/s]
+Filter: 86%|████████▋ | 708000/818627 [01:20<00:12, 8604.44 examples/s]
+Filter: 86%|████████▋ | 708000/818627 [01:20<00:12, 8620.73 examples/s]
+Filter: 86%|████████▋ | 708000/818627 [01:20<00:12, 8529.98 examples/s]
+Filter: 87%|████████▋ | 709000/818627 [01:20<00:12, 8654.77 examples/s]
+Filter: 87%|████████▋ | 709000/818627 [01:20<00:12, 8655.05 examples/s]
+Filter: 87%|████████▋ | 709000/818627 [01:20<00:12, 8668.92 examples/s]
+Filter: 87%|████████▋ | 709000/818627 [01:20<00:12, 8647.32 examples/s]
+Filter: 87%|████████▋ | 709000/818627 [01:20<00:12, 8655.42 examples/s]
+Filter: 87%|████████▋ | 709000/818627 [01:20<00:12, 8655.89 examples/s]
+Filter: 87%|████████▋ | 709000/818627 [01:20<00:12, 8658.39 examples/s]
+Filter: 87%|████████▋ | 709000/818627 [01:20<00:12, 8630.73 examples/s]
+Filter: 87%|████████▋ | 710000/818627 [01:20<00:12, 8670.80 examples/s]
+Filter: 87%|████████▋ | 710000/818627 [01:20<00:12, 8651.98 examples/s]
+Filter: 87%|████████▋ | 710000/818627 [01:20<00:12, 8653.50 examples/s]
+Filter: 87%|████████▋ | 710000/818627 [01:20<00:12, 8653.81 examples/s]
+Filter: 87%|████████▋ | 710000/818627 [01:20<00:12, 8651.35 examples/s]
+Filter: 87%|████████▋ | 710000/818627 [01:20<00:12, 8656.33 examples/s]
+Filter: 87%|████████▋ | 710000/818627 [01:20<00:12, 8649.01 examples/s]
+Filter: 87%|████████▋ | 710000/818627 [01:20<00:12, 8654.48 examples/s]
+Filter: 87%|████████▋ | 711000/818627 [01:20<00:12, 8601.30 examples/s]
+Filter: 87%|████████▋ | 711000/818627 [01:20<00:12, 8609.73 examples/s]
+Filter: 87%|████████▋ | 711000/818627 [01:20<00:12, 8601.58 examples/s]
+Filter: 87%|████████▋ | 711000/818627 [01:20<00:12, 8598.14 examples/s]
+Filter: 87%|████████▋ | 711000/818627 [01:20<00:12, 8599.84 examples/s]
+Filter: 87%|████████▋ | 711000/818627 [01:20<00:12, 8598.28 examples/s]
+Filter: 87%|████████▋ | 711000/818627 [01:20<00:12, 8602.23 examples/s]
+Filter: 87%|████████▋ | 711000/818627 [01:20<00:12, 8603.36 examples/s]
+Filter: 87%|████████▋ | 712000/818627 [01:20<00:11, 8889.79 examples/s]
+Filter: 87%|████████▋ | 712000/818627 [01:20<00:12, 8881.93 examples/s]
+Filter: 87%|████████▋ | 712000/818627 [01:20<00:12, 8883.14 examples/s]
+Filter: 87%|████████▋ | 712000/818627 [01:21<00:12, 8881.35 examples/s]
+Filter: 87%|████████▋ | 712000/818627 [01:20<00:12, 8880.70 examples/s]
+Filter: 87%|████████▋ | 712000/818627 [01:20<00:12, 8882.72 examples/s]
+Filter: 87%|████████▋ | 712000/818627 [01:20<00:12, 8878.27 examples/s]
+Filter: 87%|████████▋ | 712000/818627 [01:20<00:12, 8885.20 examples/s]
+Filter: 87%|████████▋ | 713000/818627 [01:20<00:11, 8808.77 examples/s]
+Filter: 87%|████████▋ | 713000/818627 [01:20<00:11, 8813.40 examples/s]
+Filter: 87%|████████▋ | 713000/818627 [01:20<00:11, 8806.04 examples/s]
+Filter: 87%|████████▋ | 713000/818627 [01:21<00:12, 8801.73 examples/s]
+Filter: 87%|████████▋ | 713000/818627 [01:20<00:11, 8808.36 examples/s]
+Filter: 87%|████████▋ | 713000/818627 [01:20<00:11, 8808.30 examples/s]
+Filter: 87%|████████▋ | 713000/818627 [01:20<00:11, 8809.96 examples/s]
+Filter: 87%|████████▋ | 713000/818627 [01:20<00:11, 8810.35 examples/s]
+Filter: 87%|████████▋ | 714000/818627 [01:21<00:11, 8751.15 examples/s]
+Filter: 87%|████████▋ | 714000/818627 [01:20<00:11, 8755.07 examples/s]
+Filter: 87%|████████▋ | 714000/818627 [01:20<00:11, 8754.90 examples/s]
+Filter: 87%|████████▋ | 714000/818627 [01:21<00:11, 8756.06 examples/s]
+Filter: 87%|████████▋ | 714000/818627 [01:20<00:11, 8752.42 examples/s]
+Filter: 87%|████████▋ | 714000/818627 [01:20<00:11, 8754.28 examples/s]
+Filter: 87%|████████▋ | 714000/818627 [01:21<00:11, 8750.79 examples/s]
+Filter: 87%|████████▋ | 714000/818627 [01:20<00:11, 8754.36 examples/s]
+Filter: 87%|████████▋ | 715000/818627 [01:21<00:11, 8691.31 examples/s]
+Filter: 87%|████████▋ | 715000/818627 [01:21<00:11, 8686.39 examples/s]
+Filter: 87%|████████▋ | 715000/818627 [01:21<00:11, 8688.63 examples/s]
+Filter: 87%|████████▋ | 715000/818627 [01:21<00:11, 8686.35 examples/s]
+Filter: 87%|████████▋ | 715000/818627 [01:21<00:11, 8688.80 examples/s]
+Filter: 87%|████████▋ | 715000/818627 [01:21<00:11, 8687.81 examples/s]
+Filter: 87%|████████▋ | 715000/818627 [01:21<00:11, 8686.63 examples/s]
+Filter: 87%|████████▋ | 715000/818627 [01:21<00:11, 8688.68 examples/s]
+Filter: 87%|████████▋ | 716000/818627 [01:21<00:11, 8665.49 examples/s]
+Filter: 87%|████████▋ | 716000/818627 [01:21<00:11, 8660.59 examples/s]
+Filter: 87%|████████▋ | 716000/818627 [01:21<00:11, 8657.00 examples/s]
+Filter: 87%|████████▋ | 716000/818627 [01:21<00:11, 8654.47 examples/s]
+Filter: 87%|████████▋ | 716000/818627 [01:21<00:11, 8663.70 examples/s]
+Filter: 87%|████████▋ | 716000/818627 [01:21<00:11, 8662.04 examples/s]
+Filter: 87%|████████▋ | 716000/818627 [01:21<00:11, 8662.64 examples/s]
+Filter: 87%|████████▋ | 716000/818627 [01:21<00:11, 8648.33 examples/s]
+Filter: 88%|████████▊ | 717000/818627 [01:21<00:11, 8646.14 examples/s]
+Filter: 88%|████████▊ | 717000/818627 [01:21<00:11, 8643.96 examples/s]
+Filter: 88%|████████▊ | 717000/818627 [01:21<00:11, 8643.80 examples/s]
+Filter: 88%|████████▊ | 717000/818627 [01:21<00:11, 8637.58 examples/s]
+Filter: 88%|████████▊ | 717000/818627 [01:21<00:11, 8647.49 examples/s]
+Filter: 88%|████████▊ | 717000/818627 [01:21<00:11, 8644.96 examples/s]
+Filter: 88%|████████▊ | 717000/818627 [01:21<00:11, 8643.67 examples/s]
+Filter: 88%|████████▊ | 717000/818627 [01:21<00:11, 8650.59 examples/s]
+Filter: 88%|████████▊ | 718000/818627 [01:21<00:11, 8489.19 examples/s]
+Filter: 88%|████████▊ | 718000/818627 [01:21<00:11, 8485.19 examples/s]
+Filter: 88%|████████▊ | 718000/818627 [01:21<00:11, 8488.71 examples/s]
+Filter: 88%|████████▊ | 718000/818627 [01:21<00:11, 8486.84 examples/s]
+Filter: 88%|████████▊ | 718000/818627 [01:21<00:11, 8487.92 examples/s]
+Filter: 88%|████████▊ | 718000/818627 [01:21<00:11, 8492.15 examples/s]
+Filter: 88%|████████▊ | 718000/818627 [01:21<00:11, 8484.63 examples/s]
+Filter: 88%|████████▊ | 718000/818627 [01:21<00:11, 8482.08 examples/s]
+Filter: 88%|████████▊ | 719000/818627 [01:21<00:11, 8353.58 examples/s]
+Filter: 88%|████████▊ | 719000/818627 [01:21<00:11, 8354.88 examples/s]
+Filter: 88%|████████▊ | 719000/818627 [01:21<00:11, 8347.20 examples/s]
+Filter: 88%|████████▊ | 719000/818627 [01:21<00:11, 8352.90 examples/s]
+Filter: 88%|████████▊ | 719000/818627 [01:21<00:11, 8354.69 examples/s]
+Filter: 88%|████████▊ | 719000/818627 [01:21<00:11, 8358.28 examples/s]
+Filter: 88%|████████▊ | 719000/818627 [01:21<00:11, 8350.38 examples/s]
+Filter: 88%|████████▊ | 719000/818627 [01:21<00:11, 8349.04 examples/s]
+Filter: 88%|████████▊ | 720000/818627 [01:21<00:11, 8676.11 examples/s]
+Filter: 88%|████████▊ | 720000/818627 [01:21<00:11, 8678.58 examples/s]
+Filter: 88%|████████▊ | 720000/818627 [01:22<00:11, 8679.11 examples/s]
+Filter: 88%|████████▊ | 720000/818627 [01:21<00:11, 8679.94 examples/s]
+Filter: 88%|████████▊ | 720000/818627 [01:21<00:11, 8680.18 examples/s]
+Filter: 88%|████████▊ | 720000/818627 [01:21<00:11, 8679.38 examples/s]
+Filter: 88%|████████▊ | 720000/818627 [01:21<00:11, 8678.94 examples/s]
+Filter: 88%|████████▊ | 720000/818627 [01:21<00:11, 8676.36 examples/s]
+Filter: 88%|████████▊ | 721000/818627 [01:21<00:10, 8967.18 examples/s]
+Filter: 88%|████████▊ | 721000/818627 [01:21<00:10, 8970.19 examples/s]
+Filter: 88%|████████▊ | 721000/818627 [01:22<00:10, 8968.74 examples/s]
+Filter: 88%|████████▊ | 721000/818627 [01:21<00:10, 8969.47 examples/s]
+Filter: 88%|████████▊ | 721000/818627 [01:21<00:10, 8970.90 examples/s]
+Filter: 88%|████████▊ | 721000/818627 [01:21<00:10, 8967.49 examples/s]
+Filter: 88%|████████▊ | 721000/818627 [01:21<00:10, 8967.40 examples/s]
+Filter: 88%|████████▊ | 721000/818627 [01:21<00:10, 8961.98 examples/s]
+Filter: 88%|████████▊ | 722000/818627 [01:21<00:10, 8856.41 examples/s]
+Filter: 88%|████████▊ | 722000/818627 [01:21<00:10, 8856.85 examples/s]
+Filter: 88%|████████▊ | 722000/818627 [01:22<00:10, 8858.10 examples/s]
+Filter: 88%|████████▊ | 722000/818627 [01:21<00:10, 8855.03 examples/s]
+Filter: 88%|████████▊ | 722000/818627 [01:22<00:10, 8859.34 examples/s]
+Filter: 88%|████████▊ | 722000/818627 [01:21<00:10, 8856.41 examples/s]
+Filter: 88%|████████▊ | 722000/818627 [01:21<00:10, 8855.76 examples/s]
+Filter: 88%|████████▊ | 722000/818627 [01:21<00:10, 8859.99 examples/s]
+Filter: 88%|████████▊ | 723000/818627 [01:22<00:10, 8816.74 examples/s]
+Filter: 88%|████████▊ | 723000/818627 [01:22<00:10, 8812.68 examples/s]
+Filter: 88%|████████▊ | 723000/818627 [01:22<00:10, 8816.47 examples/s]
+Filter: 88%|████████▊ | 723000/818627 [01:22<00:10, 8811.52 examples/s]
+Filter: 88%|████████▊ | 723000/818627 [01:22<00:10, 8819.36 examples/s]
+Filter: 88%|████████▊ | 723000/818627 [01:22<00:10, 8817.54 examples/s]
+Filter: 88%|████████▊ | 723000/818627 [01:22<00:10, 8816.53 examples/s]
+Filter: 88%|████████▊ | 723000/818627 [01:22<00:10, 8815.51 examples/s]
+Filter: 88%|████████▊ | 724000/818627 [01:22<00:10, 8767.05 examples/s]
+Filter: 88%|████████▊ | 724000/818627 [01:22<00:10, 8763.91 examples/s]
+Filter: 88%|████████▊ | 724000/818627 [01:22<00:10, 8764.50 examples/s]
+Filter: 88%|████████▊ | 724000/818627 [01:22<00:10, 8764.02 examples/s]
+Filter: 88%|████████▊ | 724000/818627 [01:22<00:10, 8766.37 examples/s]
+Filter: 88%|████████▊ | 724000/818627 [01:22<00:10, 8765.63 examples/s]
+Filter: 88%|████████▊ | 724000/818627 [01:22<00:10, 8766.63 examples/s]
+Filter: 88%|████████▊ | 724000/818627 [01:22<00:10, 8760.90 examples/s]
+Filter: 89%|████████▊ | 725000/818627 [01:22<00:10, 8757.23 examples/s]
+Filter: 89%|████████▊ | 725000/818627 [01:22<00:10, 8754.30 examples/s]
+Filter: 89%|████████▊ | 725000/818627 [01:22<00:10, 8752.48 examples/s]
+Filter: 89%|████████▊ | 725000/818627 [01:22<00:10, 8757.73 examples/s]
+Filter: 89%|████████▊ | 725000/818627 [01:22<00:10, 8756.27 examples/s]
+Filter: 89%|████████▊ | 725000/818627 [01:22<00:10, 8753.88 examples/s]
+Filter: 89%|████████▊ | 725000/818627 [01:22<00:10, 8753.95 examples/s]
+Filter: 89%|████████▊ | 725000/818627 [01:22<00:10, 8739.23 examples/s]
+Filter: 89%|████████▊ | 726000/818627 [01:22<00:10, 8946.97 examples/s]
+Filter: 89%|████████▊ | 726000/818627 [01:22<00:10, 8955.68 examples/s]
+Filter: 89%|████████▊ | 726000/818627 [01:22<00:10, 8948.68 examples/s]
+Filter: 89%|████████▊ | 726000/818627 [01:22<00:10, 8957.90 examples/s]
+Filter: 89%|████████▊ | 726000/818627 [01:22<00:10, 8954.32 examples/s]
+Filter: 89%|████████▊ | 726000/818627 [01:22<00:10, 8954.63 examples/s]
+Filter: 89%|████████▊ | 726000/818627 [01:22<00:10, 8949.09 examples/s]
+Filter: 89%|████████▊ | 726000/818627 [01:22<00:10, 8946.76 examples/s]
+Filter: 89%|████████▉ | 727000/818627 [01:22<00:10, 8867.00 examples/s]
+Filter: 89%|████████▉ | 727000/818627 [01:22<00:10, 8869.77 examples/s]
+Filter: 89%|████████▉ | 727000/818627 [01:22<00:10, 8871.85 examples/s]
+Filter: 89%|████████▉ | 727000/818627 [01:22<00:10, 8867.22 examples/s]
+Filter: 89%|████████▉ | 727000/818627 [01:22<00:10, 8868.51 examples/s]
+Filter: 89%|████████▉ | 727000/818627 [01:22<00:10, 8868.19 examples/s]
+Filter: 89%|████████▉ | 727000/818627 [01:22<00:10, 8865.27 examples/s]
+Filter: 89%|████████▉ | 727000/818627 [01:22<00:10, 8869.67 examples/s]
+Filter: 89%|████████▉ | 728000/818627 [01:22<00:10, 8824.14 examples/s]
+Filter: 89%|████████▉ | 728000/818627 [01:22<00:10, 8822.28 examples/s]
+Filter: 89%|████████▉ | 728000/818627 [01:22<00:10, 8821.81 examples/s]
+Filter: 89%|████████▉ | 728000/818627 [01:22<00:10, 8823.83 examples/s]
+Filter: 89%|████████▉ | 728000/818627 [01:22<00:10, 8821.69 examples/s]
+Filter: 89%|████████▉ | 728000/818627 [01:22<00:10, 8821.90 examples/s]
+Filter: 89%|████████▉ | 728000/818627 [01:22<00:10, 8820.71 examples/s]
+Filter: 89%|████████▉ | 728000/818627 [01:22<00:10, 8820.38 examples/s]
+Filter: 89%|████████▉ | 729000/818627 [01:22<00:10, 8776.20 examples/s]
+Filter: 89%|████████▉ | 729000/818627 [01:22<00:10, 8776.39 examples/s]
+Filter: 89%|████████▉ | 729000/818627 [01:23<00:10, 8777.23 examples/s]
+Filter: 89%|████████▉ | 729000/818627 [01:22<00:10, 8778.37 examples/s]
+Filter: 89%|████████▉ | 729000/818627 [01:22<00:10, 8776.35 examples/s]
+Filter: 89%|████████▉ | 729000/818627 [01:22<00:10, 8776.45 examples/s]
+Filter: 89%|████████▉ | 729000/818627 [01:22<00:10, 8777.48 examples/s]
+Filter: 89%|████████▉ | 729000/818627 [01:22<00:10, 8773.26 examples/s]
+Filter: 89%|████████▉ | 730000/818627 [01:22<00:10, 8756.27 examples/s]
+Filter: 89%|████████▉ | 730000/818627 [01:22<00:10, 8757.25 examples/s]
+Filter: 89%|████████▉ | 730000/818627 [01:22<00:10, 8757.85 examples/s]
+Filter: 89%|████████▉ | 730000/818627 [01:23<00:10, 8756.32 examples/s]
+Filter: 89%|████████▉ | 730000/818627 [01:22<00:10, 8757.66 examples/s]
+Filter: 89%|████████▉ | 730000/818627 [01:22<00:10, 8756.68 examples/s]
+Filter: 89%|████████▉ | 730000/818627 [01:22<00:10, 8756.27 examples/s]
+Filter: 89%|████████▉ | 730000/818627 [01:22<00:10, 8758.30 examples/s]
+Filter: 89%|████████▉ | 731000/818627 [01:22<00:10, 8727.93 examples/s]
+Filter: 89%|████████▉ | 731000/818627 [01:22<00:10, 8726.35 examples/s]
+Filter: 89%|████████▉ | 731000/818627 [01:23<00:10, 8727.00 examples/s]
+Filter: 89%|████████▉ | 731000/818627 [01:22<00:10, 8728.00 examples/s]
+Filter: 89%|████████▉ | 731000/818627 [01:22<00:10, 8719.34 examples/s]
+Filter: 89%|████████▉ | 731000/818627 [01:22<00:10, 8723.07 examples/s]
+Filter: 89%|████████▉ | 731000/818627 [01:22<00:10, 8728.77 examples/s]
+Filter: 89%|████████▉ | 731000/818627 [01:23<00:10, 8723.04 examples/s]
+Filter: 89%|████████▉ | 732000/818627 [01:23<00:09, 8700.84 examples/s]
+Filter: 89%|████████▉ | 732000/818627 [01:23<00:09, 8708.52 examples/s]
+Filter: 89%|████████▉ | 732000/818627 [01:23<00:09, 8699.87 examples/s]
+Filter: 89%|████████▉ | 732000/818627 [01:23<00:09, 8701.79 examples/s]
+Filter: 89%|████████▉ | 732000/818627 [01:23<00:09, 8704.14 examples/s]
+Filter: 89%|████████▉ | 732000/818627 [01:23<00:09, 8704.62 examples/s]
+Filter: 89%|████████▉ | 732000/818627 [01:23<00:09, 8705.29 examples/s]
+Filter: 89%|████████▉ | 732000/818627 [01:23<00:10, 8543.93 examples/s]
+Filter: 90%|████████▉ | 733000/818627 [01:23<00:09, 8917.27 examples/s]
+Filter: 90%|████████▉ | 733000/818627 [01:23<00:09, 8917.50 examples/s]
+Filter: 90%|████████▉ | 733000/818627 [01:23<00:09, 8915.21 examples/s]
+Filter: 90%|████████▉ | 733000/818627 [01:23<00:09, 8915.81 examples/s]
+Filter: 90%|████████▉ | 733000/818627 [01:23<00:09, 8915.55 examples/s]
+Filter: 90%|████████▉ | 733000/818627 [01:23<00:09, 8913.30 examples/s]
+Filter: 90%|████████▉ | 733000/818627 [01:23<00:09, 8755.97 examples/s]
+Filter: 90%|████████▉ | 734000/818627 [01:23<00:09, 9118.79 examples/s]
+Filter: 90%|████████▉ | 734000/818627 [01:23<00:09, 9116.17 examples/s]
+Filter: 90%|████████▉ | 734000/818627 [01:23<00:09, 9116.03 examples/s]
+Filter: 90%|████████▉ | 734000/818627 [01:23<00:09, 9108.52 examples/s]
+Filter: 90%|████████▉ | 734000/818627 [01:23<00:09, 9114.65 examples/s]
+Filter: 90%|████████▉ | 734000/818627 [01:23<00:09, 9116.22 examples/s]
+Filter: 90%|████████▉ | 734000/818627 [01:23<00:09, 9098.02 examples/s]
+Filter: 90%|████████▉ | 735000/818627 [01:23<00:08, 9363.53 examples/s]
+Filter: 90%|████████▉ | 736000/818627 [01:23<00:08, 9313.56 examples/s]
+Filter: 90%|████████▉ | 736000/818627 [01:23<00:08, 9288.12 examples/s]
+Filter: 90%|████████▉ | 736000/818627 [01:23<00:08, 9314.51 examples/s]
+Filter: 90%|████████▉ | 736000/818627 [01:23<00:08, 9316.28 examples/s]
+Filter: 90%|████████▉ | 736000/818627 [01:23<00:08, 9305.32 examples/s]
+Filter: 90%|████████▉ | 736000/818627 [01:23<00:08, 9312.37 examples/s]
+Filter: 90%|████████▉ | 736000/818627 [01:23<00:08, 9279.79 examples/s]
+Filter: 90%|████████▉ | 736000/818627 [01:23<00:08, 9311.27 examples/s]
+Filter: 90%|█████████ | 737000/818627 [01:23<00:08, 9162.04 examples/s]
+Filter: 90%|█████████ | 737000/818627 [01:23<00:08, 9139.05 examples/s]
+Filter: 90%|█████████ | 737000/818627 [01:23<00:08, 9168.34 examples/s]
+Filter: 90%|█████████ | 737000/818627 [01:23<00:08, 9163.05 examples/s]
+Filter: 90%|█████████ | 737000/818627 [01:23<00:08, 9155.50 examples/s]
+Filter: 90%|█████████ | 737000/818627 [01:23<00:08, 9162.75 examples/s]
+Filter: 90%|█████████ | 737000/818627 [01:23<00:08, 9162.92 examples/s]
+Filter: 90%|█████████ | 737000/818627 [01:23<00:08, 9121.41 examples/s]
+Filter: 90%|█████████ | 738000/818627 [01:23<00:08, 8997.26 examples/s]
+Filter: 90%|█████████ | 738000/818627 [01:24<00:08, 9017.09 examples/s]
+Filter: 90%|█████████ | 738000/818627 [01:23<00:08, 8974.86 examples/s]
+Filter: 90%|█████████ | 738000/818627 [01:23<00:08, 9003.56 examples/s]
+Filter: 90%|█████████ | 738000/818627 [01:23<00:08, 9001.28 examples/s]
+Filter: 90%|█████████ | 738000/818627 [01:23<00:08, 8996.76 examples/s]
+Filter: 90%|█████████ | 738000/818627 [01:23<00:08, 9003.13 examples/s]
+Filter: 90%|█████████ | 738000/818627 [01:23<00:08, 8998.02 examples/s]
+Filter: 90%|█████████ | 739000/818627 [01:23<00:08, 8928.35 examples/s]
+Filter: 90%|█████████ | 739000/818627 [01:23<00:08, 8909.34 examples/s]
+Filter: 90%|█████████ | 739000/818627 [01:24<00:08, 8938.75 examples/s]
+Filter: 90%|█████████ | 739000/818627 [01:23<00:08, 8929.19 examples/s]
+Filter: 90%|█████████ | 739000/818627 [01:23<00:08, 8939.34 examples/s]
+Filter: 90%|█████████ | 739000/818627 [01:23<00:08, 8929.07 examples/s]
+Filter: 90%|█████████ | 739000/818627 [01:23<00:08, 8926.04 examples/s]
+Filter: 90%|█████████ | 739000/818627 [01:23<00:08, 8928.86 examples/s]
+Filter: 90%|█████████ | 740000/818627 [01:23<00:08, 9074.82 examples/s]
+Filter: 90%|█████████ | 740000/818627 [01:23<00:08, 9060.36 examples/s]
+Filter: 90%|█████████ | 740000/818627 [01:24<00:08, 9080.60 examples/s]
+Filter: 90%|█████████ | 740000/818627 [01:23<00:08, 9075.06 examples/s]
+Filter: 90%|█████████ | 740000/818627 [01:23<00:08, 9077.00 examples/s]
+Filter: 90%|█████████ | 740000/818627 [01:23<00:08, 9076.91 examples/s]
+Filter: 90%|█████████ | 740000/818627 [01:24<00:08, 9074.01 examples/s]
+Filter: 90%|█████████ | 740000/818627 [01:23<00:08, 9076.68 examples/s]
+Filter: 91%|█████████ | 741000/818627 [01:24<00:08, 9268.63 examples/s]
+Filter: 91%|█████████ | 741000/818627 [01:24<00:08, 9263.37 examples/s]
+Filter: 91%|█████████ | 741000/818627 [01:24<00:08, 9269.35 examples/s]
+Filter: 91%|█████████ | 741000/818627 [01:24<00:08, 9273.92 examples/s]
+Filter: 91%|█████████ | 741000/818627 [01:24<00:08, 9269.16 examples/s]
+Filter: 91%|█████████ | 741000/818627 [01:24<00:08, 9268.05 examples/s]
+Filter: 91%|█████████ | 741000/818627 [01:24<00:08, 9261.72 examples/s]
+Filter: 91%|█████████ | 741000/818627 [01:24<00:08, 9269.94 examples/s]
+Filter: 91%|█████████ | 743000/818627 [01:24<00:08, 9384.21 examples/s]
+Filter: 91%|█████████ | 743000/818627 [01:24<00:08, 9383.93 examples/s]
+Filter: 91%|█████████ | 743000/818627 [01:24<00:08, 9385.05 examples/s]
+Filter: 91%|█████████ | 743000/818627 [01:24<00:08, 9379.03 examples/s]
+Filter: 91%|█████████ | 743000/818627 [01:24<00:08, 9380.66 examples/s]
+Filter: 91%|█████████ | 743000/818627 [01:24<00:08, 9376.09 examples/s]
+Filter: 91%|█████████ | 743000/818627 [01:24<00:08, 9379.08 examples/s]
+Filter: 91%|█████████ | 743000/818627 [01:24<00:08, 9382.40 examples/s]
+Filter: 91%|█████████ | 744000/818627 [01:24<00:08, 9195.41 examples/s]
+Filter: 91%|█████████ | 744000/818627 [01:24<00:08, 9193.91 examples/s]
+Filter: 91%|█████████ | 744000/818627 [01:24<00:08, 9198.64 examples/s]
+Filter: 91%|█████████ | 744000/818627 [01:24<00:08, 9197.95 examples/s]
+Filter: 91%|█████████ | 744000/818627 [01:24<00:08, 9198.43 examples/s]
+Filter: 91%|█████████ | 744000/818627 [01:24<00:08, 9197.81 examples/s]
+Filter: 91%|█████████ | 744000/818627 [01:24<00:08, 9194.87 examples/s]
+Filter: 91%|█████████ | 744000/818627 [01:24<00:08, 9192.07 examples/s]
+Filter: 91%|█████████ | 745000/818627 [01:24<00:08, 9034.87 examples/s]
+Filter: 91%|█████████ | 745000/818627 [01:24<00:08, 9030.98 examples/s]
+Filter: 91%|█████████ | 745000/818627 [01:24<00:08, 9033.90 examples/s]
+Filter: 91%|█████████ | 745000/818627 [01:24<00:08, 9036.08 examples/s]
+Filter: 91%|█████████ | 745000/818627 [01:24<00:08, 9036.16 examples/s]
+Filter: 91%|█████████ | 745000/818627 [01:24<00:08, 9032.30 examples/s]
+Filter: 91%|█████████ | 745000/818627 [01:24<00:08, 9033.54 examples/s]
+Filter: 91%|█████████ | 745000/818627 [01:24<00:08, 8888.99 examples/s]
+Filter: 91%|█████████ | 746000/818627 [01:24<00:08, 8962.59 examples/s]
+Filter: 91%|█████████ | 746000/818627 [01:24<00:08, 8958.57 examples/s]
+Filter: 91%|█████████ | 746000/818627 [01:24<00:08, 8965.10 examples/s]
+Filter: 91%|█████████ | 746000/818627 [01:24<00:08, 9008.94 examples/s]
+Filter: 91%|█████████ | 746000/818627 [01:24<00:08, 8963.93 examples/s]
+Filter: 91%|█████████ | 746000/818627 [01:24<00:08, 8963.71 examples/s]
+Filter: 91%|█████████ | 746000/818627 [01:24<00:08, 8961.44 examples/s]
+Filter: 91%|█████████ | 746000/818627 [01:24<00:08, 8961.21 examples/s]
+Filter: 91%|█████████▏| 747000/818627 [01:24<00:07, 9096.78 examples/s]
+Filter: 91%|█████████▏| 747000/818627 [01:24<00:07, 9095.84 examples/s]
+Filter: 91%|█████████▏| 747000/818627 [01:24<00:07, 9131.62 examples/s]
+Filter: 91%|█████████▏| 747000/818627 [01:25<00:07, 9097.47 examples/s]
+Filter: 91%|█████████▏| 747000/818627 [01:24<00:07, 9094.65 examples/s]
+Filter: 91%|█████████▏| 747000/818627 [01:24<00:07, 9093.98 examples/s]
+Filter: 91%|█████████▏| 747000/818627 [01:24<00:07, 9093.61 examples/s]
+Filter: 91%|█████████▏| 747000/818627 [01:24<00:07, 9089.84 examples/s]
+Filter: 91%|█████████▏| 748000/818627 [01:24<00:07, 9287.11 examples/s]
+Filter: 91%|█████████▏| 748000/818627 [01:25<00:07, 9289.70 examples/s]
+Filter: 91%|█████████▏| 748000/818627 [01:24<00:07, 9313.38 examples/s]
+Filter: 91%|█████████▏| 748000/818627 [01:24<00:07, 9283.78 examples/s]
+Filter: 91%|█████████▏| 748000/818627 [01:24<00:07, 9289.32 examples/s]
+Filter: 91%|█████████▏| 748000/818627 [01:24<00:07, 9288.29 examples/s]
+Filter: 91%|█████████▏| 748000/818627 [01:24<00:07, 9288.68 examples/s]
+Filter: 91%|█████████▏| 748000/818627 [01:24<00:07, 9289.04 examples/s]
+Filter: 91%|█████████▏| 749000/818627 [01:24<00:07, 9500.36 examples/s]
+Filter: 91%|█████████▏| 749000/818627 [01:25<00:07, 9478.84 examples/s]
+Filter: 91%|█████████▏| 749000/818627 [01:24<00:07, 9480.92 examples/s]
+Filter: 91%|█████████▏| 749000/818627 [01:24<00:07, 9481.31 examples/s]
+Filter: 91%|█████████▏| 749000/818627 [01:24<00:07, 9397.05 examples/s]
+Filter: 91%|█████████▏| 749000/818627 [01:25<00:07, 9273.48 examples/s]
+Filter: 92%|█████████▏| 750000/818627 [01:25<00:07, 9408.27 examples/s]
+Filter: 92%|█████████▏| 750000/818627 [01:25<00:07, 9410.13 examples/s]
+Filter: 92%|█████████▏| 750000/818627 [01:25<00:07, 9391.12 examples/s]
+Filter: 92%|█████████▏| 750000/818627 [01:25<00:07, 9402.59 examples/s]
+Filter: 92%|█████████▏| 750000/818627 [01:24<00:07, 9413.05 examples/s]
+Filter: 92%|█████████▏| 750000/818627 [01:25<00:07, 9450.33 examples/s]
+Filter: 92%|█████████▏| 750000/818627 [01:24<00:07, 9386.52 examples/s]
+Filter: 92%|█████████▏| 750000/818627 [01:25<00:07, 9382.66 examples/s]
+Filter: 92%|█████████▏| 751000/818627 [01:25<00:07, 9231.47 examples/s]
+Filter: 92%|█████████▏| 751000/818627 [01:25<00:07, 9234.43 examples/s]
+Filter: 92%|█████████▏| 751000/818627 [01:25<00:07, 9188.59 examples/s]
+Filter: 92%|█████████▏| 751000/818627 [01:25<00:07, 9175.15 examples/s]
+Filter: 92%|█████████▏| 751000/818627 [01:25<00:07, 9224.22 examples/s]
+Filter: 92%|█████████▏| 751000/818627 [01:25<00:07, 9197.69 examples/s]
+Filter: 92%|█████████▏| 751000/818627 [01:25<00:07, 9184.40 examples/s]
+Filter: 92%|█████████▏| 751000/818627 [01:25<00:07, 9180.45 examples/s]
+Filter: 92%|█████████▏| 752000/818627 [01:25<00:07, 9096.55 examples/s]
+Filter: 92%|█████████▏| 752000/818627 [01:25<00:07, 9045.12 examples/s]
+Filter: 92%|█████████▏| 752000/818627 [01:25<00:07, 9047.96 examples/s]
+Filter: 92%|█████████▏| 752000/818627 [01:25<00:07, 9040.95 examples/s]
+Filter: 92%|█████████▏| 752000/818627 [01:25<00:07, 9066.12 examples/s]
+Filter: 92%|█████████▏| 752000/818627 [01:25<00:07, 9077.31 examples/s]
+Filter: 92%|█████████▏| 752000/818627 [01:25<00:07, 9036.83 examples/s]
+Filter: 92%|█████████▏| 752000/818627 [01:25<00:07, 8878.17 examples/s]
+Filter: 92%|█████████▏| 753000/818627 [01:25<00:07, 8972.51 examples/s]
+Filter: 92%|█████████▏| 753000/818627 [01:25<00:07, 8966.46 examples/s]
+Filter: 92%|█████████▏| 753000/818627 [01:25<00:07, 8915.36 examples/s]
+Filter: 92%|█████████▏| 753000/818627 [01:25<00:07, 8917.89 examples/s]
+Filter: 92%|█████████▏| 753000/818627 [01:25<00:07, 8912.96 examples/s]
+Filter: 92%|█████████▏| 753000/818627 [01:25<00:07, 8932.09 examples/s]
+Filter: 92%|█████████▏| 753000/818627 [01:25<00:07, 8970.33 examples/s]
+Filter: 92%|█████████▏| 753000/818627 [01:25<00:07, 8910.91 examples/s]
+Filter: 92%|█████████▏| 754000/818627 [01:25<00:07, 9103.12 examples/s]
+Filter: 92%|█████████▏| 754000/818627 [01:25<00:07, 9099.47 examples/s]
+Filter: 92%|█████████▏| 754000/818627 [01:25<00:07, 9073.17 examples/s]
+Filter: 92%|█████████▏| 754000/818627 [01:25<00:07, 9074.19 examples/s]
+Filter: 92%|█████████▏| 754000/818627 [01:25<00:07, 9088.39 examples/s]
+Filter: 92%|█████████▏| 754000/818627 [01:25<00:07, 9116.46 examples/s]
+Filter: 92%|█████████▏| 754000/818627 [01:25<00:07, 9070.37 examples/s]
+Filter: 92%|█████████▏| 754000/818627 [01:25<00:07, 9073.52 examples/s]
+Filter: 92%|█████████▏| 755000/818627 [01:25<00:06, 9254.49 examples/s]
+Filter: 92%|█████████▏| 755000/818627 [01:25<00:06, 9251.64 examples/s]
+Filter: 92%|█████████▏| 755000/818627 [01:25<00:06, 9239.27 examples/s]
+Filter: 92%|█████████▏| 755000/818627 [01:25<00:06, 9233.95 examples/s]
+Filter: 92%|█████████▏| 755000/818627 [01:25<00:06, 9241.21 examples/s]
+Filter: 92%|█████████▏| 755000/818627 [01:25<00:06, 9249.71 examples/s]
+Filter: 92%|█████████▏| 755000/818627 [01:25<00:06, 9269.11 examples/s]
+Filter: 92%|█████████▏| 755000/818627 [01:25<00:06, 9242.02 examples/s]
+Filter: 92%|█████████▏| 756000/818627 [01:25<00:06, 9404.89 examples/s]
+Filter: 92%|█████████▏| 756000/818627 [01:25<00:06, 9401.22 examples/s]
+Filter: 92%|█████████▏| 756000/818627 [01:25<00:06, 9398.66 examples/s]
+Filter: 92%|█████████▏| 756000/818627 [01:25<00:06, 9400.67 examples/s]
+Filter: 92%|█████████▏| 756000/818627 [01:25<00:06, 9409.62 examples/s]
+Filter: 92%|█████████▏| 756000/818627 [01:25<00:06, 9424.30 examples/s]
+Filter: 92%|█████████▏| 756000/818627 [01:25<00:06, 9401.95 examples/s]
+Filter: 92%|█████████▏| 756000/818627 [01:25<00:06, 9398.07 examples/s]
+Filter: 92%|█████████▏| 757000/818627 [01:25<00:06, 9338.25 examples/s]
+Filter: 92%|█████████▏| 757000/818627 [01:25<00:06, 9337.12 examples/s]
+Filter: 92%|█████████▏| 757000/818627 [01:25<00:06, 9338.38 examples/s]
+Filter: 92%|█████████▏| 757000/818627 [01:26<00:06, 9334.35 examples/s]
+Filter: 92%|█████████▏| 757000/818627 [01:25<00:06, 9353.21 examples/s]
+Filter: 92%|█████████▏| 757000/818627 [01:25<00:06, 9335.46 examples/s]
+Filter: 92%|█████████▏| 757000/818627 [01:25<00:06, 9339.11 examples/s]
+Filter: 92%|█████████▏| 757000/818627 [01:25<00:06, 9248.29 examples/s]
+Filter: 93%|█████████▎| 758000/818627 [01:25<00:06, 9139.73 examples/s]
+Filter: 93%|█████████▎| 758000/818627 [01:25<00:06, 9140.62 examples/s]
+Filter: 93%|█████████▎| 758000/818627 [01:26<00:06, 9132.05 examples/s]
+Filter: 93%|█████████▎| 758000/818627 [01:25<00:06, 9133.11 examples/s]
+Filter: 93%|█████████▎| 758000/818627 [01:25<00:06, 9138.26 examples/s]
+Filter: 93%|█████████▎| 758000/818627 [01:25<00:06, 9144.22 examples/s]
+Filter: 93%|█████████▎| 758000/818627 [01:25<00:06, 9132.81 examples/s]
+Filter: 93%|█████████▎| 758000/818627 [01:25<00:06, 9157.95 examples/s]
+Filter: 93%|█████████▎| 759000/818627 [01:26<00:06, 8994.11 examples/s]
+Filter: 93%|█████████▎| 759000/818627 [01:26<00:06, 8991.55 examples/s]
+Filter: 93%|█████████▎| 759000/818627 [01:25<00:06, 8979.60 examples/s]
+Filter: 93%|█████████▎| 759000/818627 [01:25<00:06, 8994.01 examples/s]
+Filter: 93%|█████████▎| 759000/818627 [01:26<00:06, 8975.65 examples/s]
+Filter: 93%|█████████▎| 759000/818627 [01:25<00:06, 9000.76 examples/s]
+Filter: 93%|█████████▎| 759000/818627 [01:26<00:06, 8976.12 examples/s]
+Filter: 93%|█████████▎| 759000/818627 [01:25<00:06, 8952.53 examples/s]
+Filter: 93%|█████████▎| 760000/818627 [01:26<00:06, 8882.93 examples/s]
+Filter: 93%|█████████▎| 760000/818627 [01:26<00:06, 8873.89 examples/s]
+Filter: 93%|█████████▎| 760000/818627 [01:26<00:06, 8878.17 examples/s]
+Filter: 93%|█████████▎| 760000/818627 [01:26<00:06, 8870.90 examples/s]
+Filter: 93%|█████████▎| 760000/818627 [01:26<00:06, 8880.13 examples/s]
+Filter: 93%|█████████▎| 760000/818627 [01:26<00:06, 8884.88 examples/s]
+Filter: 93%|█████████▎| 760000/818627 [01:26<00:06, 8878.32 examples/s]
+Filter: 93%|█████████▎| 760000/818627 [01:26<00:06, 8886.97 examples/s]
+Filter: 93%|█████████▎| 761000/818627 [01:26<00:06, 9043.69 examples/s]
+Filter: 93%|█████████▎| 761000/818627 [01:26<00:06, 9042.67 examples/s]
+Filter: 93%|█████████▎| 761000/818627 [01:26<00:06, 9041.32 examples/s]
+Filter: 93%|█████████▎| 761000/818627 [01:26<00:06, 9036.22 examples/s]
+Filter: 93%|█████████▎| 761000/818627 [01:26<00:06, 9042.47 examples/s]
+Filter: 93%|█████████▎| 761000/818627 [01:26<00:06, 9042.11 examples/s]
+Filter: 93%|█████████▎| 761000/818627 [01:26<00:06, 9046.77 examples/s]
+Filter: 93%|█████████▎| 761000/818627 [01:26<00:06, 9034.54 examples/s]
+Filter: 93%|█████████▎| 762000/818627 [01:26<00:06, 9233.84 examples/s]
+Filter: 93%|█████████▎| 762000/818627 [01:26<00:06, 9238.02 examples/s]
+Filter: 93%|█████████▎| 762000/818627 [01:26<00:06, 9234.92 examples/s]
+Filter: 93%|█████████▎| 762000/818627 [01:26<00:06, 9227.79 examples/s]
+Filter: 93%|█████████▎| 762000/818627 [01:26<00:06, 9237.69 examples/s]
+Filter: 93%|█████████▎| 762000/818627 [01:26<00:06, 9237.55 examples/s]
+Filter: 93%|█████████▎| 762000/818627 [01:26<00:06, 9240.03 examples/s]
+Filter: 93%|█████████▎| 762000/818627 [01:26<00:06, 9238.07 examples/s]
+Filter: 93%|█████████▎| 763000/818627 [01:26<00:05, 9445.67 examples/s]
+Filter: 93%|█████████▎| 764000/818627 [01:26<00:05, 9401.32 examples/s]
+Filter: 93%|█████████▎| 764000/818627 [01:26<00:05, 9403.08 examples/s]
+Filter: 93%|█████████▎| 764000/818627 [01:26<00:05, 9401.45 examples/s]
+Filter: 93%|█████████▎| 764000/818627 [01:26<00:05, 9397.81 examples/s]
+Filter: 93%|█████████▎| 764000/818627 [01:26<00:05, 9400.43 examples/s]
+Filter: 93%|█████████▎| 764000/818627 [01:26<00:05, 9387.22 examples/s]
+Filter: 93%|█████████▎| 764000/818627 [01:26<00:05, 9404.93 examples/s]
+Filter: 93%|█████████▎| 764000/818627 [01:26<00:05, 9406.51 examples/s]
+Filter: 93%|█████████▎| 765000/818627 [01:26<00:05, 9208.38 examples/s]
+Filter: 93%|█████████▎| 765000/818627 [01:26<00:05, 9205.62 examples/s]
+Filter: 93%|█████████▎| 765000/818627 [01:26<00:05, 9207.01 examples/s]
+Filter: 93%|█████████▎| 765000/818627 [01:26<00:05, 9212.11 examples/s]
+Filter: 93%|█████████▎| 765000/818627 [01:26<00:05, 9199.47 examples/s]
+Filter: 93%|█████████▎| 765000/818627 [01:26<00:05, 9207.33 examples/s]
+Filter: 93%|█████████▎| 765000/818627 [01:26<00:05, 9158.47 examples/s]
+Filter: 93%|█████████▎| 765000/818627 [01:26<00:05, 9209.71 examples/s]
+Filter: 94%|█████████▎| 766000/818627 [01:26<00:05, 9062.81 examples/s]
+Filter: 94%|█████████▎| 766000/818627 [01:26<00:05, 9060.26 examples/s]
+Filter: 94%|█████████▎| 766000/818627 [01:26<00:05, 9062.89 examples/s]
+Filter: 94%|█████████▎| 766000/818627 [01:27<00:05, 9063.50 examples/s]
+Filter: 94%|█████████▎| 766000/818627 [01:26<00:05, 9008.91 examples/s]
+Filter: 94%|█████████▎| 766000/818627 [01:26<00:05, 9063.32 examples/s]
+Filter: 94%|█████████▎| 766000/818627 [01:26<00:05, 9064.41 examples/s]
+Filter: 94%|█████████▎| 766000/818627 [01:26<00:05, 9053.70 examples/s]
+Filter: 94%|█████████▎| 767000/818627 [01:26<00:05, 8946.81 examples/s]
+Filter: 94%|█████████▎| 767000/818627 [01:26<00:05, 8945.06 examples/s]
+Filter: 94%|█████████▎| 767000/818627 [01:27<00:05, 8947.09 examples/s]
+Filter: 94%|█████████▎| 767000/818627 [01:26<00:05, 8939.06 examples/s]
+Filter: 94%|█████████▎| 767000/818627 [01:26<00:05, 8945.00 examples/s]
+Filter: 94%|█████████▎| 767000/818627 [01:26<00:05, 8945.44 examples/s]
+Filter: 94%|█████████▎| 767000/818627 [01:26<00:05, 8891.25 examples/s]
+Filter: 94%|█████████▎| 767000/818627 [01:26<00:05, 8940.86 examples/s]
+Filter: 94%|█████████▍| 768000/818627 [01:27<00:05, 8686.45 examples/s]
+Filter: 94%|█████████▍| 768000/818627 [01:27<00:05, 8683.42 examples/s]
+Filter: 94%|█████████▍| 768000/818627 [01:27<00:05, 8685.20 examples/s]
+Filter: 94%|█████████▍| 768000/818627 [01:27<00:05, 8682.65 examples/s]
+Filter: 94%|█████████▍| 768000/818627 [01:26<00:05, 8690.05 examples/s]
+Filter: 94%|█████████▍| 768000/818627 [01:27<00:05, 8634.56 examples/s]
+Filter: 94%|█████████▍| 768000/818627 [01:26<00:05, 8683.92 examples/s]
+Filter: 94%|█████████▍| 768000/818627 [01:27<00:05, 8683.34 examples/s]
+Filter: 94%|█████████▍| 769000/818627 [01:27<00:05, 8683.04 examples/s]
+Filter: 94%|█████████▍| 769000/818627 [01:27<00:05, 8683.44 examples/s]
+Filter: 94%|█████████▍| 769000/818627 [01:27<00:05, 8681.98 examples/s]
+Filter: 94%|█████████▍| 769000/818627 [01:27<00:05, 8678.15 examples/s]
+Filter: 94%|█████████▍| 769000/818627 [01:27<00:05, 8647.79 examples/s]
+Filter: 94%|█████████▍| 769000/818627 [01:27<00:05, 8683.41 examples/s]
+Filter: 94%|█████████▍| 769000/818627 [01:27<00:05, 8682.79 examples/s]
+Filter: 94%|█████████▍| 769000/818627 [01:27<00:05, 8684.52 examples/s]
+Filter: 94%|█████████▍| 770000/818627 [01:27<00:05, 8685.94 examples/s]
+Filter: 94%|█████████▍| 770000/818627 [01:27<00:05, 8687.84 examples/s]
+Filter: 94%|█████████▍| 770000/818627 [01:27<00:05, 8686.81 examples/s]
+Filter: 94%|█████████▍| 770000/818627 [01:27<00:05, 8684.26 examples/s]
+Filter: 94%|█████████▍| 770000/818627 [01:27<00:05, 8689.21 examples/s]
+Filter: 94%|█████████▍| 770000/818627 [01:27<00:05, 8662.45 examples/s]
+Filter: 94%|█████████▍| 770000/818627 [01:27<00:05, 8685.72 examples/s]
+Filter: 94%|█████████▍| 770000/818627 [01:27<00:05, 8687.19 examples/s]
+Filter: 94%|█████████▍| 771000/818627 [01:27<00:05, 8933.69 examples/s]
+Filter: 94%|█████████▍| 771000/818627 [01:27<00:05, 8935.93 examples/s]
+Filter: 94%|█████████▍| 771000/818627 [01:27<00:05, 8934.27 examples/s]
+Filter: 94%|█████████▍| 771000/818627 [01:27<00:05, 8933.51 examples/s]
+Filter: 94%|█████████▍| 771000/818627 [01:27<00:05, 8922.35 examples/s]
+Filter: 94%|█████████▍| 771000/818627 [01:27<00:05, 8932.36 examples/s]
+Filter: 94%|█████████▍| 771000/818627 [01:27<00:05, 8930.61 examples/s]
+Filter: 94%|█████████▍| 771000/818627 [01:27<00:05, 8927.68 examples/s]
+Filter: 94%|█████████▍| 772000/818627 [01:27<00:05, 9205.47 examples/s]
+Filter: 94%|█████████▍| 772000/818627 [01:27<00:05, 9209.32 examples/s]
+Filter: 94%|█████████▍| 772000/818627 [01:27<00:05, 9204.97 examples/s]
+Filter: 94%|█████████▍| 772000/818627 [01:27<00:05, 9205.78 examples/s]
+Filter: 94%|█████████▍| 772000/818627 [01:27<00:05, 9206.75 examples/s]
+Filter: 94%|█████████▍| 772000/818627 [01:27<00:05, 9201.05 examples/s]
+Filter: 94%|█████████▍| 772000/818627 [01:27<00:05, 9206.17 examples/s]
+Filter: 94%|█████████▍| 772000/818627 [01:27<00:05, 9196.39 examples/s]
+Filter: 94%|█████████▍| 773000/818627 [01:27<00:04, 9162.90 examples/s]
+Filter: 94%|█████████▍| 773000/818627 [01:27<00:04, 9163.98 examples/s]
+Filter: 94%|█████████▍| 773000/818627 [01:27<00:04, 9162.61 examples/s]
+Filter: 94%|█████████▍| 773000/818627 [01:27<00:04, 9158.88 examples/s]
+Filter: 94%|█████████▍| 773000/818627 [01:27<00:04, 9159.36 examples/s]
+Filter: 94%|█████████▍| 773000/818627 [01:27<00:04, 9163.31 examples/s]
+Filter: 94%|█████████▍| 773000/818627 [01:27<00:04, 9163.02 examples/s]
+Filter: 94%|█████████▍| 773000/818627 [01:27<00:04, 9166.73 examples/s]
+Filter: 95%|█████████▍| 774000/818627 [01:27<00:04, 9031.91 examples/s]
+Filter: 95%|█████████▍| 774000/818627 [01:27<00:04, 9032.02 examples/s]
+Filter: 95%|█████████▍| 774000/818627 [01:27<00:04, 9033.97 examples/s]
+Filter: 95%|█████████▍| 774000/818627 [01:27<00:04, 9027.73 examples/s]
+Filter: 95%|█████████▍| 774000/818627 [01:27<00:04, 9034.79 examples/s]
+Filter: 95%|█████████▍| 774000/818627 [01:27<00:04, 9037.77 examples/s]
+Filter: 95%|█████████▍| 774000/818627 [01:27<00:04, 9034.63 examples/s]
+Filter: 95%|█████████▍| 774000/818627 [01:27<00:04, 9037.81 examples/s]
+Filter: 95%|█████████▍| 775000/818627 [01:27<00:04, 8902.05 examples/s]
+Filter: 95%|█████████▍| 775000/818627 [01:28<00:04, 8900.31 examples/s]
+Filter: 95%|█████████▍| 775000/818627 [01:27<00:04, 8896.42 examples/s]
+Filter: 95%|█████████▍| 775000/818627 [01:27<00:04, 8899.34 examples/s]
+Filter: 95%|█████████▍| 775000/818627 [01:27<00:04, 8900.52 examples/s]
+Filter: 95%|█████████▍| 775000/818627 [01:27<00:04, 8902.66 examples/s]
+Filter: 95%|█████████▍| 775000/818627 [01:27<00:04, 8907.28 examples/s]
+Filter: 95%|█████████▍| 775000/818627 [01:27<00:04, 8902.73 examples/s]
+Filter: 95%|█████████▍| 776000/818627 [01:27<00:04, 8835.75 examples/s]
+Filter: 95%|█████████▍| 776000/818627 [01:27<00:04, 8835.01 examples/s]
+Filter: 95%|█████████▍| 776000/818627 [01:28<00:04, 8834.72 examples/s]
+Filter: 95%|█████████▍| 776000/818627 [01:27<00:04, 8832.10 examples/s]
+Filter: 95%|█████████▍| 776000/818627 [01:27<00:04, 8831.01 examples/s]
+Filter: 95%|█████████▍| 776000/818627 [01:27<00:04, 8833.30 examples/s]
+Filter: 95%|█████████▍| 776000/818627 [01:27<00:04, 8835.73 examples/s]
+Filter: 95%|█████████▍| 776000/818627 [01:27<00:04, 8826.88 examples/s]
+Filter: 95%|█████████▍| 777000/818627 [01:28<00:04, 8824.30 examples/s]
+Filter: 95%|█████████▍| 777000/818627 [01:28<00:04, 8826.79 examples/s]
+Filter: 95%|█████████▍| 777000/818627 [01:28<00:04, 8826.62 examples/s]
+Filter: 95%|█████████▍| 777000/818627 [01:28<00:04, 8823.94 examples/s]
+Filter: 95%|█████████▍| 777000/818627 [01:28<00:04, 8824.28 examples/s]
+Filter: 95%|█████████▍| 777000/818627 [01:28<00:04, 8826.03 examples/s]
+Filter: 95%|█████████▍| 777000/818627 [01:28<00:04, 8823.36 examples/s]
+Filter: 95%|█████████▍| 777000/818627 [01:28<00:04, 8803.51 examples/s]
+Filter: 95%|█████████▌| 778000/818627 [01:28<00:04, 9065.47 examples/s]
+Filter: 95%|█████████▌| 778000/818627 [01:28<00:04, 9067.50 examples/s]
+Filter: 95%|█████████▌| 778000/818627 [01:28<00:04, 9069.36 examples/s]
+Filter: 95%|█████████▌| 778000/818627 [01:28<00:04, 9064.58 examples/s]
+Filter: 95%|█████████▌| 778000/818627 [01:28<00:04, 9070.69 examples/s]
+Filter: 95%|█████████▌| 778000/818627 [01:28<00:04, 9071.29 examples/s]
+Filter: 95%|█████████▌| 778000/818627 [01:28<00:04, 9065.93 examples/s]
+Filter: 95%|█████████▌| 778000/818627 [01:28<00:04, 9067.44 examples/s]
+Filter: 95%|█████████▌| 779000/818627 [01:28<00:04, 9316.79 examples/s]
+Filter: 95%|█████████▌| 779000/818627 [01:28<00:04, 9321.31 examples/s]
+Filter: 95%|█████████▌| 779000/818627 [01:28<00:04, 9318.21 examples/s]
+Filter: 95%|█████████▌| 779000/818627 [01:28<00:04, 9313.79 examples/s]
+Filter: 95%|█████████▌| 779000/818627 [01:28<00:04, 9318.02 examples/s]
+Filter: 95%|█████████▌| 779000/818627 [01:28<00:04, 9312.73 examples/s]
+Filter: 95%|█████████▌| 779000/818627 [01:28<00:04, 9315.56 examples/s]
+Filter: 95%|█████████▌| 779000/818627 [01:28<00:04, 9314.23 examples/s]
+Filter: 95%|█████████▌| 780000/818627 [01:28<00:04, 9303.03 examples/s]
+Filter: 95%|█████████▌| 780000/818627 [01:28<00:04, 9302.73 examples/s]
+Filter: 95%|█████████▌| 780000/818627 [01:28<00:04, 9302.62 examples/s]
+Filter: 95%|█████████▌| 780000/818627 [01:28<00:04, 9301.28 examples/s]
+Filter: 95%|█████████▌| 780000/818627 [01:28<00:04, 9300.15 examples/s]
+Filter: 95%|█████████▌| 780000/818627 [01:28<00:04, 9302.32 examples/s]
+Filter: 95%|█████████▌| 780000/818627 [01:28<00:04, 9299.47 examples/s]
+Filter: 95%|█████████▌| 780000/818627 [01:28<00:04, 9275.07 examples/s]
+Filter: 95%|█████████▌| 781000/818627 [01:28<00:04, 9085.89 examples/s]
+Filter: 95%|█████████▌| 781000/818627 [01:28<00:04, 9080.74 examples/s]
+Filter: 95%|█████████▌| 781000/818627 [01:28<00:04, 9082.07 examples/s]
+Filter: 95%|█████████▌| 781000/818627 [01:28<00:04, 9077.74 examples/s]
+Filter: 95%|█████████▌| 781000/818627 [01:28<00:04, 9080.21 examples/s]
+Filter: 95%|█████████▌| 781000/818627 [01:28<00:04, 9076.72 examples/s]
+Filter: 95%|█████████▌| 781000/818627 [01:28<00:04, 9076.02 examples/s]
+Filter: 95%|█████████▌| 781000/818627 [01:28<00:04, 9075.60 examples/s]
+Filter: 96%|█████████▌| 782000/818627 [01:28<00:04, 8930.96 examples/s]
+Filter: 96%|█████████▌| 782000/818627 [01:28<00:04, 8933.04 examples/s]
+Filter: 96%|█████████▌| 782000/818627 [01:28<00:04, 8931.90 examples/s]
+Filter: 96%|█████████▌| 782000/818627 [01:28<00:04, 8929.67 examples/s]
+Filter: 96%|█████████▌| 782000/818627 [01:28<00:04, 8931.21 examples/s]
+Filter: 96%|█████████▌| 782000/818627 [01:28<00:04, 8929.87 examples/s]
+Filter: 96%|█████████▌| 782000/818627 [01:28<00:04, 8927.50 examples/s]
+Filter: 96%|█████████▌| 782000/818627 [01:28<00:04, 8929.81 examples/s]
+Filter: 96%|█████████▌| 783000/818627 [01:28<00:03, 8953.21 examples/s]
+Filter: 96%|█████████▌| 783000/818627 [01:28<00:03, 8949.53 examples/s]
+Filter: 96%|█████████▌| 783000/818627 [01:28<00:03, 8952.15 examples/s]
+Filter: 96%|█████████▌| 783000/818627 [01:28<00:03, 8948.14 examples/s]
+Filter: 96%|█████████▌| 783000/818627 [01:28<00:03, 8953.50 examples/s]
+Filter: 96%|█████████▌| 783000/818627 [01:28<00:03, 8950.99 examples/s]
+Filter: 96%|█████████▌| 783000/818627 [01:28<00:03, 8951.25 examples/s]
+Filter: 96%|█████████▌| 783000/818627 [01:28<00:03, 8949.58 examples/s]
+Filter: 96%|█████████▌| 784000/818627 [01:28<00:03, 8876.65 examples/s]
+Filter: 96%|█████████▌| 784000/818627 [01:28<00:03, 8874.04 examples/s]
+Filter: 96%|█████████▌| 784000/818627 [01:28<00:03, 8874.27 examples/s]
+Filter: 96%|█████████▌| 784000/818627 [01:29<00:03, 8873.05 examples/s]
+Filter: 96%|█████████▌| 784000/818627 [01:28<00:03, 8875.38 examples/s]
+Filter: 96%|█████████▌| 784000/818627 [01:28<00:03, 8874.96 examples/s]
+Filter: 96%|█████████▌| 784000/818627 [01:28<00:03, 8872.09 examples/s]
+Filter: 96%|█████████▌| 784000/818627 [01:28<00:03, 8863.80 examples/s]
+Filter: 96%|█████████▌| 785000/818627 [01:28<00:03, 8781.82 examples/s]
+Filter: 96%|█████████▌| 785000/818627 [01:28<00:03, 8779.67 examples/s]
+Filter: 96%|█████████▌| 785000/818627 [01:28<00:03, 8778.20 examples/s]
+Filter: 96%|█████████▌| 785000/818627 [01:29<00:03, 8777.48 examples/s]
+Filter: 96%|█████████▌| 785000/818627 [01:28<00:03, 8779.56 examples/s]
+Filter: 96%|█████████▌| 785000/818627 [01:29<00:03, 8779.97 examples/s]
+Filter: 96%|█████████▌| 785000/818627 [01:28<00:03, 8780.12 examples/s]
+Filter: 96%|█████████▌| 785000/818627 [01:28<00:03, 8785.26 examples/s]
+Filter: 96%|█████████▌| 786000/818627 [01:29<00:03, 8877.89 examples/s]
+Filter: 96%|█████████▌| 786000/818627 [01:29<00:03, 8882.82 examples/s]
+Filter: 96%|█████████▌| 786000/818627 [01:29<00:03, 8877.92 examples/s]
+Filter: 96%|█████████▌| 786000/818627 [01:29<00:03, 8882.04 examples/s]
+Filter: 96%|█████████▌| 786000/818627 [01:28<00:03, 8881.11 examples/s]
+Filter: 96%|█████████▌| 786000/818627 [01:28<00:03, 8877.57 examples/s]
+Filter: 96%|█████████▌| 786000/818627 [01:29<00:03, 8874.84 examples/s]
+Filter: 96%|█████████▌| 787000/818627 [01:29<00:03, 8909.37 examples/s]
+Filter: 96%|█████████▌| 787000/818627 [01:29<00:03, 8909.36 examples/s]
+Filter: 96%|█████████▌| 787000/818627 [01:29<00:03, 8908.80 examples/s]
+Filter: 96%|█████████▋| 788000/818627 [01:29<00:03, 8846.41 examples/s]
+Filter: 96%|█████████▋| 788000/818627 [01:29<00:03, 8846.32 examples/s]
+Filter: 96%|█████████▋| 788000/818627 [01:29<00:03, 8845.59 examples/s]
+Filter: 96%|█████████▌| 786000/818627 [01:29<00:06, 5004.11 examples/s]
+Filter: 96%|█████████▋| 789000/818627 [01:29<00:03, 8848.05 examples/s]
+Filter: 96%|█████████▋| 789000/818627 [01:29<00:03, 8844.29 examples/s]
+Filter: 96%|█████████▋| 789000/818627 [01:29<00:03, 8839.70 examples/s]
+Filter: 96%|█████████▌| 787000/818627 [01:29<00:06, 5110.83 examples/s]
+Filter: 96%|█████████▌| 787000/818627 [01:29<00:06, 4898.45 examples/s]
+Filter: 96%|█████████▌| 787000/818627 [01:29<00:06, 4779.59 examples/s]
+Filter: 97%|█████████▋| 790000/818627 [01:29<00:03, 9146.36 examples/s]
+Filter: 97%|█████████▋| 790000/818627 [01:29<00:03, 9146.33 examples/s]
+Filter: 97%|█████████▋| 790000/818627 [01:29<00:03, 9142.71 examples/s]
+Filter: 96%|█████████▌| 787000/818627 [01:29<00:06, 4664.03 examples/s]
+Filter: 96%|█████████▋| 788000/818627 [01:29<00:04, 6862.65 examples/s]
+Filter: 96%|█████████▋| 789000/818627 [01:29<00:04, 7095.14 examples/s]
+Filter: 97%|█████████▋| 791000/818627 [01:29<00:02, 9247.46 examples/s]
+Filter: 97%|█████████▋| 791000/818627 [01:29<00:02, 9248.12 examples/s]
+Filter: 97%|█████████▋| 791000/818627 [01:29<00:02, 9245.55 examples/s]
+Filter: 96%|█████████▋| 789000/818627 [01:29<00:04, 6846.77 examples/s]
+Filter: 96%|█████████▋| 789000/818627 [01:29<00:04, 6659.75 examples/s]
+Filter: 96%|█████████▋| 789000/818627 [01:29<00:04, 6624.87 examples/s]
+Filter: 97%|█████████▋| 790000/818627 [01:29<00:03, 8403.37 examples/s]
+Filter: 97%|█████████▋| 791000/818627 [01:29<00:03, 8706.20 examples/s]
+Filter: 97%|█████████▋| 791000/818627 [01:29<00:03, 8491.33 examples/s]
+Filter: 97%|█████████▋| 791000/818627 [01:29<00:03, 8159.90 examples/s]
+Filter: 97%|█████████▋| 791000/818627 [01:29<00:03, 8229.44 examples/s]
+Filter: 97%|█████████▋| 792000/818627 [01:30<00:02, 9381.67 examples/s]
+Filter: 97%|█████████▋| 793000/818627 [01:29<00:02, 9191.47 examples/s]
+Filter: 97%|█████████▋| 793000/818627 [01:29<00:02, 9497.64 examples/s]
+Filter: 97%|█████████▋| 793000/818627 [01:29<00:02, 9485.96 examples/s]
+Filter: 97%|█████████▋| 793000/818627 [01:29<00:02, 9279.54 examples/s]
+Filter: 97%|█████████▋| 792000/818627 [01:29<00:05, 5118.96 examples/s]
+Filter: 97%|█████████▋| 792000/818627 [01:30<00:05, 4883.40 examples/s]
+Filter: 97%|█████████▋| 794000/818627 [01:30<00:02, 9301.74 examples/s]
+Filter: 97%|█████████▋| 792000/818627 [01:29<00:05, 4705.09 examples/s]
+Filter: 97%|█████████▋| 794000/818627 [01:30<00:03, 7099.74 examples/s]
+Filter: 97%|█████████▋| 795000/818627 [01:30<00:02, 9087.62 examples/s]
+Filter: 97%|█████████▋| 795000/818627 [01:30<00:02, 9280.80 examples/s]
+Filter: 97%|█████████▋| 795000/818627 [01:30<00:02, 9626.20 examples/s]
+Filter: 97%|█████████▋| 795000/818627 [01:30<00:02, 9616.10 examples/s]
+Filter: 97%|█████████▋| 794000/818627 [01:30<00:03, 6873.25 examples/s]
+Filter: 97%|█████████▋| 794000/818627 [01:30<00:03, 6688.04 examples/s]
+Filter: 97%|█████████▋| 796000/818627 [01:30<00:02, 9013.20 examples/s]
+Filter: 97%|█████████▋| 796000/818627 [01:30<00:02, 9104.36 examples/s]
+Filter: 97%|█████████▋| 796000/818627 [01:30<00:02, 8722.99 examples/s]
+Filter: 97%|█████████▋| 796000/818627 [01:30<00:02, 8496.10 examples/s]
+Filter: 97%|█████████▋| 796000/818627 [01:30<00:02, 8345.67 examples/s]
+Filter: 97%|█████████▋| 797000/818627 [01:30<00:02, 8922.99 examples/s]
+Filter: 97%|█████████▋| 797000/818627 [01:30<00:02, 9071.89 examples/s]
+Filter: 97%|█████████▋| 797000/818627 [01:30<00:02, 9006.76 examples/s]
+Filter: 97%|█████████▋| 797000/818627 [01:30<00:02, 9287.95 examples/s]
+Filter: 97%|█████████▋| 797000/818627 [01:30<00:02, 9281.16 examples/s]
+Filter: 97%|█████████▋| 798000/818627 [01:30<00:02, 9033.72 examples/s]
+Filter: 97%|█████████▋| 798000/818627 [01:30<00:02, 9081.57 examples/s]
+Filter: 97%|█████████▋| 798000/818627 [01:30<00:02, 9396.04 examples/s]
+Filter: 97%|█████████▋| 798000/818627 [01:30<00:02, 9122.12 examples/s]
+Filter: 97%|█████████▋| 798000/818627 [01:30<00:02, 9074.05 examples/s]
+Filter: 97%|█████████▋| 798000/818627 [01:30<00:02, 9289.58 examples/s]
+Filter: 97%|█████████▋| 798000/818627 [01:30<00:02, 9609.49 examples/s]
+Filter: 98%|█████████▊| 799000/818627 [01:30<00:02, 9253.54 examples/s]
+Filter: 98%|█████████▊| 799000/818627 [01:30<00:02, 9410.79 examples/s]
+Filter: 98%|█████████▊| 800000/818627 [01:30<00:02, 9173.99 examples/s]
+Filter: 98%|█████████▊| 800000/818627 [01:30<00:02, 9242.97 examples/s]
+Filter: 98%|█████████▊| 800000/818627 [01:30<00:02, 9203.12 examples/s]
+Filter: 98%|█████████▊| 800000/818627 [01:30<00:02, 9222.27 examples/s]
+Filter: 98%|█████████▊| 800000/818627 [01:30<00:01, 9410.47 examples/s]
+Filter: 98%|█████████▊| 800000/818627 [01:30<00:01, 9598.85 examples/s]
+Filter: 98%|█████████▊| 800000/818627 [01:30<00:01, 9355.00 examples/s]
+Filter: 98%|█████████▊| 800000/818627 [01:30<00:02, 9271.35 examples/s]
+Filter: 98%|█████████▊| 801000/818627 [01:30<00:01, 9004.08 examples/s]
+Filter: 98%|█████████▊| 801000/818627 [01:30<00:01, 9104.01 examples/s]
+Filter: 98%|█████████▊| 801000/818627 [01:31<00:01, 9080.17 examples/s]
+Filter: 98%|█████████▊| 801000/818627 [01:30<00:01, 9074.83 examples/s]
+Filter: 98%|█████████▊| 801000/818627 [01:30<00:01, 9174.55 examples/s]
+Filter: 98%|█████████▊| 801000/818627 [01:30<00:01, 9190.46 examples/s]
+Filter: 98%|█████████▊| 802000/818627 [01:30<00:01, 9004.10 examples/s]
+Filter: 98%|█████████▊| 802000/818627 [01:30<00:01, 8904.56 examples/s]
+Filter: 98%|█████████▊| 802000/818627 [01:30<00:01, 8985.81 examples/s]
+Filter: 98%|█████████▊| 802000/818627 [01:31<00:01, 8975.04 examples/s]
+Filter: 98%|█████████▊| 802000/818627 [01:30<00:01, 9260.22 examples/s]
+Filter: 98%|█████████▊| 802000/818627 [01:31<00:01, 9138.86 examples/s]
+Filter: 98%|█████████▊| 802000/818627 [01:30<00:01, 9073.28 examples/s]
+Filter: 98%|█████████▊| 802000/818627 [01:30<00:01, 9053.81 examples/s]
+Filter: 98%|█████████▊| 803000/818627 [01:31<00:01, 8875.65 examples/s]
+Filter: 98%|█████████▊| 803000/818627 [01:31<00:01, 8796.62 examples/s]
+Filter: 98%|█████████▊| 803000/818627 [01:31<00:01, 8869.92 examples/s]
+Filter: 98%|█████████▊| 803000/818627 [01:31<00:01, 8882.86 examples/s]
+Filter: 98%|█████████▊| 803000/818627 [01:31<00:01, 9017.62 examples/s]
+Filter: 98%|█████████▊| 803000/818627 [01:31<00:01, 8919.30 examples/s]
+Filter: 98%|█████████▊| 803000/818627 [01:31<00:01, 8934.41 examples/s]
+Filter: 98%|█████████▊| 804000/818627 [01:31<00:01, 8827.19 examples/s]
+Filter: 98%|█████████▊| 804000/818627 [01:31<00:01, 8856.89 examples/s]
+Filter: 98%|█████████▊| 804000/818627 [01:31<00:01, 8941.55 examples/s]
+Filter: 98%|█████████▊| 804000/818627 [01:31<00:01, 8805.92 examples/s]
+Filter: 98%|█████████▊| 804000/818627 [01:31<00:01, 8865.45 examples/s]
+Filter: 98%|█████████▊| 804000/818627 [01:31<00:01, 8721.84 examples/s]
+Filter: 98%|█████████▊| 804000/818627 [01:31<00:01, 8778.94 examples/s]
+Filter: 98%|█████████▊| 804000/818627 [01:31<00:01, 8976.86 examples/s]
+Filter: 98%|█████████▊| 805000/818627 [01:31<00:01, 9006.73 examples/s]
+Filter: 98%|█████████▊| 805000/818627 [01:31<00:01, 8983.10 examples/s]
+Filter: 98%|█████████▊| 805000/818627 [01:31<00:01, 9000.81 examples/s]
+Filter: 98%|█████████▊| 805000/818627 [01:31<00:01, 9073.35 examples/s]
+Filter: 98%|█████████▊| 805000/818627 [01:31<00:01, 9027.39 examples/s]
+Filter: 98%|█████████▊| 805000/818627 [01:31<00:01, 9035.71 examples/s]
+Filter: 98%|█████████▊| 805000/818627 [01:31<00:01, 8989.90 examples/s]
+Filter: 98%|█████████▊| 805000/818627 [01:31<00:01, 9140.85 examples/s]
+Filter: 98%|█████████▊| 806000/818627 [01:31<00:01, 8923.77 examples/s]
+Filter: 98%|█████████▊| 806000/818627 [01:31<00:01, 8900.57 examples/s]
+Filter: 98%|█████████▊| 806000/818627 [01:31<00:01, 8920.66 examples/s]
+Filter: 98%|█████████▊| 806000/818627 [01:31<00:01, 8928.75 examples/s]
+Filter: 98%|█████████▊| 806000/818627 [01:31<00:01, 9055.81 examples/s]
+Filter: 98%|█████████▊| 806000/818627 [01:31<00:01, 8937.78 examples/s]
+Filter: 98%|█████████▊| 806000/818627 [01:31<00:01, 8978.08 examples/s]
+Filter: 98%|█████████▊| 806000/818627 [01:31<00:01, 8942.43 examples/s]
+Filter: 99%|█████████▊| 807000/818627 [01:31<00:01, 8913.14 examples/s]
+Filter: 99%|█████████▊| 807000/818627 [01:31<00:01, 8909.72 examples/s]
+Filter: 99%|█████████▊| 807000/818627 [01:31<00:01, 8888.69 examples/s]
+Filter: 99%|█████████▊| 807000/818627 [01:31<00:01, 8952.15 examples/s]
+Filter: 99%|█████████▊| 807000/818627 [01:31<00:01, 8924.89 examples/s]
+Filter: 99%|█████████▊| 807000/818627 [01:31<00:01, 8912.52 examples/s]
+Filter: 99%|█████████▊| 807000/818627 [01:31<00:01, 8997.86 examples/s]
+Filter: 99%|█████████▊| 807000/818627 [01:31<00:01, 8829.36 examples/s]
+Filter: 99%|█████████▊| 808000/818627 [01:31<00:01, 8851.72 examples/s]
+Filter: 99%|█████████▊| 808000/818627 [01:31<00:01, 8841.61 examples/s]
+Filter: 99%|█████████▊| 808000/818627 [01:31<00:01, 8880.17 examples/s]
+Filter: 99%|█████████▊| 808000/818627 [01:31<00:01, 8844.00 examples/s]
+Filter: 99%|█████████▊| 808000/818627 [01:31<00:01, 8859.47 examples/s]
+Filter: 99%|█████████▊| 808000/818627 [01:31<00:01, 8937.75 examples/s]
+Filter: 99%|█████████▊| 808000/818627 [01:31<00:01, 8879.84 examples/s]
+Filter: 99%|█████████▊| 808000/818627 [01:31<00:01, 8859.08 examples/s]
+Filter: 99%|█████████▉| 809000/818627 [01:31<00:01, 8710.43 examples/s]
+Filter: 99%|█████████▉| 809000/818627 [01:31<00:01, 8718.29 examples/s]
+Filter: 99%|█████████▉| 809000/818627 [01:31<00:01, 8719.32 examples/s]
+Filter: 99%|█████████▉| 809000/818627 [01:32<00:01, 8740.31 examples/s]
+Filter: 99%|█████████▉| 809000/818627 [01:31<00:01, 8801.98 examples/s]
+Filter: 99%|█████████▉| 809000/818627 [01:31<00:01, 8750.76 examples/s]
+Filter: 99%|█████████▉| 809000/818627 [01:31<00:01, 8727.40 examples/s]
+Filter: 99%|█████████▉| 809000/818627 [01:31<00:01, 8729.77 examples/s]
+Filter: 99%|█████████▉| 810000/818627 [01:31<00:00, 8679.61 examples/s]
+Filter: 99%|█████████▉| 810000/818627 [01:31<00:00, 8685.99 examples/s]
+Filter: 99%|█████████▉| 810000/818627 [01:32<00:00, 8700.50 examples/s]
+Filter: 99%|█████████▉| 810000/818627 [01:31<00:00, 8681.94 examples/s]
+Filter: 99%|█████████▉| 810000/818627 [01:31<00:00, 8711.49 examples/s]
+Filter: 99%|█████████▉| 810000/818627 [01:31<00:00, 8694.39 examples/s]
+Filter: 99%|█████████▉| 810000/818627 [01:31<00:00, 8747.53 examples/s]
+Filter: 99%|█████████▉| 810000/818627 [01:31<00:00, 8692.65 examples/s]
+Filter: 99%|█████████▉| 811000/818627 [01:31<00:00, 8639.13 examples/s]
+Filter: 99%|█████████▉| 811000/818627 [01:32<00:00, 8651.62 examples/s]
+Filter: 99%|█████████▉| 811000/818627 [01:31<00:00, 8644.24 examples/s]
+Filter: 99%|█████████▉| 811000/818627 [01:31<00:00, 8690.75 examples/s]
+Filter: 99%|█████████▉| 811000/818627 [01:32<00:00, 8659.85 examples/s]
+Filter: 99%|█████████▉| 811000/818627 [01:31<00:00, 8644.51 examples/s]
+Filter: 99%|█████████▉| 811000/818627 [01:31<00:00, 8647.16 examples/s]
+Filter: 99%|█████████▉| 811000/818627 [01:31<00:00, 8620.94 examples/s]
+Filter: 99%|█████████▉| 812000/818627 [01:32<00:00, 8887.06 examples/s]
+Filter: 99%|█████████▉| 812000/818627 [01:32<00:00, 8893.39 examples/s]
+Filter: 99%|█████████▉| 812000/818627 [01:32<00:00, 8894.90 examples/s]
+Filter: 99%|█████████▉| 812000/818627 [01:32<00:00, 8889.34 examples/s]
+Filter: 99%|█████████▉| 812000/818627 [01:32<00:00, 8894.50 examples/s]
+Filter: 99%|█████████▉| 812000/818627 [01:32<00:00, 8911.67 examples/s]
+Filter: 99%|█████████▉| 812000/818627 [01:32<00:00, 8895.87 examples/s]
+Filter: 99%|█████████▉| 812000/818627 [01:32<00:00, 8887.94 examples/s]
+Filter: 99%|█████████▉| 813000/818627 [01:32<00:00, 9097.55 examples/s]
+Filter: 99%|█████████▉| 813000/818627 [01:32<00:00, 9098.83 examples/s]
+Filter: 99%|█████████▉| 813000/818627 [01:32<00:00, 9096.04 examples/s]
+Filter: 99%|█████████▉| 813000/818627 [01:32<00:00, 9091.44 examples/s]
+Filter: 99%|█████████▉| 813000/818627 [01:32<00:00, 9109.63 examples/s]
+Filter: 99%|█████████▉| 813000/818627 [01:32<00:00, 9098.55 examples/s]
+Filter: 99%|█████████▉| 813000/818627 [01:32<00:00, 9100.26 examples/s]
+Filter: 99%|█████████▉| 813000/818627 [01:32<00:00, 9099.80 examples/s]
+Filter: 99%|█████████▉| 814000/818627 [01:32<00:00, 9315.90 examples/s]
+Filter: 99%|█████████▉| 814000/818627 [01:32<00:00, 9320.56 examples/s]
+Filter: 99%|█████████▉| 814000/818627 [01:32<00:00, 9316.47 examples/s]
+Filter: 99%|█████████▉| 814000/818627 [01:32<00:00, 9316.38 examples/s]
+Filter: 99%|█████████▉| 814000/818627 [01:32<00:00, 9319.63 examples/s]
+Filter: 99%|█████████▉| 814000/818627 [01:32<00:00, 9318.16 examples/s]
+Filter: 99%|█████████▉| 814000/818627 [01:32<00:00, 9315.45 examples/s]
+Filter: 99%|█████████▉| 814000/818627 [01:32<00:00, 9317.58 examples/s]
+Filter: 100%|█████████▉| 815000/818627 [01:32<00:00, 9255.23 examples/s]
+Filter: 100%|█████████▉| 815000/818627 [01:32<00:00, 9259.08 examples/s]
+Filter: 100%|█████████▉| 815000/818627 [01:32<00:00, 9264.35 examples/s]
+Filter: 100%|█████████▉| 815000/818627 [01:32<00:00, 9258.08 examples/s]
+Filter: 100%|█████████▉| 815000/818627 [01:32<00:00, 9261.59 examples/s]
+Filter: 100%|█████████▉| 815000/818627 [01:32<00:00, 9259.45 examples/s]
+Filter: 100%|█████████▉| 815000/818627 [01:32<00:00, 9256.48 examples/s]
+Filter: 100%|█████████▉| 815000/818627 [01:32<00:00, 9256.97 examples/s]
+Filter: 100%|█████████▉| 816000/818627 [01:32<00:00, 9089.65 examples/s]
+Filter: 100%|█████████▉| 816000/818627 [01:32<00:00, 9092.22 examples/s]
+Filter: 100%|█████████▉| 816000/818627 [01:32<00:00, 9093.25 examples/s]
+Filter: 100%|█████████▉| 816000/818627 [01:32<00:00, 9091.29 examples/s]
+Filter: 100%|█████████▉| 816000/818627 [01:32<00:00, 9092.85 examples/s]
+Filter: 100%|█████████▉| 816000/818627 [01:32<00:00, 9091.13 examples/s]
+Filter: 100%|█████████▉| 816000/818627 [01:32<00:00, 9090.10 examples/s]
+Filter: 100%|█████████▉| 816000/818627 [01:32<00:00, 9090.48 examples/s]
+Filter: 100%|█████████▉| 817000/818627 [01:32<00:00, 8939.31 examples/s]
+Filter: 100%|█████████▉| 817000/818627 [01:32<00:00, 8943.72 examples/s]
+Filter: 100%|█████████▉| 817000/818627 [01:32<00:00, 8942.93 examples/s]
+Filter: 100%|█████████▉| 817000/818627 [01:32<00:00, 8941.12 examples/s]
+Filter: 100%|█████████▉| 817000/818627 [01:32<00:00, 8939.41 examples/s]
+Filter: 100%|█████████▉| 817000/818627 [01:32<00:00, 8939.73 examples/s]
+Filter: 100%|█████████▉| 817000/818627 [01:32<00:00, 8934.51 examples/s]
+Filter: 100%|█████████▉| 817000/818627 [01:32<00:00, 8872.49 examples/s]
+Filter: 100%|█████████▉| 818000/818627 [01:32<00:00, 8841.52 examples/s]
+Filter: 100%|█████████▉| 818000/818627 [01:32<00:00, 8822.54 examples/s]
+Filter: 100%|█████████▉| 818000/818627 [01:32<00:00, 8822.92 examples/s]
+Filter: 100%|█████████▉| 818000/818627 [01:33<00:00, 8821.47 examples/s]
+Filter: 100%|█████████▉| 818000/818627 [01:32<00:00, 8826.93 examples/s]
+Filter: 100%|█████████▉| 818000/818627 [01:32<00:00, 8821.87 examples/s]
+Filter: 100%|█████████▉| 818000/818627 [01:32<00:00, 8823.89 examples/s]
+Filter: 100%|█████████▉| 818000/818627 [01:32<00:00, 8818.68 examples/s]
+Filter: 100%|██████████| 818627/818627 [01:32<00:00, 8822.79 examples/s]
+
+Filter: 100%|██████████| 818627/818627 [01:32<00:00, 8823.29 examples/s]
+
+Filter: 100%|██████████| 818627/818627 [01:32<00:00, 8823.25 examples/s]
+
+Filter: 100%|██████████| 818627/818627 [01:32<00:00, 8812.61 examples/s]
+
+Filter: 100%|██████████| 818627/818627 [01:32<00:00, 8822.77 examples/s]
+
+Filter: 100%|██████████| 818627/818627 [01:32<00:00, 8822.00 examples/s]
+
+Filter: 100%|██████████| 818627/818627 [01:32<00:00, 8822.33 examples/s]
+
+Filter: 100%|██████████| 818627/818627 [01:33<00:00, 8791.21 examples/s]
+
+Epoch 0: 0%| | 0/99077 [00:00, ?it/s]
+Epoch 0: 0%| | 0/99077 [00:01, ?it/s]
+[rank0]: Traceback (most recent call last):
+[rank0]: File "/workspace/hanrui/syxin_old/Specforge/scripts/train_dflash_lora_inject.py", line 487, in
+[rank0]: main()
+[rank0]: File "/workspace/hanrui/syxin_old/Specforge/scripts/train_dflash_lora_inject.py", line 438, in main
+[rank0]: for step_in_epoch, data in enumerate(progress_bar):
+[rank0]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/site-packages/tqdm/std.py", line 1181, in __iter__
+[rank0]: for obj in iterable:
+[rank0]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/site-packages/torch/utils/data/dataloader.py", line 494, in __iter__
+[rank0]: return self._get_iterator()
+[rank0]: ^^^^^^^^^^^^^^^^^^^^
+[rank0]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/site-packages/torch/utils/data/dataloader.py", line 427, in _get_iterator
+[rank0]: return _MultiProcessingDataLoaderIter(self)
+[rank0]: ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+[rank0]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/site-packages/torch/utils/data/dataloader.py", line 1140, in __init__
+[rank0]: index_queue = multiprocessing_context.Queue() # type: ignore[var-annotated]
+[rank0]: ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+[rank0]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/multiprocessing/context.py", line 103, in Queue
+[rank0]: return Queue(maxsize, ctx=self.get_context())
+[rank0]: ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+[rank0]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/multiprocessing/queues.py", line 49, in __init__
+[rank0]: self._sem = ctx.BoundedSemaphore(maxsize)
+[rank0]: ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+[rank0]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/multiprocessing/context.py", line 88, in BoundedSemaphore
+[rank0]: return BoundedSemaphore(value, ctx=self.get_context())
+[rank0]: ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+[rank0]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/multiprocessing/synchronize.py", line 152, in __init__
+[rank0]: SemLock.__init__(self, SEMAPHORE, value, value, ctx=ctx)
+[rank0]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/multiprocessing/synchronize.py", line 57, in __init__
+[rank0]: sl = self._semlock = _multiprocessing.SemLock(
+[rank0]: ^^^^^^^^^^^^^^^^^^^^^^^^^
+[rank0]: OSError: [Errno 28] No space left on device
+[rank5]: Traceback (most recent call last):
+[rank5]: File "/workspace/hanrui/syxin_old/Specforge/scripts/train_dflash_lora_inject.py", line 487, in
+[rank5]: main()
+[rank5]: File "/workspace/hanrui/syxin_old/Specforge/scripts/train_dflash_lora_inject.py", line 438, in main
+[rank5]: for step_in_epoch, data in enumerate(progress_bar):
+[rank5]: ^^^^^^^^^^^^^^^^^^^^^^^
+[rank5]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/site-packages/torch/utils/data/dataloader.py", line 494, in __iter__
+[rank5]: return self._get_iterator()
+[rank5]: ^^^^^^^^^^^^^^^^^^^^
+[rank5]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/site-packages/torch/utils/data/dataloader.py", line 427, in _get_iterator
+[rank5]: return _MultiProcessingDataLoaderIter(self)
+[rank5]: ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+[rank5]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/site-packages/torch/utils/data/dataloader.py", line 1140, in __init__
+[rank5]: index_queue = multiprocessing_context.Queue() # type: ignore[var-annotated]
+[rank5]: ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+[rank5]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/multiprocessing/context.py", line 103, in Queue
+[rank5]: return Queue(maxsize, ctx=self.get_context())
+[rank5]: ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+[rank5]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/multiprocessing/queues.py", line 43, in __init__
+[rank5]: self._rlock = ctx.Lock()
+[rank5]: ^^^^^^^^^^
+[rank5]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/multiprocessing/context.py", line 68, in Lock
+[rank5]: return Lock(ctx=self.get_context())
+[rank5]: ^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+[rank5]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/multiprocessing/synchronize.py", line 169, in __init__
+[rank5]: SemLock.__init__(self, SEMAPHORE, 1, 1, ctx=ctx)
+[rank5]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/multiprocessing/synchronize.py", line 57, in __init__
+[rank5]: sl = self._semlock = _multiprocessing.SemLock(
+[rank5]: ^^^^^^^^^^^^^^^^^^^^^^^^^
+[rank5]: OSError: [Errno 28] No space left on device
+[rank1]: Traceback (most recent call last):
+[rank1]: File "/workspace/hanrui/syxin_old/Specforge/scripts/train_dflash_lora_inject.py", line 487, in
+[rank1]: main()
+[rank1]: File "/workspace/hanrui/syxin_old/Specforge/scripts/train_dflash_lora_inject.py", line 438, in main
+[rank1]: for step_in_epoch, data in enumerate(progress_bar):
+[rank1]: ^^^^^^^^^^^^^^^^^^^^^^^
+[rank1]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/site-packages/torch/utils/data/dataloader.py", line 494, in __iter__
+[rank1]: return self._get_iterator()
+[rank1]: ^^^^^^^^^^^^^^^^^^^^
+[rank1]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/site-packages/torch/utils/data/dataloader.py", line 427, in _get_iterator
+[rank1]: return _MultiProcessingDataLoaderIter(self)
+[rank1]: ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+[rank1]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/site-packages/torch/utils/data/dataloader.py", line 1140, in __init__
+[rank1]: index_queue = multiprocessing_context.Queue() # type: ignore[var-annotated]
+[rank1]: ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+[rank1]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/multiprocessing/context.py", line 103, in Queue
+[rank1]: return Queue(maxsize, ctx=self.get_context())
+[rank1]: ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+[rank1]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/multiprocessing/queues.py", line 43, in __init__
+[rank1]: self._rlock = ctx.Lock()
+[rank1]: ^^^^^^^^^^
+[rank1]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/multiprocessing/context.py", line 68, in Lock
+[rank1]: return Lock(ctx=self.get_context())
+[rank1]: ^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+[rank1]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/multiprocessing/synchronize.py", line 169, in __init__
+[rank1]: SemLock.__init__(self, SEMAPHORE, 1, 1, ctx=ctx)
+[rank1]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/multiprocessing/synchronize.py", line 57, in __init__
+[rank1]: sl = self._semlock = _multiprocessing.SemLock(
+[rank1]: ^^^^^^^^^^^^^^^^^^^^^^^^^
+[rank1]: OSError: [Errno 28] No space left on device
+[rank3]: Traceback (most recent call last):
+[rank3]: File "/workspace/hanrui/syxin_old/Specforge/scripts/train_dflash_lora_inject.py", line 487, in
+[rank3]: main()
+[rank3]: File "/workspace/hanrui/syxin_old/Specforge/scripts/train_dflash_lora_inject.py", line 438, in main
+[rank3]: for step_in_epoch, data in enumerate(progress_bar):
+[rank3]: ^^^^^^^^^^^^^^^^^^^^^^^
+[rank3]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/site-packages/torch/utils/data/dataloader.py", line 494, in __iter__
+[rank3]: return self._get_iterator()
+[rank3]: ^^^^^^^^^^^^^^^^^^^^
+[rank3]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/site-packages/torch/utils/data/dataloader.py", line 427, in _get_iterator
+[rank3]: return _MultiProcessingDataLoaderIter(self)
+[rank3]: ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+[rank3]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/site-packages/torch/utils/data/dataloader.py", line 1140, in __init__
+[rank3]: index_queue = multiprocessing_context.Queue() # type: ignore[var-annotated]
+[rank3]: ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+[rank3]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/multiprocessing/context.py", line 103, in Queue
+[rank3]: return Queue(maxsize, ctx=self.get_context())
+[rank3]: ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+[rank3]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/multiprocessing/queues.py", line 43, in __init__
+[rank3]: self._rlock = ctx.Lock()
+[rank3]: ^^^^^^^^^^
+[rank3]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/multiprocessing/context.py", line 68, in Lock
+[rank3]: return Lock(ctx=self.get_context())
+[rank3]: ^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+[rank3]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/multiprocessing/synchronize.py", line 169, in __init__
+[rank3]: SemLock.__init__(self, SEMAPHORE, 1, 1, ctx=ctx)
+[rank3]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/multiprocessing/synchronize.py", line 57, in __init__
+[rank3]: sl = self._semlock = _multiprocessing.SemLock(
+[rank3]: ^^^^^^^^^^^^^^^^^^^^^^^^^
+[rank3]: OSError: [Errno 28] No space left on device
+[rank2]: Traceback (most recent call last):
+[rank2]: File "/workspace/hanrui/syxin_old/Specforge/scripts/train_dflash_lora_inject.py", line 487, in
+[rank2]: main()
+[rank2]: File "/workspace/hanrui/syxin_old/Specforge/scripts/train_dflash_lora_inject.py", line 438, in main
+[rank2]: for step_in_epoch, data in enumerate(progress_bar):
+[rank2]: ^^^^^^^^^^^^^^^^^^^^^^^
+[rank2]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/site-packages/torch/utils/data/dataloader.py", line 494, in __iter__
+[rank2]: return self._get_iterator()
+[rank2]: ^^^^^^^^^^^^^^^^^^^^
+[rank2]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/site-packages/torch/utils/data/dataloader.py", line 427, in _get_iterator
+[rank2]: return _MultiProcessingDataLoaderIter(self)
+[rank2]: ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+[rank2]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/site-packages/torch/utils/data/dataloader.py", line 1140, in __init__
+[rank2]: index_queue = multiprocessing_context.Queue() # type: ignore[var-annotated]
+[rank2]: ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+[rank2]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/multiprocessing/context.py", line 103, in Queue
+[rank2]: return Queue(maxsize, ctx=self.get_context())
+[rank2]: ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+[rank2]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/multiprocessing/queues.py", line 43, in __init__
+[rank2]: self._rlock = ctx.Lock()
+[rank2]: ^^^^^^^^^^
+[rank2]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/multiprocessing/context.py", line 68, in Lock
+[rank2]: return Lock(ctx=self.get_context())
+[rank2]: ^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+[rank2]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/multiprocessing/synchronize.py", line 169, in __init__
+[rank2]: SemLock.__init__(self, SEMAPHORE, 1, 1, ctx=ctx)
+[rank2]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/multiprocessing/synchronize.py", line 57, in __init__
+[rank2]: sl = self._semlock = _multiprocessing.SemLock(
+[rank2]: ^^^^^^^^^^^^^^^^^^^^^^^^^
+[rank2]: OSError: [Errno 28] No space left on device
+[rank4]: Traceback (most recent call last):
+[rank4]: File "/workspace/hanrui/syxin_old/Specforge/scripts/train_dflash_lora_inject.py", line 487, in
+[rank4]: main()
+[rank4]: File "/workspace/hanrui/syxin_old/Specforge/scripts/train_dflash_lora_inject.py", line 438, in main
+[rank4]: for step_in_epoch, data in enumerate(progress_bar):
+[rank4]: ^^^^^^^^^^^^^^^^^^^^^^^
+[rank4]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/site-packages/torch/utils/data/dataloader.py", line 494, in __iter__
+[rank4]: return self._get_iterator()
+[rank4]: ^^^^^^^^^^^^^^^^^^^^
+[rank4]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/site-packages/torch/utils/data/dataloader.py", line 427, in _get_iterator
+[rank4]: return _MultiProcessingDataLoaderIter(self)
+[rank4]: ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+[rank4]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/site-packages/torch/utils/data/dataloader.py", line 1140, in __init__
+[rank4]: index_queue = multiprocessing_context.Queue() # type: ignore[var-annotated]
+[rank4]: ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+[rank4]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/multiprocessing/context.py", line 103, in Queue
+[rank4]: return Queue(maxsize, ctx=self.get_context())
+[rank4]: ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+[rank4]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/multiprocessing/queues.py", line 43, in __init__
+[rank4]: self._rlock = ctx.Lock()
+[rank4]: ^^^^^^^^^^
+[rank4]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/multiprocessing/context.py", line 68, in Lock
+[rank4]: return Lock(ctx=self.get_context())
+[rank4]: ^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+[rank4]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/multiprocessing/synchronize.py", line 169, in __init__
+[rank4]: SemLock.__init__(self, SEMAPHORE, 1, 1, ctx=ctx)
+[rank4]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/multiprocessing/synchronize.py", line 57, in __init__
+[rank4]: sl = self._semlock = _multiprocessing.SemLock(
+[rank4]: ^^^^^^^^^^^^^^^^^^^^^^^^^
+[rank4]: OSError: [Errno 28] No space left on device
+[rank7]: Traceback (most recent call last):
+[rank7]: File "/workspace/hanrui/syxin_old/Specforge/scripts/train_dflash_lora_inject.py", line 487, in
+[rank7]: main()
+[rank7]: File "/workspace/hanrui/syxin_old/Specforge/scripts/train_dflash_lora_inject.py", line 438, in main
+[rank7]: for step_in_epoch, data in enumerate(progress_bar):
+[rank7]: ^^^^^^^^^^^^^^^^^^^^^^^
+[rank7]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/site-packages/torch/utils/data/dataloader.py", line 494, in __iter__
+[rank7]: return self._get_iterator()
+[rank7]: ^^^^^^^^^^^^^^^^^^^^
+[rank7]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/site-packages/torch/utils/data/dataloader.py", line 427, in _get_iterator
+[rank7]: return _MultiProcessingDataLoaderIter(self)
+[rank7]: ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+[rank7]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/site-packages/torch/utils/data/dataloader.py", line 1140, in __init__
+[rank7]: index_queue = multiprocessing_context.Queue() # type: ignore[var-annotated]
+[rank7]: ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+[rank7]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/multiprocessing/context.py", line 103, in Queue
+[rank7]: return Queue(maxsize, ctx=self.get_context())
+[rank7]: ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+[rank7]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/multiprocessing/queues.py", line 43, in __init__
+[rank7]: self._rlock = ctx.Lock()
+[rank7]: ^^^^^^^^^^
+[rank7]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/multiprocessing/context.py", line 68, in Lock
+[rank7]: return Lock(ctx=self.get_context())
+[rank7]: ^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+[rank7]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/multiprocessing/synchronize.py", line 169, in __init__
+[rank7]: SemLock.__init__(self, SEMAPHORE, 1, 1, ctx=ctx)
+[rank7]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/multiprocessing/synchronize.py", line 57, in __init__
+[rank7]: sl = self._semlock = _multiprocessing.SemLock(
+[rank7]: ^^^^^^^^^^^^^^^^^^^^^^^^^
+[rank7]: OSError: [Errno 28] No space left on device
+[rank6]: Traceback (most recent call last):
+[rank6]: File "/workspace/hanrui/syxin_old/Specforge/scripts/train_dflash_lora_inject.py", line 487, in
+[rank6]: main()
+[rank6]: File "/workspace/hanrui/syxin_old/Specforge/scripts/train_dflash_lora_inject.py", line 438, in main
+[rank6]: for step_in_epoch, data in enumerate(progress_bar):
+[rank6]: ^^^^^^^^^^^^^^^^^^^^^^^
+[rank6]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/site-packages/torch/utils/data/dataloader.py", line 494, in __iter__
+[rank6]: return self._get_iterator()
+[rank6]: ^^^^^^^^^^^^^^^^^^^^
+[rank6]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/site-packages/torch/utils/data/dataloader.py", line 427, in _get_iterator
+[rank6]: return _MultiProcessingDataLoaderIter(self)
+[rank6]: ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+[rank6]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/site-packages/torch/utils/data/dataloader.py", line 1140, in __init__
+[rank6]: index_queue = multiprocessing_context.Queue() # type: ignore[var-annotated]
+[rank6]: ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+[rank6]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/multiprocessing/context.py", line 103, in Queue
+[rank6]: return Queue(maxsize, ctx=self.get_context())
+[rank6]: ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+[rank6]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/multiprocessing/queues.py", line 43, in __init__
+[rank6]: self._rlock = ctx.Lock()
+[rank6]: ^^^^^^^^^^
+[rank6]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/multiprocessing/context.py", line 68, in Lock
+[rank6]: return Lock(ctx=self.get_context())
+[rank6]: ^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+[rank6]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/multiprocessing/synchronize.py", line 169, in __init__
+[rank6]: SemLock.__init__(self, SEMAPHORE, 1, 1, ctx=ctx)
+[rank6]: File "/workspace/miniconda3/envs/specforge/lib/python3.11/multiprocessing/synchronize.py", line 57, in __init__
+[rank6]: sl = self._semlock = _multiprocessing.SemLock(
+[rank6]: ^^^^^^^^^^^^^^^^^^^^^^^^^
+[rank6]: OSError: [Errno 28] No space left on device
+[rank0]:[W309 17:04:38.228986039 ProcessGroupNCCL.cpp:1524] Warning: WARNING: destroy_process_group() was not called before program exit, which can leak resources. For more info, please see https://pytorch.org/docs/stable/distributed.html#shutdown (function operator())
+[rank5]:[W309 17:04:38.547654961 ProcessGroupNCCL.cpp:1524] Warning: WARNING: destroy_process_group() was not called before program exit, which can leak resources. For more info, please see https://pytorch.org/docs/stable/distributed.html#shutdown (function operator())
+[rank2]:[W309 17:04:38.725243170 ProcessGroupNCCL.cpp:1524] Warning: WARNING: destroy_process_group() was not called before program exit, which can leak resources. For more info, please see https://pytorch.org/docs/stable/distributed.html#shutdown (function operator())
+[rank6]:[W309 17:04:39.775916194 ProcessGroupNCCL.cpp:1524] Warning: WARNING: destroy_process_group() was not called before program exit, which can leak resources. For more info, please see https://pytorch.org/docs/stable/distributed.html#shutdown (function operator())
+[rank3]:[W309 17:04:39.906748747 ProcessGroupNCCL.cpp:1524] Warning: WARNING: destroy_process_group() was not called before program exit, which can leak resources. For more info, please see https://pytorch.org/docs/stable/distributed.html#shutdown (function operator())
+[rank1]:[W309 17:04:39.092233950 ProcessGroupNCCL.cpp:1524] Warning: WARNING: destroy_process_group() was not called before program exit, which can leak resources. For more info, please see https://pytorch.org/docs/stable/distributed.html#shutdown (function operator())
+[rank4]:[W309 17:04:39.101225015 ProcessGroupNCCL.cpp:1524] Warning: WARNING: destroy_process_group() was not called before program exit, which can leak resources. For more info, please see https://pytorch.org/docs/stable/distributed.html#shutdown (function operator())
+[rank7]:[W309 17:04:39.138781864 ProcessGroupNCCL.cpp:1524] Warning: WARNING: destroy_process_group() was not called before program exit, which can leak resources. For more info, please see https://pytorch.org/docs/stable/distributed.html#shutdown (function operator())
+W0309 17:04:39.582000 9566 site-packages/torch/distributed/elastic/multiprocessing/api.py:908] Sending process 9662 closing signal SIGTERM
+W0309 17:04:39.582000 9566 site-packages/torch/distributed/elastic/multiprocessing/api.py:908] Sending process 9663 closing signal SIGTERM
+W0309 17:04:39.583000 9566 site-packages/torch/distributed/elastic/multiprocessing/api.py:908] Sending process 9664 closing signal SIGTERM
+W0309 17:04:39.583000 9566 site-packages/torch/distributed/elastic/multiprocessing/api.py:908] Sending process 9665 closing signal SIGTERM
+W0309 17:04:39.583000 9566 site-packages/torch/distributed/elastic/multiprocessing/api.py:908] Sending process 9666 closing signal SIGTERM
+W0309 17:04:39.583000 9566 site-packages/torch/distributed/elastic/multiprocessing/api.py:908] Sending process 9668 closing signal SIGTERM
+W0309 17:04:39.584000 9566 site-packages/torch/distributed/elastic/multiprocessing/api.py:908] Sending process 9669 closing signal SIGTERM
+E0309 17:04:41.364000 9566 site-packages/torch/distributed/elastic/multiprocessing/api.py:882] failed (exitcode: 1) local_rank: 5 (pid: 9667) of binary: /workspace/miniconda3/envs/specforge/bin/python3
+Traceback (most recent call last):
+ File "", line 198, in _run_module_as_main
+ File "", line 88, in _run_code
+ File "/workspace/miniconda3/envs/specforge/lib/python3.11/site-packages/torch/distributed/run.py", line 940, in
+ main()
+ File "/workspace/miniconda3/envs/specforge/lib/python3.11/site-packages/torch/distributed/elastic/multiprocessing/errors/__init__.py", line 357, in wrapper
+ return f(*args, **kwargs)
+ ^^^^^^^^^^^^^^^^^^
+ File "/workspace/miniconda3/envs/specforge/lib/python3.11/site-packages/torch/distributed/run.py", line 936, in main
+ run(args)
+ File "/workspace/miniconda3/envs/specforge/lib/python3.11/site-packages/torch/distributed/run.py", line 927, in run
+ elastic_launch(
+ File "/workspace/miniconda3/envs/specforge/lib/python3.11/site-packages/torch/distributed/launcher/api.py", line 156, in __call__
+ return launch_agent(self._config, self._entrypoint, list(args))
+ ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+ File "/workspace/miniconda3/envs/specforge/lib/python3.11/site-packages/torch/distributed/launcher/api.py", line 293, in launch_agent
+ raise ChildFailedError(
+torch.distributed.elastic.multiprocessing.errors.ChildFailedError:
+============================================================
+scripts/train_dflash_lora_inject.py FAILED
+------------------------------------------------------------
+Failures:
+
+------------------------------------------------------------
+Root Cause (first observed failure):
+[0]:
+ time : 2026-03-09_17:04:39
+ host : job-006ce80a7c47-20260302193512-674f5ccb6f-hjq4c
+ rank : 5 (local_rank: 5)
+ exitcode : 1 (pid: 9667)
+ error_file:
+ traceback : To enable traceback see: https://pytorch.org/docs/stable/elastic/errors.html
+============================================================
diff --git a/syxin/dflash_lora_changelog.md b/syxin/dflash_lora_changelog.md
new file mode 100644
index 0000000000000000000000000000000000000000..09cdba4e72c1d91eff75bb1a974f2784f2bfca65
--- /dev/null
+++ b/syxin/dflash_lora_changelog.md
@@ -0,0 +1,232 @@
+# DFlash LoRA 全部改动记录
+
+## 概述
+
+为了让 Qwen3-8B DFlash LoRA 训练在 2×H100 上跑通(解决 OOM),共新增/修改了 **5 个文件,1084 行代码**。改动分为两大阶段:基础搭建 + OOM 修复。
+
+---
+
+## 新增文件清单
+
+| 文件 | 行数 | 用途 |
+|------|------|------|
+| `specforge/core/dflash_lora.py` | 453 | 训练 wrapper(OnlineDFlashLoRAModel) |
+| `specforge/modeling/draft/dflash_lora.py` | 141 | LoRA draft 模型(DFlashLoRADraftModel) |
+| `scripts/train_dflash_lora.py` | 449 | 训练入口脚本 |
+| `scripts/run_train_dflash_lora.sh` | 31 | 启动 shell 脚本 |
+| `configs/qwen3-8b-dflash-lora.json` | 10 | LoRA 配置文件 |
+
+---
+
+## Step 1 完成过程
+
+### 1.1 分析现有代码
+
+首先分析了非 LoRA 版 `train_dflash.py` 的完整流程:
+
+```
+input_ids → target_model.generate_dflash_data() → hidden_states
+ → OnlineDFlashModel.forward():
+ 1. 截断到 block 边界
+ 2. prepare_noise_input(): anchor 保留,其余 → MASK
+ 3. embed_tokens(noise_input_ids) → noise_embedding
+ 4. 构建 DFlash attention mask
+ 5. draft_model(noise_embedding, target_hidden, mask)
+ 6. lm_head(hidden) → logits → CE loss
+```
+
+非 LoRA 版使用独立的小型 draft model + 冻结 target model 提取 hidden states。
+
+### 1.2 确定 LoRA 版设计差异
+
+| 方面 | 非 LoRA 版 (`train_dflash.py`) | LoRA 版 (`train_dflash_lora.py`) |
+|------|------|------|
+| Draft model | 自定义小模型 (1-10 层) | Qwen3-8B + PEFT LoRA |
+| Target model | 冻结大模型提取 hidden states | 无需 — 模型用自身表征 |
+| Attention | 自定义 Qwen3DFlashAttention,KV = [ctx, noise] concat | 标准 HF attention + DFlash mask |
+| KV 结构 | Q_LEN = noise_len, KV_LEN = 2×noise_len | Q_LEN = KV_LEN = seq_len |
+| 可训练参数 | 全部 draft model 参数 | 仅 LoRA (q/k/v/o_proj) |
+
+### 1.3 新建 LoRA 版三个核心文件
+
+#### `specforge/modeling/draft/dflash_lora.py` — DFlashLoRADraftModel
+
+- `from_pretrained()`: 加载 Qwen3-8B,注入 PEFT LoRA,支持 `attn_implementation` 参数
+- `forward()`: 标准 HF forward,支持 `output_hidden_states` 参数(chunked loss 需要)
+- `get_lm_head()`: 穿透 PEFT 层级获取 lm_head 引用
+- `gradient_checkpointing_enable()`: 代理到底层模型
+- `save_pretrained()`: 仅保存 LoRA adapter 权重
+
+#### `specforge/core/dflash_lora.py` — OnlineDFlashLoRAModel
+
+- `prepare_noise_input()`: context 部分保持不变,block 部分只保留 anchor,其余替换为 MASK
+- `build_dflash_full_attn_mask_fast()`: 向量化构建 4D additive mask `[bsz, 1, seq, seq]`
+- `_compute_loss_weights()`: context + anchor 权重为 0,非 anchor 权重为 1(或 decay)
+- `_full_lm_loss()`: 标准 CE loss 路径
+- `_compute_accuracy()`: block-wise acceptance rate(累积正确预测长度 / block 非 anchor 长度)
+- `forward()`: 完整训练 forward pass
+
+LoRA 版 mask 规则:
+- context token i → 因果注意力 (j ≤ i)
+- block token i (属于 block b) → 所有 context + 同 block 内双向注意力
+
+#### `scripts/train_dflash_lora.py` — 训练脚本
+
+- 参数解析:model/lora/dataset/training/output/distributed/tracker 7 组参数
+- `build_model()`: 加载模型 + 注入 LoRA + 包装 OnlineDFlashLoRAModel
+- `build_dataloader()`: 复用 `build_eagle3_dataset` 和 `prepare_dp_dataloaders`
+- FSDP 包装 + BF16Optimizer
+- 训练循环:forward → backward → accumulation → optimizer step
+- checkpoint 保存/恢复
+
+---
+
+## OOM 修复改动(4 项)
+
+### 改动 1: FSDP FULL_SHARD (ZeRO-3)
+
+**问题**: `SHARD_GRAD_OP` (ZeRO-2) 每卡持有完整 Qwen3-8B 参数 (~16GB bf16)
+
+**修复**: `train_dflash_lora.py:362`
+```python
+# 之前
+sharding_strategy=ShardingStrategy.SHARD_GRAD_OP
+# 之后
+sharding_strategy=ShardingStrategy.FULL_SHARD
+```
+
+**效果**: 参数跨卡分片,每卡省 ~8-12GB
+
+### 改动 2: batch_size=1 + accumulation_steps=8
+
+**问题**: `batch_size=2` 时峰值显存过高
+
+**修复**: `run_train_dflash_lora.sh`
+```bash
+--batch-size 1 \
+--accumulation-steps 8 \
+```
+
+**效果**: 等效 global batch size 不变,峰值显存减半
+
+### 改动 3: flex_attention + BlockMask 替换 4D additive mask
+
+**问题**: 带 4D additive mask 时 SDPA 无法使用 FlashAttention kernel → fallback 到 math backend → 每层 materialize 完整 `[bsz, 32heads, 2048, 2048]` attention scores
+
+**修复**: 从非 LoRA 版 `dflash.py` 移植 `_get_or_create_block_mask()` 方法,适配 LoRA 场景
+
+涉及文件:
+
+1. **`specforge/core/dflash_lora.py`**
+ - `__init__()`: 添加 `attention_backend` 参数(默认 `"flex_attention"`),BlockMask 缓存字段
+ - 新增 `_get_or_create_block_mask()`: 用 `create_block_mask()` 构建零显存的 BlockMask
+ - `forward()`: 根据 `attention_backend` 选择 BlockMask 或 additive mask
+
+2. **`specforge/modeling/draft/dflash_lora.py`**
+ - `from_pretrained()`: 当 backend 为 flex_attention 时,传 `attn_implementation="flex_attention"` 给 HuggingFace
+
+3. **`scripts/train_dflash_lora.py`**
+ - `parse_args()`: `--attention-backend` 参数 (`flex_attention` | `additive`)
+ - `build_model()`: 根据 backend 选择 `attn_implementation`
+
+BlockMask mask function(LoRA 版):
+```python
+def dflash_lora_mask_fn(b, h, q_idx, kv_idx):
+ # Context query: 标准因果
+ is_q_ctx = q_idx < context_len
+ ctx_visible = is_q_ctx & (kv_idx <= q_idx)
+
+ # Block query: 全部 context + 同 block 双向
+ is_q_block = q_idx >= context_len
+ is_k_ctx = kv_idx < context_len
+ q_block_id = (q_idx - context_len) // block_size
+ k_block_id = (kv_idx - context_len) // block_size
+ block_attend_ctx = is_q_block & is_k_ctx
+ block_attend_same = is_q_block & (~is_k_ctx) & (q_block_id == k_block_id)
+
+ return ctx_visible | (block_attend_ctx | block_attend_same)
+```
+
+**验证**: 手动逐元素对比 BlockMask 和 additive mask 输出,三组测试 (context_len=4/0, seq=12/16/64) pattern 完全一致。
+
+**效果**: 不再 fallback 到 SDPA math backend,省去 `[bsz, heads, seq, seq]` attention scores 显存
+
+### 改动 4: chunked cross-entropy loss
+
+**问题**: `[bsz, 2048, 151936]` bf16 logits ≈ 1.18GB,加梯度 ~2.4GB+
+
+**修复**: 从非 LoRA 版 `dflash.py:419-478` 移植 chunked loss
+
+涉及文件:
+
+1. **`specforge/core/dflash_lora.py`**
+ - `__init__()`: 添加 `lm_head_chunk_size` 参数(默认 0 = 不启用)
+ - 新增 `_chunked_lm_loss()`: 分 chunk 过 lm_head + CE loss + gradient checkpointing
+ - 提取 `_full_lm_loss()`: 原始非 chunked 路径
+ - `forward()`: `lm_head_chunk_size > 0` 时走 chunked 路径
+
+2. **`specforge/modeling/draft/dflash_lora.py`**
+ - `forward()`: 新增 `output_hidden_states` 参数,True 时返回 last hidden state 而非 logits
+ - `get_lm_head()`: 穿透 PEFT 层级返回 `base_model.lm_head` 引用
+
+3. **`scripts/train_dflash_lora.py`**
+ - `parse_args()`: `--lm-head-chunk-size` 参数(默认 0,推荐 256)
+ - `build_model()`: 传递到 OnlineDFlashLoRAModel
+
+Chunked loss 核心逻辑:
+```python
+# 分 chunk 计算,每 chunk 用 gradient checkpointing(backward 时重算 logits,不存储)
+for start in range(0, effective_len, chunk_size):
+ end = min(start + chunk_size, effective_len)
+ chunk_loss, chunk_weight = grad_checkpoint(
+ _chunk_ce, # lm_head + CE
+ hidden[:, start:end, :], # 只取当前 chunk
+ input_ids[:, start:end],
+ combined_mask[:, start:end],
+ use_reentrant=False,
+ )
+ total_loss += chunk_loss
+ total_weight += chunk_weight
+loss = total_loss / total_weight
+```
+
+**效果**: logits 峰值显存从 `O(seq_len × vocab_size)` 降至 `O(chunk_size × vocab_size)`,256 chunk → ~150MB vs 1.18GB
+
+---
+
+## 当前训练命令
+
+```bash
+bash run_train_dflash_lora.sh 2 # 2 = GPU 数量
+```
+
+对应完整参数:
+```bash
+torchrun --nproc_per_node 2 scripts/train_dflash_lora.py \
+ --model-path /workspace/Qwen3-8B \
+ --train-data-path /workspace/hanrui/datasets/Nemotron-CodeAlpaca-qwen3-8b-800K \
+ --output-dir outputs/qwen3-8b-dflash-lora \
+ --lora-config configs/qwen3-8b-dflash-lora.json \
+ --block-size 16 \
+ --max-length 2048 \
+ --batch-size 1 \
+ --num-epochs 3 \
+ --learning-rate 2e-4 \
+ --accumulation-steps 8 \
+ --loss-decay-gamma 7 \
+ --attention-backend flex_attention \
+ --lm-head-chunk-size 256 \
+ --gradient-checkpointing \
+ --chat-template qwen \
+ --log-interval 50 \
+ --save-interval 500
+```
+
+---
+
+## 待验证
+
+- [ ] 跑 `bash run_train_dflash_lora.sh 2` 确认不再 OOM
+- [ ] 确认无 SDPA math fallback warning
+- [ ] 观察 GPU 显存峰值
+- [ ] 确认 loss 下降和 accuracy 上升趋势正常
diff --git a/syxin/eval_accepted_length.md b/syxin/eval_accepted_length.md
new file mode 100644
index 0000000000000000000000000000000000000000..5e9b4426efc43c8630650db25d5c7b060410cd56
--- /dev/null
+++ b/syxin/eval_accepted_length.md
@@ -0,0 +1,217 @@
+# DFlash-LoRA-Inject 评测:Accepted Length & Accuracy
+
+## 为什么不能用 sglang 在线评测?
+
+DFlash-LoRA-Inject 的推理需要**逐层注入 target 模型的 hidden states** 到 draft 模型中,
+这是 LoRA-Inject 训练时的核心机制。但 sglang 不支持这种推理模式:
+
+| sglang 算法 | 问题 |
+|---|---|
+| `STANDALONE` | 把 draft 当独立自回归模型跑,**完全忽略 layer injection**。merged 模型 ≈ 原始 Qwen3-8B,accept_length 恒 ≈ 4.7,跟 LoRA 训没训没关系 |
+| `DFLASH` | 期望 DFlash-b16 架构(5 层 + fc + hidden_norm),跟 LoRA-Inject(36 层全模型)结构不匹配 |
+
+因此必须**离线评测**:加载 target + draft 两个模型,手动实现带 layer injection 的 speculative decoding 循环。
+
+---
+
+## 基本信息
+
+| 项目 | 路径 / 值 |
+|---|---|
+| conda 环境 | `spec` |
+| 基座模型(target) | `/workspace/models/Qwen3-8B` |
+| 训练输出(最终 ckpt) | `.../outputs/qwen3-8b-dflash-lora-inject/epoch_3_step_1400` |
+| 合并后 draft 模型 | `.../outputs/qwen3-8b-dflash-lora-inject-merged` |
+| 评测脚本 | `/workspace/hanrui/syxin_old/eval_dflash_lora_inject.py` |
+| 本地数据集 | `/workspace/hanrui/datasets/{humaneval,mtbench,gsm8k}` |
+| 结果输出目录 | `/workspace/hanrui/syxin_old/Specforge/benchmarks/results/` |
+| GPU | 8 × H100 80GB(单卡即可,需 ~32GB 加载两个 8B 模型) |
+
+---
+
+## Step 1:合并 LoRA 权重
+
+LoRA-Inject 训练只保存 adapter 权重,评测时需要完整模型。
+
+```bash
+conda activate spec
+
+python3 -c "
+from peft import PeftModel
+from transformers import AutoModelForCausalLM, AutoTokenizer
+import torch, os
+
+BASE = '/workspace/models/Qwen3-8B'
+ADAPTER = '/workspace/hanrui/syxin_old/Specforge/outputs/qwen3-8b-dflash-lora-inject/epoch_3_step_1400'
+MERGED = '/workspace/hanrui/syxin_old/Specforge/outputs/qwen3-8b-dflash-lora-inject-merged'
+
+if os.path.exists(MERGED):
+ print(f'[skip] Merged model already exists: {MERGED}')
+else:
+ print('[1/4] Loading base model to CPU ...')
+ model = AutoModelForCausalLM.from_pretrained(BASE, torch_dtype=torch.bfloat16, device_map='cpu')
+ print('[2/4] Loading LoRA adapter ...')
+ model = PeftModel.from_pretrained(model, ADAPTER)
+ print('[3/4] Merging weights ...')
+ model = model.merge_and_unload()
+ print('[4/4] Saving merged model ...')
+ os.makedirs(MERGED, exist_ok=True)
+ model.save_pretrained(MERGED, safe_serialization=True)
+ AutoTokenizer.from_pretrained(BASE).save_pretrained(MERGED)
+ print(f'Done. Merged model saved to: {MERGED}')
+"
+```
+
+> 耗时约 3–5 分钟,CPU 内存占用 ≈ 16 GB。已存在则自动跳过。
+
+---
+
+## Step 2:离线评测 accepted length
+
+**不需要启动 sglang server**,直接跑:
+
+### 全部 Bench(推荐)
+
+```bash
+bash /workspace/hanrui/syxin_old/run_bench_dflash.sh
+```
+
+### 单独跑 / 快速测试
+
+```bash
+# 只跑 HumanEval
+bash /workspace/hanrui/syxin_old/run_bench_dflash.sh humaneval
+
+# 快速测试(每个 bench 20 条)
+bash /workspace/hanrui/syxin_old/run_bench_dflash.sh --quick
+
+# 指定 checkpoint
+bash /workspace/hanrui/syxin_old/run_bench_dflash.sh --ckpt epoch_0_step_1000
+
+# 组合
+bash /workspace/hanrui/syxin_old/run_bench_dflash.sh humaneval gsm8k --quick
+```
+
+### 或者直接调 Python
+
+```bash
+conda activate spec
+
+python3 /workspace/hanrui/syxin_old/eval_dflash_lora_inject.py \
+ --benchmarks humaneval mtbench gsm8k \
+ --block-size 16 \
+ --max-new-tokens 512 \
+ --temperature 0.0
+```
+
+---
+
+## 结果文件说明
+
+结果保存在 `results/` 下,文件名示例:
+```
+dflash_lora_inject_offline_epoch_3_step_1400_20260314_150000.json
+```
+
+```json
+{
+ "model": "dflash-lora-inject/epoch_3_step_1400",
+ "block_size": 16,
+ "humaneval": {
+ "avg_accept_length": 3.42,
+ "total_tokens": 28500,
+ "latency": 120.5,
+ "throughput": 236.5,
+ "num_samples": 164,
+ "num_verify_rounds": 8320
+ },
+ "mtbench": { ... },
+ "gsm8k": { ... }
+}
+```
+
+| 字段 | 含义 |
+|---|---|
+| `avg_accept_length` | **核心指标**:平均每次 verify 接受的 token 数(含 injection)。越高越好,`1.0` = draft 完全无效 |
+| `total_tokens` | 总生成 token 数 |
+| `throughput` | tokens/s(离线评测,不含 batching 优化) |
+| `num_verify_rounds` | 总验证轮数 |
+
+---
+
+## 对比 baseline
+
+对比未经 LoRA 训练的原始 Qwen3-8B 当 draft 的 accept_length:
+
+```bash
+python3 /workspace/hanrui/syxin_old/eval_dflash_lora_inject.py \
+ --merged-path /workspace/models/Qwen3-8B \
+ --benchmarks humaneval mtbench gsm8k \
+ --num-samples 50
+```
+
+> 这会用原始 Qwen3-8B 同时当 target 和 draft(带 injection),
+> 对比 LoRA 训练前后 accept_length 是否有提升。
+
+---
+
+## 如何测其他 checkpoint
+
+```bash
+# 方法 1:直接加载 adapter(自动 merge,不保存)
+python3 /workspace/hanrui/syxin_old/eval_dflash_lora_inject.py \
+ --ckpt epoch_0_step_1000 \
+ --benchmarks humaneval --num-samples 50
+
+# 方法 2:预先 merge 到不同目录
+python3 -c "
+from peft import PeftModel
+from transformers import AutoModelForCausalLM, AutoTokenizer
+import torch, os
+BASE = '/workspace/models/Qwen3-8B'
+ADAPTER = '/workspace/hanrui/syxin_old/Specforge/outputs/qwen3-8b-dflash-lora-inject/epoch_0_step_1000'
+MERGED = '/workspace/hanrui/syxin_old/Specforge/outputs/qwen3-8b-dflash-lora-inject-merged-epoch_0_step_1000'
+model = AutoModelForCausalLM.from_pretrained(BASE, torch_dtype=torch.bfloat16, device_map='cpu')
+model = PeftModel.from_pretrained(model, ADAPTER).merge_and_unload()
+os.makedirs(MERGED, exist_ok=True)
+model.save_pretrained(MERGED, safe_serialization=True)
+AutoTokenizer.from_pretrained(BASE).save_pretrained(MERGED)
+"
+
+python3 /workspace/hanrui/syxin_old/eval_dflash_lora_inject.py \
+ --merged-path .../qwen3-8b-dflash-lora-inject-merged-epoch_0_step_1000 \
+ --benchmarks humaneval --num-samples 50
+```
+
+可用 checkpoint:`epoch_0_step_500` / `epoch_0_step_1000` / `epoch_0_step_1400` / `epoch_2_step_34500` / `epoch_2_step_35000` / `epoch_3_step_1400`
+
+---
+
+## 常见问题
+
+### Q1:accept_length 和 STANDALONE 模式下差不多(都 ≈ 4.7)
+
+这说明 layer injection 没有真正起作用。检查:
+- 评测脚本确实用的是 `eval_dflash_lora_inject.py`(离线),不是 sglang bench
+- merged 模型确实是 LoRA-Inject 版本(不是原始 Qwen3-8B)
+
+### Q2:OOM(单卡放不下两个 8B 模型)
+
+两个 bf16 的 Qwen3-8B ≈ 32GB,单卡 H100 80GB 够用。如果 OOM:
+- 检查是否有其他进程占用显存
+- 减小 `--max-new-tokens`(试 256)
+- 减小 `--num-samples`
+
+### Q3:数据集下载失败(无外网)
+
+评测脚本优先读本地文件:
+
+| bench | 本地文件 |
+|---|---|
+| GSM8K | `/workspace/hanrui/datasets/gsm8k/test.jsonl` |
+| MT-Bench | `/workspace/hanrui/datasets/mtbench/question.jsonl` |
+| HumanEval | `/workspace/hanrui/datasets/humaneval/test.jsonl` |
+
+---
+
+*基座:`/workspace/models/Qwen3-8B` | 最终 ckpt:`epoch_3_step_1400` | block_size:16*
diff --git a/syxin/eval_dflash_b16_baseline.py b/syxin/eval_dflash_b16_baseline.py
new file mode 100644
index 0000000000000000000000000000000000000000..7676ece84c4e23f5f7cf6871fd6f49b38662db27
--- /dev/null
+++ b/syxin/eval_dflash_b16_baseline.py
@@ -0,0 +1,354 @@
+#!/usr/bin/env python3
+"""
+Offline evaluation for DFlash-b16 baseline: measure accepted length.
+8 GPUs parallel, each GPU loads target + draft independently.
+
+Usage:
+ # 8 GPUs
+ torchrun --nproc_per_node 8 eval_dflash_b16_baseline.py
+
+ # quick test
+ torchrun --nproc_per_node 8 eval_dflash_b16_baseline.py --num-samples 20
+
+ # single GPU
+ python3 eval_dflash_b16_baseline.py --benchmarks humaneval
+"""
+import argparse
+import json
+import os
+import sys
+import time
+from typing import List, Optional, Tuple
+
+import torch
+import torch.nn as nn
+import torch.distributed as dist
+from tqdm import tqdm
+from transformers import AutoModel, AutoModelForCausalLM, AutoTokenizer, DynamicCache
+
+# Add DFlash model path so we can import utils
+sys.path.insert(0, "/workspace/models/Qwen3-8B-DFlash-b16")
+from utils import extract_context_feature, sample
+
+# ──────────────────────────────────────────────────────────────────
+BASE_MODEL = "/workspace/models/Qwen3-8B"  # default value of --base-model (target model path)
+DRAFT_MODEL = "/workspace/models/Qwen3-8B-DFlash-b16"  # default value of --draft-model; same directory that is put on sys.path above for `utils`
+RESULT_DIR = "/workspace/hanrui/syxin_old/Specforge/benchmarks/results"  # default value of --output-dir
+
+
+# ──────────────────────────────────────────────────────────────────
+# Distributed helpers
+# ──────────────────────────────────────────────────────────────────
+def is_distributed():  # True only when torch.distributed is available AND a process group has been initialised
+ return dist.is_available() and dist.is_initialized()
+
+def get_rank():  # Rank of this process in the process group; 0 when not running distributed
+ return dist.get_rank() if is_distributed() else 0
+
+def get_world_size():  # Number of processes in the process group; 1 when not running distributed
+ return dist.get_world_size() if is_distributed() else 1
+
+def is_main():  # True on rank 0 (also True in a single-process run, where get_rank() returns 0)
+ return get_rank() == 0
+
+def print_rank0(*args, **kwargs):  # print() that is a no-op on every rank except rank 0; arguments are forwarded unchanged
+ if is_main():
+ print(*args, **kwargs)
+
+def split_list(lst, rank, world_size):  # Round-robin shard: returns the items whose index i satisfies i % world_size == rank, in original order
+ return [x for i, x in enumerate(lst) if i % world_size == rank]
+
+
+# ──────────────────────────────────────────────────────────────────
+# Prompts
+# ──────────────────────────────────────────────────────────────────
+def load_prompts(bench_name: str, num_samples: Optional[int] = None) -> List[str]:  # Build the prompt strings for one benchmark: local JSONL if the file exists, otherwise datasets.load_dataset; optionally keep only the first num_samples
+ local_paths = {
+ "humaneval": "/workspace/hanrui/datasets/humaneval/test.jsonl",
+ "mtbench": "/workspace/hanrui/datasets/mtbench/question.jsonl",
+ "gsm8k": "/workspace/hanrui/datasets/gsm8k/test.jsonl",
+ }
+ prompts = []  # stays empty when bench_name matches none of the branches below (no error is raised for an unknown name)
+ path = local_paths.get(bench_name)  # None for any name other than the three keys above
+ if path and os.path.exists(path):  # prefer the local copy of the dataset
+ with open(path) as f:
+ for line in f:  # one JSON object per line
+ item = json.loads(line)
+ if bench_name == "humaneval":
+ p = f"Write a solution to the following problem and make sure that it passes the tests:\n```python\n{item['prompt']}\n```"
+ elif bench_name == "mtbench":
+ p = item.get("turns", [item.get("prompt", "")])[0]  # first turn only; falls back to "prompt" (or "") when "turns" is missing
+ elif bench_name == "gsm8k":
+ p = item["question"] + "\nPlease reason step by step, and put your final answer within \\boxed{}."
+ else:
+ p = str(item)  # not reachable with the current local_paths keys, since path is None for other names
+ prompts.append(p)
+ else:
+ from datasets import load_dataset  # imported lazily: only needed on this fallback path
+ if bench_name == "humaneval":
+ ds = load_dataset("openai/openai_humaneval", split="test")
+ prompts = [f"Write a solution to the following problem and make sure that it passes the tests:\n```python\n{x['prompt']}\n```" for x in ds]
+ elif bench_name == "mtbench":
+ ds = load_dataset("HuggingFaceH4/mt_bench_prompts", split="train")
+ prompts = [x["prompt"][0] for x in ds]  # first turn only, like the local-file branch
+ elif bench_name == "gsm8k":
+ ds = load_dataset("openai/gsm8k", "main", split="test")
+ prompts = [x["question"] + "\nPlease reason step by step, and put your final answer within \\boxed{}." for x in ds]
+ if num_samples is not None:  # truncation is applied to the full list, before it is sharded across ranks by the caller
+ prompts = prompts[:num_samples]
+ return prompts
+
+
+# ──────────────────────────────────────────────────────────────────
+# spec_generate with acceptance_lengths returned
+# (Same logic as DFlashDraftModel.spec_generate but returns accept lens)
+# ──────────────────────────────────────────────────────────────────
+@torch.inference_mode()
+def spec_generate_b16(  # Block-wise speculative decoding for a single sequence: the draft fills a block, the target verifies it; returns (output_ids, acceptance_lengths)
+ draft_model,  # must expose block_size, mask_token_id and target_layer_ids (all read below)
+ target_model: nn.Module,  # must expose model.embed_tokens and lm_head (both used below)
+ input_ids: torch.LongTensor,  # prompt token ids; the buffers below are allocated with batch dimension 1
+ max_new_tokens: int = 512,
+ temperature: float = 0.0,  # passed to sample() for the target's tokens only
+ stop_token_ids: Optional[List[int]] = None,  # generation stops once any of these ids appears in the generated part
+) -> Tuple[torch.Tensor, List[int]]:
+ """Same as DFlashDraftModel.spec_generate but also returns acceptance_lengths."""
+ draft_model.eval()
+ device = target_model.device if hasattr(target_model, 'device') else input_ids.device
+ num_input_tokens = input_ids.shape[1]
+ max_length = num_input_tokens + max_new_tokens
+ block_size = draft_model.block_size
+ mask_token_id = draft_model.mask_token_id
+
+ output_ids = torch.full(  # token buffer pre-filled with the mask id; the extra block_size slots keep start:start+block_size in range for every start < max_length
+ (1, max_length + block_size), mask_token_id,
+ dtype=torch.long, device=device,
+ )
+ position_ids = torch.arange(output_ids.shape[1], device=device).unsqueeze(0)
+
+ past_key_values_target = DynamicCache()  # separate KV caches for target and draft
+ past_key_values_draft = DynamicCache()
+
+ # Prefill
+ output = target_model(  # one target pass over the whole prompt, filling the target cache
+ input_ids,
+ position_ids=position_ids[:, :num_input_tokens],
+ past_key_values=past_key_values_target,
+ use_cache=True,
+ logits_to_keep=1,
+ output_hidden_states=True,
+ )
+ output_ids[:, :num_input_tokens] = input_ids
+ output_ids[:, num_input_tokens:num_input_tokens + 1] = sample(output.logits, temperature)  # first generated token comes from the prefill logits
+ target_hidden = extract_context_feature(output.hidden_states, draft_model.target_layer_ids)  # conditioning features for the draft, built from the target hidden states at target_layer_ids
+
+ # Decode
+ acceptance_lengths = []  # one entry per verify round
+ start = num_input_tokens  # index of the last committed token, which becomes position 0 of the next block
+ while start < max_length:
+ block_output_ids = output_ids[:, start:start + block_size].clone()  # position 0 is the committed token, the rest are still mask ids; cloned so draft guesses never touch output_ids
+ block_position_ids = position_ids[:, start:start + block_size]
+ noise_embedding = target_model.model.embed_tokens(block_output_ids)  # block tokens embedded with the target's embedding table
+
+ draft_logits = target_model.lm_head(  # draft outputs are projected to vocabulary logits with the target's lm_head
+ draft_model(
+ target_hidden=target_hidden,
+ noise_embedding=noise_embedding,
+ position_ids=position_ids[:, past_key_values_draft.get_seq_length():start + block_size],  # positions from the current draft-cache length up to the end of this block
+ past_key_values=past_key_values_draft,
+ use_cache=True,
+ is_causal=False,
+ )[:, -block_size + 1:, :]  # keep the last block_size - 1 positions, i.e. the slots after the block's first token
+ )
+ past_key_values_draft.crop(start)  # crop the draft cache to `start` before the next round
+ block_output_ids[:, 1:] = sample(draft_logits)  # no temperature is passed here, so sample() runs with its default
+
+ output = target_model(  # verify pass: the target scores the whole proposed block at once
+ block_output_ids,
+ position_ids=block_position_ids,
+ past_key_values=past_key_values_target,
+ use_cache=True,
+ output_hidden_states=True,
+ )
+
+ posterior = sample(output.logits, temperature)  # the target's own token choice after each block position
+ acceptance_length = (  # number of leading draft tokens that equal the target's choices; cumprod zeroes everything after the first mismatch
+ (block_output_ids[:, 1:] == posterior[:, :-1])
+ .cumprod(dim=1).sum(dim=1)[0].item()
+ )
+ output_ids[:, start:start + int(acceptance_length) + 1] = block_output_ids[:, :int(acceptance_length) + 1]  # commit the block's first token plus the accepted draft tokens
+ output_ids[:, start + int(acceptance_length) + 1] = posterior[:, int(acceptance_length)]  # then the target's token for the first position that was not accepted
+ start += int(acceptance_length) + 1  # the token just written becomes the first token of the next block
+ past_key_values_target.crop(start)  # crop the target cache to the new `start`
+ target_hidden = extract_context_feature(
+ output.hidden_states, draft_model.target_layer_ids
+ )[:, :int(acceptance_length) + 1, :]  # keep features only for the positions committed this round
+ acceptance_lengths.append(int(acceptance_length) + 1)  # recorded value = accepted draft tokens + 1, so the minimum per round is 1
+
+ if stop_token_ids is not None and any(  # stop as soon as any stop id appears among the committed generated tokens
+ sid in output_ids[:, num_input_tokens:start] for sid in stop_token_ids
+ ):
+ break
+
+ output_ids = output_ids[:, :max_length]  # drop the block_size slack and anything generated past max_length
+ output_ids = output_ids[:, output_ids[0] != mask_token_id]  # remove every position that still holds the mask id
+ if stop_token_ids is not None:
+ stop_t = torch.tensor(stop_token_ids, device=output_ids.device)
+ stop_idx = torch.isin(output_ids[0][num_input_tokens:], stop_t).nonzero(as_tuple=True)[0]
+ if stop_idx.numel() > 0:
+ output_ids = output_ids[:, :num_input_tokens + stop_idx[0] + 1]  # cut right after the first stop token (the stop token itself is kept)
+
+ return output_ids, acceptance_lengths
+
+
+# ──────────────────────────────────────────────────────────────────
+def parse_args():  # Parse the command-line options of this script and return the argparse namespace
+ p = argparse.ArgumentParser()
+ p.add_argument("--base-model", default=BASE_MODEL)  # target model path
+ p.add_argument("--draft-model", default=DRAFT_MODEL)  # DFlash draft model path
+ p.add_argument("--max-new-tokens", type=int, default=512)
+ p.add_argument("--temperature", type=float, default=0.0)
+ p.add_argument("--benchmarks", nargs="+", default=["humaneval", "mtbench", "gsm8k"])  # one or more names understood by load_prompts
+ p.add_argument("--num-samples", type=int, default=None)  # None keeps every prompt of each benchmark
+ p.add_argument("--output-dir", default=RESULT_DIR)
+ return p.parse_args()
+
+
+def main():  # Entry point: load target + draft on this rank's GPU, run each benchmark on this rank's shard of prompts, reduce the statistics, and write a JSON report on rank 0
+ args = parse_args()
+
+ local_rank = int(os.environ.get("LOCAL_RANK", 0))  # both default to single-process values when the env vars are unset
+ world_size = int(os.environ.get("WORLD_SIZE", 1))
+
+ if world_size > 1:  # a process group is only created for multi-process launches
+ dist.init_process_group(backend="nccl")
+ torch.cuda.set_device(local_rank)
+
+ device = f"cuda:{local_rank}"
+ rank = get_rank()
+
+ print_rank0(f"Running DFlash-b16 baseline on {world_size} GPU(s)")
+
+ # ── Load models ──
+ print_rank0(f"Loading target: {args.base_model}")
+ target_model = AutoModelForCausalLM.from_pretrained(  # every rank loads its own full copy of the target
+ args.base_model,
+ torch_dtype=torch.bfloat16,
+ device_map=device,
+ trust_remote_code=True,
+ )
+ target_model.eval()
+
+ print_rank0(f"Loading DFlash-b16 draft: {args.draft_model}")
+ draft_model = AutoModel.from_pretrained(  # loaded with trust_remote_code, then moved to this rank's device
+ args.draft_model,
+ torch_dtype=torch.bfloat16,
+ trust_remote_code=True,
+ ).to(device)
+ draft_model.eval()
+
+ tokenizer = AutoTokenizer.from_pretrained(args.base_model, trust_remote_code=True)
+ stop_token_ids = [tokenizer.eos_token_id]  # generation stops on the tokenizer's EOS id only
+
+ print_rank0(f"DFlash-b16: block_size={draft_model.block_size}, "
+ f"target_layer_ids={draft_model.target_layer_ids}, "
+ f"num_layers={len(draft_model.layers)}")
+
+ # ── Run benchmarks ──
+ results = {"model": "Qwen3-8B-DFlash-b16", "type": "baseline",
+ "block_size": draft_model.block_size}
+
+ for bench_name in args.benchmarks:
+ print_rank0(f"\n{'='*60}")
+ print_rank0(f"Benchmark: {bench_name} ({world_size} GPUs)")
+ print_rank0(f"{'='*60}")
+
+ all_prompts = load_prompts(bench_name, args.num_samples)  # every rank loads the full prompt list ...
+ my_prompts = split_list(all_prompts, rank, world_size)  # ... and keeps only its round-robin shard
+ print_rank0(f"Total {len(all_prompts)} prompts, ~{len(my_prompts)} per GPU")  # the per-GPU figure printed is rank 0's shard size
+
+ local_accept_lengths = []  # per-round accept lengths collected on this rank
+ local_tokens = 0  # generated tokens on this rank
+ t0 = time.time()
+
+ iterator = tqdm(my_prompts, desc=f"[GPU{rank}] {bench_name}", unit="sample",
+ disable=(rank != 0))  # progress bar is shown on rank 0 only
+ for prompt in iterator:
+ messages = [{"role": "user", "content": prompt}]  # each prompt is sent as a single user turn
+ text = tokenizer.apply_chat_template(messages, tokenize=False, add_generation_prompt=True)
+ input_ids = tokenizer(text, return_tensors="pt").input_ids.to(device)
+
+ output_ids, accept_lens = spec_generate_b16(
+ draft_model=draft_model,
+ target_model=target_model,
+ input_ids=input_ids,
+ max_new_tokens=args.max_new_tokens,
+ temperature=args.temperature,
+ stop_token_ids=stop_token_ids,
+ )
+
+ local_accept_lengths.extend(accept_lens)
+ num_gen = output_ids.shape[1] - input_ids.shape[1]  # generated tokens = returned length minus prompt length
+ local_tokens += num_gen
+
+ if rank == 0 and len(local_accept_lengths) > 0:
+ avg = sum(local_accept_lengths) / len(local_accept_lengths)  # running average over rank 0's rounds only
+ iterator.set_postfix(accept_len=f"{avg:.2f}", tokens=local_tokens, gen=num_gen)
+
+ elapsed = time.time() - t0  # wall time of this rank's own loop; measured before the reductions below
+
+ # ── Gather ──
+ if world_size > 1:
+ local_sum = torch.tensor(sum(local_accept_lengths), dtype=torch.float64, device=device)
+ local_count = torch.tensor(len(local_accept_lengths), dtype=torch.long, device=device)
+ local_tok = torch.tensor(local_tokens, dtype=torch.long, device=device)
+ dist.all_reduce(local_sum, op=dist.ReduceOp.SUM)  # sums are reduced in place across ranks
+ dist.all_reduce(local_count, op=dist.ReduceOp.SUM)
+ dist.all_reduce(local_tok, op=dist.ReduceOp.SUM)
+ total_accept_sum = local_sum.item()
+ total_count = local_count.item()
+ total_tokens = local_tok.item()
+ else:
+ total_accept_sum = sum(local_accept_lengths)
+ total_count = len(local_accept_lengths)
+ total_tokens = local_tokens
+
+ avg_accept_length = total_accept_sum / max(total_count, 1)  # mean over verify rounds; max(..., 1) avoids dividing by zero when there were none
+ throughput = total_tokens / elapsed if elapsed > 0 else 0  # reduced token total divided by THIS rank's elapsed time
+
+ print_rank0(f"\n{bench_name} Results:")
+ print_rank0(f" Avg Accept Length: {avg_accept_length:.3f}")
+ print_rank0(f" Total tokens: {total_tokens}")
+ print_rank0(f" Latency: {elapsed:.1f}s")
+ print_rank0(f" Throughput: {throughput:.1f} tok/s (aggregate {world_size} GPUs)")
+ print_rank0(f" Num verify rounds: {total_count}")
+ print_rank0(f" Num samples: {len(all_prompts)}")
+
+ results[bench_name] = {  # built on every rank, but only rank 0 writes it out below
+ "avg_accept_length": avg_accept_length,
+ "total_tokens": total_tokens,
+ "latency": elapsed,
+ "throughput": throughput,
+ "num_samples": len(all_prompts),  # total prompts across all ranks, not this rank's shard
+ "num_verify_rounds": total_count,
+ "num_gpus": world_size,
+ }
+
+ # ── Save ──
+ if is_main():
+ os.makedirs(args.output_dir, exist_ok=True)
+ timestamp = time.strftime("%Y%m%d_%H%M%S")  # local-time stamp that makes the file name unique per run
+ result_file = os.path.join(
+ args.output_dir,
+ f"dflash_b16_baseline_offline_{timestamp}.json",
+ )
+ with open(result_file, "w") as f:
+ json.dump(results, f, indent=2)
+ print(f"\nResults saved to: {result_file}")
+
+ if world_size > 1:  # mirrors the conditional init_process_group at the top
+ dist.destroy_process_group()
+
+
+if __name__ == "__main__":
+ main()
diff --git a/syxin/eval_dflash_lora_inject.py b/syxin/eval_dflash_lora_inject.py
new file mode 100644
index 0000000000000000000000000000000000000000..b3756b752d1df969a0263d608b09221c1b0d5970
--- /dev/null
+++ b/syxin/eval_dflash_lora_inject.py
@@ -0,0 +1,627 @@
+#!/usr/bin/env python3
+"""
+Offline evaluation for DFlash-LoRA-Inject: measure accepted length & speedup.
+Aligned with official DFlash benchmark.py methodology.
+
+Unlike DFlash-b16 which uses a small 5-layer draft model with fc/hidden_norm,
+LoRA-Inject uses a full Qwen3-8B with LoRA adapters that receives target hidden
+states via layer-by-layer injection.
+
+Usage:
+ conda activate spec
+
+ # 8 GPU parallel (default, all 10 benchmarks)
+ torchrun --nproc_per_node 8 eval_dflash_lora_inject.py
+
+ # single GPU
+ python3 eval_dflash_lora_inject.py
+
+ # specific checkpoint / benchmark
+ torchrun --nproc_per_node 8 eval_dflash_lora_inject.py --ckpt epoch_0_step_1000 --datasets humaneval
+
+ # quick test
+ torchrun --nproc_per_node 8 eval_dflash_lora_inject.py --max-samples 20
+"""
+import argparse
+import json
+import os
+import random
+import sys
+import time
+import warnings
+from itertools import chain
+from types import SimpleNamespace
+from typing import List, Optional, Tuple
+
+import numpy as np
+import torch
+import torch.nn as nn
+import torch.distributed as dist
+from peft import PeftModel
+from tqdm import tqdm
+from transformers import AutoModelForCausalLM, AutoTokenizer, DynamicCache
+
+# Import official dataset loader
+sys.path.insert(0, "/workspace/hanrui/dflash")
+from model.utils import load_and_process_dataset
+
+# ──────────────────────────────────────────────────────────────────
+# Config defaults
+# ──────────────────────────────────────────────────────────────────
+BASE_MODEL = "/workspace/models/Qwen3-8B"
+ADAPTER_ROOT = "/workspace/hanrui/syxin/Specforge/outputs/qwen3-8b-dflash-lora-inject"  # presumably the directory that holds the per-checkpoint LoRA adapters — confirm in the argument handling
+DEFAULT_CKPT = "epoch_3_step_1400"  # presumably the checkpoint sub-directory used when none is given — confirm in the argument handling
+MASK_TOKEN_ID = 151669 # Qwen3 <|mask|>; also the default mask_token_id of ar_generate
+BLOCK_SIZE = 16
+RESULT_DIR = "/workspace/hanrui/syxin/Specforge/benchmarks/results"
+
+# Official benchmark tasks (from run_benchmark.sh)
+OFFICIAL_TASKS = {  # task name -> integer; presumably the number of samples evaluated per task — TODO confirm where it is consumed
+ "gsm8k": 128,
+ "math500": 128,
+ "aime24": 30,
+ "aime25": 30,
+ "humaneval": 164,
+ "mbpp": 128,
+ "livecodebench": 128,
+ "swe-bench": 128,
+ "mt-bench": 80,
+ "alpaca": 128,
+}
+
+
+# ──────────────────────────────────────────────────────────────────
+# CUDA-synchronised timer (matches official benchmark.py)
+# ──────────────────────────────────────────────────────────────────
+def cuda_time() -> float:  # time.perf_counter() reading taken right after torch.cuda.synchronize()
+ torch.cuda.synchronize()  # wait for queued GPU work so the timestamp is not taken early
+ return time.perf_counter()
+
+
+def has_flash_attn() -> bool:  # True if the flash_attn package can be imported; otherwise prints a warning and returns False
+ try:
+ import flash_attn # noqa: F401
+ return True
+ except ImportError:  # only a missing package is handled; other import-time errors propagate
+ print("[WARN] flash_attn not installed, falling back to sdpa.")
+ return False
+
+
+# ──────────────────────────────────────────────────────────────────
+# Distributed helpers (mirrors official distributed.py)
+# ──────────────────────────────────────────────────────────────────
+def dist_init():  # Initialise the NCCL process group from environment variables; warns and does nothing when RANK is not set
+ if "RANK" not in os.environ:  # plain `python3 script.py` launch: stay single-process
+ warnings.warn("RANK not set. Skipping distributed init.")
+ return
+ dist.init_process_group(backend="nccl", init_method="env://")
+
+def dist_rank():  # Global rank read from the RANK environment variable; 0 when unset
+ return int(os.environ.get("RANK", 0))
+
+def dist_size():  # World size read from the WORLD_SIZE environment variable; 1 when unset
+ return int(os.environ.get("WORLD_SIZE", 1))
+
+def dist_local_rank():  # Local rank read from the LOCAL_RANK environment variable; 0 when unset
+ return int(os.environ.get("LOCAL_RANK", 0))
+
+def dist_is_main():  # True when dist_rank() is 0, which includes the case where RANK is unset
+ return dist_rank() == 0
+
+def dist_gather(obj, dst=0):  # Gather one Python object per rank: returns the list of objects on rank 0, None on other ranks, or [obj] when no process group is initialised
+ if not dist.is_initialized():
+ return [obj]  # single-process fallback keeps the "list of per-rank objects" return shape
+ if dist_is_main():  # NOTE: the receiving branch is chosen by rank 0, not by `dst`, so this assumes dst == 0
+ objs = [None for _ in range(dist_size())]  # one slot per rank, filled by gather_object
+ dist.gather_object(obj, objs, dst=dst)
+ return objs
+ else:
+ dist.gather_object(obj, dst=dst)  # non-receiving ranks pass no output list
+ return None
+
+def print_rank0(*args, **kwargs):  # print() that only produces output when dist_is_main() is True; arguments are forwarded unchanged
+ if dist_is_main():
+ print(*args, **kwargs)
+
+
+# ──────────────────────────────────────────────────────────────────
+# Sampling (matches official model/utils.py::sample)
+# ──────────────────────────────────────────────────────────────────
+def sample(logits: torch.Tensor, temperature: float = 0.0) -> torch.Tensor:  # Pick token ids from logits: argmax over the last dim when temperature < 1e-5, else one multinomial draw per position from softmax(logits / temperature)
+ if temperature < 1e-5:  # treated as greedy decoding
+ return torch.argmax(logits, dim=-1)
+ bsz, seq_len, vocab_size = logits.shape  # the sampling path requires exactly 3 dimensions
+ logits = logits.view(-1, vocab_size)  # flatten to rows of vocab_size so each position is sampled independently
+ logits = logits / temperature
+ probs = torch.softmax(logits, dim=-1)
+ return torch.multinomial(probs, num_samples=1).view(bsz, seq_len)  # reshaped back to (bsz, seq_len)
+
+
+# ──────────────────────────────────────────────────────────────────
+# Build DFlash attention mask (vectorized, no Python loops)
+# ──────────────────────────────────────────────────────────────────
+def build_dflash_mask(ctx_len: int, block_size: int, device, dtype=torch.bfloat16):  # Returns an additive mask of shape (1, 1, ctx_len + block_size, ctx_len + block_size): 0 where attention is allowed, torch.finfo(dtype).min elsewhere
+ """
+ Build DFlash attention mask for [context | block] sequence.
+ - Context part: standard causal
+ - Block part: each token sees all context + all tokens in same block (bidirectional)
+ """
+ full_len = ctx_len + block_size
+ neg_inf = torch.finfo(dtype).min  # most negative finite value of dtype, used as the "blocked" fill value
+
+ mask = torch.full((1, 1, full_len, full_len), neg_inf, device=device, dtype=dtype)  # start fully blocked, then open the allowed regions
+
+ if ctx_len > 0:
+ ctx_rows = torch.arange(ctx_len, device=device)
+ ctx_cols = torch.arange(ctx_len, device=device)
+ causal = ctx_cols.unsqueeze(0) <= ctx_rows.unsqueeze(1)  # True where column j <= row i
+ mask[0, 0, :ctx_len, :ctx_len].masked_fill_(causal, 0)  # context rows: causal over context columns; block columns stay blocked for them
+
+ if ctx_len > 0:
+ mask[0, 0, ctx_len:, :ctx_len] = 0  # block rows may attend to every context column
+ mask[0, 0, ctx_len:, ctx_len:] = 0  # block rows may attend to every block column (bidirectional inside the block)
+
+ return mask
+
+
+# ──────────────────────────────────────────────────────────────────
+# Pure autoregressive generation (target model only, no draft)
+# Used for AR baseline timing -- avoids inflating AR time with draft overhead.
+# ──────────────────────────────────────────────────────────────────
+@torch.inference_mode()
+def ar_generate(
+    target_model: nn.Module,
+    input_ids: torch.LongTensor,
+    max_new_tokens: int = 2048,
+    mask_token_id: int = MASK_TOKEN_ID,
+    temperature: float = 0.0,
+    stop_token_ids: Optional[List[int]] = None,
+) -> SimpleNamespace:
+    """
+    Pure autoregressive generation using only the target model.
+    Mirrors official benchmark.py with block_size=1 (no draft model involved).
+    Returns SimpleNamespace matching official dflash_generate output format.
+
+    Args:
+        target_model: Called with token ids plus ``position_ids``,
+            ``past_key_values`` and ``use_cache=True``; its output must expose
+            ``.logits``.
+        input_ids: Prompt token ids. The output buffer is allocated with a
+            batch dimension of 1.
+        max_new_tokens: Upper bound on the number of generated tokens.
+        mask_token_id: Filler id for slots that are not generated yet; every
+            column still equal to it is removed from the returned ids.
+        temperature: Forwarded to ``sample``.
+        stop_token_ids: Optional ids that end generation; the output is cut
+            right after the first one found among the generated tokens.
+
+    Returns:
+        SimpleNamespace with ``output_ids``, ``num_input_tokens``,
+        ``num_output_tokens``, ``time_to_first_token``,
+        ``time_per_output_token`` and ``acceptance_lengths`` (a list of ones,
+        one entry per output token).
+    """
+    device = input_ids.device
+    num_input_tokens = input_ids.shape[1]
+    max_length = num_input_tokens + max_new_tokens
+
+    # Buffer starts out as all mask ids; the one extra slot keeps the write
+    # performed after the last decode step in bounds.
+    output_ids = torch.full(
+        (1, max_length + 1), mask_token_id,
+        dtype=torch.long, device=device,
+    )
+    output_ids[:, :num_input_tokens] = input_ids
+    position_ids = torch.arange(output_ids.shape[1], device=device).unsqueeze(0)
+    past_key_values = DynamicCache()
+
+    # Prefill: run the whole prompt once and sample the first new token.
+    prefill_start = cuda_time()
+    output = target_model(
+        input_ids,
+        position_ids=position_ids[:, :num_input_tokens],
+        past_key_values=past_key_values,
+        use_cache=True,
+        logits_to_keep=1,
+        output_hidden_states=False,
+    )
+    first_token = sample(output.logits, temperature)
+    output_ids[:, num_input_tokens:num_input_tokens + 1] = first_token
+    time_to_first_token = cuda_time() - prefill_start
+
+    # Decode (autoregressive, one token at a time)
+    decode_start = cuda_time()
+    start = num_input_tokens
+
+    while start < max_length:
+        # Feed the most recently produced token at its own position.
+        cur_token = output_ids[:, start:start + 1]
+        cur_pos = position_ids[:, start:start + 1]
+
+        output = target_model(
+            cur_token,
+            position_ids=cur_pos,
+            past_key_values=past_key_values,
+            use_cache=True,
+            output_hidden_states=False,
+        )
+
+        next_token = sample(output.logits, temperature)
+        start += 1
+        output_ids[:, start:start + 1] = next_token
+        past_key_values.crop(start)
+
+        # Check stop tokens (matches official: check all generated)
+        if stop_token_ids is not None and any(
+            sid in output_ids[:, num_input_tokens:] for sid in stop_token_ids
+        ):
+            break
+
+    # Trim to the length budget, then drop every slot that still holds the mask id.
+    output_ids = output_ids[:, :max_length]
+    output_ids = output_ids[:, output_ids[0] != mask_token_id]
+    if stop_token_ids is not None:
+        # Cut right after the first stop token among the generated ids.
+        stop_t = torch.tensor(stop_token_ids, device=output_ids.device)
+        stop_idx = torch.isin(output_ids[0][num_input_tokens:], stop_t).nonzero(as_tuple=True)[0]
+        if stop_idx.numel() > 0:
+            output_ids = output_ids[:, :num_input_tokens + stop_idx[0] + 1]
+
+    num_output_tokens = output_ids.shape[1] - num_input_tokens
+    total_decode_time = cuda_time() - decode_start
+    # max(..., 1) avoids dividing by zero when nothing was generated.
+    time_per_output_token = total_decode_time / max(num_output_tokens, 1)
+
+    return SimpleNamespace(
+        output_ids=output_ids,
+        num_input_tokens=num_input_tokens,
+        num_output_tokens=num_output_tokens,
+        time_to_first_token=time_to_first_token,
+        time_per_output_token=time_per_output_token,
+        acceptance_lengths=[1] * max(num_output_tokens, 0),  # AR: always 1
+    )
+
+
+# ──────────────────────────────────────────────────────────────────
+# Core: spec_generate with layer-by-layer injection (KV-cached)
+# ──────────────────────────────────────────────────────────────────
+@torch.inference_mode()
+def spec_generate_inject(
+    target_model: nn.Module,
+    draft_model: nn.Module,
+    input_ids: torch.LongTensor,
+    max_new_tokens: int = 2048,
+    block_size: int = 16,
+    mask_token_id: int = MASK_TOKEN_ID,
+    temperature: float = 0.0,
+    stop_token_ids: Optional[List[int]] = None,
+) -> SimpleNamespace:
+    """
+    Speculative generation using DFlash-LoRA-Inject inference pattern.
+    Returns SimpleNamespace matching official dflash_generate output format.
+
+    Each iteration drafts one block: the draft layers run over
+    [target hidden states of the committed tokens | block embeddings], layer
+    by layer, and the target model then verifies the proposed block using its
+    KV cache. The longest prefix of draft tokens that equals the target's own
+    samples is committed together with one token taken from the target.
+
+    Args:
+        target_model: Model used for prefill and verification; called with
+            ``output_hidden_states=True`` and a ``DynamicCache``.
+        draft_model: Must expose ``model.layers``, ``model.norm``,
+            ``model.rotary_emb``, ``model.embed_tokens`` and ``lm_head``.
+        input_ids: Prompt token ids. The output buffer is allocated with a
+            batch dimension of 1.
+        max_new_tokens: Upper bound on the number of generated tokens.
+        block_size: Number of positions drafted per iteration (the first one
+            is the already-known token).
+        mask_token_id: Filler id for slots that are not generated yet.
+        temperature: Forwarded to ``sample`` for both draft and target.
+        stop_token_ids: Optional ids that end generation.
+
+    Returns:
+        SimpleNamespace with ``output_ids``, ``num_input_tokens``,
+        ``num_output_tokens``, ``time_to_first_token``,
+        ``time_per_output_token`` and ``acceptance_lengths`` (positions
+        committed per iteration, i.e. accepted draft tokens + 1).
+    """
+    device = input_ids.device
+    num_input_tokens = input_ids.shape[1]
+    max_length = num_input_tokens + max_new_tokens
+
+    draft_layers = draft_model.model.layers
+    draft_norm = draft_model.model.norm
+    draft_lm_head = draft_model.lm_head
+    rotary_emb = draft_model.model.rotary_emb
+    num_layers = len(draft_layers)
+
+    # block_size spare slots so the per-block writes below never run past the end.
+    output_ids = torch.full(
+        (1, max_length + block_size), mask_token_id,
+        dtype=torch.long, device=device,
+    )
+    output_ids[:, :num_input_tokens] = input_ids
+
+    # ── Prefill: target with KV cache + hidden states ──
+    prefill_start = cuda_time()
+    target_kv = DynamicCache()
+    target_output = target_model(
+        input_ids,
+        past_key_values=target_kv,
+        use_cache=True,
+        output_hidden_states=True,
+    )
+    first_token = sample(target_output.logits[:, -1:, :], temperature)
+    output_ids[:, num_input_tokens] = first_token.squeeze()
+
+    # One context tensor per draft layer, taken from hidden_states[i + 1].
+    # NOTE(review): presumably index 0 is the embedding output, so i + 1 is the
+    # output of target layer i -- confirm this matches how the draft was trained.
+    ctx_hidden_per_layer = [
+        target_output.hidden_states[i + 1]
+        for i in range(num_layers)
+    ]
+
+    time_to_first_token = cuda_time() - prefill_start
+
+    # Decode
+    decode_start = cuda_time()
+    acceptance_lengths = []
+    start = num_input_tokens
+    draft_prefill = True
+
+    while start < max_length:
+        end = min(start + block_size, max_length)
+        actual_block_size = end - start
+
+        # Slot 0 holds the last committed token; the rest are still mask ids.
+        block_ids = output_ids[:, start:end].clone()
+
+        # ── Draft: forward with layer-by-layer injection ──
+        draft_hidden = draft_model.model.embed_tokens(block_ids)
+        ctx_len = ctx_hidden_per_layer[0].shape[1]
+        # Follow the draft model's own dtype instead of hard-coding bfloat16 so
+        # the additive mask and rotary placeholder match the attention inputs.
+        compute_dtype = draft_hidden.dtype
+
+        dflash_mask = build_dflash_mask(ctx_len, actual_block_size, device, dtype=compute_dtype)
+        combined_pos = torch.arange(ctx_len + actual_block_size, device=device).unsqueeze(0)
+
+        # Uninitialized placeholder handed to rotary_emb with the positions;
+        # presumably only its dtype/device are read -- TODO confirm.
+        dummy_combined = torch.empty(1, ctx_len + actual_block_size, draft_hidden.shape[-1],
+                                     device=device, dtype=compute_dtype)
+        position_embeddings = rotary_emb(dummy_combined, combined_pos)
+
+        for layer_idx in range(num_layers):
+            # Inject this layer's target context in front of the block states.
+            target_ctx = ctx_hidden_per_layer[layer_idx]
+            combined = torch.cat([target_ctx, draft_hidden], dim=1)
+
+            layer_output = draft_layers[layer_idx](
+                combined,
+                attention_mask=dflash_mask,
+                position_ids=combined_pos,
+                position_embeddings=position_embeddings,
+            )
+            if isinstance(layer_output, tuple):
+                layer_output = layer_output[0]
+            # Keep only the block part; the context is re-injected per layer.
+            draft_hidden = layer_output[:, ctx_len:, :]
+
+        draft_hidden = draft_norm(draft_hidden)
+        draft_logits = draft_lm_head(draft_hidden)
+
+        # Logits at block slot j propose the token for slot j + 1.
+        draft_predictions = sample(draft_logits[:, :-1, :], temperature)
+        block_ids[:, 1:actual_block_size] = draft_predictions[:, :actual_block_size - 1]
+
+        # Exclude draft's first prefill from decode timing (matches official pattern)
+        if draft_prefill:
+            draft_prefill = False
+            decode_start = cuda_time()
+
+        # ── Verify: target forward on block tokens (with KV cache) ──
+        position_ids_block = torch.arange(
+            start, start + actual_block_size, device=device
+        ).unsqueeze(0)
+
+        target_verify = target_model(
+            block_ids,
+            position_ids=position_ids_block,
+            past_key_values=target_kv,
+            use_cache=True,
+            output_hidden_states=True,
+        )
+        target_tokens = sample(target_verify.logits, temperature)
+
+        # Acceptance: length of the leading run where draft == target.
+        matches = (block_ids[:, 1:actual_block_size] == target_tokens[:, :actual_block_size - 1])
+        acceptance_length = int(matches.cumprod(dim=1).sum(dim=1)[0].item())
+
+        # Commit the accepted prefix, then the target's token right after it.
+        output_ids[:, start:start + acceptance_length + 1] = block_ids[:, :acceptance_length + 1]
+        output_ids[:, start + acceptance_length + 1] = target_tokens[:, acceptance_length]
+
+        # Drop cache entries written for rejected draft positions.
+        accepted_end = start + acceptance_length + 1
+        target_kv.crop(accepted_end)
+
+        # Extend each layer's context with the hidden states of committed positions.
+        for i in range(num_layers):
+            new_hidden = target_verify.hidden_states[i + 1][:, :acceptance_length + 1, :]
+            ctx_hidden_per_layer[i] = torch.cat([ctx_hidden_per_layer[i], new_hidden], dim=1)
+
+        start += acceptance_length + 1
+        acceptance_lengths.append(acceptance_length + 1)
+
+        # Official: check ALL generated tokens
+        if stop_token_ids is not None and any(
+            sid in output_ids[:, num_input_tokens:] for sid in stop_token_ids
+        ):
+            break
+
+    # Trim to what was committed, then drop slots that still hold the mask id.
+    output_ids = output_ids[:, :min(start, max_length)]
+    output_ids = output_ids[:, output_ids[0] != mask_token_id]
+    if stop_token_ids is not None:
+        # Cut right after the first stop token among the generated ids.
+        stop_t = torch.tensor(stop_token_ids, device=output_ids.device)
+        stop_idx = torch.isin(output_ids[0][num_input_tokens:], stop_t).nonzero(as_tuple=True)[0]
+        if stop_idx.numel() > 0:
+            output_ids = output_ids[:, :num_input_tokens + stop_idx[0] + 1]
+
+    num_output_tokens = output_ids.shape[1] - num_input_tokens
+    total_decode_time = cuda_time() - decode_start
+    # max(..., 1) avoids dividing by zero when nothing was generated.
+    time_per_output_token = total_decode_time / max(num_output_tokens, 1)
+
+    return SimpleNamespace(
+        output_ids=output_ids,
+        num_input_tokens=num_input_tokens,
+        num_output_tokens=num_output_tokens,
+        time_to_first_token=time_to_first_token,
+        time_per_output_token=time_per_output_token,
+        acceptance_lengths=acceptance_lengths,
+    )
+
+
+# ──────────────────────────────────────────────────────────────────
+# Main
+# ──────────────────────────────────────────────────────────────────
+def parse_args():
+    """Parse the command-line options of the offline DFlash-LoRA-Inject eval.
+
+    Returns:
+        argparse.Namespace with ``base_model``, ``adapter_root``, ``ckpt``,
+        ``merged_path``, ``block_size``, ``max_new_tokens``, ``temperature``,
+        ``datasets``, ``max_samples`` and ``output_dir``.
+    """
+    p = argparse.ArgumentParser(description="Offline eval for DFlash-LoRA-Inject (aligned with official)")
+    p.add_argument("--base-model", default=BASE_MODEL)
+    p.add_argument("--adapter-root", default=ADAPTER_ROOT)
+    p.add_argument("--ckpt", default=DEFAULT_CKPT, help="Checkpoint folder name")
+    # The help text states the real fallback rule: main() merges on the fly
+    # whenever this path is empty or is not an existing directory.
+    p.add_argument("--merged-path",
+                   default="/workspace/hanrui/syxin/Specforge/outputs/qwen3-8b-dflash-lora-inject-merged",
+                   help="Path to pre-merged draft model. If empty or not an existing directory, "
+                        "the base model and LoRA adapter are merged on the fly.")
+    p.add_argument("--block-size", type=int, default=BLOCK_SIZE)
+    p.add_argument("--max-new-tokens", type=int, default=2048,
+                   help="Max new tokens per turn (official shell uses 2048)")
+    p.add_argument("--temperature", type=float, default=0.0)
+    p.add_argument("--datasets", nargs="+", default=list(OFFICIAL_TASKS.keys()),
+                   help="Benchmarks to run (default: all 10 official tasks)")
+    p.add_argument("--max-samples", type=int, default=None,
+                   help="Override max samples per dataset (None = use official per-task counts)")
+    p.add_argument("--output-dir", default=RESULT_DIR)
+    return p.parse_args()
+
+
+def main():
+    """Run the offline benchmark: AR baseline vs. DFlash-LoRA-Inject speculation.
+
+    Loads the target and draft models on this rank's GPU, iterates over the
+    requested datasets with samples strided across ranks, gathers the
+    per-sample results on the main rank, and writes speedup / acceptance
+    statistics to a timestamped JSON file in ``--output-dir``.
+    """
+    args = parse_args()
+
+    # Fix random seeds (matches official)
+    random.seed(0)
+    np.random.seed(0)
+    torch.manual_seed(0)
+    torch.cuda.manual_seed_all(0)
+    torch.backends.cudnn.deterministic = True
+    torch.backends.cudnn.benchmark = False
+
+    # ── Init distributed ──
+    dist_init()
+    torch.cuda.set_device(dist_local_rank())
+    device = torch.device(f"cuda:{dist_local_rank()}")
+
+    print_rank0(f"Running on {dist_size()} GPU(s)")
+
+    # Detect flash_attn (only for target model; draft needs sdpa for custom DFlash mask)
+    installed_flash_attn = has_flash_attn()
+    target_attn_impl = "flash_attention_2" if installed_flash_attn else "sdpa"
+    draft_attn_impl = "sdpa"  # DFlash injection uses custom attention mask
+    print_rank0(f"Using attn_implementation: target={target_attn_impl}, draft={draft_attn_impl}")
+
+    # ── Load models ──
+    print_rank0(f"Loading target model: {args.base_model}")
+    target_model = AutoModelForCausalLM.from_pretrained(
+        args.base_model,
+        torch_dtype=torch.bfloat16,
+        attn_implementation=target_attn_impl,
+        device_map=device,
+        trust_remote_code=True,
+    )
+    target_model.eval()
+
+    # Prefer a pre-merged draft checkpoint; otherwise merge base + LoRA in memory.
+    if args.merged_path and os.path.isdir(args.merged_path):
+        print_rank0(f"Loading pre-merged draft model: {args.merged_path}")
+        draft_model = AutoModelForCausalLM.from_pretrained(
+            args.merged_path,
+            torch_dtype=torch.bfloat16,
+            attn_implementation=draft_attn_impl,
+            device_map=device,
+            trust_remote_code=True,
+        )
+    else:
+        adapter_path = os.path.join(args.adapter_root, args.ckpt)
+        print_rank0(f"Loading base + LoRA adapter: {adapter_path}")
+        draft_model = AutoModelForCausalLM.from_pretrained(
+            args.base_model,
+            torch_dtype=torch.bfloat16,
+            attn_implementation=draft_attn_impl,
+            device_map=device,
+            trust_remote_code=True,
+        )
+        draft_model = PeftModel.from_pretrained(draft_model, adapter_path)
+        draft_model = draft_model.merge_and_unload()
+    draft_model.eval()
+
+    tokenizer = AutoTokenizer.from_pretrained(args.base_model, trust_remote_code=True)
+    stop_token_ids = [tokenizer.eos_token_id]
+
+    block_size = args.block_size
+
+    # ── Run benchmarks ──
+    all_results = {"model": f"dflash-lora-inject/{args.ckpt}", "block_size": block_size}
+
+    for dataset_name in args.datasets:
+        print_rank0(f"\n{'=' * 60}")
+        print_rank0(f"Benchmark: {dataset_name} ({dist_size()} GPUs)")
+        print_rank0(f"{'=' * 60}")
+
+        # Load dataset using official loader
+        dataset = load_and_process_dataset(dataset_name)
+
+        # Sample selection: official uses shuffle(seed=0).select()
+        max_samples = args.max_samples if args.max_samples is not None else OFFICIAL_TASKS.get(dataset_name)
+        if max_samples is not None and len(dataset) > max_samples:
+            dataset = dataset.shuffle(seed=0).select(range(max_samples))
+
+        print_rank0(f"Total {len(dataset)} samples, distributed across {dist_size()} GPUs")
+
+        responses = []
+        # Strided sharding: this rank takes every dist_size()-th sample.
+        indices = range(dist_rank(), len(dataset), dist_size())
+
+        iterator = tqdm(indices, desc=f"[GPU{dist_rank()}] {dataset_name}",
+                        unit="sample", disable=not dist_is_main())
+
+        for idx in iterator:
+            instance = dataset[idx]
+
+            # Multi-turn support (matches official benchmark.py)
+            messages = []
+            for turn_index, user_content in enumerate(instance["turns"]):
+                messages.append({"role": "user", "content": user_content})
+                input_text = tokenizer.apply_chat_template(
+                    messages, tokenize=False, add_generation_prompt=True,
+                    enable_thinking=False,
+                )
+                input_ids = tokenizer.encode(input_text, return_tensors="pt").to(device)
+
+                # Results keyed by block size: 1 = AR baseline, block_size = speculative.
+                response = {}
+
+                # AR baseline: pure target-only autoregressive (no draft overhead)
+                response[1] = ar_generate(
+                    target_model=target_model,
+                    input_ids=input_ids,
+                    max_new_tokens=args.max_new_tokens,
+                    mask_token_id=MASK_TOKEN_ID,
+                    temperature=args.temperature,
+                    stop_token_ids=stop_token_ids,
+                )
+
+                # Speculative: DFlash-LoRA-Inject
+                response[block_size] = spec_generate_inject(
+                    target_model=target_model,
+                    draft_model=draft_model,
+                    input_ids=input_ids,
+                    max_new_tokens=args.max_new_tokens,
+                    block_size=block_size,
+                    mask_token_id=MASK_TOKEN_ID,
+                    temperature=args.temperature,
+                    stop_token_ids=stop_token_ids,
+                )
+
+                # Append assistant response for multi-turn context
+                spec_response = response[block_size]
+                generated_ids = spec_response.output_ids[0, spec_response.num_input_tokens:]
+                output_text = tokenizer.decode(generated_ids, skip_special_tokens=True)
+                messages.append({"role": "assistant", "content": output_text})
+                responses.append(response)
+
+            # Progress bar shows the mean acceptance length of the last 5 responses.
+            if dist_is_main() and responses:
+                recent_tau = np.mean([np.mean(r[block_size].acceptance_lengths) for r in responses[-5:]])
+                iterator.set_postfix(accept_len=f"{recent_tau:.2f}")
+
+        # ── Gather to rank 0 (matches official) ──
+        if dist_size() > 1:
+            gathered = dist_gather(responses, dst=0)
+            if not dist_is_main():
+                continue
+            responses = list(chain(*gathered))
+        elif not dist_is_main():
+            continue
+
+        # ── Compute metrics (exact official formulas) ──
+        t1 = np.mean([r[1].time_per_output_token for r in responses])
+        tb = np.mean([r[block_size].time_per_output_token for r in responses])
+        speedup = t1 / tb if tb > 0 else 0
+
+        # Acceptance length: per-sample mean, then mean of means (official)
+        tau = np.mean([np.mean(r[block_size].acceptance_lengths) for r in responses])
+
+        # Histogram: share of draft/verify steps per committed length 0..block_size.
+        acceptance_lengths = list(chain(*[r[block_size].acceptance_lengths for r in responses]))
+        num_steps = len(acceptance_lengths)
+        # Guard the division: with no recorded steps (empty dataset, or a run
+        # where the speculative loop never iterates) the unguarded expression
+        # raised ZeroDivisionError after the whole benchmark had already run.
+        histogram = [
+            acceptance_lengths.count(b) / num_steps if num_steps else 0.0
+            for b in range(block_size + 1)
+        ]
+
+        print_rank0(f"\n{dataset_name} Results:")
+        print_rank0(f" Decoding speedup: {speedup:.2f}x")
+        print_rank0(f" Average Acceptance length: {tau:.2f}")
+        print_rank0(f" Acceptance length histogram: {[f'{x * 100:.1f}%' for x in histogram]}")
+        print_rank0(f" Num responses: {len(responses)}")
+
+        all_results[dataset_name] = {
+            "decoding_speedup": speedup,
+            "avg_accept_length": tau,
+            "acceptance_histogram": histogram,
+            "num_responses": len(responses),
+            "num_gpus": dist_size(),
+        }
+
+    # ── Save results ──
+    if dist_is_main():
+        os.makedirs(args.output_dir, exist_ok=True)
+        timestamp = time.strftime("%Y%m%d_%H%M%S")
+        result_file = os.path.join(
+            args.output_dir,
+            f"dflash_lora_inject_offline_{args.ckpt}_{timestamp}.json",
+        )
+        with open(result_file, "w") as f:
+            json.dump(all_results, f, indent=2)
+        print(f"\nResults saved to: {result_file}")
+
+
+if __name__ == "__main__":
+ main()
diff --git a/syxin/idea.md b/syxin/idea.md
new file mode 100644
index 0000000000000000000000000000000000000000..50d7e9ccdced927b2f9ce92fcd0ae0315e4db6fd
--- /dev/null
+++ b/syxin/idea.md
@@ -0,0 +1,23 @@
+现在关于target model的hidden state注入
+
+dflash的做法是,抽5层的feature过一下fc然后concat到mask token对应的hidden state前面
+
+但是如果我们的draft是用lora的原始模型
+
+我们不用这样注入
+
+我们可以直接把target model的hidden state直接层对层拉过来
+
+我是把加了lora后的模型作为draft model用的
+
+它本质上还是一个speculative decode
+
+我的想法的核心是,因为这个draft model足够大,也和target model足够像,把它转为和dflash一样每次用mask直接生成16个token,可能得到很长的accept len,以此获得加速
+
+而dflash能work的核心是,它在生成阶段是使用的部分target model的hidden state,注入到mask token的hidden state前面
+
+我们也用相同的做法
+
+带lora的模型,lora只负责让它能并行解码16个mask token,但是前面的上下文信息,依然是用原始model跑出来的,再通过注入放进draft
+
+而且由于模型结构的一致,我们可以直接层对层注入进去
\ No newline at end of file
diff --git a/syxin/launch_train.sh b/syxin/launch_train.sh
new file mode 100644
index 0000000000000000000000000000000000000000..78e7ffc4ee53178703afd1d45ab1b491484fedb2
--- /dev/null
+++ b/syxin/launch_train.sh
@@ -0,0 +1,37 @@
+#!/bin/bash
+# Launch 8-process torchrun training of scripts/train_dflash_lora_inject.py
+# on Qwen3-8B from the Specforge checkout.
+set -euo pipefail
+
+cd /workspace/hanrui/syxin/Specforge
+
+# Cache locations and CUDA allocator settings picked up by the trainer.
+export TORCHINDUCTOR_CACHE_DIR=/workspace/hanrui/cache/compiled_kernels
+export SPECFORGE_DATA_NUM_PROC=16
+export PYTORCH_CUDA_ALLOC_CONF=expandable_segments:True
+export PYTORCH_ALLOC_CONF=expandable_segments:True
+export HF_DATASETS_CACHE=/workspace/hanrui/cache/hf_datasets
+export HF_HOME=/workspace/hanrui/cache/hf_home
+
+# Trainer arguments, kept in an array so each flag sits on its own line.
+TRAIN_ARGS=(
+    --target-model-path /workspace/models/Qwen3-8B
+    --target-model-backend hf
+    --train-data-path /workspace/hanrui/datasets/Nemotron-CodeAlpaca-qwen3-8b-800K
+    --output-dir outputs/qwen3-8b-sft-32gpu-v2
+    --block-size 16
+    --attention-backend additive
+    --attn-implementation sdpa
+    --max-length 2048
+    --batch-size 4
+    --accumulation-steps 8
+    --num-epochs 3
+    --learning-rate 5e-5
+    --loss-decay-gamma 7
+    --gradient-checkpointing
+    --chat-template qwen
+    --log-interval 50
+    --save-interval 500
+    --cache-dir /workspace/hanrui/cache
+    --lora-rank 32
+    --lora-alpha 64
+    --lora-dropout 0.1
+    --trust-remote-code
+    --dataloader-num-workers 0
+)
+
+torchrun --nproc_per_node=8 \
+    scripts/train_dflash_lora_inject.py \
+    "${TRAIN_ARGS[@]}"
diff --git a/syxin/launch_train_wrapper.py b/syxin/launch_train_wrapper.py
new file mode 100644
index 0000000000000000000000000000000000000000..fcba064f3792044451c288d58b9a15801773c26e
--- /dev/null
+++ b/syxin/launch_train_wrapper.py
@@ -0,0 +1,21 @@
+#!/usr/bin/env python3
+"""
+Python wrapper to launch bash training script via torchrun
+"""
+import subprocess
+import sys
+import os
+
+if __name__ == "__main__":
+    # Forward every command-line argument unchanged to the bash launcher.
+    launcher = "/workspace/hanrui/syxin/run_train_multinode.sh"
+    completed = subprocess.run(
+        ["bash", launcher, *sys.argv[1:]],
+        env=os.environ.copy(),
+    )
+
+    # Propagate the launcher's exit status to whoever invoked this wrapper.
+    sys.exit(completed.returncode)
diff --git a/syxin/list.md b/syxin/list.md
new file mode 100644
index 0000000000000000000000000000000000000000..bf988b2ab86c4998e2edb9210fd6d71974f4be00
--- /dev/null
+++ b/syxin/list.md
@@ -0,0 +1,12 @@
+### 1. `train_dflash_lora.py`
+* 加了lora,原来是调用小模型,现在是hidden states+lora预测。
+* `dflash_lora_mask_fn`函数是在处理预测的那一块草稿Block时,可以同时看到这一块里的所有词。
+
+### 2. OOM优化
+* 分片策略ZeRO-3,FSDP切分从`SHARD_GRAD_OP`升级到`FULL_SHARD`。
+* `batch-size=1`,`accumulation-steps=8`。
+* 参考之前的代码用了FlexAttention(`dflash_lora_mask_fn`)。
+* `_chunked_lm_loss()`,把loss按chunk(`--lm-head-chunk-size 256`)分块计算,并配合梯度检查点(gradient checkpointing)。
+
+### 运行
+* bash /workspace/hanrui/junquan/SpecForge/scripts/run_train_dflash_lora.sh 2
\ No newline at end of file
diff --git a/syxin/merge_lora.py b/syxin/merge_lora.py
new file mode 100644
index 0000000000000000000000000000000000000000..728027da00127040922cf688fc557daeaa8852d2
--- /dev/null
+++ b/syxin/merge_lora.py
@@ -0,0 +1,66 @@
+"""
+Step 1: Merge DFlash-LoRA adapter into base model.
+Usage:
+ conda activate sglang
+ python3 merge_lora.py
+ python3 merge_lora.py --ckpt epoch_2_step_15000 # 测其他 checkpoint
+"""
+import argparse
+import os
+
+import torch
+from peft import PeftModel
+from transformers import AutoModelForCausalLM, AutoTokenizer
+
+BASE_MODEL = "/workspace/models/Qwen3-8B"
+OUTPUT_ROOT = "/workspace/hanrui/syxin/Specforge/outputs/qwen3-8b-dflash-lora"
+MERGE_ROOT = "/workspace/hanrui/syxin/Specforge/outputs/qwen3-8b-dflash-lora-merged"
+
+def parse_args():
+    """Parse ``--ckpt`` (adapter folder name) and ``--merged-path`` (output directory)."""
+    parser = argparse.ArgumentParser()
+    parser.add_argument(
+        "--ckpt",
+        default="epoch_3_step_18576",
+        help="Checkpoint folder name under OUTPUT_ROOT",
+    )
+    parser.add_argument(
+        "--merged-path",
+        default=MERGE_ROOT,
+        help="Where to save the merged model",
+    )
+    return parser.parse_args()
+
+
+def main():
+    """Merge the selected LoRA checkpoint into the base model and save the result.
+
+    Loads ``BASE_MODEL`` on CPU in bfloat16, applies the adapter found at
+    ``OUTPUT_ROOT/<ckpt>``, merges the weights, and writes the merged model
+    plus the base tokenizer to ``--merged-path``. Returns early when that
+    path already exists.
+
+    Raises:
+        FileNotFoundError: If the adapter directory does not exist.
+    """
+    args = parse_args()
+    adapter_path = os.path.join(OUTPUT_ROOT, args.ckpt)
+    merged_path = args.merged_path
+
+    # NOTE(review): the skip is keyed on the output path only, so running with
+    # a different --ckpt but the same --merged-path merges nothing new.
+    if os.path.exists(merged_path):
+        print(f"[skip] Merged model already exists: {merged_path}")
+        return
+
+    # Explicit raise instead of assert: asserts are stripped under `python -O`,
+    # which would postpone the failure to the adapter load below.
+    if not os.path.isdir(adapter_path):
+        raise FileNotFoundError(f"Adapter not found: {adapter_path}")
+
+    print(f"Base model : {BASE_MODEL}")
+    print(f"Adapter : {adapter_path}")
+    print(f"Output : {merged_path}")
+    print()
+
+    print("[1/4] Loading base model to CPU ...")
+    model = AutoModelForCausalLM.from_pretrained(
+        BASE_MODEL,
+        torch_dtype=torch.bfloat16,
+        device_map="cpu",
+    )
+
+    print("[2/4] Loading LoRA adapter ...")
+    model = PeftModel.from_pretrained(model, adapter_path)
+
+    print("[3/4] Merging weights ...")
+    model = model.merge_and_unload()
+
+    print("[4/4] Saving merged model ...")
+    os.makedirs(merged_path, exist_ok=True)
+    model.save_pretrained(merged_path, safe_serialization=True)
+    # Ship the base tokenizer alongside the merged weights.
+    AutoTokenizer.from_pretrained(BASE_MODEL).save_pretrained(merged_path)
+
+    print(f"\nDone. Merged model saved to: {merged_path}")
+
+
+if __name__ == "__main__":
+ main()
diff --git a/syxin/oom_fix_progress.md b/syxin/oom_fix_progress.md
new file mode 100644
index 0000000000000000000000000000000000000000..864a0dcb2ed406cb8f882edbdd1a3d821fdfee06
--- /dev/null
+++ b/syxin/oom_fix_progress.md
@@ -0,0 +1,42 @@
+# DFlash LoRA OOM 修复记录
+
+## OOM 根因分析
+
+1. **SHARD_GRAD_OP (ZeRO-2)** — 每卡持有完整 Qwen3-8B 参数 (~16GB bf16),参数未分片
+2. **SDPA + 4D additive mask** — FlashAttention 不支持 4D additive mask,fallback 到 math backend,每层 materialize 完整 attention scores (`bsz × 32heads × 2048 × 2048`)
+3. **大 vocab logits** — `[bsz, 2048, 151936]` bf16 ≈ 1.18GB,加上梯度和 boolean indexing 拷贝,峰值 ~3-4GB
+4. **机器只有 2 张 H100**,脚本默认 `NUM_GPUS=4`
+
+## 已完成的改动
+
+### 1. FSDP sharding 改为 FULL_SHARD (ZeRO-3)
+- 文件: `SpecForge/scripts/train_dflash_lora.py:347`
+- `ShardingStrategy.SHARD_GRAD_OP` → `ShardingStrategy.FULL_SHARD`
+- 效果: 参数跨卡分片,每卡省 ~8-12GB
+
+### 2. 降 batch-size,提高 accumulation-steps
+- 文件: `SpecForge/scripts/run_train_dflash_lora.sh`
+- `--batch-size 2` → `1`,`--accumulation-steps 4` → `8`
+- 效果: 等效 global batch size 不变,峰值显存减半
+
+## 待验证 / 后续优化
+
+- [ ] 运行时传 `bash run_train_dflash_lora.sh 2` 确保用 2 卡
+- [x] 如仍 OOM,考虑 chunked cross-entropy loss 避免大 vocab logits 全量 materialize
+- [x] 长期可探索自定义 attention kernel 支持 block-sparse mask,绕过 SDPA math fallback
+
+### 3. flex_attention + BlockMask 替换 4D additive mask
+- 文件: `SpecForge/specforge/core/dflash_lora.py`, `specforge/modeling/draft/dflash_lora.py`, `scripts/train_dflash_lora.py`
+- 从非 LoRA 版 `dflash.py` 移植 `_get_or_create_block_mask()` 方法,适配 LoRA 场景 (Q_LEN == KV_LEN == seq_len)
+- LoRA 版 mask: context causal + block bidirectional (非 LoRA 版是 [context, noise] concat KV)
+- 用 `--attention-backend flex_attention` 启用 (默认),退回 `--attention-backend additive` 走原有 4D mask
+- HuggingFace model 用 `attn_implementation="flex_attention"` 加载
+- 效果: 不再 fallback 到 SDPA math backend,省去 `[bsz, heads, seq, seq]` attention scores 的显存
+
+### 4. chunked cross-entropy loss
+- 文件: `SpecForge/specforge/core/dflash_lora.py`, `specforge/modeling/draft/dflash_lora.py`, `scripts/train_dflash_lora.py`
+- 从非 LoRA 版 `dflash.py` 移植 `_chunked_lm_loss()` 方法
+- 分 chunk 过 lm_head + CE loss + gradient checkpointing,避免 materialize 完整 `[bsz, seq, vocab]` logits
+- 用 `--lm-head-chunk-size 256` 启用 (默认 0 = 不启用)
+- `DFlashLoRADraftModel.forward()` 新增 `output_hidden_states` 参数,chunked 时返回 hidden states
+- 效果: logits 峰值显存从 O(seq_len × vocab_size) 降至 O(chunk_size × vocab_size)
diff --git a/syxin/requirements.txt b/syxin/requirements.txt
new file mode 100644
index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391
diff --git a/syxin/run_bench.sh b/syxin/run_bench.sh
new file mode 100644
index 0000000000000000000000000000000000000000..9164e86a1863415ce07f659233ff65cff7840615
--- /dev/null
+++ b/syxin/run_bench.sh
@@ -0,0 +1,68 @@
+#!/bin/bash
+# Step 3: Run HumanEval / MT-Bench / GSM8K benchmarks.
+# Run AFTER start_server.sh is up.
+# Usage:
+#   bash run_bench.sh                  # all three benches, full dataset
+#   bash run_bench.sh humaneval        # only humaneval
+#   bash run_bench.sh mtbench gsm8k    # pick any subset
+
+# pipefail: without it the status of the benchmark pipeline is tee's, so a
+# crashed bench_eagle3.py would still be reported as success.
+set -eo pipefail
+
+INTRANET_IP=10.1.1.131
+PORT=30000
+BASE_MODEL=/workspace/models/Qwen3-8B
+MERGED=/workspace/hanrui/syxin_old/Specforge/outputs/qwen3-8b-dflash-lora-merged
+BENCH_DIR=/workspace/hanrui/syxin_old/Specforge/benchmarks
+RESULT_DIR=$BENCH_DIR/results
+
+# ---- sanity check ----
+echo "Checking server at http://$INTRANET_IP:$PORT ..."
+curl -sf "http://$INTRANET_IP:$PORT/v1/models" > /dev/null || {
+    echo "[ERROR] Server not reachable. Start it first: bash start_server.sh"
+    exit 1
+}
+echo "Server OK."
+
+mkdir -p "$RESULT_DIR"
+cd "$BENCH_DIR"
+export PYTHONPATH="/workspace/hanrui/syxin_old/Specforge:${PYTHONPATH:-}"
+
+# ---- decide which benches to run ----
+TARGETS=("$@")
+if [ ${#TARGETS[@]} -eq 0 ]; then
+    TARGETS=(humaneval mtbench gsm8k)
+fi
+
+# Map each bench name to its "name:num_samples" spec; an array keeps every
+# spec a separate argument without relying on word splitting.
+BENCH_ARGS=()
+for t in "${TARGETS[@]}"; do
+    case $t in
+        humaneval) BENCH_ARGS+=("humaneval:164") ;;
+        mtbench)   BENCH_ARGS+=("mtbench:80") ;;
+        gsm8k)     BENCH_ARGS+=("gsm8k:1319") ;;
+        *)
+            echo "[ERROR] Unknown bench: $t (choices: humaneval mtbench gsm8k)"
+            exit 1
+            ;;
+    esac
+done
+
+TIMESTAMP=$(date +%Y%m%d_%H%M%S)
+echo "Running: ${BENCH_ARGS[*]}"
+echo "Results -> $RESULT_DIR"
+echo ""
+
+python3 bench_eagle3.py \
+    --model-path "$BASE_MODEL" \
+    --speculative-draft-model-path "$MERGED" \
+    --host "$INTRANET_IP" \
+    --port "$PORT" \
+    --config-list "16,4,1,4" \
+    --benchmark-list "${BENCH_ARGS[@]}" \
+    --output-dir "$RESULT_DIR" \
+    --name "dflash_lora_${TIMESTAMP}" \
+    --skip-launch-server \
+    2>&1 | tee "$RESULT_DIR/bench_${TIMESTAMP}.log"
+
+echo ""
+echo "Done. Latest result files:"
+# The listing is informational only: "|| true" keeps a missing *.jsonl match
+# (or head closing the pipe early) from failing the script under pipefail.
+ls -lht "$RESULT_DIR"/*.jsonl 2>/dev/null | head -5 || true
diff --git a/syxin/run_bench_dflash.sh b/syxin/run_bench_dflash.sh
new file mode 100644
index 0000000000000000000000000000000000000000..f485fef5d3303163db8b2ea3ef38f59a91793c92
--- /dev/null
+++ b/syxin/run_bench_dflash.sh
@@ -0,0 +1,71 @@
+#!/bin/bash
+# Evaluate DFlash-LoRA-Inject accepted length (offline, 8 GPUs parallel).
+# No sglang server needed. Each GPU loads its own target+draft and processes a shard.
+#
+# Usage:
+#   bash run_bench_dflash.sh                          # 8 GPUs, all 3 benches
+#   bash run_bench_dflash.sh humaneval                # only humaneval
+#   bash run_bench_dflash.sh mtbench gsm8k            # pick any subset
+#   bash run_bench_dflash.sh --quick                  # quick test (20 samples)
+#   bash run_bench_dflash.sh --ckpt epoch_0_step_500  # specific checkpoint
+#   NUM_GPUS=4 bash run_bench_dflash.sh               # use 4 GPUs
+
+# pipefail: without it the status of the eval pipeline is tee's, so a failed
+# run would still be reported as success.
+set -eo pipefail
+
+SCRIPT_DIR=$(cd -- "$(dirname -- "${BASH_SOURCE[0]}")" &>/dev/null && pwd)
+PYTHON=/workspace/miniconda3/envs/spec/bin/python3
+RESULT_DIR=/workspace/hanrui/syxin_old/Specforge/benchmarks/results
+NUM_GPUS=${NUM_GPUS:-8}
+
+# ---- parse args ----
+# Known bench names select benchmarks, --quick caps the sample count, and
+# everything else is forwarded to the Python script untouched.
+BENCHMARKS=()
+EXTRA_ARGS=()
+QUICK=false
+
+for arg in "$@"; do
+    case $arg in
+        humaneval|mtbench|gsm8k)
+            BENCHMARKS+=("$arg")
+            ;;
+        --quick)
+            QUICK=true
+            ;;
+        *)
+            EXTRA_ARGS+=("$arg")
+            ;;
+    esac
+done
+
+if [ ${#BENCHMARKS[@]} -eq 0 ]; then
+    BENCHMARKS=(humaneval mtbench gsm8k)
+fi
+
+if [ "$QUICK" = true ]; then
+    EXTRA_ARGS+=(--num-samples 20)
+fi
+
+TIMESTAMP=$(date +%Y%m%d_%H%M%S)
+
+echo "============================================"
+echo " DFlash-LoRA-Inject Offline Eval"
+echo " GPUs : $NUM_GPUS"
+echo " benchmarks : ${BENCHMARKS[*]}"
+echo " extra args : ${EXTRA_ARGS[*]}"
+echo " results : $RESULT_DIR"
+echo "============================================"
+echo ""
+
+mkdir -p "$RESULT_DIR"
+
+# NOTE(review): confirm eval_dflash_lora_inject.py accepts --benchmarks and
+# --num-samples; its CLI is not visible from this script.
+"$PYTHON" -m torch.distributed.run \
+    --standalone \
+    --nproc_per_node "$NUM_GPUS" \
+    "$SCRIPT_DIR/eval_dflash_lora_inject.py" \
+    --benchmarks "${BENCHMARKS[@]}" \
+    --output-dir "$RESULT_DIR" \
+    "${EXTRA_ARGS[@]}" \
+    2>&1 | tee "$RESULT_DIR/bench_dflash_lora_inject_offline_${TIMESTAMP}.log"
+
+echo ""
+echo "Done. Latest result files:"
+# Informational listing only; never let it fail the script under pipefail.
+ls -lht "$RESULT_DIR"/*.json 2>/dev/null | head -5 || true
diff --git a/syxin/run_bench_dflash_b16_baseline.sh b/syxin/run_bench_dflash_b16_baseline.sh
new file mode 100644
index 0000000000000000000000000000000000000000..2f297e467d165500300800e45201f03d99a72e2f
--- /dev/null
+++ b/syxin/run_bench_dflash_b16_baseline.sh
@@ -0,0 +1,60 @@
+#!/bin/bash
+# DFlash-b16 baseline: measure accepted length offline, 8 GPUs parallel.
+# Usage:
+#   bash run_bench_dflash_b16_baseline.sh             # 8 GPUs, all 3 benches
+#   bash run_bench_dflash_b16_baseline.sh humaneval   # only humaneval
+#   bash run_bench_dflash_b16_baseline.sh --quick     # 20 samples per bench
+#   NUM_GPUS=4 bash run_bench_dflash_b16_baseline.sh  # 4 GPUs
+
+# pipefail: without it the status of the eval pipeline is tee's, so a failed
+# run would still be reported as success.
+set -eo pipefail
+
+SCRIPT_DIR=$(cd -- "$(dirname -- "${BASH_SOURCE[0]}")" &>/dev/null && pwd)
+PYTHON=/workspace/miniconda3/envs/spec/bin/python3
+RESULT_DIR=/workspace/hanrui/syxin_old/Specforge/benchmarks/results
+NUM_GPUS=${NUM_GPUS:-8}
+
+# Known bench names select benchmarks, --quick caps the sample count, and
+# everything else is forwarded to the Python script untouched.
+BENCHMARKS=()
+EXTRA_ARGS=()
+QUICK=false
+
+for arg in "$@"; do
+    case $arg in
+        humaneval|mtbench|gsm8k) BENCHMARKS+=("$arg") ;;
+        --quick) QUICK=true ;;
+        *) EXTRA_ARGS+=("$arg") ;;
+    esac
+done
+
+if [ ${#BENCHMARKS[@]} -eq 0 ]; then
+    BENCHMARKS=(humaneval mtbench gsm8k)
+fi
+
+if [ "$QUICK" = true ]; then
+    EXTRA_ARGS+=(--num-samples 20)
+fi
+
+TIMESTAMP=$(date +%Y%m%d_%H%M%S)
+
+echo "============================================"
+echo " DFlash-b16 Baseline Offline Eval"
+echo " GPUs : $NUM_GPUS"
+echo " draft : /workspace/models/Qwen3-8B-DFlash-b16"
+echo " benchmarks : ${BENCHMARKS[*]}"
+echo " extra args : ${EXTRA_ARGS[*]}"
+echo "============================================"
+echo ""
+
+mkdir -p "$RESULT_DIR"
+
+"$PYTHON" -m torch.distributed.run \
+    --standalone \
+    --nproc_per_node "$NUM_GPUS" \
+    "$SCRIPT_DIR/eval_dflash_b16_baseline.py" \
+    --benchmarks "${BENCHMARKS[@]}" \
+    --output-dir "$RESULT_DIR" \
+    "${EXTRA_ARGS[@]}" \
+    2>&1 | tee "$RESULT_DIR/bench_dflash_b16_baseline_${TIMESTAMP}.log"
+
+echo ""
+echo "Done. Latest result files:"
+# Informational listing only; never let it fail the script under pipefail.
+ls -lht "$RESULT_DIR"/*.json 2>/dev/null | head -5 || true
diff --git a/syxin/run_qwen3_8b_sft_32gpu.sh b/syxin/run_qwen3_8b_sft_32gpu.sh
new file mode 100644
index 0000000000000000000000000000000000000000..b53599b79a0c141add42c2384d9306172360e569
--- /dev/null
+++ b/syxin/run_qwen3_8b_sft_32gpu.sh
@@ -0,0 +1,31 @@
+#!/bin/bash
+# Submit the Qwen3-8B SFT training job through northjob.
+# NOTE(review): the file name says 32gpu but GPU_NUMS is 64 -- confirm which is intended.
+export JOB_NAME='qwen3-8b-sft'
+export GPU_NUMS=64
+export TRAIN_SCRIPT='/workspace/hanrui/syxin/launch_train_wrapper.py'
+export WORK_DIR='/workspace/hanrui/syxin/Specforge'
+
+# Fewer than 8 GPUs: one node holding all of them. Otherwise 8 GPUs per node
+# (integer division, so a remainder is dropped).
+if (( GPU_NUMS < 8 )); then
+    export NNODES=1
+    export GPU_NUMS_PER_NODE=$GPU_NUMS
+else
+    export NNODES=$((GPU_NUMS/8))
+    export GPU_NUMS_PER_NODE=8
+fi
+
+# Job options; the train script and its single argument go last.
+JOB_ARGS=(
+    create
+    --job-type train
+    --nproc-per-node "$GPU_NUMS_PER_NODE"
+    --gpu-per-node "$GPU_NUMS_PER_NODE"
+    --nnodes "$NNODES"
+    --k8s-priority 3
+    --k8s-queue bg-agentic-coding
+    --k8s-namespace bg-agentic-coding
+    --k8s-pvc-name i-xinsiyang-y4zy0sik0a
+    --k8s-pvc-mount-path /workspace
+    --k8s-no-reclaim
+    --k8s-images harbor.local.clusters/bp/megatron-bplm:25.03_fp8.ibgda.qwen3.next.fix_triton.fix_te.hf457.qwen3_vl
+    --job-name "$JOB_NAME"
+    --workspace "$WORK_DIR"
+    "$TRAIN_SCRIPT" "$GPU_NUMS_PER_NODE"
+)
+
+# Use northjob from the spec environment.
+/workspace/miniconda3/envs/spec/bin/northjob "${JOB_ARGS[@]}"
diff --git a/syxin/run_train_dflash_direct_inject.sh b/syxin/run_train_dflash_direct_inject.sh
new file mode 100644
index 0000000000000000000000000000000000000000..de7facae55444c8bdb6d4aeca56029cc169cdad8
--- /dev/null
+++ b/syxin/run_train_dflash_direct_inject.sh
@@ -0,0 +1,68 @@
+#!/bin/bash
+# Launch single-node DFlash training (scripts/train_dflash.py) for Qwen3-8B
+# through torch.distributed.run.
+#
+# Usage: run_train_dflash_direct_inject.sh [NUM_GPUS] [OUTPUT_DIR] [extra args...]
+#   NUM_GPUS    first positional argument (default: 8)
+#   OUTPUT_DIR  second positional argument, taken only when it does not start
+#               with "-" (default: $ROOT_DIR/outputs/qwen3-8b-dflash-direct-inject)
+#   PYTHON_BIN  environment override for the interpreter
+set -euo pipefail
+
+ROOT_DIR=/workspace/hanrui/syxin_old/Specforge
+NUM_GPUS=8
+OUTPUT_DIR=$ROOT_DIR/outputs/qwen3-8b-dflash-direct-inject
+if [[ $# -ge 1 ]]; then
+    NUM_GPUS=$1
+    shift
+fi
+if [[ $# -ge 1 && "${1:0:1}" != "-" ]]; then
+    OUTPUT_DIR=$1
+    shift
+fi
+# Everything left over is forwarded verbatim to the training script.
+EXTRA_ARGS=("$@")
+
+export TORCHINDUCTOR_CACHE_DIR=$ROOT_DIR/cache/compiled_kernels
+export SPECFORGE_DATA_NUM_PROC=16
+export PYTORCH_CUDA_ALLOC_CONF=expandable_segments:True
+export PYTORCH_ALLOC_CONF=expandable_segments:True
+export PYTHONPATH="$ROOT_DIR:${PYTHONPATH:-}"
+# Prefer the project interpreter when it exists; fall back to python3 on PATH.
+DEFAULT_SPECFORGE_PY=/workspace/hanrui/specforge/bin/python3
+if [[ -z "${PYTHON_BIN:-}" ]]; then
+    if [[ -x "$DEFAULT_SPECFORGE_PY" ]]; then
+        PYTHON_BIN="$DEFAULT_SPECFORGE_PY"
+    else
+        PYTHON_BIN=python3
+    fi
+fi
+
+cd "$ROOT_DIR"
+
+# ${EXTRA_ARGS[@]+...} expands to nothing for an empty array; a bare
+# "${EXTRA_ARGS[@]}" aborts under `set -u` on bash older than 4.4.
+$PYTHON_BIN -m torch.distributed.run \
+    --standalone \
+    --nproc_per_node "$NUM_GPUS" \
+    scripts/train_dflash.py \
+    --target-model-path /workspace/models/Qwen3-8B \
+    --target-model-backend sglang \
+    --train-data-path /workspace/hanrui/datasets/Nemotron-CodeAlpaca-qwen3-8b-800K \
+    --output-dir "$OUTPUT_DIR" \
+    --block-size 16 \
+    --num-draft-layers 36 \
+    --attention-backend flex_attention \
+    --max-length 2048 \
+    --batch-size 1 \
+    --accumulation-steps 8 \
+    --num-epochs 3 \
+    --learning-rate 6e-4 \
+    --loss-decay-gamma 7 \
+    --lm-head-chunk-size 256 \
+    --gradient-checkpointing \
+    --chat-template qwen \
+    --log-interval 50 \
+    --save-interval 500 \
+    --cache-dir "$ROOT_DIR/cache" \
+    ${EXTRA_ARGS[@]+"${EXTRA_ARGS[@]}"}
diff --git a/syxin/run_train_dflash_lora_inject.sh b/syxin/run_train_dflash_lora_inject.sh
new file mode 100644
index 0000000000000000000000000000000000000000..a6444af375bebe412199ba19056f11bdafc3e597
--- /dev/null
+++ b/syxin/run_train_dflash_lora_inject.sh
@@ -0,0 +1,83 @@
+#!/bin/bash
+# Launch single-node DFlash LoRA-inject training
+# (scripts/train_dflash_lora_inject.py) for Qwen3-8B through
+# torch.distributed.run, with early stopping enabled.
+#
+# Usage: run_train_dflash_lora_inject.sh [NUM_GPUS] [OUTPUT_DIR] [extra args...]
+#   NUM_GPUS    first positional argument (default: 8)
+#   OUTPUT_DIR  second positional argument, taken only when it does not start
+#               with "-"
+#   PYTHON_BIN  environment override for the interpreter
+set -euo pipefail
+
+ROOT_DIR=/workspace/hanrui/syxin/Specforge
+NUM_GPUS=8
+OUTPUT_DIR=$ROOT_DIR/outputs/qwen3-8b-dflash-lora-inject
+CACHE_DIR=/tmp/specforge_cache
+
+# Parse arguments
+if [[ $# -ge 1 ]]; then
+    NUM_GPUS=$1
+    shift
+fi
+if [[ $# -ge 1 && "${1:0:1}" != "-" ]]; then
+    OUTPUT_DIR=$1
+    shift
+fi
+# Everything left over is forwarded verbatim to the training script.
+EXTRA_ARGS=("$@")
+
+# Environment variables (every cache location is derived from CACHE_DIR)
+export TORCHINDUCTOR_CACHE_DIR=$CACHE_DIR/compiled_kernels
+export SPECFORGE_DATA_NUM_PROC=16
+export PYTORCH_CUDA_ALLOC_CONF=expandable_segments:True
+export PYTORCH_ALLOC_CONF=expandable_segments:True
+export PYTHONPATH="$ROOT_DIR:${PYTHONPATH:-}"
+export HF_DATASETS_CACHE=$CACHE_DIR/hf_datasets
+export HF_HOME=$CACHE_DIR/hf_home
+
+# Python binary: prefer the project interpreter, else python3 on PATH
+DEFAULT_SPECFORGE_PY=/workspace/hanrui/specforge/bin/python3
+if [[ -z "${PYTHON_BIN:-}" ]]; then
+    if [[ -x "$DEFAULT_SPECFORGE_PY" ]]; then
+        PYTHON_BIN="$DEFAULT_SPECFORGE_PY"
+    else
+        PYTHON_BIN=python3
+    fi
+fi
+
+cd "$ROOT_DIR"
+
+# ${EXTRA_ARGS[@]+...} expands to nothing for an empty array; a bare
+# "${EXTRA_ARGS[@]}" aborts under `set -u` on bash older than 4.4.
+$PYTHON_BIN -m torch.distributed.run \
+    --standalone \
+    --nproc_per_node "$NUM_GPUS" \
+    scripts/train_dflash_lora_inject.py \
+    --target-model-path /workspace/models/Qwen3-8B \
+    --target-model-backend hf \
+    --train-data-path /workspace/hanrui/datasets/Nemotron-CodeAlpaca-qwen3-8b-800K \
+    --output-dir "$OUTPUT_DIR" \
+    --block-size 16 \
+    --attention-backend additive \
+    --attn-implementation sdpa \
+    --max-length 2048 \
+    --batch-size 8 \
+    --accumulation-steps 8 \
+    --num-epochs 3 \
+    --learning-rate 5e-5 \
+    --loss-decay-gamma 7 \
+    --gradient-checkpointing \
+    --chat-template qwen \
+    --log-interval 50 \
+    --save-interval 500 \
+    --cache-dir "$CACHE_DIR" \
+    --lora-rank 32 \
+    --lora-alpha 64 \
+    --lora-dropout 0.1 \
+    --trust-remote-code \
+    --dataloader-num-workers 0 \
+    --early-stop \
+    --early-stop-patience 5 \
+    --early-stop-min-delta 0.005 \
+    ${EXTRA_ARGS[@]+"${EXTRA_ARGS[@]}"}
diff --git a/syxin/run_train_multinode.sh b/syxin/run_train_multinode.sh
new file mode 100644
index 0000000000000000000000000000000000000000..583a4faccacc4be1f4b5db1b085d3d900e954f09
--- /dev/null
+++ b/syxin/run_train_multinode.sh
@@ -0,0 +1,80 @@
+#!/bin/bash
+# Run DFlash LoRA-inject training of Qwen3-8B under an external launcher.
+# scripts/train_dflash_lora_inject.py is invoked directly, without wrapping it
+# in torch.distributed.run (see the note above the command).
+#
+# Usage: run_train_multinode.sh [NUM_GPUS] [OUTPUT_DIR] [extra args...]
+#   NUM_GPUS    first positional argument; still consumed so the argument
+#               layout stays the same, but not used by this script
+#   OUTPUT_DIR  second positional argument, taken only when it does not start
+#               with "-"
+#   PYTHON_BIN  environment override for the interpreter
+set -euo pipefail
+
+ROOT_DIR=/workspace/hanrui/syxin/Specforge
+NUM_GPUS=8
+OUTPUT_DIR=$ROOT_DIR/outputs/qwen3-8b-sft-32gpu-v3
+CACHE_DIR=/tmp/specforge_cache
+
+# Parse arguments
+if [[ $# -ge 1 ]]; then
+    NUM_GPUS=$1
+    shift
+fi
+if [[ $# -ge 1 && "${1:0:1}" != "-" ]]; then
+    OUTPUT_DIR=$1
+    shift
+fi
+# Everything left over is forwarded verbatim to the training script.
+EXTRA_ARGS=("$@")
+
+# Environment variables (every cache location is derived from CACHE_DIR)
+export TORCHINDUCTOR_CACHE_DIR=$CACHE_DIR/compiled_kernels
+export SPECFORGE_DATA_NUM_PROC=16
+export PYTORCH_CUDA_ALLOC_CONF=expandable_segments:True
+export PYTORCH_ALLOC_CONF=expandable_segments:True
+export PYTHONPATH="$ROOT_DIR:${PYTHONPATH:-}"
+export HF_DATASETS_CACHE=$CACHE_DIR/hf_datasets
+export HF_HOME=$CACHE_DIR/hf_home
+
+# Python binary: prefer the "spec" conda interpreter, else python3 on PATH
+DEFAULT_SPECFORGE_PY=/workspace/miniconda3/envs/spec/bin/python3
+if [[ -z "${PYTHON_BIN:-}" ]]; then
+    if [[ -x "$DEFAULT_SPECFORGE_PY" ]]; then
+        PYTHON_BIN="$DEFAULT_SPECFORGE_PY"
+    else
+        PYTHON_BIN=python3
+    fi
+fi
+
+cd "$ROOT_DIR"
+
+# northjob has already set the distributed environment variables via torchrun,
+# so run the training script directly; do not start torch.distributed.run again.
+# ${EXTRA_ARGS[@]+...} expands to nothing for an empty array; a bare
+# "${EXTRA_ARGS[@]}" aborts under `set -u` on bash older than 4.4.
+$PYTHON_BIN scripts/train_dflash_lora_inject.py \
+    --target-model-path /workspace/models/Qwen3-8B \
+    --target-model-backend hf \
+    --train-data-path /workspace/hanrui/datasets/Nemotron-CodeAlpaca-qwen3-8b-800K \
+    --output-dir "$OUTPUT_DIR" \
+    --block-size 16 \
+    --attention-backend additive \
+    --attn-implementation sdpa \
+    --max-length 2048 \
+    --batch-size 4 \
+    --accumulation-steps 16 \
+    --num-epochs 3 \
+    --learning-rate 5e-5 \
+    --loss-decay-gamma 7 \
+    --gradient-checkpointing \
+    --chat-template qwen \
+    --log-interval 50 \
+    --save-interval 500 \
+    --cache-dir "$CACHE_DIR" \
+    --lora-rank 32 \
+    --lora-alpha 64 \
+    --lora-dropout 0.1 \
+    --trust-remote-code \
+    --dataloader-num-workers 0 \
+    ${EXTRA_ARGS[@]+"${EXTRA_ARGS[@]}"}
diff --git a/syxin/run_train_qwen3_8b_sft_32gpu.sh b/syxin/run_train_qwen3_8b_sft_32gpu.sh
new file mode 100644
index 0000000000000000000000000000000000000000..d617ec44ece15524dadaec908f9d054797fa6d75
--- /dev/null
+++ b/syxin/run_train_qwen3_8b_sft_32gpu.sh
@@ -0,0 +1,80 @@
+#!/bin/bash
+# Run the Qwen3-8B SFT (DFlash LoRA-inject) training under an external
+# launcher. scripts/train_dflash_lora_inject.py is invoked directly, without
+# wrapping it in torch.distributed.run (see the note above the command).
+#
+# Usage: run_train_qwen3_8b_sft_32gpu.sh [NUM_GPUS] [OUTPUT_DIR] [extra args...]
+#   NUM_GPUS    first positional argument; still consumed so the argument
+#               layout stays the same, but not used by this script
+#   OUTPUT_DIR  second positional argument, taken only when it does not start
+#               with "-"
+#   PYTHON_BIN  environment override for the interpreter
+set -euo pipefail
+
+ROOT_DIR=/workspace/hanrui/syxin_old/Specforge
+NUM_GPUS=8
+OUTPUT_DIR=$ROOT_DIR/outputs/qwen3-8b-sft-32gpu-v2
+CACHE_DIR=/tmp/specforge_cache_sft
+
+# Parse arguments
+if [[ $# -ge 1 ]]; then
+    NUM_GPUS=$1
+    shift
+fi
+if [[ $# -ge 1 && "${1:0:1}" != "-" ]]; then
+    OUTPUT_DIR=$1
+    shift
+fi
+# Everything left over is forwarded verbatim to the training script.
+EXTRA_ARGS=("$@")
+
+# Environment variables (every cache location is derived from CACHE_DIR)
+export TORCHINDUCTOR_CACHE_DIR=$CACHE_DIR/compiled_kernels
+export SPECFORGE_DATA_NUM_PROC=16
+export PYTORCH_CUDA_ALLOC_CONF=expandable_segments:True
+export PYTORCH_ALLOC_CONF=expandable_segments:True
+export PYTHONPATH="$ROOT_DIR:${PYTHONPATH:-}"
+export HF_DATASETS_CACHE=$CACHE_DIR/hf_datasets
+export HF_HOME=$CACHE_DIR/hf_home
+
+# Python binary: prefer the project interpreter, else python3 on PATH
+DEFAULT_SPECFORGE_PY=/workspace/hanrui/specforge/bin/python3
+if [[ -z "${PYTHON_BIN:-}" ]]; then
+    if [[ -x "$DEFAULT_SPECFORGE_PY" ]]; then
+        PYTHON_BIN="$DEFAULT_SPECFORGE_PY"
+    else
+        PYTHON_BIN=python3
+    fi
+fi
+
+cd "$ROOT_DIR"
+
+# northjob has already started the distributed run via torchrun, so the
+# training script is executed directly here.
+# ${EXTRA_ARGS[@]+...} expands to nothing for an empty array; a bare
+# "${EXTRA_ARGS[@]}" aborts under `set -u` on bash older than 4.4.
+$PYTHON_BIN "$ROOT_DIR/scripts/train_dflash_lora_inject.py" \
+    --target-model-path /workspace/models/Qwen3-8B \
+    --target-model-backend hf \
+    --train-data-path /workspace/hanrui/datasets/Nemotron-CodeAlpaca-qwen3-8b-800K \
+    --output-dir "$OUTPUT_DIR" \
+    --block-size 16 \
+    --attention-backend additive \
+    --attn-implementation sdpa \
+    --max-length 2048 \
+    --batch-size 8 \
+    --accumulation-steps 8 \
+    --num-epochs 3 \
+    --learning-rate 5e-5 \
+    --loss-decay-gamma 7 \
+    --gradient-checkpointing \
+    --chat-template qwen \
+    --log-interval 50 \
+    --save-interval 500 \
+    --cache-dir "$CACHE_DIR" \
+    --lora-rank 32 \
+    --lora-alpha 64 \
+    --lora-dropout 0.1 \
+    --trust-remote-code \
+    --dataloader-num-workers 0 \
+    ${EXTRA_ARGS[@]+"${EXTRA_ARGS[@]}"}
diff --git a/syxin/server.log b/syxin/server.log
new file mode 100644
index 0000000000000000000000000000000000000000..8de27bf5c7527cdaf2e01d5d86545a6d1828f236
--- /dev/null
+++ b/syxin/server.log
@@ -0,0 +1,186 @@
+/workspace/hanrui/sglang/python/sglang/launch_server.py:51: UserWarning: 'python -m sglang.launch_server' is still supported, but 'sglang serve' is the recommended entrypoint.
+ Example: sglang serve --model-path [options]
+ warnings.warn(
+[2026-03-07 15:24:13] INFO server_args.py:2048: Attention backend not specified. Use fa3 backend by default.
+[2026-03-07 15:24:13] WARNING server_args.py:2629: Max running requests is reset to 48 for speculative decoding. You can override this by explicitly setting --max-running-requests.
+[2026-03-07 15:24:13] WARNING server_args.py:2650: Overlap scheduler is disabled when spec v2 is off or using unsupported speculative algorithm. You can set env SGLANG_ENABLE_SPEC_V2=True to enable the experimental overlap scheduler.
+[2026-03-07 15:24:13] WARNING server_args.py:2712: speculative_num_draft_tokens is adjusted to speculative_num_steps + 1 when speculative_eagle_topk == 1
+[2026-03-07 15:24:14] server_args=ServerArgs(model_path='/workspace/models/Qwen3-8B', tokenizer_path='/workspace/models/Qwen3-8B', tokenizer_mode='auto', tokenizer_worker_num=1, skip_tokenizer_init=False, load_format='auto', model_loader_extra_config='{}', trust_remote_code=True, context_length=None, is_embedding=False, enable_multimodal=None, revision=None, model_impl='auto', host='10.233.100.123', port=30000, fastapi_root_path='', grpc_mode=False, skip_server_warmup=False, warmups=None, nccl_port=None, checkpoint_engine_wait_weights_before_ready=False, ssl_keyfile=None, ssl_certfile=None, ssl_ca_certs=None, ssl_keyfile_password=None, enable_ssl_refresh=False, dtype='bfloat16', quantization=None, quantization_param_path=None, kv_cache_dtype='auto', enable_fp32_lm_head=False, modelopt_quant=None, modelopt_checkpoint_restore_path=None, modelopt_checkpoint_save_path=None, modelopt_export_path=None, quantize_and_serve=False, rl_quant_profile=None, mem_fraction_static=0.8, max_running_requests=48, max_queued_requests=None, max_total_tokens=None, chunked_prefill_size=8192, enable_dynamic_chunking=False, max_prefill_tokens=16384, prefill_max_requests=None, schedule_policy='fcfs', enable_priority_scheduling=False, disable_priority_preemption=False, default_priority_value=None, abort_on_priority_when_disabled=False, schedule_low_priority_values_first=False, priority_scheduling_preemption_threshold=10, schedule_conservativeness=1.0, page_size=1, swa_full_tokens_ratio=0.8, disable_hybrid_swa_memory=False, radix_eviction_policy='lru', enable_prefill_delayer=False, prefill_delayer_max_delay_passes=30, prefill_delayer_token_usage_low_watermark=None, prefill_delayer_forward_passes_buckets=None, prefill_delayer_wait_seconds_buckets=None, device='cuda', tp_size=4, pp_size=1, pp_max_micro_batch_size=None, pp_async_batch_depth=0, stream_interval=1, stream_output=False, enable_streaming_session=False, random_seed=551181117, constrained_json_whitespace_pattern=None, 
constrained_json_disable_any_whitespace=False, watchdog_timeout=300, soft_watchdog_timeout=None, dist_timeout=None, download_dir=None, model_checksum=None, base_gpu_id=0, gpu_id_step=1, sleep_on_idle=False, use_ray=False, custom_sigquit_handler=None, log_level='info', log_level_http=None, log_requests=False, log_requests_level=2, log_requests_format='text', log_requests_target=None, uvicorn_access_log_exclude_prefixes=[], crash_dump_folder=None, show_time_cost=False, enable_metrics=False, enable_metrics_for_all_schedulers=False, tokenizer_metrics_custom_labels_header='x-custom-labels', tokenizer_metrics_allowed_custom_labels=None, extra_metric_labels=None, bucket_time_to_first_token=None, bucket_inter_token_latency=None, bucket_e2e_request_latency=None, collect_tokens_histogram=False, prompt_tokens_buckets=None, generation_tokens_buckets=None, gc_warning_threshold_secs=0.0, decode_log_interval=40, enable_request_time_stats_logging=False, kv_events_config=None, enable_trace=False, otlp_traces_endpoint='localhost:4317', export_metrics_to_file=False, export_metrics_to_file_dir=None, api_key=None, admin_api_key=None, served_model_name='/workspace/models/Qwen3-8B', weight_version='default', chat_template=None, hf_chat_template_name=None, completion_template=None, file_storage_path='sglang_storage', enable_cache_report=False, reasoning_parser=None, tool_call_parser=None, tool_server=None, sampling_defaults='model', dp_size=1, load_balance_method='round_robin', attn_cp_size=1, moe_dp_size=1, dist_init_addr=None, nnodes=1, node_rank=0, json_model_override_args='{}', preferred_sampling_params=None, enable_lora=None, enable_lora_overlap_loading=None, max_lora_rank=None, lora_target_modules=None, lora_paths=None, max_loaded_loras=None, max_loras_per_batch=8, lora_eviction_policy='lru', lora_backend='csgmv', max_lora_chunk_size=16, attention_backend='fa3', decode_attention_backend=None, prefill_attention_backend=None, sampling_backend='flashinfer', grammar_backend='xgrammar', 
mm_attention_backend=None, fp8_gemm_runner_backend='auto', fp4_gemm_runner_backend='flashinfer_cutlass', nsa_prefill_backend=None, nsa_decode_backend=None, disable_flashinfer_autotune=False, mamba_backend='triton', speculative_algorithm='STANDALONE', speculative_draft_model_path='/workspace/hanrui/syxin_old/Specforge/outputs/qwen3-8b-dflash-lora-merged', speculative_draft_model_revision='main', speculative_draft_load_format=None, speculative_num_steps=4, speculative_eagle_topk=1, speculative_num_draft_tokens=5, speculative_accept_threshold_single=1.0, speculative_accept_threshold_acc=1.0, speculative_token_map=None, speculative_attention_mode='prefill', speculative_draft_attention_backend=None, speculative_moe_runner_backend='auto', speculative_moe_a2a_backend=None, speculative_draft_model_quantization=None, speculative_ngram_min_match_window_size=1, speculative_ngram_max_match_window_size=12, speculative_ngram_min_bfs_breadth=1, speculative_ngram_max_bfs_breadth=10, speculative_ngram_match_type='BFS', speculative_ngram_branch_length=18, speculative_ngram_capacity=10000000, enable_multi_layer_eagle=False, ep_size=1, moe_a2a_backend='none', moe_runner_backend='auto', flashinfer_mxfp4_moe_precision='default', enable_flashinfer_allreduce_fusion=False, enable_aiter_allreduce_fusion=False, deepep_mode='auto', ep_num_redundant_experts=0, ep_dispatch_algorithm=None, init_expert_location='trivial', enable_eplb=False, eplb_algorithm='auto', eplb_rebalance_num_iterations=1000, eplb_rebalance_layers_per_chunk=None, eplb_min_rebalancing_utilization_threshold=1.0, expert_distribution_recorder_mode=None, expert_distribution_recorder_buffer_size=1000, enable_expert_distribution_metrics=False, deepep_config=None, moe_dense_tp_size=None, elastic_ep_backend=None, enable_elastic_expert_backup=False, mooncake_ib_device=None, max_mamba_cache_size=None, mamba_ssm_dtype=None, mamba_full_memory_ratio=0.9, mamba_scheduler_strategy='no_buffer', mamba_track_interval=256, 
linear_attn_backend='triton', linear_attn_decode_backend=None, linear_attn_prefill_backend=None, enable_hierarchical_cache=False, hicache_ratio=2.0, hicache_size=0, hicache_write_policy='write_through', hicache_io_backend='kernel', hicache_mem_layout='layer_first', disable_hicache_numa_detect=False, hicache_storage_backend=None, hicache_storage_prefetch_policy='best_effort', hicache_storage_backend_extra_config=None, hierarchical_sparse_attention_extra_config=None, enable_lmcache=False, kt_weight_path=None, kt_method='AMXINT4', kt_cpuinfer=None, kt_threadpool_count=2, kt_num_gpu_experts=None, kt_max_deferred_experts_per_token=None, dllm_algorithm=None, dllm_algorithm_config=None, enable_double_sparsity=False, ds_channel_config_path=None, ds_heavy_channel_num=32, ds_heavy_token_num=256, ds_heavy_channel_type='qk', ds_sparse_decode_threshold=4096, cpu_offload_gb=0, offload_group_size=-1, offload_num_in_group=1, offload_prefetch_step=1, offload_mode='cpu', multi_item_scoring_delimiter=None, disable_radix_cache=False, cuda_graph_max_bs=512, cuda_graph_bs=[1, 2, 3, 4, 5, 6, 7, 8, 10, 12, 14, 16, 18, 20, 22, 24, 26, 28, 30, 32, 40, 44, 48, 52, 56, 60, 64, 72, 80, 88, 96, 104, 112, 120, 128, 136, 144, 152, 160, 168, 176, 184, 192, 200, 208, 216, 224, 232, 240, 248, 256, 272, 288, 304, 320, 336, 352, 368, 384, 400, 416, 432, 448, 464, 480, 496, 512], disable_cuda_graph=False, disable_cuda_graph_padding=False, enable_profile_cuda_graph=False, enable_cudagraph_gc=False, enable_layerwise_nvtx_marker=False, enable_nccl_nvls=False, enable_symm_mem=False, disable_flashinfer_cutlass_moe_fp4_allgather=False, enable_tokenizer_batch_encode=False, disable_tokenizer_batch_decode=False, disable_outlines_disk_cache=False, disable_custom_all_reduce=False, enable_mscclpp=False, enable_torch_symm_mem=False, disable_overlap_schedule=True, enable_mixed_chunk=False, enable_dp_attention=False, enable_dp_lm_head=False, enable_two_batch_overlap=False, enable_single_batch_overlap=False, 
tbo_token_distribution_threshold=0.48, enable_torch_compile=False, disable_piecewise_cuda_graph=True, enforce_piecewise_cuda_graph=False, enable_torch_compile_debug_mode=False, torch_compile_max_bs=32, piecewise_cuda_graph_max_tokens=8192, piecewise_cuda_graph_tokens=[4, 8, 12, 16, 20, 24, 28, 32, 48, 64, 80, 96, 112, 128, 144, 160, 176, 192, 208, 224, 240, 256, 288, 320, 352, 384, 416, 448, 480, 512, 576, 640, 704, 768, 832, 896, 960, 1024, 1280, 1536, 1792, 2048, 2304, 2560, 2816, 3072, 3328, 3584, 3840, 4096, 4608, 5120, 5632, 6144, 6656, 7168, 7680, 8192], piecewise_cuda_graph_compiler='eager', torchao_config='', enable_nan_detection=False, enable_p2p_check=False, triton_attention_reduce_in_fp32=False, triton_attention_num_kv_splits=8, triton_attention_split_tile_size=None, num_continuous_decode_steps=1, delete_ckpt_after_loading=False, enable_memory_saver=False, enable_weights_cpu_backup=False, enable_draft_weights_cpu_backup=False, allow_auto_truncate=False, enable_custom_logit_processor=False, flashinfer_mla_disable_ragged=False, disable_shared_experts_fusion=False, disable_chunked_prefix_cache=False, disable_fast_image_processor=False, keep_mm_feature_on_device=False, enable_return_hidden_states=False, enable_return_routed_experts=False, scheduler_recv_interval=1, numa_node=None, enable_deterministic_inference=False, rl_on_policy_target=None, enable_attn_tp_input_scattered=False, enable_nsa_prefill_context_parallel=False, nsa_prefill_cp_mode='round-robin-split', enable_fused_qk_norm_rope=False, enable_precise_embedding_interpolation=False, enable_fused_moe_sum_all_reduce=False, enable_dynamic_batch_tokenizer=False, dynamic_batch_tokenizer_batch_size=32, dynamic_batch_tokenizer_batch_timeout=0.002, debug_tensor_dump_output_folder=None, debug_tensor_dump_layers=None, debug_tensor_dump_input_file=None, debug_tensor_dump_inject=False, disaggregation_mode='null', disaggregation_transfer_backend='mooncake', disaggregation_bootstrap_port=8998, 
disaggregation_ib_device=None, disaggregation_decode_enable_offload_kvcache=False, num_reserved_decode_tokens=512, disaggregation_decode_polling_interval=1, encoder_only=False, language_only=False, encoder_transfer_backend='zmq_to_scheduler', encoder_urls=[], enable_adaptive_dispatch_to_encoder=False, custom_weight_loader=[], weight_loader_disable_mmap=False, remote_instance_weight_loader_seed_instance_ip=None, remote_instance_weight_loader_seed_instance_service_port=None, remote_instance_weight_loader_send_weights_group_ports=None, remote_instance_weight_loader_backend='nccl', remote_instance_weight_loader_start_seed_via_transfer_engine=False, enable_pdmux=False, pdmux_config_path=None, sm_group_num=8, mm_max_concurrent_calls=32, mm_per_request_timeout=10.0, enable_broadcast_mm_inputs_process=False, enable_prefix_mm_cache=False, mm_enable_dp_encoder=False, mm_process_config={}, limit_mm_data_per_request=None, enable_mm_global_cache=False, decrypted_config_file=None, decrypted_draft_config_file=None, forward_hooks=None)
+[2026-03-07 15:24:15] Using default HuggingFace chat template with detected content format: string
+[2026-03-07 15:24:25 TP2] Mamba selective_state_update backend initialized: triton
+[2026-03-07 15:24:25 TP2] Init torch distributed begin.
+[2026-03-07 15:24:26 TP0] Mamba selective_state_update backend initialized: triton
+[2026-03-07 15:24:26 TP0] Init torch distributed begin.
+[2026-03-07 15:24:26 TP3] Mamba selective_state_update backend initialized: triton
+[2026-03-07 15:24:26 TP1] Mamba selective_state_update backend initialized: triton
+[2026-03-07 15:24:26 TP3] Init torch distributed begin.
+[2026-03-07 15:24:26 TP1] Init torch distributed begin.
+[Gloo] Rank 1 is connected to 3 peer ranks. Expected number of connected peer ranks is : 3
+[Gloo] Rank 0 is connected to 3 peer ranks. Expected number of connected peer ranks is : 3
+[Gloo] Rank 3 is connected to 3 peer ranks. Expected number of connected peer ranks is : 3
+[Gloo] Rank 2 is connected to 3 peer ranks. Expected number of connected peer ranks is : 3
+[Gloo] Rank 0 is connected to 3 peer ranks. Expected number of connected peer ranks is : 3
+[Gloo] Rank 2 is connected to 3 peer ranks. Expected number of connected peer ranks is : 3
+[Gloo] Rank 1 is connected to 3 peer ranks. Expected number of connected peer ranks is : 3
+[Gloo] Rank 3 is connected to 3 peer ranks. Expected number of connected peer ranks is : 3
+[2026-03-07 15:24:27 TP0] sglang is using nccl==2.27.5
+[2026-03-07 15:24:29 TP0] Scheduler hit an exception: Traceback (most recent call last):
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/scheduler.py", line 3239, in run_scheduler_process
+ scheduler = Scheduler(
+ ^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/scheduler.py", line 365, in __init__
+ self.init_model_worker()
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/scheduler.py", line 561, in init_model_worker
+ self.init_tp_model_worker()
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/scheduler.py", line 519, in init_tp_model_worker
+ self.tp_worker = TpModelWorker(
+ ^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/tp_worker.py", line 258, in __init__
+ self._init_model_runner()
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/tp_worker.py", line 341, in _init_model_runner
+ self._model_runner = ModelRunner(
+ ^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/model_executor/model_runner.py", line 395, in __init__
+ pre_model_load_memory = self.init_torch_distributed()
+ ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/model_executor/model_runner.py", line 813, in init_torch_distributed
+ initialize_model_parallel(
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/parallel_state.py", line 1764, in initialize_model_parallel
+ _TP = init_model_parallel_group(
+ ^^^^^^^^^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/parallel_state.py", line 1450, in init_model_parallel_group
+ return GroupCoordinator(
+ ^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/parallel_state.py", line 357, in __init__
+ self.pynccl_comm = PyNcclCommunicator(
+ ^^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/device_communicators/pynccl.py", line 113, in __init__
+ self.comm: ncclComm_t = self.nccl.ncclCommInitRank(
+ ^^^^^^^^^^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/device_communicators/pynccl_wrapper.py", line 401, in ncclCommInitRank
+ self.NCCL_CHECK(
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/device_communicators/pynccl_wrapper.py", line 376, in NCCL_CHECK
+ raise RuntimeError(f"NCCL error: {error_str}")
+RuntimeError: NCCL error: unhandled system error (run with NCCL_DEBUG=INFO for details)
+
+[2026-03-07 15:24:29] Received sigquit from a child process. It usually means the child failed.
+[2026-03-07 15:24:29 TP2] Scheduler hit an exception: Traceback (most recent call last):
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/scheduler.py", line 3239, in run_scheduler_process
+ scheduler = Scheduler(
+ ^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/scheduler.py", line 365, in __init__
+ self.init_model_worker()
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/scheduler.py", line 561, in init_model_worker
+ self.init_tp_model_worker()
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/scheduler.py", line 519, in init_tp_model_worker
+ self.tp_worker = TpModelWorker(
+ ^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/tp_worker.py", line 258, in __init__
+ self._init_model_runner()
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/tp_worker.py", line 341, in _init_model_runner
+ self._model_runner = ModelRunner(
+ ^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/model_executor/model_runner.py", line 395, in __init__
+ pre_model_load_memory = self.init_torch_distributed()
+ ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/model_executor/model_runner.py", line 813, in init_torch_distributed
+ initialize_model_parallel(
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/parallel_state.py", line 1764, in initialize_model_parallel
+ _TP = init_model_parallel_group(
+ ^^^^^^^^^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/parallel_state.py", line 1450, in init_model_parallel_group
+ return GroupCoordinator(
+ ^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/parallel_state.py", line 357, in __init__
+ self.pynccl_comm = PyNcclCommunicator(
+ ^^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/device_communicators/pynccl.py", line 113, in __init__
+ self.comm: ncclComm_t = self.nccl.ncclCommInitRank(
+ ^^^^^^^^^^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/device_communicators/pynccl_wrapper.py", line 401, in ncclCommInitRank
+ self.NCCL_CHECK(
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/device_communicators/pynccl_wrapper.py", line 376, in NCCL_CHECK
+ raise RuntimeError(f"NCCL error: {error_str}")
+RuntimeError: NCCL error: unhandled system error (run with NCCL_DEBUG=INFO for details)
+
+[2026-03-07 15:24:29 TP1] Scheduler hit an exception: Traceback (most recent call last):
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/scheduler.py", line 3239, in run_scheduler_process
+ scheduler = Scheduler(
+ ^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/scheduler.py", line 365, in __init__
+ self.init_model_worker()
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/scheduler.py", line 561, in init_model_worker
+ self.init_tp_model_worker()
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/scheduler.py", line 519, in init_tp_model_worker
+ self.tp_worker = TpModelWorker(
+ ^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/tp_worker.py", line 258, in __init__
+ self._init_model_runner()
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/tp_worker.py", line 341, in _init_model_runner
+ self._model_runner = ModelRunner(
+ ^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/model_executor/model_runner.py", line 395, in __init__
+ pre_model_load_memory = self.init_torch_distributed()
+ ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/model_executor/model_runner.py", line 813, in init_torch_distributed
+ initialize_model_parallel(
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/parallel_state.py", line 1764, in initialize_model_parallel
+ _TP = init_model_parallel_group(
+ ^^^^^^^^^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/parallel_state.py", line 1450, in init_model_parallel_group
+ return GroupCoordinator(
+ ^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/parallel_state.py", line 357, in __init__
+ self.pynccl_comm = PyNcclCommunicator(
+ ^^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/device_communicators/pynccl.py", line 113, in __init__
+ self.comm: ncclComm_t = self.nccl.ncclCommInitRank(
+ ^^^^^^^^^^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/device_communicators/pynccl_wrapper.py", line 401, in ncclCommInitRank
+ self.NCCL_CHECK(
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/device_communicators/pynccl_wrapper.py", line 376, in NCCL_CHECK
+ raise RuntimeError(f"NCCL error: {error_str}")
+RuntimeError: NCCL error: unhandled system error (run with NCCL_DEBUG=INFO for details)
+
+[2026-03-07 15:24:29] Received sigquit from a child process. It usually means the child failed.
+[2026-03-07 15:24:29] Received sigquit from a child process. It usually means the child failed.
+[2026-03-07 15:24:29 TP3] Scheduler hit an exception: Traceback (most recent call last):
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/scheduler.py", line 3239, in run_scheduler_process
+ scheduler = Scheduler(
+ ^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/scheduler.py", line 365, in __init__
+ self.init_model_worker()
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/scheduler.py", line 561, in init_model_worker
+ self.init_tp_model_worker()
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/scheduler.py", line 519, in init_tp_model_worker
+ self.tp_worker = TpModelWorker(
+ ^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/tp_worker.py", line 258, in __init__
+ self._init_model_runner()
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/tp_worker.py", line 341, in _init_model_runner
+ self._model_runner = ModelRunner(
+ ^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/model_executor/model_runner.py", line 395, in __init__
+ pre_model_load_memory = self.init_torch_distributed()
+ ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/model_executor/model_runner.py", line 813, in init_torch_distributed
+ initialize_model_parallel(
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/parallel_state.py", line 1764, in initialize_model_parallel
+ _TP = init_model_parallel_group(
+ ^^^^^^^^^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/parallel_state.py", line 1450, in init_model_parallel_group
+ return GroupCoordinator(
+ ^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/parallel_state.py", line 357, in __init__
+ self.pynccl_comm = PyNcclCommunicator(
+ ^^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/device_communicators/pynccl.py", line 113, in __init__
+ self.comm: ncclComm_t = self.nccl.ncclCommInitRank(
+ ^^^^^^^^^^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/device_communicators/pynccl_wrapper.py", line 401, in ncclCommInitRank
+ self.NCCL_CHECK(
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/device_communicators/pynccl_wrapper.py", line 376, in NCCL_CHECK
+ raise RuntimeError(f"NCCL error: {error_str}")
+RuntimeError: NCCL error: unhandled system error (run with NCCL_DEBUG=INFO for details)
+
+[2026-03-07 15:24:29] Received sigquit from a child process. It usually means the child failed.
diff --git a/syxin/start_server.sh b/syxin/start_server.sh
new file mode 100644
index 0000000000000000000000000000000000000000..a33c20458b6f6ee51021f51be80ff50841f7f633
--- /dev/null
+++ b/syxin/start_server.sh
@@ -0,0 +1,42 @@
+#!/bin/bash
+# Step 2: Launch SGLang server with STANDALONE speculative decoding.
+# Usage:
+# bash start_server.sh
+# bash start_server.sh 8 # use tp=8
+
+set -e
+
+TP=${1:-2}
+
+BASE_MODEL=/workspace/models/Qwen3-8B
+MERGED=/workspace/hanrui/syxin_old/Specforge/outputs/qwen3-8b-dflash-lora-merged
+INTRANET_IP=10.1.1.131
+PORT=30000
+
+if [ ! -d "$MERGED" ]; then
+ echo "[ERROR] Merged model not found: $MERGED"
+ echo " Run: conda activate sglang && python3 merge_lora.py"
+ exit 1
+fi
+
+echo "============================================"
+echo " SGLang STANDALONE Speculative Decoding"
+echo " target : $BASE_MODEL"
+echo " draft : $MERGED"
+echo " host : $INTRANET_IP:$PORT"
+echo " tp : $TP"
+echo "============================================"
+
+/workspace/miniconda3/envs/sglang/bin/python3 -m sglang.launch_server \
+ --model-path $BASE_MODEL \
+ --speculative-algorithm STANDALONE \
+ --speculative-draft-model-path $MERGED \
+ --speculative-num-steps 4 \
+ --speculative-eagle-topk 1 \
+ --speculative-num-draft-tokens 4 \
+ --tp-size $TP \
+ --mem-fraction-static 0.30 \
+ --trust-remote-code \
+ --host $INTRANET_IP \
+ --port $PORT \
+ --dtype bfloat16
diff --git a/syxin/start_server_dflash.sh b/syxin/start_server_dflash.sh
new file mode 100644
index 0000000000000000000000000000000000000000..6f4ee6ce894fa333d6a98558dad606c175968571
--- /dev/null
+++ b/syxin/start_server_dflash.sh
@@ -0,0 +1,54 @@
+#!/bin/bash
+# Evaluate DFlash-LoRA-Inject: measure accepted length OFFLINE (no server is started).
+# 8 GPUs in parallel by default; each GPU runs a shard of the prompts independently.
+#
+# WHY offline?
+#   sglang STANDALONE treats the draft as an independent autoregressive model,
+#   completely ignoring the layer-by-layer injection that LoRA-Inject was
+#   trained with. Result: accept_length ≈ 4.7 for ALL models (no signal).
+#
+#   sglang DFLASH expects the DFlash-b16 architecture (5-layer, fc+hidden_norm),
+#   which is structurally different from LoRA-Inject (full 36-layer + LoRA).
+#
+# So we run offline spec-generate with the correct injection pattern.
+#
+# Usage (first argument = GPU count; everything after it is forwarded verbatim):
+#   bash start_server_dflash.sh                      # 8 GPUs, all benchmarks
+#   bash start_server_dflash.sh 4                    # 4 GPUs
+#   bash start_server_dflash.sh 8 humaneval          # specific benchmark
+#   bash start_server_dflash.sh 8 --num-samples 20   # quick test
+
+set -e  # abort on the first failing command
+# Absolute directory of this script, so the eval script is found from any cwd.
+SCRIPT_DIR=$(cd -- "$(dirname -- "${BASH_SOURCE[0]}")" &>/dev/null && pwd)
+
+NUM_GPUS=${1:-8}  # number of worker processes to spawn (default 8)
+shift 2>/dev/null || true  # drop $1 if given; with no arguments shift fails, which is ignored
+
+# ---- defaults (hard-coded model, adapter, checkpoint and output locations) ----
+BASE_MODEL=/workspace/models/Qwen3-8B
+ADAPTER_ROOT=/workspace/hanrui/syxin_old/Specforge/outputs/qwen3-8b-dflash-lora-inject
+CKPT=epoch_3_step_1400
+MERGED=/workspace/hanrui/syxin_old/Specforge/outputs/qwen3-8b-dflash-lora-inject-merged
+RESULT_DIR=/workspace/hanrui/syxin_old/Specforge/benchmarks/results
+PYTHON=/workspace/miniconda3/envs/spec/bin/python3
+
+echo "============================================"
+echo " DFlash-LoRA-Inject Offline Evaluation"
+echo " target : $BASE_MODEL"
+echo " ckpt : $CKPT"
+echo " merged : $MERGED"
+echo " GPUs : $NUM_GPUS"
+echo "============================================"
+# Expansions are quoted so paths with spaces survive; "$@" appends the remaining CLI args last.
+"$PYTHON" -m torch.distributed.run \
+    --standalone \
+    --nproc_per_node "$NUM_GPUS" \
+    "$SCRIPT_DIR/eval_dflash_lora_inject.py" \
+    --base-model "$BASE_MODEL" \
+    --adapter-root "$ADAPTER_ROOT" \
+    --ckpt "$CKPT" \
+    --merged-path "$MERGED" \
+    --block-size 16 \
+    --output-dir "$RESULT_DIR" \
+    "$@"
diff --git a/syxin/step1.md b/syxin/step1.md
new file mode 100644
index 0000000000000000000000000000000000000000..76984c1000dac6765c033cca50a23deb199fe06d
--- /dev/null
+++ b/syxin/step1.md
@@ -0,0 +1,139 @@
+Now I have a complete picture. Here's the full analysis and proposed plan.
+
+ ---
+ Current Logic of train_dflash.py
+
+ This script trains a small, standalone DFlash draft model (1–10 transformer layers) that learns to predict token blocks in parallel,
+ guided by hidden states extracted from a frozen target model.
+
+ Architecture (two separate models)
+
+ 1. Target model (frozen, e.g. Qwen3-8B/32B) — runs a full forward pass to produce hidden states at selected layers.
+ 2. Draft model (DFlashDraftModel, ~1–10 layers) — a lightweight Qwen3-based decoder that takes noise embeddings + target hidden states
+ and predicts the block tokens.
+ 3. Target embed_tokens + lm_head — loaded separately via TargetEmbeddingsAndHead to avoid duplicating the full target model in memory.
+
+ Key locations
+
+ ┌──────────────────────────┬────────────────────────────────────┬───────────────────────────────────────────────────────┐
+ │ Component │ File │ Lines │
+ ├──────────────────────────┼────────────────────────────────────┼───────────────────────────────────────────────────────┤
+ │ Model init │ scripts/train_dflash.py │ build_models() L254–311 │
+ ├──────────────────────────┼────────────────────────────────────┼───────────────────────────────────────────────────────┤
+ │ Target hidden extraction │ scripts/train_dflash.py │ L644–647 (target_model.generate_dflash_data) │
+ ├──────────────────────────┼────────────────────────────────────┼───────────────────────────────────────────────────────┤
+ │ Forward pass │ specforge/core/dflash.py │ OnlineDFlashModel.forward() L243–332 │
+ ├──────────────────────────┼────────────────────────────────────┼───────────────────────────────────────────────────────┤
+ │ Loss calculation │ specforge/core/dflash.py │ _full_lm_loss() L382–417, _chunked_lm_loss() L419–478 │
+ ├──────────────────────────┼────────────────────────────────────┼───────────────────────────────────────────────────────┤
+ │ Loss mask │ specforge/core/dflash.py │ create_dflash_loss_mask() L481–509 │
+ ├──────────────────────────┼────────────────────────────────────┼───────────────────────────────────────────────────────┤
+ │ Draft model architecture │ specforge/modeling/draft/dflash.py │ DFlashDraftModel L212–266 │
+ ├──────────────────────────┼────────────────────────────────────┼───────────────────────────────────────────────────────┤
+ │ DFlash attention │ specforge/modeling/draft/dflash.py │ Qwen3DFlashAttention L42–134 │
+ └──────────────────────────┴────────────────────────────────────┴───────────────────────────────────────────────────────┘
+
+ Forward pass flow (per training step)
+
+ input_ids, attention_mask, loss_mask → target_model.generate_dflash_data()
+ ↓
+ hidden_states (from target layers [1,9,17,25,33])
+ ↓
+ OnlineDFlashModel.forward():
+ 1. Truncate to block boundary
+ 2. prepare_noise_input(): anchor tokens kept, rest → MASK
+ 3. embed_tokens(noise_input_ids) → noise_embedding
+ 4. Build DFlash attention mask (flex_attention or additive)
+ 5. draft_model(noise_embedding, target_hidden, mask)
+ 6. lm_head(hidden) → logits
+ 7. CE loss on non-anchor positions (weighted by loss_mask × decay)
+
+ The draft model's custom Qwen3DFlashAttention concatenates [context_hidden, noise_hidden] as KV, with queries only from noise tokens. The
+ attention mask enforces: block tokens see all preceding blocks' context + bidirectional within their own block.
+
+ ---
+ What already exists: train_dflash_lora.py
+
+ Interestingly, the repo already has a LoRA variant at scripts/train_dflash_lora.py with its own model (DFlashLoRADraftModel) and wrapper
+ (OnlineDFlashLoRAModel). This is exactly the approach you described — Qwen3-8B + LoRA, no separate target model, 1-step diffusion
+ training. The key differences from train_dflash.py:
+
+ ┌─────────────────┬─────────────────────────────────────────────────────────────┬────────────────────────────────────────────────────┐
+ │ Aspect │ train_dflash.py │ train_dflash_lora.py │
+ ├─────────────────┼─────────────────────────────────────────────────────────────┼────────────────────────────────────────────────────┤
+ │ Draft model │ Small custom DFlashDraftModel (1–10 layers) │ Full Qwen3-8B + LoRA adapters │
+ ├─────────────────┼─────────────────────────────────────────────────────────────┼────────────────────────────────────────────────────┤
+ │ Target model │ Separate frozen model for hidden state extraction │ None — model uses its own representations │
+ ├─────────────────┼─────────────────────────────────────────────────────────────┼────────────────────────────────────────────────────┤
+ │ Attention │ Custom Qwen3DFlashAttention (Q from noise, KV from [ctx, │ Standard HF attention with 4D additive DFlash mask │
+ │ │ noise]) │ │
+ ├─────────────────┼─────────────────────────────────────────────────────────────┼────────────────────────────────────────────────────┤
+ │ Forward │ draft_model(noise_emb, target_hidden, mask) │ model(noise_input_ids, 4d_mask, position_ids) → │
+ │ │ │ logits │
+ ├─────────────────┼─────────────────────────────────────────────────────────────┼────────────────────────────────────────────────────┤
+ │ Trainable │ All draft model params │ Only LoRA (q/k/v/o_proj), base frozen │
+ │ params │ │ │
+ ├─────────────────┼─────────────────────────────────────────────────────────────┼────────────────────────────────────────────────────┤
+ │ FSDP strategy │ SHARD_GRAD_OP │ FULL_SHARD │
+ └─────────────────┴─────────────────────────────────────────────────────────────┴────────────────────────────────────────────────────┘
+
+ ---
+ Proposed Modification Plan
+
+ Since train_dflash_lora.py already implements the core idea, the plan focuses on what's missing or needs improvement to make it a proper
+ "1-step dLLM draft model" for your research:
+
+ Phase 1: Validate and extend the existing LoRA pipeline
+
+ 1. Add MLP to LoRA targets — The current config only targets q_proj, k_proj, v_proj, o_proj. For stronger 1-step diffusion capability,
+ add gate_proj, up_proj, down_proj to lora_target_modules. This gives the model more capacity to learn the non-autoregressive distribution
+ shift.
+ 2. Add multi-step noise schedule support — Currently the training is strictly 1-step (all non-anchors → MASK). For a proper diffusion/AR
+ fusion, add an option for a noise schedule where a fraction of block tokens are revealed (not just the anchor), controlled by a
+ noise_ratio parameter. This would modify prepare_noise_input() in OnlineDFlashLoRAModel:
+ # Instead of: all non-anchor → MASK
+ # Allow: randomly keep some non-anchor tokens with probability (1 - noise_ratio)
+ 3. Add configurable context_len strategy — Currently context_len=0 treats the whole sequence as blocks. Add a --context-ratio arg that
+ dynamically sets context_len as a fraction of the sequence, so the model learns to condition on varying amounts of AR-decoded prefix.
+
+ Phase 2: Training logic improvements
+
+ 4. Add KL divergence loss — In addition to CE loss against ground truth, add an optional KL loss against the base model's AR distribution
+ (teacher forcing). This regularizes the LoRA model to stay close to the original Qwen3-8B distribution. Modify
+ OnlineDFlashLoRAModel.forward():
+ # Compute base model logits (no_grad, no LoRA) as teacher
+ # KL(draft_logits || teacher_logits) on block positions
+ # total_loss = ce_loss + kl_weight * kl_loss
+ 5. Add evaluation with speculative decoding metrics — The current accuracy metric is block-wise acceptance rate. Add an eval loop that
+ actually runs speculative decoding (draft → verify) to measure real speedup, using the LoRA model as the drafter and the base model (with
+ LoRA disabled) as the verifier.
+
+ Phase 3: Integration with train_dflash.py style features
+
+ 6. Port random anchor sampling — train_dflash.py has --random-anchor (L147–156) which samples diverse anchor positions per sequence. This
+ is missing from the LoRA variant and would improve training diversity. Port _sample_anchor_positions and _build_blocks_from_anchors from
+ OnlineDFlashModel to OnlineDFlashLoRAModel.
+ 7. Port chunked lm_head — The LoRA variant materializes full [bsz, seq_len, vocab_size] logits. For Qwen3-8B's ~152K vocab, this is ~1.2GB
+ per sample at seq_len=2048 in fp32 (~0.6GB in bf16). Port the _chunked_lm_loss from OnlineDFlashModel for memory efficiency.
+ 8. Add tensor parallelism support — The LoRA script currently forces tp_size=1. For Qwen3-8B on multi-GPU setups, add TP support to shard
+ the base model across GPUs while keeping LoRA params on each rank.
+
+ Minimal starting point
+
+ If you want to just get training running immediately, the existing train_dflash_lora.py + configs/qwen3-8b-dflash-lora.json should work
+ out of the box:
+
+ torchrun --nproc_per_node=4 scripts/train_dflash_lora.py \
+ --model-path Qwen/Qwen3-8B \
+ --lora-config configs/qwen3-8b-dflash-lora.json \
+ --train-data-path /path/to/data.jsonl \
+ --output-dir ./outputs/qwen3-8b-dflash-lora \
+ --block-size 16 \
+ --gradient-checkpointing \
+ --learning-rate 2e-4 \
+ --batch-size 1 \
+ --max-length 2048 \
+ --num-epochs 3
+
+ Want me to start implementing any of these phases? I'd suggest starting with Phase 1 (noise schedule + MLP targets) since that's the most
+ impactful for the diffusion/AR fusion research angle.
\ No newline at end of file
diff --git a/syxin/training.log b/syxin/training.log
new file mode 100644
index 0000000000000000000000000000000000000000..77201ad0c9ea32123830c750c52f4233a882e15c
--- /dev/null
+++ b/syxin/training.log
@@ -0,0 +1,118 @@
+nohup: ignoring input
+
+*****************************************
+Setting OMP_NUM_THREADS environment variable for each process to be 1 in default, to avoid your system being overloaded, please further tune the variable for optimal performance in your application as needed.
+*****************************************
+Set TORCH_CUDA_ARCH_LIST to 9.0
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+Set TORCH_CUDA_ARCH_LIST to 9.0
+Set TORCH_CUDA_ARCH_LIST to 9.0
+Set TORCH_CUDA_ARCH_LIST to 9.0
+Set TORCH_CUDA_ARCH_LIST to 9.0
+Set TORCH_CUDA_ARCH_LIST to 9.0
+Set TORCH_CUDA_ARCH_LIST to 9.0
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+Set TORCH_CUDA_ARCH_LIST to 9.0
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+`torch_dtype` is deprecated! Use `dtype` instead!
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+`torch_dtype` is deprecated! Use `dtype` instead!
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]`torch_dtype` is deprecated! Use `dtype` instead!
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+`torch_dtype` is deprecated! Use `dtype` instead!
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+`torch_dtype` is deprecated! Use `dtype` instead!
+`torch_dtype` is deprecated! Use `dtype` instead!
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+`torch_dtype` is deprecated! Use `dtype` instead!
+`torch_dtype` is deprecated! Use `dtype` instead!
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:09, 2.43s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:10, 2.56s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:10, 2.52s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:10, 2.55s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:10, 2.57s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:09, 2.50s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:10, 2.52s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:10, 2.70s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:04<00:07, 2.41s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:07, 2.52s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:07, 2.58s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:07, 2.60s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:07, 2.59s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:07, 2.58s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:07, 2.57s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:08, 2.80s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:07<00:04, 2.38s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:07<00:04, 2.49s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:07<00:04, 2.49s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:07<00:05, 2.52s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:07<00:05, 2.51s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:07<00:05, 2.53s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:07<00:05, 2.51s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:08<00:05, 2.71s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:08<00:02, 2.14s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:09<00:02, 2.26s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:09<00:00, 1.59s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:09<00:00, 1.91s/it]
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 138.33it/s]
+
Loading checkpoint shards: 80%|████████ | 4/5 [00:09<00:02, 2.23s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:09<00:02, 2.23s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 1.73s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 2.04s/it]
+
Loading checkpoint shards: 80%|████████ | 4/5 [00:09<00:02, 2.30s/it]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 80%|████████ | 4/5 [00:09<00:02, 2.31s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:09<00:02, 2.32s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 134.33it/s]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 1.67s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 2.01s/it]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 1.67s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 2.01s/it]
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 133.65it/s]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 138.59it/s]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 1.72s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 2.05s/it]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 1.72s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 2.06s/it]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 1.73s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 2.06s/it]
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 80%|████████ | 4/5 [00:10<00:02, 2.47s/it]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 138.20it/s]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 139.54it/s]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 134.23it/s]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 1.82s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 2.19s/it]
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 134.21it/s]
+trainable params: 15,335,424 || all params: 8,206,070,784 || trainable%: 0.1869
+trainable params: 15,335,424 || all params: 8,206,070,784 || trainable%: 0.1869
+trainable params: 15,335,424 || all params: 8,206,070,784 || trainable%: 0.1869
+trainable params: 15,335,424 || all params: 8,206,070,784 || trainable%: 0.1869
+trainable params: 15,335,424 || all params: 8,206,070,784 || trainable%: 0.1869
+trainable params: 15,335,424 || all params: 8,206,070,784 || trainable%: 0.1869
+trainable params: 15,335,424 || all params: 8,206,070,784 || trainable%: 0.1869
+trainable params: 15,335,424 || all params: 8,206,070,784 || trainable%: 0.1869
+dataset is cached at /tmp/specforge_cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkl
+/workspace/hanrui/specforge/lib/python3.11/site-packages/torch/distributed/distributed_c10d.py:4876: UserWarning: barrier(): using the device under current context. You can specify `device_id` in `init_process_group` to mute this warning.
+ warnings.warn( # warn only once
+[rank0]:[W310 08:22:07.434083485 ProcessGroupNCCL.cpp:5072] Guessing device ID based on global rank. This can cause a hang if rank to GPU mapping is heterogeneous. You can specify device_id in init_process_group()
+dataset is cached at /tmp/specforge_cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkldataset is cached at /tmp/specforge_cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkldataset is cached at /tmp/specforge_cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkl
+
+
+dataset is cached at /tmp/specforge_cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkl
+dataset is cached at /tmp/specforge_cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkl
+dataset is cached at /tmp/specforge_cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkl
+dataset is cached at /tmp/specforge_cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkl
+
Epoch 0: 0%| | 0/12384 [00:00, ?it/s]
Epoch 0: 0%| | 0/12384 [00:08, ?it/s, loss=11.4616, acc=0.0002, iter_time=7.95s]
Epoch 0: 0%| | 1/12384 [00:08<28:52:24, 8.39s/it, loss=11.4616, acc=0.0002, iter_time=7.95s]
Epoch 0: 0%| | 1/12384 [00:16<28:52:24, 8.39s/it, loss=10.6726, acc=0.0003, iter_time=6.47s]
Epoch 0: 0%| | 2/12384 [00:16<27:23:24, 7.96s/it, loss=10.6726, acc=0.0003, iter_time=6.47s]
Epoch 0: 0%| | 2/12384 [00:23<27:23:24, 7.96s/it, loss=10.4985, acc=0.0011, iter_time=8.86s]
Epoch 0: 0%| | 3/12384 [00:23<26:55:47, 7.83s/it, loss=10.4985, acc=0.0011, iter_time=8.86s]
Epoch 0: 0%| | 3/12384 [00:31<26:55:47, 7.83s/it, loss=12.4512, acc=0.0002, iter_time=4.60s]
Epoch 0: 0%| | 4/12384 [00:31<26:42:04, 7.76s/it, loss=12.4512, acc=0.0002, iter_time=4.60s]
Epoch 0: 0%| | 4/12384 [00:39<26:42:04, 7.76s/it, loss=10.6913, acc=0.0007, iter_time=10.74s]
Epoch 0: 0%| | 5/12384 [00:39<26:37:07, 7.74s/it, loss=10.6913, acc=0.0007, iter_time=10.74s]
Epoch 0: 0%| | 5/12384 [00:46<26:37:07, 7.74s/it, loss=10.7935, acc=0.0006, iter_time=7.67s]
Epoch 0: 0%| | 6/12384 [00:46<26:30:41, 7.71s/it, loss=10.7935, acc=0.0006, iter_time=7.67s]
Epoch 0: 0%| | 6/12384 [00:54<26:30:41, 7.71s/it, loss=12.5651, acc=0.0002, iter_time=7.69s]
Epoch 0: 0%| | 7/12384 [00:54<26:29:17, 7.70s/it, loss=12.5651, acc=0.0002, iter_time=7.69s]
Epoch 0: 0%| | 7/12384 [01:02<26:29:17, 7.70s/it, loss=11.6807, acc=0.0003, iter_time=8.32s]
Epoch 0: 0%| | 8/12384 [01:02<26:39:38, 7.76s/it, loss=11.6807, acc=0.0003, iter_time=8.32s]
Epoch 0: 0%| | 8/12384 [01:09<26:39:38, 7.76s/it, loss=11.3789, acc=0.0005, iter_time=4.95s]
Epoch 0: 0%| | 9/12384 [01:09<26:32:57, 7.72s/it, loss=11.3789, acc=0.0005, iter_time=4.95s]
Epoch 0: 0%| | 9/12384 [01:17<26:32:57, 7.72s/it, loss=10.5343, acc=0.0003, iter_time=10.35s]
Epoch 0: 0%| | 10/12384 [01:17<26:52:52, 7.82s/it, loss=10.5343, acc=0.0003, iter_time=10.35s]
Epoch 0: 0%| | 10/12384 [01:25<26:52:52, 7.82s/it, loss=11.6157, acc=0.0004, iter_time=7.60s]
Epoch 0: 0%| | 11/12384 [01:25<26:39:20, 7.76s/it, loss=11.6157, acc=0.0004, iter_time=7.60s]
Epoch 0: 0%| | 11/12384 [01:33<26:39:20, 7.76s/it, loss=11.2005, acc=0.0002, iter_time=7.61s]
Epoch 0: 0%| | 12/12384 [01:33<26:30:56, 7.72s/it, loss=11.2005, acc=0.0002, iter_time=7.61s]
Epoch 0: 0%| | 12/12384 [01:40<26:30:56, 7.72s/it, loss=11.8510, acc=0.0011, iter_time=5.03s]
Epoch 0: 0%| | 13/12384 [01:40<26:28:03, 7.70s/it, loss=11.8510, acc=0.0011, iter_time=5.03s]
Epoch 0: 0%| | 13/12384 [01:48<26:28:03, 7.70s/it, loss=12.6667, acc=0.0004, iter_time=8.56s]
Epoch 0: 0%| | 14/12384 [01:48<26:24:01, 7.68s/it, loss=12.6667, acc=0.0004, iter_time=8.56s]
Epoch 0: 0%| | 14/12384 [01:56<26:24:01, 7.68s/it, loss=11.3266, acc=0.0002, iter_time=9.36s]
Epoch 0: 0%| | 15/12384 [01:56<26:21:37, 7.67s/it, loss=11.3266, acc=0.0002, iter_time=9.36s]
Epoch 0: 0%| | 15/12384 [02:03<26:21:37, 7.67s/it, loss=12.2026, acc=0.0000, iter_time=7.61s]
Epoch 0: 0%| | 16/12384 [02:03<26:18:20, 7.66s/it, loss=12.2026, acc=0.0000, iter_time=7.61s]
Epoch 0: 0%| | 16/12384 [02:11<26:18:20, 7.66s/it, loss=10.7707, acc=0.0003, iter_time=6.47s]
Epoch 0: 0%| | 17/12384 [02:11<26:16:34, 7.65s/it, loss=10.7707, acc=0.0003, iter_time=6.47s]
Epoch 0: 0%| | 17/12384 [02:19<26:16:34, 7.65s/it, loss=10.9714, acc=0.0001, iter_time=8.84s]
Epoch 0: 0%| | 18/12384 [02:19<26:15:13, 7.64s/it, loss=10.9714, acc=0.0001, iter_time=8.84s]
Epoch 0: 0%| | 18/12384 [02:26<26:15:13, 7.64s/it, loss=11.0658, acc=0.0002, iter_time=6.42s]
Epoch 0: 0%| | 19/12384 [02:26<26:18:08, 7.66s/it, loss=11.0658, acc=0.0002, iter_time=6.42s]
Epoch 0: 0%| | 19/12384 [02:34<26:18:08, 7.66s/it, loss=10.9882, acc=0.0011, iter_time=8.88s]
Epoch 0: 0%| | 20/12384 [02:34<26:18:16, 7.66s/it, loss=10.9882, acc=0.0011, iter_time=8.88s]
Epoch 0: 0%| | 20/12384 [02:42<26:18:16, 7.66s/it, loss=11.3002, acc=0.0000, iter_time=7.65s]
Epoch 0: 0%| | 21/12384 [02:42<26:14:15, 7.64s/it, loss=11.3002, acc=0.0000, iter_time=7.65s]
Epoch 0: 0%| | 21/12384 [02:49<26:14:15, 7.64s/it, loss=10.9236, acc=0.0005, iter_time=7.62s]
Epoch 0: 0%| | 22/12384 [02:49<26:14:09, 7.64s/it, loss=10.9236, acc=0.0005, iter_time=7.62s]
Epoch 0: 0%| | 22/12384 [02:57<26:14:09, 7.64s/it, loss=11.6876, acc=0.0004, iter_time=7.64s]
Epoch 0: 0%| | 23/12384 [02:57<26:13:31, 7.64s/it, loss=11.6876, acc=0.0004, iter_time=7.64s]
Epoch 0: 0%| | 23/12384 [03:04<26:13:31, 7.64s/it, loss=10.1433, acc=0.0008, iter_time=8.02s]
Epoch 0: 0%| | 24/12384 [03:04<26:12:22, 7.63s/it, loss=10.1433, acc=0.0008, iter_time=8.02s]
Epoch 0: 0%| | 24/12384 [03:12<26:12:22, 7.63s/it, loss=11.4336, acc=0.0007, iter_time=7.26s]
Epoch 0: 0%| | 25/12384 [03:12<26:12:18, 7.63s/it, loss=11.4336, acc=0.0007, iter_time=7.26s]
Epoch 0: 0%| | 25/12384 [03:20<26:12:18, 7.63s/it, loss=11.4074, acc=0.0004, iter_time=7.63s]
Epoch 0: 0%| | 26/12384 [03:20<26:12:54, 7.64s/it, loss=11.4074, acc=0.0004, iter_time=7.63s]
Epoch 0: 0%| | 26/12384 [03:27<26:12:54, 7.64s/it, loss=11.0375, acc=0.0009, iter_time=7.64s]
Epoch 0: 0%| | 27/12384 [03:27<26:12:45, 7.64s/it, loss=11.0375, acc=0.0009, iter_time=7.64s]
Epoch 0: 0%| | 27/12384 [03:35<26:12:45, 7.64s/it, loss=13.4672, acc=0.0000, iter_time=4.34s]
Epoch 0: 0%| | 28/12384 [03:35<26:12:58, 7.64s/it, loss=13.4672, acc=0.0000, iter_time=4.34s]
Epoch 0: 0%| | 28/12384 [03:43<26:12:58, 7.64s/it, loss=10.7064, acc=0.0000, iter_time=10.95s]
Epoch 0: 0%| | 29/12384 [03:43<26:15:30, 7.65s/it, loss=10.7064, acc=0.0000, iter_time=10.95s]
Epoch 0: 0%| | 29/12384 [03:50<26:15:30, 7.65s/it, loss=10.6316, acc=0.0007, iter_time=7.05s]
Epoch 0: 0%| | 30/12384 [03:50<26:15:49, 7.65s/it, loss=10.6316, acc=0.0007, iter_time=7.05s]
Epoch 0: 0%| | 30/12384 [03:58<26:15:49, 7.65s/it, loss=10.6725, acc=0.0005, iter_time=8.31s]
Epoch 0: 0%| | 31/12384 [03:58<26:18:34, 7.67s/it, loss=10.6725, acc=0.0005, iter_time=8.31s]
Epoch 0: 0%| | 31/12384 [04:06<26:18:34, 7.67s/it, loss=11.1389, acc=0.0004, iter_time=8.08s]
Epoch 0: 0%| | 32/12384 [04:06<26:18:20, 7.67s/it, loss=11.1389, acc=0.0004, iter_time=8.08s]
Epoch 0: 0%| | 32/12384 [04:13<26:18:20, 7.67s/it, loss=11.0649, acc=0.0006, iter_time=7.25s]
Epoch 0: 0%| | 33/12384 [04:13<26:16:12, 7.66s/it, loss=11.0649, acc=0.0006, iter_time=7.25s]
Epoch 0: 0%| | 33/12384 [04:21<26:16:12, 7.66s/it, loss=10.9385, acc=0.0015, iter_time=7.64s]
Epoch 0: 0%| | 34/12384 [04:21<26:16:33, 7.66s/it, loss=10.9385, acc=0.0015, iter_time=7.64s]
Epoch 0: 0%| | 34/12384 [04:29<26:16:33, 7.66s/it, loss=11.5272, acc=0.0016, iter_time=5.92s]
Epoch 0: 0%| | 35/12384 [04:29<26:15:45, 7.66s/it, loss=11.5272, acc=0.0016, iter_time=5.92s]
Epoch 0: 0%| | 35/12384 [04:37<26:15:45, 7.66s/it, loss=10.9093, acc=0.0003, iter_time=9.69s]
Epoch 0: 0%| | 36/12384 [04:37<26:32:15, 7.74s/it, loss=10.9093, acc=0.0003, iter_time=9.69s]
Epoch 0: 0%| | 36/12384 [04:45<26:32:15, 7.74s/it, loss=12.0866, acc=0.0007, iter_time=7.66s]
Epoch 0: 0%| | 37/12384 [04:45<26:49:10, 7.82s/it, loss=12.0866, acc=0.0007, iter_time=7.66s]
Epoch 0: 0%| | 37/12384 [04:52<26:49:10, 7.82s/it, loss=12.0058, acc=0.0010, iter_time=4.01s]
Epoch 0: 0%| | 38/12384 [04:52<26:39:22, 7.77s/it, loss=12.0058, acc=0.0010, iter_time=4.01s]
Epoch 0: 0%| | 38/12384 [05:00<26:39:22, 7.77s/it, loss=11.0774, acc=0.0005, iter_time=11.59s]
Epoch 0: 0%| | 39/12384 [05:00<26:30:19, 7.73s/it, loss=11.0774, acc=0.0005, iter_time=11.59s]
Epoch 0: 0%| | 39/12384 [05:07<26:30:19, 7.73s/it, loss=11.2613, acc=0.0001, iter_time=8.04s]
Epoch 0: 0%| | 40/12384 [05:07<26:25:19, 7.71s/it, loss=11.2613, acc=0.0001, iter_time=8.04s]
Epoch 0: 0%| | 40/12384 [05:15<26:25:19, 7.71s/it, loss=10.6729, acc=0.0005, iter_time=7.24s]
Epoch 0: 0%| | 41/12384 [05:15<26:20:47, 7.68s/it, loss=10.6729, acc=0.0005, iter_time=7.24s]
Epoch 0: 0%| | 41/12384 [05:23<26:20:47, 7.68s/it, loss=10.2672, acc=0.0007, iter_time=7.62s]
Epoch 0: 0%| | 42/12384 [05:23<26:15:46, 7.66s/it, loss=10.2672, acc=0.0007, iter_time=7.62s]
Epoch 0: 0%| | 42/12384 [05:30<26:15:46, 7.66s/it, loss=11.5034, acc=0.0001, iter_time=7.04s]
Epoch 0: 0%| | 43/12384 [05:30<26:15:27, 7.66s/it, loss=11.5034, acc=0.0001, iter_time=7.04s]
Epoch 0: 0%| | 43/12384 [05:38<26:15:27, 7.66s/it, loss=11.4143, acc=0.0005, iter_time=8.24s]
Epoch 0: 0%| | 44/12384 [05:38<26:12:08, 7.64s/it, loss=11.4143, acc=0.0005, iter_time=8.24s]
Epoch 0: 0%| | 44/12384 [05:46<26:12:08, 7.64s/it, loss=11.8333, acc=0.0000, iter_time=7.62s]
Epoch 0: 0%| | 45/12384 [05:46<26:10:39, 7.64s/it, loss=11.8333, acc=0.0000, iter_time=7.62s]
Epoch 0: 0%| | 45/12384 [05:53<26:10:39, 7.64s/it, loss=12.4923, acc=0.0009, iter_time=4.75s]
Epoch 0: 0%| | 46/12384 [05:53<26:10:04, 7.64s/it, loss=12.4923, acc=0.0009, iter_time=4.75s]
Epoch 0: 0%| | 46/12384 [06:01<26:10:04, 7.64s/it, loss=10.7213, acc=0.0009, iter_time=10.48s]
Epoch 0: 0%| | 47/12384 [06:01<26:09:32, 7.63s/it, loss=10.7213, acc=0.0009, iter_time=10.48s]
Epoch 0: 0%| | 47/12384 [06:08<26:09:32, 7.63s/it, loss=11.5314, acc=0.0005, iter_time=8.04s]
Epoch 0: 0%| | 48/12384 [06:08<26:08:16, 7.63s/it, loss=11.5314, acc=0.0005, iter_time=8.04s]
Epoch 0: 0%| | 48/12384 [06:16<26:08:16, 7.63s/it, loss=12.5196, acc=0.0004, iter_time=5.45s]
Epoch 0: 0%| | 49/12384 [06:16<26:10:43, 7.64s/it, loss=12.5196, acc=0.0004, iter_time=5.45s]
Epoch 0: 0%| | 49/12384 [06:24<26:10:43, 7.64s/it, loss=12.3785, acc=0.0006, iter_time=9.85s]
Epoch 0: 0%| | 50/12384 [06:24<26:09:30, 7.64s/it, loss=12.3785, acc=0.0006, iter_time=9.85s]
Epoch 0: 0%| | 50/12384 [06:31<26:09:30, 7.64s/it, loss=11.2568, acc=0.0005, iter_time=4.59s]
Epoch 0: 0%| | 51/12384 [06:31<26:09:54, 7.64s/it, loss=11.2568, acc=0.0005, iter_time=4.59s]
Epoch 0: 0%| | 51/12384 [06:39<26:09:54, 7.64s/it, loss=12.6810, acc=0.0005, iter_time=9.62s]
Epoch 0: 0%| | 52/12384 [06:39<26:08:42, 7.63s/it, loss=12.6810, acc=0.0005, iter_time=9.62s]
Epoch 0: 0%| | 52/12384 [06:47<26:08:42, 7.63s/it, loss=11.2767, acc=0.0006, iter_time=8.28s]
Epoch 0: 0%| | 53/12384 [06:47<26:07:18, 7.63s/it, loss=11.2767, acc=0.0006, iter_time=8.28s]
Epoch 0: 0%| | 53/12384 [06:54<26:07:18, 7.63s/it, loss=12.0088, acc=0.0004, iter_time=4.82s]
Epoch 0: 0%| | 54/12384 [06:54<26:06:35, 7.62s/it, loss=12.0088, acc=0.0004, iter_time=4.82s]
Epoch 0: 0%| | 54/12384 [07:02<26:06:35, 7.62s/it, loss=12.1385, acc=0.0004, iter_time=10.43s]
Epoch 0: 0%| | 55/12384 [07:02<26:07:25, 7.63s/it, loss=12.1385, acc=0.0004, iter_time=10.43s]
Epoch 0: 0%| | 55/12384 [07:10<26:07:25, 7.63s/it, loss=10.7962, acc=0.0001, iter_time=8.01s]
Epoch 0: 0%| | 56/12384 [07:10<26:12:48, 7.65s/it, loss=10.7962, acc=0.0001, iter_time=8.01s]
Epoch 0: 0%| | 56/12384 [07:17<26:12:48, 7.65s/it, loss=11.5871, acc=0.0005, iter_time=6.45s]
Epoch 0: 0%| | 57/12384 [07:17<26:10:12, 7.64s/it, loss=11.5871, acc=0.0005, iter_time=6.45s]
Epoch 0: 0%| | 57/12384 [07:25<26:10:12, 7.64s/it, loss=14.1009, acc=0.0005, iter_time=5.16s]
Epoch 0: 0%| | 58/12384 [07:25<26:10:08, 7.64s/it, loss=14.1009, acc=0.0005, iter_time=5.16s]
Epoch 0: 0%| | 58/12384 [07:33<26:10:08, 7.64s/it, loss=10.7893, acc=0.0008, iter_time=10.96s]
Epoch 0: 0%| | 59/12384 [07:33<26:08:22, 7.64s/it, loss=10.7893, acc=0.0008, iter_time=10.96s]
Epoch 0: 0%| | 59/12384 [07:40<26:08:22, 7.64s/it, loss=10.9049, acc=0.0003, iter_time=7.62s]
Epoch 0: 0%| | 60/12384 [07:40<26:05:26, 7.62s/it, loss=10.9049, acc=0.0003, iter_time=7.62s]
Epoch 0: 0%| | 60/12384 [07:48<26:05:26, 7.62s/it, loss=11.4199, acc=0.0004, iter_time=6.67s]
Epoch 0: 0%| | 61/12384 [07:48<26:09:03, 7.64s/it, loss=11.4199, acc=0.0004, iter_time=6.67s]
Epoch 0: 0%| | 61/12384 [07:56<26:09:03, 7.64s/it, loss=13.1510, acc=0.0002, iter_time=7.12s]
Epoch 0: 1%| | 62/12384 [07:56<26:28:37, 7.74s/it, loss=13.1510, acc=0.0002, iter_time=7.12s]
Epoch 0: 1%| | 62/12384 [08:03<26:28:37, 7.74s/it, loss=10.5607, acc=0.0006, iter_time=9.46s]
Epoch 0: 1%| | 63/12384 [08:03<26:21:20, 7.70s/it, loss=10.5607, acc=0.0006, iter_time=9.46s]
Epoch 0: 1%| | 63/12384 [08:11<26:21:20, 7.70s/it, loss=11.2135, acc=0.0007, iter_time=7.68s]
Epoch 0: 1%| | 64/12384 [08:11<26:17:46, 7.68s/it, loss=11.2135, acc=0.0007, iter_time=7.68s]
Epoch 0: 1%| | 64/12384 [08:19<26:17:46, 7.68s/it, loss=11.6287, acc=0.0007, iter_time=7.01s]
Epoch 0: 1%| | 65/12384 [08:19<26:14:43, 7.67s/it, loss=11.6287, acc=0.0007, iter_time=7.01s]
Epoch 0: 1%| | 65/12384 [08:26<26:14:43, 7.67s/it, loss=11.7011, acc=0.0006, iter_time=8.20s]
Epoch 0: 1%| | 66/12384 [08:26<26:13:16, 7.66s/it, loss=11.7011, acc=0.0006, iter_time=8.20s]
Epoch 0: 1%| | 66/12384 [08:34<26:13:16, 7.66s/it, loss=11.1116, acc=0.0009, iter_time=7.66s]
Epoch 0: 1%| | 67/12384 [08:34<26:10:08, 7.65s/it, loss=11.1116, acc=0.0009, iter_time=7.66s]
Epoch 0: 1%| | 67/12384 [08:42<26:10:08, 7.65s/it, loss=10.5857, acc=0.0003, iter_time=7.62s]
Epoch 0: 1%| | 68/12384 [08:42<26:08:44, 7.64s/it, loss=10.5857, acc=0.0003, iter_time=7.62s]
Epoch 0: 1%| | 68/12384 [08:49<26:08:44, 7.64s/it, loss=12.2984, acc=0.0002, iter_time=6.42s]
Epoch 0: 1%| | 69/12384 [08:49<26:10:22, 7.65s/it, loss=12.2984, acc=0.0002, iter_time=6.42s]
Epoch 0: 1%| | 69/12384 [08:57<26:10:22, 7.65s/it, loss=10.6612, acc=0.0003, iter_time=8.87s]
Epoch 0: 1%| | 70/12384 [08:57<26:10:57, 7.65s/it, loss=10.6612, acc=0.0003, iter_time=8.87s]
Epoch 0: 1%| | 70/12384 [09:05<26:10:57, 7.65s/it, loss=10.8825, acc=0.0005, iter_time=7.65s]
Epoch 0: 1%| | 71/12384 [09:05<26:10:27, 7.65s/it, loss=10.8825, acc=0.0005, iter_time=7.65s]
Epoch 0: 1%| | 71/12384 [09:12<26:10:27, 7.65s/it, loss=10.7391, acc=0.0006, iter_time=8.04s]
Epoch 0: 1%| | 72/12384 [09:12<26:08:05, 7.64s/it, loss=10.7391, acc=0.0006, iter_time=8.04s]
Epoch 0: 1%| | 72/12384 [09:20<26:08:05, 7.64s/it, loss=12.1920, acc=0.0007, iter_time=5.13s]
Epoch 0: 1%| | 73/12384 [09:20<26:11:50, 7.66s/it, loss=12.1920, acc=0.0007, iter_time=5.13s]
Epoch 0: 1%| | 73/12384 [09:27<26:11:50, 7.66s/it, loss=10.5516, acc=0.0004, iter_time=9.80s]
Epoch 0: 1%| | 74/12384 [09:27<26:10:12, 7.65s/it, loss=10.5516, acc=0.0004, iter_time=9.80s]
Epoch 0: 1%| | 74/12384 [09:35<26:10:12, 7.65s/it, loss=10.1934, acc=0.0006, iter_time=7.66s]
Epoch 0: 1%| | 75/12384 [09:35<26:13:17, 7.67s/it, loss=10.1934, acc=0.0006, iter_time=7.66s]
Epoch 0: 1%| | 75/12384 [09:43<26:13:17, 7.67s/it, loss=11.6410, acc=0.0000, iter_time=7.04s]
Epoch 0: 1%| | 76/12384 [09:43<26:09:20, 7.65s/it, loss=11.6410, acc=0.0000, iter_time=7.04s]
Epoch 0: 1%| | 76/12384 [09:50<26:09:20, 7.65s/it, loss=10.9323, acc=0.0004, iter_time=7.31s]
Epoch 0: 1%| | 77/12384 [09:50<26:07:08, 7.64s/it, loss=10.9323, acc=0.0004, iter_time=7.31s]
Epoch 0: 1%| | 77/12384 [09:58<26:07:08, 7.64s/it, loss=11.0105, acc=0.0003, iter_time=8.54s]
Epoch 0: 1%| | 78/12384 [09:58<26:05:41, 7.63s/it, loss=11.0105, acc=0.0003, iter_time=8.54s]
Epoch 0: 1%| | 78/12384 [10:06<26:05:41, 7.63s/it, loss=10.8721, acc=0.0004, iter_time=7.63s]
Epoch 0: 1%| | 79/12384 [10:06<26:05:22, 7.63s/it, loss=10.8721, acc=0.0004, iter_time=7.63s]
Epoch 0: 1%| | 79/12384 [10:13<26:05:22, 7.63s/it, loss=11.3602, acc=0.0013, iter_time=7.61s]
Epoch 0: 1%| | 80/12384 [10:13<26:05:57, 7.64s/it, loss=11.3602, acc=0.0013, iter_time=7.61s]
Epoch 0: 1%| | 80/12384 [10:21<26:05:57, 7.64s/it, loss=12.4490, acc=0.0004, iter_time=4.84s]
Epoch 0: 1%| | 81/12384 [10:21<26:05:10, 7.63s/it, loss=12.4490, acc=0.0004, iter_time=4.84s]
Epoch 0: 1%| | 81/12384 [10:29<26:05:10, 7.63s/it, loss=11.2284, acc=0.0006, iter_time=10.44s]
Epoch 0: 1%| | 82/12384 [10:29<26:04:56, 7.63s/it, loss=11.2284, acc=0.0006, iter_time=10.44s]
Epoch 0: 1%| | 82/12384 [10:36<26:04:56, 7.63s/it, loss=11.5251, acc=0.0009, iter_time=7.66s]
Epoch 0: 1%| | 83/12384 [10:36<26:05:22, 7.64s/it, loss=11.5251, acc=0.0009, iter_time=7.66s]
Epoch 0: 1%| | 83/12384 [10:44<26:05:22, 7.64s/it, loss=11.2945, acc=0.0005, iter_time=7.31s]
Epoch 0: 1%| | 84/12384 [10:44<26:05:29, 7.64s/it, loss=11.2945, acc=0.0005, iter_time=7.31s]
Epoch 0: 1%| | 84/12384 [10:51<26:05:29, 7.64s/it, loss=10.4840, acc=0.0002, iter_time=7.96s]
Epoch 0: 1%| | 85/12384 [10:51<26:04:50, 7.63s/it, loss=10.4840, acc=0.0002, iter_time=7.96s]
Epoch 0: 1%| | 85/12384 [10:59<26:04:50, 7.63s/it, loss=10.6111, acc=0.0000, iter_time=7.63s]
Epoch 0: 1%| | 86/12384 [10:59<26:04:25, 7.63s/it, loss=10.6111, acc=0.0000, iter_time=7.63s]
Epoch 0: 1%| | 86/12384 [11:07<26:04:25, 7.63s/it, loss=10.8529, acc=0.0007, iter_time=7.63s]
Epoch 0: 1%| | 87/12384 [11:07<26:06:07, 7.64s/it, loss=10.8529, acc=0.0007, iter_time=7.63s]
Epoch 0: 1%| | 87/12384 [11:14<26:06:07, 7.64s/it, loss=11.2738, acc=0.0003, iter_time=8.06s]
Epoch 0: 1%| | 88/12384 [11:14<26:05:24, 7.64s/it, loss=11.2738, acc=0.0003, iter_time=8.06s]
Epoch 0: 1%| | 88/12384 [11:22<26:05:24, 7.64s/it, loss=11.2256, acc=0.0007, iter_time=5.78s]
Epoch 0: 1%| | 89/12384 [11:22<26:25:48, 7.74s/it, loss=11.2256, acc=0.0007, iter_time=5.78s]
Epoch 0: 1%| | 89/12384 [11:30<26:25:48, 7.74s/it, loss=11.0972, acc=0.0007, iter_time=9.42s]
Epoch 0: 1%| | 90/12384 [11:30<26:19:15, 7.71s/it, loss=11.0972, acc=0.0007, iter_time=9.42s]
Epoch 0: 1%| | 90/12384 [11:38<26:19:15, 7.71s/it, loss=10.9571, acc=0.0001, iter_time=7.64s]
Epoch 0: 1%| | 91/12384 [11:38<26:13:34, 7.68s/it, loss=10.9571, acc=0.0001, iter_time=7.64s]
Epoch 0: 1%| | 91/12384 [11:45<26:13:34, 7.68s/it, loss=10.6801, acc=0.0009, iter_time=7.60s]
Epoch 0: 1%| | 92/12384 [11:45<26:09:53, 7.66s/it, loss=10.6801, acc=0.0009, iter_time=7.60s]
Epoch 0: 1%| | 92/12384 [11:53<26:09:53, 7.66s/it, loss=12.3925, acc=0.0003, iter_time=5.89s]
Epoch 0: 1%| | 93/12384 [11:53<26:09:45, 7.66s/it, loss=12.3925, acc=0.0003, iter_time=5.89s]
Epoch 0: 1%| | 93/12384 [12:01<26:09:45, 7.66s/it, loss=10.8816, acc=0.0004, iter_time=9.39s]
Epoch 0: 1%| | 94/12384 [12:01<26:08:02, 7.66s/it, loss=10.8816, acc=0.0004, iter_time=9.39s]
Epoch 0: 1%| | 94/12384 [12:08<26:08:02, 7.66s/it, loss=12.1385, acc=0.0006, iter_time=6.20s]
Epoch 0: 1%| | 95/12384 [12:08<26:08:16, 7.66s/it, loss=12.1385, acc=0.0006, iter_time=6.20s]
Epoch 0: 1%| | 95/12384 [12:16<26:08:16, 7.66s/it, loss=12.2838, acc=0.0003, iter_time=9.09s]
Epoch 0: 1%| | 96/12384 [12:16<26:07:25, 7.65s/it, loss=12.2838, acc=0.0003, iter_time=9.09s]
Epoch 0: 1%| | 96/12384 [12:23<26:07:25, 7.65s/it, loss=12.4777, acc=0.0002, iter_time=4.85s]
Epoch 0: 1%| | 97/12384 [12:23<26:06:29, 7.65s/it, loss=12.4777, acc=0.0002, iter_time=4.85s]
Epoch 0: 1%| | 97/12384 [12:31<26:06:29, 7.65s/it, loss=11.9554, acc=0.0004, iter_time=10.47s]
Epoch 0: 1%| | 98/12384 [12:31<26:04:05, 7.64s/it, loss=11.9554, acc=0.0004, iter_time=10.47s]
Epoch 0: 1%| | 98/12384 [12:39<26:04:05, 7.64s/it, loss=10.9768, acc=0.0004, iter_time=7.63s]
Epoch 0: 1%| | 99/12384 [12:39<26:04:48, 7.64s/it, loss=10.9768, acc=0.0004, iter_time=7.63s]
Epoch 0: 1%| | 99/12384 [12:46<26:04:48, 7.64s/it, loss=10.7849, acc=0.0000, iter_time=8.05s]
Epoch 0: 1%| | 100/12384 [12:46<26:03:52, 7.64s/it, loss=10.7849, acc=0.0000, iter_time=8.05s]
Epoch 0: 1%| | 100/12384 [12:54<26:03:52, 7.64s/it, loss=11.4376, acc=0.0003, iter_time=7.24s]
Epoch 0: 1%| | 101/12384 [12:54<26:03:53, 7.64s/it, loss=11.4376, acc=0.0003, iter_time=7.24s]
Epoch 0: 1%| | 101/12384 [13:02<26:03:53, 7.64s/it, loss=11.4607, acc=0.0003, iter_time=7.64s]
Epoch 0: 1%| | 102/12384 [13:02<26:05:40, 7.65s/it, loss=11.4607, acc=0.0003, iter_time=7.64s]
Epoch 0: 1%| | 102/12384 [13:09<26:05:40, 7.65s/it, loss=11.0372, acc=0.0003, iter_time=7.66s]
Epoch 0: 1%| | 103/12384 [13:09<26:04:55, 7.65s/it, loss=11.0372, acc=0.0003, iter_time=7.66s]
Epoch 0: 1%| | 103/12384 [13:17<26:04:55, 7.65s/it, loss=11.2025, acc=0.0004, iter_time=8.03s]
Epoch 0: 1%| | 104/12384 [13:17<26:04:11, 7.64s/it, loss=11.2025, acc=0.0004, iter_time=8.03s]
Epoch 0: 1%| | 104/12384 [13:25<26:04:11, 7.64s/it, loss=12.3039, acc=0.0006, iter_time=4.90s]
Epoch 0: 1%| | 105/12384 [13:25<26:04:23, 7.64s/it, loss=12.3039, acc=0.0006, iter_time=4.90s]
Epoch 0: 1%| | 105/12384 [13:32<26:04:23, 7.64s/it, loss=10.6288, acc=0.0004, iter_time=9.11s]
Epoch 0: 1%| | 106/12384 [13:32<26:06:49, 7.66s/it, loss=10.6288, acc=0.0004, iter_time=9.11s]
Epoch 0: 1%| | 106/12384 [13:40<26:06:49, 7.66s/it, loss=11.4025, acc=0.0003, iter_time=8.57s]
Epoch 0: 1%| | 107/12384 [13:40<26:11:31, 7.68s/it, loss=11.4025, acc=0.0003, iter_time=8.57s]
Epoch 0: 1%| | 107/12384 [13:48<26:11:31, 7.68s/it, loss=10.4986, acc=0.0008, iter_time=7.75s]
Epoch 0: 1%| | 108/12384 [13:48<26:08:36, 7.67s/it, loss=10.4986, acc=0.0008, iter_time=7.75s]
Epoch 0: 1%| | 108/12384 [13:55<26:08:36, 7.67s/it, loss=10.0305, acc=0.0009, iter_time=7.62s]
Epoch 0: 1%| | 109/12384 [13:55<26:06:18, 7.66s/it, loss=10.0305, acc=0.0009, iter_time=7.62s]
Epoch 0: 1%| | 109/12384 [14:03<26:06:18, 7.66s/it, loss=10.4411, acc=0.0003, iter_time=7.66s]
Epoch 0: 1%| | 110/12384 [14:03<26:05:16, 7.65s/it, loss=10.4411, acc=0.0003, iter_time=7.66s]
Epoch 0: 1%| | 110/12384 [14:11<26:05:16, 7.65s/it, loss=11.6141, acc=0.0005, iter_time=7.70s]
Epoch 0: 1%| | 111/12384 [14:11<26:08:19, 7.67s/it, loss=11.6141, acc=0.0005, iter_time=7.70s]
Epoch 0: 1%| | 111/12384 [14:18<26:08:19, 7.67s/it, loss=11.2663, acc=0.0000, iter_time=8.01s]
Epoch 0: 1%| | 112/12384 [14:18<26:06:23, 7.66s/it, loss=11.2663, acc=0.0000, iter_time=8.01s]
Epoch 0: 1%| | 112/12384 [14:26<26:06:23, 7.66s/it, loss=11.4721, acc=0.0005, iter_time=5.13s]
Epoch 0: 1%| | 113/12384 [14:26<26:04:23, 7.65s/it, loss=11.4721, acc=0.0005, iter_time=5.13s]
Epoch 0: 1%| | 113/12384 [14:34<26:04:23, 7.65s/it, loss=11.8473, acc=0.0004, iter_time=6.20s]
Epoch 0: 1%| | 114/12384 [14:34<26:02:36, 7.64s/it, loss=11.8473, acc=0.0004, iter_time=6.20s]
Epoch 0: 1%| | 114/12384 [14:41<26:02:36, 7.64s/it, loss=11.5466, acc=0.0006, iter_time=7.83s]
Epoch 0: 1%| | 115/12384 [14:41<26:01:00, 7.63s/it, loss=11.5466, acc=0.0006, iter_time=7.83s]
Epoch 0: 1%| | 115/12384 [14:49<26:01:00, 7.63s/it, loss=11.3700, acc=0.0006, iter_time=10.94s]
Epoch 0: 1%| | 116/12384 [14:49<26:23:31, 7.74s/it, loss=11.3700, acc=0.0006, iter_time=10.94s]
Epoch 0: 1%| | 116/12384 [14:57<26:23:31, 7.74s/it, loss=10.0672, acc=0.0009, iter_time=8.01s]
Epoch 0: 1%| | 117/12384 [14:57<26:14:58, 7.70s/it, loss=10.0672, acc=0.0009, iter_time=8.01s]
Epoch 0: 1%| | 117/12384 [15:04<26:14:58, 7.70s/it, loss=10.2974, acc=0.0002, iter_time=7.60s]
Epoch 0: 1%| | 118/12384 [15:04<26:12:54, 7.69s/it, loss=10.2974, acc=0.0002, iter_time=7.60s]
Epoch 0: 1%| | 118/12384 [15:12<26:12:54, 7.69s/it, loss=11.7279, acc=0.0002, iter_time=6.46s]
Epoch 0: 1%| | 119/12384 [15:12<26:11:26, 7.69s/it, loss=11.7279, acc=0.0002, iter_time=6.46s]
Epoch 0: 1%| | 119/12384 [15:20<26:11:26, 7.69s/it, loss=9.5479, acc=0.0020, iter_time=9.27s]
Epoch 0: 1%| | 120/12384 [15:20<26:11:33, 7.69s/it, loss=9.5479, acc=0.0020, iter_time=9.27s]
Epoch 0: 1%| | 120/12384 [15:27<26:11:33, 7.69s/it, loss=11.3597, acc=0.0003, iter_time=7.29s]
Epoch 0: 1%| | 121/12384 [15:27<26:06:25, 7.66s/it, loss=11.3597, acc=0.0003, iter_time=7.29s]
Epoch 0: 1%| | 121/12384 [15:35<26:06:25, 7.66s/it, loss=10.2827, acc=0.0015, iter_time=7.62s]
Epoch 0: 1%| | 122/12384 [15:35<26:04:38, 7.66s/it, loss=10.2827, acc=0.0015, iter_time=7.62s]
Epoch 0: 1%| | 122/12384 [15:43<26:04:38, 7.66s/it, loss=11.4825, acc=0.0000, iter_time=4.05s]
Epoch 0: 1%| | 123/12384 [15:43<26:01:14, 7.64s/it, loss=11.4825, acc=0.0000, iter_time=4.05s]
Epoch 0: 1%| | 123/12384 [15:50<26:01:14, 7.64s/it, loss=10.4938, acc=0.0008, iter_time=11.19s]
Epoch 0: 1%| | 124/12384 [15:50<26:02:12, 7.65s/it, loss=10.4938, acc=0.0008, iter_time=11.19s]
Epoch 0: 1%| | 124/12384 [15:58<26:02:12, 7.65s/it, loss=10.7784, acc=0.0002, iter_time=7.65s]
Epoch 0: 1%| | 125/12384 [15:58<25:59:50, 7.63s/it, loss=10.7784, acc=0.0002, iter_time=7.65s]
Epoch 0: 1%| | 125/12384 [16:06<25:59:50, 7.63s/it, loss=11.1809, acc=0.0004, iter_time=4.00s]
Epoch 0: 1%| | 126/12384 [16:06<26:03:43, 7.65s/it, loss=11.1809, acc=0.0004, iter_time=4.00s]
Epoch 0: 1%| | 126/12384 [16:13<26:03:43, 7.65s/it, loss=9.8621, acc=0.0010, iter_time=11.32s]
Epoch 0: 1%| | 127/12384 [16:13<26:04:01, 7.66s/it, loss=9.8621, acc=0.0010, iter_time=11.32s]
Epoch 0: 1%| | 127/12384 [16:21<26:04:01, 7.66s/it, loss=9.6572, acc=0.0019, iter_time=8.05s]
Epoch 0: 1%| | 128/12384 [16:21<26:03:51, 7.66s/it, loss=9.6572, acc=0.0019, iter_time=8.05s]
Epoch 0: 1%| | 128/12384 [16:29<26:03:51, 7.66s/it, loss=9.7301, acc=0.0003, iter_time=7.26s]
Epoch 0: 1%| | 129/12384 [16:29<26:03:13, 7.65s/it, loss=9.7301, acc=0.0003, iter_time=7.26s]
Epoch 0: 1%| | 129/12384 [16:36<26:03:13, 7.65s/it, loss=11.0160, acc=0.0008, iter_time=4.07s]
Epoch 0: 1%| | 130/12384 [16:36<26:01:29, 7.65s/it, loss=11.0160, acc=0.0008, iter_time=4.07s]
Epoch 0: 1%| | 130/12384 [16:44<26:01:29, 7.65s/it, loss=10.1317, acc=0.0012, iter_time=11.20s]
Epoch 0: 1%| | 131/12384 [16:44<25:58:40, 7.63s/it, loss=10.1317, acc=0.0012, iter_time=11.20s]
Epoch 0: 1%| | 131/12384 [16:51<25:58:40, 7.63s/it, loss=10.1372, acc=0.0007, iter_time=7.62s]
Epoch 0: 1%| | 132/12384 [16:51<25:58:53, 7.63s/it, loss=10.1372, acc=0.0007, iter_time=7.62s]
Epoch 0: 1%| | 132/12384 [16:59<25:58:53, 7.63s/it, loss=11.0534, acc=0.0004, iter_time=7.64s]
Epoch 0: 1%| | 133/12384 [16:59<25:57:38, 7.63s/it, loss=11.0534, acc=0.0004, iter_time=7.64s]
Epoch 0: 1%| | 133/12384 [17:07<25:57:38, 7.63s/it, loss=10.4665, acc=0.0001, iter_time=7.62s]
Epoch 0: 1%| | 134/12384 [17:07<25:57:10, 7.63s/it, loss=10.4665, acc=0.0001, iter_time=7.62s]
Epoch 0: 1%| | 134/12384 [17:14<25:57:10, 7.63s/it, loss=10.1935, acc=0.0002, iter_time=7.61s]
Epoch 0: 1%| | 135/12384 [17:14<25:57:13, 7.63s/it, loss=10.1935, acc=0.0002, iter_time=7.61s]
Epoch 0: 1%| | 135/12384 [17:22<25:57:13, 7.63s/it, loss=10.0622, acc=0.0014, iter_time=8.00s]
Epoch 0: 1%| | 136/12384 [17:22<25:55:40, 7.62s/it, loss=10.0622, acc=0.0014, iter_time=8.00s]
Epoch 0: 1%| | 136/12384 [17:30<25:55:40, 7.62s/it, loss=9.8737, acc=0.0004, iter_time=7.23s]
Epoch 0: 1%| | 137/12384 [17:30<25:55:40, 7.62s/it, loss=9.8737, acc=0.0004, iter_time=7.23s]
Epoch 0: 1%| | 137/12384 [17:37<25:55:40, 7.62s/it, loss=9.8373, acc=0.0002, iter_time=7.60s]
Epoch 0: 1%| | 138/12384 [17:37<25:57:43, 7.63s/it, loss=9.8373, acc=0.0002, iter_time=7.60s]
Epoch 0: 1%| | 138/12384 [17:45<25:57:43, 7.63s/it, loss=11.1797, acc=0.0004, iter_time=5.42s]
Epoch 0: 1%| | 139/12384 [17:45<25:57:27, 7.63s/it, loss=11.1797, acc=0.0004, iter_time=5.42s]
Epoch 0: 1%| | 139/12384 [17:52<25:57:27, 7.63s/it, loss=10.2283, acc=0.0009, iter_time=9.90s]
Epoch 0: 1%| | 140/12384 [17:52<25:57:42, 7.63s/it, loss=10.2283, acc=0.0009, iter_time=9.90s]
Epoch 0: 1%| | 140/12384 [18:00<25:57:42, 7.63s/it, loss=9.6406, acc=0.0007, iter_time=7.62s]
Epoch 0: 1%| | 141/12384 [18:00<25:56:35, 7.63s/it, loss=9.6406, acc=0.0007, iter_time=7.62s]
Epoch 0: 1%| | 141/12384 [18:08<25:56:35, 7.63s/it, loss=9.4581, acc=0.0005, iter_time=7.94s]
Epoch 0: 1%| | 142/12384 [18:08<26:15:45, 7.72s/it, loss=9.4581, acc=0.0005, iter_time=7.94s]
Epoch 0: 1%| | 142/12384 [18:16<26:15:45, 7.72s/it, loss=10.2313, acc=0.0004, iter_time=7.64s]
Epoch 0: 1%| | 143/12384 [18:16<26:10:37, 7.70s/it, loss=10.2313, acc=0.0004, iter_time=7.64s]
Epoch 0: 1%| | 143/12384 [18:23<26:10:37, 7.70s/it, loss=10.6638, acc=0.0008, iter_time=8.01s]
Epoch 0: 1%| | 144/12384 [18:23<26:04:59, 7.67s/it, loss=10.6638, acc=0.0008, iter_time=8.01s]
Epoch 0: 1%| | 144/12384 [18:31<26:04:59, 7.67s/it, loss=10.3811, acc=0.0003, iter_time=5.72s]
Epoch 0: 1%| | 145/12384 [18:31<26:04:45, 7.67s/it, loss=10.3811, acc=0.0003, iter_time=5.72s]
Epoch 0: 1%| | 145/12384 [18:39<26:04:45, 7.67s/it, loss=10.4208, acc=0.0005, iter_time=7.06s]
Epoch 0: 1%| | 146/12384 [18:39<26:03:27, 7.67s/it, loss=10.4208, acc=0.0005, iter_time=7.06s]
Epoch 0: 1%| | 146/12384 [18:46<26:03:27, 7.67s/it, loss=10.2973, acc=0.0005, iter_time=9.76s]
Epoch 0: 1%| | 147/12384 [18:46<26:03:35, 7.67s/it, loss=10.2973, acc=0.0005, iter_time=9.76s]
Epoch 0: 1%| | 147/12384 [18:54<26:03:35, 7.67s/it, loss=10.8811, acc=0.0005, iter_time=5.57s]
Epoch 0: 1%| | 148/12384 [18:54<26:01:39, 7.66s/it, loss=10.8811, acc=0.0005, iter_time=5.57s]
Epoch 0: 1%| | 148/12384 [19:02<26:01:39, 7.66s/it, loss=9.8736, acc=0.0004, iter_time=9.75s]
Epoch 0: 1%| | 149/12384 [19:02<26:01:06, 7.66s/it, loss=9.8736, acc=0.0004, iter_time=9.75s]
Epoch 0: 1%| | 149/12384 [19:09<26:01:06, 7.66s/it, loss=9.4176, acc=0.0008, iter_time=8.07s]
Epoch 0: 1%| | 150/12384 [19:09<25:59:58, 7.65s/it, loss=9.4176, acc=0.0008, iter_time=8.07s]
Epoch 0: 1%| | 150/12384 [19:17<25:59:58, 7.65s/it, loss=9.5935, acc=0.0012, iter_time=7.24s]
Epoch 0: 1%| | 151/12384 [19:17<26:00:40, 7.65s/it, loss=9.5935, acc=0.0012, iter_time=7.24s]
Epoch 0: 1%| | 151/12384 [19:24<26:00:40, 7.65s/it, loss=10.0799, acc=0.0001, iter_time=8.03s]
Epoch 0: 1%| | 152/12384 [19:24<25:57:28, 7.64s/it, loss=10.0799, acc=0.0001, iter_time=8.03s]
Epoch 0: 1%| | 152/12384 [19:32<25:57:28, 7.64s/it, loss=10.7032, acc=0.0000, iter_time=5.11s]
Epoch 0: 1%| | 153/12384 [19:32<25:58:43, 7.65s/it, loss=10.7032, acc=0.0000, iter_time=5.11s]
Epoch 0: 1%| | 153/12384 [19:40<25:58:43, 7.65s/it, loss=11.3994, acc=0.0005, iter_time=7.22s]
Epoch 0: 1%| | 154/12384 [19:40<25:57:32, 7.64s/it, loss=11.3994, acc=0.0005, iter_time=7.22s]
Epoch 0: 1%| | 154/12384 [19:47<25:57:32, 7.64s/it, loss=9.8630, acc=0.0006, iter_time=9.57s]
Epoch 0: 1%|▏ | 155/12384 [19:47<25:57:18, 7.64s/it, loss=9.8630, acc=0.0006, iter_time=9.57s]
Epoch 0: 1%|▏ | 155/12384 [19:55<25:57:18, 7.64s/it, loss=9.9163, acc=0.0012, iter_time=4.86s]
Epoch 0: 1%|▏ | 156/12384 [19:55<25:54:38, 7.63s/it, loss=9.9163, acc=0.0012, iter_time=4.86s]
Epoch 0: 1%|▏ | 156/12384 [20:03<25:54:38, 7.63s/it, loss=10.2178, acc=0.0009, iter_time=10.06s]
Epoch 0: 1%|▏ | 157/12384 [20:03<25:54:09, 7.63s/it, loss=10.2178, acc=0.0009, iter_time=10.06s]
Epoch 0: 1%|▏ | 157/12384 [20:10<25:54:09, 7.63s/it, loss=8.8109, acc=0.0006, iter_time=8.55s]
Epoch 0: 1%|▏ | 158/12384 [20:10<25:54:06, 7.63s/it, loss=8.8109, acc=0.0006, iter_time=8.55s]
Epoch 0: 1%|▏ | 158/12384 [20:18<25:54:06, 7.63s/it, loss=9.9846, acc=0.0005, iter_time=7.64s]
Epoch 0: 1%|▏ | 159/12384 [20:18<25:54:16, 7.63s/it, loss=9.9846, acc=0.0005, iter_time=7.64s]
Epoch 0: 1%|▏ | 159/12384 [20:26<25:54:16, 7.63s/it, loss=10.0358, acc=0.0004, iter_time=8.01s]
Epoch 0: 1%|▏ | 160/12384 [20:26<25:54:33, 7.63s/it, loss=10.0358, acc=0.0004, iter_time=8.01s]
Epoch 0: 1%|▏ | 160/12384 [20:33<25:54:33, 7.63s/it, loss=10.1687, acc=0.0002, iter_time=4.45s]
Epoch 0: 1%|▏ | 161/12384 [20:33<25:56:01, 7.64s/it, loss=10.1687, acc=0.0002, iter_time=4.45s]
Epoch 0: 1%|▏ | 161/12384 [20:41<25:56:01, 7.64s/it, loss=9.5081, acc=0.0001, iter_time=9.61s]
Epoch 0: 1%|▏ | 162/12384 [20:41<25:55:16, 7.64s/it, loss=9.5081, acc=0.0001, iter_time=9.61s]
Epoch 0: 1%|▏ | 162/12384 [20:48<25:55:16, 7.64s/it, loss=10.1441, acc=0.0009, iter_time=8.48s]
Epoch 0: 1%|▏ | 163/12384 [20:48<25:54:59, 7.63s/it, loss=10.1441, acc=0.0009, iter_time=8.48s]
Epoch 0: 1%|▏ | 163/12384 [20:56<25:54:59, 7.63s/it, loss=9.8535, acc=0.0006, iter_time=5.60s]
Epoch 0: 1%|▏ | 164/12384 [20:56<25:56:47, 7.64s/it, loss=9.8535, acc=0.0006, iter_time=5.60s]
Epoch 0: 1%|▏ | 164/12384 [21:04<25:56:47, 7.64s/it, loss=9.5386, acc=0.0011, iter_time=8.18s]
Epoch 0: 1%|▏ | 165/12384 [21:04<25:54:40, 7.63s/it, loss=9.5386, acc=0.0011, iter_time=8.18s]
Epoch 0: 1%|▏ | 165/12384 [21:11<25:54:40, 7.63s/it, loss=10.1718, acc=0.0001, iter_time=7.61s]
Epoch 0: 1%|▏ | 166/12384 [21:11<25:54:19, 7.63s/it, loss=10.1718, acc=0.0001, iter_time=7.61s]
Epoch 0: 1%|▏ | 166/12384 [21:19<25:54:19, 7.63s/it, loss=9.0794, acc=0.0002, iter_time=9.46s]
Epoch 0: 1%|▏ | 167/12384 [21:19<26:16:06, 7.74s/it, loss=9.0794, acc=0.0002, iter_time=9.46s]
Epoch 0: 1%|▏ | 167/12384 [21:27<26:16:06, 7.74s/it, loss=10.0714, acc=0.0000, iter_time=7.65s]
Epoch 0: 1%|▏ | 168/12384 [21:27<26:09:28, 7.71s/it, loss=10.0714, acc=0.0000, iter_time=7.65s]
Epoch 0: 1%|▏ | 168/12384 [21:35<26:09:28, 7.71s/it, loss=9.7891, acc=0.0004, iter_time=4.80s]
Epoch 0: 1%|▏ | 169/12384 [21:35<26:03:41, 7.68s/it, loss=9.7891, acc=0.0004, iter_time=4.80s]
Epoch 0: 1%|▏ | 169/12384 [21:42<26:03:41, 7.68s/it, loss=11.7103, acc=0.0006, iter_time=7.71s]
Epoch 0: 1%|▏ | 170/12384 [21:42<26:02:47, 7.68s/it, loss=11.7103, acc=0.0006, iter_time=7.71s]
Epoch 0: 1%|▏ | 170/12384 [21:50<26:02:47, 7.68s/it, loss=9.3130, acc=0.0011, iter_time=10.46s]
Epoch 0: 1%|▏ | 171/12384 [21:50<26:03:50, 7.68s/it, loss=9.3130, acc=0.0011, iter_time=10.46s]
Epoch 0: 1%|▏ | 171/12384 [21:58<26:03:50, 7.68s/it, loss=9.5550, acc=0.0006, iter_time=7.13s]
Epoch 0: 1%|▏ | 172/12384 [21:58<26:04:05, 7.68s/it, loss=9.5550, acc=0.0006, iter_time=7.13s]
Epoch 0: 1%|▏ | 172/12384 [22:05<26:04:05, 7.68s/it, loss=8.9668, acc=0.0003, iter_time=8.24s]
Epoch 0: 1%|▏ | 173/12384 [22:05<26:01:45, 7.67s/it, loss=8.9668, acc=0.0003, iter_time=8.24s]
Epoch 0: 1%|▏ | 173/12384 [22:13<26:01:45, 7.67s/it, loss=11.1200, acc=0.0010, iter_time=6.44s]
Epoch 0: 1%|▏ | 174/12384 [22:13<26:01:11, 7.67s/it, loss=11.1200, acc=0.0010, iter_time=6.44s]
Epoch 0: 1%|▏ | 174/12384 [22:21<26:01:11, 7.67s/it, loss=9.4657, acc=0.0002, iter_time=7.11s]
Epoch 0: 1%|▏ | 175/12384 [22:21<25:58:09, 7.66s/it, loss=9.4657, acc=0.0002, iter_time=7.11s]
Epoch 0: 1%|▏ | 175/12384 [22:28<25:58:09, 7.66s/it, loss=9.2463, acc=0.0005, iter_time=9.79s]
Epoch 0: 1%|▏ | 176/12384 [22:28<25:56:57, 7.65s/it, loss=9.2463, acc=0.0005, iter_time=9.79s]
Epoch 0: 1%|▏ | 176/12384 [22:36<25:56:57, 7.65s/it, loss=9.1595, acc=0.0007, iter_time=7.24s]
Epoch 0: 1%|▏ | 177/12384 [22:36<25:54:34, 7.64s/it, loss=9.1595, acc=0.0007, iter_time=7.24s]
Epoch 0: 1%|▏ | 177/12384 [22:43<25:54:34, 7.64s/it, loss=9.4691, acc=0.0010, iter_time=5.81s]
Epoch 0: 1%|▏ | 178/12384 [22:43<25:51:50, 7.63s/it, loss=9.4691, acc=0.0010, iter_time=5.81s]
Epoch 0: 1%|▏ | 178/12384 [22:51<25:51:50, 7.63s/it, loss=9.2089, acc=0.0009, iter_time=9.41s]
Epoch 0: 1%|▏ | 179/12384 [22:51<25:54:16, 7.64s/it, loss=9.2089, acc=0.0009, iter_time=9.41s]
Epoch 0: 1%|▏ | 179/12384 [22:59<25:54:16, 7.64s/it, loss=9.3071, acc=0.0003, iter_time=7.67s]
Epoch 0: 1%|▏ | 180/12384 [22:59<25:52:58, 7.64s/it, loss=9.3071, acc=0.0003, iter_time=7.67s]
Epoch 0: 1%|▏ | 180/12384 [23:06<25:52:58, 7.64s/it, loss=9.2088, acc=0.0019, iter_time=7.62s]
Epoch 0: 1%|▏ | 181/12384 [23:06<25:53:54, 7.64s/it, loss=9.2088, acc=0.0019, iter_time=7.62s]
Epoch 0: 1%|▏ | 181/12384 [23:14<25:53:54, 7.64s/it, loss=9.0347, acc=0.0000, iter_time=5.58s]
Epoch 0: 1%|▏ | 182/12384 [23:14<25:53:41, 7.64s/it, loss=9.0347, acc=0.0000, iter_time=5.58s]
Epoch 0: 1%|▏ | 182/12384 [23:22<25:53:41, 7.64s/it, loss=8.9288, acc=0.0003, iter_time=7.97s]
Epoch 0: 1%|▏ | 183/12384 [23:22<25:55:01, 7.65s/it, loss=8.9288, acc=0.0003, iter_time=7.97s]
Epoch 0: 1%|▏ | 183/12384 [23:29<25:55:01, 7.65s/it, loss=9.0327, acc=0.0004, iter_time=9.80s]
Epoch 0: 1%|▏ | 184/12384 [23:29<25:55:15, 7.65s/it, loss=9.0327, acc=0.0004, iter_time=9.80s]
Epoch 0: 1%|▏ | 184/12384 [23:37<25:55:15, 7.65s/it, loss=9.1654, acc=0.0003, iter_time=7.26s]
Epoch 0: 1%|▏ | 185/12384 [23:37<25:55:05, 7.65s/it, loss=9.1654, acc=0.0003, iter_time=7.26s]
Epoch 0: 1%|▏ | 185/12384 [23:45<25:55:05, 7.65s/it, loss=8.8745, acc=0.0000, iter_time=4.37s]
Epoch 0: 2%|▏ | 186/12384 [23:45<25:59:27, 7.67s/it, loss=8.8745, acc=0.0000, iter_time=4.37s]
Epoch 0: 2%|▏ | 186/12384 [23:52<25:59:27, 7.67s/it, loss=8.9560, acc=0.0007, iter_time=11.00s]
Epoch 0: 2%|▏ | 187/12384 [23:52<25:56:24, 7.66s/it, loss=8.9560, acc=0.0007, iter_time=11.00s]
Epoch 0: 2%|▏ | 187/12384 [24:00<25:56:24, 7.66s/it, loss=8.7837, acc=0.0015, iter_time=7.64s]
Epoch 0: 2%|▏ | 188/12384 [24:00<25:59:04, 7.67s/it, loss=8.7837, acc=0.0015, iter_time=7.64s]
Epoch 0: 2%|▏ | 188/12384 [24:08<25:59:04, 7.67s/it, loss=9.0256, acc=0.0023, iter_time=5.96s]
Epoch 0: 2%|▏ | 189/12384 [24:08<25:57:07, 7.66s/it, loss=9.0256, acc=0.0023, iter_time=5.96s]
Epoch 0: 2%|▏ | 189/12384 [24:15<25:57:07, 7.66s/it, loss=9.4618, acc=0.0007, iter_time=9.04s]
Epoch 0: 2%|▏ | 190/12384 [24:15<25:56:23, 7.66s/it, loss=9.4618, acc=0.0007, iter_time=9.04s]
Epoch 0: 2%|▏ | 190/12384 [24:23<25:56:23, 7.66s/it, loss=8.8491, acc=0.0006, iter_time=7.97s]
Epoch 0: 2%|▏ | 191/12384 [24:23<25:54:09, 7.65s/it, loss=8.8491, acc=0.0006, iter_time=7.97s]
Epoch 0: 2%|▏ | 191/12384 [24:31<25:54:09, 7.65s/it, loss=9.3567, acc=0.0000, iter_time=7.60s]
Epoch 0: 2%|▏ | 192/12384 [24:31<25:54:00, 7.65s/it, loss=9.3567, acc=0.0000, iter_time=7.60s]
Epoch 0: 2%|▏ | 192/12384 [24:39<25:54:00, 7.65s/it, loss=8.7066, acc=0.0010, iter_time=7.97s]
Epoch 0: 2%|▏ | 193/12384 [24:39<26:13:47, 7.75s/it, loss=8.7066, acc=0.0010, iter_time=7.97s]
Epoch 0: 2%|▏ | 193/12384 [24:46<26:13:47, 7.75s/it, loss=9.0475, acc=0.0007, iter_time=7.68s]
Epoch 0: 2%|▏ | 194/12384 [24:46<26:08:06, 7.72s/it, loss=9.0475, acc=0.0007, iter_time=7.68s]
Epoch 0: 2%|▏ | 194/12384 [24:54<26:08:06, 7.72s/it, loss=9.0842, acc=0.0005, iter_time=5.57s]
Epoch 0: 2%|▏ | 195/12384 [24:54<26:03:40, 7.70s/it, loss=9.0842, acc=0.0005, iter_time=5.57s]
Epoch 0: 2%|▏ | 195/12384 [25:01<26:03:40, 7.70s/it, loss=8.1855, acc=0.0004, iter_time=9.71s]
Epoch 0: 2%|▏ | 196/12384 [25:01<25:59:19, 7.68s/it, loss=8.1855, acc=0.0004, iter_time=9.71s]
Epoch 0: 2%|▏ | 196/12384 [25:09<25:59:19, 7.68s/it, loss=8.0778, acc=0.0012, iter_time=7.63s]
Epoch 0: 2%|▏ | 197/12384 [25:09<25:55:00, 7.66s/it, loss=8.0778, acc=0.0012, iter_time=7.63s]
Epoch 0: 2%|▏ | 197/12384 [25:17<25:55:00, 7.66s/it, loss=8.8967, acc=0.0010, iter_time=7.35s]
Epoch 0: 2%|▏ | 198/12384 [25:17<25:59:45, 7.68s/it, loss=8.8967, acc=0.0010, iter_time=7.35s]
Epoch 0: 2%|▏ | 198/12384 [25:24<25:59:45, 7.68s/it, loss=9.0389, acc=0.0004, iter_time=7.99s]
Epoch 0: 2%|▏ | 199/12384 [25:24<25:55:17, 7.66s/it, loss=9.0389, acc=0.0004, iter_time=7.99s]
Epoch 0: 2%|▏ | 199/12384 [25:32<25:55:17, 7.66s/it, loss=9.1124, acc=0.0009, iter_time=8.07s]
Epoch 0: 2%|▏ | 200/12384 [25:32<25:55:07, 7.66s/it, loss=9.1124, acc=0.0009, iter_time=8.07s]
Epoch 0: 2%|▏ | 200/12384 [25:40<25:55:07, 7.66s/it, loss=8.4466, acc=0.0007, iter_time=6.24s]
Epoch 0: 2%|▏ | 201/12384 [25:40<25:53:28, 7.65s/it, loss=8.4466, acc=0.0007, iter_time=6.24s]
Epoch 0: 2%|▏ | 201/12384 [25:47<25:53:28, 7.65s/it, loss=8.7056, acc=0.0011, iter_time=8.61s]
Epoch 0: 2%|▏ | 202/12384 [25:47<25:52:45, 7.65s/it, loss=8.7056, acc=0.0011, iter_time=8.61s]
Epoch 0: 2%|▏ | 202/12384 [25:55<25:52:45, 7.65s/it, loss=8.5991, acc=0.0011, iter_time=7.66s]
Epoch 0: 2%|▏ | 203/12384 [25:55<25:51:32, 7.64s/it, loss=8.5991, acc=0.0011, iter_time=7.66s]
Epoch 0: 2%|▏ | 203/12384 [26:03<25:51:32, 7.64s/it, loss=8.7091, acc=0.0012, iter_time=7.30s]
Epoch 0: 2%|▏ | 204/12384 [26:03<25:49:56, 7.64s/it, loss=8.7091, acc=0.0012, iter_time=7.30s]
Epoch 0: 2%|▏ | 204/12384 [26:10<25:49:56, 7.64s/it, loss=8.7888, acc=0.0019, iter_time=7.01s]
Epoch 0: 2%|▏ | 205/12384 [26:10<25:52:18, 7.65s/it, loss=8.7888, acc=0.0019, iter_time=7.01s]
Epoch 0: 2%|▏ | 205/12384 [26:18<25:52:18, 7.65s/it, loss=9.4526, acc=0.0002, iter_time=5.57s]
Epoch 0: 2%|▏ | 206/12384 [26:18<25:52:19, 7.65s/it, loss=9.4526, acc=0.0002, iter_time=5.57s]
Epoch 0: 2%|▏ | 206/12384 [26:26<25:52:19, 7.65s/it, loss=8.4342, acc=0.0012, iter_time=10.67s]
Epoch 0: 2%|▏ | 207/12384 [26:26<25:50:36, 7.64s/it, loss=8.4342, acc=0.0012, iter_time=10.67s]
Epoch 0: 2%|▏ | 207/12384 [26:33<25:50:36, 7.64s/it, loss=8.3416, acc=0.0008, iter_time=7.58s]
Epoch 0: 2%|▏ | 208/12384 [26:33<25:48:59, 7.63s/it, loss=8.3416, acc=0.0008, iter_time=7.58s]
Epoch 0: 2%|▏ | 208/12384 [26:41<25:48:59, 7.63s/it, loss=8.3990, acc=0.0019, iter_time=5.93s]
Epoch 0: 2%|▏ | 209/12384 [26:41<25:47:45, 7.63s/it, loss=8.3990, acc=0.0019, iter_time=5.93s]
Epoch 0: 2%|▏ | 209/12384 [26:48<25:47:45, 7.63s/it, loss=8.1943, acc=0.0015, iter_time=6.07s]
Epoch 0: 2%|▏ | 210/12384 [26:48<25:47:02, 7.62s/it, loss=8.1943, acc=0.0015, iter_time=6.07s]
Epoch 0: 2%|▏ | 210/12384 [26:56<25:47:02, 7.62s/it, loss=8.5613, acc=0.0008, iter_time=10.91s]
Epoch 0: 2%|▏ | 211/12384 [26:56<25:49:23, 7.64s/it, loss=8.5613, acc=0.0008, iter_time=10.91s]
Epoch 0: 2%|▏ | 211/12384 [27:04<25:49:23, 7.64s/it, loss=8.1708, acc=0.0016, iter_time=7.68s]
Epoch 0: 2%|▏ | 212/12384 [27:04<25:50:05, 7.64s/it, loss=8.1708, acc=0.0016, iter_time=7.68s]
Epoch 0: 2%|▏ | 212/12384 [27:11<25:50:05, 7.64s/it, loss=8.1459, acc=0.0007, iter_time=7.64s]
Epoch 0: 2%|▏ | 213/12384 [27:11<25:48:42, 7.63s/it, loss=8.1459, acc=0.0007, iter_time=7.64s]
Epoch 0: 2%|▏ | 213/12384 [27:19<25:48:42, 7.63s/it, loss=8.5384, acc=0.0014, iter_time=4.30s]
Epoch 0: 2%|▏ | 214/12384 [27:19<25:48:03, 7.63s/it, loss=8.5384, acc=0.0014, iter_time=4.30s]
Epoch 0: 2%|▏ | 214/12384 [27:27<25:48:03, 7.63s/it, loss=8.1967, acc=0.0009, iter_time=10.94s]
Epoch 0: 2%|▏ | 215/12384 [27:27<25:47:52, 7.63s/it, loss=8.1967, acc=0.0009, iter_time=10.94s]
Epoch 0: 2%|▏ | 215/12384 [27:34<25:47:52, 7.63s/it, loss=9.2198, acc=0.0004, iter_time=7.59s]
Epoch 0: 2%|▏ | 216/12384 [27:34<25:46:40, 7.63s/it, loss=9.2198, acc=0.0004, iter_time=7.59s]
Epoch 0: 2%|▏ | 216/12384 [27:42<25:46:40, 7.63s/it, loss=8.2690, acc=0.0009, iter_time=4.80s]
Epoch 0: 2%|▏ | 217/12384 [27:42<25:47:47, 7.63s/it, loss=8.2690, acc=0.0009, iter_time=4.80s]
Epoch 0: 2%|▏ | 217/12384 [27:50<25:47:47, 7.63s/it, loss=7.8197, acc=0.0006, iter_time=8.26s]
Epoch 0: 2%|▏ | 218/12384 [27:50<25:50:16, 7.65s/it, loss=7.8197, acc=0.0006, iter_time=8.26s]
Epoch 0: 2%|▏ | 218/12384 [27:58<25:50:16, 7.65s/it, loss=8.0925, acc=0.0007, iter_time=10.22s]
Epoch 0: 2%|▏ | 219/12384 [27:58<26:11:49, 7.75s/it, loss=8.0925, acc=0.0007, iter_time=10.22s]
Epoch 0: 2%|▏ | 219/12384 [28:05<26:11:49, 7.75s/it, loss=8.1300, acc=0.0019, iter_time=7.70s]
Epoch 0: 2%|▏ | 220/12384 [28:05<26:02:22, 7.71s/it, loss=8.1300, acc=0.0019, iter_time=7.70s]
Epoch 0: 2%|▏ | 220/12384 [28:13<26:02:22, 7.71s/it, loss=7.9561, acc=0.0015, iter_time=7.61s]
Epoch 0: 2%|▏ | 221/12384 [28:13<25:56:33, 7.68s/it, loss=7.9561, acc=0.0015, iter_time=7.61s]
Epoch 0: 2%|▏ | 221/12384 [28:20<25:56:33, 7.68s/it, loss=8.0051, acc=0.0010, iter_time=7.60s]
Epoch 0: 2%|▏ | 222/12384 [28:20<25:55:49, 7.68s/it, loss=8.0051, acc=0.0010, iter_time=7.60s]
Epoch 0: 2%|▏ | 222/12384 [28:28<25:55:49, 7.68s/it, loss=8.2760, acc=0.0003, iter_time=7.68s]
Epoch 0: 2%|▏ | 223/12384 [28:28<25:54:58, 7.67s/it, loss=8.2760, acc=0.0003, iter_time=7.68s]
Epoch 0: 2%|▏ | 223/12384 [28:36<25:54:58, 7.67s/it, loss=8.1733, acc=0.0003, iter_time=8.06s]
Epoch 0: 2%|▏ | 224/12384 [28:36<25:54:30, 7.67s/it, loss=8.1733, acc=0.0003, iter_time=8.06s]
Epoch 0: 2%|▏ | 224/12384 [28:43<25:54:30, 7.67s/it, loss=8.0470, acc=0.0007, iter_time=7.27s]
Epoch 0: 2%|▏ | 225/12384 [28:43<25:50:46, 7.65s/it, loss=8.0470, acc=0.0007, iter_time=7.27s]
Epoch 0: 2%|▏ | 225/12384 [28:51<25:50:46, 7.65s/it, loss=7.5724, acc=0.0013, iter_time=7.62s]
Epoch 0: 2%|▏ | 226/12384 [28:51<25:48:04, 7.64s/it, loss=7.5724, acc=0.0013, iter_time=7.62s]
Epoch 0: 2%|▏ | 226/12384 [28:59<25:48:04, 7.64s/it, loss=8.4081, acc=0.0011, iter_time=6.12s]
Epoch 0: 2%|▏ | 227/12384 [28:59<25:48:26, 7.64s/it, loss=8.4081, acc=0.0011, iter_time=6.12s]
Epoch 0: 2%|▏ | 227/12384 [29:06<25:48:26, 7.64s/it, loss=8.6103, acc=0.0008, iter_time=9.11s]
Epoch 0: 2%|▏ | 228/12384 [29:06<25:46:50, 7.63s/it, loss=8.6103, acc=0.0008, iter_time=9.11s]
Epoch 0: 2%|▏ | 228/12384 [29:14<25:46:50, 7.63s/it, loss=7.8253, acc=0.0011, iter_time=7.64s]
Epoch 0: 2%|▏ | 229/12384 [29:14<25:47:33, 7.64s/it, loss=7.8253, acc=0.0011, iter_time=7.64s]
Epoch 0: 2%|▏ | 229/12384 [29:21<25:47:33, 7.64s/it, loss=8.3221, acc=0.0004, iter_time=7.64s]
Epoch 0: 2%|▏ | 230/12384 [29:21<25:45:26, 7.63s/it, loss=8.3221, acc=0.0004, iter_time=7.64s]
Epoch 0: 2%|▏ | 230/12384 [29:29<25:45:26, 7.63s/it, loss=7.7024, acc=0.0009, iter_time=7.58s]
Epoch 0: 2%|▏ | 231/12384 [29:29<25:44:38, 7.63s/it, loss=7.7024, acc=0.0009, iter_time=7.58s]
Epoch 0: 2%|▏ | 231/12384 [29:37<25:44:38, 7.63s/it, loss=7.7472, acc=0.0008, iter_time=8.02s]
Epoch 0: 2%|▏ | 232/12384 [29:37<25:47:42, 7.64s/it, loss=7.7472, acc=0.0008, iter_time=8.02s]
Epoch 0: 2%|▏ | 232/12384 [29:44<25:47:42, 7.64s/it, loss=7.7262, acc=0.0011, iter_time=7.31s]
Epoch 0: 2%|▏ | 233/12384 [29:44<25:48:58, 7.65s/it, loss=7.7262, acc=0.0011, iter_time=7.31s]
Epoch 0: 2%|▏ | 233/12384 [29:52<25:48:58, 7.65s/it, loss=7.4931, acc=0.0028, iter_time=7.41s]
Epoch 0: 2%|▏ | 234/12384 [29:52<25:50:21, 7.66s/it, loss=7.4931, acc=0.0028, iter_time=7.41s]
Epoch 0: 2%|▏ | 234/12384 [30:00<25:50:21, 7.66s/it, loss=7.4022, acc=0.0014, iter_time=7.93s]
Epoch 0: 2%|▏ | 235/12384 [30:00<25:48:15, 7.65s/it, loss=7.4022, acc=0.0014, iter_time=7.93s]
Epoch 0: 2%|▏ | 235/12384 [30:07<25:48:15, 7.65s/it, loss=7.7223, acc=0.0014, iter_time=7.59s]
Epoch 0: 2%|▏ | 236/12384 [30:07<25:45:43, 7.63s/it, loss=7.7223, acc=0.0014, iter_time=7.59s]
Epoch 0: 2%|▏ | 236/12384 [30:15<25:45:43, 7.63s/it, loss=7.8947, acc=0.0015, iter_time=4.31s]
Epoch 0: 2%|▏ | 237/12384 [30:15<25:46:15, 7.64s/it, loss=7.8947, acc=0.0015, iter_time=4.31s]
Epoch 0: 2%|▏ | 237/12384 [30:23<25:46:15, 7.64s/it, loss=7.7654, acc=0.0010, iter_time=9.74s]
Epoch 0: 2%|▏ | 238/12384 [30:23<25:47:31, 7.64s/it, loss=7.7654, acc=0.0010, iter_time=9.74s]
Epoch 0: 2%|▏ | 238/12384 [30:30<25:47:31, 7.64s/it, loss=7.4437, acc=0.0005, iter_time=8.88s]
Epoch 0: 2%|▏ | 239/12384 [30:30<25:47:04, 7.64s/it, loss=7.4437, acc=0.0005, iter_time=8.88s]
Epoch 0: 2%|▏ | 239/12384 [30:38<25:47:04, 7.64s/it, loss=7.7818, acc=0.0017, iter_time=7.71s]
Epoch 0: 2%|▏ | 240/12384 [30:38<25:47:28, 7.65s/it, loss=7.7818, acc=0.0017, iter_time=7.71s]
Epoch 0: 2%|▏ | 240/12384 [30:46<25:47:28, 7.65s/it, loss=7.3091, acc=0.0018, iter_time=7.57s]
Epoch 0: 2%|▏ | 241/12384 [30:46<25:48:50, 7.65s/it, loss=7.3091, acc=0.0018, iter_time=7.57s]
Epoch 0: 2%|▏ | 241/12384 [30:53<25:48:50, 7.65s/it, loss=7.3295, acc=0.0004, iter_time=7.66s]
Epoch 0: 2%|▏ | 242/12384 [30:53<25:47:11, 7.65s/it, loss=7.3295, acc=0.0004, iter_time=7.66s]
Epoch 0: 2%|▏ | 242/12384 [31:01<25:47:11, 7.65s/it, loss=7.2502, acc=0.0021, iter_time=5.10s]
Epoch 0: 2%|▏ | 243/12384 [31:01<25:47:23, 7.65s/it, loss=7.2502, acc=0.0021, iter_time=5.10s]
Epoch 0: 2%|▏ | 243/12384 [31:09<25:47:23, 7.65s/it, loss=7.8696, acc=0.0010, iter_time=10.20s]
Epoch 0: 2%|▏ | 244/12384 [31:09<25:45:32, 7.64s/it, loss=7.8696, acc=0.0010, iter_time=10.20s]
Epoch 0: 2%|▏ | 244/12384 [31:16<25:45:32, 7.64s/it, loss=7.1887, acc=0.0007, iter_time=6.46s]
Epoch 0: 2%|▏ | 245/12384 [31:16<26:04:58, 7.74s/it, loss=7.1887, acc=0.0007, iter_time=6.46s]
Epoch 0: 2%|▏ | 245/12384 [31:24<26:04:58, 7.74s/it, loss=7.3708, acc=0.0018, iter_time=9.11s]
Epoch 0: 2%|▏ | 246/12384 [31:24<26:00:05, 7.71s/it, loss=7.3708, acc=0.0018, iter_time=9.11s]
Epoch 0: 2%|▏ | 246/12384 [31:32<26:00:05, 7.71s/it, loss=7.8745, acc=0.0013, iter_time=7.66s]
Epoch 0: 2%|▏ | 247/12384 [31:32<25:56:15, 7.69s/it, loss=7.8745, acc=0.0013, iter_time=7.66s]
Epoch 0: 2%|▏ | 247/12384 [31:39<25:56:15, 7.69s/it, loss=7.2406, acc=0.0013, iter_time=7.64s]
Epoch 0: 2%|▏ | 248/12384 [31:39<25:54:27, 7.69s/it, loss=7.2406, acc=0.0013, iter_time=7.64s]
Epoch 0: 2%|▏ | 248/12384 [31:47<25:54:27, 7.69s/it, loss=7.3163, acc=0.0023, iter_time=7.34s]
Epoch 0: 2%|▏ | 249/12384 [31:47<25:50:08, 7.66s/it, loss=7.3163, acc=0.0023, iter_time=7.34s]
Epoch 0: 2%|▏ | 249/12384 [31:55<25:50:08, 7.66s/it, loss=7.6082, acc=0.0018, iter_time=8.41s]
Epoch 0: 2%|▏ | 250/12384 [31:55<25:51:22, 7.67s/it, loss=7.6082, acc=0.0018, iter_time=8.41s]
Epoch 0: 2%|▏ | 250/12384 [32:02<25:51:22, 7.67s/it, loss=7.2558, acc=0.0005, iter_time=7.23s]
Epoch 0: 2%|▏ | 251/12384 [32:02<25:50:15, 7.67s/it, loss=7.2558, acc=0.0005, iter_time=7.23s]
Epoch 0: 2%|▏ | 251/12384 [32:10<25:50:15, 7.67s/it, loss=7.6217, acc=0.0037, iter_time=7.64s]
Epoch 0: 2%|▏ | 252/12384 [32:10<25:50:25, 7.67s/it, loss=7.6217, acc=0.0037, iter_time=7.64s]
Epoch 0: 2%|▏ | 252/12384 [32:18<25:50:25, 7.67s/it, loss=7.3812, acc=0.0011, iter_time=7.77s]
Epoch 0: 2%|▏ | 253/12384 [32:18<25:52:09, 7.68s/it, loss=7.3812, acc=0.0011, iter_time=7.77s]
Epoch 0: 2%|▏ | 253/12384 [32:25<25:52:09, 7.68s/it, loss=7.3565, acc=0.0025, iter_time=7.60s]
Epoch 0: 2%|▏ | 254/12384 [32:25<25:48:52, 7.66s/it, loss=7.3565, acc=0.0025, iter_time=7.60s]
Epoch 0: 2%|▏ | 254/12384 [32:33<25:48:52, 7.66s/it, loss=7.2157, acc=0.0006, iter_time=7.65s]
Epoch 0: 2%|▏ | 255/12384 [32:33<25:48:10, 7.66s/it, loss=7.2157, acc=0.0006, iter_time=7.65s]
Epoch 0: 2%|▏ | 255/12384 [32:41<25:48:10, 7.66s/it, loss=7.7335, acc=0.0032, iter_time=8.03s]
Epoch 0: 2%|▏ | 256/12384 [32:41<25:47:10, 7.65s/it, loss=7.7335, acc=0.0032, iter_time=8.03s]
Epoch 0: 2%|▏ | 256/12384 [32:48<25:47:10, 7.65s/it, loss=7.2015, acc=0.0031, iter_time=7.33s]
Epoch 0: 2%|▏ | 257/12384 [32:48<25:50:04, 7.67s/it, loss=7.2015, acc=0.0031, iter_time=7.33s]
Epoch 0: 2%|▏ | 257/12384 [32:56<25:50:04, 7.67s/it, loss=7.1932, acc=0.0012, iter_time=4.10s]
Epoch 0: 2%|▏ | 258/12384 [32:56<25:47:00, 7.65s/it, loss=7.1932, acc=0.0012, iter_time=4.10s]
Epoch 0: 2%|▏ | 258/12384 [33:04<25:47:00, 7.65s/it, loss=7.2090, acc=0.0023, iter_time=8.53s]
Epoch 0: 2%|▏ | 259/12384 [33:04<25:48:05, 7.66s/it, loss=7.2090, acc=0.0023, iter_time=8.53s]
Epoch 0: 2%|▏ | 259/12384 [33:11<25:48:05, 7.66s/it, loss=7.0185, acc=0.0026, iter_time=8.88s]
Epoch 0: 2%|▏ | 260/12384 [33:11<25:45:49, 7.65s/it, loss=7.0185, acc=0.0026, iter_time=8.88s]
Epoch 0: 2%|▏ | 260/12384 [33:19<25:45:49, 7.65s/it, loss=6.9527, acc=0.0025, iter_time=9.03s]
Epoch 0: 2%|▏ | 261/12384 [33:19<25:45:03, 7.65s/it, loss=6.9527, acc=0.0025, iter_time=9.03s]
Epoch 0: 2%|▏ | 261/12384 [33:27<25:45:03, 7.65s/it, loss=7.0574, acc=0.0020, iter_time=7.67s]
Epoch 0: 2%|▏ | 262/12384 [33:27<25:45:16, 7.65s/it, loss=7.0574, acc=0.0020, iter_time=7.67s]
Epoch 0: 2%|▏ | 262/12384 [33:34<25:45:16, 7.65s/it, loss=7.2073, acc=0.0025, iter_time=7.63s]
Epoch 0: 2%|▏ | 263/12384 [33:34<25:48:03, 7.66s/it, loss=7.2073, acc=0.0025, iter_time=7.63s]
Epoch 0: 2%|▏ | 263/12384 [33:42<25:48:03, 7.66s/it, loss=7.3061, acc=0.0012, iter_time=8.09s]
Epoch 0: 2%|▏ | 264/12384 [33:42<25:44:58, 7.65s/it, loss=7.3061, acc=0.0012, iter_time=8.09s]
Epoch 0: 2%|▏ | 264/12384 [33:50<25:44:58, 7.65s/it, loss=7.0960, acc=0.0025, iter_time=7.21s]
Epoch 0: 2%|▏ | 265/12384 [33:50<25:46:19, 7.66s/it, loss=7.0960, acc=0.0025, iter_time=7.21s]
Epoch 0: 2%|▏ | 265/12384 [33:57<25:46:19, 7.66s/it, loss=6.9338, acc=0.0029, iter_time=5.62s]
Epoch 0: 2%|▏ | 266/12384 [33:57<25:46:25, 7.66s/it, loss=6.9338, acc=0.0029, iter_time=5.62s]
Epoch 0: 2%|▏ | 266/12384 [34:05<25:46:25, 7.66s/it, loss=6.8391, acc=0.0025, iter_time=9.73s]
Epoch 0: 2%|▏ | 267/12384 [34:05<25:43:47, 7.64s/it, loss=6.8391, acc=0.0025, iter_time=9.73s]
Epoch 0: 2%|▏ | 267/12384 [34:13<25:43:47, 7.64s/it, loss=7.1970, acc=0.0025, iter_time=5.53s]
Epoch 0: 2%|▏ | 268/12384 [34:13<25:42:40, 7.64s/it, loss=7.1970, acc=0.0025, iter_time=5.53s]
Epoch 0: 2%|▏ | 268/12384 [34:20<25:42:40, 7.64s/it, loss=7.0222, acc=0.0014, iter_time=7.73s]
Epoch 0: 2%|▏ | 269/12384 [34:20<25:41:18, 7.63s/it, loss=7.0222, acc=0.0014, iter_time=7.73s]
Epoch 0: 2%|▏ | 269/12384 [34:28<25:41:18, 7.63s/it, loss=6.9741, acc=0.0025, iter_time=9.60s]
Epoch 0: 2%|▏ | 270/12384 [34:28<25:42:21, 7.64s/it, loss=6.9741, acc=0.0025, iter_time=9.60s]
Epoch 0: 2%|▏ | 270/12384 [34:35<25:42:21, 7.64s/it, loss=7.2850, acc=0.0027, iter_time=7.68s]
Epoch 0: 2%|▏ | 271/12384 [34:35<25:45:43, 7.66s/it, loss=7.2850, acc=0.0027, iter_time=7.68s]
Epoch 0: 2%|▏ | 271/12384 [34:43<25:45:43, 7.66s/it, loss=7.3393, acc=0.0022, iter_time=8.00s]
Epoch 0: 2%|▏ | 272/12384 [34:43<26:05:41, 7.76s/it, loss=7.3393, acc=0.0022, iter_time=8.00s]
Epoch 0: 2%|▏ | 272/12384 [34:51<26:05:41, 7.76s/it, loss=6.7739, acc=0.0020, iter_time=7.68s]
Epoch 0: 2%|▏ | 273/12384 [34:51<25:58:03, 7.72s/it, loss=6.7739, acc=0.0020, iter_time=7.68s]
Epoch 0: 2%|▏ | 273/12384 [34:59<25:58:03, 7.72s/it, loss=6.9052, acc=0.0031, iter_time=7.63s]
Epoch 0: 2%|▏ | 274/12384 [34:59<25:52:15, 7.69s/it, loss=6.9052, acc=0.0031, iter_time=7.63s]
Epoch 0: 2%|▏ | 274/12384 [35:06<25:52:15, 7.69s/it, loss=6.9783, acc=0.0027, iter_time=7.61s]
Epoch 0: 2%|▏ | 275/12384 [35:06<25:47:34, 7.67s/it, loss=6.9783, acc=0.0027, iter_time=7.61s]
Epoch 0: 2%|▏ | 275/12384 [35:14<25:47:34, 7.67s/it, loss=7.3331, acc=0.0043, iter_time=7.61s]
Epoch 0: 2%|▏ | 276/12384 [35:14<25:45:53, 7.66s/it, loss=7.3331, acc=0.0043, iter_time=7.61s]
Epoch 0: 2%|▏ | 276/12384 [35:22<25:45:53, 7.66s/it, loss=6.9467, acc=0.0037, iter_time=7.65s]
Epoch 0: 2%|▏ | 277/12384 [35:22<25:43:51, 7.65s/it, loss=6.9467, acc=0.0037, iter_time=7.65s]
Epoch 0: 2%|▏ | 277/12384 [35:29<25:43:51, 7.65s/it, loss=6.8180, acc=0.0021, iter_time=7.61s]
Epoch 0: 2%|▏ | 278/12384 [35:29<25:43:24, 7.65s/it, loss=6.8180, acc=0.0021, iter_time=7.61s]
Epoch 0: 2%|▏ | 278/12384 [35:37<25:43:24, 7.65s/it, loss=6.8739, acc=0.0022, iter_time=7.66s]
Epoch 0: 2%|▏ | 279/12384 [35:37<25:43:12, 7.65s/it, loss=6.8739, acc=0.0022, iter_time=7.66s]
Epoch 0: 2%|▏ | 279/12384 [35:45<25:43:12, 7.65s/it, loss=7.0975, acc=0.0034, iter_time=7.73s]
Epoch 0: 2%|▏ | 280/12384 [35:45<25:40:40, 7.64s/it, loss=7.0975, acc=0.0034, iter_time=7.73s]
Epoch 0: 2%|▏ | 280/12384 [35:52<25:40:40, 7.64s/it, loss=7.0766, acc=0.0038, iter_time=7.50s]
Epoch 0: 2%|▏ | 281/12384 [35:52<25:40:49, 7.64s/it, loss=7.0766, acc=0.0038, iter_time=7.50s]
Epoch 0: 2%|▏ | 281/12384 [36:00<25:40:49, 7.64s/it, loss=6.6622, acc=0.0049, iter_time=7.04s]
Epoch 0: 2%|▏ | 282/12384 [36:00<25:38:44, 7.63s/it, loss=6.6622, acc=0.0049, iter_time=7.04s]
Epoch 0: 2%|▏ | 282/12384 [36:07<25:38:44, 7.63s/it, loss=7.0217, acc=0.0012, iter_time=5.96s]
Epoch 0: 2%|▏ | 283/12384 [36:07<25:41:08, 7.64s/it, loss=7.0217, acc=0.0012, iter_time=5.96s]
Epoch 0: 2%|▏ | 283/12384 [36:15<25:41:08, 7.64s/it, loss=6.9411, acc=0.0038, iter_time=9.92s]
Epoch 0: 2%|▏ | 284/12384 [36:15<25:38:59, 7.63s/it, loss=6.9411, acc=0.0038, iter_time=9.92s]
Epoch 0: 2%|▏ | 284/12384 [36:23<25:38:59, 7.63s/it, loss=7.3455, acc=0.0022, iter_time=7.63s]
Epoch 0: 2%|▏ | 285/12384 [36:23<25:38:43, 7.63s/it, loss=7.3455, acc=0.0022, iter_time=7.63s]
Epoch 0: 2%|▏ | 285/12384 [36:30<25:38:43, 7.63s/it, loss=6.8002, acc=0.0029, iter_time=7.63s]
Epoch 0: 2%|▏ | 286/12384 [36:30<25:39:46, 7.64s/it, loss=6.8002, acc=0.0029, iter_time=7.63s]
Epoch 0: 2%|▏ | 286/12384 [36:38<25:39:46, 7.64s/it, loss=6.7756, acc=0.0042, iter_time=7.65s]
Epoch 0: 2%|▏ | 287/12384 [36:38<25:37:32, 7.63s/it, loss=6.7756, acc=0.0042, iter_time=7.65s]
Epoch 0: 2%|▏ | 287/12384 [36:46<25:37:32, 7.63s/it, loss=7.3387, acc=0.0033, iter_time=7.99s]
Epoch 0: 2%|▏ | 288/12384 [36:46<25:38:22, 7.63s/it, loss=7.3387, acc=0.0033, iter_time=7.99s]
Epoch 0: 2%|▏ | 288/12384 [36:53<25:38:22, 7.63s/it, loss=6.7459, acc=0.0030, iter_time=6.96s]
Epoch 0: 2%|▏ | 289/12384 [36:53<25:35:55, 7.62s/it, loss=6.7459, acc=0.0030, iter_time=6.96s]
Epoch 0: 2%|▏ | 289/12384 [37:01<25:35:55, 7.62s/it, loss=6.3971, acc=0.0034, iter_time=7.90s]
Epoch 0: 2%|▏ | 290/12384 [37:01<25:37:36, 7.63s/it, loss=6.3971, acc=0.0034, iter_time=7.90s]
Epoch 0: 2%|▏ | 290/12384 [37:08<25:37:36, 7.63s/it, loss=6.7184, acc=0.0072, iter_time=7.63s]
Epoch 0: 2%|▏ | 291/12384 [37:08<25:38:29, 7.63s/it, loss=6.7184, acc=0.0072, iter_time=7.63s]
Epoch 0: 2%|▏ | 291/12384 [37:16<25:38:29, 7.63s/it, loss=6.7790, acc=0.0035, iter_time=7.64s]
Epoch 0: 2%|▏ | 292/12384 [37:16<25:39:30, 7.64s/it, loss=6.7790, acc=0.0035, iter_time=7.64s]
Epoch 0: 2%|▏ | 292/12384 [37:24<25:39:30, 7.64s/it, loss=6.5072, acc=0.0040, iter_time=7.66s]
Epoch 0: 2%|▏ | 293/12384 [37:24<25:38:43, 7.64s/it, loss=6.5072, acc=0.0040, iter_time=7.66s]
Epoch 0: 2%|▏ | 293/12384 [37:31<25:38:43, 7.64s/it, loss=6.6935, acc=0.0026, iter_time=5.07s]
Epoch 0: 2%|▏ | 294/12384 [37:31<25:40:16, 7.64s/it, loss=6.6935, acc=0.0026, iter_time=5.07s]
Epoch 0: 2%|▏ | 294/12384 [37:39<25:40:16, 7.64s/it, loss=6.3948, acc=0.0052, iter_time=8.13s]
Epoch 0: 2%|▏ | 295/12384 [37:39<25:38:37, 7.64s/it, loss=6.3948, acc=0.0052, iter_time=8.13s]
Epoch 0: 2%|▏ | 295/12384 [37:47<25:38:37, 7.64s/it, loss=6.7583, acc=0.0028, iter_time=9.71s]
Epoch 0: 2%|▏ | 296/12384 [37:47<25:40:48, 7.65s/it, loss=6.7583, acc=0.0028, iter_time=9.71s]
Epoch 0: 2%|▏ | 296/12384 [37:54<25:40:48, 7.65s/it, loss=6.1203, acc=0.0043, iter_time=7.66s]
Epoch 0: 2%|▏ | 297/12384 [37:54<25:39:54, 7.64s/it, loss=6.1203, acc=0.0043, iter_time=7.66s]
Epoch 0: 2%|▏ | 297/12384 [38:02<25:39:54, 7.64s/it, loss=7.0972, acc=0.0035, iter_time=7.96s]
Epoch 0: 2%|▏ | 298/12384 [38:02<26:00:03, 7.74s/it, loss=7.0972, acc=0.0035, iter_time=7.96s]
Epoch 0: 2%|▏ | 298/12384 [38:10<26:00:03, 7.74s/it, loss=6.2468, acc=0.0040, iter_time=7.07s]
Epoch 0: 2%|▏ | 299/12384 [38:10<25:54:47, 7.72s/it, loss=6.2468, acc=0.0040, iter_time=7.07s]
Epoch 0: 2%|▏ | 299/12384 [38:18<25:54:47, 7.72s/it, loss=6.3538, acc=0.0050, iter_time=8.72s]
Epoch 0: 2%|▏ | 300/12384 [38:18<25:52:28, 7.71s/it, loss=6.3538, acc=0.0050, iter_time=8.72s]
Epoch 0: 2%|▏ | 300/12384 [38:25<25:52:28, 7.71s/it, loss=5.8291, acc=0.0066, iter_time=4.60s]
Epoch 0: 2%|▏ | 301/12384 [38:25<25:49:18, 7.69s/it, loss=5.8291, acc=0.0066, iter_time=4.60s]
Epoch 0: 2%|▏ | 301/12384 [38:33<25:49:18, 7.69s/it, loss=6.3087, acc=0.0032, iter_time=10.30s]
Epoch 0: 2%|▏ | 302/12384 [38:33<25:48:30, 7.69s/it, loss=6.3087, acc=0.0032, iter_time=10.30s]
Epoch 0: 2%|▏ | 302/12384 [38:41<25:48:30, 7.69s/it, loss=6.6376, acc=0.0032, iter_time=5.61s]
Epoch 0: 2%|▏ | 303/12384 [38:41<25:42:30, 7.66s/it, loss=6.6376, acc=0.0032, iter_time=5.61s]
Epoch 0: 2%|▏ | 303/12384 [38:48<25:42:30, 7.66s/it, loss=6.8154, acc=0.0040, iter_time=10.00s]
Epoch 0: 2%|▏ | 304/12384 [38:48<25:41:36, 7.66s/it, loss=6.8154, acc=0.0040, iter_time=10.00s]
Epoch 0: 2%|▏ | 304/12384 [38:56<25:41:36, 7.66s/it, loss=5.8010, acc=0.0080, iter_time=4.22s]
Epoch 0: 2%|▏ | 305/12384 [38:56<25:39:34, 7.65s/it, loss=5.8010, acc=0.0080, iter_time=4.22s]
Epoch 0: 2%|▏ | 305/12384 [39:03<25:39:34, 7.65s/it, loss=6.6645, acc=0.0055, iter_time=10.67s]
Epoch 0: 2%|▏ | 306/12384 [39:03<25:38:25, 7.64s/it, loss=6.6645, acc=0.0055, iter_time=10.67s]
Epoch 0: 2%|▏ | 306/12384 [39:11<25:38:25, 7.64s/it, loss=6.6756, acc=0.0038, iter_time=5.32s]
Epoch 0: 2%|▏ | 307/12384 [39:11<25:34:56, 7.63s/it, loss=6.6756, acc=0.0038, iter_time=5.32s]
Epoch 0: 2%|▏ | 307/12384 [39:19<25:34:56, 7.63s/it, loss=6.4505, acc=0.0060, iter_time=9.92s]
Epoch 0: 2%|▏ | 308/12384 [39:19<25:36:27, 7.63s/it, loss=6.4505, acc=0.0060, iter_time=9.92s]
Epoch 0: 2%|▏ | 308/12384 [39:26<25:36:27, 7.63s/it, loss=6.1419, acc=0.0045, iter_time=4.76s]
Epoch 0: 2%|▏ | 309/12384 [39:26<25:35:33, 7.63s/it, loss=6.1419, acc=0.0045, iter_time=4.76s]
Epoch 0: 2%|▏ | 309/12384 [39:34<25:35:33, 7.63s/it, loss=5.9926, acc=0.0045, iter_time=6.99s]
Epoch 0: 3%|▎ | 310/12384 [39:34<25:37:26, 7.64s/it, loss=5.9926, acc=0.0045, iter_time=6.99s]
Epoch 0: 3%|▎ | 310/12384 [39:42<25:37:26, 7.64s/it, loss=6.0707, acc=0.0056, iter_time=11.17s]
Epoch 0: 3%|▎ | 311/12384 [39:42<25:36:56, 7.64s/it, loss=6.0707, acc=0.0056, iter_time=11.17s]
Epoch 0: 3%|▎ | 311/12384 [39:49<25:36:56, 7.64s/it, loss=6.5124, acc=0.0036, iter_time=7.74s]
Epoch 0: 3%|▎ | 312/12384 [39:49<25:37:29, 7.64s/it, loss=6.5124, acc=0.0036, iter_time=7.74s]
Epoch 0: 3%|▎ | 312/12384 [39:57<25:37:29, 7.64s/it, loss=5.6124, acc=0.0070, iter_time=5.01s]
Epoch 0: 3%|▎ | 313/12384 [39:57<25:39:13, 7.65s/it, loss=5.6124, acc=0.0070, iter_time=5.01s]
Epoch 0: 3%|▎ | 313/12384 [40:05<25:39:13, 7.65s/it, loss=6.2550, acc=0.0054, iter_time=10.20s]
Epoch 0: 3%|▎ | 314/12384 [40:05<25:39:13, 7.65s/it, loss=6.2550, acc=0.0054, iter_time=10.20s]
Epoch 0: 3%|▎ | 314/12384 [40:12<25:39:13, 7.65s/it, loss=5.9709, acc=0.0075, iter_time=5.64s]
Epoch 0: 3%|▎ | 315/12384 [40:12<25:40:12, 7.66s/it, loss=5.9709, acc=0.0075, iter_time=5.64s]
Epoch 0: 3%|▎ | 315/12384 [40:20<25:40:12, 7.66s/it, loss=6.4455, acc=0.0052, iter_time=9.69s]
Epoch 0: 3%|▎ | 316/12384 [40:20<25:41:19, 7.66s/it, loss=6.4455, acc=0.0052, iter_time=9.69s]
Epoch 0: 3%|▎ | 316/12384 [40:28<25:41:19, 7.66s/it, loss=5.5123, acc=0.0076, iter_time=5.37s]
Epoch 0: 3%|▎ | 317/12384 [40:28<25:42:23, 7.67s/it, loss=5.5123, acc=0.0076, iter_time=5.37s]
Epoch 0: 3%|▎ | 317/12384 [40:35<25:42:23, 7.67s/it, loss=5.9083, acc=0.0054, iter_time=10.00s]
Epoch 0: 3%|▎ | 318/12384 [40:35<25:43:43, 7.68s/it, loss=5.9083, acc=0.0054, iter_time=10.00s]
Epoch 0: 3%|▎ | 318/12384 [40:43<25:43:43, 7.68s/it, loss=5.7044, acc=0.0059, iter_time=4.80s]
Epoch 0: 3%|▎ | 319/12384 [40:43<25:43:38, 7.68s/it, loss=5.7044, acc=0.0059, iter_time=4.80s]
Epoch 0: 3%|▎ | 319/12384 [40:51<25:43:38, 7.68s/it, loss=6.1768, acc=0.0078, iter_time=10.52s]
Epoch 0: 3%|▎ | 320/12384 [40:51<25:42:00, 7.67s/it, loss=6.1768, acc=0.0078, iter_time=10.52s]
Epoch 0: 3%|▎ | 320/12384 [40:58<25:42:00, 7.67s/it, loss=5.7468, acc=0.0071, iter_time=7.68s]
Epoch 0: 3%|▎ | 321/12384 [40:58<25:39:49, 7.66s/it, loss=5.7468, acc=0.0071, iter_time=7.68s]
Epoch 0: 3%|▎ | 321/12384 [41:06<25:39:49, 7.66s/it, loss=5.8584, acc=0.0098, iter_time=4.80s]
Epoch 0: 3%|▎ | 322/12384 [41:06<25:35:59, 7.64s/it, loss=5.8584, acc=0.0098, iter_time=4.80s]
Epoch 0: 3%|▎ | 322/12384 [41:14<25:35:59, 7.64s/it, loss=6.2379, acc=0.0060, iter_time=10.44s]
Epoch 0: 3%|▎ | 323/12384 [41:14<25:35:57, 7.64s/it, loss=6.2379, acc=0.0060, iter_time=10.44s]
Epoch 0: 3%|▎ | 323/12384 [41:21<25:35:57, 7.64s/it, loss=5.9168, acc=0.0098, iter_time=7.30s]
Epoch 0: 3%|▎ | 324/12384 [41:21<25:36:27, 7.64s/it, loss=5.9168, acc=0.0098, iter_time=7.30s]
Epoch 0: 3%|▎ | 324/12384 [41:29<25:36:27, 7.64s/it, loss=5.6638, acc=0.0060, iter_time=8.30s]
Epoch 0: 3%|▎ | 325/12384 [41:29<25:54:59, 7.74s/it, loss=5.6638, acc=0.0060, iter_time=8.30s]
Epoch 0: 3%|▎ | 325/12384 [41:37<25:54:59, 7.74s/it, loss=5.8490, acc=0.0072, iter_time=7.62s]
Epoch 0: 3%|▎ | 326/12384 [41:37<25:50:37, 7.72s/it, loss=5.8490, acc=0.0072, iter_time=7.62s]
Epoch 0: 3%|▎ | 326/12384 [41:44<25:50:37, 7.72s/it, loss=5.6499, acc=0.0070, iter_time=7.66s]
Epoch 0: 3%|▎ | 327/12384 [41:44<25:45:52, 7.69s/it, loss=5.6499, acc=0.0070, iter_time=7.66s]
Epoch 0: 3%|▎ | 327/12384 [41:52<25:45:52, 7.69s/it, loss=5.8528, acc=0.0058, iter_time=8.03s]
Epoch 0: 3%|▎ | 328/12384 [41:52<25:40:44, 7.67s/it, loss=5.8528, acc=0.0058, iter_time=8.03s]
Epoch 0: 3%|▎ | 328/12384 [42:00<25:40:44, 7.67s/it, loss=5.3495, acc=0.0093, iter_time=7.22s]
Epoch 0: 3%|▎ | 329/12384 [42:00<25:39:31, 7.66s/it, loss=5.3495, acc=0.0093, iter_time=7.22s]
Epoch 0: 3%|▎ | 329/12384 [42:07<25:39:31, 7.66s/it, loss=5.3448, acc=0.0088, iter_time=7.64s]
Epoch 0: 3%|▎ | 330/12384 [42:07<25:37:29, 7.65s/it, loss=5.3448, acc=0.0088, iter_time=7.64s]
Epoch 0: 3%|▎ | 330/12384 [42:15<25:37:29, 7.65s/it, loss=5.8485, acc=0.0064, iter_time=7.66s]
Epoch 0: 3%|▎ | 331/12384 [42:15<25:35:47, 7.65s/it, loss=5.8485, acc=0.0064, iter_time=7.66s]
Epoch 0: 3%|▎ | 331/12384 [42:23<25:35:47, 7.65s/it, loss=5.9459, acc=0.0068, iter_time=7.62s]
Epoch 0: 3%|▎ | 332/12384 [42:23<25:35:17, 7.64s/it, loss=5.9459, acc=0.0068, iter_time=7.62s]
Epoch 0: 3%|▎ | 332/12384 [42:30<25:35:17, 7.64s/it, loss=5.4085, acc=0.0101, iter_time=7.63s]
Epoch 0: 3%|▎ | 333/12384 [42:30<25:37:01, 7.65s/it, loss=5.4085, acc=0.0101, iter_time=7.63s]
Epoch 0: 3%|▎ | 333/12384 [42:38<25:37:01, 7.65s/it, loss=5.3133, acc=0.0101, iter_time=5.07s]
Epoch 0: 3%|▎ | 334/12384 [42:38<25:36:06, 7.65s/it, loss=5.3133, acc=0.0101, iter_time=5.07s]
Epoch 0: 3%|▎ | 334/12384 [42:46<25:36:06, 7.65s/it, loss=5.3288, acc=0.0072, iter_time=10.25s]
Epoch 0: 3%|▎ | 335/12384 [42:46<25:36:47, 7.65s/it, loss=5.3288, acc=0.0072, iter_time=10.25s]
Epoch 0: 3%|▎ | 335/12384 [42:53<25:36:47, 7.65s/it, loss=5.7861, acc=0.0081, iter_time=8.04s]
Epoch 0: 3%|▎ | 336/12384 [42:53<25:34:58, 7.64s/it, loss=5.7861, acc=0.0081, iter_time=8.04s]
Epoch 0: 3%|▎ | 336/12384 [43:01<25:34:58, 7.64s/it, loss=5.7992, acc=0.0069, iter_time=7.23s]
Epoch 0: 3%|▎ | 337/12384 [43:01<25:38:53, 7.66s/it, loss=5.7992, acc=0.0069, iter_time=7.23s]
Epoch 0: 3%|▎ | 337/12384 [43:09<25:38:53, 7.66s/it, loss=6.0970, acc=0.0070, iter_time=7.73s]
Epoch 0: 3%|▎ | 338/12384 [43:09<25:40:20, 7.67s/it, loss=6.0970, acc=0.0070, iter_time=7.73s]
Epoch 0: 3%|▎ | 338/12384 [43:16<25:40:20, 7.67s/it, loss=5.6665, acc=0.0068, iter_time=7.69s]
Epoch 0: 3%|▎ | 339/12384 [43:16<25:38:39, 7.66s/it, loss=5.6665, acc=0.0068, iter_time=7.69s]
Epoch 0: 3%|▎ | 339/12384 [43:24<25:38:39, 7.66s/it, loss=5.7326, acc=0.0087, iter_time=5.86s]
Epoch 0: 3%|▎ | 340/12384 [43:24<25:38:37, 7.66s/it, loss=5.7326, acc=0.0087, iter_time=5.86s]
Epoch 0: 3%|▎ | 340/12384 [43:32<25:38:37, 7.66s/it, loss=5.4915, acc=0.0102, iter_time=9.45s]
Epoch 0: 3%|▎ | 341/12384 [43:32<25:38:16, 7.66s/it, loss=5.4915, acc=0.0102, iter_time=9.45s]
Epoch 0: 3%|▎ | 341/12384 [43:39<25:38:16, 7.66s/it, loss=5.7700, acc=0.0064, iter_time=7.67s]
Epoch 0: 3%|▎ | 342/12384 [43:39<25:37:02, 7.66s/it, loss=5.7700, acc=0.0064, iter_time=7.67s]
Epoch 0: 3%|▎ | 342/12384 [43:47<25:37:02, 7.66s/it, loss=5.6819, acc=0.0080, iter_time=7.63s]
Epoch 0: 3%|▎ | 343/12384 [43:47<25:34:27, 7.65s/it, loss=5.6819, acc=0.0080, iter_time=7.63s]
Epoch 0: 3%|▎ | 343/12384 [43:54<25:34:27, 7.65s/it, loss=5.4848, acc=0.0113, iter_time=8.01s]
Epoch 0: 3%|▎ | 344/12384 [43:54<25:33:07, 7.64s/it, loss=5.4848, acc=0.0113, iter_time=8.01s]
Epoch 0: 3%|▎ | 344/12384 [44:02<25:33:07, 7.64s/it, loss=5.6680, acc=0.0124, iter_time=7.25s]
Epoch 0: 3%|▎ | 345/12384 [44:02<25:33:43, 7.64s/it, loss=5.6680, acc=0.0124, iter_time=7.25s]
Epoch 0: 3%|▎ | 345/12384 [44:10<25:33:43, 7.64s/it, loss=5.4482, acc=0.0082, iter_time=7.64s]
Epoch 0: 3%|▎ | 346/12384 [44:10<25:33:42, 7.64s/it, loss=5.4482, acc=0.0082, iter_time=7.64s]
Epoch 0: 3%|▎ | 346/12384 [44:17<25:33:42, 7.64s/it, loss=5.3382, acc=0.0116, iter_time=7.65s]
Epoch 0: 3%|▎ | 347/12384 [44:17<25:30:54, 7.63s/it, loss=5.3382, acc=0.0116, iter_time=7.65s]
Epoch 0: 3%|▎ | 347/12384 [44:25<25:30:54, 7.63s/it, loss=5.9495, acc=0.0055, iter_time=7.62s]
Epoch 0: 3%|▎ | 348/12384 [44:25<25:30:03, 7.63s/it, loss=5.9495, acc=0.0055, iter_time=7.62s]
Epoch 0: 3%|▎ | 348/12384 [44:33<25:30:03, 7.63s/it, loss=5.5126, acc=0.0067, iter_time=7.60s]
Epoch 0: 3%|▎ | 349/12384 [44:33<25:30:12, 7.63s/it, loss=5.5126, acc=0.0067, iter_time=7.60s]
Epoch 0: 3%|▎ | 349/12384 [44:40<25:30:12, 7.63s/it, loss=5.4053, acc=0.0117, iter_time=8.02s]
Epoch 0: 3%|▎ | 350/12384 [44:40<25:28:43, 7.62s/it, loss=5.4053, acc=0.0117, iter_time=8.02s]
Epoch 0: 3%|▎ | 350/12384 [44:48<25:28:43, 7.62s/it, loss=5.0049, acc=0.0102, iter_time=7.57s]
Epoch 0: 3%|▎ | 351/12384 [44:48<25:50:39, 7.73s/it, loss=5.0049, acc=0.0102, iter_time=7.57s]
Epoch 0: 3%|▎ | 351/12384 [44:56<25:50:39, 7.73s/it, loss=4.9376, acc=0.0129, iter_time=7.60s]
Epoch 0: 3%|▎ | 352/12384 [44:56<25:44:47, 7.70s/it, loss=4.9376, acc=0.0129, iter_time=7.60s]
Epoch 0: 3%|▎ | 352/12384 [45:03<25:44:47, 7.70s/it, loss=5.2557, acc=0.0145, iter_time=7.66s]
Epoch 0: 3%|▎ | 353/12384 [45:03<25:40:11, 7.68s/it, loss=5.2557, acc=0.0145, iter_time=7.66s]
Epoch 0: 3%|▎ | 353/12384 [45:11<25:40:11, 7.68s/it, loss=4.6446, acc=0.0172, iter_time=7.64s]
Epoch 0: 3%|▎ | 354/12384 [45:11<25:35:22, 7.66s/it, loss=4.6446, acc=0.0172, iter_time=7.64s]
Epoch 0: 3%|▎ | 354/12384 [45:19<25:35:22, 7.66s/it, loss=4.7147, acc=0.0130, iter_time=7.60s]
Epoch 0: 3%|▎ | 355/12384 [45:19<25:33:58, 7.65s/it, loss=4.7147, acc=0.0130, iter_time=7.60s]
Epoch 0: 3%|▎ | 355/12384 [45:26<25:33:58, 7.65s/it, loss=5.1595, acc=0.0100, iter_time=3.61s]
Epoch 0: 3%|▎ | 356/12384 [45:26<25:37:44, 7.67s/it, loss=5.1595, acc=0.0100, iter_time=3.61s]
Epoch 0: 3%|▎ | 356/12384 [45:34<25:37:44, 7.67s/it, loss=5.1754, acc=0.0106, iter_time=11.74s]
Epoch 0: 3%|▎ | 357/12384 [45:34<25:34:07, 7.65s/it, loss=5.1754, acc=0.0106, iter_time=11.74s]
Epoch 0: 3%|▎ | 357/12384 [45:42<25:34:07, 7.65s/it, loss=5.2104, acc=0.0132, iter_time=7.60s]
Epoch 0: 3%|▎ | 358/12384 [45:42<25:33:46, 7.65s/it, loss=5.2104, acc=0.0132, iter_time=7.60s]
Epoch 0: 3%|▎ | 358/12384 [45:49<25:33:46, 7.65s/it, loss=5.5443, acc=0.0122, iter_time=7.68s]
Epoch 0: 3%|▎ | 359/12384 [45:49<25:32:20, 7.65s/it, loss=5.5443, acc=0.0122, iter_time=7.68s]
Epoch 0: 3%|▎ | 359/12384 [45:57<25:32:20, 7.65s/it, loss=4.6941, acc=0.0179, iter_time=7.56s]
Epoch 0: 3%|▎ | 360/12384 [45:57<25:30:07, 7.64s/it, loss=4.6941, acc=0.0179, iter_time=7.56s]
Epoch 0: 3%|▎ | 360/12384 [46:05<25:30:07, 7.64s/it, loss=5.2813, acc=0.0146, iter_time=7.65s]
Epoch 0: 3%|▎ | 361/12384 [46:05<25:28:42, 7.63s/it, loss=5.2813, acc=0.0146, iter_time=7.65s]
Epoch 0: 3%|▎ | 361/12384 [46:12<25:28:42, 7.63s/it, loss=4.4687, acc=0.0203, iter_time=5.53s]
Epoch 0: 3%|▎ | 362/12384 [46:12<25:32:07, 7.65s/it, loss=4.4687, acc=0.0203, iter_time=5.53s]
Epoch 0: 3%|▎ | 362/12384 [46:20<25:32:07, 7.65s/it, loss=4.8078, acc=0.0235, iter_time=9.80s]
Epoch 0: 3%|▎ | 363/12384 [46:20<25:32:04, 7.65s/it, loss=4.8078, acc=0.0235, iter_time=9.80s]
Epoch 0: 3%|▎ | 363/12384 [46:28<25:32:04, 7.65s/it, loss=4.4958, acc=0.0183, iter_time=7.63s]
Epoch 0: 3%|▎ | 364/12384 [46:28<25:30:55, 7.64s/it, loss=4.4958, acc=0.0183, iter_time=7.63s]
Epoch 0: 3%|▎ | 364/12384 [46:35<25:30:55, 7.64s/it, loss=5.0373, acc=0.0105, iter_time=7.66s]
Epoch 0: 3%|▎ | 365/12384 [46:35<25:29:15, 7.63s/it, loss=5.0373, acc=0.0105, iter_time=7.66s]
Epoch 0: 3%|▎ | 365/12384 [46:43<25:29:15, 7.63s/it, loss=4.6957, acc=0.0158, iter_time=7.60s]
Epoch 0: 3%|▎ | 366/12384 [46:43<25:31:48, 7.65s/it, loss=4.6957, acc=0.0158, iter_time=7.60s]
Epoch 0: 3%|▎ | 366/12384 [46:50<25:31:48, 7.65s/it, loss=4.7914, acc=0.0158, iter_time=7.70s]
Epoch 0: 3%|▎ | 367/12384 [46:50<25:29:35, 7.64s/it, loss=4.7914, acc=0.0158, iter_time=7.70s]
Epoch 0: 3%|▎ | 367/12384 [46:58<25:29:35, 7.64s/it, loss=4.8600, acc=0.0196, iter_time=7.59s]
Epoch 0: 3%|▎ | 368/12384 [46:58<25:30:08, 7.64s/it, loss=4.8600, acc=0.0196, iter_time=7.59s]
Epoch 0: 3%|▎ | 368/12384 [47:06<25:30:08, 7.64s/it, loss=4.6137, acc=0.0147, iter_time=7.68s]
Epoch 0: 3%|▎ | 369/12384 [47:06<25:37:18, 7.68s/it, loss=4.6137, acc=0.0147, iter_time=7.68s]
Epoch 0: 3%|▎ | 369/12384 [47:13<25:37:18, 7.68s/it, loss=4.9908, acc=0.0129, iter_time=7.73s]
Epoch 0: 3%|▎ | 370/12384 [47:13<25:33:52, 7.66s/it, loss=4.9908, acc=0.0129, iter_time=7.73s]
Epoch 0: 3%|▎ | 370/12384 [47:21<25:33:52, 7.66s/it, loss=4.8862, acc=0.0132, iter_time=7.66s]
Epoch 0: 3%|▎ | 371/12384 [47:21<25:32:29, 7.65s/it, loss=4.8862, acc=0.0132, iter_time=7.66s]
Epoch 0: 3%|▎ | 371/12384 [47:29<25:32:29, 7.65s/it, loss=4.9949, acc=0.0125, iter_time=7.61s]
Epoch 0: 3%|▎ | 372/12384 [47:29<25:29:35, 7.64s/it, loss=4.9949, acc=0.0125, iter_time=7.61s]
Epoch 0: 3%|▎ | 372/12384 [47:36<25:29:35, 7.64s/it, loss=4.9881, acc=0.0133, iter_time=7.64s]
Epoch 0: 3%|▎ | 373/12384 [47:36<25:30:03, 7.64s/it, loss=4.9881, acc=0.0133, iter_time=7.64s]
Epoch 0: 3%|▎ | 373/12384 [47:44<25:30:03, 7.64s/it, loss=4.7250, acc=0.0206, iter_time=4.32s]
Epoch 0: 3%|▎ | 374/12384 [47:44<25:29:53, 7.64s/it, loss=4.7250, acc=0.0206, iter_time=4.32s]
Epoch 0: 3%|▎ | 374/12384 [47:52<25:29:53, 7.64s/it, loss=5.1235, acc=0.0125, iter_time=10.95s]
Epoch 0: 3%|▎ | 375/12384 [47:52<25:28:39, 7.64s/it, loss=5.1235, acc=0.0125, iter_time=10.95s]
Epoch 0: 3%|▎ | 375/12384 [47:59<25:28:39, 7.64s/it, loss=5.1166, acc=0.0131, iter_time=8.01s]
Epoch 0: 3%|▎ | 376/12384 [47:59<25:29:48, 7.64s/it, loss=5.1166, acc=0.0131, iter_time=8.01s]
Epoch 0: 3%|▎ | 376/12384 [48:07<25:29:48, 7.64s/it, loss=5.0236, acc=0.0119, iter_time=7.56s]
Epoch 0: 3%|▎ | 377/12384 [48:07<25:47:08, 7.73s/it, loss=5.0236, acc=0.0119, iter_time=7.56s]
Epoch 0: 3%|▎ | 377/12384 [48:15<25:47:08, 7.73s/it, loss=4.2411, acc=0.0275, iter_time=4.34s]
Epoch 0: 3%|▎ | 378/12384 [48:15<25:37:55, 7.69s/it, loss=4.2411, acc=0.0275, iter_time=4.34s]
Epoch 0: 3%|▎ | 378/12384 [48:22<25:37:55, 7.69s/it, loss=4.5981, acc=0.0179, iter_time=10.23s]
Epoch 0: 3%|▎ | 379/12384 [48:22<25:37:33, 7.68s/it, loss=4.5981, acc=0.0179, iter_time=10.23s]
Epoch 0: 3%|▎ | 379/12384 [48:30<25:37:33, 7.68s/it, loss=5.0602, acc=0.0156, iter_time=7.47s]
Epoch 0: 3%|▎ | 380/12384 [48:30<25:36:04, 7.68s/it, loss=5.0602, acc=0.0156, iter_time=7.47s]
Epoch 0: 3%|▎ | 380/12384 [48:38<25:36:04, 7.68s/it, loss=4.7217, acc=0.0143, iter_time=8.51s]
Epoch 0: 3%|▎ | 381/12384 [48:38<25:32:56, 7.66s/it, loss=4.7217, acc=0.0143, iter_time=8.51s]
Epoch 0: 3%|▎ | 381/12384 [48:45<25:32:56, 7.66s/it, loss=4.8477, acc=0.0153, iter_time=7.63s]
Epoch 0: 3%|▎ | 382/12384 [48:45<25:30:49, 7.65s/it, loss=4.8477, acc=0.0153, iter_time=7.63s]
Epoch 0: 3%|▎ | 382/12384 [48:53<25:30:49, 7.65s/it, loss=4.2739, acc=0.0184, iter_time=7.65s]
Epoch 0: 3%|▎ | 383/12384 [48:53<25:31:10, 7.66s/it, loss=4.2739, acc=0.0184, iter_time=7.65s]
Epoch 0: 3%|▎ | 383/12384 [49:01<25:31:10, 7.66s/it, loss=4.7012, acc=0.0205, iter_time=8.04s]
Epoch 0: 3%|▎ | 384/12384 [49:01<25:28:24, 7.64s/it, loss=4.7012, acc=0.0205, iter_time=8.04s]
Epoch 0: 3%|▎ | 384/12384 [49:08<25:28:24, 7.64s/it, loss=4.2782, acc=0.0249, iter_time=7.27s]
Epoch 0: 3%|▎ | 385/12384 [49:08<25:29:26, 7.65s/it, loss=4.2782, acc=0.0249, iter_time=7.27s]
Epoch 0: 3%|▎ | 385/12384 [49:16<25:29:26, 7.65s/it, loss=4.4541, acc=0.0239, iter_time=7.62s]
Epoch 0: 3%|▎ | 386/12384 [49:16<25:28:25, 7.64s/it, loss=4.4541, acc=0.0239, iter_time=7.62s]
Epoch 0: 3%|▎ | 386/12384 [49:24<25:28:25, 7.64s/it, loss=4.2846, acc=0.0287, iter_time=6.77s]
Epoch 0: 3%|▎ | 387/12384 [49:24<25:28:19, 7.64s/it, loss=4.2846, acc=0.0287, iter_time=6.77s]
Epoch 0: 3%|▎ | 387/12384 [49:31<25:28:19, 7.64s/it, loss=4.1714, acc=0.0222, iter_time=8.50s]
Epoch 0: 3%|▎ | 388/12384 [49:31<25:27:30, 7.64s/it, loss=4.1714, acc=0.0222, iter_time=8.50s]
Epoch 0: 3%|▎ | 388/12384 [49:39<25:27:30, 7.64s/it, loss=4.2648, acc=0.0199, iter_time=7.63s]
Epoch 0: 3%|▎ | 389/12384 [49:39<25:31:02, 7.66s/it, loss=4.2648, acc=0.0199, iter_time=7.63s]
Epoch 0: 3%|▎ | 389/12384 [49:47<25:31:02, 7.66s/it, loss=4.3564, acc=0.0300, iter_time=7.40s]
Epoch 0: 3%|▎ | 390/12384 [49:47<25:27:13, 7.64s/it, loss=4.3564, acc=0.0300, iter_time=7.40s]
Epoch 0: 3%|▎ | 390/12384 [49:54<25:27:13, 7.64s/it, loss=4.5471, acc=0.0209, iter_time=7.91s]
Epoch 0: 3%|▎ | 391/12384 [49:54<25:27:37, 7.64s/it, loss=4.5471, acc=0.0209, iter_time=7.91s]
Epoch 0: 3%|▎ | 391/12384 [50:02<25:27:37, 7.64s/it, loss=4.4058, acc=0.0166, iter_time=8.04s]
Epoch 0: 3%|▎ | 392/12384 [50:02<25:28:59, 7.65s/it, loss=4.4058, acc=0.0166, iter_time=8.04s]
Epoch 0: 3%|▎ | 392/12384 [50:10<25:28:59, 7.65s/it, loss=4.1021, acc=0.0195, iter_time=7.38s]
Epoch 0: 3%|▎ | 393/12384 [50:10<25:32:59, 7.67s/it, loss=4.1021, acc=0.0195, iter_time=7.38s]
Epoch 0: 3%|▎ | 393/12384 [50:17<25:32:59, 7.67s/it, loss=4.2500, acc=0.0247, iter_time=6.98s]
Epoch 0: 3%|▎ | 394/12384 [50:17<25:31:09, 7.66s/it, loss=4.2500, acc=0.0247, iter_time=6.98s]
Epoch 0: 3%|▎ | 394/12384 [50:25<25:31:09, 7.66s/it, loss=4.0351, acc=0.0294, iter_time=5.35s]
Epoch 0: 3%|▎ | 395/12384 [50:25<25:32:56, 7.67s/it, loss=4.0351, acc=0.0294, iter_time=5.35s]
Epoch 0: 3%|▎ | 395/12384 [50:33<25:32:56, 7.67s/it, loss=4.0351, acc=0.0264, iter_time=10.65s]
Epoch 0: 3%|▎ | 396/12384 [50:33<25:32:00, 7.67s/it, loss=4.0351, acc=0.0264, iter_time=10.65s]
Epoch 0: 3%|▎ | 396/12384 [50:40<25:32:00, 7.67s/it, loss=3.8231, acc=0.0282, iter_time=7.63s]
Epoch 0: 3%|▎ | 397/12384 [50:40<25:29:23, 7.66s/it, loss=3.8231, acc=0.0282, iter_time=7.63s]
Epoch 0: 3%|▎ | 397/12384 [50:48<25:29:23, 7.66s/it, loss=4.3682, acc=0.0196, iter_time=7.65s]
Epoch 0: 3%|▎ | 398/12384 [50:48<25:31:08, 7.66s/it, loss=4.3682, acc=0.0196, iter_time=7.65s]
Epoch 0: 3%|▎ | 398/12384 [50:56<25:31:08, 7.66s/it, loss=3.7488, acc=0.0245, iter_time=6.43s]
Epoch 0: 3%|▎ | 399/12384 [50:56<25:29:10, 7.66s/it, loss=3.7488, acc=0.0245, iter_time=6.43s]
Epoch 0: 3%|▎ | 399/12384 [51:03<25:29:10, 7.66s/it, loss=4.3565, acc=0.0228, iter_time=9.42s]
Epoch 0: 3%|▎ | 400/12384 [51:03<25:35:48, 7.69s/it, loss=4.3565, acc=0.0228, iter_time=9.42s]
Epoch 0: 3%|▎ | 400/12384 [51:11<25:35:48, 7.69s/it, loss=3.7938, acc=0.0266, iter_time=7.20s]
Epoch 0: 3%|▎ | 401/12384 [51:11<25:31:45, 7.67s/it, loss=3.7938, acc=0.0266, iter_time=7.20s]
Epoch 0: 3%|▎ | 401/12384 [51:19<25:31:45, 7.67s/it, loss=4.2312, acc=0.0216, iter_time=7.64s]
Epoch 0: 3%|▎ | 402/12384 [51:19<25:31:52, 7.67s/it, loss=4.2312, acc=0.0216, iter_time=7.64s]
Epoch 0: 3%|▎ | 402/12384 [51:27<25:31:52, 7.67s/it, loss=3.9393, acc=0.0294, iter_time=8.02s]
Epoch 0: 3%|▎ | 403/12384 [51:27<25:53:43, 7.78s/it, loss=3.9393, acc=0.0294, iter_time=8.02s]
Epoch 0: 3%|▎ | 403/12384 [51:34<25:53:43, 7.78s/it, loss=4.2445, acc=0.0226, iter_time=6.81s]
Epoch 0: 3%|▎ | 404/12384 [51:34<25:45:49, 7.74s/it, loss=4.2445, acc=0.0226, iter_time=6.81s]
Epoch 0: 3%|▎ | 404/12384 [51:42<25:45:49, 7.74s/it, loss=3.7501, acc=0.0291, iter_time=7.12s]
Epoch 0: 3%|▎ | 405/12384 [51:42<25:43:25, 7.73s/it, loss=3.7501, acc=0.0291, iter_time=7.12s]
Epoch 0: 3%|▎ | 405/12384 [51:50<25:43:25, 7.73s/it, loss=3.5726, acc=0.0380, iter_time=7.14s]
Epoch 0: 3%|▎ | 406/12384 [51:50<25:38:49, 7.71s/it, loss=3.5726, acc=0.0380, iter_time=7.14s]
Epoch 0: 3%|▎ | 406/12384 [51:57<25:38:49, 7.71s/it, loss=4.2236, acc=0.0188, iter_time=9.66s]
Epoch 0: 3%|▎ | 407/12384 [51:57<25:35:21, 7.69s/it, loss=4.2236, acc=0.0188, iter_time=9.66s]
Epoch 0: 3%|▎ | 407/12384 [52:05<25:35:21, 7.69s/it, loss=3.8117, acc=0.0293, iter_time=8.06s]
Epoch 0: 3%|▎ | 408/12384 [52:05<25:33:23, 7.68s/it, loss=3.8117, acc=0.0293, iter_time=8.06s]
Epoch 0: 3%|▎ | 408/12384 [52:13<25:33:23, 7.68s/it, loss=3.6982, acc=0.0342, iter_time=7.23s]
Epoch 0: 3%|▎ | 409/12384 [52:13<25:30:38, 7.67s/it, loss=3.6982, acc=0.0342, iter_time=7.23s]
Epoch 0: 3%|▎ | 409/12384 [52:20<25:30:38, 7.67s/it, loss=3.5757, acc=0.0318, iter_time=7.67s]
Epoch 0: 3%|▎ | 410/12384 [52:20<25:33:26, 7.68s/it, loss=3.5757, acc=0.0318, iter_time=7.67s]
Epoch 0: 3%|▎ | 410/12384 [52:28<25:33:26, 7.68s/it, loss=3.8740, acc=0.0279, iter_time=7.70s]
Epoch 0: 3%|▎ | 411/12384 [52:28<25:32:28, 7.68s/it, loss=3.8740, acc=0.0279, iter_time=7.70s]
Epoch 0: 3%|▎ | 411/12384 [52:36<25:32:28, 7.68s/it, loss=3.5094, acc=0.0339, iter_time=7.09s]
Epoch 0: 3%|▎ | 412/12384 [52:36<25:30:37, 7.67s/it, loss=3.5094, acc=0.0339, iter_time=7.09s]
Epoch 0: 3%|▎ | 412/12384 [52:43<25:30:37, 7.67s/it, loss=3.2465, acc=0.0371, iter_time=4.61s]
Epoch 0: 3%|▎ | 413/12384 [52:43<25:29:09, 7.66s/it, loss=3.2465, acc=0.0371, iter_time=4.61s]
Epoch 0: 3%|▎ | 413/12384 [52:51<25:29:09, 7.66s/it, loss=2.8904, acc=0.0574, iter_time=8.40s]
Epoch 0: 3%|▎ | 414/12384 [52:51<25:28:28, 7.66s/it, loss=2.8904, acc=0.0574, iter_time=8.40s]
Epoch 0: 3%|▎ | 414/12384 [52:59<25:28:28, 7.66s/it, loss=3.6628, acc=0.0276, iter_time=10.50s]
Epoch 0: 3%|▎ | 415/12384 [52:59<25:25:31, 7.65s/it, loss=3.6628, acc=0.0276, iter_time=10.50s]
Epoch 0: 3%|▎ | 415/12384 [53:06<25:25:31, 7.65s/it, loss=3.8821, acc=0.0325, iter_time=8.01s]
Epoch 0: 3%|▎ | 416/12384 [53:06<25:26:24, 7.65s/it, loss=3.8821, acc=0.0325, iter_time=8.01s]
Epoch 0: 3%|▎ | 416/12384 [53:14<25:26:24, 7.65s/it, loss=3.2570, acc=0.0432, iter_time=4.50s]
Epoch 0: 3%|▎ | 417/12384 [53:14<25:28:00, 7.66s/it, loss=3.2570, acc=0.0432, iter_time=4.50s]
Epoch 0: 3%|▎ | 417/12384 [53:22<25:28:00, 7.66s/it, loss=3.5080, acc=0.0288, iter_time=10.45s]
Epoch 0: 3%|▎ | 418/12384 [53:22<25:30:13, 7.67s/it, loss=3.5080, acc=0.0288, iter_time=10.45s]
Epoch 0: 3%|▎ | 418/12384 [53:29<25:30:13, 7.67s/it, loss=3.0909, acc=0.0365, iter_time=7.70s]
Epoch 0: 3%|▎ | 419/12384 [53:29<25:27:52, 7.66s/it, loss=3.0909, acc=0.0365, iter_time=7.70s]
Epoch 0: 3%|▎ | 419/12384 [53:37<25:27:52, 7.66s/it, loss=3.4928, acc=0.0372, iter_time=7.65s]
Epoch 0: 3%|▎ | 420/12384 [53:37<25:27:45, 7.66s/it, loss=3.4928, acc=0.0372, iter_time=7.65s]
Epoch 0: 3%|▎ | 420/12384 [53:45<25:27:45, 7.66s/it, loss=3.4464, acc=0.0396, iter_time=7.65s]
Epoch 0: 3%|▎ | 421/12384 [53:45<25:25:33, 7.65s/it, loss=3.4464, acc=0.0396, iter_time=7.65s]
Epoch 0: 3%|▎ | 421/12384 [53:52<25:25:33, 7.65s/it, loss=3.3146, acc=0.0343, iter_time=7.63s]
Epoch 0: 3%|▎ | 422/12384 [53:52<25:22:39, 7.64s/it, loss=3.3146, acc=0.0343, iter_time=7.63s]
Epoch 0: 3%|▎ | 422/12384 [54:00<25:22:39, 7.64s/it, loss=3.3239, acc=0.0348, iter_time=6.66s]
Epoch 0: 3%|▎ | 423/12384 [54:00<25:23:53, 7.64s/it, loss=3.3239, acc=0.0348, iter_time=6.66s]
Epoch 0: 3%|▎ | 423/12384 [54:07<25:23:53, 7.64s/it, loss=3.2749, acc=0.0364, iter_time=8.56s]
Epoch 0: 3%|▎ | 424/12384 [54:07<25:22:46, 7.64s/it, loss=3.2749, acc=0.0364, iter_time=8.56s]
Epoch 0: 3%|▎ | 424/12384 [54:15<25:22:46, 7.64s/it, loss=3.0364, acc=0.0451, iter_time=7.66s]
Epoch 0: 3%|▎ | 425/12384 [54:15<25:22:33, 7.64s/it, loss=3.0364, acc=0.0451, iter_time=7.66s]
Epoch 0: 3%|▎ | 425/12384 [54:23<25:22:33, 7.64s/it, loss=3.0444, acc=0.0412, iter_time=7.65s]
Epoch 0: 3%|▎ | 426/12384 [54:23<25:21:50, 7.64s/it, loss=3.0444, acc=0.0412, iter_time=7.65s]
Epoch 0: 3%|▎ | 426/12384 [54:30<25:21:50, 7.64s/it, loss=3.2301, acc=0.0386, iter_time=7.72s]
Epoch 0: 3%|▎ | 427/12384 [54:30<25:26:05, 7.66s/it, loss=3.2301, acc=0.0386, iter_time=7.72s]
Epoch 0: 3%|▎ | 427/12384 [54:38<25:26:05, 7.66s/it, loss=3.2357, acc=0.0334, iter_time=7.62s]
Epoch 0: 3%|▎ | 428/12384 [54:38<25:22:50, 7.64s/it, loss=3.2357, acc=0.0334, iter_time=7.62s]
Epoch 0: 3%|▎ | 428/12384 [54:46<25:22:50, 7.64s/it, loss=3.1309, acc=0.0459, iter_time=5.59s]
Epoch 0: 3%|▎ | 429/12384 [54:46<25:44:00, 7.75s/it, loss=3.1309, acc=0.0459, iter_time=5.59s]
Epoch 0: 3%|▎ | 429/12384 [54:54<25:44:00, 7.75s/it, loss=2.9865, acc=0.0453, iter_time=10.01s]
Epoch 0: 3%|▎ | 430/12384 [54:54<25:38:28, 7.72s/it, loss=2.9865, acc=0.0453, iter_time=10.01s]
Epoch 0: 3%|▎ | 430/12384 [55:01<25:38:28, 7.72s/it, loss=3.1372, acc=0.0429, iter_time=7.65s]
Epoch 0: 3%|▎ | 431/12384 [55:01<25:37:07, 7.72s/it, loss=3.1372, acc=0.0429, iter_time=7.65s]
Epoch 0: 3%|▎ | 431/12384 [55:09<25:37:07, 7.72s/it, loss=3.2819, acc=0.0415, iter_time=8.11s]
Epoch 0: 3%|▎ | 432/12384 [55:09<25:33:47, 7.70s/it, loss=3.2819, acc=0.0415, iter_time=8.11s]
Epoch 0: 3%|▎ | 432/12384 [55:17<25:33:47, 7.70s/it, loss=3.0646, acc=0.0505, iter_time=7.26s]
Epoch 0: 3%|▎ | 433/12384 [55:17<25:31:41, 7.69s/it, loss=3.0646, acc=0.0505, iter_time=7.26s]
Epoch 0: 3%|▎ | 433/12384 [55:24<25:31:41, 7.69s/it, loss=3.4927, acc=0.0437, iter_time=7.74s]
Epoch 0: 4%|▎ | 434/12384 [55:24<25:29:55, 7.68s/it, loss=3.4927, acc=0.0437, iter_time=7.74s]
Epoch 0: 4%|▎ | 434/12384 [55:32<25:29:55, 7.68s/it, loss=3.1577, acc=0.0383, iter_time=7.62s]
Epoch 0: 4%|▎ | 435/12384 [55:32<25:28:53, 7.68s/it, loss=3.1577, acc=0.0383, iter_time=7.62s]
Epoch 0: 4%|▎ | 435/12384 [55:40<25:28:53, 7.68s/it, loss=2.9042, acc=0.0446, iter_time=7.64s]
Epoch 0: 4%|▎ | 436/12384 [55:40<25:23:48, 7.65s/it, loss=2.9042, acc=0.0446, iter_time=7.64s]
Epoch 0: 4%|▎ | 436/12384 [55:47<25:23:48, 7.65s/it, loss=2.8476, acc=0.0494, iter_time=7.62s]
Epoch 0: 4%|▎ | 437/12384 [55:47<25:24:27, 7.66s/it, loss=2.8476, acc=0.0494, iter_time=7.62s]
Epoch 0: 4%|▎ | 437/12384 [55:55<25:24:27, 7.66s/it, loss=2.5513, acc=0.0720, iter_time=4.37s]
Epoch 0: 4%|▎ | 438/12384 [55:55<25:24:39, 7.66s/it, loss=2.5513, acc=0.0720, iter_time=4.37s]
Epoch 0: 4%|▎ | 438/12384 [56:03<25:24:39, 7.66s/it, loss=3.1866, acc=0.0466, iter_time=10.93s]
Epoch 0: 4%|▎ | 439/12384 [56:03<25:22:33, 7.65s/it, loss=3.1866, acc=0.0466, iter_time=10.93s]
Epoch 0: 4%|▎ | 439/12384 [56:10<25:22:33, 7.65s/it, loss=3.7266, acc=0.0348, iter_time=8.02s]
Epoch 0: 4%|▎ | 440/12384 [56:10<25:21:13, 7.64s/it, loss=3.7266, acc=0.0348, iter_time=8.02s]
Epoch 0: 4%|▎ | 440/12384 [56:18<25:21:13, 7.64s/it, loss=2.6208, acc=0.0580, iter_time=4.90s]
Epoch 0: 4%|▎ | 441/12384 [56:18<25:19:17, 7.63s/it, loss=2.6208, acc=0.0580, iter_time=4.90s]
Epoch 0: 4%|▎ | 441/12384 [56:25<25:19:17, 7.63s/it, loss=2.8994, acc=0.0426, iter_time=9.96s]
Epoch 0: 4%|▎ | 442/12384 [56:25<25:18:06, 7.63s/it, loss=2.8994, acc=0.0426, iter_time=9.96s]
Epoch 0: 4%|▎ | 442/12384 [56:33<25:18:06, 7.63s/it, loss=2.9250, acc=0.0597, iter_time=5.03s]
Epoch 0: 4%|▎ | 443/12384 [56:33<25:19:24, 7.63s/it, loss=2.9250, acc=0.0597, iter_time=5.03s]
Epoch 0: 4%|▎ | 443/12384 [56:41<25:19:24, 7.63s/it, loss=3.0754, acc=0.0495, iter_time=9.93s]
Epoch 0: 4%|▎ | 444/12384 [56:41<25:18:40, 7.63s/it, loss=3.0754, acc=0.0495, iter_time=9.93s]
Epoch 0: 4%|▎ | 444/12384 [56:48<25:18:40, 7.63s/it, loss=2.9707, acc=0.0498, iter_time=7.93s]
Epoch 0: 4%|▎ | 445/12384 [56:48<25:17:50, 7.63s/it, loss=2.9707, acc=0.0498, iter_time=7.93s]
Epoch 0: 4%|▎ | 445/12384 [56:56<25:17:50, 7.63s/it, loss=2.7525, acc=0.0550, iter_time=7.62s]
Epoch 0: 4%|▎ | 446/12384 [56:56<25:16:04, 7.62s/it, loss=2.7525, acc=0.0550, iter_time=7.62s]
Epoch 0: 4%|▎ | 446/12384 [57:04<25:16:04, 7.62s/it, loss=3.1286, acc=0.0480, iter_time=7.60s]
Epoch 0: 4%|▎ | 447/12384 [57:04<25:14:50, 7.61s/it, loss=3.1286, acc=0.0480, iter_time=7.60s]
Epoch 0: 4%|▎ | 447/12384 [57:11<25:14:50, 7.61s/it, loss=2.8419, acc=0.0528, iter_time=7.54s]
Epoch 0: 4%|▎ | 448/12384 [57:11<25:14:05, 7.61s/it, loss=2.8419, acc=0.0528, iter_time=7.54s]
Epoch 0: 4%|▎ | 448/12384 [57:19<25:14:05, 7.61s/it, loss=2.3611, acc=0.0641, iter_time=7.65s]
Epoch 0: 4%|▎ | 449/12384 [57:19<25:15:34, 7.62s/it, loss=2.3611, acc=0.0641, iter_time=7.65s]
Epoch 0: 4%|▎ | 449/12384 [57:26<25:15:34, 7.62s/it, loss=2.8634, acc=0.0636, iter_time=8.04s]
Epoch 0: 4%|▎ | 450/12384 [57:26<25:14:47, 7.62s/it, loss=2.8634, acc=0.0636, iter_time=8.04s]
Epoch 0: 4%|▎ | 450/12384 [57:34<25:14:47, 7.62s/it, loss=2.6805, acc=0.0543, iter_time=7.21s]
Epoch 0: 4%|▎ | 451/12384 [57:34<25:16:42, 7.63s/it, loss=2.6805, acc=0.0543, iter_time=7.21s]
Epoch 0: 4%|▎ | 451/12384 [57:42<25:16:42, 7.63s/it, loss=2.7589, acc=0.0638, iter_time=7.65s]
Epoch 0: 4%|▎ | 452/12384 [57:42<25:18:12, 7.63s/it, loss=2.7589, acc=0.0638, iter_time=7.65s]
Epoch 0: 4%|▎ | 452/12384 [57:49<25:18:12, 7.63s/it, loss=2.5675, acc=0.0499, iter_time=7.38s]
Epoch 0: 4%|▎ | 453/12384 [57:49<25:19:49, 7.64s/it, loss=2.5675, acc=0.0499, iter_time=7.38s]
Epoch 0: 4%|▎ | 453/12384 [57:57<25:19:49, 7.64s/it, loss=2.9277, acc=0.0398, iter_time=7.96s]
Epoch 0: 4%|▎ | 454/12384 [57:57<25:18:56, 7.64s/it, loss=2.9277, acc=0.0398, iter_time=7.96s]
Epoch 0: 4%|▎ | 454/12384 [58:05<25:18:56, 7.64s/it, loss=2.5893, acc=0.0614, iter_time=7.62s]
Epoch 0: 4%|▎ | 455/12384 [58:05<25:18:51, 7.64s/it, loss=2.5893, acc=0.0614, iter_time=7.62s]
Epoch 0: 4%|▎ | 455/12384 [58:13<25:18:51, 7.64s/it, loss=2.7613, acc=0.0720, iter_time=8.34s]
Epoch 0: 4%|▎ | 456/12384 [58:13<25:39:03, 7.74s/it, loss=2.7613, acc=0.0720, iter_time=8.34s]
Epoch 0: 4%|▎ | 456/12384 [58:20<25:39:03, 7.74s/it, loss=2.6479, acc=0.0560, iter_time=7.30s]
Epoch 0: 4%|▎ | 457/12384 [58:20<25:32:43, 7.71s/it, loss=2.6479, acc=0.0560, iter_time=7.30s]
Epoch 0: 4%|▎ | 457/12384 [58:28<25:32:43, 7.71s/it, loss=2.1886, acc=0.0814, iter_time=5.28s]
Epoch 0: 4%|▎ | 458/12384 [58:28<25:32:53, 7.71s/it, loss=2.1886, acc=0.0814, iter_time=5.28s]
Epoch 0: 4%|▎ | 458/12384 [58:36<25:32:53, 7.71s/it, loss=2.3791, acc=0.0607, iter_time=10.05s]
Epoch 0: 4%|▎ | 459/12384 [58:36<25:28:02, 7.69s/it, loss=2.3791, acc=0.0607, iter_time=10.05s]
Epoch 0: 4%|▎ | 459/12384 [58:43<25:28:02, 7.69s/it, loss=2.1744, acc=0.0658, iter_time=7.66s]
Epoch 0: 4%|▎ | 460/12384 [58:43<25:24:42, 7.67s/it, loss=2.1744, acc=0.0658, iter_time=7.66s]
Epoch 0: 4%|▎ | 460/12384 [58:51<25:24:42, 7.67s/it, loss=2.9240, acc=0.0432, iter_time=7.63s]
Epoch 0: 4%|▎ | 461/12384 [58:51<25:21:46, 7.66s/it, loss=2.9240, acc=0.0432, iter_time=7.63s]
Epoch 0: 4%|▎ | 461/12384 [58:58<25:21:46, 7.66s/it, loss=2.4064, acc=0.0642, iter_time=7.63s]
Epoch 0: 4%|▎ | 462/12384 [58:58<25:21:49, 7.66s/it, loss=2.4064, acc=0.0642, iter_time=7.63s]
Epoch 0: 4%|▎ | 462/12384 [59:06<25:21:49, 7.66s/it, loss=2.2047, acc=0.0689, iter_time=5.08s]
Epoch 0: 4%|▎ | 463/12384 [59:06<25:19:56, 7.65s/it, loss=2.2047, acc=0.0689, iter_time=5.08s]
Epoch 0: 4%|▎ | 463/12384 [59:14<25:19:56, 7.65s/it, loss=2.6974, acc=0.0564, iter_time=10.58s]
Epoch 0: 4%|▎ | 464/12384 [59:14<25:23:11, 7.67s/it, loss=2.6974, acc=0.0564, iter_time=10.58s]
Epoch 0: 4%|▎ | 464/12384 [59:21<25:23:11, 7.67s/it, loss=2.0215, acc=0.0805, iter_time=4.25s]
Epoch 0: 4%|▍ | 465/12384 [59:21<25:21:02, 7.66s/it, loss=2.0215, acc=0.0805, iter_time=4.25s]
Epoch 0: 4%|▍ | 465/12384 [59:29<25:21:02, 7.66s/it, loss=2.1350, acc=0.0804, iter_time=8.90s]
Epoch 0: 4%|▍ | 466/12384 [59:29<25:20:03, 7.65s/it, loss=2.1350, acc=0.0804, iter_time=8.90s]
Epoch 0: 4%|▍ | 466/12384 [59:37<25:20:03, 7.65s/it, loss=1.8644, acc=0.0877, iter_time=7.17s]
Epoch 0: 4%|▍ | 467/12384 [59:37<25:19:16, 7.65s/it, loss=1.8644, acc=0.0877, iter_time=7.17s]
Epoch 0: 4%|▍ | 467/12384 [59:44<25:19:16, 7.65s/it, loss=2.3691, acc=0.0603, iter_time=9.93s]
Epoch 0: 4%|▍ | 468/12384 [59:44<25:17:20, 7.64s/it, loss=2.3691, acc=0.0603, iter_time=9.93s]
Epoch 0: 4%|▍ | 468/12384 [59:52<25:17:20, 7.64s/it, loss=2.5097, acc=0.0765, iter_time=7.62s]
Epoch 0: 4%|▍ | 469/12384 [59:52<25:16:52, 7.64s/it, loss=2.5097, acc=0.0765, iter_time=7.62s]
Epoch 0: 4%|▍ | 469/12384 [1:00:00<25:16:52, 7.64s/it, loss=2.3412, acc=0.0614, iter_time=7.64s]
Epoch 0: 4%|▍ | 470/12384 [1:00:00<25:17:42, 7.64s/it, loss=2.3412, acc=0.0614, iter_time=7.64s]
Epoch 0: 4%|▍ | 470/12384 [1:00:07<25:17:42, 7.64s/it, loss=2.4188, acc=0.0616, iter_time=7.63s]
Epoch 0: 4%|▍ | 471/12384 [1:00:07<25:17:57, 7.65s/it, loss=2.4188, acc=0.0616, iter_time=7.63s]
Epoch 0: 4%|▍ | 471/12384 [1:00:15<25:17:57, 7.65s/it, loss=2.3378, acc=0.0728, iter_time=7.60s]
Epoch 0: 4%|▍ | 472/12384 [1:00:15<25:16:22, 7.64s/it, loss=2.3378, acc=0.0728, iter_time=7.60s]
Epoch 0: 4%|▍ | 472/12384 [1:00:23<25:16:22, 7.64s/it, loss=2.0764, acc=0.0804, iter_time=7.69s]
Epoch 0: 4%|▍ | 473/12384 [1:00:23<25:15:48, 7.64s/it, loss=2.0764, acc=0.0804, iter_time=7.69s]
Epoch 0: 4%|▍ | 473/12384 [1:00:30<25:15:48, 7.64s/it, loss=1.9360, acc=0.0943, iter_time=6.75s]
Epoch 0: 4%|▍ | 474/12384 [1:00:30<25:17:34, 7.65s/it, loss=1.9360, acc=0.0943, iter_time=6.75s]
Epoch 0: 4%|▍ | 474/12384 [1:00:38<25:17:34, 7.65s/it, loss=1.9062, acc=0.0851, iter_time=7.92s]
Epoch 0: 4%|▍ | 475/12384 [1:00:38<25:15:16, 7.63s/it, loss=1.9062, acc=0.0851, iter_time=7.92s]
Epoch 0: 4%|▍ | 475/12384 [1:00:45<25:15:16, 7.63s/it, loss=2.1786, acc=0.0661, iter_time=8.23s]
Epoch 0: 4%|▍ | 476/12384 [1:00:45<25:16:11, 7.64s/it, loss=2.1786, acc=0.0661, iter_time=8.23s]
Epoch 0: 4%|▍ | 476/12384 [1:00:53<25:16:11, 7.64s/it, loss=2.6808, acc=0.0632, iter_time=5.05s]
Epoch 0: 4%|▍ | 477/12384 [1:00:53<25:20:18, 7.66s/it, loss=2.6808, acc=0.0632, iter_time=5.05s]
Epoch 0: 4%|▍ | 477/12384 [1:01:01<25:20:18, 7.66s/it, loss=2.1899, acc=0.0762, iter_time=10.31s]
Epoch 0: 4%|▍ | 478/12384 [1:01:01<25:21:22, 7.67s/it, loss=2.1899, acc=0.0762, iter_time=10.31s]
Epoch 0: 4%|▍ | 478/12384 [1:01:08<25:21:22, 7.67s/it, loss=2.0382, acc=0.0792, iter_time=7.67s]
Epoch 0: 4%|▍ | 479/12384 [1:01:08<25:17:54, 7.65s/it, loss=2.0382, acc=0.0792, iter_time=7.67s]
Epoch 0: 4%|▍ | 479/12384 [1:01:16<25:17:54, 7.65s/it, loss=2.1239, acc=0.0640, iter_time=8.01s]
Epoch 0: 4%|▍ | 480/12384 [1:01:16<25:17:39, 7.65s/it, loss=2.1239, acc=0.0640, iter_time=8.01s]
Epoch 0: 4%|▍ | 480/12384 [1:01:24<25:17:39, 7.65s/it, loss=1.8730, acc=0.0906, iter_time=5.69s]
Epoch 0: 4%|▍ | 481/12384 [1:01:24<25:16:10, 7.64s/it, loss=1.8730, acc=0.0906, iter_time=5.69s]
Epoch 0: 4%|▍ | 481/12384 [1:01:32<25:16:10, 7.64s/it, loss=1.7140, acc=0.1096, iter_time=6.45s]
Epoch 0: 4%|▍ | 482/12384 [1:01:32<25:38:55, 7.76s/it, loss=1.7140, acc=0.1096, iter_time=6.45s]
Epoch 0: 4%|▍ | 482/12384 [1:01:39<25:38:55, 7.76s/it, loss=1.8818, acc=0.1072, iter_time=7.94s]
Epoch 0: 4%|▍ | 483/12384 [1:01:39<25:33:20, 7.73s/it, loss=1.8818, acc=0.1072, iter_time=7.94s]
Epoch 0: 4%|▍ | 483/12384 [1:01:47<25:33:20, 7.73s/it, loss=1.8504, acc=0.0905, iter_time=9.27s]
Epoch 0: 4%|▍ | 484/12384 [1:01:47<25:29:08, 7.71s/it, loss=1.8504, acc=0.0905, iter_time=9.27s]
Epoch 0: 4%|▍ | 484/12384 [1:01:55<25:29:08, 7.71s/it, loss=2.3645, acc=0.0783, iter_time=8.87s]
Epoch 0: 4%|▍ | 485/12384 [1:01:55<25:24:33, 7.69s/it, loss=2.3645, acc=0.0783, iter_time=8.87s]
Epoch 0: 4%|▍ | 485/12384 [1:02:02<25:24:33, 7.69s/it, loss=2.0253, acc=0.0711, iter_time=7.64s]
Epoch 0: 4%|▍ | 486/12384 [1:02:02<25:21:34, 7.67s/it, loss=2.0253, acc=0.0711, iter_time=7.64s]
Epoch 0: 4%|▍ | 486/12384 [1:02:10<25:21:34, 7.67s/it, loss=1.8402, acc=0.0922, iter_time=7.62s]
Epoch 0: 4%|▍ | 487/12384 [1:02:10<25:18:25, 7.66s/it, loss=1.8402, acc=0.0922, iter_time=7.62s]
Epoch 0: 4%|▍ | 487/12384 [1:02:18<25:18:25, 7.66s/it, loss=2.3611, acc=0.0677, iter_time=8.05s]
Epoch 0: 4%|▍ | 488/12384 [1:02:18<25:17:37, 7.65s/it, loss=2.3611, acc=0.0677, iter_time=8.05s]
Epoch 0: 4%|▍ | 488/12384 [1:02:25<25:17:37, 7.65s/it, loss=1.8946, acc=0.1047, iter_time=7.23s]
Epoch 0: 4%|▍ | 489/12384 [1:02:25<25:15:22, 7.64s/it, loss=1.8946, acc=0.1047, iter_time=7.23s]
Epoch 0: 4%|▍ | 489/12384 [1:02:33<25:15:22, 7.64s/it, loss=1.8590, acc=0.0874, iter_time=7.63s]
Epoch 0: 4%|▍ | 490/12384 [1:02:33<25:15:18, 7.64s/it, loss=1.8590, acc=0.0874, iter_time=7.63s]
Epoch 0: 4%|▍ | 490/12384 [1:02:41<25:15:18, 7.64s/it, loss=1.9773, acc=0.1019, iter_time=7.66s]
Epoch 0: 4%|▍ | 491/12384 [1:02:41<25:16:13, 7.65s/it, loss=1.9773, acc=0.1019, iter_time=7.66s]
Epoch 0: 4%|▍ | 491/12384 [1:02:48<25:16:13, 7.65s/it, loss=1.5691, acc=0.1026, iter_time=7.74s]
Epoch 0: 4%|▍ | 492/12384 [1:02:48<25:19:21, 7.67s/it, loss=1.5691, acc=0.1026, iter_time=7.74s]
Epoch 0: 4%|▍ | 492/12384 [1:02:56<25:19:21, 7.67s/it, loss=1.7926, acc=0.0978, iter_time=7.63s]
Epoch 0: 4%|▍ | 493/12384 [1:02:56<25:16:38, 7.65s/it, loss=1.7926, acc=0.0978, iter_time=7.63s]
Epoch 0: 4%|▍ | 493/12384 [1:03:04<25:16:38, 7.65s/it, loss=2.1797, acc=0.0721, iter_time=7.62s]
Epoch 0: 4%|▍ | 494/12384 [1:03:04<25:17:48, 7.66s/it, loss=2.1797, acc=0.0721, iter_time=7.62s]
Epoch 0: 4%|▍ | 494/12384 [1:03:11<25:17:48, 7.66s/it, loss=2.0808, acc=0.0790, iter_time=7.67s]
Epoch 0: 4%|▍ | 495/12384 [1:03:11<25:17:14, 7.66s/it, loss=2.0808, acc=0.0790, iter_time=7.67s]
Epoch 0: 4%|▍ | 495/12384 [1:03:19<25:17:14, 7.66s/it, loss=2.2031, acc=0.0782, iter_time=8.10s]
Epoch 0: 4%|▍ | 496/12384 [1:03:19<25:18:08, 7.66s/it, loss=2.2031, acc=0.0782, iter_time=8.10s]
Epoch 0: 4%|▍ | 496/12384 [1:03:27<25:18:08, 7.66s/it, loss=1.7503, acc=0.1270, iter_time=6.93s]
Epoch 0: 4%|▍ | 497/12384 [1:03:27<25:17:23, 7.66s/it, loss=1.7503, acc=0.1270, iter_time=6.93s]
Epoch 0: 4%|▍ | 497/12384 [1:03:34<25:17:23, 7.66s/it, loss=1.7370, acc=0.0869, iter_time=7.92s]
Epoch 0: 4%|▍ | 498/12384 [1:03:34<25:15:02, 7.65s/it, loss=1.7370, acc=0.0869, iter_time=7.92s]
Epoch 0: 4%|▍ | 498/12384 [1:03:42<25:15:02, 7.65s/it, loss=2.2853, acc=0.0846, iter_time=7.66s]
Epoch 0: 4%|▍ | 499/12384 [1:03:42<25:13:21, 7.64s/it, loss=2.2853, acc=0.0846, iter_time=7.66s]
Epoch 0: 4%|▍ | 499/12384 [1:03:49<25:13:21, 7.64s/it, loss=1.5637, acc=0.0990, iter_time=8.00s]
Epoch 0: 4%|▍ | 500/12384 [1:03:50<25:25:18, 7.70s/it, loss=1.5637, acc=0.0990, iter_time=8.00s]
Epoch 0: 4%|▍ | 500/12384 [1:03:57<25:25:18, 7.70s/it, loss=1.9870, acc=0.0964, iter_time=7.46s]
Epoch 0: 4%|▍ | 501/12384 [1:03:57<25:20:35, 7.68s/it, loss=1.9870, acc=0.0964, iter_time=7.46s]
Epoch 0: 4%|▍ | 501/12384 [1:04:05<25:20:35, 7.68s/it, loss=1.5320, acc=0.1148, iter_time=6.78s]
Epoch 0: 4%|▍ | 502/12384 [1:04:05<25:19:51, 7.67s/it, loss=1.5320, acc=0.1148, iter_time=6.78s]
Epoch 0: 4%|▍ | 502/12384 [1:04:13<25:19:51, 7.67s/it, loss=1.6261, acc=0.0951, iter_time=7.55s]
Epoch 0: 4%|▍ | 503/12384 [1:04:13<25:17:47, 7.66s/it, loss=1.6261, acc=0.0951, iter_time=7.55s]
Epoch 0: 4%|▍ | 503/12384 [1:04:20<25:17:47, 7.66s/it, loss=1.4938, acc=0.1099, iter_time=8.54s]
Epoch 0: 4%|▍ | 504/12384 [1:04:20<25:14:29, 7.65s/it, loss=1.4938, acc=0.1099, iter_time=8.54s]
Epoch 0: 4%|▍ | 504/12384 [1:04:28<25:14:29, 7.65s/it, loss=1.7771, acc=0.1023, iter_time=7.67s]
Epoch 0: 4%|▍ | 505/12384 [1:04:28<25:12:02, 7.64s/it, loss=1.7771, acc=0.1023, iter_time=7.67s]
Epoch 0: 4%|▍ | 505/12384 [1:04:35<25:12:02, 7.64s/it, loss=1.6810, acc=0.1148, iter_time=7.60s]
Epoch 0: 4%|▍ | 506/12384 [1:04:35<25:10:43, 7.63s/it, loss=1.6810, acc=0.1148, iter_time=7.60s]
Epoch 0: 4%|▍ | 506/12384 [1:04:43<25:10:43, 7.63s/it, loss=1.5150, acc=0.1185, iter_time=7.63s]
Epoch 0: 4%|▍ | 507/12384 [1:04:43<25:12:23, 7.64s/it, loss=1.5150, acc=0.1185, iter_time=7.63s]
Epoch 0: 4%|▍ | 507/12384 [1:04:51<25:12:23, 7.64s/it, loss=1.5239, acc=0.1060, iter_time=7.66s]
Epoch 0: 4%|▍ | 508/12384 [1:04:51<25:10:50, 7.63s/it, loss=1.5239, acc=0.1060, iter_time=7.66s]
Epoch 0: 4%|▍ | 508/12384 [1:04:59<25:10:50, 7.63s/it, loss=1.5047, acc=0.1262, iter_time=7.95s]
Epoch 0: 4%|▍ | 509/12384 [1:04:59<25:30:52, 7.73s/it, loss=1.5047, acc=0.1262, iter_time=7.95s]
Epoch 0: 4%|▍ | 509/12384 [1:05:06<25:30:52, 7.73s/it, loss=1.8039, acc=0.1183, iter_time=7.66s]
Epoch 0: 4%|▍ | 510/12384 [1:05:06<25:24:40, 7.70s/it, loss=1.8039, acc=0.1183, iter_time=7.66s]
Epoch 0: 4%|▍ | 510/12384 [1:05:14<25:24:40, 7.70s/it, loss=1.6836, acc=0.1040, iter_time=7.60s]
Epoch 0: 4%|▍ | 511/12384 [1:05:14<25:18:24, 7.67s/it, loss=1.6836, acc=0.1040, iter_time=7.60s]
Epoch 0: 4%|▍ | 511/12384 [1:05:22<25:18:24, 7.67s/it, loss=1.4030, acc=0.1384, iter_time=7.70s]
Epoch 0: 4%|▍ | 512/12384 [1:05:22<25:20:09, 7.68s/it, loss=1.4030, acc=0.1384, iter_time=7.70s]
Epoch 0: 4%|▍ | 512/12384 [1:05:29<25:20:09, 7.68s/it, loss=1.4032, acc=0.1294, iter_time=7.60s]
Epoch 0: 4%|▍ | 513/12384 [1:05:29<25:16:35, 7.67s/it, loss=1.4032, acc=0.1294, iter_time=7.60s]
Epoch 0: 4%|▍ | 513/12384 [1:05:37<25:16:35, 7.67s/it, loss=1.3707, acc=0.1583, iter_time=7.66s]
Epoch 0: 4%|▍ | 514/12384 [1:05:37<25:16:22, 7.66s/it, loss=1.3707, acc=0.1583, iter_time=7.66s]
Epoch 0: 4%|▍ | 514/12384 [1:05:45<25:16:22, 7.66s/it, loss=1.1802, acc=0.1476, iter_time=7.70s]
Epoch 0: 4%|▍ | 515/12384 [1:05:45<25:17:33, 7.67s/it, loss=1.1802, acc=0.1476, iter_time=7.70s]
Epoch 0: 4%|▍ | 515/12384 [1:05:52<25:17:33, 7.67s/it, loss=1.4299, acc=0.1386, iter_time=5.39s]
Epoch 0: 4%|▍ | 516/12384 [1:05:52<25:16:08, 7.67s/it, loss=1.4299, acc=0.1386, iter_time=5.39s]
Epoch 0: 4%|▍ | 516/12384 [1:06:00<25:16:08, 7.67s/it, loss=1.4811, acc=0.1189, iter_time=7.71s]
Epoch 0: 4%|▍ | 517/12384 [1:06:00<25:21:03, 7.69s/it, loss=1.4811, acc=0.1189, iter_time=7.71s]
Epoch 0: 4%|▍ | 517/12384 [1:06:08<25:21:03, 7.69s/it, loss=1.3481, acc=0.1673, iter_time=7.67s]
Epoch 0: 4%|▍ | 518/12384 [1:06:08<25:17:24, 7.67s/it, loss=1.3481, acc=0.1673, iter_time=7.67s]
Epoch 0: 4%|▍ | 518/12384 [1:06:15<25:17:24, 7.67s/it, loss=1.5646, acc=0.1122, iter_time=9.89s]
Epoch 0: 4%|▍ | 519/12384 [1:06:15<25:16:26, 7.67s/it, loss=1.5646, acc=0.1122, iter_time=9.89s]
Epoch 0: 4%|▍ | 519/12384 [1:06:23<25:16:26, 7.67s/it, loss=1.2987, acc=0.1386, iter_time=8.08s]
Epoch 0: 4%|▍ | 520/12384 [1:06:23<25:15:20, 7.66s/it, loss=1.2987, acc=0.1386, iter_time=8.08s]
Epoch 0: 4%|▍ | 520/12384 [1:06:31<25:15:20, 7.66s/it, loss=1.3657, acc=0.1161, iter_time=6.35s]
Epoch 0: 4%|▍ | 521/12384 [1:06:31<25:15:28, 7.66s/it, loss=1.3657, acc=0.1161, iter_time=6.35s]
Epoch 0: 4%|▍ | 521/12384 [1:06:38<25:15:28, 7.66s/it, loss=1.2062, acc=0.1535, iter_time=8.55s]
Epoch 0: 4%|▍ | 522/12384 [1:06:38<25:13:49, 7.66s/it, loss=1.2062, acc=0.1535, iter_time=8.55s]
Epoch 0: 4%|▍ | 522/12384 [1:06:46<25:13:49, 7.66s/it, loss=1.2758, acc=0.1454, iter_time=7.65s]
Epoch 0: 4%|▍ | 523/12384 [1:06:46<25:12:01, 7.65s/it, loss=1.2758, acc=0.1454, iter_time=7.65s]
Epoch 0: 4%|▍ | 523/12384 [1:06:53<25:12:01, 7.65s/it, loss=1.2117, acc=0.1257, iter_time=5.83s]
Epoch 0: 4%|▍ | 524/12384 [1:06:53<25:11:32, 7.65s/it, loss=1.2117, acc=0.1257, iter_time=5.83s]
Epoch 0: 4%|▍ | 524/12384 [1:07:01<25:11:32, 7.65s/it, loss=1.4545, acc=0.1447, iter_time=8.59s]
Epoch 0: 4%|▍ | 525/12384 [1:07:01<25:16:09, 7.67s/it, loss=1.4545, acc=0.1447, iter_time=8.59s]
Epoch 0: 4%|▍ | 525/12384 [1:07:09<25:16:09, 7.67s/it, loss=1.0486, acc=0.1929, iter_time=7.63s]
Epoch 0: 4%|▍ | 526/12384 [1:07:09<25:14:50, 7.66s/it, loss=1.0486, acc=0.1929, iter_time=7.63s]
Epoch 0: 4%|▍ | 526/12384 [1:07:16<25:14:50, 7.66s/it, loss=1.2718, acc=0.1351, iter_time=8.60s]
Epoch 0: 4%|▍ | 527/12384 [1:07:16<25:12:15, 7.65s/it, loss=1.2718, acc=0.1351, iter_time=8.60s]
Epoch 0: 4%|▍ | 527/12384 [1:07:24<25:12:15, 7.65s/it, loss=1.2497, acc=0.1386, iter_time=8.01s]
Epoch 0: 4%|▍ | 528/12384 [1:07:24<25:11:41, 7.65s/it, loss=1.2497, acc=0.1386, iter_time=8.01s]
Epoch 0: 4%|▍ | 528/12384 [1:07:32<25:11:41, 7.65s/it, loss=1.0450, acc=0.2315, iter_time=5.73s]
Epoch 0: 4%|▍ | 529/12384 [1:07:32<25:11:20, 7.65s/it, loss=1.0450, acc=0.2315, iter_time=5.73s]
Epoch 0: 4%|▍ | 529/12384 [1:07:39<25:11:20, 7.65s/it, loss=1.1168, acc=0.1592, iter_time=8.55s]
Epoch 0: 4%|▍ | 530/12384 [1:07:39<25:10:04, 7.64s/it, loss=1.1168, acc=0.1592, iter_time=8.55s]
Epoch 0: 4%|▍ | 530/12384 [1:07:47<25:10:04, 7.64s/it, loss=1.1135, acc=0.1942, iter_time=7.33s]
Epoch 0: 4%|▍ | 531/12384 [1:07:47<25:10:01, 7.64s/it, loss=1.1135, acc=0.1942, iter_time=7.33s]
Epoch 0: 4%|▍ | 531/12384 [1:07:55<25:10:01, 7.64s/it, loss=1.1992, acc=0.1433, iter_time=8.58s]
Epoch 0: 4%|▍ | 532/12384 [1:07:55<25:13:53, 7.66s/it, loss=1.1992, acc=0.1433, iter_time=8.58s]
Epoch 0: 4%|▍ | 532/12384 [1:08:02<25:13:53, 7.66s/it, loss=1.0983, acc=0.1781, iter_time=6.61s]
Epoch 0: 4%|▍ | 533/12384 [1:08:02<25:11:17, 7.65s/it, loss=1.0983, acc=0.1781, iter_time=6.61s]
Epoch 0: 4%|▍ | 533/12384 [1:08:10<25:11:17, 7.65s/it, loss=1.1803, acc=0.1655, iter_time=8.71s]
Epoch 0: 4%|▍ | 534/12384 [1:08:10<25:11:47, 7.65s/it, loss=1.1803, acc=0.1655, iter_time=8.71s]
Epoch 0: 4%|▍ | 534/12384 [1:08:18<25:11:47, 7.65s/it, loss=1.3010, acc=0.1560, iter_time=7.15s]
Epoch 0: 4%|▍ | 535/12384 [1:08:18<25:30:05, 7.75s/it, loss=1.3010, acc=0.1560, iter_time=7.15s]
Epoch 0: 4%|▍ | 535/12384 [1:08:26<25:30:05, 7.75s/it, loss=1.3130, acc=0.1668, iter_time=8.47s]
Epoch 0: 4%|▍ | 536/12384 [1:08:26<25:24:29, 7.72s/it, loss=1.3130, acc=0.1668, iter_time=8.47s]
Epoch 0: 4%|▍ | 536/12384 [1:08:33<25:24:29, 7.72s/it, loss=1.0739, acc=0.1849, iter_time=7.67s]
Epoch 0: 4%|▍ | 537/12384 [1:08:33<25:18:47, 7.69s/it, loss=1.0739, acc=0.1849, iter_time=7.67s]
Epoch 0: 4%|▍ | 537/12384 [1:08:41<25:18:47, 7.69s/it, loss=0.9642, acc=0.2393, iter_time=7.07s]
Epoch 0: 4%|▍ | 538/12384 [1:08:41<25:17:07, 7.68s/it, loss=0.9642, acc=0.2393, iter_time=7.07s]
Epoch 0: 4%|▍ | 538/12384 [1:08:49<25:17:07, 7.68s/it, loss=1.1014, acc=0.1750, iter_time=8.22s]
Epoch 0: 4%|▍ | 539/12384 [1:08:49<25:14:01, 7.67s/it, loss=1.1014, acc=0.1750, iter_time=8.22s]
Epoch 0: 4%|▍ | 539/12384 [1:08:56<25:14:01, 7.67s/it, loss=1.0269, acc=0.1964, iter_time=7.65s]
Epoch 0: 4%|▍ | 540/12384 [1:08:56<25:13:27, 7.67s/it, loss=1.0269, acc=0.1964, iter_time=7.65s]
Epoch 0: 4%|▍ | 540/12384 [1:09:04<25:13:27, 7.67s/it, loss=1.0619, acc=0.2396, iter_time=5.85s]
Epoch 0: 4%|▍ | 541/12384 [1:09:04<25:16:54, 7.69s/it, loss=1.0619, acc=0.2396, iter_time=5.85s]
Epoch 0: 4%|▍ | 541/12384 [1:09:12<25:16:54, 7.69s/it, loss=1.0353, acc=0.2250, iter_time=9.52s]
Epoch 0: 4%|▍ | 542/12384 [1:09:12<25:14:13, 7.67s/it, loss=1.0353, acc=0.2250, iter_time=9.52s]
Epoch 0: 4%|▍ | 542/12384 [1:09:19<25:14:13, 7.67s/it, loss=1.2098, acc=0.1728, iter_time=7.64s]
Epoch 0: 4%|▍ | 543/12384 [1:09:19<25:11:36, 7.66s/it, loss=1.2098, acc=0.1728, iter_time=7.64s]
Epoch 0: 4%|▍ | 543/12384 [1:09:27<25:11:36, 7.66s/it, loss=1.0547, acc=0.1759, iter_time=8.02s]
Epoch 0: 4%|▍ | 544/12384 [1:09:27<25:09:47, 7.65s/it, loss=1.0547, acc=0.1759, iter_time=8.02s]
Epoch 0: 4%|▍ | 544/12384 [1:09:35<25:09:47, 7.65s/it, loss=0.9190, acc=0.2185, iter_time=3.87s]
Epoch 0: 4%|▍ | 545/12384 [1:09:35<25:09:37, 7.65s/it, loss=0.9190, acc=0.2185, iter_time=3.87s]
Epoch 0: 4%|▍ | 545/12384 [1:09:42<25:09:37, 7.65s/it, loss=1.3871, acc=0.1515, iter_time=11.01s]
Epoch 0: 4%|▍ | 546/12384 [1:09:42<25:07:06, 7.64s/it, loss=1.3871, acc=0.1515, iter_time=11.01s]
Epoch 0: 4%|▍ | 546/12384 [1:09:50<25:07:06, 7.64s/it, loss=0.8361, acc=0.2270, iter_time=7.65s]
Epoch 0: 4%|▍ | 547/12384 [1:09:50<25:06:51, 7.64s/it, loss=0.8361, acc=0.2270, iter_time=7.65s]
Epoch 0: 4%|▍ | 547/12384 [1:09:57<25:06:51, 7.64s/it, loss=1.1352, acc=0.1755, iter_time=7.30s]
Epoch 0: 4%|▍ | 548/12384 [1:09:57<25:07:55, 7.64s/it, loss=1.1352, acc=0.1755, iter_time=7.30s]
Epoch 0: 4%|▍ | 548/12384 [1:10:05<25:07:55, 7.64s/it, loss=1.0154, acc=0.2016, iter_time=7.96s]
Epoch 0: 4%|▍ | 549/12384 [1:10:05<25:05:44, 7.63s/it, loss=1.0154, acc=0.2016, iter_time=7.96s]
Epoch 0: 4%|▍ | 549/12384 [1:10:13<25:05:44, 7.63s/it, loss=1.0715, acc=0.2152, iter_time=8.04s]
Epoch 0: 4%|▍ | 550/12384 [1:10:13<25:06:09, 7.64s/it, loss=1.0715, acc=0.2152, iter_time=8.04s]
Epoch 0: 4%|▍ | 550/12384 [1:10:20<25:06:09, 7.64s/it, loss=0.9247, acc=0.2230, iter_time=5.12s]
Epoch 0: 4%|▍ | 551/12384 [1:10:20<25:05:22, 7.63s/it, loss=0.9247, acc=0.2230, iter_time=5.12s]
Epoch 0: 4%|▍ | 551/12384 [1:10:28<25:05:22, 7.63s/it, loss=0.9215, acc=0.2149, iter_time=10.11s]
Epoch 0: 4%|▍ | 552/12384 [1:10:28<25:04:53, 7.63s/it, loss=0.9215, acc=0.2149, iter_time=10.11s]
Epoch 0: 4%|▍ | 552/12384 [1:10:36<25:04:53, 7.63s/it, loss=0.8211, acc=0.2492, iter_time=7.23s]
Epoch 0: 4%|▍ | 553/12384 [1:10:36<25:04:05, 7.63s/it, loss=0.8211, acc=0.2492, iter_time=7.23s]
Epoch 0: 4%|▍ | 553/12384 [1:10:43<25:04:05, 7.63s/it, loss=1.0839, acc=0.2324, iter_time=7.66s]
Epoch 0: 4%|▍ | 554/12384 [1:10:43<25:04:50, 7.63s/it, loss=1.0839, acc=0.2324, iter_time=7.66s]
Epoch 0: 4%|▍ | 554/12384 [1:10:51<25:04:50, 7.63s/it, loss=0.9729, acc=0.2124, iter_time=7.31s]
Epoch 0: 4%|▍ | 555/12384 [1:10:51<25:03:22, 7.63s/it, loss=0.9729, acc=0.2124, iter_time=7.31s]
Epoch 0: 4%|▍ | 555/12384 [1:10:58<25:03:22, 7.63s/it, loss=0.7429, acc=0.2806, iter_time=5.57s]
Epoch 0: 4%|▍ | 556/12384 [1:10:58<25:03:14, 7.63s/it, loss=0.7429, acc=0.2806, iter_time=5.57s]
Epoch 0: 4%|▍ | 556/12384 [1:11:06<25:03:14, 7.63s/it, loss=0.9001, acc=0.2481, iter_time=9.97s]
Epoch 0: 4%|▍ | 557/12384 [1:11:06<25:03:57, 7.63s/it, loss=0.9001, acc=0.2481, iter_time=9.97s]
Epoch 0: 4%|▍ | 557/12384 [1:11:14<25:03:57, 7.63s/it, loss=0.8742, acc=0.2299, iter_time=7.64s]
Epoch 0: 5%|▍ | 558/12384 [1:11:14<25:04:17, 7.63s/it, loss=0.8742, acc=0.2299, iter_time=7.64s]
Epoch 0: 5%|▍ | 558/12384 [1:11:21<25:04:17, 7.63s/it, loss=0.8940, acc=0.2662, iter_time=7.63s]
Epoch 0: 5%|▍ | 559/12384 [1:11:21<25:04:39, 7.63s/it, loss=0.8940, acc=0.2662, iter_time=7.63s]
Epoch 0: 5%|▍ | 559/12384 [1:11:29<25:04:39, 7.63s/it, loss=0.7924, acc=0.2755, iter_time=7.65s]
Epoch 0: 5%|▍ | 560/12384 [1:11:29<25:07:08, 7.65s/it, loss=0.7924, acc=0.2755, iter_time=7.65s]
Epoch 0: 5%|▍ | 560/12384 [1:11:37<25:07:08, 7.65s/it, loss=0.7921, acc=0.3057, iter_time=7.98s]
Epoch 0: 5%|▍ | 561/12384 [1:11:37<25:26:43, 7.75s/it, loss=0.7921, acc=0.3057, iter_time=7.98s]
Epoch 0: 5%|▍ | 561/12384 [1:11:45<25:26:43, 7.75s/it, loss=0.6653, acc=0.3116, iter_time=7.69s]
Epoch 0: 5%|▍ | 562/12384 [1:11:45<25:20:26, 7.72s/it, loss=0.6653, acc=0.3116, iter_time=7.69s]
Epoch 0: 5%|▍ | 562/12384 [1:11:52<25:20:26, 7.72s/it, loss=0.7885, acc=0.2770, iter_time=7.10s]
Epoch 0: 5%|▍ | 563/12384 [1:11:52<25:16:42, 7.70s/it, loss=0.7885, acc=0.2770, iter_time=7.10s]
Epoch 0: 5%|▍ | 563/12384 [1:12:00<25:16:42, 7.70s/it, loss=0.6566, acc=0.3586, iter_time=6.40s]
Epoch 0: 5%|▍ | 564/12384 [1:12:00<25:14:28, 7.69s/it, loss=0.6566, acc=0.3586, iter_time=6.40s]
Epoch 0: 5%|▍ | 564/12384 [1:12:08<25:14:28, 7.69s/it, loss=0.6048, acc=0.3385, iter_time=7.36s]
Epoch 0: 5%|▍ | 565/12384 [1:12:08<25:10:16, 7.67s/it, loss=0.6048, acc=0.3385, iter_time=7.36s]
Epoch 0: 5%|▍ | 565/12384 [1:12:15<25:10:16, 7.67s/it, loss=0.7702, acc=0.2858, iter_time=9.73s]
Epoch 0: 5%|▍ | 566/12384 [1:12:15<25:08:33, 7.66s/it, loss=0.7702, acc=0.2858, iter_time=9.73s]
Epoch 0: 5%|▍ | 566/12384 [1:12:23<25:08:33, 7.66s/it, loss=0.6689, acc=0.3683, iter_time=3.88s]
Epoch 0: 5%|▍ | 567/12384 [1:12:23<25:07:46, 7.66s/it, loss=0.6689, acc=0.3683, iter_time=3.88s]
Epoch 0: 5%|▍ | 567/12384 [1:12:31<25:07:46, 7.66s/it, loss=0.8656, acc=0.2532, iter_time=11.79s]
Epoch 0: 5%|▍ | 568/12384 [1:12:31<25:07:39, 7.66s/it, loss=0.8656, acc=0.2532, iter_time=11.79s]
Epoch 0: 5%|▍ | 568/12384 [1:12:38<25:07:39, 7.66s/it, loss=0.5556, acc=0.4360, iter_time=5.19s]
Epoch 0: 5%|▍ | 569/12384 [1:12:38<25:10:33, 7.67s/it, loss=0.5556, acc=0.4360, iter_time=5.19s]
Epoch 0: 5%|▍ | 569/12384 [1:12:46<25:10:33, 7.67s/it, loss=0.6650, acc=0.3469, iter_time=9.78s]
Epoch 0: 5%|▍ | 570/12384 [1:12:46<25:06:09, 7.65s/it, loss=0.6650, acc=0.3469, iter_time=9.78s]
Epoch 0: 5%|▍ | 570/12384 [1:12:53<25:06:09, 7.65s/it, loss=0.6787, acc=0.3174, iter_time=7.60s]
Epoch 0: 5%|▍ | 571/12384 [1:12:53<25:02:46, 7.63s/it, loss=0.6787, acc=0.3174, iter_time=7.60s]
Epoch 0: 5%|▍ | 571/12384 [1:13:01<25:02:46, 7.63s/it, loss=0.6823, acc=0.3189, iter_time=6.18s]
Epoch 0: 5%|▍ | 572/12384 [1:13:01<25:02:20, 7.63s/it, loss=0.6823, acc=0.3189, iter_time=6.18s]
Epoch 0: 5%|▍ | 572/12384 [1:13:09<25:02:20, 7.63s/it, loss=0.6189, acc=0.3393, iter_time=9.04s]
Epoch 0: 5%|▍ | 573/12384 [1:13:09<25:00:04, 7.62s/it, loss=0.6189, acc=0.3393, iter_time=9.04s]
Epoch 0: 5%|▍ | 573/12384 [1:13:16<25:00:04, 7.62s/it, loss=0.6919, acc=0.3102, iter_time=7.62s]
Epoch 0: 5%|▍ | 574/12384 [1:13:16<25:01:22, 7.63s/it, loss=0.6919, acc=0.3102, iter_time=7.62s]
Epoch 0: 5%|▍ | 574/12384 [1:13:24<25:01:22, 7.63s/it, loss=0.6962, acc=0.2823, iter_time=7.64s]
Epoch 0: 5%|▍ | 575/12384 [1:13:24<25:01:18, 7.63s/it, loss=0.6962, acc=0.2823, iter_time=7.64s]
Epoch 0: 5%|▍ | 575/12384 [1:13:32<25:01:18, 7.63s/it, loss=0.7182, acc=0.2974, iter_time=8.01s]
Epoch 0: 5%|▍ | 576/12384 [1:13:32<24:59:54, 7.62s/it, loss=0.7182, acc=0.2974, iter_time=8.01s]
Epoch 0: 5%|▍ | 576/12384 [1:13:39<24:59:54, 7.62s/it, loss=0.7195, acc=0.3184, iter_time=6.00s]
Epoch 0: 5%|▍ | 577/12384 [1:13:39<25:01:44, 7.63s/it, loss=0.7195, acc=0.3184, iter_time=6.00s]
Epoch 0: 5%|▍ | 577/12384 [1:13:47<25:01:44, 7.63s/it, loss=0.5484, acc=0.3960, iter_time=5.53s]
Epoch 0: 5%|▍ | 578/12384 [1:13:47<25:00:46, 7.63s/it, loss=0.5484, acc=0.3960, iter_time=5.53s]
Epoch 0: 5%|▍ | 578/12384 [1:13:55<25:00:46, 7.63s/it, loss=0.5956, acc=0.4156, iter_time=8.19s]
Epoch 0: 5%|▍ | 579/12384 [1:13:55<25:04:22, 7.65s/it, loss=0.5956, acc=0.4156, iter_time=8.19s]
Epoch 0: 5%|▍ | 579/12384 [1:14:02<25:04:22, 7.65s/it, loss=0.5682, acc=0.3444, iter_time=10.49s]
Epoch 0: 5%|▍ | 580/12384 [1:14:02<25:02:46, 7.64s/it, loss=0.5682, acc=0.3444, iter_time=10.49s]
Epoch 0: 5%|▍ | 580/12384 [1:14:10<25:02:46, 7.64s/it, loss=0.5496, acc=0.4052, iter_time=7.59s]
Epoch 0: 5%|▍ | 581/12384 [1:14:10<25:00:41, 7.63s/it, loss=0.5496, acc=0.4052, iter_time=7.59s]
Epoch 0: 5%|▍ | 581/12384 [1:14:17<25:00:41, 7.63s/it, loss=0.6160, acc=0.3355, iter_time=7.62s]
Epoch 0: 5%|▍ | 582/12384 [1:14:17<25:02:43, 7.64s/it, loss=0.6160, acc=0.3355, iter_time=7.62s]
Epoch 0: 5%|▍ | 582/12384 [1:14:25<25:02:43, 7.64s/it, loss=0.7119, acc=0.3244, iter_time=7.65s]
Epoch 0: 5%|▍ | 583/12384 [1:14:25<25:02:10, 7.64s/it, loss=0.7119, acc=0.3244, iter_time=7.65s]
Epoch 0: 5%|▍ | 583/12384 [1:14:33<25:02:10, 7.64s/it, loss=0.6709, acc=0.3242, iter_time=8.04s]
Epoch 0: 5%|▍ | 584/12384 [1:14:33<25:02:46, 7.64s/it, loss=0.6709, acc=0.3242, iter_time=8.04s]
Epoch 0: 5%|▍ | 584/12384 [1:14:40<25:02:46, 7.64s/it, loss=0.6783, acc=0.3475, iter_time=6.95s]
Epoch 0: 5%|▍ | 585/12384 [1:14:40<25:03:34, 7.65s/it, loss=0.6783, acc=0.3475, iter_time=6.95s]
Epoch 0: 5%|▍ | 585/12384 [1:14:48<25:03:34, 7.65s/it, loss=0.5960, acc=0.4014, iter_time=7.95s]
Epoch 0: 5%|▍ | 586/12384 [1:14:48<25:00:06, 7.63s/it, loss=0.5960, acc=0.4014, iter_time=7.95s]
Epoch 0: 5%|▍ | 586/12384 [1:14:56<25:00:06, 7.63s/it, loss=0.3958, acc=0.5014, iter_time=5.40s]
Epoch 0: 5%|▍ | 587/12384 [1:14:56<25:19:14, 7.73s/it, loss=0.3958, acc=0.5014, iter_time=5.40s]
Epoch 0: 5%|▍ | 587/12384 [1:15:04<25:19:14, 7.73s/it, loss=0.5950, acc=0.3516, iter_time=10.16s]
Epoch 0: 5%|▍ | 588/12384 [1:15:04<25:13:55, 7.70s/it, loss=0.5950, acc=0.3516, iter_time=10.16s]
Epoch 0: 5%|▍ | 588/12384 [1:15:11<25:13:55, 7.70s/it, loss=0.4965, acc=0.4395, iter_time=7.63s]
Epoch 0: 5%|▍ | 589/12384 [1:15:11<25:09:42, 7.68s/it, loss=0.4965, acc=0.4395, iter_time=7.63s]
Epoch 0: 5%|▍ | 589/12384 [1:15:19<25:09:42, 7.68s/it, loss=0.5482, acc=0.4071, iter_time=7.35s]
Epoch 0: 5%|▍ | 590/12384 [1:15:19<25:07:35, 7.67s/it, loss=0.5482, acc=0.4071, iter_time=7.35s]
Epoch 0: 5%|▍ | 590/12384 [1:15:26<25:07:35, 7.67s/it, loss=0.5106, acc=0.4397, iter_time=7.93s]
Epoch 0: 5%|▍ | 591/12384 [1:15:26<25:04:16, 7.65s/it, loss=0.5106, acc=0.4397, iter_time=7.93s]
Epoch 0: 5%|▍ | 591/12384 [1:15:34<25:04:16, 7.65s/it, loss=0.5197, acc=0.4329, iter_time=7.61s]
Epoch 0: 5%|▍ | 592/12384 [1:15:34<25:04:07, 7.65s/it, loss=0.5197, acc=0.4329, iter_time=7.61s]
Epoch 0: 5%|▍ | 592/12384 [1:15:42<25:04:07, 7.65s/it, loss=0.4506, acc=0.4788, iter_time=5.93s]
Epoch 0: 5%|▍ | 593/12384 [1:15:42<25:03:26, 7.65s/it, loss=0.4506, acc=0.4788, iter_time=5.93s]
Epoch 0: 5%|▍ | 593/12384 [1:15:49<25:03:26, 7.65s/it, loss=0.4671, acc=0.4699, iter_time=6.23s]
Epoch 0: 5%|▍ | 594/12384 [1:15:49<25:03:28, 7.65s/it, loss=0.4671, acc=0.4699, iter_time=6.23s]
Epoch 0: 5%|▍ | 594/12384 [1:15:57<25:03:28, 7.65s/it, loss=0.3762, acc=0.4901, iter_time=9.68s]
Epoch 0: 5%|▍ | 595/12384 [1:15:57<25:02:26, 7.65s/it, loss=0.3762, acc=0.4901, iter_time=9.68s]
Epoch 0: 5%|▍ | 595/12384 [1:16:05<25:02:26, 7.65s/it, loss=0.6318, acc=0.4473, iter_time=8.77s]
Epoch 0: 5%|▍ | 596/12384 [1:16:05<25:02:30, 7.65s/it, loss=0.6318, acc=0.4473, iter_time=8.77s]
Epoch 0: 5%|▍ | 596/12384 [1:16:12<25:02:30, 7.65s/it, loss=0.4220, acc=0.5015, iter_time=7.72s]
Epoch 0: 5%|▍ | 597/12384 [1:16:12<25:05:04, 7.66s/it, loss=0.4220, acc=0.5015, iter_time=7.72s]
Epoch 0: 5%|▍ | 597/12384 [1:16:20<25:05:04, 7.66s/it, loss=0.4720, acc=0.4488, iter_time=7.02s]
Epoch 0: 5%|▍ | 598/12384 [1:16:20<25:02:10, 7.65s/it, loss=0.4720, acc=0.4488, iter_time=7.02s]
Epoch 0: 5%|▍ | 598/12384 [1:16:28<25:02:10, 7.65s/it, loss=0.4471, acc=0.4765, iter_time=8.24s]
Epoch 0: 5%|▍ | 599/12384 [1:16:28<25:02:04, 7.65s/it, loss=0.4471, acc=0.4765, iter_time=8.24s]
Epoch 0: 5%|▍ | 599/12384 [1:16:35<25:02:04, 7.65s/it, loss=0.4545, acc=0.4907, iter_time=8.04s]
Epoch 0: 5%|▍ | 600/12384 [1:16:35<25:01:31, 7.65s/it, loss=0.4545, acc=0.4907, iter_time=8.04s]
Epoch 0: 5%|▍ | 600/12384 [1:16:43<25:01:31, 7.65s/it, loss=0.3590, acc=0.5658, iter_time=7.21s]
Epoch 0: 5%|▍ | 601/12384 [1:16:43<24:58:57, 7.63s/it, loss=0.3590, acc=0.5658, iter_time=7.21s]
Epoch 0: 5%|▍ | 601/12384 [1:16:51<24:58:57, 7.63s/it, loss=0.3608, acc=0.5635, iter_time=4.77s]
Epoch 0: 5%|▍ | 602/12384 [1:16:51<24:59:41, 7.64s/it, loss=0.3608, acc=0.5635, iter_time=4.77s]
Epoch 0: 5%|▍ | 602/12384 [1:16:58<24:59:41, 7.64s/it, loss=0.4167, acc=0.4805, iter_time=10.47s]
Epoch 0: 5%|▍ | 603/12384 [1:16:58<24:59:09, 7.64s/it, loss=0.4167, acc=0.4805, iter_time=10.47s]
Epoch 0: 5%|▍ | 603/12384 [1:17:06<24:59:09, 7.64s/it, loss=0.3339, acc=0.5512, iter_time=7.66s]
Epoch 0: 5%|▍ | 604/12384 [1:17:06<25:00:31, 7.64s/it, loss=0.3339, acc=0.5512, iter_time=7.66s]
Epoch 0: 5%|▍ | 604/12384 [1:17:13<25:00:31, 7.64s/it, loss=0.3723, acc=0.6058, iter_time=6.45s]
Epoch 0: 5%|▍ | 605/12384 [1:17:13<24:58:34, 7.63s/it, loss=0.3723, acc=0.6058, iter_time=6.45s]
Epoch 0: 5%|▍ | 605/12384 [1:17:21<24:58:34, 7.63s/it, loss=0.4356, acc=0.4972, iter_time=8.80s]
Epoch 0: 5%|▍ | 606/12384 [1:17:21<24:58:41, 7.63s/it, loss=0.4356, acc=0.4972, iter_time=8.80s]
Epoch 0: 5%|▍ | 606/12384 [1:17:29<24:58:41, 7.63s/it, loss=0.3879, acc=0.5585, iter_time=7.63s]
Epoch 0: 5%|▍ | 607/12384 [1:17:29<24:59:41, 7.64s/it, loss=0.3879, acc=0.5585, iter_time=7.63s]
Epoch 0: 5%|▍ | 607/12384 [1:17:36<24:59:41, 7.64s/it, loss=0.4014, acc=0.5559, iter_time=7.64s]
Epoch 0: 5%|▍ | 608/12384 [1:17:36<25:00:20, 7.64s/it, loss=0.4014, acc=0.5559, iter_time=7.64s]
Epoch 0: 5%|▍ | 608/12384 [1:17:44<25:00:20, 7.64s/it, loss=0.3320, acc=0.5873, iter_time=7.68s]
Epoch 0: 5%|▍ | 609/12384 [1:17:44<24:58:37, 7.64s/it, loss=0.3320, acc=0.5873, iter_time=7.68s]
Epoch 0: 5%|▍ | 609/12384 [1:17:52<24:58:37, 7.64s/it, loss=0.4512, acc=0.5488, iter_time=4.07s]
Epoch 0: 5%|▍ | 610/12384 [1:17:52<24:59:21, 7.64s/it, loss=0.4512, acc=0.5488, iter_time=4.07s]
Epoch 0: 5%|▍ | 610/12384 [1:17:59<24:59:21, 7.64s/it, loss=0.3436, acc=0.5503, iter_time=11.19s]
Epoch 0: 5%|▍ | 611/12384 [1:17:59<25:00:45, 7.65s/it, loss=0.3436, acc=0.5503, iter_time=11.19s]
Epoch 0: 5%|▍ | 611/12384 [1:18:07<25:00:45, 7.65s/it, loss=0.2757, acc=0.6474, iter_time=7.72s]
Epoch 0: 5%|▍ | 612/12384 [1:18:07<25:01:53, 7.65s/it, loss=0.2757, acc=0.6474, iter_time=7.72s]
Epoch 0: 5%|▍ | 612/12384 [1:18:15<25:01:53, 7.65s/it, loss=0.3746, acc=0.5754, iter_time=7.92s]
Epoch 0: 5%|▍ | 613/12384 [1:18:15<25:19:13, 7.74s/it, loss=0.3746, acc=0.5754, iter_time=7.92s]
Epoch 0: 5%|▍ | 613/12384 [1:18:23<25:19:13, 7.74s/it, loss=0.3046, acc=0.5813, iter_time=6.71s]
Epoch 0: 5%|▍ | 614/12384 [1:18:23<25:12:10, 7.71s/it, loss=0.3046, acc=0.5813, iter_time=6.71s]
Epoch 0: 5%|▍ | 614/12384 [1:18:30<25:12:10, 7.71s/it, loss=0.3546, acc=0.5911, iter_time=5.79s]
Epoch 0: 5%|▍ | 615/12384 [1:18:30<25:07:42, 7.69s/it, loss=0.3546, acc=0.5911, iter_time=5.79s]
Epoch 0: 5%|▍ | 615/12384 [1:18:38<25:07:42, 7.69s/it, loss=0.2801, acc=0.6547, iter_time=10.86s]
Epoch 0: 5%|▍ | 616/12384 [1:18:38<25:06:35, 7.68s/it, loss=0.2801, acc=0.6547, iter_time=10.86s]
Epoch 0: 5%|▍ | 616/12384 [1:18:45<25:06:35, 7.68s/it, loss=0.3847, acc=0.5504, iter_time=7.21s]
Epoch 0: 5%|▍ | 617/12384 [1:18:45<25:03:00, 7.66s/it, loss=0.3847, acc=0.5504, iter_time=7.21s]
Epoch 0: 5%|▍ | 617/12384 [1:18:53<25:03:00, 7.66s/it, loss=0.2462, acc=0.6632, iter_time=5.85s]
Epoch 0: 5%|▍ | 618/12384 [1:18:53<25:01:59, 7.66s/it, loss=0.2462, acc=0.6632, iter_time=5.85s]
Epoch 0: 5%|▍ | 618/12384 [1:19:01<25:01:59, 7.66s/it, loss=0.3307, acc=0.6648, iter_time=9.42s]
Epoch 0: 5%|▍ | 619/12384 [1:19:01<25:00:27, 7.65s/it, loss=0.3307, acc=0.6648, iter_time=9.42s]
Epoch 0: 5%|▍ | 619/12384 [1:19:08<25:00:27, 7.65s/it, loss=0.3192, acc=0.5956, iter_time=7.64s]
Epoch 0: 5%|▌ | 620/12384 [1:19:08<24:56:30, 7.63s/it, loss=0.3192, acc=0.5956, iter_time=7.64s]
Epoch 0: 5%|▌ | 620/12384 [1:19:16<24:56:30, 7.63s/it, loss=0.2890, acc=0.6224, iter_time=7.60s]
Epoch 0: 5%|▌ | 621/12384 [1:19:16<24:55:58, 7.63s/it, loss=0.2890, acc=0.6224, iter_time=7.60s]
Epoch 0: 5%|▌ | 621/12384 [1:19:24<24:55:58, 7.63s/it, loss=0.2759, acc=0.6690, iter_time=7.63s]
Epoch 0: 5%|▌ | 622/12384 [1:19:24<24:57:59, 7.64s/it, loss=0.2759, acc=0.6690, iter_time=7.63s]
Epoch 0: 5%|▌ | 622/12384 [1:19:31<24:57:59, 7.64s/it, loss=0.2857, acc=0.6261, iter_time=7.66s]
Epoch 0: 5%|▌ | 623/12384 [1:19:31<24:57:50, 7.64s/it, loss=0.2857, acc=0.6261, iter_time=7.66s]
Epoch 0: 5%|▌ | 623/12384 [1:19:39<24:57:50, 7.64s/it, loss=0.2741, acc=0.6090, iter_time=8.04s]
Epoch 0: 5%|▌ | 624/12384 [1:19:39<25:00:58, 7.66s/it, loss=0.2741, acc=0.6090, iter_time=8.04s]
Epoch 0: 5%|▌ | 624/12384 [1:19:47<25:00:58, 7.66s/it, loss=0.3084, acc=0.5810, iter_time=7.30s]
Epoch 0: 5%|▌ | 625/12384 [1:19:47<24:59:33, 7.65s/it, loss=0.3084, acc=0.5810, iter_time=7.30s]
Epoch 0: 5%|▌ | 625/12384 [1:19:54<24:59:33, 7.65s/it, loss=0.2274, acc=0.7522, iter_time=4.04s]
Epoch 0: 5%|▌ | 626/12384 [1:19:54<24:56:39, 7.64s/it, loss=0.2274, acc=0.7522, iter_time=4.04s]
Epoch 0: 5%|▌ | 626/12384 [1:20:02<24:56:39, 7.64s/it, loss=0.2724, acc=0.6851, iter_time=11.17s]
Epoch 0: 5%|▌ | 627/12384 [1:20:02<24:55:59, 7.63s/it, loss=0.2724, acc=0.6851, iter_time=11.17s]
Epoch 0: 5%|▌ | 627/12384 [1:20:09<24:55:59, 7.63s/it, loss=0.2737, acc=0.6208, iter_time=7.65s]
Epoch 0: 5%|▌ | 628/12384 [1:20:09<24:54:54, 7.63s/it, loss=0.2737, acc=0.6208, iter_time=7.65s]
Epoch 0: 5%|▌ | 628/12384 [1:20:17<24:54:54, 7.63s/it, loss=0.2697, acc=0.6223, iter_time=7.62s]
Epoch 0: 5%|▌ | 629/12384 [1:20:17<24:54:39, 7.63s/it, loss=0.2697, acc=0.6223, iter_time=7.62s]
Epoch 0: 5%|▌ | 629/12384 [1:20:25<24:54:39, 7.63s/it, loss=0.3092, acc=0.6069, iter_time=7.65s]
Epoch 0: 5%|▌ | 630/12384 [1:20:25<24:56:20, 7.64s/it, loss=0.3092, acc=0.6069, iter_time=7.65s]
Epoch 0: 5%|▌ | 630/12384 [1:20:32<24:56:20, 7.64s/it, loss=0.2454, acc=0.6816, iter_time=7.64s]
Epoch 0: 5%|▌ | 631/12384 [1:20:32<24:56:58, 7.64s/it, loss=0.2454, acc=0.6816, iter_time=7.64s]
Epoch 0: 5%|▌ | 631/12384 [1:20:40<24:56:58, 7.64s/it, loss=0.3183, acc=0.5691, iter_time=8.04s]
Epoch 0: 5%|▌ | 632/12384 [1:20:40<24:56:56, 7.64s/it, loss=0.3183, acc=0.5691, iter_time=8.04s]
Epoch 0: 5%|▌ | 632/12384 [1:20:48<24:56:56, 7.64s/it, loss=0.2355, acc=0.6794, iter_time=7.25s]
Epoch 0: 5%|▌ | 633/12384 [1:20:48<24:56:52, 7.64s/it, loss=0.2355, acc=0.6794, iter_time=7.25s]
Epoch 0: 5%|▌ | 633/12384 [1:20:55<24:56:52, 7.64s/it, loss=0.2374, acc=0.6964, iter_time=7.63s]
Epoch 0: 5%|▌ | 634/12384 [1:20:55<24:57:06, 7.64s/it, loss=0.2374, acc=0.6964, iter_time=7.63s]
Epoch 0: 5%|▌ | 634/12384 [1:21:03<24:57:06, 7.64s/it, loss=0.2305, acc=0.6784, iter_time=7.66s]
Epoch 0: 5%|▌ | 635/12384 [1:21:03<24:58:33, 7.65s/it, loss=0.2305, acc=0.6784, iter_time=7.66s]
Epoch 0: 5%|▌ | 635/12384 [1:21:11<24:58:33, 7.65s/it, loss=0.1761, acc=0.7745, iter_time=7.67s]
Epoch 0: 5%|▌ | 636/12384 [1:21:11<24:59:50, 7.66s/it, loss=0.1761, acc=0.7745, iter_time=7.67s]
Epoch 0: 5%|▌ | 636/12384 [1:21:18<24:59:50, 7.66s/it, loss=0.1990, acc=0.7060, iter_time=7.68s]
Epoch 0: 5%|▌ | 637/12384 [1:21:18<24:57:25, 7.65s/it, loss=0.1990, acc=0.7060, iter_time=7.68s]
Epoch 0: 5%|▌ | 637/12384 [1:21:26<24:57:25, 7.65s/it, loss=0.2891, acc=0.6542, iter_time=7.66s]
Epoch 0: 5%|▌ | 638/12384 [1:21:26<25:01:05, 7.67s/it, loss=0.2891, acc=0.6542, iter_time=7.66s]
Epoch 0: 5%|▌ | 638/12384 [1:21:35<25:01:05, 7.67s/it, loss=0.2287, acc=0.6787, iter_time=8.48s]
Epoch 0: 5%|▌ | 639/12384 [1:21:35<25:54:06, 7.94s/it, loss=0.2287, acc=0.6787, iter_time=8.48s]
Epoch 0: 5%|▌ | 639/12384 [1:21:43<25:54:06, 7.94s/it, loss=0.2104, acc=0.7418, iter_time=8.11s]
Epoch 0: 5%|▌ | 640/12384 [1:21:43<25:58:16, 7.96s/it, loss=0.2104, acc=0.7418, iter_time=8.11s]
Epoch 0: 5%|▌ | 640/12384 [1:21:50<25:58:16, 7.96s/it, loss=0.2158, acc=0.6936, iter_time=7.65s]
Epoch 0: 5%|▌ | 641/12384 [1:21:50<25:42:47, 7.88s/it, loss=0.2158, acc=0.6936, iter_time=7.65s]
Epoch 0: 5%|▌ | 641/12384 [1:21:58<25:42:47, 7.88s/it, loss=0.1843, acc=0.7471, iter_time=7.73s]
Epoch 0: 5%|▌ | 642/12384 [1:21:58<25:26:42, 7.80s/it, loss=0.1843, acc=0.7471, iter_time=7.73s]
Epoch 0: 5%|▌ | 642/12384 [1:22:06<25:26:42, 7.80s/it, loss=0.2027, acc=0.7683, iter_time=6.67s]
Epoch 0: 5%|▌ | 643/12384 [1:22:06<25:17:14, 7.75s/it, loss=0.2027, acc=0.7683, iter_time=6.67s]
Epoch 0: 5%|▌ | 643/12384 [1:22:13<25:17:14, 7.75s/it, loss=0.1985, acc=0.7134, iter_time=8.56s]
Epoch 0: 5%|▌ | 644/12384 [1:22:13<25:08:42, 7.71s/it, loss=0.1985, acc=0.7134, iter_time=8.56s]
Epoch 0: 5%|▌ | 644/12384 [1:22:21<25:08:42, 7.71s/it, loss=0.1784, acc=0.7264, iter_time=7.64s]
Epoch 0: 5%|▌ | 645/12384 [1:22:21<25:04:52, 7.69s/it, loss=0.1784, acc=0.7264, iter_time=7.64s]
Epoch 0: 5%|▌ | 645/12384 [1:22:28<25:04:52, 7.69s/it, loss=0.1879, acc=0.7621, iter_time=7.62s]
Epoch 0: 5%|▌ | 646/12384 [1:22:28<25:00:38, 7.67s/it, loss=0.1879, acc=0.7621, iter_time=7.62s]
Epoch 0: 5%|▌ | 646/12384 [1:22:36<25:00:38, 7.67s/it, loss=0.1737, acc=0.7515, iter_time=7.63s]
Epoch 0: 5%|▌ | 647/12384 [1:22:36<24:58:09, 7.66s/it, loss=0.1737, acc=0.7515, iter_time=7.63s]
Epoch 0: 5%|▌ | 647/12384 [1:22:44<24:58:09, 7.66s/it, loss=0.1593, acc=0.7533, iter_time=8.02s]
Epoch 0: 5%|▌ | 648/12384 [1:22:44<24:54:37, 7.64s/it, loss=0.1593, acc=0.7533, iter_time=8.02s]
Epoch 0: 5%|▌ | 648/12384 [1:22:51<24:54:37, 7.64s/it, loss=0.1462, acc=0.7813, iter_time=7.21s]
Epoch 0: 5%|▌ | 649/12384 [1:22:51<24:52:36, 7.63s/it, loss=0.1462, acc=0.7813, iter_time=7.21s]
Epoch 0: 5%|▌ | 649/12384 [1:22:59<24:52:36, 7.63s/it, loss=0.5466, acc=0.6792, iter_time=8.10s]
Epoch 0: 5%|▌ | 650/12384 [1:22:59<24:56:29, 7.65s/it, loss=0.5466, acc=0.6792, iter_time=8.10s]
Epoch 0: 5%|▌ | 650/12384 [1:23:07<24:56:29, 7.65s/it, loss=0.1704, acc=0.7695, iter_time=7.24s]
Epoch 0: 5%|▌ | 651/12384 [1:23:07<24:59:51, 7.67s/it, loss=0.1704, acc=0.7695, iter_time=7.24s]
Epoch 0: 5%|▌ | 651/12384 [1:23:14<24:59:51, 7.67s/it, loss=0.1583, acc=0.7768, iter_time=7.70s]
Epoch 0: 5%|▌ | 652/12384 [1:23:14<24:57:30, 7.66s/it, loss=0.1583, acc=0.7768, iter_time=7.70s]
Epoch 0: 5%|▌ | 652/12384 [1:23:22<24:57:30, 7.66s/it, loss=0.2298, acc=0.7080, iter_time=7.64s]
Epoch 0: 5%|▌ | 653/12384 [1:23:22<24:55:59, 7.65s/it, loss=0.2298, acc=0.7080, iter_time=7.64s]
Epoch 0: 5%|▌ | 653/12384 [1:23:30<24:55:59, 7.65s/it, loss=0.1883, acc=0.7259, iter_time=4.84s]
Epoch 0: 5%|▌ | 654/12384 [1:23:30<24:54:47, 7.65s/it, loss=0.1883, acc=0.7259, iter_time=4.84s]
Epoch 0: 5%|▌ | 654/12384 [1:23:37<24:54:47, 7.65s/it, loss=0.1999, acc=0.7265, iter_time=10.41s]
Epoch 0: 5%|▌ | 655/12384 [1:23:37<24:53:51, 7.64s/it, loss=0.1999, acc=0.7265, iter_time=10.41s]
Epoch 0: 5%|▌ | 655/12384 [1:23:45<24:53:51, 7.64s/it, loss=0.1884, acc=0.7112, iter_time=8.01s]
Epoch 0: 5%|▌ | 656/12384 [1:23:45<24:58:08, 7.66s/it, loss=0.1884, acc=0.7112, iter_time=8.01s]
Epoch 0: 5%|▌ | 656/12384 [1:23:53<24:58:08, 7.66s/it, loss=0.1850, acc=0.7239, iter_time=7.35s]
Epoch 0: 5%|▌ | 657/12384 [1:23:53<24:54:59, 7.65s/it, loss=0.1850, acc=0.7239, iter_time=7.35s]
Epoch 0: 5%|▌ | 657/12384 [1:24:00<24:54:59, 7.65s/it, loss=0.1589, acc=0.7934, iter_time=7.59s]
Epoch 0: 5%|▌ | 658/12384 [1:24:00<24:51:10, 7.63s/it, loss=0.1589, acc=0.7934, iter_time=7.59s]
Epoch 0: 5%|▌ | 658/12384 [1:24:08<24:51:10, 7.63s/it, loss=0.1807, acc=0.7450, iter_time=7.62s]
Epoch 0: 5%|▌ | 659/12384 [1:24:08<24:53:02, 7.64s/it, loss=0.1807, acc=0.7450, iter_time=7.62s]
Epoch 0: 5%|▌ | 659/12384 [1:24:15<24:53:02, 7.64s/it, loss=0.1695, acc=0.7443, iter_time=6.70s]
Epoch 0: 5%|▌ | 660/12384 [1:24:15<24:52:43, 7.64s/it, loss=0.1695, acc=0.7443, iter_time=6.70s]
Epoch 0: 5%|▌ | 660/12384 [1:24:23<24:52:43, 7.64s/it, loss=0.1544, acc=0.7608, iter_time=8.60s]
Epoch 0: 5%|▌ | 661/12384 [1:24:23<24:52:39, 7.64s/it, loss=0.1544, acc=0.7608, iter_time=8.60s]
Epoch 0: 5%|▌ | 661/12384 [1:24:31<24:52:39, 7.64s/it, loss=0.1465, acc=0.7956, iter_time=7.64s]
Epoch 0: 5%|▌ | 662/12384 [1:24:31<24:52:13, 7.64s/it, loss=0.1465, acc=0.7956, iter_time=7.64s]
Epoch 0: 5%|▌ | 662/12384 [1:24:38<24:52:13, 7.64s/it, loss=0.2700, acc=0.7387, iter_time=4.85s]
Epoch 0: 5%|▌ | 663/12384 [1:24:38<24:52:28, 7.64s/it, loss=0.2700, acc=0.7387, iter_time=4.85s]
Epoch 0: 5%|▌ | 663/12384 [1:24:46<24:52:28, 7.64s/it, loss=0.1463, acc=0.7929, iter_time=10.38s]
Epoch 0: 5%|▌ | 664/12384 [1:24:46<24:51:12, 7.63s/it, loss=0.1463, acc=0.7929, iter_time=10.38s]
Epoch 0: 5%|▌ | 664/12384 [1:24:54<24:51:12, 7.63s/it, loss=0.2011, acc=0.7511, iter_time=7.66s]
Epoch 0: 5%|▌ | 665/12384 [1:24:54<24:49:41, 7.63s/it, loss=0.2011, acc=0.7511, iter_time=7.66s]
Epoch 0: 5%|▌ | 665/12384 [1:25:01<24:49:41, 7.63s/it, loss=0.1036, acc=0.8381, iter_time=7.92s]
Epoch 0: 5%|▌ | 666/12384 [1:25:01<25:06:07, 7.71s/it, loss=0.1036, acc=0.8381, iter_time=7.92s]
Epoch 0: 5%|▌ | 666/12384 [1:25:09<25:06:07, 7.71s/it, loss=0.1327, acc=0.8042, iter_time=4.23s]
Epoch 0: 5%|▌ | 667/12384 [1:25:09<25:00:36, 7.68s/it, loss=0.1327, acc=0.8042, iter_time=4.23s]
Epoch 0: 5%|▌ | 667/12384 [1:25:17<25:00:36, 7.68s/it, loss=0.1302, acc=0.8088, iter_time=10.99s]
Epoch 0: 5%|▌ | 668/12384 [1:25:17<24:56:54, 7.67s/it, loss=0.1302, acc=0.8088, iter_time=10.99s]
Epoch 0: 5%|▌ | 668/12384 [1:25:24<24:56:54, 7.67s/it, loss=0.0870, acc=0.8783, iter_time=7.63s]
Epoch 0: 5%|▌ | 669/12384 [1:25:24<24:54:18, 7.65s/it, loss=0.0870, acc=0.8783, iter_time=7.63s]
Epoch 0: 5%|▌ | 669/12384 [1:25:32<24:54:18, 7.65s/it, loss=0.1286, acc=0.8579, iter_time=5.56s]
Epoch 0: 5%|▌ | 670/12384 [1:25:32<24:52:04, 7.64s/it, loss=0.1286, acc=0.8579, iter_time=5.56s]
Epoch 0: 5%|▌ | 670/12384 [1:25:40<24:52:04, 7.64s/it, loss=0.1241, acc=0.8032, iter_time=9.44s]
Epoch 0: 5%|▌ | 671/12384 [1:25:40<24:49:59, 7.63s/it, loss=0.1241, acc=0.8032, iter_time=9.44s]
Epoch 0: 5%|▌ | 671/12384 [1:25:47<24:49:59, 7.63s/it, loss=0.1622, acc=0.8018, iter_time=7.83s]
Epoch 0: 5%|▌ | 672/12384 [1:25:47<24:50:36, 7.64s/it, loss=0.1622, acc=0.8018, iter_time=7.83s]
Epoch 0: 5%|▌ | 672/12384 [1:25:55<24:50:36, 7.64s/it, loss=0.1058, acc=0.8327, iter_time=6.69s]
Epoch 0: 5%|▌ | 673/12384 [1:25:55<24:48:24, 7.63s/it, loss=0.1058, acc=0.8327, iter_time=6.69s]
Epoch 0: 5%|▌ | 673/12384 [1:26:02<24:48:24, 7.63s/it, loss=0.1210, acc=0.8160, iter_time=5.04s]
Epoch 0: 5%|▌ | 674/12384 [1:26:02<24:46:49, 7.62s/it, loss=0.1210, acc=0.8160, iter_time=5.04s]
Epoch 0: 5%|▌ | 674/12384 [1:26:10<24:46:49, 7.62s/it, loss=0.1089, acc=0.8183, iter_time=11.10s]
Epoch 0: 5%|▌ | 675/12384 [1:26:10<24:46:43, 7.62s/it, loss=0.1089, acc=0.8183, iter_time=11.10s]
Epoch 0: 5%|▌ | 675/12384 [1:26:18<24:46:43, 7.62s/it, loss=0.1180, acc=0.8083, iter_time=7.63s]
Epoch 0: 5%|▌ | 676/12384 [1:26:18<24:47:31, 7.62s/it, loss=0.1180, acc=0.8083, iter_time=7.63s]
Epoch 0: 5%|▌ | 676/12384 [1:26:25<24:47:31, 7.62s/it, loss=0.1031, acc=0.8541, iter_time=7.63s]
Epoch 0: 5%|▌ | 677/12384 [1:26:25<24:45:33, 7.61s/it, loss=0.1031, acc=0.8541, iter_time=7.63s]
Epoch 0: 5%|▌ | 677/12384 [1:26:33<24:45:33, 7.61s/it, loss=0.1068, acc=0.8435, iter_time=7.60s]
Epoch 0: 5%|▌ | 678/12384 [1:26:33<24:46:14, 7.62s/it, loss=0.1068, acc=0.8435, iter_time=7.60s]
Epoch 0: 5%|▌ | 678/12384 [1:26:41<24:46:14, 7.62s/it, loss=0.2316, acc=0.7498, iter_time=5.90s]
Epoch 0: 5%|▌ | 679/12384 [1:26:41<24:50:06, 7.64s/it, loss=0.2316, acc=0.7498, iter_time=5.90s]
Epoch 0: 5%|▌ | 679/12384 [1:26:48<24:50:06, 7.64s/it, loss=0.1292, acc=0.8201, iter_time=9.40s]
Epoch 0: 5%|▌ | 680/12384 [1:26:48<24:50:21, 7.64s/it, loss=0.1292, acc=0.8201, iter_time=9.40s]
Epoch 0: 5%|▌ | 680/12384 [1:26:56<24:50:21, 7.64s/it, loss=0.1082, acc=0.8327, iter_time=7.72s]
Epoch 0: 5%|▌ | 681/12384 [1:26:56<24:51:59, 7.65s/it, loss=0.1082, acc=0.8327, iter_time=7.72s]
Epoch 0: 5%|▌ | 681/12384 [1:27:04<24:51:59, 7.65s/it, loss=0.1277, acc=0.8374, iter_time=4.84s]
Epoch 0: 6%|▌ | 682/12384 [1:27:04<24:50:16, 7.64s/it, loss=0.1277, acc=0.8374, iter_time=4.84s]
Epoch 0: 6%|▌ | 682/12384 [1:27:11<24:50:16, 7.64s/it, loss=0.1247, acc=0.7995, iter_time=10.39s]
Epoch 0: 6%|▌ | 683/12384 [1:27:11<24:50:26, 7.64s/it, loss=0.1247, acc=0.7995, iter_time=10.39s]
Epoch 0: 6%|▌ | 683/12384 [1:27:19<24:50:26, 7.64s/it, loss=0.1036, acc=0.8508, iter_time=6.42s]
Epoch 0: 6%|▌ | 684/12384 [1:27:19<24:49:39, 7.64s/it, loss=0.1036, acc=0.8508, iter_time=6.42s]
Epoch 0: 6%|▌ | 684/12384 [1:27:26<24:49:39, 7.64s/it, loss=0.1177, acc=0.8069, iter_time=7.94s]
Epoch 0: 6%|▌ | 685/12384 [1:27:26<24:47:02, 7.63s/it, loss=0.1177, acc=0.8069, iter_time=7.94s]
Epoch 0: 6%|▌ | 685/12384 [1:27:34<24:47:02, 7.63s/it, loss=0.1126, acc=0.8421, iter_time=8.53s]
Epoch 0: 6%|▌ | 686/12384 [1:27:34<24:48:19, 7.63s/it, loss=0.1126, acc=0.8421, iter_time=8.53s]
Epoch 0: 6%|▌ | 686/12384 [1:27:42<24:48:19, 7.63s/it, loss=0.1070, acc=0.8501, iter_time=7.64s]
Epoch 0: 6%|▌ | 687/12384 [1:27:42<24:50:35, 7.65s/it, loss=0.1070, acc=0.8501, iter_time=7.64s]
Epoch 0: 6%|▌ | 687/12384 [1:27:49<24:50:35, 7.65s/it, loss=0.1305, acc=0.7891, iter_time=8.06s]
Epoch 0: 6%|▌ | 688/12384 [1:27:49<24:48:56, 7.64s/it, loss=0.1305, acc=0.7891, iter_time=8.06s]
Epoch 0: 6%|▌ | 688/12384 [1:27:57<24:48:56, 7.64s/it, loss=0.0905, acc=0.8557, iter_time=7.36s]
Epoch 0: 6%|▌ | 689/12384 [1:27:57<24:53:38, 7.66s/it, loss=0.0905, acc=0.8557, iter_time=7.36s]
Epoch 0: 6%|▌ | 689/12384 [1:28:05<24:53:38, 7.66s/it, loss=0.0984, acc=0.8304, iter_time=6.40s]
Epoch 0: 6%|▌ | 690/12384 [1:28:05<24:51:24, 7.65s/it, loss=0.0984, acc=0.8304, iter_time=6.40s]
Epoch 0: 6%|▌ | 690/12384 [1:28:12<24:51:24, 7.65s/it, loss=0.0924, acc=0.8252, iter_time=8.84s]
Epoch 0: 6%|▌ | 691/12384 [1:28:12<24:51:44, 7.65s/it, loss=0.0924, acc=0.8252, iter_time=8.84s]
Epoch 0: 6%|▌ | 691/12384 [1:28:20<24:51:44, 7.65s/it, loss=0.0950, acc=0.8587, iter_time=7.66s]
Epoch 0: 6%|▌ | 692/12384 [1:28:20<24:49:29, 7.64s/it, loss=0.0950, acc=0.8587, iter_time=7.66s]
Epoch 0: 6%|▌ | 692/12384 [1:28:28<24:49:29, 7.64s/it, loss=0.1179, acc=0.7997, iter_time=7.94s]
Epoch 0: 6%|▌ | 693/12384 [1:28:28<25:08:25, 7.74s/it, loss=0.1179, acc=0.7997, iter_time=7.94s]
Epoch 0: 6%|▌ | 693/12384 [1:28:36<25:08:25, 7.74s/it, loss=0.0900, acc=0.8538, iter_time=7.08s]
Epoch 0: 6%|▌ | 694/12384 [1:28:36<25:00:02, 7.70s/it, loss=0.0900, acc=0.8538, iter_time=7.08s]
Epoch 0: 6%|▌ | 694/12384 [1:28:43<25:00:02, 7.70s/it, loss=0.0796, acc=0.8855, iter_time=4.61s]
Epoch 0: 6%|▌ | 695/12384 [1:28:43<24:53:38, 7.67s/it, loss=0.0796, acc=0.8855, iter_time=4.61s]
Epoch 0: 6%|▌ | 695/12384 [1:28:51<24:53:38, 7.67s/it, loss=0.0898, acc=0.8556, iter_time=11.22s]
Epoch 0: 6%|▌ | 696/12384 [1:28:51<24:49:06, 7.64s/it, loss=0.0898, acc=0.8556, iter_time=11.22s]
Epoch 0: 6%|▌ | 696/12384 [1:28:58<24:49:06, 7.64s/it, loss=0.0742, acc=0.9220, iter_time=4.88s]
Epoch 0: 6%|▌ | 697/12384 [1:28:58<24:47:54, 7.64s/it, loss=0.0742, acc=0.9220, iter_time=4.88s]
Epoch 0: 6%|▌ | 697/12384 [1:29:06<24:47:54, 7.64s/it, loss=0.0700, acc=0.9074, iter_time=8.46s]
Epoch 0: 6%|▌ | 698/12384 [1:29:06<24:49:52, 7.65s/it, loss=0.0700, acc=0.9074, iter_time=8.46s]
Epoch 0: 6%|▌ | 698/12384 [1:29:14<24:49:52, 7.65s/it, loss=0.1078, acc=0.8478, iter_time=8.52s]
Epoch 0: 6%|▌ | 699/12384 [1:29:14<24:46:45, 7.63s/it, loss=0.1078, acc=0.8478, iter_time=8.52s]
Epoch 0: 6%|▌ | 699/12384 [1:29:21<24:46:45, 7.63s/it, loss=0.0870, acc=0.8846, iter_time=8.96s]
Epoch 0: 6%|▌ | 700/12384 [1:29:21<24:45:54, 7.63s/it, loss=0.0870, acc=0.8846, iter_time=8.96s]
Epoch 0: 6%|▌ | 700/12384 [1:29:29<24:45:54, 7.63s/it, loss=0.0963, acc=0.8636, iter_time=7.20s]
Epoch 0: 6%|▌ | 701/12384 [1:29:29<24:44:46, 7.63s/it, loss=0.0963, acc=0.8636, iter_time=7.20s]
Epoch 0: 6%|▌ | 701/12384 [1:29:36<24:44:46, 7.63s/it, loss=0.0899, acc=0.8464, iter_time=7.63s]
Epoch 0: 6%|▌ | 702/12384 [1:29:36<24:44:36, 7.63s/it, loss=0.0899, acc=0.8464, iter_time=7.63s]
Epoch 0: 6%|▌ | 702/12384 [1:29:44<24:44:36, 7.63s/it, loss=0.0659, acc=0.8993, iter_time=7.62s]
Epoch 0: 6%|▌ | 703/12384 [1:29:44<24:44:40, 7.63s/it, loss=0.0659, acc=0.8993, iter_time=7.62s]
Epoch 0: 6%|▌ | 703/12384 [1:29:52<24:44:40, 7.63s/it, loss=0.0636, acc=0.9133, iter_time=7.61s]
Epoch 0: 6%|▌ | 704/12384 [1:29:52<24:45:31, 7.63s/it, loss=0.0636, acc=0.9133, iter_time=7.61s]
Epoch 0: 6%|▌ | 704/12384 [1:29:59<24:45:31, 7.63s/it, loss=0.0882, acc=0.8802, iter_time=5.10s]
Epoch 0: 6%|▌ | 705/12384 [1:29:59<24:45:50, 7.63s/it, loss=0.0882, acc=0.8802, iter_time=5.10s]
Epoch 0: 6%|▌ | 705/12384 [1:30:07<24:45:50, 7.63s/it, loss=0.0552, acc=0.9215, iter_time=10.19s]
Epoch 0: 6%|▌ | 706/12384 [1:30:07<24:44:24, 7.63s/it, loss=0.0552, acc=0.9215, iter_time=10.19s]
Epoch 0: 6%|▌ | 706/12384 [1:30:15<24:44:24, 7.63s/it, loss=0.0729, acc=0.8890, iter_time=7.63s]
Epoch 0: 6%|▌ | 707/12384 [1:30:15<24:45:26, 7.63s/it, loss=0.0729, acc=0.8890, iter_time=7.63s]
Epoch 0: 6%|▌ | 707/12384 [1:30:22<24:45:26, 7.63s/it, loss=0.0743, acc=0.8881, iter_time=7.62s]
Epoch 0: 6%|▌ | 708/12384 [1:30:22<24:44:36, 7.63s/it, loss=0.0743, acc=0.8881, iter_time=7.62s]
Epoch 0: 6%|▌ | 708/12384 [1:30:30<24:44:36, 7.63s/it, loss=0.0683, acc=0.8922, iter_time=7.65s]
Epoch 0: 6%|▌ | 709/12384 [1:30:30<24:43:40, 7.62s/it, loss=0.0683, acc=0.8922, iter_time=7.65s]
Epoch 0: 6%|▌ | 709/12384 [1:30:38<24:43:40, 7.62s/it, loss=0.0779, acc=0.8605, iter_time=4.74s]
Epoch 0: 6%|▌ | 710/12384 [1:30:38<24:44:15, 7.63s/it, loss=0.0779, acc=0.8605, iter_time=4.74s]
Epoch 0: 6%|▌ | 710/12384 [1:30:45<24:44:15, 7.63s/it, loss=0.0851, acc=0.8623, iter_time=10.49s]
Epoch 0: 6%|▌ | 711/12384 [1:30:45<24:45:14, 7.63s/it, loss=0.0851, acc=0.8623, iter_time=10.49s]
Epoch 0: 6%|▌ | 711/12384 [1:30:53<24:45:14, 7.63s/it, loss=0.1700, acc=0.8449, iter_time=8.04s]
Epoch 0: 6%|▌ | 712/12384 [1:30:53<24:45:44, 7.64s/it, loss=0.1700, acc=0.8449, iter_time=8.04s]
Epoch 0: 6%|▌ | 712/12384 [1:31:00<24:45:44, 7.64s/it, loss=0.1078, acc=0.8213, iter_time=7.23s]
Epoch 0: 6%|▌ | 713/12384 [1:31:00<24:45:00, 7.63s/it, loss=0.1078, acc=0.8213, iter_time=7.23s]
Epoch 0: 6%|▌ | 713/12384 [1:31:08<24:45:00, 7.63s/it, loss=0.0854, acc=0.8348, iter_time=7.01s]
Epoch 0: 6%|▌ | 714/12384 [1:31:08<24:45:39, 7.64s/it, loss=0.0854, acc=0.8348, iter_time=7.01s]
Epoch 0: 6%|▌ | 714/12384 [1:31:16<24:45:39, 7.64s/it, loss=0.0721, acc=0.8963, iter_time=8.30s]
Epoch 0: 6%|▌ | 715/12384 [1:31:16<24:46:52, 7.65s/it, loss=0.0721, acc=0.8963, iter_time=8.30s]
Epoch 0: 6%|▌ | 715/12384 [1:31:23<24:46:52, 7.65s/it, loss=0.0602, acc=0.9016, iter_time=7.66s]
Epoch 0: 6%|▌ | 716/12384 [1:31:23<24:44:33, 7.63s/it, loss=0.0602, acc=0.9016, iter_time=7.66s]
Epoch 0: 6%|▌ | 716/12384 [1:31:31<24:44:33, 7.63s/it, loss=0.0475, acc=0.9400, iter_time=7.61s]
Epoch 0: 6%|▌ | 717/12384 [1:31:31<24:43:56, 7.63s/it, loss=0.0475, acc=0.9400, iter_time=7.61s]
Epoch 0: 6%|▌ | 717/12384 [1:31:39<24:43:56, 7.63s/it, loss=0.0821, acc=0.8669, iter_time=5.83s]
Epoch 0: 6%|▌ | 718/12384 [1:31:39<24:47:11, 7.65s/it, loss=0.0821, acc=0.8669, iter_time=5.83s]
Epoch 0: 6%|▌ | 718/12384 [1:31:47<24:47:11, 7.65s/it, loss=0.0577, acc=0.9257, iter_time=9.48s]
Epoch 0: 6%|▌ | 719/12384 [1:31:47<25:02:04, 7.73s/it, loss=0.0577, acc=0.9257, iter_time=9.48s]
Epoch 0: 6%|▌ | 719/12384 [1:31:54<25:02:04, 7.73s/it, loss=0.0791, acc=0.8718, iter_time=8.29s]
Epoch 0: 6%|▌ | 720/12384 [1:31:54<24:57:03, 7.70s/it, loss=0.0791, acc=0.8718, iter_time=8.29s]
Epoch 0: 6%|▌ | 720/12384 [1:32:02<24:57:03, 7.70s/it, loss=0.1032, acc=0.8775, iter_time=7.24s]
Epoch 0: 6%|▌ | 721/12384 [1:32:02<24:51:42, 7.67s/it, loss=0.1032, acc=0.8775, iter_time=7.24s]
Epoch 0: 6%|▌ | 721/12384 [1:32:09<24:51:42, 7.67s/it, loss=0.0505, acc=0.9189, iter_time=6.42s]
Epoch 0: 6%|▌ | 722/12384 [1:32:09<24:47:12, 7.65s/it, loss=0.0505, acc=0.9189, iter_time=6.42s]
Epoch 0: 6%|▌ | 722/12384 [1:32:17<24:47:12, 7.65s/it, loss=0.0540, acc=0.9087, iter_time=8.80s]
Epoch 0: 6%|▌ | 723/12384 [1:32:17<24:45:45, 7.64s/it, loss=0.0540, acc=0.9087, iter_time=8.80s]
Epoch 0: 6%|▌ | 723/12384 [1:32:25<24:45:45, 7.64s/it, loss=0.0382, acc=0.9305, iter_time=7.64s]
Epoch 0: 6%|▌ | 724/12384 [1:32:25<24:44:41, 7.64s/it, loss=0.0382, acc=0.9305, iter_time=7.64s]
Epoch 0: 6%|▌ | 724/12384 [1:32:32<24:44:41, 7.64s/it, loss=0.0724, acc=0.8542, iter_time=4.25s]
Epoch 0: 6%|▌ | 725/12384 [1:32:32<24:45:24, 7.64s/it, loss=0.0724, acc=0.8542, iter_time=4.25s]
Epoch 0: 6%|▌ | 725/12384 [1:32:40<24:45:24, 7.64s/it, loss=0.0610, acc=0.9049, iter_time=11.01s]
Epoch 0: 6%|▌ | 726/12384 [1:32:40<24:43:10, 7.63s/it, loss=0.0610, acc=0.9049, iter_time=11.01s]
Epoch 0: 6%|▌ | 726/12384 [1:32:48<24:43:10, 7.63s/it, loss=0.0618, acc=0.9024, iter_time=7.63s]
Epoch 0: 6%|▌ | 727/12384 [1:32:48<24:41:11, 7.62s/it, loss=0.0618, acc=0.9024, iter_time=7.63s]
Epoch 0: 6%|▌ | 727/12384 [1:32:55<24:41:11, 7.62s/it, loss=0.0476, acc=0.9378, iter_time=7.57s]
Epoch 0: 6%|▌ | 728/12384 [1:32:55<24:41:34, 7.63s/it, loss=0.0476, acc=0.9378, iter_time=7.57s]
Epoch 0: 6%|▌ | 728/12384 [1:33:03<24:41:34, 7.63s/it, loss=0.0640, acc=0.8811, iter_time=7.68s]
Epoch 0: 6%|▌ | 729/12384 [1:33:03<24:41:03, 7.62s/it, loss=0.0640, acc=0.8811, iter_time=7.68s]
Epoch 0: 6%|▌ | 729/12384 [1:33:10<24:41:03, 7.62s/it, loss=0.0732, acc=0.8555, iter_time=7.59s]
Epoch 0: 6%|▌ | 730/12384 [1:33:10<24:40:30, 7.62s/it, loss=0.0732, acc=0.8555, iter_time=7.59s]
Epoch 0: 6%|▌ | 730/12384 [1:33:18<24:40:30, 7.62s/it, loss=0.1067, acc=0.8770, iter_time=4.56s]
Epoch 0: 6%|▌ | 731/12384 [1:33:18<24:42:32, 7.63s/it, loss=0.1067, acc=0.8770, iter_time=4.56s]
Epoch 0: 6%|▌ | 731/12384 [1:33:26<24:42:32, 7.63s/it, loss=0.0435, acc=0.9228, iter_time=7.91s]
Epoch 0: 6%|▌ | 732/12384 [1:33:26<24:49:14, 7.67s/it, loss=0.0435, acc=0.9228, iter_time=7.91s]
Epoch 0: 6%|▌ | 732/12384 [1:33:33<24:49:14, 7.67s/it, loss=0.0788, acc=0.8607, iter_time=10.56s]
Epoch 0: 6%|▌ | 733/12384 [1:33:33<24:47:25, 7.66s/it, loss=0.0788, acc=0.8607, iter_time=10.56s]
Epoch 0: 6%|▌ | 733/12384 [1:33:41<24:47:25, 7.66s/it, loss=0.0610, acc=0.8936, iter_time=6.16s]
Epoch 0: 6%|▌ | 734/12384 [1:33:41<24:46:09, 7.65s/it, loss=0.0610, acc=0.8936, iter_time=6.16s]
Epoch 0: 6%|▌ | 734/12384 [1:33:49<24:46:09, 7.65s/it, loss=0.0510, acc=0.9132, iter_time=7.92s]
Epoch 0: 6%|▌ | 735/12384 [1:33:49<24:45:02, 7.65s/it, loss=0.0510, acc=0.9132, iter_time=7.92s]
Epoch 0: 6%|▌ | 735/12384 [1:33:56<24:45:02, 7.65s/it, loss=0.0514, acc=0.9083, iter_time=9.25s]
Epoch 0: 6%|▌ | 736/12384 [1:33:56<24:46:00, 7.65s/it, loss=0.0514, acc=0.9083, iter_time=9.25s]
Epoch 0: 6%|▌ | 736/12384 [1:34:04<24:46:00, 7.65s/it, loss=0.0416, acc=0.9112, iter_time=4.95s]
Epoch 0: 6%|▌ | 737/12384 [1:34:04<24:42:48, 7.64s/it, loss=0.0416, acc=0.9112, iter_time=4.95s]
Epoch 0: 6%|▌ | 737/12384 [1:34:12<24:42:48, 7.64s/it, loss=0.0671, acc=0.9069, iter_time=9.90s]
Epoch 0: 6%|▌ | 738/12384 [1:34:12<24:42:37, 7.64s/it, loss=0.0671, acc=0.9069, iter_time=9.90s]
Epoch 0: 6%|▌ | 738/12384 [1:34:19<24:42:37, 7.64s/it, loss=0.0615, acc=0.8817, iter_time=7.66s]
Epoch 0: 6%|▌ | 739/12384 [1:34:19<24:44:39, 7.65s/it, loss=0.0615, acc=0.8817, iter_time=7.66s]
Epoch 0: 6%|▌ | 739/12384 [1:34:27<24:44:39, 7.65s/it, loss=0.0525, acc=0.9135, iter_time=5.90s]
Epoch 0: 6%|▌ | 740/12384 [1:34:27<24:47:19, 7.66s/it, loss=0.0525, acc=0.9135, iter_time=5.90s]
Epoch 0: 6%|▌ | 740/12384 [1:34:35<24:47:19, 7.66s/it, loss=0.2883, acc=0.8236, iter_time=9.47s]
Epoch 0: 6%|▌ | 741/12384 [1:34:35<24:44:20, 7.65s/it, loss=0.2883, acc=0.8236, iter_time=9.47s]
Epoch 0: 6%|▌ | 741/12384 [1:34:42<24:44:20, 7.65s/it, loss=0.0424, acc=0.9257, iter_time=7.59s]
Epoch 0: 6%|▌ | 742/12384 [1:34:42<24:42:15, 7.64s/it, loss=0.0424, acc=0.9257, iter_time=7.59s]
Epoch 0: 6%|▌ | 742/12384 [1:34:50<24:42:15, 7.64s/it, loss=0.1948, acc=0.8517, iter_time=7.62s]
Epoch 0: 6%|▌ | 743/12384 [1:34:50<24:41:33, 7.64s/it, loss=0.1948, acc=0.8517, iter_time=7.62s]
Epoch 0: 6%|▌ | 743/12384 [1:34:58<24:41:33, 7.64s/it, loss=0.0475, acc=0.9171, iter_time=8.04s]
Epoch 0: 6%|▌ | 744/12384 [1:34:58<24:40:17, 7.63s/it, loss=0.0475, acc=0.9171, iter_time=8.04s]
Epoch 0: 6%|▌ | 744/12384 [1:35:05<24:40:17, 7.63s/it, loss=0.0418, acc=0.9287, iter_time=7.52s]
Epoch 0: 6%|▌ | 745/12384 [1:35:05<24:58:51, 7.73s/it, loss=0.0418, acc=0.9287, iter_time=7.52s]
Epoch 0: 6%|▌ | 745/12384 [1:35:13<24:58:51, 7.73s/it, loss=0.0360, acc=0.9375, iter_time=7.68s]
Epoch 0: 6%|▌ | 746/12384 [1:35:13<24:57:01, 7.72s/it, loss=0.0360, acc=0.9375, iter_time=7.68s]
Epoch 0: 6%|▌ | 746/12384 [1:35:21<24:57:01, 7.72s/it, loss=0.0492, acc=0.9099, iter_time=7.68s]
Epoch 0: 6%|▌ | 747/12384 [1:35:21<24:51:00, 7.69s/it, loss=0.0492, acc=0.9099, iter_time=7.68s]
Epoch 0: 6%|▌ | 747/12384 [1:35:28<24:51:00, 7.69s/it, loss=0.0421, acc=0.9237, iter_time=7.61s]
Epoch 0: 6%|▌ | 748/12384 [1:35:28<24:47:09, 7.67s/it, loss=0.0421, acc=0.9237, iter_time=7.61s]
Epoch 0: 6%|▌ | 748/12384 [1:35:36<24:47:09, 7.67s/it, loss=0.0499, acc=0.9035, iter_time=7.03s]
Epoch 0: 6%|▌ | 749/12384 [1:35:36<24:42:50, 7.65s/it, loss=0.0499, acc=0.9035, iter_time=7.03s]
Epoch 0: 6%|▌ | 749/12384 [1:35:44<24:42:50, 7.65s/it, loss=0.0404, acc=0.9213, iter_time=8.59s]
Epoch 0: 6%|▌ | 750/12384 [1:35:44<24:41:44, 7.64s/it, loss=0.0404, acc=0.9213, iter_time=8.59s]
Epoch 0: 6%|▌ | 750/12384 [1:35:51<24:41:44, 7.64s/it, loss=0.0422, acc=0.9309, iter_time=4.63s]
Epoch 0: 6%|▌ | 751/12384 [1:35:51<24:39:00, 7.63s/it, loss=0.0422, acc=0.9309, iter_time=4.63s]
Epoch 0: 6%|▌ | 751/12384 [1:35:59<24:39:00, 7.63s/it, loss=0.0383, acc=0.9451, iter_time=10.54s]
Epoch 0: 6%|▌ | 752/12384 [1:35:59<24:39:12, 7.63s/it, loss=0.0383, acc=0.9451, iter_time=10.54s]
Epoch 0: 6%|▌ | 752/12384 [1:36:06<24:39:12, 7.63s/it, loss=0.0451, acc=0.9196, iter_time=7.27s]
Epoch 0: 6%|▌ | 753/12384 [1:36:06<24:39:29, 7.63s/it, loss=0.0451, acc=0.9196, iter_time=7.27s]
Epoch 0: 6%|▌ | 753/12384 [1:36:14<24:39:29, 7.63s/it, loss=0.0458, acc=0.9211, iter_time=7.64s]
Epoch 0: 6%|▌ | 754/12384 [1:36:14<24:40:17, 7.64s/it, loss=0.0458, acc=0.9211, iter_time=7.64s]
Epoch 0: 6%|▌ | 754/12384 [1:36:22<24:40:17, 7.64s/it, loss=0.0374, acc=0.9325, iter_time=7.64s]
Epoch 0: 6%|▌ | 755/12384 [1:36:22<24:40:36, 7.64s/it, loss=0.0374, acc=0.9325, iter_time=7.64s]
Epoch 0: 6%|▌ | 755/12384 [1:36:29<24:40:36, 7.64s/it, loss=0.2386, acc=0.8100, iter_time=7.64s]
Epoch 0: 6%|▌ | 756/12384 [1:36:29<24:39:46, 7.64s/it, loss=0.2386, acc=0.8100, iter_time=7.64s]
Epoch 0: 6%|▌ | 756/12384 [1:36:37<24:39:46, 7.64s/it, loss=0.0359, acc=0.9196, iter_time=6.43s]
Epoch 0: 6%|▌ | 757/12384 [1:36:37<24:36:51, 7.62s/it, loss=0.0359, acc=0.9196, iter_time=6.43s]
Epoch 0: 6%|▌ | 757/12384 [1:36:45<24:36:51, 7.62s/it, loss=0.0413, acc=0.9169, iter_time=5.04s]
Epoch 0: 6%|▌ | 758/12384 [1:36:45<24:36:17, 7.62s/it, loss=0.0413, acc=0.9169, iter_time=5.04s]
Epoch 0: 6%|▌ | 758/12384 [1:36:52<24:36:17, 7.62s/it, loss=0.0432, acc=0.9119, iter_time=11.35s]
Epoch 0: 6%|▌ | 759/12384 [1:36:52<24:34:29, 7.61s/it, loss=0.0432, acc=0.9119, iter_time=11.35s]
Epoch 0: 6%|▌ | 759/12384 [1:37:00<24:34:29, 7.61s/it, loss=0.0478, acc=0.9104, iter_time=7.99s]
Epoch 0: 6%|▌ | 760/12384 [1:37:00<24:36:19, 7.62s/it, loss=0.0478, acc=0.9104, iter_time=7.99s]
Epoch 0: 6%|▌ | 760/12384 [1:37:07<24:36:19, 7.62s/it, loss=0.0376, acc=0.9337, iter_time=7.24s]
Epoch 0: 6%|▌ | 761/12384 [1:37:07<24:37:37, 7.63s/it, loss=0.0376, acc=0.9337, iter_time=7.24s]
Epoch 0: 6%|▌ | 761/12384 [1:37:15<24:37:37, 7.63s/it, loss=0.0319, acc=0.9420, iter_time=7.67s]
Epoch 0: 6%|▌ | 762/12384 [1:37:15<24:36:26, 7.62s/it, loss=0.0319, acc=0.9420, iter_time=7.67s]
Epoch 0: 6%|▌ | 762/12384 [1:37:23<24:36:26, 7.62s/it, loss=0.0306, acc=0.9524, iter_time=7.58s]
Epoch 0: 6%|▌ | 763/12384 [1:37:23<24:34:05, 7.61s/it, loss=0.0306, acc=0.9524, iter_time=7.58s]
Epoch 0: 6%|▌ | 763/12384 [1:37:30<24:34:05, 7.61s/it, loss=0.0217, acc=0.9687, iter_time=4.47s]
Epoch 0: 6%|▌ | 764/12384 [1:37:30<24:36:08, 7.62s/it, loss=0.0217, acc=0.9687, iter_time=4.47s]
Epoch 0: 6%|▌ | 764/12384 [1:37:38<24:36:08, 7.62s/it, loss=0.0435, acc=0.9098, iter_time=10.17s]
Epoch 0: 6%|▌ | 765/12384 [1:37:38<24:34:32, 7.61s/it, loss=0.0435, acc=0.9098, iter_time=10.17s]
Epoch 0: 6%|▌ | 765/12384 [1:37:46<24:34:32, 7.61s/it, loss=0.0369, acc=0.9183, iter_time=6.73s]
Epoch 0: 6%|▌ | 766/12384 [1:37:46<24:35:48, 7.62s/it, loss=0.0369, acc=0.9183, iter_time=6.73s]
Epoch 0: 6%|▌ | 766/12384 [1:37:53<24:35:48, 7.62s/it, loss=0.0226, acc=0.9585, iter_time=6.53s]
Epoch 0: 6%|▌ | 767/12384 [1:37:53<24:35:49, 7.62s/it, loss=0.0226, acc=0.9585, iter_time=6.53s]
Epoch 0: 6%|▌ | 767/12384 [1:38:01<24:35:49, 7.62s/it, loss=0.0323, acc=0.9444, iter_time=10.59s]
Epoch 0: 6%|▌ | 768/12384 [1:38:01<24:38:55, 7.64s/it, loss=0.0323, acc=0.9444, iter_time=10.59s]
Epoch 0: 6%|▌ | 768/12384 [1:38:09<24:38:55, 7.64s/it, loss=0.0343, acc=0.9373, iter_time=7.30s]
Epoch 0: 6%|▌ | 769/12384 [1:38:09<24:38:52, 7.64s/it, loss=0.0343, acc=0.9373, iter_time=7.30s]
Epoch 0: 6%|▌ | 769/12384 [1:38:16<24:38:52, 7.64s/it, loss=0.0251, acc=0.9559, iter_time=7.65s]
Epoch 0: 6%|▌ | 770/12384 [1:38:16<24:38:04, 7.64s/it, loss=0.0251, acc=0.9559, iter_time=7.65s]
Epoch 0: 6%|▌ | 770/12384 [1:38:24<24:38:04, 7.64s/it, loss=0.0246, acc=0.9612, iter_time=7.94s]
Epoch 0: 6%|▌ | 771/12384 [1:38:24<24:59:50, 7.75s/it, loss=0.0246, acc=0.9612, iter_time=7.94s]
Epoch 0: 6%|▌ | 771/12384 [1:38:32<24:59:50, 7.75s/it, loss=0.0601, acc=0.8999, iter_time=7.70s]
Epoch 0: 6%|▌ | 772/12384 [1:38:32<24:51:15, 7.71s/it, loss=0.0601, acc=0.8999, iter_time=7.70s]
Epoch 0: 6%|▌ | 772/12384 [1:38:39<24:51:15, 7.71s/it, loss=0.0359, acc=0.9443, iter_time=7.60s]
Epoch 0: 6%|▌ | 773/12384 [1:38:39<24:44:39, 7.67s/it, loss=0.0359, acc=0.9443, iter_time=7.60s]
Epoch 0: 6%|▌ | 773/12384 [1:38:47<24:44:39, 7.67s/it, loss=0.0329, acc=0.9437, iter_time=7.58s]
Epoch 0: 6%|▋ | 774/12384 [1:38:47<24:40:25, 7.65s/it, loss=0.0329, acc=0.9437, iter_time=7.58s]
Epoch 0: 6%|▋ | 774/12384 [1:38:55<24:40:25, 7.65s/it, loss=0.0413, acc=0.9204, iter_time=7.63s]
Epoch 0: 6%|▋ | 775/12384 [1:38:55<24:38:11, 7.64s/it, loss=0.0413, acc=0.9204, iter_time=7.63s]
Epoch 0: 6%|▋ | 775/12384 [1:39:02<24:38:11, 7.64s/it, loss=0.0435, acc=0.9154, iter_time=7.64s]
Epoch 0: 6%|▋ | 776/12384 [1:39:02<24:41:52, 7.66s/it, loss=0.0435, acc=0.9154, iter_time=7.64s]
Epoch 0: 6%|▋ | 776/12384 [1:39:10<24:41:52, 7.66s/it, loss=0.0415, acc=0.9187, iter_time=7.66s]
Epoch 0: 6%|▋ | 777/12384 [1:39:10<24:45:14, 7.68s/it, loss=0.0415, acc=0.9187, iter_time=7.66s]
Epoch 0: 6%|▋ | 777/12384 [1:39:18<24:45:14, 7.68s/it, loss=0.0216, acc=0.9552, iter_time=7.74s]
Epoch 0: 6%|▋ | 778/12384 [1:39:18<24:42:22, 7.66s/it, loss=0.0216, acc=0.9552, iter_time=7.74s]
Epoch 0: 6%|▋ | 778/12384 [1:39:25<24:42:22, 7.66s/it, loss=0.0148, acc=0.9775, iter_time=7.63s]
Epoch 0: 6%|▋ | 779/12384 [1:39:25<24:40:21, 7.65s/it, loss=0.0148, acc=0.9775, iter_time=7.63s]
Epoch 0: 6%|▋ | 779/12384 [1:39:33<24:40:21, 7.65s/it, loss=0.0324, acc=0.9460, iter_time=7.65s]
Epoch 0: 6%|▋ | 780/12384 [1:39:33<24:38:24, 7.64s/it, loss=0.0324, acc=0.9460, iter_time=7.65s]
Epoch 0: 6%|▋ | 780/12384 [1:39:40<24:38:24, 7.64s/it, loss=0.0238, acc=0.9511, iter_time=7.60s]
Epoch 0: 6%|▋ | 781/12384 [1:39:40<24:36:47, 7.64s/it, loss=0.0238, acc=0.9511, iter_time=7.60s]
Epoch 0: 6%|▋ | 781/12384 [1:39:48<24:36:47, 7.64s/it, loss=0.0370, acc=0.9297, iter_time=7.65s]
Epoch 0: 6%|▋ | 782/12384 [1:39:48<24:36:28, 7.64s/it, loss=0.0370, acc=0.9297, iter_time=7.65s]
Epoch 0: 6%|▋ | 782/12384 [1:39:56<24:36:28, 7.64s/it, loss=0.0324, acc=0.9425, iter_time=7.60s]
Epoch 0: 6%|▋ | 783/12384 [1:39:56<24:37:43, 7.64s/it, loss=0.0324, acc=0.9425, iter_time=7.60s]
Epoch 0: 6%|▋ | 783/12384 [1:40:03<24:37:43, 7.64s/it, loss=0.0326, acc=0.9294, iter_time=8.04s]
Epoch 0: 6%|▋ | 784/12384 [1:40:03<24:37:34, 7.64s/it, loss=0.0326, acc=0.9294, iter_time=8.04s]
Epoch 0: 6%|▋ | 784/12384 [1:40:11<24:37:34, 7.64s/it, loss=0.0227, acc=0.9600, iter_time=7.24s]
Epoch 0: 6%|▋ | 785/12384 [1:40:11<24:35:05, 7.63s/it, loss=0.0227, acc=0.9600, iter_time=7.24s]
Epoch 0: 6%|▋ | 785/12384 [1:40:19<24:35:05, 7.63s/it, loss=0.0224, acc=0.9444, iter_time=4.49s]
Epoch 0: 6%|▋ | 786/12384 [1:40:19<24:34:26, 7.63s/it, loss=0.0224, acc=0.9444, iter_time=4.49s]
Epoch 0: 6%|▋ | 786/12384 [1:40:26<24:34:26, 7.63s/it, loss=0.0280, acc=0.9426, iter_time=7.69s]
Epoch 0: 6%|▋ | 787/12384 [1:40:26<24:33:20, 7.62s/it, loss=0.0280, acc=0.9426, iter_time=7.69s]
Epoch 0: 6%|▋ | 787/12384 [1:40:34<24:33:20, 7.62s/it, loss=0.0509, acc=0.9484, iter_time=10.66s]
Epoch 0: 6%|▋ | 788/12384 [1:40:34<24:33:31, 7.62s/it, loss=0.0509, acc=0.9484, iter_time=10.66s]
Epoch 0: 6%|▋ | 788/12384 [1:40:42<24:33:31, 7.62s/it, loss=0.0369, acc=0.9292, iter_time=5.66s]
Epoch 0: 6%|▋ | 789/12384 [1:40:42<24:34:25, 7.63s/it, loss=0.0369, acc=0.9292, iter_time=5.66s]
Epoch 0: 6%|▋ | 789/12384 [1:40:49<24:34:25, 7.63s/it, loss=0.0209, acc=0.9621, iter_time=9.60s]
Epoch 0: 6%|▋ | 790/12384 [1:40:49<24:33:11, 7.62s/it, loss=0.0209, acc=0.9621, iter_time=9.60s]
Epoch 0: 6%|▋ | 790/12384 [1:40:57<24:33:11, 7.62s/it, loss=0.0131, acc=0.9784, iter_time=7.63s]
Epoch 0: 6%|▋ | 791/12384 [1:40:57<24:33:43, 7.63s/it, loss=0.0131, acc=0.9784, iter_time=7.63s]
Epoch 0: 6%|▋ | 791/12384 [1:41:04<24:33:43, 7.63s/it, loss=0.0366, acc=0.9400, iter_time=8.03s]
Epoch 0: 6%|▋ | 792/12384 [1:41:04<24:36:42, 7.64s/it, loss=0.0366, acc=0.9400, iter_time=8.03s]
Epoch 0: 6%|▋ | 792/12384 [1:41:12<24:36:42, 7.64s/it, loss=0.0259, acc=0.9537, iter_time=7.29s]
Epoch 0: 6%|▋ | 793/12384 [1:41:12<24:35:23, 7.64s/it, loss=0.0259, acc=0.9537, iter_time=7.29s]
Epoch 0: 6%|▋ | 793/12384 [1:41:20<24:35:23, 7.64s/it, loss=0.0289, acc=0.9530, iter_time=7.62s]
Epoch 0: 6%|▋ | 794/12384 [1:41:20<24:34:26, 7.63s/it, loss=0.0289, acc=0.9530, iter_time=7.62s]
Epoch 0: 6%|▋ | 794/12384 [1:41:27<24:34:26, 7.63s/it, loss=0.0270, acc=0.9490, iter_time=7.63s]
Epoch 0: 6%|▋ | 795/12384 [1:41:27<24:32:28, 7.62s/it, loss=0.0270, acc=0.9490, iter_time=7.63s]
Epoch 0: 6%|▋ | 795/12384 [1:41:35<24:32:28, 7.62s/it, loss=0.0203, acc=0.9541, iter_time=6.98s]
Epoch 0: 6%|▋ | 796/12384 [1:41:35<24:34:21, 7.63s/it, loss=0.0203, acc=0.9541, iter_time=6.98s]
Epoch 0: 6%|▋ | 796/12384 [1:41:43<24:34:21, 7.63s/it, loss=0.0223, acc=0.9582, iter_time=7.37s]
Epoch 0: 6%|▋ | 797/12384 [1:41:43<24:55:27, 7.74s/it, loss=0.0223, acc=0.9582, iter_time=7.37s]
Epoch 0: 6%|▋ | 797/12384 [1:41:51<24:55:27, 7.74s/it, loss=0.0206, acc=0.9566, iter_time=7.97s]
Epoch 0: 6%|▋ | 798/12384 [1:41:51<24:49:17, 7.71s/it, loss=0.0206, acc=0.9566, iter_time=7.97s]
Epoch 0: 6%|▋ | 798/12384 [1:41:58<24:49:17, 7.71s/it, loss=0.0391, acc=0.9308, iter_time=8.58s]
Epoch 0: 6%|▋ | 799/12384 [1:41:58<24:44:52, 7.69s/it, loss=0.0391, acc=0.9308, iter_time=8.58s]
Epoch 0: 6%|▋ | 799/12384 [1:42:06<24:44:52, 7.69s/it, loss=0.0208, acc=0.9563, iter_time=8.09s]
Epoch 0: 6%|▋ | 800/12384 [1:42:06<24:42:33, 7.68s/it, loss=0.0208, acc=0.9563, iter_time=8.09s]
Epoch 0: 6%|▋ | 800/12384 [1:42:14<24:42:33, 7.68s/it, loss=0.0147, acc=0.9859, iter_time=6.97s]
Epoch 0: 6%|▋ | 801/12384 [1:42:14<24:38:48, 7.66s/it, loss=0.0147, acc=0.9859, iter_time=6.97s]
Epoch 0: 6%|▋ | 801/12384 [1:42:21<24:38:48, 7.66s/it, loss=0.0229, acc=0.9482, iter_time=7.84s]
Epoch 0: 6%|▋ | 802/12384 [1:42:21<24:36:18, 7.65s/it, loss=0.0229, acc=0.9482, iter_time=7.84s]
Epoch 0: 6%|▋ | 802/12384 [1:42:29<24:36:18, 7.65s/it, loss=0.0218, acc=0.9426, iter_time=7.63s]
Epoch 0: 6%|▋ | 803/12384 [1:42:29<24:33:55, 7.64s/it, loss=0.0218, acc=0.9426, iter_time=7.63s]
Epoch 0: 6%|▋ | 803/12384 [1:42:36<24:33:55, 7.64s/it, loss=0.0136, acc=0.9779, iter_time=4.58s]
Epoch 0: 6%|▋ | 804/12384 [1:42:36<24:31:23, 7.62s/it, loss=0.0136, acc=0.9779, iter_time=4.58s]
Epoch 0: 6%|▋ | 804/12384 [1:42:44<24:31:23, 7.62s/it, loss=0.1282, acc=0.8586, iter_time=10.63s]
Epoch 0: 7%|▋ | 805/12384 [1:42:44<24:32:52, 7.63s/it, loss=0.1282, acc=0.8586, iter_time=10.63s]
Epoch 0: 7%|▋ | 805/12384 [1:42:52<24:32:52, 7.63s/it, loss=0.0136, acc=0.9759, iter_time=5.35s]
Epoch 0: 7%|▋ | 806/12384 [1:42:52<24:31:08, 7.62s/it, loss=0.0136, acc=0.9759, iter_time=5.35s]
Epoch 0: 7%|▋ | 806/12384 [1:42:59<24:31:08, 7.62s/it, loss=0.0248, acc=0.9474, iter_time=9.89s]
Epoch 0: 7%|▋ | 807/12384 [1:42:59<24:30:53, 7.62s/it, loss=0.0248, acc=0.9474, iter_time=9.89s]
Epoch 0: 7%|▋ | 807/12384 [1:43:07<24:30:53, 7.62s/it, loss=0.0343, acc=0.9413, iter_time=8.01s]
Epoch 0: 7%|▋ | 808/12384 [1:43:07<24:31:35, 7.63s/it, loss=0.0343, acc=0.9413, iter_time=8.01s]
Epoch 0: 7%|▋ | 808/12384 [1:43:14<24:31:35, 7.63s/it, loss=0.0203, acc=0.9623, iter_time=7.24s]
Epoch 0: 7%|▋ | 809/12384 [1:43:14<24:29:47, 7.62s/it, loss=0.0203, acc=0.9623, iter_time=7.24s]
Epoch 0: 7%|▋ | 809/12384 [1:43:22<24:29:47, 7.62s/it, loss=0.0209, acc=0.9636, iter_time=7.31s]
Epoch 0: 7%|▋ | 810/12384 [1:43:22<24:30:05, 7.62s/it, loss=0.0209, acc=0.9636, iter_time=7.31s]
Epoch 0: 7%|▋ | 810/12384 [1:43:30<24:30:05, 7.62s/it, loss=0.0101, acc=0.9779, iter_time=7.62s]
Epoch 0: 7%|▋ | 811/12384 [1:43:30<24:29:12, 7.62s/it, loss=0.0101, acc=0.9779, iter_time=7.62s]
Epoch 0: 7%|▋ | 811/12384 [1:43:37<24:29:12, 7.62s/it, loss=0.0137, acc=0.9719, iter_time=7.92s]
Epoch 0: 7%|▋ | 812/12384 [1:43:37<24:29:00, 7.62s/it, loss=0.0137, acc=0.9719, iter_time=7.92s]
Epoch 0: 7%|▋ | 812/12384 [1:43:45<24:29:00, 7.62s/it, loss=0.0200, acc=0.9688, iter_time=6.11s]
Epoch 0: 7%|▋ | 813/12384 [1:43:45<24:28:13, 7.61s/it, loss=0.0200, acc=0.9688, iter_time=6.11s]
Epoch 0: 7%|▋ | 813/12384 [1:43:53<24:28:13, 7.61s/it, loss=0.0177, acc=0.9663, iter_time=9.11s]
Epoch 0: 7%|▋ | 814/12384 [1:43:53<24:31:41, 7.63s/it, loss=0.0177, acc=0.9663, iter_time=9.11s]
Epoch 0: 7%|▋ | 814/12384 [1:44:00<24:31:41, 7.63s/it, loss=0.0262, acc=0.9547, iter_time=7.69s]
Epoch 0: 7%|▋ | 815/12384 [1:44:00<24:31:52, 7.63s/it, loss=0.0262, acc=0.9547, iter_time=7.69s]
Epoch 0: 7%|▋ | 815/12384 [1:44:08<24:31:52, 7.63s/it, loss=0.0173, acc=0.9666, iter_time=8.01s]
Epoch 0: 7%|▋ | 816/12384 [1:44:08<24:30:53, 7.63s/it, loss=0.0173, acc=0.9666, iter_time=8.01s]
Epoch 0: 7%|▋ | 816/12384 [1:44:16<24:30:53, 7.63s/it, loss=0.0208, acc=0.9611, iter_time=7.25s]
Epoch 0: 7%|▋ | 817/12384 [1:44:16<24:32:36, 7.64s/it, loss=0.0208, acc=0.9611, iter_time=7.25s]
Epoch 0: 7%|▋ | 817/12384 [1:44:23<24:32:36, 7.64s/it, loss=0.0165, acc=0.9687, iter_time=7.67s]
Epoch 0: 7%|▋ | 818/12384 [1:44:23<24:32:21, 7.64s/it, loss=0.0165, acc=0.9687, iter_time=7.67s]
Epoch 0: 7%|▋ | 818/12384 [1:44:31<24:32:21, 7.64s/it, loss=0.0184, acc=0.9669, iter_time=7.34s]
Epoch 0: 7%|▋ | 819/12384 [1:44:31<24:32:55, 7.64s/it, loss=0.0184, acc=0.9669, iter_time=7.34s]
Epoch 0: 7%|▋ | 819/12384 [1:44:38<24:32:55, 7.64s/it, loss=0.0115, acc=0.9805, iter_time=7.94s]
Epoch 0: 7%|▋ | 820/12384 [1:44:38<24:33:14, 7.64s/it, loss=0.0115, acc=0.9805, iter_time=7.94s]
Epoch 0: 7%|▋ | 820/12384 [1:44:46<24:33:14, 7.64s/it, loss=0.0213, acc=0.9653, iter_time=7.65s]
Epoch 0: 7%|▋ | 821/12384 [1:44:46<24:33:30, 7.65s/it, loss=0.0213, acc=0.9653, iter_time=7.65s]
Epoch 0: 7%|▋ | 821/12384 [1:44:54<24:33:30, 7.65s/it, loss=0.0548, acc=0.9306, iter_time=7.63s]
Epoch 0: 7%|▋ | 822/12384 [1:44:54<24:30:32, 7.63s/it, loss=0.0548, acc=0.9306, iter_time=7.63s]
Epoch 0: 7%|▋ | 822/12384 [1:45:01<24:30:32, 7.63s/it, loss=0.0178, acc=0.9735, iter_time=7.62s]
Epoch 0: 7%|▋ | 823/12384 [1:45:01<24:30:45, 7.63s/it, loss=0.0178, acc=0.9735, iter_time=7.62s]
Epoch 0: 7%|▋ | 823/12384 [1:45:09<24:30:45, 7.63s/it, loss=0.0151, acc=0.9684, iter_time=8.33s]
Epoch 0: 7%|▋ | 824/12384 [1:45:09<24:54:14, 7.76s/it, loss=0.0151, acc=0.9684, iter_time=8.33s]
Epoch 0: 7%|▋ | 824/12384 [1:45:17<24:54:14, 7.76s/it, loss=0.0110, acc=0.9790, iter_time=7.35s]
Epoch 0: 7%|▋ | 825/12384 [1:45:17<24:45:43, 7.71s/it, loss=0.0110, acc=0.9790, iter_time=7.35s]
Epoch 0: 7%|▋ | 825/12384 [1:45:25<24:45:43, 7.71s/it, loss=0.0301, acc=0.9566, iter_time=7.61s]
Epoch 0: 7%|▋ | 826/12384 [1:45:25<24:41:51, 7.69s/it, loss=0.0301, acc=0.9566, iter_time=7.61s]
Epoch 0: 7%|▋ | 826/12384 [1:45:32<24:41:51, 7.69s/it, loss=0.0191, acc=0.9618, iter_time=7.65s]
Epoch 0: 7%|▋ | 827/12384 [1:45:32<24:39:56, 7.68s/it, loss=0.0191, acc=0.9618, iter_time=7.65s]
Epoch 0: 7%|▋ | 827/12384 [1:45:40<24:39:56, 7.68s/it, loss=0.0231, acc=0.9660, iter_time=7.66s]
Epoch 0: 7%|▋ | 828/12384 [1:45:40<24:37:35, 7.67s/it, loss=0.0231, acc=0.9660, iter_time=7.66s]
Epoch 0: 7%|▋ | 828/12384 [1:45:48<24:37:35, 7.67s/it, loss=0.0083, acc=0.9900, iter_time=4.25s]
Epoch 0: 7%|▋ | 829/12384 [1:45:48<24:37:24, 7.67s/it, loss=0.0083, acc=0.9900, iter_time=4.25s]
Epoch 0: 7%|▋ | 829/12384 [1:45:55<24:37:24, 7.67s/it, loss=0.0175, acc=0.9750, iter_time=11.07s]
Epoch 0: 7%|▋ | 830/12384 [1:45:55<24:35:23, 7.66s/it, loss=0.0175, acc=0.9750, iter_time=11.07s]
Epoch 0: 7%|▋ | 830/12384 [1:46:03<24:35:23, 7.66s/it, loss=0.0138, acc=0.9700, iter_time=5.81s]
Epoch 0: 7%|▋ | 831/12384 [1:46:03<24:32:21, 7.65s/it, loss=0.0138, acc=0.9700, iter_time=5.81s]
Epoch 0: 7%|▋ | 831/12384 [1:46:10<24:32:21, 7.65s/it, loss=0.0289, acc=0.9414, iter_time=9.79s]
Epoch 0: 7%|▋ | 832/12384 [1:46:10<24:31:03, 7.64s/it, loss=0.0289, acc=0.9414, iter_time=9.79s]
Epoch 0: 7%|▋ | 832/12384 [1:46:18<24:31:03, 7.64s/it, loss=0.0426, acc=0.9357, iter_time=7.28s]
Epoch 0: 7%|▋ | 833/12384 [1:46:18<24:30:12, 7.64s/it, loss=0.0426, acc=0.9357, iter_time=7.28s]
Epoch 0: 7%|▋ | 833/12384 [1:46:26<24:30:12, 7.64s/it, loss=0.0132, acc=0.9743, iter_time=7.62s]
Epoch 0: 7%|▋ | 834/12384 [1:46:26<24:28:12, 7.63s/it, loss=0.0132, acc=0.9743, iter_time=7.62s]
Epoch 0: 7%|▋ | 834/12384 [1:46:33<24:28:12, 7.63s/it, loss=0.0149, acc=0.9719, iter_time=7.60s]
Epoch 0: 7%|▋ | 835/12384 [1:46:33<24:31:57, 7.65s/it, loss=0.0149, acc=0.9719, iter_time=7.60s]
Epoch 0: 7%|▋ | 835/12384 [1:46:41<24:31:57, 7.65s/it, loss=0.0825, acc=0.8881, iter_time=7.70s]
Epoch 0: 7%|▋ | 836/12384 [1:46:41<24:31:48, 7.65s/it, loss=0.0825, acc=0.8881, iter_time=7.70s]
Epoch 0: 7%|▋ | 836/12384 [1:46:49<24:31:48, 7.65s/it, loss=0.0171, acc=0.9772, iter_time=7.65s]
Epoch 0: 7%|▋ | 837/12384 [1:46:49<24:29:26, 7.64s/it, loss=0.0171, acc=0.9772, iter_time=7.65s]
Epoch 0: 7%|▋ | 837/12384 [1:46:56<24:29:26, 7.64s/it, loss=0.0180, acc=0.9716, iter_time=7.30s]
Epoch 0: 7%|▋ | 838/12384 [1:46:56<24:31:59, 7.65s/it, loss=0.0180, acc=0.9716, iter_time=7.30s]
Epoch 0: 7%|▋ | 838/12384 [1:47:04<24:31:59, 7.65s/it, loss=0.0183, acc=0.9586, iter_time=8.00s]
Epoch 0: 7%|▋ | 839/12384 [1:47:04<24:30:42, 7.64s/it, loss=0.0183, acc=0.9586, iter_time=8.00s]
Epoch 0: 7%|▋ | 839/12384 [1:47:12<24:30:42, 7.64s/it, loss=0.0253, acc=0.9593, iter_time=8.01s]
Epoch 0: 7%|▋ | 840/12384 [1:47:12<24:28:48, 7.63s/it, loss=0.0253, acc=0.9593, iter_time=8.01s]
Epoch 0: 7%|▋ | 840/12384 [1:47:19<24:28:48, 7.63s/it, loss=0.0115, acc=0.9781, iter_time=6.90s]
Epoch 0: 7%|▋ | 841/12384 [1:47:19<24:27:11, 7.63s/it, loss=0.0115, acc=0.9781, iter_time=6.90s]
Epoch 0: 7%|▋ | 841/12384 [1:47:27<24:27:11, 7.63s/it, loss=0.0146, acc=0.9697, iter_time=3.73s]
Epoch 0: 7%|▋ | 842/12384 [1:47:27<24:25:26, 7.62s/it, loss=0.0146, acc=0.9697, iter_time=3.73s]
Epoch 0: 7%|▋ | 842/12384 [1:47:34<24:25:26, 7.62s/it, loss=0.0187, acc=0.9620, iter_time=11.78s]
Epoch 0: 7%|▋ | 843/12384 [1:47:34<24:24:37, 7.61s/it, loss=0.0187, acc=0.9620, iter_time=11.78s]
Epoch 0: 7%|▋ | 843/12384 [1:47:42<24:24:37, 7.61s/it, loss=0.0183, acc=0.9614, iter_time=7.62s]
Epoch 0: 7%|▋ | 844/12384 [1:47:42<24:26:51, 7.63s/it, loss=0.0183, acc=0.9614, iter_time=7.62s]
Epoch 0: 7%|▋ | 844/12384 [1:47:50<24:26:51, 7.63s/it, loss=0.0190, acc=0.9616, iter_time=7.65s]
Epoch 0: 7%|▋ | 845/12384 [1:47:50<24:25:37, 7.62s/it, loss=0.0190, acc=0.9616, iter_time=7.65s]
Epoch 0: 7%|▋ | 845/12384 [1:47:57<24:25:37, 7.62s/it, loss=0.0199, acc=0.9600, iter_time=7.62s]
Epoch 0: 7%|▋ | 846/12384 [1:47:57<24:25:50, 7.62s/it, loss=0.0199, acc=0.9600, iter_time=7.62s]
Epoch 0: 7%|▋ | 846/12384 [1:48:05<24:25:50, 7.62s/it, loss=0.0185, acc=0.9690, iter_time=7.63s]
Epoch 0: 7%|▋ | 847/12384 [1:48:05<24:27:53, 7.63s/it, loss=0.0185, acc=0.9690, iter_time=7.63s]
Epoch 0: 7%|▋ | 847/12384 [1:48:13<24:27:53, 7.63s/it, loss=0.0248, acc=0.9542, iter_time=8.02s]
Epoch 0: 7%|▋ | 848/12384 [1:48:13<24:25:41, 7.62s/it, loss=0.0248, acc=0.9542, iter_time=8.02s]
Epoch 0: 7%|▋ | 848/12384 [1:48:20<24:25:41, 7.62s/it, loss=0.0102, acc=0.9843, iter_time=6.91s]
Epoch 0: 7%|▋ | 849/12384 [1:48:20<24:25:20, 7.62s/it, loss=0.0102, acc=0.9843, iter_time=6.91s]
Epoch 0: 7%|▋ | 849/12384 [1:48:28<24:25:20, 7.62s/it, loss=0.0156, acc=0.9599, iter_time=8.69s]
Epoch 0: 7%|▋ | 850/12384 [1:48:28<24:45:13, 7.73s/it, loss=0.0156, acc=0.9599, iter_time=8.69s]
Epoch 0: 7%|▋ | 850/12384 [1:48:36<24:45:13, 7.73s/it, loss=0.0109, acc=0.9779, iter_time=4.39s]
Epoch 0: 7%|▋ | 851/12384 [1:48:36<24:40:36, 7.70s/it, loss=0.0109, acc=0.9779, iter_time=4.39s]
Epoch 0: 7%|▋ | 851/12384 [1:48:43<24:40:36, 7.70s/it, loss=0.0097, acc=0.9877, iter_time=10.13s]
Epoch 0: 7%|▋ | 852/12384 [1:48:43<24:34:49, 7.67s/it, loss=0.0097, acc=0.9877, iter_time=10.13s]
Epoch 0: 7%|▋ | 852/12384 [1:48:51<24:34:49, 7.67s/it, loss=0.0090, acc=0.9889, iter_time=7.93s]
Epoch 0: 7%|▋ | 853/12384 [1:48:51<24:32:00, 7.66s/it, loss=0.0090, acc=0.9889, iter_time=7.93s]
Epoch 0: 7%|▋ | 853/12384 [1:48:59<24:32:00, 7.66s/it, loss=0.0139, acc=0.9684, iter_time=7.64s]
Epoch 0: 7%|▋ | 854/12384 [1:48:59<24:30:48, 7.65s/it, loss=0.0139, acc=0.9684, iter_time=7.64s]
Epoch 0: 7%|▋ | 854/12384 [1:49:06<24:30:48, 7.65s/it, loss=0.0155, acc=0.9751, iter_time=7.05s]
Epoch 0: 7%|▋ | 855/12384 [1:49:06<24:31:08, 7.66s/it, loss=0.0155, acc=0.9751, iter_time=7.05s]
Epoch 0: 7%|▋ | 855/12384 [1:49:14<24:31:08, 7.66s/it, loss=0.0106, acc=0.9826, iter_time=8.23s]
Epoch 0: 7%|▋ | 856/12384 [1:49:14<24:30:33, 7.65s/it, loss=0.0106, acc=0.9826, iter_time=8.23s]
Epoch 0: 7%|▋ | 856/12384 [1:49:22<24:30:33, 7.65s/it, loss=0.0139, acc=0.9761, iter_time=4.62s]
Epoch 0: 7%|▋ | 857/12384 [1:49:22<24:29:09, 7.65s/it, loss=0.0139, acc=0.9761, iter_time=4.62s]
Epoch 0: 7%|▋ | 857/12384 [1:49:29<24:29:09, 7.65s/it, loss=0.0123, acc=0.9790, iter_time=10.65s]
Epoch 0: 7%|▋ | 858/12384 [1:49:29<24:27:52, 7.64s/it, loss=0.0123, acc=0.9790, iter_time=10.65s]
Epoch 0: 7%|▋ | 858/12384 [1:49:37<24:27:52, 7.64s/it, loss=0.0113, acc=0.9809, iter_time=7.63s]
Epoch 0: 7%|▋ | 859/12384 [1:49:37<24:25:10, 7.63s/it, loss=0.0113, acc=0.9809, iter_time=7.63s]
Epoch 0: 7%|▋ | 859/12384 [1:49:44<24:25:10, 7.63s/it, loss=0.0244, acc=0.9623, iter_time=7.63s]
Epoch 0: 7%|▋ | 860/12384 [1:49:44<24:25:51, 7.63s/it, loss=0.0244, acc=0.9623, iter_time=7.63s]
Epoch 0: 7%|▋ | 860/12384 [1:49:52<24:25:51, 7.63s/it, loss=0.0264, acc=0.9585, iter_time=7.64s]
Epoch 0: 7%|▋ | 861/12384 [1:49:52<24:25:31, 7.63s/it, loss=0.0264, acc=0.9585, iter_time=7.64s]
Epoch 0: 7%|▋ | 861/12384 [1:50:00<24:25:31, 7.63s/it, loss=0.0170, acc=0.9770, iter_time=7.30s]
Epoch 0: 7%|▋ | 862/12384 [1:50:00<24:24:35, 7.63s/it, loss=0.0170, acc=0.9770, iter_time=7.30s]
Epoch 0: 7%|▋ | 862/12384 [1:50:07<24:24:35, 7.63s/it, loss=0.0183, acc=0.9607, iter_time=7.92s]
Epoch 0: 7%|▋ | 863/12384 [1:50:07<24:22:44, 7.62s/it, loss=0.0183, acc=0.9607, iter_time=7.92s]
Epoch 0: 7%|▋ | 863/12384 [1:50:15<24:22:44, 7.62s/it, loss=0.0102, acc=0.9789, iter_time=8.00s]
Epoch 0: 7%|▋ | 864/12384 [1:50:15<24:27:43, 7.64s/it, loss=0.0102, acc=0.9789, iter_time=8.00s]
Epoch 0: 7%|▋ | 864/12384 [1:50:23<24:27:43, 7.64s/it, loss=0.0188, acc=0.9524, iter_time=7.31s]
Epoch 0: 7%|▋ | 865/12384 [1:50:23<24:31:50, 7.67s/it, loss=0.0188, acc=0.9524, iter_time=7.31s]
Epoch 0: 7%|▋ | 865/12384 [1:50:30<24:31:50, 7.67s/it, loss=0.0153, acc=0.9746, iter_time=4.41s]
Epoch 0: 7%|▋ | 866/12384 [1:50:30<24:28:25, 7.65s/it, loss=0.0153, acc=0.9746, iter_time=4.41s]
Epoch 0: 7%|▋ | 866/12384 [1:50:38<24:28:25, 7.65s/it, loss=0.0112, acc=0.9766, iter_time=10.92s]
Epoch 0: 7%|▋ | 867/12384 [1:50:38<24:29:13, 7.65s/it, loss=0.0112, acc=0.9766, iter_time=10.92s]
Epoch 0: 7%|▋ | 867/12384 [1:50:46<24:29:13, 7.65s/it, loss=0.0185, acc=0.9797, iter_time=7.67s]
Epoch 0: 7%|▋ | 868/12384 [1:50:46<24:29:22, 7.66s/it, loss=0.0185, acc=0.9797, iter_time=7.67s]
Epoch 0: 7%|▋ | 868/12384 [1:50:53<24:29:22, 7.66s/it, loss=0.0243, acc=0.9345, iter_time=5.87s]
Epoch 0: 7%|▋ | 869/12384 [1:50:53<24:29:02, 7.65s/it, loss=0.0243, acc=0.9345, iter_time=5.87s]
Epoch 0: 7%|▋ | 869/12384 [1:51:01<24:29:02, 7.65s/it, loss=0.0124, acc=0.9805, iter_time=9.45s]
Epoch 0: 7%|▋ | 870/12384 [1:51:01<24:29:59, 7.66s/it, loss=0.0124, acc=0.9805, iter_time=9.45s]
Epoch 0: 7%|▋ | 870/12384 [1:51:09<24:29:59, 7.66s/it, loss=0.0180, acc=0.9692, iter_time=7.66s]
Epoch 0: 7%|▋ | 871/12384 [1:51:09<24:29:34, 7.66s/it, loss=0.0180, acc=0.9692, iter_time=7.66s]
Epoch 0: 7%|▋ | 871/12384 [1:51:16<24:29:34, 7.66s/it, loss=0.0118, acc=0.9705, iter_time=8.04s]
Epoch 0: 7%|▋ | 872/12384 [1:51:16<24:26:10, 7.64s/it, loss=0.0118, acc=0.9705, iter_time=8.04s]
Epoch 0: 7%|▋ | 872/12384 [1:51:24<24:26:10, 7.64s/it, loss=0.0069, acc=0.9855, iter_time=7.21s]
Epoch 0: 7%|▋ | 873/12384 [1:51:24<24:25:22, 7.64s/it, loss=0.0069, acc=0.9855, iter_time=7.21s]
Epoch 0: 7%|▋ | 873/12384 [1:51:32<24:25:22, 7.64s/it, loss=0.0156, acc=0.9652, iter_time=7.65s]
Epoch 0: 7%|▋ | 874/12384 [1:51:32<24:25:17, 7.64s/it, loss=0.0156, acc=0.9652, iter_time=7.65s]
Epoch 0: 7%|▋ | 874/12384 [1:51:39<24:25:17, 7.64s/it, loss=0.0104, acc=0.9822, iter_time=6.18s]
Epoch 0: 7%|▋ | 875/12384 [1:51:39<24:22:57, 7.63s/it, loss=0.0104, acc=0.9822, iter_time=6.18s]
Epoch 0: 7%|▋ | 875/12384 [1:51:47<24:22:57, 7.63s/it, loss=0.0386, acc=0.9483, iter_time=6.50s]
Epoch 0: 7%|▋ | 876/12384 [1:51:47<24:22:17, 7.62s/it, loss=0.0386, acc=0.9483, iter_time=6.50s]
Epoch 0: 7%|▋ | 876/12384 [1:51:55<24:22:17, 7.62s/it, loss=0.0079, acc=0.9851, iter_time=7.63s]
Epoch 0: 7%|▋ | 877/12384 [1:51:55<24:41:25, 7.72s/it, loss=0.0079, acc=0.9851, iter_time=7.63s]
Epoch 0: 7%|▋ | 877/12384 [1:52:02<24:41:25, 7.72s/it, loss=0.0182, acc=0.9646, iter_time=9.54s]
Epoch 0: 7%|▋ | 878/12384 [1:52:02<24:35:23, 7.69s/it, loss=0.0182, acc=0.9646, iter_time=9.54s]
Epoch 0: 7%|▋ | 878/12384 [1:52:10<24:35:23, 7.69s/it, loss=0.0433, acc=0.9516, iter_time=7.45s]
Epoch 0: 7%|▋ | 879/12384 [1:52:10<24:32:25, 7.68s/it, loss=0.0433, acc=0.9516, iter_time=7.45s]
Epoch 0: 7%|▋ | 879/12384 [1:52:18<24:32:25, 7.68s/it, loss=0.0351, acc=0.9565, iter_time=9.15s]
Epoch 0: 7%|▋ | 880/12384 [1:52:18<24:29:23, 7.66s/it, loss=0.0351, acc=0.9565, iter_time=9.15s]
Epoch 0: 7%|▋ | 880/12384 [1:52:25<24:29:23, 7.66s/it, loss=0.0080, acc=0.9885, iter_time=7.25s]
Epoch 0: 7%|▋ | 881/12384 [1:52:25<24:25:23, 7.64s/it, loss=0.0080, acc=0.9885, iter_time=7.25s]
Epoch 0: 7%|▋ | 881/12384 [1:52:33<24:25:23, 7.64s/it, loss=0.0067, acc=0.9919, iter_time=5.03s]
Epoch 0: 7%|▋ | 882/12384 [1:52:33<24:25:18, 7.64s/it, loss=0.0067, acc=0.9919, iter_time=5.03s]
Epoch 0: 7%|▋ | 882/12384 [1:52:41<24:25:18, 7.64s/it, loss=0.0187, acc=0.9653, iter_time=10.24s]
Epoch 0: 7%|▋ | 883/12384 [1:52:41<24:27:27, 7.66s/it, loss=0.0187, acc=0.9653, iter_time=10.24s]
Epoch 0: 7%|▋ | 883/12384 [1:52:48<24:27:27, 7.66s/it, loss=0.0916, acc=0.8901, iter_time=7.66s]
Epoch 0: 7%|▋ | 884/12384 [1:52:48<24:27:57, 7.66s/it, loss=0.0916, acc=0.8901, iter_time=7.66s]
Epoch 0: 7%|▋ | 884/12384 [1:52:56<24:27:57, 7.66s/it, loss=0.0093, acc=0.9872, iter_time=4.27s]
Epoch 0: 7%|▋ | 885/12384 [1:52:56<24:26:06, 7.65s/it, loss=0.0093, acc=0.9872, iter_time=4.27s]
Epoch 0: 7%|▋ | 885/12384 [1:53:03<24:26:06, 7.65s/it, loss=0.0097, acc=0.9795, iter_time=11.03s]
Epoch 0: 7%|▋ | 886/12384 [1:53:03<24:24:13, 7.64s/it, loss=0.0097, acc=0.9795, iter_time=11.03s]
Epoch 0: 7%|▋ | 886/12384 [1:53:11<24:24:13, 7.64s/it, loss=0.0123, acc=0.9842, iter_time=7.60s]
Epoch 0: 7%|▋ | 887/12384 [1:53:11<24:22:34, 7.63s/it, loss=0.0123, acc=0.9842, iter_time=7.60s]
Epoch 0: 7%|▋ | 887/12384 [1:53:19<24:22:34, 7.63s/it, loss=0.0123, acc=0.9846, iter_time=7.74s]
Epoch 0: 7%|▋ | 888/12384 [1:53:19<24:22:31, 7.63s/it, loss=0.0123, acc=0.9846, iter_time=7.74s]
Epoch 0: 7%|▋ | 888/12384 [1:53:26<24:22:31, 7.63s/it, loss=0.0083, acc=0.9848, iter_time=3.98s]
Epoch 0: 7%|▋ | 889/12384 [1:53:26<24:21:08, 7.63s/it, loss=0.0083, acc=0.9848, iter_time=3.98s]
Epoch 0: 7%|▋ | 889/12384 [1:53:34<24:21:08, 7.63s/it, loss=0.0099, acc=0.9743, iter_time=8.59s]
Epoch 0: 7%|▋ | 890/12384 [1:53:34<24:21:46, 7.63s/it, loss=0.0099, acc=0.9743, iter_time=8.59s]
Epoch 0: 7%|▋ | 890/12384 [1:53:42<24:21:46, 7.63s/it, loss=0.0048, acc=0.9982, iter_time=10.18s]
Epoch 0: 7%|▋ | 891/12384 [1:53:42<24:21:03, 7.63s/it, loss=0.0048, acc=0.9982, iter_time=10.18s]
Epoch 0: 7%|▋ | 891/12384 [1:53:49<24:21:03, 7.63s/it, loss=0.0110, acc=0.9736, iter_time=4.82s]
Epoch 0: 7%|▋ | 892/12384 [1:53:49<24:19:20, 7.62s/it, loss=0.0110, acc=0.9736, iter_time=4.82s]
Epoch 0: 7%|▋ | 892/12384 [1:53:57<24:19:20, 7.62s/it, loss=0.0163, acc=0.9813, iter_time=10.40s]
Epoch 0: 7%|▋ | 893/12384 [1:53:57<24:17:30, 7.61s/it, loss=0.0163, acc=0.9813, iter_time=10.40s]
Epoch 0: 7%|▋ | 893/12384 [1:54:04<24:17:30, 7.61s/it, loss=0.0304, acc=0.9713, iter_time=3.85s]
Epoch 0: 7%|▋ | 894/12384 [1:54:04<24:19:22, 7.62s/it, loss=0.0304, acc=0.9713, iter_time=3.85s]
Epoch 0: 7%|▋ | 894/12384 [1:54:12<24:19:22, 7.62s/it, loss=0.0085, acc=0.9878, iter_time=11.38s]
Epoch 0: 7%|▋ | 895/12384 [1:54:12<24:18:12, 7.62s/it, loss=0.0085, acc=0.9878, iter_time=11.38s]
Epoch 0: 7%|▋ | 895/12384 [1:54:20<24:18:12, 7.62s/it, loss=0.0163, acc=0.9603, iter_time=8.03s]
Epoch 0: 7%|▋ | 896/12384 [1:54:20<24:18:28, 7.62s/it, loss=0.0163, acc=0.9603, iter_time=8.03s]
Epoch 0: 7%|▋ | 896/12384 [1:54:27<24:18:28, 7.62s/it, loss=0.0134, acc=0.9753, iter_time=7.22s]
Epoch 0: 7%|▋ | 897/12384 [1:54:27<24:20:59, 7.63s/it, loss=0.0134, acc=0.9753, iter_time=7.22s]
Epoch 0: 7%|▋ | 897/12384 [1:54:35<24:20:59, 7.63s/it, loss=0.0070, acc=0.9910, iter_time=7.17s]
Epoch 0: 7%|▋ | 898/12384 [1:54:35<24:25:03, 7.65s/it, loss=0.0070, acc=0.9910, iter_time=7.17s]
Epoch 0: 7%|▋ | 898/12384 [1:54:43<24:25:03, 7.65s/it, loss=0.0069, acc=0.9903, iter_time=8.19s]
Epoch 0: 7%|▋ | 899/12384 [1:54:43<24:23:12, 7.64s/it, loss=0.0069, acc=0.9903, iter_time=8.19s]
Epoch 0: 7%|▋ | 899/12384 [1:54:50<24:23:12, 7.64s/it, loss=0.0056, acc=0.9915, iter_time=8.05s]
Epoch 0: 7%|▋ | 900/12384 [1:54:50<24:22:19, 7.64s/it, loss=0.0056, acc=0.9915, iter_time=8.05s]
Epoch 0: 7%|▋ | 900/12384 [1:54:58<24:22:19, 7.64s/it, loss=0.0070, acc=0.9881, iter_time=7.21s]
Epoch 0: 7%|▋ | 901/12384 [1:54:58<24:24:29, 7.65s/it, loss=0.0070, acc=0.9881, iter_time=7.21s]
Epoch 0: 7%|▋ | 901/12384 [1:55:06<24:24:29, 7.65s/it, loss=0.0109, acc=0.9777, iter_time=7.67s]
Epoch 0: 7%|▋ | 902/12384 [1:55:06<24:21:26, 7.64s/it, loss=0.0109, acc=0.9777, iter_time=7.67s]
Epoch 0: 7%|▋ | 902/12384 [1:55:13<24:21:26, 7.64s/it, loss=0.0091, acc=0.9803, iter_time=7.94s]
Epoch 0: 7%|▋ | 903/12384 [1:55:13<24:41:11, 7.74s/it, loss=0.0091, acc=0.9803, iter_time=7.94s]
Epoch 0: 7%|▋ | 903/12384 [1:55:21<24:41:11, 7.74s/it, loss=0.0026, acc=0.9954, iter_time=7.63s]
Epoch 0: 7%|▋ | 904/12384 [1:55:21<24:35:18, 7.71s/it, loss=0.0026, acc=0.9954, iter_time=7.63s]
Epoch 0: 7%|▋ | 904/12384 [1:55:29<24:35:18, 7.71s/it, loss=0.0046, acc=0.9914, iter_time=7.64s]
Epoch 0: 7%|▋ | 905/12384 [1:55:29<24:30:44, 7.69s/it, loss=0.0046, acc=0.9914, iter_time=7.64s]
Epoch 0: 7%|▋ | 905/12384 [1:55:36<24:30:44, 7.69s/it, loss=0.0099, acc=0.9801, iter_time=5.55s]
Epoch 0: 7%|▋ | 906/12384 [1:55:36<24:27:25, 7.67s/it, loss=0.0099, acc=0.9801, iter_time=5.55s]
Epoch 0: 7%|▋ | 906/12384 [1:55:44<24:27:25, 7.67s/it, loss=0.0061, acc=0.9900, iter_time=7.19s]
Epoch 0: 7%|▋ | 907/12384 [1:55:44<24:23:42, 7.65s/it, loss=0.0061, acc=0.9900, iter_time=7.19s]
Epoch 0: 7%|▋ | 907/12384 [1:55:52<24:23:42, 7.65s/it, loss=0.0144, acc=0.9691, iter_time=8.66s]
Epoch 0: 7%|▋ | 908/12384 [1:55:52<24:23:25, 7.65s/it, loss=0.0144, acc=0.9691, iter_time=8.66s]
Epoch 0: 7%|▋ | 908/12384 [1:55:59<24:23:25, 7.65s/it, loss=0.0047, acc=0.9894, iter_time=6.57s]
Epoch 0: 7%|▋ | 909/12384 [1:55:59<24:21:01, 7.64s/it, loss=0.0047, acc=0.9894, iter_time=6.57s]
Epoch 0: 7%|▋ | 909/12384 [1:56:07<24:21:01, 7.64s/it, loss=0.0067, acc=0.9882, iter_time=10.20s]
Epoch 0: 7%|▋ | 910/12384 [1:56:07<24:21:33, 7.64s/it, loss=0.0067, acc=0.9882, iter_time=10.20s]
Epoch 0: 7%|▋ | 910/12384 [1:56:15<24:21:33, 7.64s/it, loss=0.0257, acc=0.9608, iter_time=7.64s]
Epoch 0: 7%|▋ | 911/12384 [1:56:15<24:20:38, 7.64s/it, loss=0.0257, acc=0.9608, iter_time=7.64s]
Epoch 0: 7%|▋ | 911/12384 [1:56:22<24:20:38, 7.64s/it, loss=0.0071, acc=0.9838, iter_time=8.03s]
Epoch 0: 7%|▋ | 912/12384 [1:56:22<24:19:40, 7.63s/it, loss=0.0071, acc=0.9838, iter_time=8.03s]
Epoch 0: 7%|▋ | 912/12384 [1:56:30<24:19:40, 7.63s/it, loss=0.0060, acc=0.9953, iter_time=7.23s]
Epoch 0: 7%|▋ | 913/12384 [1:56:30<24:20:15, 7.64s/it, loss=0.0060, acc=0.9953, iter_time=7.23s]
Epoch 0: 7%|▋ | 913/12384 [1:56:37<24:20:15, 7.64s/it, loss=0.0149, acc=0.9700, iter_time=5.56s]
Epoch 0: 7%|▋ | 914/12384 [1:56:37<24:22:47, 7.65s/it, loss=0.0149, acc=0.9700, iter_time=5.56s]
Epoch 0: 7%|▋ | 914/12384 [1:56:45<24:22:47, 7.65s/it, loss=0.0048, acc=0.9880, iter_time=9.76s]
Epoch 0: 7%|▋ | 915/12384 [1:56:45<24:23:39, 7.66s/it, loss=0.0048, acc=0.9880, iter_time=9.76s]
Epoch 0: 7%|▋ | 915/12384 [1:56:53<24:23:39, 7.66s/it, loss=0.0040, acc=0.9897, iter_time=7.67s]
Epoch 0: 7%|▋ | 916/12384 [1:56:53<24:20:39, 7.64s/it, loss=0.0040, acc=0.9897, iter_time=7.67s]
Epoch 0: 7%|▋ | 916/12384 [1:57:00<24:20:39, 7.64s/it, loss=0.0328, acc=0.9407, iter_time=7.62s]
Epoch 0: 7%|▋ | 917/12384 [1:57:00<24:20:57, 7.64s/it, loss=0.0328, acc=0.9407, iter_time=7.62s]
Epoch 0: 7%|▋ | 917/12384 [1:57:08<24:20:57, 7.64s/it, loss=0.0061, acc=0.9846, iter_time=7.63s]
Epoch 0: 7%|▋ | 918/12384 [1:57:08<24:19:24, 7.64s/it, loss=0.0061, acc=0.9846, iter_time=7.63s]
Epoch 0: 7%|▋ | 918/12384 [1:57:16<24:19:24, 7.64s/it, loss=0.0317, acc=0.9741, iter_time=5.08s]
Epoch 0: 7%|▋ | 919/12384 [1:57:16<24:19:35, 7.64s/it, loss=0.0317, acc=0.9741, iter_time=5.08s]
Epoch 0: 7%|▋ | 919/12384 [1:57:23<24:19:35, 7.64s/it, loss=0.0099, acc=0.9790, iter_time=10.11s]
Epoch 0: 7%|▋ | 920/12384 [1:57:23<24:16:38, 7.62s/it, loss=0.0099, acc=0.9790, iter_time=10.11s]
Epoch 0: 7%|▋ | 920/12384 [1:57:31<24:16:38, 7.62s/it, loss=0.0050, acc=0.9933, iter_time=7.04s]
Epoch 0: 7%|▋ | 921/12384 [1:57:31<24:17:59, 7.63s/it, loss=0.0050, acc=0.9933, iter_time=7.04s]
Epoch 0: 7%|▋ | 921/12384 [1:57:39<24:17:59, 7.63s/it, loss=0.0143, acc=0.9628, iter_time=8.27s]
Epoch 0: 7%|▋ | 922/12384 [1:57:39<24:15:17, 7.62s/it, loss=0.0143, acc=0.9628, iter_time=8.27s]
Epoch 0: 7%|▋ | 922/12384 [1:57:46<24:15:17, 7.62s/it, loss=0.0085, acc=0.9817, iter_time=4.23s]
Epoch 0: 7%|▋ | 923/12384 [1:57:46<24:15:32, 7.62s/it, loss=0.0085, acc=0.9817, iter_time=4.23s]
Epoch 0: 7%|▋ | 923/12384 [1:57:54<24:15:32, 7.62s/it, loss=0.0057, acc=0.9899, iter_time=10.97s]
Epoch 0: 7%|▋ | 924/12384 [1:57:54<24:14:32, 7.62s/it, loss=0.0057, acc=0.9899, iter_time=10.97s]
Epoch 0: 7%|▋ | 924/12384 [1:58:01<24:14:32, 7.62s/it, loss=0.0348, acc=0.9716, iter_time=7.62s]
Epoch 0: 7%|▋ | 925/12384 [1:58:01<24:14:53, 7.62s/it, loss=0.0348, acc=0.9716, iter_time=7.62s]
Epoch 0: 7%|▋ | 925/12384 [1:58:09<24:14:53, 7.62s/it, loss=0.0068, acc=0.9897, iter_time=7.64s]
Epoch 0: 7%|▋ | 926/12384 [1:58:09<24:16:13, 7.63s/it, loss=0.0068, acc=0.9897, iter_time=7.64s]
Epoch 0: 7%|▋ | 926/12384 [1:58:17<24:16:13, 7.63s/it, loss=0.0071, acc=0.9885, iter_time=5.51s]
Epoch 0: 7%|▋ | 927/12384 [1:58:17<24:14:21, 7.62s/it, loss=0.0071, acc=0.9885, iter_time=5.51s]
Epoch 0: 7%|▋ | 927/12384 [1:58:24<24:14:21, 7.62s/it, loss=0.0071, acc=0.9841, iter_time=10.09s]
Epoch 0: 7%|▋ | 928/12384 [1:58:24<24:19:26, 7.64s/it, loss=0.0071, acc=0.9841, iter_time=10.09s]
Epoch 0: 7%|▋ | 928/12384 [1:58:32<24:19:26, 7.64s/it, loss=0.0101, acc=0.9736, iter_time=7.65s]
Epoch 0: 8%|▊ | 929/12384 [1:58:32<24:38:19, 7.74s/it, loss=0.0101, acc=0.9736, iter_time=7.65s]
Epoch 0: 8%|▊ | 929/12384 [1:58:40<24:38:19, 7.74s/it, loss=0.0028, acc=0.9978, iter_time=7.65s]
Epoch 0: 8%|▊ | 930/12384 [1:58:40<24:30:26, 7.70s/it, loss=0.0028, acc=0.9978, iter_time=7.65s]
Epoch 0: 8%|▊ | 930/12384 [1:58:48<24:30:26, 7.70s/it, loss=0.0289, acc=0.9722, iter_time=7.62s]
Epoch 0: 8%|▊ | 931/12384 [1:58:48<24:27:47, 7.69s/it, loss=0.0289, acc=0.9722, iter_time=7.62s]
Epoch 0: 8%|▊ | 931/12384 [1:58:55<24:27:47, 7.69s/it, loss=0.0086, acc=0.9780, iter_time=6.47s]
Epoch 0: 8%|▊ | 932/12384 [1:58:55<24:23:26, 7.67s/it, loss=0.0086, acc=0.9780, iter_time=6.47s]
Epoch 0: 8%|▊ | 932/12384 [1:59:03<24:23:26, 7.67s/it, loss=0.0093, acc=0.9876, iter_time=8.81s]
Epoch 0: 8%|▊ | 933/12384 [1:59:03<24:21:39, 7.66s/it, loss=0.0093, acc=0.9876, iter_time=8.81s]
Epoch 0: 8%|▊ | 933/12384 [1:59:10<24:21:39, 7.66s/it, loss=0.0111, acc=0.9763, iter_time=7.62s]
Epoch 0: 8%|▊ | 934/12384 [1:59:10<24:18:29, 7.64s/it, loss=0.0111, acc=0.9763, iter_time=7.62s]
Epoch 0: 8%|▊ | 934/12384 [1:59:18<24:18:29, 7.64s/it, loss=0.0127, acc=0.9751, iter_time=7.61s]
Epoch 0: 8%|▊ | 935/12384 [1:59:18<24:22:24, 7.66s/it, loss=0.0127, acc=0.9751, iter_time=7.61s]
Epoch 0: 8%|▊ | 935/12384 [1:59:26<24:22:24, 7.66s/it, loss=0.0039, acc=0.9964, iter_time=7.69s]
Epoch 0: 8%|▊ | 936/12384 [1:59:26<24:20:33, 7.65s/it, loss=0.0039, acc=0.9964, iter_time=7.69s]
Epoch 0: 8%|▊ | 936/12384 [1:59:33<24:20:33, 7.65s/it, loss=0.0041, acc=0.9931, iter_time=7.65s]
Epoch 0: 8%|▊ | 937/12384 [1:59:33<24:18:13, 7.64s/it, loss=0.0041, acc=0.9931, iter_time=7.65s]
Epoch 0: 8%|▊ | 937/12384 [1:59:41<24:18:13, 7.64s/it, loss=0.0169, acc=0.9569, iter_time=7.64s]
Epoch 0: 8%|▊ | 938/12384 [1:59:41<24:17:14, 7.64s/it, loss=0.0169, acc=0.9569, iter_time=7.64s]
Epoch 0: 8%|▊ | 938/12384 [1:59:49<24:17:14, 7.64s/it, loss=0.0282, acc=0.9559, iter_time=7.33s]
Epoch 0: 8%|▊ | 939/12384 [1:59:49<24:17:52, 7.64s/it, loss=0.0282, acc=0.9559, iter_time=7.33s]
Epoch 0: 8%|▊ | 939/12384 [1:59:56<24:17:52, 7.64s/it, loss=0.0076, acc=0.9813, iter_time=5.94s]
Epoch 0: 8%|▊ | 940/12384 [1:59:56<24:21:19, 7.66s/it, loss=0.0076, acc=0.9813, iter_time=5.94s]
Epoch 0: 8%|▊ | 940/12384 [2:00:04<24:21:19, 7.66s/it, loss=0.0069, acc=0.9862, iter_time=6.89s]
Epoch 0: 8%|▊ | 941/12384 [2:00:04<24:19:46, 7.65s/it, loss=0.0069, acc=0.9862, iter_time=6.89s]
Epoch 0: 8%|▊ | 941/12384 [2:00:12<24:19:46, 7.65s/it, loss=0.0056, acc=0.9913, iter_time=7.31s]
Epoch 0: 8%|▊ | 942/12384 [2:00:12<24:18:49, 7.65s/it, loss=0.0056, acc=0.9913, iter_time=7.31s]
Epoch 0: 8%|▊ | 942/12384 [2:00:19<24:18:49, 7.65s/it, loss=0.0028, acc=0.9981, iter_time=7.23s]
Epoch 0: 8%|▊ | 943/12384 [2:00:19<24:17:59, 7.65s/it, loss=0.0028, acc=0.9981, iter_time=7.23s]
Epoch 0: 8%|▊ | 943/12384 [2:00:27<24:17:59, 7.65s/it, loss=0.0162, acc=0.9659, iter_time=11.58s]
Epoch 0: 8%|▊ | 944/12384 [2:00:27<24:19:31, 7.65s/it, loss=0.0162, acc=0.9659, iter_time=11.58s]
Epoch 0: 8%|▊ | 944/12384 [2:00:35<24:19:31, 7.65s/it, loss=0.0048, acc=0.9966, iter_time=7.27s]
Epoch 0: 8%|▊ | 945/12384 [2:00:35<24:18:15, 7.65s/it, loss=0.0048, acc=0.9966, iter_time=7.27s]
Epoch 0: 8%|▊ | 945/12384 [2:00:42<24:18:15, 7.65s/it, loss=0.0056, acc=0.9894, iter_time=7.64s]
Epoch 0: 8%|▊ | 946/12384 [2:00:42<24:20:59, 7.66s/it, loss=0.0056, acc=0.9894, iter_time=7.64s]
Epoch 0: 8%|▊ | 946/12384 [2:00:50<24:20:59, 7.66s/it, loss=0.0072, acc=0.9839, iter_time=7.69s]
Epoch 0: 8%|▊ | 947/12384 [2:00:50<24:21:03, 7.66s/it, loss=0.0072, acc=0.9839, iter_time=7.69s]
Epoch 0: 8%|▊ | 947/12384 [2:00:58<24:21:03, 7.66s/it, loss=0.0051, acc=0.9963, iter_time=7.37s]
Epoch 0: 8%|▊ | 948/12384 [2:00:58<24:20:27, 7.66s/it, loss=0.0051, acc=0.9963, iter_time=7.37s]
Epoch 0: 8%|▊ | 948/12384 [2:01:05<24:20:27, 7.66s/it, loss=0.0054, acc=0.9898, iter_time=7.96s]
Epoch 0: 8%|▊ | 949/12384 [2:01:05<24:19:33, 7.66s/it, loss=0.0054, acc=0.9898, iter_time=7.96s]
Epoch 0: 8%|▊ | 949/12384 [2:01:13<24:19:33, 7.66s/it, loss=0.0045, acc=0.9898, iter_time=8.10s]
Epoch 0: 8%|▊ | 950/12384 [2:01:13<24:20:07, 7.66s/it, loss=0.0045, acc=0.9898, iter_time=8.10s]
Epoch 0: 8%|▊ | 950/12384 [2:01:21<24:20:07, 7.66s/it, loss=0.0064, acc=0.9899, iter_time=7.21s]
Epoch 0: 8%|▊ | 951/12384 [2:01:21<24:19:20, 7.66s/it, loss=0.0064, acc=0.9899, iter_time=7.21s]
Epoch 0: 8%|▊ | 951/12384 [2:01:28<24:19:20, 7.66s/it, loss=0.0126, acc=0.9777, iter_time=7.60s]
Epoch 0: 8%|▊ | 952/12384 [2:01:28<24:16:31, 7.64s/it, loss=0.0126, acc=0.9777, iter_time=7.60s]
Epoch 0: 8%|▊ | 952/12384 [2:01:36<24:16:31, 7.64s/it, loss=0.0079, acc=0.9837, iter_time=6.18s]
Epoch 0: 8%|▊ | 953/12384 [2:01:36<24:14:29, 7.63s/it, loss=0.0079, acc=0.9837, iter_time=6.18s]
Epoch 0: 8%|▊ | 953/12384 [2:01:43<24:14:29, 7.63s/it, loss=0.0069, acc=0.9834, iter_time=9.07s]
Epoch 0: 8%|▊ | 954/12384 [2:01:43<24:11:46, 7.62s/it, loss=0.0069, acc=0.9834, iter_time=9.07s]
Epoch 0: 8%|▊ | 954/12384 [2:01:51<24:11:46, 7.62s/it, loss=0.0086, acc=0.9863, iter_time=5.14s]
Epoch 0: 8%|▊ | 955/12384 [2:01:51<24:31:54, 7.73s/it, loss=0.0086, acc=0.9863, iter_time=5.14s]
Epoch 0: 8%|▊ | 955/12384 [2:01:59<24:31:54, 7.73s/it, loss=0.0138, acc=0.9684, iter_time=10.44s]
Epoch 0: 8%|▊ | 956/12384 [2:01:59<24:25:35, 7.69s/it, loss=0.0138, acc=0.9684, iter_time=10.44s]
Epoch 0: 8%|▊ | 956/12384 [2:02:07<24:25:35, 7.69s/it, loss=0.0067, acc=0.9871, iter_time=7.62s]
Epoch 0: 8%|▊ | 957/12384 [2:02:07<24:21:12, 7.67s/it, loss=0.0067, acc=0.9871, iter_time=7.62s]
Epoch 0: 8%|▊ | 957/12384 [2:02:14<24:21:12, 7.67s/it, loss=0.0045, acc=0.9881, iter_time=7.62s]
Epoch 0: 8%|▊ | 958/12384 [2:02:14<24:19:15, 7.66s/it, loss=0.0045, acc=0.9881, iter_time=7.62s]
Epoch 0: 8%|▊ | 958/12384 [2:02:22<24:19:15, 7.66s/it, loss=0.0051, acc=0.9858, iter_time=7.65s]
Epoch 0: 8%|▊ | 959/12384 [2:02:22<24:16:33, 7.65s/it, loss=0.0051, acc=0.9858, iter_time=7.65s]
Epoch 0: 8%|▊ | 959/12384 [2:02:29<24:16:33, 7.65s/it, loss=0.0079, acc=0.9799, iter_time=7.53s]
Epoch 0: 8%|▊ | 960/12384 [2:02:29<24:13:12, 7.63s/it, loss=0.0079, acc=0.9799, iter_time=7.53s]
Epoch 0: 8%|▊ | 960/12384 [2:02:37<24:13:12, 7.63s/it, loss=0.0177, acc=0.9659, iter_time=7.65s]
Epoch 0: 8%|▊ | 961/12384 [2:02:37<24:11:44, 7.63s/it, loss=0.0177, acc=0.9659, iter_time=7.65s]
Epoch 0: 8%|▊ | 961/12384 [2:02:45<24:11:44, 7.63s/it, loss=0.0062, acc=0.9867, iter_time=7.65s]
Epoch 0: 8%|▊ | 962/12384 [2:02:45<24:11:46, 7.63s/it, loss=0.0062, acc=0.9867, iter_time=7.65s]
Epoch 0: 8%|▊ | 962/12384 [2:02:52<24:11:46, 7.63s/it, loss=0.0075, acc=0.9800, iter_time=6.66s]
Epoch 0: 8%|▊ | 963/12384 [2:02:52<24:13:43, 7.64s/it, loss=0.0075, acc=0.9800, iter_time=6.66s]
Epoch 0: 8%|▊ | 963/12384 [2:03:00<24:13:43, 7.64s/it, loss=0.0128, acc=0.9723, iter_time=8.61s]
Epoch 0: 8%|▊ | 964/12384 [2:03:00<24:13:56, 7.64s/it, loss=0.0128, acc=0.9723, iter_time=8.61s]
Epoch 0: 8%|▊ | 964/12384 [2:03:08<24:13:56, 7.64s/it, loss=0.0050, acc=0.9939, iter_time=4.50s]
Epoch 0: 8%|▊ | 965/12384 [2:03:08<24:13:56, 7.64s/it, loss=0.0050, acc=0.9939, iter_time=4.50s]
Epoch 0: 8%|▊ | 965/12384 [2:03:15<24:13:56, 7.64s/it, loss=0.0042, acc=0.9962, iter_time=8.47s]
Epoch 0: 8%|▊ | 966/12384 [2:03:15<24:11:58, 7.63s/it, loss=0.0042, acc=0.9962, iter_time=8.47s]
Epoch 0: 8%|▊ | 966/12384 [2:03:23<24:11:58, 7.63s/it, loss=0.0046, acc=0.9878, iter_time=9.32s]
Epoch 0: 8%|▊ | 967/12384 [2:03:23<24:11:51, 7.63s/it, loss=0.0046, acc=0.9878, iter_time=9.32s]
Epoch 0: 8%|▊ | 967/12384 [2:03:31<24:11:51, 7.63s/it, loss=0.0041, acc=0.9892, iter_time=8.64s]
Epoch 0: 8%|▊ | 968/12384 [2:03:31<24:16:11, 7.65s/it, loss=0.0041, acc=0.9892, iter_time=8.64s]
Epoch 0: 8%|▊ | 968/12384 [2:03:38<24:16:11, 7.65s/it, loss=0.0117, acc=0.9770, iter_time=7.31s]
Epoch 0: 8%|▊ | 969/12384 [2:03:38<24:14:42, 7.65s/it, loss=0.0117, acc=0.9770, iter_time=7.31s]
Epoch 0: 8%|▊ | 969/12384 [2:03:46<24:14:42, 7.65s/it, loss=0.0022, acc=0.9920, iter_time=4.27s]
Epoch 0: 8%|▊ | 970/12384 [2:03:46<24:12:02, 7.63s/it, loss=0.0022, acc=0.9920, iter_time=4.27s]
Epoch 0: 8%|▊ | 970/12384 [2:03:53<24:12:02, 7.63s/it, loss=0.0055, acc=0.9921, iter_time=10.98s]
Epoch 0: 8%|▊ | 971/12384 [2:03:53<24:12:16, 7.63s/it, loss=0.0055, acc=0.9921, iter_time=10.98s]
Epoch 0: 8%|▊ | 971/12384 [2:04:01<24:12:16, 7.63s/it, loss=0.0067, acc=0.9879, iter_time=7.62s]
Epoch 0: 8%|▊ | 972/12384 [2:04:01<24:11:08, 7.63s/it, loss=0.0067, acc=0.9879, iter_time=7.62s]
Epoch 0: 8%|▊ | 972/12384 [2:04:09<24:11:08, 7.63s/it, loss=0.0050, acc=0.9938, iter_time=7.65s]
Epoch 0: 8%|▊ | 973/12384 [2:04:09<24:10:53, 7.63s/it, loss=0.0050, acc=0.9938, iter_time=7.65s]
Epoch 0: 8%|▊ | 973/12384 [2:04:16<24:10:53, 7.63s/it, loss=0.0055, acc=0.9927, iter_time=7.61s]
Epoch 0: 8%|▊ | 974/12384 [2:04:16<24:11:04, 7.63s/it, loss=0.0055, acc=0.9927, iter_time=7.61s]
Epoch 0: 8%|▊ | 974/12384 [2:04:24<24:11:04, 7.63s/it, loss=0.0124, acc=0.9897, iter_time=7.66s]
Epoch 0: 8%|▊ | 975/12384 [2:04:24<24:11:32, 7.63s/it, loss=0.0124, acc=0.9897, iter_time=7.66s]
Epoch 0: 8%|▊ | 975/12384 [2:04:32<24:11:32, 7.63s/it, loss=0.0121, acc=0.9766, iter_time=7.99s]
Epoch 0: 8%|▊ | 976/12384 [2:04:32<24:11:18, 7.63s/it, loss=0.0121, acc=0.9766, iter_time=7.99s]
Epoch 0: 8%|▊ | 976/12384 [2:04:39<24:11:18, 7.63s/it, loss=0.0060, acc=0.9853, iter_time=6.04s]
Epoch 0: 8%|▊ | 977/12384 [2:04:39<24:11:24, 7.63s/it, loss=0.0060, acc=0.9853, iter_time=6.04s]
Epoch 0: 8%|▊ | 977/12384 [2:04:47<24:11:24, 7.63s/it, loss=0.0064, acc=0.9838, iter_time=5.56s]
Epoch 0: 8%|▊ | 978/12384 [2:04:47<24:13:29, 7.65s/it, loss=0.0064, acc=0.9838, iter_time=5.56s]
Epoch 0: 8%|▊ | 978/12384 [2:04:55<24:13:29, 7.65s/it, loss=0.0102, acc=0.9818, iter_time=8.17s]
Epoch 0: 8%|▊ | 979/12384 [2:04:55<24:12:27, 7.64s/it, loss=0.0102, acc=0.9818, iter_time=8.17s]
Epoch 0: 8%|▊ | 979/12384 [2:05:02<24:12:27, 7.64s/it, loss=0.0152, acc=0.9760, iter_time=7.64s]
Epoch 0: 8%|▊ | 980/12384 [2:05:02<24:12:53, 7.64s/it, loss=0.0152, acc=0.9760, iter_time=7.64s]
Epoch 0: 8%|▊ | 980/12384 [2:05:10<24:12:53, 7.64s/it, loss=0.0098, acc=0.9809, iter_time=10.72s]
Epoch 0: 8%|▊ | 981/12384 [2:05:10<24:31:40, 7.74s/it, loss=0.0098, acc=0.9809, iter_time=10.72s]
Epoch 0: 8%|▊ | 981/12384 [2:05:18<24:31:40, 7.74s/it, loss=0.0065, acc=0.9818, iter_time=7.70s]
Epoch 0: 8%|▊ | 982/12384 [2:05:18<24:24:43, 7.71s/it, loss=0.0065, acc=0.9818, iter_time=7.70s]
Epoch 0: 8%|▊ | 982/12384 [2:05:25<24:24:43, 7.71s/it, loss=0.0123, acc=0.9675, iter_time=7.61s]
Epoch 0: 8%|▊ | 983/12384 [2:05:25<24:18:41, 7.68s/it, loss=0.0123, acc=0.9675, iter_time=7.61s]
Epoch 0: 8%|▊ | 983/12384 [2:05:33<24:18:41, 7.68s/it, loss=0.0034, acc=0.9942, iter_time=7.54s]
Epoch 0: 8%|▊ | 984/12384 [2:05:33<24:14:16, 7.65s/it, loss=0.0034, acc=0.9942, iter_time=7.54s]
Epoch 0: 8%|▊ | 984/12384 [2:05:41<24:14:16, 7.65s/it, loss=0.0045, acc=0.9879, iter_time=7.66s]
Epoch 0: 8%|▊ | 985/12384 [2:05:41<24:11:22, 7.64s/it, loss=0.0045, acc=0.9879, iter_time=7.66s]
Epoch 0: 8%|▊ | 985/12384 [2:05:48<24:11:22, 7.64s/it, loss=0.0083, acc=0.9807, iter_time=7.59s]
Epoch 0: 8%|▊ | 986/12384 [2:05:48<24:10:31, 7.64s/it, loss=0.0083, acc=0.9807, iter_time=7.59s]
Epoch 0: 8%|▊ | 986/12384 [2:05:56<24:10:31, 7.64s/it, loss=0.0047, acc=0.9907, iter_time=6.71s]
Epoch 0: 8%|▊ | 987/12384 [2:05:56<24:12:32, 7.65s/it, loss=0.0047, acc=0.9907, iter_time=6.71s]
Epoch 0: 8%|▊ | 987/12384 [2:06:04<24:12:32, 7.65s/it, loss=0.0027, acc=0.9948, iter_time=8.61s]
Epoch 0: 8%|▊ | 988/12384 [2:06:04<24:11:33, 7.64s/it, loss=0.0027, acc=0.9948, iter_time=8.61s]
Epoch 0: 8%|▊ | 988/12384 [2:06:11<24:11:33, 7.64s/it, loss=0.0072, acc=0.9799, iter_time=7.62s]
Epoch 0: 8%|▊ | 989/12384 [2:06:11<24:09:29, 7.63s/it, loss=0.0072, acc=0.9799, iter_time=7.62s]
Epoch 0: 8%|▊ | 989/12384 [2:06:19<24:09:29, 7.63s/it, loss=0.0042, acc=0.9847, iter_time=6.97s]
Epoch 0: 8%|▊ | 990/12384 [2:06:19<24:09:25, 7.63s/it, loss=0.0042, acc=0.9847, iter_time=6.97s]
Epoch 0: 8%|▊ | 990/12384 [2:06:26<24:09:25, 7.63s/it, loss=0.0053, acc=0.9882, iter_time=8.28s]
Epoch 0: 8%|▊ | 991/12384 [2:06:26<24:08:06, 7.63s/it, loss=0.0053, acc=0.9882, iter_time=8.28s]
Epoch 0: 8%|▊ | 991/12384 [2:06:34<24:08:06, 7.63s/it, loss=0.0059, acc=0.9857, iter_time=7.55s]
Epoch 0: 8%|▊ | 992/12384 [2:06:34<24:07:14, 7.62s/it, loss=0.0059, acc=0.9857, iter_time=7.55s]
Epoch 0: 8%|▊ | 992/12384 [2:06:42<24:07:14, 7.62s/it, loss=0.0017, acc=0.9995, iter_time=7.65s]
Epoch 0: 8%|▊ | 993/12384 [2:06:42<24:06:18, 7.62s/it, loss=0.0017, acc=0.9995, iter_time=7.65s]
Epoch 0: 8%|▊ | 993/12384 [2:06:49<24:06:18, 7.62s/it, loss=0.0124, acc=0.9837, iter_time=7.60s]
Epoch 0: 8%|▊ | 994/12384 [2:06:49<24:06:58, 7.62s/it, loss=0.0124, acc=0.9837, iter_time=7.60s]
Epoch 0: 8%|▊ | 994/12384 [2:06:57<24:06:58, 7.62s/it, loss=0.0210, acc=0.9684, iter_time=7.68s]
Epoch 0: 8%|▊ | 995/12384 [2:06:57<24:08:26, 7.63s/it, loss=0.0210, acc=0.9684, iter_time=7.68s]
Epoch 0: 8%|▊ | 995/12384 [2:07:04<24:08:26, 7.63s/it, loss=0.0028, acc=0.9942, iter_time=7.61s]
Epoch 0: 8%|▊ | 996/12384 [2:07:04<24:06:30, 7.62s/it, loss=0.0028, acc=0.9942, iter_time=7.61s]
Epoch 0: 8%|▊ | 996/12384 [2:07:12<24:06:30, 7.62s/it, loss=0.0053, acc=0.9909, iter_time=7.62s]
Epoch 0: 8%|▊ | 997/12384 [2:07:12<24:07:22, 7.63s/it, loss=0.0053, acc=0.9909, iter_time=7.62s]
Epoch 0: 8%|▊ | 997/12384 [2:07:20<24:07:22, 7.63s/it, loss=0.0038, acc=0.9914, iter_time=7.63s]
Epoch 0: 8%|▊ | 998/12384 [2:07:20<24:06:39, 7.62s/it, loss=0.0038, acc=0.9914, iter_time=7.63s]
Epoch 0: 8%|▊ | 998/12384 [2:07:27<24:06:39, 7.62s/it, loss=0.0072, acc=0.9869, iter_time=7.59s]
Epoch 0: 8%|▊ | 999/12384 [2:07:27<24:06:45, 7.62s/it, loss=0.0072, acc=0.9869, iter_time=7.59s]
Epoch 0: 8%|▊ | 999/12384 [2:07:35<24:06:45, 7.62s/it, loss=0.0031, acc=0.9893, iter_time=8.08s]
Epoch 0: 8%|▊ | 1000/12384 [2:07:35<24:19:36, 7.69s/it, loss=0.0031, acc=0.9893, iter_time=8.08s]
Epoch 0: 8%|▊ | 1000/12384 [2:07:43<24:19:36, 7.69s/it, loss=0.0037, acc=0.9923, iter_time=7.40s]
Epoch 0: 8%|▊ | 1001/12384 [2:07:43<24:18:34, 7.69s/it, loss=0.0037, acc=0.9923, iter_time=7.40s]
Epoch 0: 8%|▊ | 1001/12384 [2:07:51<24:18:34, 7.69s/it, loss=0.0036, acc=0.9895, iter_time=7.69s]
Epoch 0: 8%|▊ | 1002/12384 [2:07:51<24:14:21, 7.67s/it, loss=0.0036, acc=0.9895, iter_time=7.69s]
Epoch 0: 8%|▊ | 1002/12384 [2:07:58<24:14:21, 7.67s/it, loss=0.0148, acc=0.9791, iter_time=7.61s]
Epoch 0: 8%|▊ | 1003/12384 [2:07:58<24:12:05, 7.66s/it, loss=0.0148, acc=0.9791, iter_time=7.61s]
Epoch 0: 8%|▊ | 1003/12384 [2:08:06<24:12:05, 7.66s/it, loss=0.0058, acc=0.9831, iter_time=7.61s]
Epoch 0: 8%|▊ | 1004/12384 [2:08:06<24:09:25, 7.64s/it, loss=0.0058, acc=0.9831, iter_time=7.61s]
Epoch 0: 8%|▊ | 1004/12384 [2:08:13<24:09:25, 7.64s/it, loss=0.0033, acc=0.9912, iter_time=7.63s]
Epoch 0: 8%|▊ | 1005/12384 [2:08:13<24:10:25, 7.65s/it, loss=0.0033, acc=0.9912, iter_time=7.63s]
Epoch 0: 8%|▊ | 1005/12384 [2:08:21<24:10:25, 7.65s/it, loss=0.0048, acc=0.9879, iter_time=7.95s]
Epoch 0: 8%|▊ | 1006/12384 [2:08:21<24:23:44, 7.72s/it, loss=0.0048, acc=0.9879, iter_time=7.95s]
Epoch 0: 8%|▊ | 1006/12384 [2:08:29<24:23:44, 7.72s/it, loss=0.0050, acc=0.9908, iter_time=5.26s]
Epoch 0: 8%|▊ | 1007/12384 [2:08:29<24:16:39, 7.68s/it, loss=0.0050, acc=0.9908, iter_time=5.26s]
Epoch 0: 8%|▊ | 1007/12384 [2:08:37<24:16:39, 7.68s/it, loss=0.0141, acc=0.9724, iter_time=10.38s]
Epoch 0: 8%|▊ | 1008/12384 [2:08:37<24:31:53, 7.76s/it, loss=0.0141, acc=0.9724, iter_time=10.38s]
Epoch 0: 8%|▊ | 1008/12384 [2:08:45<24:31:53, 7.76s/it, loss=0.0036, acc=0.9910, iter_time=7.51s]
Epoch 0: 8%|▊ | 1009/12384 [2:08:45<24:25:42, 7.73s/it, loss=0.0036, acc=0.9910, iter_time=7.51s]
Epoch 0: 8%|▊ | 1009/12384 [2:08:52<24:25:42, 7.73s/it, loss=0.0130, acc=0.9754, iter_time=7.69s]
Epoch 0: 8%|▊ | 1010/12384 [2:08:52<24:20:05, 7.70s/it, loss=0.0130, acc=0.9754, iter_time=7.69s]
Epoch 0: 8%|▊ | 1010/12384 [2:09:00<24:20:05, 7.70s/it, loss=0.0031, acc=0.9924, iter_time=7.61s]
Epoch 0: 8%|▊ | 1011/12384 [2:09:00<24:14:39, 7.67s/it, loss=0.0031, acc=0.9924, iter_time=7.61s]
Epoch 0: 8%|▊ | 1011/12384 [2:09:07<24:14:39, 7.67s/it, loss=0.0112, acc=0.9841, iter_time=7.61s]
Epoch 0: 8%|▊ | 1012/12384 [2:09:07<24:14:25, 7.67s/it, loss=0.0112, acc=0.9841, iter_time=7.61s]
Epoch 0: 8%|▊ | 1012/12384 [2:09:15<24:14:25, 7.67s/it, loss=0.0066, acc=0.9865, iter_time=7.65s]
Epoch 0: 8%|▊ | 1013/12384 [2:09:15<24:09:50, 7.65s/it, loss=0.0066, acc=0.9865, iter_time=7.65s]
Epoch 0: 8%|▊ | 1013/12384 [2:09:23<24:09:50, 7.65s/it, loss=0.0024, acc=0.9921, iter_time=7.59s]
Epoch 0: 8%|▊ | 1014/12384 [2:09:23<24:08:22, 7.64s/it, loss=0.0024, acc=0.9921, iter_time=7.59s]
Epoch 0: 8%|▊ | 1014/12384 [2:09:30<24:08:22, 7.64s/it, loss=0.0065, acc=0.9930, iter_time=7.64s]
Epoch 0: 8%|▊ | 1015/12384 [2:09:30<24:10:31, 7.66s/it, loss=0.0065, acc=0.9930, iter_time=7.64s]
Epoch 0: 8%|▊ | 1015/12384 [2:09:38<24:10:31, 7.66s/it, loss=0.0042, acc=0.9923, iter_time=8.07s]
Epoch 0: 8%|▊ | 1016/12384 [2:09:38<24:09:48, 7.65s/it, loss=0.0042, acc=0.9923, iter_time=8.07s]
Epoch 0: 8%|▊ | 1016/12384 [2:09:46<24:09:48, 7.65s/it, loss=0.0075, acc=0.9877, iter_time=7.26s]
Epoch 0: 8%|▊ | 1017/12384 [2:09:46<24:08:06, 7.64s/it, loss=0.0075, acc=0.9877, iter_time=7.26s]
Epoch 0: 8%|▊ | 1017/12384 [2:09:53<24:08:06, 7.64s/it, loss=0.0109, acc=0.9815, iter_time=7.62s]
Epoch 0: 8%|▊ | 1018/12384 [2:09:53<24:06:33, 7.64s/it, loss=0.0109, acc=0.9815, iter_time=7.62s]
Epoch 0: 8%|▊ | 1018/12384 [2:10:01<24:06:33, 7.64s/it, loss=0.0056, acc=0.9881, iter_time=5.82s]
Epoch 0: 8%|▊ | 1019/12384 [2:10:01<24:04:06, 7.62s/it, loss=0.0056, acc=0.9881, iter_time=5.82s]
Epoch 0: 8%|▊ | 1019/12384 [2:10:08<24:04:06, 7.62s/it, loss=0.0039, acc=0.9879, iter_time=7.85s]
Epoch 0: 8%|▊ | 1020/12384 [2:10:08<24:02:43, 7.62s/it, loss=0.0039, acc=0.9879, iter_time=7.85s]
Epoch 0: 8%|▊ | 1020/12384 [2:10:16<24:02:43, 7.62s/it, loss=0.0122, acc=0.9763, iter_time=9.13s]
Epoch 0: 8%|▊ | 1021/12384 [2:10:16<24:00:47, 7.61s/it, loss=0.0122, acc=0.9763, iter_time=9.13s]
Epoch 0: 8%|▊ | 1021/12384 [2:10:24<24:00:47, 7.61s/it, loss=0.0047, acc=0.9898, iter_time=7.59s]
Epoch 0: 8%|▊ | 1022/12384 [2:10:24<24:02:24, 7.62s/it, loss=0.0047, acc=0.9898, iter_time=7.59s]
Epoch 0: 8%|▊ | 1022/12384 [2:10:31<24:02:24, 7.62s/it, loss=0.0020, acc=0.9959, iter_time=7.66s]
Epoch 0: 8%|▊ | 1023/12384 [2:10:31<24:05:35, 7.63s/it, loss=0.0020, acc=0.9959, iter_time=7.66s]
Epoch 0: 8%|▊ | 1023/12384 [2:10:39<24:05:35, 7.63s/it, loss=0.0020, acc=0.9976, iter_time=7.65s]
Epoch 0: 8%|▊ | 1024/12384 [2:10:39<24:06:11, 7.64s/it, loss=0.0020, acc=0.9976, iter_time=7.65s]
Epoch 0: 8%|▊ | 1024/12384 [2:10:47<24:06:11, 7.64s/it, loss=0.0025, acc=0.9925, iter_time=7.66s]
Epoch 0: 8%|▊ | 1025/12384 [2:10:47<24:04:54, 7.63s/it, loss=0.0025, acc=0.9925, iter_time=7.66s]
Epoch 0: 8%|▊ | 1025/12384 [2:10:54<24:04:54, 7.63s/it, loss=0.0031, acc=0.9926, iter_time=4.60s]
Epoch 0: 8%|▊ | 1026/12384 [2:10:54<24:06:06, 7.64s/it, loss=0.0031, acc=0.9926, iter_time=4.60s]
Epoch 0: 8%|▊ | 1026/12384 [2:11:02<24:06:06, 7.64s/it, loss=0.0125, acc=0.9719, iter_time=10.68s]
Epoch 0: 8%|▊ | 1027/12384 [2:11:02<24:06:45, 7.64s/it, loss=0.0125, acc=0.9719, iter_time=10.68s]
Epoch 0: 8%|▊ | 1027/12384 [2:11:10<24:06:45, 7.64s/it, loss=0.0014, acc=0.9990, iter_time=7.33s]
Epoch 0: 8%|▊ | 1028/12384 [2:11:10<24:06:24, 7.64s/it, loss=0.0014, acc=0.9990, iter_time=7.33s]
Epoch 0: 8%|▊ | 1028/12384 [2:11:17<24:06:24, 7.64s/it, loss=0.0025, acc=0.9945, iter_time=6.23s]
Epoch 0: 8%|▊ | 1029/12384 [2:11:17<24:06:39, 7.64s/it, loss=0.0025, acc=0.9945, iter_time=6.23s]
Epoch 0: 8%|▊ | 1029/12384 [2:11:25<24:06:39, 7.64s/it, loss=0.0064, acc=0.9901, iter_time=9.37s]
Epoch 0: 8%|▊ | 1030/12384 [2:11:25<24:05:51, 7.64s/it, loss=0.0064, acc=0.9901, iter_time=9.37s]
Epoch 0: 8%|▊ | 1030/12384 [2:11:32<24:05:51, 7.64s/it, loss=0.0037, acc=0.9942, iter_time=7.66s]
Epoch 0: 8%|▊ | 1031/12384 [2:11:32<24:05:45, 7.64s/it, loss=0.0037, acc=0.9942, iter_time=7.66s]
Epoch 0: 8%|▊ | 1031/12384 [2:11:40<24:05:45, 7.64s/it, loss=0.0344, acc=0.9582, iter_time=7.61s]
Epoch 0: 8%|▊ | 1032/12384 [2:11:40<24:06:26, 7.65s/it, loss=0.0344, acc=0.9582, iter_time=7.61s]
Epoch 0: 8%|▊ | 1032/12384 [2:11:48<24:06:26, 7.65s/it, loss=0.0038, acc=0.9897, iter_time=7.96s]
Epoch 0: 8%|▊ | 1033/12384 [2:11:48<24:21:06, 7.72s/it, loss=0.0038, acc=0.9897, iter_time=7.96s]
Epoch 0: 8%|▊ | 1033/12384 [2:11:56<24:21:06, 7.72s/it, loss=0.0090, acc=0.9823, iter_time=6.13s]
Epoch 0: 8%|▊ | 1034/12384 [2:11:56<24:34:01, 7.79s/it, loss=0.0090, acc=0.9823, iter_time=6.13s]
Epoch 0: 8%|▊ | 1034/12384 [2:12:04<24:34:01, 7.79s/it, loss=0.0085, acc=0.9762, iter_time=9.42s]
Epoch 0: 8%|▊ | 1035/12384 [2:12:04<24:22:58, 7.73s/it, loss=0.0085, acc=0.9762, iter_time=9.42s]
Epoch 0: 8%|▊ | 1035/12384 [2:12:11<24:22:58, 7.73s/it, loss=0.0046, acc=0.9904, iter_time=7.66s]
Epoch 0: 8%|▊ | 1036/12384 [2:12:11<24:18:27, 7.71s/it, loss=0.0046, acc=0.9904, iter_time=7.66s]
Epoch 0: 8%|▊ | 1036/12384 [2:12:19<24:18:27, 7.71s/it, loss=0.0035, acc=0.9900, iter_time=5.36s]
Epoch 0: 8%|▊ | 1037/12384 [2:12:19<24:12:10, 7.68s/it, loss=0.0035, acc=0.9900, iter_time=5.36s]
Epoch 0: 8%|▊ | 1037/12384 [2:12:26<24:12:10, 7.68s/it, loss=0.0055, acc=0.9900, iter_time=9.85s]
Epoch 0: 8%|▊ | 1038/12384 [2:12:26<24:09:12, 7.66s/it, loss=0.0055, acc=0.9900, iter_time=9.85s]
Epoch 0: 8%|▊ | 1038/12384 [2:12:34<24:09:12, 7.66s/it, loss=0.0053, acc=0.9886, iter_time=7.61s]
Epoch 0: 8%|▊ | 1039/12384 [2:12:34<24:06:53, 7.65s/it, loss=0.0053, acc=0.9886, iter_time=7.61s]
Epoch 0: 8%|▊ | 1039/12384 [2:12:42<24:06:53, 7.65s/it, loss=0.0073, acc=0.9914, iter_time=8.01s]
Epoch 0: 8%|▊ | 1040/12384 [2:12:42<24:04:31, 7.64s/it, loss=0.0073, acc=0.9914, iter_time=8.01s]
Epoch 0: 8%|▊ | 1040/12384 [2:12:49<24:04:31, 7.64s/it, loss=0.0017, acc=0.9949, iter_time=4.09s]
Epoch 0: 8%|▊ | 1041/12384 [2:12:49<24:05:20, 7.65s/it, loss=0.0017, acc=0.9949, iter_time=4.09s]
Epoch 0: 8%|▊ | 1041/12384 [2:12:57<24:05:20, 7.65s/it, loss=0.5570, acc=0.7423, iter_time=10.50s]
Epoch 0: 8%|▊ | 1042/12384 [2:12:57<24:05:00, 7.64s/it, loss=0.5570, acc=0.7423, iter_time=10.50s]
Epoch 0: 8%|▊ | 1042/12384 [2:13:05<24:05:00, 7.64s/it, loss=0.0054, acc=0.9913, iter_time=7.95s]
Epoch 0: 8%|▊ | 1043/12384 [2:13:05<24:05:05, 7.65s/it, loss=0.0054, acc=0.9913, iter_time=7.95s]
Epoch 0: 8%|▊ | 1043/12384 [2:13:12<24:05:05, 7.65s/it, loss=0.0042, acc=0.9910, iter_time=4.33s]
Epoch 0: 8%|▊ | 1044/12384 [2:13:12<24:01:51, 7.63s/it, loss=0.0042, acc=0.9910, iter_time=4.33s]
Epoch 0: 8%|▊ | 1044/12384 [2:13:20<24:01:51, 7.63s/it, loss=0.0046, acc=0.9945, iter_time=9.17s]
Epoch 0: 8%|▊ | 1045/12384 [2:13:20<23:59:58, 7.62s/it, loss=0.0046, acc=0.9945, iter_time=9.17s]
Epoch 0: 8%|▊ | 1045/12384 [2:13:28<23:59:58, 7.62s/it, loss=0.0008, acc=0.9980, iter_time=7.09s]
Epoch 0: 8%|▊ | 1046/12384 [2:13:28<24:03:00, 7.64s/it, loss=0.0008, acc=0.9980, iter_time=7.09s]
Epoch 0: 8%|▊ | 1046/12384 [2:13:35<24:03:00, 7.64s/it, loss=0.0017, acc=0.9987, iter_time=9.92s]
Epoch 0: 8%|▊ | 1047/12384 [2:13:35<24:02:51, 7.64s/it, loss=0.0017, acc=0.9987, iter_time=9.92s]
Epoch 0: 8%|▊ | 1047/12384 [2:13:43<24:02:51, 7.64s/it, loss=0.0029, acc=0.9876, iter_time=8.03s]
Epoch 0: 8%|▊ | 1048/12384 [2:13:43<24:00:54, 7.63s/it, loss=0.0029, acc=0.9876, iter_time=8.03s]
Epoch 0: 8%|▊ | 1048/12384 [2:13:50<24:00:54, 7.63s/it, loss=0.0029, acc=0.9957, iter_time=7.21s]
Epoch 0: 8%|▊ | 1049/12384 [2:13:50<24:01:35, 7.63s/it, loss=0.0029, acc=0.9957, iter_time=7.21s]
Epoch 0: 8%|▊ | 1049/12384 [2:13:58<24:01:35, 7.63s/it, loss=0.0153, acc=0.9740, iter_time=8.05s]
Epoch 0: 8%|▊ | 1050/12384 [2:13:58<24:00:47, 7.63s/it, loss=0.0153, acc=0.9740, iter_time=8.05s]
Epoch 0: 8%|▊ | 1050/12384 [2:14:06<24:00:47, 7.63s/it, loss=0.0118, acc=0.9700, iter_time=6.61s]
Epoch 0: 8%|▊ | 1051/12384 [2:14:06<23:59:57, 7.62s/it, loss=0.0118, acc=0.9700, iter_time=6.61s]
Epoch 0: 8%|▊ | 1051/12384 [2:14:13<23:59:57, 7.62s/it, loss=0.0067, acc=0.9849, iter_time=8.22s]
Epoch 0: 8%|▊ | 1052/12384 [2:14:13<23:59:57, 7.62s/it, loss=0.0067, acc=0.9849, iter_time=8.22s]
Epoch 0: 8%|▊ | 1052/12384 [2:14:21<23:59:57, 7.62s/it, loss=0.0013, acc=0.9975, iter_time=4.44s]
Epoch 0: 9%|▊ | 1053/12384 [2:14:21<24:05:07, 7.65s/it, loss=0.0013, acc=0.9975, iter_time=4.44s]
Epoch 0: 9%|▊ | 1053/12384 [2:14:29<24:05:07, 7.65s/it, loss=0.0042, acc=0.9887, iter_time=9.14s]
Epoch 0: 9%|▊ | 1054/12384 [2:14:29<24:03:45, 7.65s/it, loss=0.0042, acc=0.9887, iter_time=9.14s]
Epoch 0: 9%|▊ | 1054/12384 [2:14:36<24:03:45, 7.65s/it, loss=0.0031, acc=0.9946, iter_time=9.42s]
Epoch 0: 9%|▊ | 1055/12384 [2:14:36<24:01:44, 7.64s/it, loss=0.0031, acc=0.9946, iter_time=9.42s]
Epoch 0: 9%|▊ | 1055/12384 [2:14:44<24:01:44, 7.64s/it, loss=0.0053, acc=0.9915, iter_time=7.57s]
Epoch 0: 9%|▊ | 1056/12384 [2:14:44<24:00:39, 7.63s/it, loss=0.0053, acc=0.9915, iter_time=7.57s]
Epoch 0: 9%|▊ | 1056/12384 [2:14:51<24:00:39, 7.63s/it, loss=0.0066, acc=0.9869, iter_time=3.90s]
Epoch 0: 9%|▊ | 1057/12384 [2:14:51<23:59:10, 7.62s/it, loss=0.0066, acc=0.9869, iter_time=3.90s]
Epoch 0: 9%|▊ | 1057/12384 [2:14:59<23:59:10, 7.62s/it, loss=0.0075, acc=0.9860, iter_time=11.33s]
Epoch 0: 9%|▊ | 1058/12384 [2:14:59<23:59:28, 7.63s/it, loss=0.0075, acc=0.9860, iter_time=11.33s]
Epoch 0: 9%|▊ | 1058/12384 [2:15:07<23:59:28, 7.63s/it, loss=0.0016, acc=0.9973, iter_time=7.66s]
Epoch 0: 9%|▊ | 1059/12384 [2:15:07<23:58:55, 7.62s/it, loss=0.0016, acc=0.9973, iter_time=7.66s]
Epoch 0: 9%|▊ | 1059/12384 [2:15:15<23:58:55, 7.62s/it, loss=0.0038, acc=0.9930, iter_time=7.91s]
Epoch 0: 9%|▊ | 1060/12384 [2:15:15<24:14:29, 7.71s/it, loss=0.0038, acc=0.9930, iter_time=7.91s]
Epoch 0: 9%|▊ | 1060/12384 [2:15:23<24:14:29, 7.71s/it, loss=0.0093, acc=0.9816, iter_time=7.67s]
Epoch 0: 9%|▊ | 1061/12384 [2:15:23<24:26:31, 7.77s/it, loss=0.0093, acc=0.9816, iter_time=7.67s]
Epoch 0: 9%|▊ | 1061/12384 [2:15:30<24:26:31, 7.77s/it, loss=0.0259, acc=0.9664, iter_time=7.56s]
Epoch 0: 9%|▊ | 1062/12384 [2:15:30<24:18:30, 7.73s/it, loss=0.0259, acc=0.9664, iter_time=7.56s]
Epoch 0: 9%|▊ | 1062/12384 [2:15:38<24:18:30, 7.73s/it, loss=0.0054, acc=0.9909, iter_time=7.93s]
Epoch 0: 9%|▊ | 1063/12384 [2:15:38<24:13:58, 7.71s/it, loss=0.0054, acc=0.9909, iter_time=7.93s]
Epoch 0: 9%|▊ | 1063/12384 [2:15:45<24:13:58, 7.71s/it, loss=0.0047, acc=0.9945, iter_time=8.02s]
Epoch 0: 9%|▊ | 1064/12384 [2:15:45<24:08:51, 7.68s/it, loss=0.0047, acc=0.9945, iter_time=8.02s]
Epoch 0: 9%|▊ | 1064/12384 [2:15:53<24:08:51, 7.68s/it, loss=0.0019, acc=0.9982, iter_time=4.12s]
Epoch 0: 9%|▊ | 1065/12384 [2:15:53<24:05:15, 7.66s/it, loss=0.0019, acc=0.9982, iter_time=4.12s]
Epoch 0: 9%|▊ | 1065/12384 [2:16:01<24:05:15, 7.66s/it, loss=0.0088, acc=0.9754, iter_time=7.00s]
Epoch 0: 9%|▊ | 1066/12384 [2:16:01<24:01:44, 7.64s/it, loss=0.0088, acc=0.9754, iter_time=7.00s]
Epoch 0: 9%|▊ | 1066/12384 [2:16:08<24:01:44, 7.64s/it, loss=0.0053, acc=0.9916, iter_time=11.34s]
Epoch 0: 9%|▊ | 1067/12384 [2:16:08<24:00:59, 7.64s/it, loss=0.0053, acc=0.9916, iter_time=11.34s]
Epoch 0: 9%|▊ | 1067/12384 [2:16:16<24:00:59, 7.64s/it, loss=0.0053, acc=0.9881, iter_time=7.72s]
Epoch 0: 9%|▊ | 1068/12384 [2:16:16<24:03:29, 7.65s/it, loss=0.0053, acc=0.9881, iter_time=7.72s]
Epoch 0: 9%|▊ | 1068/12384 [2:16:24<24:03:29, 7.65s/it, loss=0.0033, acc=0.9901, iter_time=7.61s]
Epoch 0: 9%|▊ | 1069/12384 [2:16:24<24:00:21, 7.64s/it, loss=0.0033, acc=0.9901, iter_time=7.61s]
Epoch 0: 9%|▊ | 1069/12384 [2:16:31<24:00:21, 7.64s/it, loss=0.0090, acc=0.9896, iter_time=7.60s]
Epoch 0: 9%|▊ | 1070/12384 [2:16:31<23:58:48, 7.63s/it, loss=0.0090, acc=0.9896, iter_time=7.60s]
Epoch 0: 9%|▊ | 1070/12384 [2:16:39<23:58:48, 7.63s/it, loss=0.0053, acc=0.9913, iter_time=7.61s]
Epoch 0: 9%|▊ | 1071/12384 [2:16:39<23:57:25, 7.62s/it, loss=0.0053, acc=0.9913, iter_time=7.61s]
Epoch 0: 9%|▊ | 1071/12384 [2:16:46<23:57:25, 7.62s/it, loss=0.0068, acc=0.9760, iter_time=7.65s]
Epoch 0: 9%|▊ | 1072/12384 [2:16:46<24:02:12, 7.65s/it, loss=0.0068, acc=0.9760, iter_time=7.65s]
Epoch 0: 9%|▊ | 1072/12384 [2:16:54<24:02:12, 7.65s/it, loss=0.0065, acc=0.9832, iter_time=7.68s]
Epoch 0: 9%|▊ | 1073/12384 [2:16:54<24:01:02, 7.64s/it, loss=0.0065, acc=0.9832, iter_time=7.68s]
Epoch 0: 9%|▊ | 1073/12384 [2:17:02<24:01:02, 7.64s/it, loss=0.0020, acc=0.9961, iter_time=5.91s]
Epoch 0: 9%|▊ | 1074/12384 [2:17:02<23:58:32, 7.63s/it, loss=0.0020, acc=0.9961, iter_time=5.91s]
Epoch 0: 9%|▊ | 1074/12384 [2:17:09<23:58:32, 7.63s/it, loss=0.0044, acc=0.9916, iter_time=9.32s]
Epoch 0: 9%|▊ | 1075/12384 [2:17:09<24:01:15, 7.65s/it, loss=0.0044, acc=0.9916, iter_time=9.32s]
Epoch 0: 9%|▊ | 1075/12384 [2:17:17<24:01:15, 7.65s/it, loss=0.0024, acc=0.9923, iter_time=7.68s]
Epoch 0: 9%|▊ | 1076/12384 [2:17:17<24:04:15, 7.66s/it, loss=0.0024, acc=0.9923, iter_time=7.68s]
Epoch 0: 9%|▊ | 1076/12384 [2:17:25<24:04:15, 7.66s/it, loss=0.0029, acc=0.9968, iter_time=7.70s]
Epoch 0: 9%|▊ | 1077/12384 [2:17:25<24:02:45, 7.66s/it, loss=0.0029, acc=0.9968, iter_time=7.70s]
Epoch 0: 9%|▊ | 1077/12384 [2:17:32<24:02:45, 7.66s/it, loss=0.0078, acc=0.9792, iter_time=7.63s]
Epoch 0: 9%|▊ | 1078/12384 [2:17:32<24:00:09, 7.64s/it, loss=0.0078, acc=0.9792, iter_time=7.63s]
Epoch 0: 9%|▊ | 1078/12384 [2:17:40<24:00:09, 7.64s/it, loss=0.0087, acc=0.9875, iter_time=7.62s]
Epoch 0: 9%|▊ | 1079/12384 [2:17:40<23:57:41, 7.63s/it, loss=0.0087, acc=0.9875, iter_time=7.62s]
Epoch 0: 9%|▊ | 1079/12384 [2:17:48<23:57:41, 7.63s/it, loss=0.0031, acc=0.9944, iter_time=8.00s]
Epoch 0: 9%|▊ | 1080/12384 [2:17:48<23:56:43, 7.63s/it, loss=0.0031, acc=0.9944, iter_time=8.00s]
Epoch 0: 9%|▊ | 1080/12384 [2:17:55<23:56:43, 7.63s/it, loss=0.0123, acc=0.9817, iter_time=7.24s]
Epoch 0: 9%|▊ | 1081/12384 [2:17:55<24:00:39, 7.65s/it, loss=0.0123, acc=0.9817, iter_time=7.24s]
Epoch 0: 9%|▊ | 1081/12384 [2:18:03<24:00:39, 7.65s/it, loss=0.0037, acc=0.9943, iter_time=7.70s]
Epoch 0: 9%|▊ | 1082/12384 [2:18:03<23:59:20, 7.64s/it, loss=0.0037, acc=0.9943, iter_time=7.70s]
Epoch 0: 9%|▊ | 1082/12384 [2:18:11<23:59:20, 7.64s/it, loss=0.0018, acc=0.9940, iter_time=4.54s]
Epoch 0: 9%|▊ | 1083/12384 [2:18:11<24:00:25, 7.65s/it, loss=0.0018, acc=0.9940, iter_time=4.54s]
Epoch 0: 9%|▊ | 1083/12384 [2:18:18<24:00:25, 7.65s/it, loss=0.0023, acc=0.9947, iter_time=10.72s]
Epoch 0: 9%|▉ | 1084/12384 [2:18:18<23:57:23, 7.63s/it, loss=0.0023, acc=0.9947, iter_time=10.72s]
Epoch 0: 9%|▉ | 1084/12384 [2:18:26<23:57:23, 7.63s/it, loss=0.0039, acc=0.9896, iter_time=7.60s]
Epoch 0: 9%|▉ | 1085/12384 [2:18:26<23:56:25, 7.63s/it, loss=0.0039, acc=0.9896, iter_time=7.60s]
Epoch 0: 9%|▉ | 1085/12384 [2:18:33<23:56:25, 7.63s/it, loss=0.0028, acc=0.9967, iter_time=7.63s]
Epoch 0: 9%|▉ | 1086/12384 [2:18:33<23:55:09, 7.62s/it, loss=0.0028, acc=0.9967, iter_time=7.63s]
Epoch 0: 9%|▉ | 1086/12384 [2:18:41<23:55:09, 7.62s/it, loss=0.0044, acc=0.9905, iter_time=7.89s]
Epoch 0: 9%|▉ | 1087/12384 [2:18:41<24:12:41, 7.72s/it, loss=0.0044, acc=0.9905, iter_time=7.89s]
Epoch 0: 9%|▉ | 1087/12384 [2:18:49<24:12:41, 7.72s/it, loss=0.0036, acc=0.9913, iter_time=7.67s]
Epoch 0: 9%|▉ | 1088/12384 [2:18:49<24:11:52, 7.71s/it, loss=0.0036, acc=0.9913, iter_time=7.67s]
Epoch 0: 9%|▉ | 1088/12384 [2:18:57<24:11:52, 7.71s/it, loss=0.0069, acc=0.9895, iter_time=7.66s]
Epoch 0: 9%|▉ | 1089/12384 [2:18:57<24:11:20, 7.71s/it, loss=0.0069, acc=0.9895, iter_time=7.66s]
Epoch 0: 9%|▉ | 1089/12384 [2:19:04<24:11:20, 7.71s/it, loss=0.0073, acc=0.9904, iter_time=7.71s]
Epoch 0: 9%|▉ | 1090/12384 [2:19:04<24:08:06, 7.69s/it, loss=0.0073, acc=0.9904, iter_time=7.71s]
Epoch 0: 9%|▉ | 1090/12384 [2:19:12<24:08:06, 7.69s/it, loss=0.0017, acc=0.9979, iter_time=7.67s]
Epoch 0: 9%|▉ | 1091/12384 [2:19:12<24:05:08, 7.68s/it, loss=0.0017, acc=0.9979, iter_time=7.67s]
Epoch 0: 9%|▉ | 1091/12384 [2:19:20<24:05:08, 7.68s/it, loss=0.0028, acc=0.9936, iter_time=7.66s]
Epoch 0: 9%|▉ | 1092/12384 [2:19:20<24:01:42, 7.66s/it, loss=0.0028, acc=0.9936, iter_time=7.66s]
Epoch 0: 9%|▉ | 1092/12384 [2:19:27<24:01:42, 7.66s/it, loss=0.0009, acc=0.9965, iter_time=4.29s]
Epoch 0: 9%|▉ | 1093/12384 [2:19:27<23:58:49, 7.65s/it, loss=0.0009, acc=0.9965, iter_time=4.29s]
Epoch 0: 9%|▉ | 1093/12384 [2:19:35<23:58:49, 7.65s/it, loss=0.0037, acc=0.9918, iter_time=10.93s]
Epoch 0: 9%|▉ | 1094/12384 [2:19:35<23:57:22, 7.64s/it, loss=0.0037, acc=0.9918, iter_time=10.93s]
Epoch 0: 9%|▉ | 1094/12384 [2:19:43<23:57:22, 7.64s/it, loss=0.0014, acc=0.9980, iter_time=4.31s]
Epoch 0: 9%|▉ | 1095/12384 [2:19:43<24:02:39, 7.67s/it, loss=0.0014, acc=0.9980, iter_time=4.31s]
Epoch 0: 9%|▉ | 1095/12384 [2:19:50<24:02:39, 7.67s/it, loss=0.0019, acc=0.9985, iter_time=11.44s]
Epoch 0: 9%|▉ | 1096/12384 [2:19:50<24:06:09, 7.69s/it, loss=0.0019, acc=0.9985, iter_time=11.44s]
Epoch 0: 9%|▉ | 1096/12384 [2:19:58<24:06:09, 7.69s/it, loss=0.0028, acc=0.9901, iter_time=7.33s]
Epoch 0: 9%|▉ | 1097/12384 [2:19:58<24:02:16, 7.67s/it, loss=0.0028, acc=0.9901, iter_time=7.33s]
Epoch 0: 9%|▉ | 1097/12384 [2:20:06<24:02:16, 7.67s/it, loss=0.0053, acc=0.9867, iter_time=7.63s]
Epoch 0: 9%|▉ | 1098/12384 [2:20:06<24:00:08, 7.66s/it, loss=0.0053, acc=0.9867, iter_time=7.63s]
Epoch 0: 9%|▉ | 1098/12384 [2:20:13<24:00:08, 7.66s/it, loss=0.0036, acc=0.9950, iter_time=7.64s]
Epoch 0: 9%|▉ | 1099/12384 [2:20:13<23:58:38, 7.65s/it, loss=0.0036, acc=0.9950, iter_time=7.64s]
Epoch 0: 9%|▉ | 1099/12384 [2:20:21<23:58:38, 7.65s/it, loss=0.0021, acc=0.9967, iter_time=8.11s]
Epoch 0: 9%|▉ | 1100/12384 [2:20:21<24:01:07, 7.66s/it, loss=0.0021, acc=0.9967, iter_time=8.11s]
Epoch 0: 9%|▉ | 1100/12384 [2:20:29<24:01:07, 7.66s/it, loss=0.0107, acc=0.9828, iter_time=4.90s]
Epoch 0: 9%|▉ | 1101/12384 [2:20:29<23:58:37, 7.65s/it, loss=0.0107, acc=0.9828, iter_time=4.90s]
Epoch 0: 9%|▉ | 1101/12384 [2:20:36<23:58:37, 7.65s/it, loss=0.0031, acc=0.9938, iter_time=9.92s]
Epoch 0: 9%|▉ | 1102/12384 [2:20:36<23:56:44, 7.64s/it, loss=0.0031, acc=0.9938, iter_time=9.92s]
Epoch 0: 9%|▉ | 1102/12384 [2:20:44<23:56:44, 7.64s/it, loss=0.0047, acc=0.9906, iter_time=7.63s]
Epoch 0: 9%|▉ | 1103/12384 [2:20:44<23:54:59, 7.63s/it, loss=0.0047, acc=0.9906, iter_time=7.63s]
Epoch 0: 9%|▉ | 1103/12384 [2:20:51<23:54:59, 7.63s/it, loss=0.0013, acc=0.9977, iter_time=7.99s]
Epoch 0: 9%|▉ | 1104/12384 [2:20:51<23:52:25, 7.62s/it, loss=0.0013, acc=0.9977, iter_time=7.99s]
Epoch 0: 9%|▉ | 1104/12384 [2:20:59<23:52:25, 7.62s/it, loss=0.0027, acc=0.9968, iter_time=7.21s]
Epoch 0: 9%|▉ | 1105/12384 [2:20:59<23:57:00, 7.64s/it, loss=0.0027, acc=0.9968, iter_time=7.21s]
Epoch 0: 9%|▉ | 1105/12384 [2:21:07<23:57:00, 7.64s/it, loss=0.0031, acc=0.9918, iter_time=7.71s]
Epoch 0: 9%|▉ | 1106/12384 [2:21:07<24:02:02, 7.67s/it, loss=0.0031, acc=0.9918, iter_time=7.71s]
Epoch 0: 9%|▉ | 1106/12384 [2:21:14<24:02:02, 7.67s/it, loss=0.0142, acc=0.9920, iter_time=7.20s]
Epoch 0: 9%|▉ | 1107/12384 [2:21:14<23:59:01, 7.66s/it, loss=0.0142, acc=0.9920, iter_time=7.20s]
Epoch 0: 9%|▉ | 1107/12384 [2:21:22<23:59:01, 7.66s/it, loss=0.0018, acc=0.9979, iter_time=8.15s]
Epoch 0: 9%|▉ | 1108/12384 [2:21:22<23:57:19, 7.65s/it, loss=0.0018, acc=0.9979, iter_time=8.15s]
Epoch 0: 9%|▉ | 1108/12384 [2:21:30<23:57:19, 7.65s/it, loss=0.0028, acc=0.9922, iter_time=7.64s]
Epoch 0: 9%|▉ | 1109/12384 [2:21:30<23:55:40, 7.64s/it, loss=0.0028, acc=0.9922, iter_time=7.64s]
Epoch 0: 9%|▉ | 1109/12384 [2:21:37<23:55:40, 7.64s/it, loss=0.0025, acc=0.9972, iter_time=7.63s]
Epoch 0: 9%|▉ | 1110/12384 [2:21:37<23:56:13, 7.64s/it, loss=0.0025, acc=0.9972, iter_time=7.63s]
Epoch 0: 9%|▉ | 1110/12384 [2:21:45<23:56:13, 7.64s/it, loss=0.0018, acc=0.9967, iter_time=7.63s]
Epoch 0: 9%|▉ | 1111/12384 [2:21:45<23:54:44, 7.64s/it, loss=0.0018, acc=0.9967, iter_time=7.63s]
Epoch 0: 9%|▉ | 1111/12384 [2:21:53<23:54:44, 7.64s/it, loss=0.0011, acc=1.0000, iter_time=8.29s]
Epoch 0: 9%|▉ | 1112/12384 [2:21:53<24:08:41, 7.71s/it, loss=0.0011, acc=1.0000, iter_time=8.29s]
Epoch 0: 9%|▉ | 1112/12384 [2:22:01<24:08:41, 7.71s/it, loss=0.0023, acc=0.9968, iter_time=7.25s]
Epoch 0: 9%|▉ | 1113/12384 [2:22:01<24:23:09, 7.79s/it, loss=0.0023, acc=0.9968, iter_time=7.25s]
Epoch 0: 9%|▉ | 1113/12384 [2:22:08<24:23:09, 7.79s/it, loss=0.0052, acc=0.9896, iter_time=5.64s]
Epoch 0: 9%|▉ | 1114/12384 [2:22:08<24:13:44, 7.74s/it, loss=0.0052, acc=0.9896, iter_time=5.64s]
Epoch 0: 9%|▉ | 1114/12384 [2:22:16<24:13:44, 7.74s/it, loss=0.0067, acc=0.9904, iter_time=9.92s]
Epoch 0: 9%|▉ | 1115/12384 [2:22:16<24:07:04, 7.70s/it, loss=0.0067, acc=0.9904, iter_time=9.92s]
Epoch 0: 9%|▉ | 1115/12384 [2:22:24<24:07:04, 7.70s/it, loss=0.0036, acc=0.9925, iter_time=4.31s]
Epoch 0: 9%|▉ | 1116/12384 [2:22:24<24:00:49, 7.67s/it, loss=0.0036, acc=0.9925, iter_time=4.31s]
Epoch 0: 9%|▉ | 1116/12384 [2:22:31<24:00:49, 7.67s/it, loss=0.0171, acc=0.9720, iter_time=10.90s]
Epoch 0: 9%|▉ | 1117/12384 [2:22:31<24:00:08, 7.67s/it, loss=0.0171, acc=0.9720, iter_time=10.90s]
Epoch 0: 9%|▉ | 1117/12384 [2:22:39<24:00:08, 7.67s/it, loss=0.0036, acc=0.9873, iter_time=7.66s]
Epoch 0: 9%|▉ | 1118/12384 [2:22:39<23:56:26, 7.65s/it, loss=0.0036, acc=0.9873, iter_time=7.66s]
Epoch 0: 9%|▉ | 1118/12384 [2:22:46<23:56:26, 7.65s/it, loss=0.0045, acc=0.9943, iter_time=7.61s]
Epoch 0: 9%|▉ | 1119/12384 [2:22:46<23:53:21, 7.63s/it, loss=0.0045, acc=0.9943, iter_time=7.61s]
Epoch 0: 9%|▉ | 1119/12384 [2:22:54<23:53:21, 7.63s/it, loss=0.0036, acc=0.9881, iter_time=7.55s]
Epoch 0: 9%|▉ | 1120/12384 [2:22:54<23:51:38, 7.63s/it, loss=0.0036, acc=0.9881, iter_time=7.55s]
Epoch 0: 9%|▉ | 1120/12384 [2:23:02<23:51:38, 7.63s/it, loss=0.0032, acc=0.9953, iter_time=7.64s]
Epoch 0: 9%|▉ | 1121/12384 [2:23:02<23:49:49, 7.62s/it, loss=0.0032, acc=0.9953, iter_time=7.64s]
Epoch 0: 9%|▉ | 1121/12384 [2:23:09<23:49:49, 7.62s/it, loss=0.0044, acc=0.9883, iter_time=7.07s]
Epoch 0: 9%|▉ | 1122/12384 [2:23:09<23:49:19, 7.61s/it, loss=0.0044, acc=0.9883, iter_time=7.07s]
Epoch 0: 9%|▉ | 1122/12384 [2:23:17<23:49:19, 7.61s/it, loss=0.0035, acc=0.9950, iter_time=4.42s]
Epoch 0: 9%|▉ | 1123/12384 [2:23:17<23:48:52, 7.61s/it, loss=0.0035, acc=0.9950, iter_time=4.42s]
Epoch 0: 9%|▉ | 1123/12384 [2:23:25<23:48:52, 7.61s/it, loss=0.0019, acc=0.9946, iter_time=11.07s]
Epoch 0: 9%|▉ | 1124/12384 [2:23:25<23:48:19, 7.61s/it, loss=0.0019, acc=0.9946, iter_time=11.07s]
Epoch 0: 9%|▉ | 1124/12384 [2:23:32<23:48:19, 7.61s/it, loss=0.0025, acc=0.9956, iter_time=7.89s]
Epoch 0: 9%|▉ | 1125/12384 [2:23:32<23:49:38, 7.62s/it, loss=0.0025, acc=0.9956, iter_time=7.89s]
Epoch 0: 9%|▉ | 1125/12384 [2:23:40<23:49:38, 7.62s/it, loss=0.0030, acc=0.9933, iter_time=6.18s]
Epoch 0: 9%|▉ | 1126/12384 [2:23:40<23:49:34, 7.62s/it, loss=0.0030, acc=0.9933, iter_time=6.18s]
Epoch 0: 9%|▉ | 1126/12384 [2:23:47<23:49:34, 7.62s/it, loss=0.0015, acc=0.9988, iter_time=9.11s]
Epoch 0: 9%|▉ | 1127/12384 [2:23:47<23:51:16, 7.63s/it, loss=0.0015, acc=0.9988, iter_time=9.11s]
Epoch 0: 9%|▉ | 1127/12384 [2:23:55<23:51:16, 7.63s/it, loss=0.0020, acc=0.9968, iter_time=7.98s]
Epoch 0: 9%|▉ | 1128/12384 [2:23:55<23:50:03, 7.62s/it, loss=0.0020, acc=0.9968, iter_time=7.98s]
Epoch 0: 9%|▉ | 1128/12384 [2:24:03<23:50:03, 7.62s/it, loss=0.0019, acc=0.9998, iter_time=4.21s]
Epoch 0: 9%|▉ | 1129/12384 [2:24:03<23:49:07, 7.62s/it, loss=0.0019, acc=0.9998, iter_time=4.21s]
Epoch 0: 9%|▉ | 1129/12384 [2:24:10<23:49:07, 7.62s/it, loss=0.0021, acc=0.9953, iter_time=9.12s]
Epoch 0: 9%|▉ | 1130/12384 [2:24:10<23:47:01, 7.61s/it, loss=0.0021, acc=0.9953, iter_time=9.12s]
Epoch 0: 9%|▉ | 1130/12384 [2:24:18<23:47:01, 7.61s/it, loss=0.0048, acc=0.9911, iter_time=9.10s]
Epoch 0: 9%|▉ | 1131/12384 [2:24:18<23:48:26, 7.62s/it, loss=0.0048, acc=0.9911, iter_time=9.10s]
Epoch 0: 9%|▉ | 1131/12384 [2:24:25<23:48:26, 7.62s/it, loss=0.0023, acc=0.9956, iter_time=7.65s]
Epoch 0: 9%|▉ | 1132/12384 [2:24:25<23:48:37, 7.62s/it, loss=0.0023, acc=0.9956, iter_time=7.65s]
Epoch 0: 9%|▉ | 1132/12384 [2:24:33<23:48:37, 7.62s/it, loss=0.0060, acc=0.9853, iter_time=7.31s]
Epoch 0: 9%|▉ | 1133/12384 [2:24:33<23:47:08, 7.61s/it, loss=0.0060, acc=0.9853, iter_time=7.31s]
Epoch 0: 9%|▉ | 1133/12384 [2:24:41<23:47:08, 7.61s/it, loss=0.0062, acc=0.9846, iter_time=6.70s]
Epoch 0: 9%|▉ | 1134/12384 [2:24:41<23:48:48, 7.62s/it, loss=0.0062, acc=0.9846, iter_time=6.70s]
Epoch 0: 9%|▉ | 1134/12384 [2:24:48<23:48:48, 7.62s/it, loss=0.0059, acc=0.9877, iter_time=7.89s]
Epoch 0: 9%|▉ | 1135/12384 [2:24:48<23:48:54, 7.62s/it, loss=0.0059, acc=0.9877, iter_time=7.89s]
Epoch 0: 9%|▉ | 1135/12384 [2:24:56<23:48:54, 7.62s/it, loss=0.0018, acc=0.9956, iter_time=8.99s]
Epoch 0: 9%|▉ | 1136/12384 [2:24:56<23:50:35, 7.63s/it, loss=0.0018, acc=0.9956, iter_time=8.99s]
Epoch 0: 9%|▉ | 1136/12384 [2:25:04<23:50:35, 7.63s/it, loss=0.0028, acc=0.9941, iter_time=7.22s]
Epoch 0: 9%|▉ | 1137/12384 [2:25:04<23:48:38, 7.62s/it, loss=0.0028, acc=0.9941, iter_time=7.22s]
Epoch 0: 9%|▉ | 1137/12384 [2:25:11<23:48:38, 7.62s/it, loss=0.0018, acc=0.9974, iter_time=7.88s]
Epoch 0: 9%|▉ | 1138/12384 [2:25:11<24:01:44, 7.69s/it, loss=0.0018, acc=0.9974, iter_time=7.88s]
Epoch 0: 9%|▉ | 1138/12384 [2:25:19<24:01:44, 7.69s/it, loss=0.0086, acc=0.9795, iter_time=7.64s]
Epoch 0: 9%|▉ | 1139/12384 [2:25:19<24:16:45, 7.77s/it, loss=0.0086, acc=0.9795, iter_time=7.64s]
Epoch 0: 9%|▉ | 1139/12384 [2:25:27<24:16:45, 7.77s/it, loss=0.0016, acc=0.9998, iter_time=5.38s]
Epoch 0: 9%|▉ | 1140/12384 [2:25:27<24:11:36, 7.75s/it, loss=0.0016, acc=0.9998, iter_time=5.38s]
Epoch 0: 9%|▉ | 1140/12384 [2:25:35<24:11:36, 7.75s/it, loss=0.0015, acc=0.9978, iter_time=10.24s]
Epoch 0: 9%|▉ | 1141/12384 [2:25:35<24:04:10, 7.71s/it, loss=0.0015, acc=0.9978, iter_time=10.24s]
Epoch 0: 9%|▉ | 1141/12384 [2:25:42<24:04:10, 7.71s/it, loss=0.0026, acc=0.9950, iter_time=5.04s]
Epoch 0: 9%|▉ | 1142/12384 [2:25:42<23:58:32, 7.68s/it, loss=0.0026, acc=0.9950, iter_time=5.04s]
Epoch 0: 9%|▉ | 1142/12384 [2:25:50<23:58:32, 7.68s/it, loss=0.0012, acc=0.9982, iter_time=8.92s]
Epoch 0: 9%|▉ | 1143/12384 [2:25:50<23:55:16, 7.66s/it, loss=0.0012, acc=0.9982, iter_time=8.92s]
Epoch 0: 9%|▉ | 1143/12384 [2:25:58<23:55:16, 7.66s/it, loss=0.0024, acc=0.9909, iter_time=9.26s]
Epoch 0: 9%|▉ | 1144/12384 [2:25:58<23:52:52, 7.65s/it, loss=0.0024, acc=0.9909, iter_time=9.26s]
Epoch 0: 9%|▉ | 1144/12384 [2:26:05<23:52:52, 7.65s/it, loss=0.0043, acc=0.9876, iter_time=7.23s]
Epoch 0: 9%|▉ | 1145/12384 [2:26:05<23:51:03, 7.64s/it, loss=0.0043, acc=0.9876, iter_time=7.23s]
Epoch 0: 9%|▉ | 1145/12384 [2:26:13<23:51:03, 7.64s/it, loss=0.0021, acc=0.9979, iter_time=6.11s]
Epoch 0: 9%|▉ | 1146/12384 [2:26:13<23:50:19, 7.64s/it, loss=0.0021, acc=0.9979, iter_time=6.11s]
Epoch 0: 9%|▉ | 1146/12384 [2:26:21<23:50:19, 7.64s/it, loss=0.0052, acc=0.9965, iter_time=9.14s]
Epoch 0: 9%|▉ | 1147/12384 [2:26:21<23:53:45, 7.66s/it, loss=0.0052, acc=0.9965, iter_time=9.14s]
Epoch 0: 9%|▉ | 1147/12384 [2:26:28<23:53:45, 7.66s/it, loss=0.0020, acc=0.9983, iter_time=4.42s]
Epoch 0: 9%|▉ | 1148/12384 [2:26:28<23:52:12, 7.65s/it, loss=0.0020, acc=0.9983, iter_time=4.42s]
Epoch 0: 9%|▉ | 1148/12384 [2:26:36<23:52:12, 7.65s/it, loss=0.0030, acc=0.9913, iter_time=10.90s]
Epoch 0: 9%|▉ | 1149/12384 [2:26:36<23:50:40, 7.64s/it, loss=0.0030, acc=0.9913, iter_time=10.90s]
Epoch 0: 9%|▉ | 1149/12384 [2:26:43<23:50:40, 7.64s/it, loss=0.0054, acc=0.9857, iter_time=8.03s]
Epoch 0: 9%|▉ | 1150/12384 [2:26:43<23:48:18, 7.63s/it, loss=0.0054, acc=0.9857, iter_time=8.03s]
Epoch 0: 9%|▉ | 1150/12384 [2:26:51<23:48:18, 7.63s/it, loss=0.0021, acc=0.9958, iter_time=7.20s]
Epoch 0: 9%|▉ | 1151/12384 [2:26:51<23:49:47, 7.64s/it, loss=0.0021, acc=0.9958, iter_time=7.20s]
Epoch 0: 9%|▉ | 1151/12384 [2:26:59<23:49:47, 7.64s/it, loss=0.0022, acc=0.9931, iter_time=7.66s]
Epoch 0: 9%|▉ | 1152/12384 [2:26:59<23:50:45, 7.64s/it, loss=0.0022, acc=0.9931, iter_time=7.66s]
Epoch 0: 9%|▉ | 1152/12384 [2:27:06<23:50:45, 7.64s/it, loss=0.0062, acc=0.9890, iter_time=5.65s]
Epoch 0: 9%|▉ | 1153/12384 [2:27:06<23:48:08, 7.63s/it, loss=0.0062, acc=0.9890, iter_time=5.65s]
Epoch 0: 9%|▉ | 1153/12384 [2:27:14<23:48:08, 7.63s/it, loss=0.0012, acc=0.9975, iter_time=5.87s]
Epoch 0: 9%|▉ | 1154/12384 [2:27:14<23:48:53, 7.63s/it, loss=0.0012, acc=0.9975, iter_time=5.87s]
Epoch 0: 9%|▉ | 1154/12384 [2:27:22<23:48:53, 7.63s/it, loss=0.0010, acc=0.9977, iter_time=9.87s]
Epoch 0: 9%|▉ | 1155/12384 [2:27:22<23:45:41, 7.62s/it, loss=0.0010, acc=0.9977, iter_time=9.87s]
Epoch 0: 9%|▉ | 1155/12384 [2:27:29<23:45:41, 7.62s/it, loss=0.0004, acc=1.0000, iter_time=9.08s]
Epoch 0: 9%|▉ | 1156/12384 [2:27:29<23:45:19, 7.62s/it, loss=0.0004, acc=1.0000, iter_time=9.08s]
Epoch 0: 9%|▉ | 1156/12384 [2:27:37<23:45:19, 7.62s/it, loss=0.0033, acc=0.9963, iter_time=4.77s]
Epoch 0: 9%|▉ | 1157/12384 [2:27:37<23:43:56, 7.61s/it, loss=0.0033, acc=0.9963, iter_time=4.77s]
Epoch 0: 9%|▉ | 1157/12384 [2:27:44<23:43:56, 7.61s/it, loss=0.0025, acc=0.9946, iter_time=7.41s]
Epoch 0: 9%|▉ | 1158/12384 [2:27:44<23:45:03, 7.62s/it, loss=0.0025, acc=0.9946, iter_time=7.41s]
Epoch 0: 9%|▉ | 1158/12384 [2:27:52<23:45:03, 7.62s/it, loss=0.0033, acc=0.9901, iter_time=10.68s]
Epoch 0: 9%|▉ | 1159/12384 [2:27:52<23:45:07, 7.62s/it, loss=0.0033, acc=0.9901, iter_time=10.68s]
Epoch 0: 9%|▉ | 1159/12384 [2:28:00<23:45:07, 7.62s/it, loss=0.0082, acc=0.9832, iter_time=8.00s]
Epoch 0: 9%|▉ | 1160/12384 [2:28:00<23:47:15, 7.63s/it, loss=0.0082, acc=0.9832, iter_time=8.00s]
Epoch 0: 9%|▉ | 1160/12384 [2:28:07<23:47:15, 7.63s/it, loss=0.0026, acc=0.9970, iter_time=7.27s]
Epoch 0: 9%|▉ | 1161/12384 [2:28:07<23:46:49, 7.63s/it, loss=0.0026, acc=0.9970, iter_time=7.27s]
Epoch 0: 9%|▉ | 1161/12384 [2:28:15<23:46:49, 7.63s/it, loss=0.0020, acc=0.9977, iter_time=7.62s]
Epoch 0: 9%|▉ | 1162/12384 [2:28:15<23:44:41, 7.62s/it, loss=0.0020, acc=0.9977, iter_time=7.62s]
Epoch 0: 9%|▉ | 1162/12384 [2:28:22<23:44:41, 7.62s/it, loss=0.0059, acc=0.9853, iter_time=7.61s]
Epoch 0: 9%|▉ | 1163/12384 [2:28:22<23:46:09, 7.63s/it, loss=0.0059, acc=0.9853, iter_time=7.61s]
Epoch 0: 9%|▉ | 1163/12384 [2:28:30<23:46:09, 7.63s/it, loss=0.0030, acc=0.9947, iter_time=7.63s]
Epoch 0: 9%|▉ | 1164/12384 [2:28:30<23:47:41, 7.63s/it, loss=0.0030, acc=0.9947, iter_time=7.63s]
Epoch 0: 9%|▉ | 1164/12384 [2:28:38<23:47:41, 7.63s/it, loss=0.0025, acc=0.9942, iter_time=7.94s]
Epoch 0: 9%|▉ | 1165/12384 [2:28:38<24:07:09, 7.74s/it, loss=0.0025, acc=0.9942, iter_time=7.94s]
Epoch 0: 9%|▉ | 1165/12384 [2:28:46<24:07:09, 7.74s/it, loss=0.0023, acc=0.9957, iter_time=5.90s]
Epoch 0: 9%|▉ | 1166/12384 [2:28:46<23:59:38, 7.70s/it, loss=0.0023, acc=0.9957, iter_time=5.90s]
Epoch 0: 9%|▉ | 1166/12384 [2:28:53<23:59:38, 7.70s/it, loss=0.0065, acc=0.9885, iter_time=9.39s]
Epoch 0: 9%|▉ | 1167/12384 [2:28:53<23:56:52, 7.69s/it, loss=0.0065, acc=0.9885, iter_time=9.39s]
Epoch 0: 9%|▉ | 1167/12384 [2:29:01<23:56:52, 7.69s/it, loss=0.0015, acc=0.9978, iter_time=8.06s]
Epoch 0: 9%|▉ | 1168/12384 [2:29:01<23:53:34, 7.67s/it, loss=0.0015, acc=0.9978, iter_time=8.06s]
Epoch 0: 9%|▉ | 1168/12384 [2:29:09<23:53:34, 7.67s/it, loss=0.0033, acc=0.9889, iter_time=7.24s]
Epoch 0: 9%|▉ | 1169/12384 [2:29:09<23:50:38, 7.65s/it, loss=0.0033, acc=0.9889, iter_time=7.24s]
Epoch 0: 9%|▉ | 1169/12384 [2:29:16<23:50:38, 7.65s/it, loss=0.0009, acc=0.9990, iter_time=5.83s]
Epoch 0: 9%|▉ | 1170/12384 [2:29:16<23:50:24, 7.65s/it, loss=0.0009, acc=0.9990, iter_time=5.83s]
Epoch 0: 9%|▉ | 1170/12384 [2:29:24<23:50:24, 7.65s/it, loss=0.0049, acc=0.9915, iter_time=9.44s]
Epoch 0: 9%|▉ | 1171/12384 [2:29:24<23:49:31, 7.65s/it, loss=0.0049, acc=0.9915, iter_time=9.44s]
Epoch 0: 9%|▉ | 1171/12384 [2:29:32<23:49:31, 7.65s/it, loss=0.0081, acc=0.9851, iter_time=7.63s]
Epoch 0: 9%|▉ | 1172/12384 [2:29:32<23:47:50, 7.64s/it, loss=0.0081, acc=0.9851, iter_time=7.63s]
Epoch 0: 9%|▉ | 1172/12384 [2:29:39<23:47:50, 7.64s/it, loss=0.0085, acc=0.9846, iter_time=7.65s]
Epoch 0: 9%|▉ | 1173/12384 [2:29:39<23:47:34, 7.64s/it, loss=0.0085, acc=0.9846, iter_time=7.65s]
Epoch 0: 9%|▉ | 1173/12384 [2:29:47<23:47:34, 7.64s/it, loss=0.0014, acc=0.9965, iter_time=7.62s]
Epoch 0: 9%|▉ | 1174/12384 [2:29:47<23:49:29, 7.65s/it, loss=0.0014, acc=0.9965, iter_time=7.62s]
Epoch 0: 9%|▉ | 1174/12384 [2:29:54<23:49:29, 7.65s/it, loss=0.0007, acc=0.9991, iter_time=5.10s]
Epoch 0: 9%|▉ | 1175/12384 [2:29:54<23:46:52, 7.64s/it, loss=0.0007, acc=0.9991, iter_time=5.10s]
Epoch 0: 9%|▉ | 1175/12384 [2:30:02<23:46:52, 7.64s/it, loss=0.0024, acc=0.9959, iter_time=10.56s]
Epoch 0: 9%|▉ | 1176/12384 [2:30:02<23:46:08, 7.63s/it, loss=0.0024, acc=0.9959, iter_time=10.56s]
Epoch 0: 9%|▉ | 1176/12384 [2:30:10<23:46:08, 7.63s/it, loss=0.0026, acc=0.9958, iter_time=7.25s]
Epoch 0: 10%|▉ | 1177/12384 [2:30:10<23:44:29, 7.63s/it, loss=0.0026, acc=0.9958, iter_time=7.25s]
Epoch 0: 10%|▉ | 1177/12384 [2:30:17<23:44:29, 7.63s/it, loss=0.0034, acc=0.9929, iter_time=7.60s]
Epoch 0: 10%|▉ | 1178/12384 [2:30:17<23:42:15, 7.62s/it, loss=0.0034, acc=0.9929, iter_time=7.60s]
Epoch 0: 10%|▉ | 1178/12384 [2:30:25<23:42:15, 7.62s/it, loss=0.0028, acc=0.9944, iter_time=7.70s]
Epoch 0: 10%|▉ | 1179/12384 [2:30:25<23:49:07, 7.65s/it, loss=0.0028, acc=0.9944, iter_time=7.70s]
Epoch 0: 10%|▉ | 1179/12384 [2:30:33<23:49:07, 7.65s/it, loss=0.0004, acc=1.0000, iter_time=7.64s]
Epoch 0: 10%|▉ | 1180/12384 [2:30:33<23:47:11, 7.64s/it, loss=0.0004, acc=1.0000, iter_time=7.64s]
Epoch 0: 10%|▉ | 1180/12384 [2:30:40<23:47:11, 7.64s/it, loss=0.0013, acc=0.9968, iter_time=6.42s]
Epoch 0: 10%|▉ | 1181/12384 [2:30:40<23:40:29, 7.61s/it, loss=0.0013, acc=0.9968, iter_time=6.42s]
Epoch 0: 10%|▉ | 1181/12384 [2:30:48<23:40:29, 7.61s/it, loss=0.0040, acc=0.9933, iter_time=8.73s]
Epoch 0: 10%|▉ | 1182/12384 [2:30:48<23:40:13, 7.61s/it, loss=0.0040, acc=0.9933, iter_time=8.73s]
Epoch 0: 10%|▉ | 1182/12384 [2:30:55<23:40:13, 7.61s/it, loss=0.0040, acc=0.9918, iter_time=5.55s]
Epoch 0: 10%|▉ | 1183/12384 [2:30:55<23:39:36, 7.60s/it, loss=0.0040, acc=0.9918, iter_time=5.55s]
Epoch 0: 10%|▉ | 1183/12384 [2:31:03<23:39:36, 7.60s/it, loss=0.0035, acc=0.9963, iter_time=9.61s]
Epoch 0: 10%|▉ | 1184/12384 [2:31:03<23:40:11, 7.61s/it, loss=0.0035, acc=0.9963, iter_time=9.61s]
Epoch 0: 10%|▉ | 1184/12384 [2:31:11<23:40:11, 7.61s/it, loss=0.0059, acc=0.9922, iter_time=7.65s]
Epoch 0: 10%|▉ | 1185/12384 [2:31:11<23:39:13, 7.60s/it, loss=0.0059, acc=0.9922, iter_time=7.65s]
Epoch 0: 10%|▉ | 1185/12384 [2:31:18<23:39:13, 7.60s/it, loss=0.0024, acc=0.9944, iter_time=7.61s]
Epoch 0: 10%|▉ | 1186/12384 [2:31:18<23:39:40, 7.61s/it, loss=0.0024, acc=0.9944, iter_time=7.61s]
Epoch 0: 10%|▉ | 1186/12384 [2:31:26<23:39:40, 7.61s/it, loss=0.0068, acc=0.9873, iter_time=7.71s]
Epoch 0: 10%|▉ | 1187/12384 [2:31:26<23:45:23, 7.64s/it, loss=0.0068, acc=0.9873, iter_time=7.71s]
Epoch 0: 10%|▉ | 1187/12384 [2:31:34<23:45:23, 7.64s/it, loss=0.0028, acc=0.9921, iter_time=7.61s]
Epoch 0: 10%|▉ | 1188/12384 [2:31:34<23:44:16, 7.63s/it, loss=0.0028, acc=0.9921, iter_time=7.61s]
Epoch 0: 10%|▉ | 1188/12384 [2:31:41<23:44:16, 7.63s/it, loss=0.0046, acc=0.9948, iter_time=7.62s]
Epoch 0: 10%|▉ | 1189/12384 [2:31:41<23:43:30, 7.63s/it, loss=0.0046, acc=0.9948, iter_time=7.62s]
Epoch 0: 10%|▉ | 1189/12384 [2:31:49<23:43:30, 7.63s/it, loss=0.0006, acc=0.9994, iter_time=5.28s]
Epoch 0: 10%|▉ | 1190/12384 [2:31:49<23:41:11, 7.62s/it, loss=0.0006, acc=0.9994, iter_time=5.28s]
Epoch 0: 10%|▉ | 1190/12384 [2:31:56<23:41:11, 7.62s/it, loss=0.0019, acc=0.9951, iter_time=9.93s]
Epoch 0: 10%|▉ | 1191/12384 [2:31:56<23:41:35, 7.62s/it, loss=0.0019, acc=0.9951, iter_time=9.93s]
Epoch 0: 10%|▉ | 1191/12384 [2:32:04<23:41:35, 7.62s/it, loss=0.0023, acc=0.9951, iter_time=8.10s]
Epoch 0: 10%|▉ | 1192/12384 [2:32:04<24:02:45, 7.73s/it, loss=0.0023, acc=0.9951, iter_time=8.10s]
Epoch 0: 10%|▉ | 1192/12384 [2:32:12<24:02:45, 7.73s/it, loss=0.0045, acc=0.9965, iter_time=6.10s]
Epoch 0: 10%|▉ | 1193/12384 [2:32:12<24:01:59, 7.73s/it, loss=0.0045, acc=0.9965, iter_time=6.10s]
Epoch 0: 10%|▉ | 1193/12384 [2:32:20<24:01:59, 7.73s/it, loss=0.0010, acc=0.9997, iter_time=7.64s]
Epoch 0: 10%|▉ | 1194/12384 [2:32:20<23:55:44, 7.70s/it, loss=0.0010, acc=0.9997, iter_time=7.64s]
Epoch 0: 10%|▉ | 1194/12384 [2:32:27<23:55:44, 7.70s/it, loss=0.0057, acc=0.9928, iter_time=9.12s]
Epoch 0: 10%|▉ | 1195/12384 [2:32:27<23:51:03, 7.67s/it, loss=0.0057, acc=0.9928, iter_time=9.12s]
Epoch 0: 10%|▉ | 1195/12384 [2:32:35<23:51:03, 7.67s/it, loss=0.0006, acc=0.9986, iter_time=4.76s]
Epoch 0: 10%|▉ | 1196/12384 [2:32:35<23:46:32, 7.65s/it, loss=0.0006, acc=0.9986, iter_time=4.76s]
Epoch 0: 10%|▉ | 1196/12384 [2:32:43<23:46:32, 7.65s/it, loss=0.0022, acc=0.9961, iter_time=7.92s]
Epoch 0: 10%|▉ | 1197/12384 [2:32:43<23:44:11, 7.64s/it, loss=0.0022, acc=0.9961, iter_time=7.92s]
Epoch 0: 10%|▉ | 1197/12384 [2:32:50<23:44:11, 7.64s/it, loss=0.0095, acc=0.9842, iter_time=8.41s]
Epoch 0: 10%|▉ | 1198/12384 [2:32:50<23:45:00, 7.64s/it, loss=0.0095, acc=0.9842, iter_time=8.41s]
Epoch 0: 10%|▉ | 1198/12384 [2:32:58<23:45:00, 7.64s/it, loss=0.0017, acc=0.9975, iter_time=9.39s]
Epoch 0: 10%|▉ | 1199/12384 [2:32:58<23:46:09, 7.65s/it, loss=0.0017, acc=0.9975, iter_time=9.39s]
Epoch 0: 10%|▉ | 1199/12384 [2:33:05<23:46:09, 7.65s/it, loss=0.0046, acc=0.9872, iter_time=8.06s]
Epoch 0: 10%|▉ | 1200/12384 [2:33:05<23:43:34, 7.64s/it, loss=0.0046, acc=0.9872, iter_time=8.06s]
Epoch 0: 10%|▉ | 1200/12384 [2:33:13<23:43:34, 7.64s/it, loss=0.0009, acc=0.9962, iter_time=3.01s]
Epoch 0: 10%|▉ | 1201/12384 [2:33:13<23:39:06, 7.61s/it, loss=0.0009, acc=0.9962, iter_time=3.01s]
Epoch 0: 10%|▉ | 1201/12384 [2:33:21<23:39:06, 7.61s/it, loss=0.0045, acc=0.9904, iter_time=8.16s]
Epoch 0: 10%|▉ | 1202/12384 [2:33:21<23:43:19, 7.64s/it, loss=0.0045, acc=0.9904, iter_time=8.16s]
Epoch 0: 10%|▉ | 1202/12384 [2:33:28<23:43:19, 7.64s/it, loss=0.0034, acc=0.9887, iter_time=11.27s]
Epoch 0: 10%|▉ | 1203/12384 [2:33:28<23:42:20, 7.63s/it, loss=0.0034, acc=0.9887, iter_time=11.27s]
Epoch 0: 10%|▉ | 1203/12384 [2:33:36<23:42:20, 7.63s/it, loss=0.0030, acc=0.9949, iter_time=5.35s]
Epoch 0: 10%|▉ | 1204/12384 [2:33:36<23:42:14, 7.63s/it, loss=0.0030, acc=0.9949, iter_time=5.35s]
Epoch 0: 10%|▉ | 1204/12384 [2:33:44<23:42:14, 7.63s/it, loss=0.0010, acc=0.9977, iter_time=7.07s]
Epoch 0: 10%|▉ | 1205/12384 [2:33:44<23:40:59, 7.63s/it, loss=0.0010, acc=0.9977, iter_time=7.07s]
Epoch 0: 10%|▉ | 1205/12384 [2:33:51<23:40:59, 7.63s/it, loss=0.0027, acc=0.9942, iter_time=10.46s]
Epoch 0: 10%|▉ | 1206/12384 [2:33:51<23:41:16, 7.63s/it, loss=0.0027, acc=0.9942, iter_time=10.46s]
Epoch 0: 10%|▉ | 1206/12384 [2:33:59<23:41:16, 7.63s/it, loss=0.0029, acc=0.9945, iter_time=7.65s]
Epoch 0: 10%|▉ | 1207/12384 [2:33:59<23:40:33, 7.63s/it, loss=0.0029, acc=0.9945, iter_time=7.65s]
Epoch 0: 10%|▉ | 1207/12384 [2:34:06<23:40:33, 7.63s/it, loss=0.0035, acc=0.9897, iter_time=7.99s]
Epoch 0: 10%|▉ | 1208/12384 [2:34:06<23:38:34, 7.62s/it, loss=0.0035, acc=0.9897, iter_time=7.99s]
Epoch 0: 10%|▉ | 1208/12384 [2:34:14<23:38:34, 7.62s/it, loss=0.0007, acc=0.9981, iter_time=7.23s]
Epoch 0: 10%|▉ | 1209/12384 [2:34:14<23:40:27, 7.63s/it, loss=0.0007, acc=0.9981, iter_time=7.23s]
Epoch 0: 10%|▉ | 1209/12384 [2:34:22<23:40:27, 7.63s/it, loss=0.0037, acc=0.9939, iter_time=7.63s]
Epoch 0: 10%|▉ | 1210/12384 [2:34:22<23:39:15, 7.62s/it, loss=0.0037, acc=0.9939, iter_time=7.63s]
Epoch 0: 10%|▉ | 1210/12384 [2:34:29<23:39:15, 7.62s/it, loss=0.0051, acc=0.9901, iter_time=7.63s]
Epoch 0: 10%|▉ | 1211/12384 [2:34:29<23:40:00, 7.63s/it, loss=0.0051, acc=0.9901, iter_time=7.63s]
Epoch 0: 10%|▉ | 1211/12384 [2:34:37<23:40:00, 7.63s/it, loss=0.0013, acc=0.9969, iter_time=7.64s]
Epoch 0: 10%|▉ | 1212/12384 [2:34:37<23:39:50, 7.63s/it, loss=0.0013, acc=0.9969, iter_time=7.64s]
Epoch 0: 10%|▉ | 1212/12384 [2:34:45<23:39:50, 7.63s/it, loss=0.0008, acc=0.9986, iter_time=7.63s]
Epoch 0: 10%|▉ | 1213/12384 [2:34:45<23:39:41, 7.63s/it, loss=0.0008, acc=0.9986, iter_time=7.63s]
Epoch 0: 10%|▉ | 1213/12384 [2:34:52<23:39:41, 7.63s/it, loss=0.0086, acc=0.9859, iter_time=4.00s]
Epoch 0: 10%|▉ | 1214/12384 [2:34:52<23:41:25, 7.64s/it, loss=0.0086, acc=0.9859, iter_time=4.00s]
Epoch 0: 10%|▉ | 1214/12384 [2:35:00<23:41:25, 7.64s/it, loss=0.0026, acc=0.9962, iter_time=9.18s]
Epoch 0: 10%|▉ | 1215/12384 [2:35:00<23:41:19, 7.64s/it, loss=0.0026, acc=0.9962, iter_time=9.18s]
Epoch 0: 10%|▉ | 1215/12384 [2:35:08<23:41:19, 7.64s/it, loss=0.0024, acc=0.9972, iter_time=9.87s]
Epoch 0: 10%|▉ | 1216/12384 [2:35:08<23:41:43, 7.64s/it, loss=0.0024, acc=0.9972, iter_time=9.87s]
Epoch 0: 10%|▉ | 1216/12384 [2:35:15<23:41:43, 7.64s/it, loss=0.0049, acc=0.9911, iter_time=5.14s]
Epoch 0: 10%|▉ | 1217/12384 [2:35:15<23:41:31, 7.64s/it, loss=0.0049, acc=0.9911, iter_time=5.14s]
Epoch 0: 10%|▉ | 1217/12384 [2:35:23<23:41:31, 7.64s/it, loss=0.0006, acc=1.0000, iter_time=10.03s]
Epoch 0: 10%|▉ | 1218/12384 [2:35:23<24:01:35, 7.75s/it, loss=0.0006, acc=1.0000, iter_time=10.03s]
Epoch 0: 10%|▉ | 1218/12384 [2:35:31<24:01:35, 7.75s/it, loss=0.0005, acc=0.9992, iter_time=7.95s]
Epoch 0: 10%|▉ | 1219/12384 [2:35:31<23:54:06, 7.71s/it, loss=0.0005, acc=0.9992, iter_time=7.95s]
Epoch 0: 10%|▉ | 1219/12384 [2:35:39<23:54:06, 7.71s/it, loss=0.0037, acc=0.9884, iter_time=5.52s]
Epoch 0: 10%|▉ | 1220/12384 [2:35:39<23:55:08, 7.71s/it, loss=0.0037, acc=0.9884, iter_time=5.52s]
Epoch 0: 10%|▉ | 1220/12384 [2:35:46<23:55:08, 7.71s/it, loss=0.0015, acc=0.9915, iter_time=9.83s]
Epoch 0: 10%|▉ | 1221/12384 [2:35:46<23:50:17, 7.69s/it, loss=0.0015, acc=0.9915, iter_time=9.83s]
Epoch 0: 10%|▉ | 1221/12384 [2:35:54<23:50:17, 7.69s/it, loss=0.0010, acc=0.9999, iter_time=7.63s]
Epoch 0: 10%|▉ | 1222/12384 [2:35:54<23:45:44, 7.66s/it, loss=0.0010, acc=0.9999, iter_time=7.63s]
Epoch 0: 10%|▉ | 1222/12384 [2:36:01<23:45:44, 7.66s/it, loss=0.0045, acc=0.9887, iter_time=5.62s]
Epoch 0: 10%|▉ | 1223/12384 [2:36:01<23:44:23, 7.66s/it, loss=0.0045, acc=0.9887, iter_time=5.62s]
Epoch 0: 10%|▉ | 1223/12384 [2:36:09<23:44:23, 7.66s/it, loss=0.0045, acc=0.9916, iter_time=10.01s]
Epoch 0: 10%|▉ | 1224/12384 [2:36:09<23:41:03, 7.64s/it, loss=0.0045, acc=0.9916, iter_time=10.01s]
Epoch 0: 10%|▉ | 1224/12384 [2:36:17<23:41:03, 7.64s/it, loss=0.0026, acc=0.9983, iter_time=7.25s]
Epoch 0: 10%|▉ | 1225/12384 [2:36:17<23:40:04, 7.64s/it, loss=0.0026, acc=0.9983, iter_time=7.25s]
Epoch 0: 10%|▉ | 1225/12384 [2:36:24<23:40:04, 7.64s/it, loss=0.0013, acc=0.9985, iter_time=7.63s]
Epoch 0: 10%|▉ | 1226/12384 [2:36:24<23:40:03, 7.64s/it, loss=0.0013, acc=0.9985, iter_time=7.63s]
Epoch 0: 10%|▉ | 1226/12384 [2:36:32<23:40:03, 7.64s/it, loss=0.0016, acc=0.9919, iter_time=7.61s]
Epoch 0: 10%|▉ | 1227/12384 [2:36:32<23:38:07, 7.63s/it, loss=0.0016, acc=0.9919, iter_time=7.61s]
Epoch 0: 10%|▉ | 1227/12384 [2:36:40<23:38:07, 7.63s/it, loss=0.0051, acc=0.9953, iter_time=5.78s]
Epoch 0: 10%|▉ | 1228/12384 [2:36:40<23:55:41, 7.72s/it, loss=0.0051, acc=0.9953, iter_time=5.78s]
Epoch 0: 10%|▉ | 1228/12384 [2:36:48<23:55:41, 7.72s/it, loss=0.0035, acc=0.9960, iter_time=8.42s]
Epoch 0: 10%|▉ | 1229/12384 [2:36:48<24:02:12, 7.76s/it, loss=0.0035, acc=0.9960, iter_time=8.42s]
Epoch 0: 10%|▉ | 1229/12384 [2:36:55<24:02:12, 7.76s/it, loss=0.0021, acc=0.9960, iter_time=9.18s]
Epoch 0: 10%|▉ | 1230/12384 [2:36:55<23:53:45, 7.71s/it, loss=0.0021, acc=0.9960, iter_time=9.18s]
Epoch 0: 10%|▉ | 1230/12384 [2:37:03<23:53:45, 7.71s/it, loss=0.0004, acc=1.0000, iter_time=7.67s]
Epoch 0: 10%|▉ | 1231/12384 [2:37:03<23:52:43, 7.71s/it, loss=0.0004, acc=1.0000, iter_time=7.67s]
Epoch 0: 10%|▉ | 1231/12384 [2:37:11<23:52:43, 7.71s/it, loss=0.0009, acc=0.9971, iter_time=8.07s]
Epoch 0: 10%|▉ | 1232/12384 [2:37:11<23:49:13, 7.69s/it, loss=0.0009, acc=0.9971, iter_time=8.07s]
Epoch 0: 10%|▉ | 1232/12384 [2:37:18<23:49:13, 7.69s/it, loss=0.0057, acc=0.9894, iter_time=6.55s]
Epoch 0: 10%|▉ | 1233/12384 [2:37:18<23:44:49, 7.67s/it, loss=0.0057, acc=0.9894, iter_time=6.55s]
Epoch 0: 10%|▉ | 1233/12384 [2:37:26<23:44:49, 7.67s/it, loss=0.0028, acc=0.9957, iter_time=8.29s]
Epoch 0: 10%|▉ | 1234/12384 [2:37:26<23:42:56, 7.66s/it, loss=0.0028, acc=0.9957, iter_time=8.29s]
Epoch 0: 10%|▉ | 1234/12384 [2:37:33<23:42:56, 7.66s/it, loss=0.0017, acc=0.9926, iter_time=7.63s]
Epoch 0: 10%|▉ | 1235/12384 [2:37:33<23:42:50, 7.66s/it, loss=0.0017, acc=0.9926, iter_time=7.63s]
Epoch 0: 10%|▉ | 1235/12384 [2:37:41<23:42:50, 7.66s/it, loss=0.0025, acc=0.9932, iter_time=7.67s]
Epoch 0: 10%|▉ | 1236/12384 [2:37:41<23:41:19, 7.65s/it, loss=0.0025, acc=0.9932, iter_time=7.67s]
Epoch 0: 10%|▉ | 1236/12384 [2:37:49<23:41:19, 7.65s/it, loss=0.0009, acc=0.9973, iter_time=7.62s]
Epoch 0: 10%|▉ | 1237/12384 [2:37:49<23:41:07, 7.65s/it, loss=0.0009, acc=0.9973, iter_time=7.62s]
Epoch 0: 10%|▉ | 1237/12384 [2:37:56<23:41:07, 7.65s/it, loss=0.0013, acc=0.9989, iter_time=7.65s]
Epoch 0: 10%|▉ | 1238/12384 [2:37:56<23:39:52, 7.64s/it, loss=0.0013, acc=0.9989, iter_time=7.65s]
Epoch 0: 10%|▉ | 1238/12384 [2:38:04<23:39:52, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=4.30s]
Epoch 0: 10%|█ | 1239/12384 [2:38:04<23:38:52, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=4.30s]
Epoch 0: 10%|█ | 1239/12384 [2:38:12<23:38:52, 7.64s/it, loss=0.0027, acc=0.9915, iter_time=10.89s]
Epoch 0: 10%|█ | 1240/12384 [2:38:12<23:37:56, 7.63s/it, loss=0.0027, acc=0.9915, iter_time=10.89s]
Epoch 0: 10%|█ | 1240/12384 [2:38:19<23:37:56, 7.63s/it, loss=0.0016, acc=0.9968, iter_time=5.41s]
Epoch 0: 10%|█ | 1241/12384 [2:38:19<23:37:42, 7.63s/it, loss=0.0016, acc=0.9968, iter_time=5.41s]
Epoch 0: 10%|█ | 1241/12384 [2:38:27<23:37:42, 7.63s/it, loss=0.0018, acc=0.9977, iter_time=9.89s]
Epoch 0: 10%|█ | 1242/12384 [2:38:27<23:37:44, 7.63s/it, loss=0.0018, acc=0.9977, iter_time=9.89s]
Epoch 0: 10%|█ | 1242/12384 [2:38:35<23:37:44, 7.63s/it, loss=0.0014, acc=0.9955, iter_time=7.65s]
Epoch 0: 10%|█ | 1243/12384 [2:38:35<23:39:41, 7.65s/it, loss=0.0014, acc=0.9955, iter_time=7.65s]
Epoch 0: 10%|█ | 1243/12384 [2:38:42<23:39:41, 7.65s/it, loss=0.0013, acc=0.9973, iter_time=7.96s]
Epoch 0: 10%|█ | 1244/12384 [2:38:42<23:53:40, 7.72s/it, loss=0.0013, acc=0.9973, iter_time=7.96s]
Epoch 0: 10%|█ | 1244/12384 [2:38:50<23:53:40, 7.72s/it, loss=0.0019, acc=0.9973, iter_time=7.35s]
Epoch 0: 10%|█ | 1245/12384 [2:38:50<24:05:31, 7.79s/it, loss=0.0019, acc=0.9973, iter_time=7.35s]
Epoch 0: 10%|█ | 1245/12384 [2:38:58<24:05:31, 7.79s/it, loss=0.0016, acc=0.9977, iter_time=8.20s]
Epoch 0: 10%|█ | 1246/12384 [2:38:58<23:57:00, 7.74s/it, loss=0.0016, acc=0.9977, iter_time=8.20s]
Epoch 0: 10%|█ | 1246/12384 [2:39:06<23:57:00, 7.74s/it, loss=0.0050, acc=0.9893, iter_time=4.79s]
Epoch 0: 10%|█ | 1247/12384 [2:39:06<23:51:46, 7.71s/it, loss=0.0050, acc=0.9893, iter_time=4.79s]
Epoch 0: 10%|█ | 1247/12384 [2:39:13<23:51:46, 7.71s/it, loss=0.0004, acc=0.9991, iter_time=10.44s]
Epoch 0: 10%|█ | 1248/12384 [2:39:13<23:46:12, 7.68s/it, loss=0.0004, acc=0.9991, iter_time=10.44s]
Epoch 0: 10%|█ | 1248/12384 [2:39:21<23:46:12, 7.68s/it, loss=0.0011, acc=0.9985, iter_time=7.66s]
Epoch 0: 10%|█ | 1249/12384 [2:39:21<23:42:36, 7.67s/it, loss=0.0011, acc=0.9985, iter_time=7.66s]
Epoch 0: 10%|█ | 1249/12384 [2:39:29<23:42:36, 7.67s/it, loss=0.0050, acc=0.9874, iter_time=8.04s]
Epoch 0: 10%|█ | 1250/12384 [2:39:29<23:40:32, 7.66s/it, loss=0.0050, acc=0.9874, iter_time=8.04s]
Epoch 0: 10%|█ | 1250/12384 [2:39:36<23:40:32, 7.66s/it, loss=0.0013, acc=0.9988, iter_time=7.19s]
Epoch 0: 10%|█ | 1251/12384 [2:39:36<23:36:45, 7.64s/it, loss=0.0013, acc=0.9988, iter_time=7.19s]
Epoch 0: 10%|█ | 1251/12384 [2:39:44<23:36:45, 7.64s/it, loss=0.0021, acc=0.9985, iter_time=7.62s]
Epoch 0: 10%|█ | 1252/12384 [2:39:44<23:38:53, 7.65s/it, loss=0.0021, acc=0.9985, iter_time=7.62s]
Epoch 0: 10%|█ | 1252/12384 [2:39:52<23:38:53, 7.65s/it, loss=0.0027, acc=0.9948, iter_time=7.14s]
Epoch 0: 10%|█ | 1253/12384 [2:39:52<23:40:12, 7.66s/it, loss=0.0027, acc=0.9948, iter_time=7.14s]
Epoch 0: 10%|█ | 1253/12384 [2:39:59<23:40:12, 7.66s/it, loss=0.0023, acc=0.9969, iter_time=8.21s]
Epoch 0: 10%|█ | 1254/12384 [2:39:59<23:37:50, 7.64s/it, loss=0.0023, acc=0.9969, iter_time=8.21s]
Epoch 0: 10%|█ | 1254/12384 [2:40:07<23:37:50, 7.64s/it, loss=0.0040, acc=0.9939, iter_time=7.62s]
Epoch 0: 10%|█ | 1255/12384 [2:40:07<23:37:31, 7.64s/it, loss=0.0040, acc=0.9939, iter_time=7.62s]
Epoch 0: 10%|█ | 1255/12384 [2:40:14<23:37:31, 7.64s/it, loss=0.0046, acc=0.9950, iter_time=7.79s]
Epoch 0: 10%|█ | 1256/12384 [2:40:14<23:37:21, 7.64s/it, loss=0.0046, acc=0.9950, iter_time=7.79s]
Epoch 0: 10%|█ | 1256/12384 [2:40:22<23:37:21, 7.64s/it, loss=0.0023, acc=0.9920, iter_time=7.49s]
Epoch 0: 10%|█ | 1257/12384 [2:40:22<23:37:52, 7.65s/it, loss=0.0023, acc=0.9920, iter_time=7.49s]
Epoch 0: 10%|█ | 1257/12384 [2:40:31<23:37:52, 7.65s/it, loss=0.0018, acc=0.9976, iter_time=7.25s]
Epoch 0: 10%|█ | 1258/12384 [2:40:31<24:32:45, 7.94s/it, loss=0.0018, acc=0.9976, iter_time=7.25s]
Epoch 0: 10%|█ | 1258/12384 [2:40:39<24:32:45, 7.94s/it, loss=0.0068, acc=0.9937, iter_time=9.48s]
Epoch 0: 10%|█ | 1259/12384 [2:40:39<24:39:00, 7.98s/it, loss=0.0068, acc=0.9937, iter_time=9.48s]
Epoch 0: 10%|█ | 1259/12384 [2:40:46<24:39:00, 7.98s/it, loss=0.0009, acc=0.9995, iter_time=6.99s]
Epoch 0: 10%|█ | 1260/12384 [2:40:46<24:20:12, 7.88s/it, loss=0.0009, acc=0.9995, iter_time=6.99s]
Epoch 0: 10%|█ | 1260/12384 [2:40:54<24:20:12, 7.88s/it, loss=0.0020, acc=0.9966, iter_time=8.24s]
Epoch 0: 10%|█ | 1261/12384 [2:40:54<24:03:57, 7.79s/it, loss=0.0020, acc=0.9966, iter_time=8.24s]
Epoch 0: 10%|█ | 1261/12384 [2:41:02<24:03:57, 7.79s/it, loss=0.0032, acc=0.9925, iter_time=7.60s]
Epoch 0: 10%|█ | 1262/12384 [2:41:02<23:56:23, 7.75s/it, loss=0.0032, acc=0.9925, iter_time=7.60s]
Epoch 0: 10%|█ | 1262/12384 [2:41:09<23:56:23, 7.75s/it, loss=0.0014, acc=0.9984, iter_time=7.66s]
Epoch 0: 10%|█ | 1263/12384 [2:41:09<23:50:14, 7.72s/it, loss=0.0014, acc=0.9984, iter_time=7.66s]
Epoch 0: 10%|█ | 1263/12384 [2:41:17<23:50:14, 7.72s/it, loss=0.0015, acc=0.9954, iter_time=7.73s]
Epoch 0: 10%|█ | 1264/12384 [2:41:17<23:45:33, 7.69s/it, loss=0.0015, acc=0.9954, iter_time=7.73s]
Epoch 0: 10%|█ | 1264/12384 [2:41:25<23:45:33, 7.69s/it, loss=0.0032, acc=0.9940, iter_time=7.54s]
Epoch 0: 10%|█ | 1265/12384 [2:41:25<23:41:28, 7.67s/it, loss=0.0032, acc=0.9940, iter_time=7.54s]
Epoch 0: 10%|█ | 1265/12384 [2:41:33<23:41:28, 7.67s/it, loss=0.0019, acc=0.9945, iter_time=8.78s]
Epoch 0: 10%|█ | 1266/12384 [2:41:33<24:46:07, 8.02s/it, loss=0.0019, acc=0.9945, iter_time=8.78s]
Epoch 0: 10%|█ | 1266/12384 [2:41:41<24:46:07, 8.02s/it, loss=0.0023, acc=0.9930, iter_time=5.06s]
Epoch 0: 10%|█ | 1267/12384 [2:41:41<24:24:09, 7.90s/it, loss=0.0023, acc=0.9930, iter_time=5.06s]
Epoch 0: 10%|█ | 1267/12384 [2:41:49<24:24:09, 7.90s/it, loss=0.0022, acc=0.9947, iter_time=10.23s]
Epoch 0: 10%|█ | 1268/12384 [2:41:49<24:08:42, 7.82s/it, loss=0.0022, acc=0.9947, iter_time=10.23s]
Epoch 0: 10%|█ | 1268/12384 [2:41:56<24:08:42, 7.82s/it, loss=0.0020, acc=0.9968, iter_time=7.62s]
Epoch 0: 10%|█ | 1269/12384 [2:41:56<23:57:01, 7.76s/it, loss=0.0020, acc=0.9968, iter_time=7.62s]
Epoch 0: 10%|█ | 1269/12384 [2:42:04<23:57:01, 7.76s/it, loss=0.0016, acc=0.9966, iter_time=7.63s]
Epoch 0: 10%|█ | 1270/12384 [2:42:04<23:48:42, 7.71s/it, loss=0.0016, acc=0.9966, iter_time=7.63s]
Epoch 0: 10%|█ | 1270/12384 [2:42:12<23:48:42, 7.71s/it, loss=0.0022, acc=0.9952, iter_time=8.00s]
Epoch 0: 10%|█ | 1271/12384 [2:42:12<24:04:42, 7.80s/it, loss=0.0022, acc=0.9952, iter_time=8.00s]
Epoch 0: 10%|█ | 1271/12384 [2:42:19<24:04:42, 7.80s/it, loss=0.0109, acc=0.9800, iter_time=7.98s]
Epoch 0: 10%|█ | 1272/12384 [2:42:19<23:55:40, 7.75s/it, loss=0.0109, acc=0.9800, iter_time=7.98s]
Epoch 0: 10%|█ | 1272/12384 [2:42:27<23:55:40, 7.75s/it, loss=0.0036, acc=0.9902, iter_time=7.27s]
Epoch 0: 10%|█ | 1273/12384 [2:42:27<23:50:17, 7.72s/it, loss=0.0036, acc=0.9902, iter_time=7.27s]
Epoch 0: 10%|█ | 1273/12384 [2:42:35<23:50:17, 7.72s/it, loss=0.0007, acc=0.9990, iter_time=7.67s]
Epoch 0: 10%|█ | 1274/12384 [2:42:35<23:44:53, 7.70s/it, loss=0.0007, acc=0.9990, iter_time=7.67s]
Epoch 0: 10%|█ | 1274/12384 [2:42:42<23:44:53, 7.70s/it, loss=0.0225, acc=0.9631, iter_time=7.61s]
Epoch 0: 10%|█ | 1275/12384 [2:42:42<23:41:11, 7.68s/it, loss=0.0225, acc=0.9631, iter_time=7.61s]
Epoch 0: 10%|█ | 1275/12384 [2:42:50<23:41:11, 7.68s/it, loss=0.0045, acc=0.9963, iter_time=7.64s]
Epoch 0: 10%|█ | 1276/12384 [2:42:50<23:40:05, 7.67s/it, loss=0.0045, acc=0.9963, iter_time=7.64s]
Epoch 0: 10%|█ | 1276/12384 [2:42:58<23:40:05, 7.67s/it, loss=0.0020, acc=0.9943, iter_time=7.67s]
Epoch 0: 10%|█ | 1277/12384 [2:42:58<23:40:02, 7.67s/it, loss=0.0020, acc=0.9943, iter_time=7.67s]
Epoch 0: 10%|█ | 1277/12384 [2:43:05<23:40:02, 7.67s/it, loss=0.0007, acc=0.9991, iter_time=5.66s]
Epoch 0: 10%|█ | 1278/12384 [2:43:05<23:34:18, 7.64s/it, loss=0.0007, acc=0.9991, iter_time=5.66s]
Epoch 0: 10%|█ | 1278/12384 [2:43:13<23:34:18, 7.64s/it, loss=0.0024, acc=0.9970, iter_time=9.56s]
Epoch 0: 10%|█ | 1279/12384 [2:43:13<23:33:08, 7.64s/it, loss=0.0024, acc=0.9970, iter_time=9.56s]
Epoch 0: 10%|█ | 1279/12384 [2:43:21<23:33:08, 7.64s/it, loss=0.0004, acc=1.0000, iter_time=7.58s]
Epoch 0: 10%|█ | 1280/12384 [2:43:21<23:32:11, 7.63s/it, loss=0.0004, acc=1.0000, iter_time=7.58s]
Epoch 0: 10%|█ | 1280/12384 [2:43:28<23:32:11, 7.63s/it, loss=0.0018, acc=0.9980, iter_time=6.42s]
Epoch 0: 10%|█ | 1281/12384 [2:43:28<23:33:36, 7.64s/it, loss=0.0018, acc=0.9980, iter_time=6.42s]
Epoch 0: 10%|█ | 1281/12384 [2:43:36<23:33:36, 7.64s/it, loss=0.0370, acc=0.9481, iter_time=8.92s]
Epoch 0: 10%|█ | 1282/12384 [2:43:36<23:32:31, 7.63s/it, loss=0.0370, acc=0.9481, iter_time=8.92s]
Epoch 0: 10%|█ | 1282/12384 [2:43:43<23:32:31, 7.63s/it, loss=0.0005, acc=0.9993, iter_time=5.51s]
Epoch 0: 10%|█ | 1283/12384 [2:43:43<23:33:03, 7.64s/it, loss=0.0005, acc=0.9993, iter_time=5.51s]
Epoch 0: 10%|█ | 1283/12384 [2:43:51<23:33:03, 7.64s/it, loss=0.0015, acc=0.9951, iter_time=9.75s]
Epoch 0: 10%|█ | 1284/12384 [2:43:51<23:33:22, 7.64s/it, loss=0.0015, acc=0.9951, iter_time=9.75s]
Epoch 0: 10%|█ | 1284/12384 [2:43:59<23:33:22, 7.64s/it, loss=0.0038, acc=0.9940, iter_time=4.32s]
Epoch 0: 10%|█ | 1285/12384 [2:43:59<23:34:37, 7.65s/it, loss=0.0038, acc=0.9940, iter_time=4.32s]
Epoch 0: 10%|█ | 1285/12384 [2:44:06<23:34:37, 7.65s/it, loss=0.0010, acc=1.0000, iter_time=10.96s]
Epoch 0: 10%|█ | 1286/12384 [2:44:06<23:33:08, 7.64s/it, loss=0.0010, acc=1.0000, iter_time=10.96s]
Epoch 0: 10%|█ | 1286/12384 [2:44:14<23:33:08, 7.64s/it, loss=0.0007, acc=0.9979, iter_time=7.33s]
Epoch 0: 10%|█ | 1287/12384 [2:44:14<23:33:29, 7.64s/it, loss=0.0007, acc=0.9979, iter_time=7.33s]
Epoch 0: 10%|█ | 1287/12384 [2:44:22<23:33:29, 7.64s/it, loss=0.0015, acc=0.9954, iter_time=7.93s]
Epoch 0: 10%|█ | 1288/12384 [2:44:22<23:33:00, 7.64s/it, loss=0.0015, acc=0.9954, iter_time=7.93s]
Epoch 0: 10%|█ | 1288/12384 [2:44:29<23:33:00, 7.64s/it, loss=0.0015, acc=0.9969, iter_time=7.67s]
Epoch 0: 10%|█ | 1289/12384 [2:44:29<23:31:30, 7.63s/it, loss=0.0015, acc=0.9969, iter_time=7.67s]
Epoch 0: 10%|█ | 1289/12384 [2:44:37<23:31:30, 7.63s/it, loss=0.0031, acc=0.9954, iter_time=7.61s]
Epoch 0: 10%|█ | 1290/12384 [2:44:37<23:29:38, 7.62s/it, loss=0.0031, acc=0.9954, iter_time=7.61s]
Epoch 0: 10%|█ | 1290/12384 [2:44:45<23:29:38, 7.62s/it, loss=0.0005, acc=0.9983, iter_time=5.26s]
Epoch 0: 10%|█ | 1291/12384 [2:44:45<23:30:09, 7.63s/it, loss=0.0005, acc=0.9983, iter_time=5.26s]
Epoch 0: 10%|█ | 1291/12384 [2:44:52<23:30:09, 7.63s/it, loss=0.0014, acc=0.9966, iter_time=9.97s]
Epoch 0: 10%|█ | 1292/12384 [2:44:52<23:28:58, 7.62s/it, loss=0.0014, acc=0.9966, iter_time=9.97s]
Epoch 0: 10%|█ | 1292/12384 [2:45:00<23:28:58, 7.62s/it, loss=0.0007, acc=0.9974, iter_time=7.61s]
Epoch 0: 10%|█ | 1293/12384 [2:45:00<23:27:26, 7.61s/it, loss=0.0007, acc=0.9974, iter_time=7.61s]
Epoch 0: 10%|█ | 1293/12384 [2:45:07<23:27:26, 7.61s/it, loss=0.0015, acc=0.9986, iter_time=6.40s]
Epoch 0: 10%|█ | 1294/12384 [2:45:07<23:28:17, 7.62s/it, loss=0.0015, acc=0.9986, iter_time=6.40s]
Epoch 0: 10%|█ | 1294/12384 [2:45:15<23:28:17, 7.62s/it, loss=0.0008, acc=0.9999, iter_time=8.85s]
Epoch 0: 10%|█ | 1295/12384 [2:45:15<23:27:38, 7.62s/it, loss=0.0008, acc=0.9999, iter_time=8.85s]
Epoch 0: 10%|█ | 1295/12384 [2:45:23<23:27:38, 7.62s/it, loss=0.0011, acc=0.9996, iter_time=7.56s]
Epoch 0: 10%|█ | 1296/12384 [2:45:23<23:27:46, 7.62s/it, loss=0.0011, acc=0.9996, iter_time=7.56s]
Epoch 0: 10%|█ | 1296/12384 [2:45:31<23:27:46, 7.62s/it, loss=0.0014, acc=0.9974, iter_time=7.67s]
Epoch 0: 10%|█ | 1297/12384 [2:45:31<23:44:33, 7.71s/it, loss=0.0014, acc=0.9974, iter_time=7.67s]
Epoch 0: 10%|█ | 1297/12384 [2:45:38<23:44:33, 7.71s/it, loss=0.0012, acc=0.9978, iter_time=7.92s]
Epoch 0: 10%|█ | 1298/12384 [2:45:38<23:41:19, 7.69s/it, loss=0.0012, acc=0.9978, iter_time=7.92s]
Epoch 0: 10%|█ | 1298/12384 [2:45:46<23:41:19, 7.69s/it, loss=0.0009, acc=0.9982, iter_time=7.63s]
Epoch 0: 10%|█ | 1299/12384 [2:45:46<23:35:49, 7.66s/it, loss=0.0009, acc=0.9982, iter_time=7.63s]
Epoch 0: 10%|█ | 1299/12384 [2:45:53<23:35:49, 7.66s/it, loss=0.0009, acc=0.9992, iter_time=8.02s]
Epoch 0: 10%|█ | 1300/12384 [2:45:53<23:33:25, 7.65s/it, loss=0.0009, acc=0.9992, iter_time=8.02s]
Epoch 0: 10%|█ | 1300/12384 [2:46:01<23:33:25, 7.65s/it, loss=0.0020, acc=0.9980, iter_time=5.12s]
Epoch 0: 11%|█ | 1301/12384 [2:46:01<23:34:20, 7.66s/it, loss=0.0020, acc=0.9980, iter_time=5.12s]
Epoch 0: 11%|█ | 1301/12384 [2:46:09<23:34:20, 7.66s/it, loss=0.0051, acc=0.9890, iter_time=9.75s]
Epoch 0: 11%|█ | 1302/12384 [2:46:09<23:30:35, 7.64s/it, loss=0.0051, acc=0.9890, iter_time=9.75s]
Epoch 0: 11%|█ | 1302/12384 [2:46:16<23:30:35, 7.64s/it, loss=0.0028, acc=0.9950, iter_time=7.59s]
Epoch 0: 11%|█ | 1303/12384 [2:46:16<23:28:46, 7.63s/it, loss=0.0028, acc=0.9950, iter_time=7.59s]
Epoch 0: 11%|█ | 1303/12384 [2:46:24<23:28:46, 7.63s/it, loss=0.0018, acc=0.9936, iter_time=7.98s]
Epoch 0: 11%|█ | 1304/12384 [2:46:24<23:27:47, 7.62s/it, loss=0.0018, acc=0.9936, iter_time=7.98s]
Epoch 0: 11%|█ | 1304/12384 [2:46:32<23:27:47, 7.62s/it, loss=0.0009, acc=0.9979, iter_time=7.25s]
Epoch 0: 11%|█ | 1305/12384 [2:46:32<23:28:32, 7.63s/it, loss=0.0009, acc=0.9979, iter_time=7.25s]
Epoch 0: 11%|█ | 1305/12384 [2:46:39<23:28:32, 7.63s/it, loss=0.0008, acc=1.0000, iter_time=2.76s]
Epoch 0: 11%|█ | 1306/12384 [2:46:39<23:26:14, 7.62s/it, loss=0.0008, acc=1.0000, iter_time=2.76s]
Epoch 0: 11%|█ | 1306/12384 [2:46:47<23:26:14, 7.62s/it, loss=0.0011, acc=0.9978, iter_time=12.45s]
Epoch 0: 11%|█ | 1307/12384 [2:46:47<23:27:06, 7.62s/it, loss=0.0011, acc=0.9978, iter_time=12.45s]
Epoch 0: 11%|█ | 1307/12384 [2:46:54<23:27:06, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=7.64s]
Epoch 0: 11%|█ | 1308/12384 [2:46:54<23:27:42, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.64s]
Epoch 0: 11%|█ | 1308/12384 [2:47:02<23:27:42, 7.63s/it, loss=0.0026, acc=0.9920, iter_time=7.64s]
Epoch 0: 11%|█ | 1309/12384 [2:47:02<23:31:59, 7.65s/it, loss=0.0026, acc=0.9920, iter_time=7.64s]
Epoch 0: 11%|█ | 1309/12384 [2:47:10<23:31:59, 7.65s/it, loss=0.0018, acc=0.9961, iter_time=7.69s]
Epoch 0: 11%|█ | 1310/12384 [2:47:10<23:29:53, 7.64s/it, loss=0.0018, acc=0.9961, iter_time=7.69s]
Epoch 0: 11%|█ | 1310/12384 [2:47:17<23:29:53, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=7.63s]
Epoch 0: 11%|█ | 1311/12384 [2:47:17<23:27:24, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.63s]
Epoch 0: 11%|█ | 1311/12384 [2:47:25<23:27:24, 7.63s/it, loss=0.0026, acc=0.9940, iter_time=7.61s]
Epoch 0: 11%|█ | 1312/12384 [2:47:25<23:30:48, 7.65s/it, loss=0.0026, acc=0.9940, iter_time=7.61s]
Epoch 0: 11%|█ | 1312/12384 [2:47:33<23:30:48, 7.65s/it, loss=0.0020, acc=0.9969, iter_time=7.67s]
Epoch 0: 11%|█ | 1313/12384 [2:47:33<23:28:25, 7.63s/it, loss=0.0020, acc=0.9969, iter_time=7.67s]
Epoch 0: 11%|█ | 1313/12384 [2:47:40<23:28:25, 7.63s/it, loss=0.0014, acc=0.9957, iter_time=7.61s]
Epoch 0: 11%|█ | 1314/12384 [2:47:40<23:28:52, 7.64s/it, loss=0.0014, acc=0.9957, iter_time=7.61s]
Epoch 0: 11%|█ | 1314/12384 [2:47:48<23:28:52, 7.64s/it, loss=0.0013, acc=0.9971, iter_time=7.64s]
Epoch 0: 11%|█ | 1315/12384 [2:47:48<23:28:22, 7.63s/it, loss=0.0013, acc=0.9971, iter_time=7.64s]
Epoch 0: 11%|█ | 1315/12384 [2:47:56<23:28:22, 7.63s/it, loss=0.0030, acc=0.9924, iter_time=7.64s]
Epoch 0: 11%|█ | 1316/12384 [2:47:56<23:28:28, 7.64s/it, loss=0.0030, acc=0.9924, iter_time=7.64s]
Epoch 0: 11%|█ | 1316/12384 [2:48:03<23:28:28, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=6.68s]
Epoch 0: 11%|█ | 1317/12384 [2:48:03<23:25:45, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=6.68s]
Epoch 0: 11%|█ | 1317/12384 [2:48:11<23:25:45, 7.62s/it, loss=0.0025, acc=0.9951, iter_time=8.53s]
Epoch 0: 11%|█ | 1318/12384 [2:48:11<23:26:19, 7.63s/it, loss=0.0025, acc=0.9951, iter_time=8.53s]
Epoch 0: 11%|█ | 1318/12384 [2:48:18<23:26:19, 7.63s/it, loss=0.0006, acc=0.9979, iter_time=6.12s]
Epoch 0: 11%|█ | 1319/12384 [2:48:18<23:25:14, 7.62s/it, loss=0.0006, acc=0.9979, iter_time=6.12s]
Epoch 0: 11%|█ | 1319/12384 [2:48:26<23:25:14, 7.62s/it, loss=0.0042, acc=0.9955, iter_time=9.51s]
Epoch 0: 11%|█ | 1320/12384 [2:48:26<23:29:52, 7.65s/it, loss=0.0042, acc=0.9955, iter_time=9.51s]
Epoch 0: 11%|█ | 1320/12384 [2:48:34<23:29:52, 7.65s/it, loss=0.0033, acc=0.9970, iter_time=3.02s]
Epoch 0: 11%|█ | 1321/12384 [2:48:34<23:27:46, 7.64s/it, loss=0.0033, acc=0.9970, iter_time=3.02s]
Epoch 0: 11%|█ | 1321/12384 [2:48:41<23:27:46, 7.64s/it, loss=0.0052, acc=0.9919, iter_time=8.65s]
Epoch 0: 11%|█ | 1322/12384 [2:48:41<23:30:44, 7.65s/it, loss=0.0052, acc=0.9919, iter_time=8.65s]
Epoch 0: 11%|█ | 1322/12384 [2:48:49<23:30:44, 7.65s/it, loss=0.0019, acc=0.9965, iter_time=10.98s]
Epoch 0: 11%|█ | 1323/12384 [2:48:49<23:50:43, 7.76s/it, loss=0.0019, acc=0.9965, iter_time=10.98s]
Epoch 0: 11%|█ | 1323/12384 [2:48:57<23:50:43, 7.76s/it, loss=0.0040, acc=0.9948, iter_time=7.96s]
Epoch 0: 11%|█ | 1324/12384 [2:48:57<23:40:56, 7.71s/it, loss=0.0040, acc=0.9948, iter_time=7.96s]
Epoch 0: 11%|█ | 1324/12384 [2:49:05<23:40:56, 7.71s/it, loss=0.0020, acc=0.9962, iter_time=7.07s]
Epoch 0: 11%|█ | 1325/12384 [2:49:05<23:35:45, 7.68s/it, loss=0.0020, acc=0.9962, iter_time=7.07s]
Epoch 0: 11%|█ | 1325/12384 [2:49:12<23:35:45, 7.68s/it, loss=0.0021, acc=0.9964, iter_time=8.15s]
Epoch 0: 11%|█ | 1326/12384 [2:49:12<23:35:09, 7.68s/it, loss=0.0021, acc=0.9964, iter_time=8.15s]
Epoch 0: 11%|█ | 1326/12384 [2:49:20<23:35:09, 7.68s/it, loss=0.0052, acc=0.9894, iter_time=7.69s]
Epoch 0: 11%|█ | 1327/12384 [2:49:20<23:33:00, 7.67s/it, loss=0.0052, acc=0.9894, iter_time=7.69s]
Epoch 0: 11%|█ | 1327/12384 [2:49:27<23:33:00, 7.67s/it, loss=0.0020, acc=0.9931, iter_time=8.02s]
Epoch 0: 11%|█ | 1328/12384 [2:49:27<23:29:15, 7.65s/it, loss=0.0020, acc=0.9931, iter_time=8.02s]
Epoch 0: 11%|█ | 1328/12384 [2:49:35<23:29:15, 7.65s/it, loss=0.0017, acc=0.9981, iter_time=7.22s]
Epoch 0: 11%|█ | 1329/12384 [2:49:35<23:27:27, 7.64s/it, loss=0.0017, acc=0.9981, iter_time=7.22s]
Epoch 0: 11%|█ | 1329/12384 [2:49:43<23:27:27, 7.64s/it, loss=0.0023, acc=0.9969, iter_time=6.39s]
Epoch 0: 11%|█ | 1330/12384 [2:49:43<23:25:25, 7.63s/it, loss=0.0023, acc=0.9969, iter_time=6.39s]
Epoch 0: 11%|█ | 1330/12384 [2:49:50<23:25:25, 7.63s/it, loss=0.0037, acc=0.9956, iter_time=8.81s]
Epoch 0: 11%|█ | 1331/12384 [2:49:50<23:24:30, 7.62s/it, loss=0.0037, acc=0.9956, iter_time=8.81s]
Epoch 0: 11%|█ | 1331/12384 [2:49:58<23:24:30, 7.62s/it, loss=0.0016, acc=0.9969, iter_time=7.08s]
Epoch 0: 11%|█ | 1332/12384 [2:49:58<23:29:17, 7.65s/it, loss=0.0016, acc=0.9969, iter_time=7.08s]
Epoch 0: 11%|█ | 1332/12384 [2:50:06<23:29:17, 7.65s/it, loss=0.0008, acc=0.9974, iter_time=5.41s]
Epoch 0: 11%|█ | 1333/12384 [2:50:06<23:34:26, 7.68s/it, loss=0.0008, acc=0.9974, iter_time=5.41s]
Epoch 0: 11%|█ | 1333/12384 [2:50:13<23:34:26, 7.68s/it, loss=0.0003, acc=1.0000, iter_time=7.74s]
Epoch 0: 11%|█ | 1334/12384 [2:50:13<23:34:02, 7.68s/it, loss=0.0003, acc=1.0000, iter_time=7.74s]
Epoch 0: 11%|█ | 1334/12384 [2:50:21<23:34:02, 7.68s/it, loss=0.0009, acc=0.9973, iter_time=10.53s]
Epoch 0: 11%|█ | 1335/12384 [2:50:21<23:32:08, 7.67s/it, loss=0.0009, acc=0.9973, iter_time=10.53s]
Epoch 0: 11%|█ | 1335/12384 [2:50:29<23:32:08, 7.67s/it, loss=0.0017, acc=0.9960, iter_time=8.02s]
Epoch 0: 11%|█ | 1336/12384 [2:50:29<23:28:59, 7.65s/it, loss=0.0017, acc=0.9960, iter_time=8.02s]
Epoch 0: 11%|█ | 1336/12384 [2:50:36<23:28:59, 7.65s/it, loss=0.0069, acc=0.9884, iter_time=7.24s]
Epoch 0: 11%|█ | 1337/12384 [2:50:36<23:30:32, 7.66s/it, loss=0.0069, acc=0.9884, iter_time=7.24s]
Epoch 0: 11%|█ | 1337/12384 [2:50:44<23:30:32, 7.66s/it, loss=0.0005, acc=1.0000, iter_time=7.69s]
Epoch 0: 11%|█ | 1338/12384 [2:50:44<23:30:14, 7.66s/it, loss=0.0005, acc=1.0000, iter_time=7.69s]
Epoch 0: 11%|█ | 1338/12384 [2:50:52<23:30:14, 7.66s/it, loss=0.0011, acc=0.9988, iter_time=7.66s]
Epoch 0: 11%|█ | 1339/12384 [2:50:52<23:28:57, 7.65s/it, loss=0.0011, acc=0.9988, iter_time=7.66s]
Epoch 0: 11%|█ | 1339/12384 [2:50:59<23:28:57, 7.65s/it, loss=0.0009, acc=0.9997, iter_time=7.61s]
Epoch 0: 11%|█ | 1340/12384 [2:50:59<23:28:07, 7.65s/it, loss=0.0009, acc=0.9997, iter_time=7.61s]
Epoch 0: 11%|█ | 1340/12384 [2:51:07<23:28:07, 7.65s/it, loss=0.0023, acc=0.9950, iter_time=7.65s]
Epoch 0: 11%|█ | 1341/12384 [2:51:07<23:24:54, 7.63s/it, loss=0.0023, acc=0.9950, iter_time=7.65s]
Epoch 0: 11%|█ | 1341/12384 [2:51:15<23:24:54, 7.63s/it, loss=0.0028, acc=0.9939, iter_time=7.58s]
Epoch 0: 11%|█ | 1342/12384 [2:51:15<23:22:27, 7.62s/it, loss=0.0028, acc=0.9939, iter_time=7.58s]
Epoch 0: 11%|█ | 1342/12384 [2:51:22<23:22:27, 7.62s/it, loss=0.0016, acc=0.9969, iter_time=7.61s]
Epoch 0: 11%|█ | 1343/12384 [2:51:22<23:23:32, 7.63s/it, loss=0.0016, acc=0.9969, iter_time=7.61s]
Epoch 0: 11%|█ | 1343/12384 [2:51:30<23:23:32, 7.63s/it, loss=0.0018, acc=0.9928, iter_time=7.61s]
Epoch 0: 11%|█ | 1344/12384 [2:51:30<23:23:42, 7.63s/it, loss=0.0018, acc=0.9928, iter_time=7.61s]
Epoch 0: 11%|█ | 1344/12384 [2:51:37<23:23:42, 7.63s/it, loss=0.0014, acc=0.9959, iter_time=6.44s]
Epoch 0: 11%|█ | 1345/12384 [2:51:37<23:22:20, 7.62s/it, loss=0.0014, acc=0.9959, iter_time=6.44s]
Epoch 0: 11%|█ | 1345/12384 [2:51:45<23:22:20, 7.62s/it, loss=0.0056, acc=0.9839, iter_time=8.83s]
Epoch 0: 11%|█ | 1346/12384 [2:51:45<23:27:06, 7.65s/it, loss=0.0056, acc=0.9839, iter_time=8.83s]
Epoch 0: 11%|█ | 1346/12384 [2:51:53<23:27:06, 7.65s/it, loss=0.0010, acc=0.9984, iter_time=7.11s]
Epoch 0: 11%|█ | 1347/12384 [2:51:53<23:28:31, 7.66s/it, loss=0.0010, acc=0.9984, iter_time=7.11s]
Epoch 0: 11%|█ | 1347/12384 [2:52:00<23:28:31, 7.66s/it, loss=0.0010, acc=0.9986, iter_time=7.09s]
Epoch 0: 11%|█ | 1348/12384 [2:52:00<23:25:39, 7.64s/it, loss=0.0010, acc=0.9986, iter_time=7.09s]
Epoch 0: 11%|█ | 1348/12384 [2:52:08<23:25:39, 7.64s/it, loss=0.0025, acc=0.9925, iter_time=9.09s]
Epoch 0: 11%|█ | 1349/12384 [2:52:08<23:42:32, 7.73s/it, loss=0.0025, acc=0.9925, iter_time=9.09s]
Epoch 0: 11%|█ | 1349/12384 [2:52:16<23:42:32, 7.73s/it, loss=0.0016, acc=0.9970, iter_time=8.05s]
Epoch 0: 11%|█ | 1350/12384 [2:52:16<23:35:11, 7.70s/it, loss=0.0016, acc=0.9970, iter_time=8.05s]
Epoch 0: 11%|█ | 1350/12384 [2:52:24<23:35:11, 7.70s/it, loss=0.0138, acc=0.9784, iter_time=7.22s]
Epoch 0: 11%|█ | 1351/12384 [2:52:24<23:30:48, 7.67s/it, loss=0.0138, acc=0.9784, iter_time=7.22s]
Epoch 0: 11%|█ | 1351/12384 [2:52:31<23:30:48, 7.67s/it, loss=0.0063, acc=0.9920, iter_time=7.60s]
Epoch 0: 11%|█ | 1352/12384 [2:52:31<23:29:17, 7.66s/it, loss=0.0063, acc=0.9920, iter_time=7.60s]
Epoch 0: 11%|█ | 1352/12384 [2:52:39<23:29:17, 7.66s/it, loss=0.0010, acc=0.9994, iter_time=4.52s]
Epoch 0: 11%|█ | 1353/12384 [2:52:39<23:29:04, 7.66s/it, loss=0.0010, acc=0.9994, iter_time=4.52s]
Epoch 0: 11%|█ | 1353/12384 [2:52:47<23:29:04, 7.66s/it, loss=0.0004, acc=1.0000, iter_time=7.77s]
Epoch 0: 11%|█ | 1354/12384 [2:52:47<23:28:17, 7.66s/it, loss=0.0004, acc=1.0000, iter_time=7.77s]
Epoch 0: 11%|█ | 1354/12384 [2:52:54<23:28:17, 7.66s/it, loss=0.0013, acc=0.9980, iter_time=10.67s]
Epoch 0: 11%|█ | 1355/12384 [2:52:54<23:26:51, 7.65s/it, loss=0.0013, acc=0.9980, iter_time=10.67s]
Epoch 0: 11%|█ | 1355/12384 [2:53:02<23:26:51, 7.65s/it, loss=0.0019, acc=0.9979, iter_time=5.56s]
Epoch 0: 11%|█ | 1356/12384 [2:53:02<23:26:20, 7.65s/it, loss=0.0019, acc=0.9979, iter_time=5.56s]
Epoch 0: 11%|█ | 1356/12384 [2:53:09<23:26:20, 7.65s/it, loss=0.0033, acc=0.9935, iter_time=9.72s]
Epoch 0: 11%|█ | 1357/12384 [2:53:09<23:24:06, 7.64s/it, loss=0.0033, acc=0.9935, iter_time=9.72s]
Epoch 0: 11%|█ | 1357/12384 [2:53:17<23:24:06, 7.64s/it, loss=0.0008, acc=0.9971, iter_time=7.63s]
Epoch 0: 11%|█ | 1358/12384 [2:53:17<23:23:38, 7.64s/it, loss=0.0008, acc=0.9971, iter_time=7.63s]
Epoch 0: 11%|█ | 1358/12384 [2:53:25<23:23:38, 7.64s/it, loss=0.0016, acc=0.9977, iter_time=7.63s]
Epoch 0: 11%|█ | 1359/12384 [2:53:25<23:20:57, 7.62s/it, loss=0.0016, acc=0.9977, iter_time=7.63s]
Epoch 0: 11%|█ | 1359/12384 [2:53:32<23:20:57, 7.62s/it, loss=0.0008, acc=0.9981, iter_time=7.98s]
Epoch 0: 11%|█ | 1360/12384 [2:53:32<23:20:22, 7.62s/it, loss=0.0008, acc=0.9981, iter_time=7.98s]
Epoch 0: 11%|█ | 1360/12384 [2:53:40<23:20:22, 7.62s/it, loss=0.0043, acc=0.9899, iter_time=7.23s]
Epoch 0: 11%|█ | 1361/12384 [2:53:40<23:20:19, 7.62s/it, loss=0.0043, acc=0.9899, iter_time=7.23s]
Epoch 0: 11%|█ | 1361/12384 [2:53:48<23:20:19, 7.62s/it, loss=0.0013, acc=0.9979, iter_time=7.63s]
Epoch 0: 11%|█ | 1362/12384 [2:53:48<23:19:55, 7.62s/it, loss=0.0013, acc=0.9979, iter_time=7.63s]
Epoch 0: 11%|█ | 1362/12384 [2:53:55<23:19:55, 7.62s/it, loss=0.0033, acc=0.9928, iter_time=7.37s]
Epoch 0: 11%|█ | 1363/12384 [2:53:55<23:20:20, 7.62s/it, loss=0.0033, acc=0.9928, iter_time=7.37s]
Epoch 0: 11%|█ | 1363/12384 [2:54:03<23:20:20, 7.62s/it, loss=0.0121, acc=0.9796, iter_time=7.87s]
Epoch 0: 11%|█ | 1364/12384 [2:54:03<23:18:55, 7.62s/it, loss=0.0121, acc=0.9796, iter_time=7.87s]
Epoch 0: 11%|█ | 1364/12384 [2:54:10<23:18:55, 7.62s/it, loss=0.0008, acc=0.9981, iter_time=7.61s]
Epoch 0: 11%|█ | 1365/12384 [2:54:10<23:20:06, 7.62s/it, loss=0.0008, acc=0.9981, iter_time=7.61s]
Epoch 0: 11%|█ | 1365/12384 [2:54:18<23:20:06, 7.62s/it, loss=0.0041, acc=0.9914, iter_time=7.72s]
Epoch 0: 11%|█ | 1366/12384 [2:54:18<23:23:20, 7.64s/it, loss=0.0041, acc=0.9914, iter_time=7.72s]
Epoch 0: 11%|█ | 1366/12384 [2:54:26<23:23:20, 7.64s/it, loss=0.0021, acc=0.9929, iter_time=5.82s]
Epoch 0: 11%|█ | 1367/12384 [2:54:26<23:27:25, 7.66s/it, loss=0.0021, acc=0.9929, iter_time=5.82s]
Epoch 0: 11%|█ | 1367/12384 [2:54:33<23:27:25, 7.66s/it, loss=0.0012, acc=0.9947, iter_time=9.90s]
Epoch 0: 11%|█ | 1368/12384 [2:54:33<23:26:38, 7.66s/it, loss=0.0012, acc=0.9947, iter_time=9.90s]
Epoch 0: 11%|█ | 1368/12384 [2:54:41<23:26:38, 7.66s/it, loss=0.0060, acc=0.9860, iter_time=7.27s]
Epoch 0: 11%|█ | 1369/12384 [2:54:41<23:26:07, 7.66s/it, loss=0.0060, acc=0.9860, iter_time=7.27s]
Epoch 0: 11%|█ | 1369/12384 [2:54:49<23:26:07, 7.66s/it, loss=0.0057, acc=0.9873, iter_time=7.63s]
Epoch 0: 11%|█ | 1370/12384 [2:54:49<23:23:50, 7.65s/it, loss=0.0057, acc=0.9873, iter_time=7.63s]
Epoch 0: 11%|█ | 1370/12384 [2:54:56<23:23:50, 7.65s/it, loss=0.0010, acc=0.9993, iter_time=7.64s]
Epoch 0: 11%|█ | 1371/12384 [2:54:56<23:23:21, 7.65s/it, loss=0.0010, acc=0.9993, iter_time=7.64s]
Epoch 0: 11%|█ | 1371/12384 [2:55:04<23:23:21, 7.65s/it, loss=0.0004, acc=0.9988, iter_time=7.63s]
Epoch 0: 11%|█ | 1372/12384 [2:55:04<23:22:13, 7.64s/it, loss=0.0004, acc=0.9988, iter_time=7.63s]
Epoch 0: 11%|█ | 1372/12384 [2:55:12<23:22:13, 7.64s/it, loss=0.0032, acc=0.9937, iter_time=5.56s]
Epoch 0: 11%|█ | 1373/12384 [2:55:12<23:20:45, 7.63s/it, loss=0.0032, acc=0.9937, iter_time=5.56s]
Epoch 0: 11%|█ | 1373/12384 [2:55:19<23:20:45, 7.63s/it, loss=0.0027, acc=0.9947, iter_time=9.92s]
Epoch 0: 11%|█ | 1374/12384 [2:55:19<23:31:56, 7.69s/it, loss=0.0027, acc=0.9947, iter_time=9.92s]
Epoch 0: 11%|█ | 1374/12384 [2:55:27<23:31:56, 7.69s/it, loss=0.0007, acc=0.9998, iter_time=7.58s]
Epoch 0: 11%|█ | 1375/12384 [2:55:27<23:28:09, 7.67s/it, loss=0.0007, acc=0.9998, iter_time=7.58s]
Epoch 0: 11%|█ | 1375/12384 [2:55:35<23:28:09, 7.67s/it, loss=0.0004, acc=1.0000, iter_time=8.12s]
Epoch 0: 11%|█ | 1376/12384 [2:55:35<23:46:18, 7.77s/it, loss=0.0004, acc=1.0000, iter_time=8.12s]
Epoch 0: 11%|█ | 1376/12384 [2:55:43<23:46:18, 7.77s/it, loss=0.0007, acc=0.9998, iter_time=4.93s]
Epoch 0: 11%|█ | 1377/12384 [2:55:43<23:40:00, 7.74s/it, loss=0.0007, acc=0.9998, iter_time=4.93s]
Epoch 0: 11%|█ | 1377/12384 [2:55:50<23:40:00, 7.74s/it, loss=0.0032, acc=0.9939, iter_time=10.27s]
Epoch 0: 11%|█ | 1378/12384 [2:55:50<23:35:33, 7.72s/it, loss=0.0032, acc=0.9939, iter_time=10.27s]
Epoch 0: 11%|█ | 1378/12384 [2:55:58<23:35:33, 7.72s/it, loss=0.0039, acc=0.9865, iter_time=7.67s]
Epoch 0: 11%|█ | 1379/12384 [2:55:58<23:30:03, 7.69s/it, loss=0.0039, acc=0.9865, iter_time=7.67s]
Epoch 0: 11%|█ | 1379/12384 [2:56:06<23:30:03, 7.69s/it, loss=0.0002, acc=1.0000, iter_time=6.68s]
Epoch 0: 11%|█ | 1380/12384 [2:56:06<23:27:23, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=6.68s]
Epoch 0: 11%|█ | 1380/12384 [2:56:13<23:27:23, 7.67s/it, loss=0.0021, acc=0.9973, iter_time=8.59s]
Epoch 0: 11%|█ | 1381/12384 [2:56:13<23:26:17, 7.67s/it, loss=0.0021, acc=0.9973, iter_time=8.59s]
Epoch 0: 11%|█ | 1381/12384 [2:56:21<23:26:17, 7.67s/it, loss=0.0019, acc=0.9953, iter_time=5.34s]
Epoch 0: 11%|█ | 1382/12384 [2:56:21<23:26:31, 7.67s/it, loss=0.0019, acc=0.9953, iter_time=5.34s]
Epoch 0: 11%|█ | 1382/12384 [2:56:29<23:26:31, 7.67s/it, loss=0.0061, acc=0.9972, iter_time=9.72s]
Epoch 0: 11%|█ | 1383/12384 [2:56:29<23:25:36, 7.67s/it, loss=0.0061, acc=0.9972, iter_time=9.72s]
Epoch 0: 11%|█ | 1383/12384 [2:56:36<23:25:36, 7.67s/it, loss=0.0016, acc=0.9940, iter_time=8.27s]
Epoch 0: 11%|█ | 1384/12384 [2:56:36<23:23:08, 7.65s/it, loss=0.0016, acc=0.9940, iter_time=8.27s]
Epoch 0: 11%|█ | 1384/12384 [2:56:44<23:23:08, 7.65s/it, loss=0.0016, acc=0.9941, iter_time=7.24s]
Epoch 0: 11%|█ | 1385/12384 [2:56:44<23:23:42, 7.66s/it, loss=0.0016, acc=0.9941, iter_time=7.24s]
Epoch 0: 11%|█ | 1385/12384 [2:56:52<23:23:42, 7.66s/it, loss=0.0007, acc=1.0000, iter_time=7.68s]
Epoch 0: 11%|█ | 1386/12384 [2:56:52<23:23:45, 7.66s/it, loss=0.0007, acc=1.0000, iter_time=7.68s]
Epoch 0: 11%|█ | 1386/12384 [2:56:59<23:23:45, 7.66s/it, loss=0.0016, acc=0.9959, iter_time=7.67s]
Epoch 0: 11%|█ | 1387/12384 [2:56:59<23:22:35, 7.65s/it, loss=0.0016, acc=0.9959, iter_time=7.67s]
Epoch 0: 11%|█ | 1387/12384 [2:57:07<23:22:35, 7.65s/it, loss=0.0024, acc=0.9940, iter_time=6.70s]
Epoch 0: 11%|█ | 1388/12384 [2:57:07<23:21:27, 7.65s/it, loss=0.0024, acc=0.9940, iter_time=6.70s]
Epoch 0: 11%|█ | 1388/12384 [2:57:15<23:21:27, 7.65s/it, loss=0.0030, acc=0.9943, iter_time=8.58s]
Epoch 0: 11%|█ | 1389/12384 [2:57:15<23:21:08, 7.65s/it, loss=0.0030, acc=0.9943, iter_time=8.58s]
Epoch 0: 11%|█ | 1389/12384 [2:57:22<23:21:08, 7.65s/it, loss=0.0060, acc=0.9835, iter_time=5.33s]
Epoch 0: 11%|█ | 1390/12384 [2:57:22<23:21:16, 7.65s/it, loss=0.0060, acc=0.9835, iter_time=5.33s]
Epoch 0: 11%|█ | 1390/12384 [2:57:30<23:21:16, 7.65s/it, loss=0.0015, acc=0.9946, iter_time=9.97s]
Epoch 0: 11%|█ | 1391/12384 [2:57:30<23:20:13, 7.64s/it, loss=0.0015, acc=0.9946, iter_time=9.97s]
Epoch 0: 11%|█ | 1391/12384 [2:57:37<23:20:13, 7.64s/it, loss=0.0061, acc=0.9859, iter_time=7.57s]
Epoch 0: 11%|█ | 1392/12384 [2:57:37<23:18:32, 7.63s/it, loss=0.0061, acc=0.9859, iter_time=7.57s]
Epoch 0: 11%|█ | 1392/12384 [2:57:45<23:18:32, 7.63s/it, loss=0.0007, acc=0.9968, iter_time=7.64s]
Epoch 0: 11%|█ | 1393/12384 [2:57:45<23:18:39, 7.64s/it, loss=0.0007, acc=0.9968, iter_time=7.64s]
Epoch 0: 11%|█ | 1393/12384 [2:57:53<23:18:39, 7.64s/it, loss=0.0011, acc=0.9962, iter_time=5.86s]
Epoch 0: 11%|█▏ | 1394/12384 [2:57:53<23:18:13, 7.63s/it, loss=0.0011, acc=0.9962, iter_time=5.86s]
Epoch 0: 11%|█▏ | 1394/12384 [2:58:00<23:18:13, 7.63s/it, loss=0.0013, acc=0.9985, iter_time=9.44s]
Epoch 0: 11%|█▏ | 1395/12384 [2:58:00<23:16:59, 7.63s/it, loss=0.0013, acc=0.9985, iter_time=9.44s]
Epoch 0: 11%|█▏ | 1395/12384 [2:58:08<23:16:59, 7.63s/it, loss=0.0034, acc=0.9940, iter_time=7.62s]
Epoch 0: 11%|█▏ | 1396/12384 [2:58:08<23:17:17, 7.63s/it, loss=0.0034, acc=0.9940, iter_time=7.62s]
Epoch 0: 11%|█▏ | 1396/12384 [2:58:16<23:17:17, 7.63s/it, loss=0.0015, acc=0.9980, iter_time=7.61s]
Epoch 0: 11%|█▏ | 1397/12384 [2:58:16<23:15:04, 7.62s/it, loss=0.0015, acc=0.9980, iter_time=7.61s]
Epoch 0: 11%|█▏ | 1397/12384 [2:58:23<23:15:04, 7.62s/it, loss=0.0027, acc=0.9903, iter_time=6.09s]
Epoch 0: 11%|█▏ | 1398/12384 [2:58:23<23:13:33, 7.61s/it, loss=0.0027, acc=0.9903, iter_time=6.09s]
Epoch 0: 11%|█▏ | 1398/12384 [2:58:31<23:13:33, 7.61s/it, loss=0.0011, acc=0.9960, iter_time=9.10s]
Epoch 0: 11%|█▏ | 1399/12384 [2:58:31<23:16:42, 7.63s/it, loss=0.0011, acc=0.9960, iter_time=9.10s]
Epoch 0: 11%|█▏ | 1399/12384 [2:58:38<23:16:42, 7.63s/it, loss=0.0051, acc=0.9938, iter_time=8.07s]
Epoch 0: 11%|█▏ | 1400/12384 [2:58:38<23:15:07, 7.62s/it, loss=0.0051, acc=0.9938, iter_time=8.07s]
Epoch 0: 11%|█▏ | 1400/12384 [2:58:46<23:15:07, 7.62s/it, loss=0.0021, acc=0.9899, iter_time=7.51s]
Epoch 0: 11%|█▏ | 1401/12384 [2:58:46<23:30:28, 7.71s/it, loss=0.0021, acc=0.9899, iter_time=7.51s]
Epoch 0: 11%|█▏ | 1401/12384 [2:58:54<23:30:28, 7.71s/it, loss=0.0022, acc=0.9952, iter_time=7.64s]
Epoch 0: 11%|█▏ | 1402/12384 [2:58:54<23:44:02, 7.78s/it, loss=0.0022, acc=0.9952, iter_time=7.64s]
Epoch 0: 11%|█▏ | 1402/12384 [2:59:02<23:44:02, 7.78s/it, loss=0.0016, acc=0.9975, iter_time=4.63s]
Epoch 0: 11%|█▏ | 1403/12384 [2:59:02<23:33:59, 7.73s/it, loss=0.0016, acc=0.9975, iter_time=4.63s]
Epoch 0: 11%|█▏ | 1403/12384 [2:59:09<23:33:59, 7.73s/it, loss=0.0006, acc=0.9989, iter_time=8.28s]
Epoch 0: 11%|█▏ | 1404/12384 [2:59:09<23:27:31, 7.69s/it, loss=0.0006, acc=0.9989, iter_time=8.28s]
Epoch 0: 11%|█▏ | 1404/12384 [2:59:17<23:27:31, 7.69s/it, loss=0.0010, acc=0.9990, iter_time=9.60s]
Epoch 0: 11%|█▏ | 1405/12384 [2:59:17<23:25:23, 7.68s/it, loss=0.0010, acc=0.9990, iter_time=9.60s]
Epoch 0: 11%|█▏ | 1405/12384 [2:59:25<23:25:23, 7.68s/it, loss=0.0004, acc=0.9985, iter_time=8.27s]
Epoch 0: 11%|█▏ | 1406/12384 [2:59:25<23:23:02, 7.67s/it, loss=0.0004, acc=0.9985, iter_time=8.27s]
Epoch 0: 11%|█▏ | 1406/12384 [2:59:32<23:23:02, 7.67s/it, loss=0.0011, acc=0.9982, iter_time=7.64s]
Epoch 0: 11%|█▏ | 1407/12384 [2:59:32<23:22:28, 7.67s/it, loss=0.0011, acc=0.9982, iter_time=7.64s]
Epoch 0: 11%|█▏ | 1407/12384 [2:59:40<23:22:28, 7.67s/it, loss=0.0006, acc=1.0000, iter_time=8.05s]
Epoch 0: 11%|█▏ | 1408/12384 [2:59:40<23:25:01, 7.68s/it, loss=0.0006, acc=1.0000, iter_time=8.05s]
Epoch 0: 11%|█▏ | 1408/12384 [2:59:48<23:25:01, 7.68s/it, loss=0.0032, acc=0.9934, iter_time=7.33s]
Epoch 0: 11%|█▏ | 1409/12384 [2:59:48<23:21:49, 7.66s/it, loss=0.0032, acc=0.9934, iter_time=7.33s]
Epoch 0: 11%|█▏ | 1409/12384 [2:59:55<23:21:49, 7.66s/it, loss=0.0015, acc=0.9966, iter_time=7.32s]
Epoch 0: 11%|█▏ | 1410/12384 [2:59:55<23:21:03, 7.66s/it, loss=0.0015, acc=0.9966, iter_time=7.32s]
Epoch 0: 11%|█▏ | 1410/12384 [3:00:03<23:21:03, 7.66s/it, loss=0.0012, acc=0.9982, iter_time=7.95s]
Epoch 0: 11%|█▏ | 1411/12384 [3:00:03<23:20:15, 7.66s/it, loss=0.0012, acc=0.9982, iter_time=7.95s]
Epoch 0: 11%|█▏ | 1411/12384 [3:00:11<23:20:15, 7.66s/it, loss=0.0020, acc=0.9994, iter_time=7.64s]
Epoch 0: 11%|█▏ | 1412/12384 [3:00:11<23:18:34, 7.65s/it, loss=0.0020, acc=0.9994, iter_time=7.64s]
Epoch 0: 11%|█▏ | 1412/12384 [3:00:18<23:18:34, 7.65s/it, loss=0.0019, acc=0.9947, iter_time=7.63s]
Epoch 0: 11%|█▏ | 1413/12384 [3:00:18<23:15:54, 7.63s/it, loss=0.0019, acc=0.9947, iter_time=7.63s]
Epoch 0: 11%|█▏ | 1413/12384 [3:00:26<23:15:54, 7.63s/it, loss=0.0021, acc=0.9964, iter_time=4.76s]
Epoch 0: 11%|█▏ | 1414/12384 [3:00:26<23:17:34, 7.64s/it, loss=0.0021, acc=0.9964, iter_time=4.76s]
Epoch 0: 11%|█▏ | 1414/12384 [3:00:34<23:17:34, 7.64s/it, loss=0.0006, acc=0.9998, iter_time=10.50s]
Epoch 0: 11%|█▏ | 1415/12384 [3:00:34<23:18:40, 7.65s/it, loss=0.0006, acc=0.9998, iter_time=10.50s]
Epoch 0: 11%|█▏ | 1415/12384 [3:00:41<23:18:40, 7.65s/it, loss=0.0006, acc=0.9977, iter_time=8.05s]
Epoch 0: 11%|█▏ | 1416/12384 [3:00:41<23:17:56, 7.65s/it, loss=0.0006, acc=0.9977, iter_time=8.05s]
Epoch 0: 11%|█▏ | 1416/12384 [3:00:49<23:17:56, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.26s]
Epoch 0: 11%|█▏ | 1417/12384 [3:00:49<23:16:17, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.26s]
Epoch 0: 11%|█▏ | 1417/12384 [3:00:56<23:16:17, 7.64s/it, loss=0.0051, acc=0.9926, iter_time=5.57s]
Epoch 0: 11%|█▏ | 1418/12384 [3:00:56<23:15:03, 7.63s/it, loss=0.0051, acc=0.9926, iter_time=5.57s]
Epoch 0: 11%|█▏ | 1418/12384 [3:01:04<23:15:03, 7.63s/it, loss=0.0020, acc=0.9930, iter_time=8.49s]
Epoch 0: 11%|█▏ | 1419/12384 [3:01:04<23:15:50, 7.64s/it, loss=0.0020, acc=0.9930, iter_time=8.49s]
Epoch 0: 11%|█▏ | 1419/12384 [3:01:12<23:15:50, 7.64s/it, loss=0.0010, acc=0.9988, iter_time=8.83s]
Epoch 0: 11%|█▏ | 1420/12384 [3:01:12<23:13:23, 7.63s/it, loss=0.0010, acc=0.9988, iter_time=8.83s]
Epoch 0: 11%|█▏ | 1420/12384 [3:01:19<23:13:23, 7.63s/it, loss=0.0003, acc=0.9995, iter_time=7.59s]
Epoch 0: 11%|█▏ | 1421/12384 [3:01:19<23:12:43, 7.62s/it, loss=0.0003, acc=0.9995, iter_time=7.59s]
Epoch 0: 11%|█▏ | 1421/12384 [3:01:27<23:12:43, 7.62s/it, loss=0.0063, acc=0.9903, iter_time=7.62s]
Epoch 0: 11%|█▏ | 1422/12384 [3:01:27<23:14:12, 7.63s/it, loss=0.0063, acc=0.9903, iter_time=7.62s]
Epoch 0: 11%|█▏ | 1422/12384 [3:01:35<23:14:12, 7.63s/it, loss=0.0008, acc=0.9993, iter_time=7.67s]
Epoch 0: 11%|█▏ | 1423/12384 [3:01:35<23:13:05, 7.63s/it, loss=0.0008, acc=0.9993, iter_time=7.67s]
Epoch 0: 11%|█▏ | 1423/12384 [3:01:42<23:13:05, 7.63s/it, loss=0.0028, acc=0.9919, iter_time=7.98s]
Epoch 0: 11%|█▏ | 1424/12384 [3:01:42<23:12:42, 7.62s/it, loss=0.0028, acc=0.9919, iter_time=7.98s]
Epoch 0: 11%|█▏ | 1424/12384 [3:01:50<23:12:42, 7.62s/it, loss=0.0028, acc=0.9949, iter_time=7.24s]
Epoch 0: 12%|█▏ | 1425/12384 [3:01:50<23:11:21, 7.62s/it, loss=0.0028, acc=0.9949, iter_time=7.24s]
Epoch 0: 12%|█▏ | 1425/12384 [3:01:57<23:11:21, 7.62s/it, loss=0.0007, acc=0.9964, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1426/12384 [3:01:57<23:12:19, 7.62s/it, loss=0.0007, acc=0.9964, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1426/12384 [3:02:05<23:12:19, 7.62s/it, loss=0.0003, acc=0.9998, iter_time=6.40s]
Epoch 0: 12%|█▏ | 1427/12384 [3:02:05<23:12:11, 7.62s/it, loss=0.0003, acc=0.9998, iter_time=6.40s]
Epoch 0: 12%|█▏ | 1427/12384 [3:02:13<23:12:11, 7.62s/it, loss=0.0009, acc=0.9981, iter_time=6.83s]
Epoch 0: 12%|█▏ | 1428/12384 [3:02:13<23:11:27, 7.62s/it, loss=0.0009, acc=0.9981, iter_time=6.83s]
Epoch 0: 12%|█▏ | 1428/12384 [3:02:21<23:11:27, 7.62s/it, loss=0.0012, acc=0.9981, iter_time=9.67s]
Epoch 0: 12%|█▏ | 1429/12384 [3:02:21<23:31:37, 7.73s/it, loss=0.0012, acc=0.9981, iter_time=9.67s]
Epoch 0: 12%|█▏ | 1429/12384 [3:02:28<23:31:37, 7.73s/it, loss=0.0014, acc=0.9982, iter_time=7.96s]
Epoch 0: 12%|█▏ | 1430/12384 [3:02:28<23:25:29, 7.70s/it, loss=0.0014, acc=0.9982, iter_time=7.96s]
Epoch 0: 12%|█▏ | 1430/12384 [3:02:36<23:25:29, 7.70s/it, loss=0.0027, acc=0.9930, iter_time=7.63s]
Epoch 0: 12%|█▏ | 1431/12384 [3:02:36<23:21:29, 7.68s/it, loss=0.0027, acc=0.9930, iter_time=7.63s]
Epoch 0: 12%|█▏ | 1431/12384 [3:02:44<23:21:29, 7.68s/it, loss=0.0011, acc=0.9973, iter_time=7.57s]
Epoch 0: 12%|█▏ | 1432/12384 [3:02:44<23:18:01, 7.66s/it, loss=0.0011, acc=0.9973, iter_time=7.57s]
Epoch 0: 12%|█▏ | 1432/12384 [3:02:51<23:18:01, 7.66s/it, loss=0.0040, acc=0.9944, iter_time=7.64s]
Epoch 0: 12%|█▏ | 1433/12384 [3:02:51<23:13:51, 7.64s/it, loss=0.0040, acc=0.9944, iter_time=7.64s]
Epoch 0: 12%|█▏ | 1433/12384 [3:02:59<23:13:51, 7.64s/it, loss=0.0021, acc=0.9966, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1434/12384 [3:02:59<23:15:20, 7.65s/it, loss=0.0021, acc=0.9966, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1434/12384 [3:03:06<23:15:20, 7.65s/it, loss=0.0005, acc=0.9998, iter_time=4.50s]
Epoch 0: 12%|█▏ | 1435/12384 [3:03:06<23:13:16, 7.64s/it, loss=0.0005, acc=0.9998, iter_time=4.50s]
Epoch 0: 12%|█▏ | 1435/12384 [3:03:14<23:13:16, 7.64s/it, loss=0.0005, acc=1.0000, iter_time=10.75s]
Epoch 0: 12%|█▏ | 1436/12384 [3:03:14<23:14:10, 7.64s/it, loss=0.0005, acc=1.0000, iter_time=10.75s]
Epoch 0: 12%|█▏ | 1436/12384 [3:03:22<23:14:10, 7.64s/it, loss=0.0034, acc=0.9931, iter_time=7.65s]
Epoch 0: 12%|█▏ | 1437/12384 [3:03:22<23:12:35, 7.63s/it, loss=0.0034, acc=0.9931, iter_time=7.65s]
Epoch 0: 12%|█▏ | 1437/12384 [3:03:29<23:12:35, 7.63s/it, loss=0.0005, acc=0.9977, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1438/12384 [3:03:29<23:10:44, 7.62s/it, loss=0.0005, acc=0.9977, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1438/12384 [3:03:37<23:10:44, 7.62s/it, loss=0.0027, acc=0.9941, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1439/12384 [3:03:37<23:10:54, 7.62s/it, loss=0.0027, acc=0.9941, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1439/12384 [3:03:45<23:10:54, 7.62s/it, loss=0.0031, acc=0.9954, iter_time=8.01s]
Epoch 0: 12%|█▏ | 1440/12384 [3:03:45<23:10:25, 7.62s/it, loss=0.0031, acc=0.9954, iter_time=8.01s]
Epoch 0: 12%|█▏ | 1440/12384 [3:03:52<23:10:25, 7.62s/it, loss=0.0094, acc=0.9850, iter_time=7.22s]
Epoch 0: 12%|█▏ | 1441/12384 [3:03:52<23:08:47, 7.61s/it, loss=0.0094, acc=0.9850, iter_time=7.22s]
Epoch 0: 12%|█▏ | 1441/12384 [3:04:00<23:08:47, 7.61s/it, loss=0.0019, acc=0.9966, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1442/12384 [3:04:00<23:10:23, 7.62s/it, loss=0.0019, acc=0.9966, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1442/12384 [3:04:07<23:10:23, 7.62s/it, loss=0.0021, acc=0.9978, iter_time=7.64s]
Epoch 0: 12%|█▏ | 1443/12384 [3:04:07<23:10:14, 7.62s/it, loss=0.0021, acc=0.9978, iter_time=7.64s]
Epoch 0: 12%|█▏ | 1443/12384 [3:04:15<23:10:14, 7.62s/it, loss=0.0011, acc=0.9958, iter_time=7.61s]
Epoch 0: 12%|█▏ | 1444/12384 [3:04:15<23:11:39, 7.63s/it, loss=0.0011, acc=0.9958, iter_time=7.61s]
Epoch 0: 12%|█▏ | 1444/12384 [3:04:23<23:11:39, 7.63s/it, loss=0.0011, acc=0.9987, iter_time=6.79s]
Epoch 0: 12%|█▏ | 1445/12384 [3:04:23<23:10:07, 7.62s/it, loss=0.0011, acc=0.9987, iter_time=6.79s]
Epoch 0: 12%|█▏ | 1445/12384 [3:04:30<23:10:07, 7.62s/it, loss=0.0044, acc=0.9944, iter_time=8.46s]
Epoch 0: 12%|█▏ | 1446/12384 [3:04:30<23:13:12, 7.64s/it, loss=0.0044, acc=0.9944, iter_time=8.46s]
Epoch 0: 12%|█▏ | 1446/12384 [3:04:38<23:13:12, 7.64s/it, loss=0.0004, acc=0.9998, iter_time=7.69s]
Epoch 0: 12%|█▏ | 1447/12384 [3:04:38<23:10:50, 7.63s/it, loss=0.0004, acc=0.9998, iter_time=7.69s]
Epoch 0: 12%|█▏ | 1447/12384 [3:04:46<23:10:50, 7.63s/it, loss=0.0019, acc=0.9938, iter_time=7.84s]
Epoch 0: 12%|█▏ | 1448/12384 [3:04:46<23:16:35, 7.66s/it, loss=0.0019, acc=0.9938, iter_time=7.84s]
Epoch 0: 12%|█▏ | 1448/12384 [3:04:53<23:16:35, 7.66s/it, loss=0.0006, acc=0.9987, iter_time=5.50s]
Epoch 0: 12%|█▏ | 1449/12384 [3:04:53<23:15:42, 7.66s/it, loss=0.0006, acc=0.9987, iter_time=5.50s]
Epoch 0: 12%|█▏ | 1449/12384 [3:05:01<23:15:42, 7.66s/it, loss=0.0007, acc=0.9996, iter_time=10.08s]
Epoch 0: 12%|█▏ | 1450/12384 [3:05:01<23:14:28, 7.65s/it, loss=0.0007, acc=0.9996, iter_time=10.08s]
Epoch 0: 12%|█▏ | 1450/12384 [3:05:09<23:14:28, 7.65s/it, loss=0.0008, acc=0.9987, iter_time=7.22s]
Epoch 0: 12%|█▏ | 1451/12384 [3:05:09<23:13:06, 7.65s/it, loss=0.0008, acc=0.9987, iter_time=7.22s]
Epoch 0: 12%|█▏ | 1451/12384 [3:05:16<23:13:06, 7.65s/it, loss=0.0007, acc=0.9985, iter_time=7.63s]
Epoch 0: 12%|█▏ | 1452/12384 [3:05:16<23:11:34, 7.64s/it, loss=0.0007, acc=0.9985, iter_time=7.63s]
Epoch 0: 12%|█▏ | 1452/12384 [3:05:24<23:11:34, 7.64s/it, loss=0.0014, acc=0.9968, iter_time=7.60s]
Epoch 0: 12%|█▏ | 1453/12384 [3:05:24<23:10:29, 7.63s/it, loss=0.0014, acc=0.9968, iter_time=7.60s]
Epoch 0: 12%|█▏ | 1453/12384 [3:05:31<23:10:29, 7.63s/it, loss=0.0010, acc=0.9983, iter_time=6.71s]
Epoch 0: 12%|█▏ | 1454/12384 [3:05:31<23:08:18, 7.62s/it, loss=0.0010, acc=0.9983, iter_time=6.71s]
Epoch 0: 12%|█▏ | 1454/12384 [3:05:39<23:08:18, 7.62s/it, loss=0.0004, acc=0.9981, iter_time=7.68s]
Epoch 0: 12%|█▏ | 1455/12384 [3:05:39<23:29:52, 7.74s/it, loss=0.0004, acc=0.9981, iter_time=7.68s]
Epoch 0: 12%|█▏ | 1455/12384 [3:05:47<23:29:52, 7.74s/it, loss=0.0004, acc=0.9999, iter_time=9.24s]
Epoch 0: 12%|█▏ | 1456/12384 [3:05:47<23:21:42, 7.70s/it, loss=0.0004, acc=0.9999, iter_time=9.24s]
Epoch 0: 12%|█▏ | 1456/12384 [3:05:55<23:21:42, 7.70s/it, loss=0.0004, acc=0.9986, iter_time=6.27s]
Epoch 0: 12%|█▏ | 1457/12384 [3:05:55<23:18:49, 7.68s/it, loss=0.0004, acc=0.9986, iter_time=6.27s]
Epoch 0: 12%|█▏ | 1457/12384 [3:06:02<23:18:49, 7.68s/it, loss=0.0035, acc=0.9884, iter_time=8.58s]
Epoch 0: 12%|█▏ | 1458/12384 [3:06:02<23:15:22, 7.66s/it, loss=0.0035, acc=0.9884, iter_time=8.58s]
Epoch 0: 12%|█▏ | 1458/12384 [3:06:10<23:15:22, 7.66s/it, loss=0.0033, acc=0.9933, iter_time=5.30s]
Epoch 0: 12%|█▏ | 1459/12384 [3:06:10<23:12:52, 7.65s/it, loss=0.0033, acc=0.9933, iter_time=5.30s]
Epoch 0: 12%|█▏ | 1459/12384 [3:06:18<23:12:52, 7.65s/it, loss=0.0028, acc=0.9899, iter_time=9.96s]
Epoch 0: 12%|█▏ | 1460/12384 [3:06:18<23:09:56, 7.63s/it, loss=0.0028, acc=0.9899, iter_time=9.96s]
Epoch 0: 12%|█▏ | 1460/12384 [3:06:25<23:09:56, 7.63s/it, loss=0.0006, acc=0.9972, iter_time=6.10s]
Epoch 0: 12%|█▏ | 1461/12384 [3:06:25<23:08:45, 7.63s/it, loss=0.0006, acc=0.9972, iter_time=6.10s]
Epoch 0: 12%|█▏ | 1461/12384 [3:06:33<23:08:45, 7.63s/it, loss=0.0017, acc=0.9976, iter_time=9.11s]
Epoch 0: 12%|█▏ | 1462/12384 [3:06:33<23:07:25, 7.62s/it, loss=0.0017, acc=0.9976, iter_time=9.11s]
Epoch 0: 12%|█▏ | 1462/12384 [3:06:40<23:07:25, 7.62s/it, loss=0.0008, acc=0.9980, iter_time=7.63s]
Epoch 0: 12%|█▏ | 1463/12384 [3:06:40<23:07:26, 7.62s/it, loss=0.0008, acc=0.9980, iter_time=7.63s]
Epoch 0: 12%|█▏ | 1463/12384 [3:06:48<23:07:26, 7.62s/it, loss=0.0009, acc=0.9993, iter_time=7.54s]
Epoch 0: 12%|█▏ | 1464/12384 [3:06:48<23:05:49, 7.61s/it, loss=0.0009, acc=0.9993, iter_time=7.54s]
Epoch 0: 12%|█▏ | 1464/12384 [3:06:56<23:05:49, 7.61s/it, loss=0.0005, acc=0.9993, iter_time=7.64s]
Epoch 0: 12%|█▏ | 1465/12384 [3:06:56<23:04:37, 7.61s/it, loss=0.0005, acc=0.9993, iter_time=7.64s]
Epoch 0: 12%|█▏ | 1465/12384 [3:07:03<23:04:37, 7.61s/it, loss=0.0023, acc=0.9963, iter_time=7.40s]
Epoch 0: 12%|█▏ | 1466/12384 [3:07:03<23:07:39, 7.63s/it, loss=0.0023, acc=0.9963, iter_time=7.40s]
Epoch 0: 12%|█▏ | 1466/12384 [3:07:11<23:07:39, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.17s]
Epoch 0: 12%|█▏ | 1467/12384 [3:07:11<23:08:13, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.17s]
Epoch 0: 12%|█▏ | 1467/12384 [3:07:19<23:08:13, 7.63s/it, loss=0.0012, acc=0.9984, iter_time=9.43s]
Epoch 0: 12%|█▏ | 1468/12384 [3:07:19<23:14:28, 7.66s/it, loss=0.0012, acc=0.9984, iter_time=9.43s]
Epoch 0: 12%|█▏ | 1468/12384 [3:07:26<23:14:28, 7.66s/it, loss=0.0016, acc=0.9978, iter_time=7.67s]
Epoch 0: 12%|█▏ | 1469/12384 [3:07:26<23:11:32, 7.65s/it, loss=0.0016, acc=0.9978, iter_time=7.67s]
Epoch 0: 12%|█▏ | 1469/12384 [3:07:34<23:11:32, 7.65s/it, loss=0.0013, acc=0.9975, iter_time=5.29s]
Epoch 0: 12%|█▏ | 1470/12384 [3:07:34<23:12:45, 7.66s/it, loss=0.0013, acc=0.9975, iter_time=5.29s]
Epoch 0: 12%|█▏ | 1470/12384 [3:07:42<23:12:45, 7.66s/it, loss=0.0006, acc=0.9992, iter_time=9.99s]
Epoch 0: 12%|█▏ | 1471/12384 [3:07:42<23:10:19, 7.64s/it, loss=0.0006, acc=0.9992, iter_time=9.99s]
Epoch 0: 12%|█▏ | 1471/12384 [3:07:49<23:10:19, 7.64s/it, loss=0.0015, acc=0.9968, iter_time=8.00s]
Epoch 0: 12%|█▏ | 1472/12384 [3:07:49<23:08:20, 7.63s/it, loss=0.0015, acc=0.9968, iter_time=8.00s]
Epoch 0: 12%|█▏ | 1472/12384 [3:07:57<23:08:20, 7.63s/it, loss=0.0008, acc=0.9966, iter_time=7.23s]
Epoch 0: 12%|█▏ | 1473/12384 [3:07:57<23:07:32, 7.63s/it, loss=0.0008, acc=0.9966, iter_time=7.23s]
Epoch 0: 12%|█▏ | 1473/12384 [3:08:04<23:07:32, 7.63s/it, loss=0.0014, acc=0.9954, iter_time=7.64s]
Epoch 0: 12%|█▏ | 1474/12384 [3:08:04<23:07:26, 7.63s/it, loss=0.0014, acc=0.9954, iter_time=7.64s]
Epoch 0: 12%|█▏ | 1474/12384 [3:08:12<23:07:26, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=5.84s]
Epoch 0: 12%|█▏ | 1475/12384 [3:08:12<23:10:48, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=5.84s]
Epoch 0: 12%|█▏ | 1475/12384 [3:08:20<23:10:48, 7.65s/it, loss=0.0021, acc=0.9938, iter_time=9.18s]
Epoch 0: 12%|█▏ | 1476/12384 [3:08:20<23:08:50, 7.64s/it, loss=0.0021, acc=0.9938, iter_time=9.18s]
Epoch 0: 12%|█▏ | 1476/12384 [3:08:27<23:08:50, 7.64s/it, loss=0.0011, acc=0.9961, iter_time=4.68s]
Epoch 0: 12%|█▏ | 1477/12384 [3:08:27<23:10:21, 7.65s/it, loss=0.0011, acc=0.9961, iter_time=4.68s]
Epoch 0: 12%|█▏ | 1477/12384 [3:08:35<23:10:21, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=10.96s]
Epoch 0: 12%|█▏ | 1478/12384 [3:08:35<23:12:34, 7.66s/it, loss=0.0003, acc=1.0000, iter_time=10.96s]
Epoch 0: 12%|█▏ | 1478/12384 [3:08:43<23:12:34, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.65s]
Epoch 0: 12%|█▏ | 1479/12384 [3:08:43<23:09:25, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.65s]
Epoch 0: 12%|█▏ | 1479/12384 [3:08:51<23:09:25, 7.64s/it, loss=0.0020, acc=0.9936, iter_time=8.50s]
Epoch 0: 12%|█▏ | 1480/12384 [3:08:51<23:35:32, 7.79s/it, loss=0.0020, acc=0.9936, iter_time=8.50s]
Epoch 0: 12%|█▏ | 1480/12384 [3:08:59<23:35:32, 7.79s/it, loss=0.0027, acc=0.9929, iter_time=5.77s]
Epoch 0: 12%|█▏ | 1481/12384 [3:08:59<23:44:54, 7.84s/it, loss=0.0027, acc=0.9929, iter_time=5.77s]
Epoch 0: 12%|█▏ | 1481/12384 [3:09:06<23:44:54, 7.84s/it, loss=0.0005, acc=0.9999, iter_time=8.86s]
Epoch 0: 12%|█▏ | 1482/12384 [3:09:06<23:33:27, 7.78s/it, loss=0.0005, acc=0.9999, iter_time=8.86s]
Epoch 0: 12%|█▏ | 1482/12384 [3:09:14<23:33:27, 7.78s/it, loss=0.0023, acc=0.9971, iter_time=6.13s]
Epoch 0: 12%|█▏ | 1483/12384 [3:09:14<23:25:20, 7.74s/it, loss=0.0023, acc=0.9971, iter_time=6.13s]
Epoch 0: 12%|█▏ | 1483/12384 [3:09:22<23:25:20, 7.74s/it, loss=0.0136, acc=0.9805, iter_time=9.65s]
Epoch 0: 12%|█▏ | 1484/12384 [3:09:22<23:21:42, 7.72s/it, loss=0.0136, acc=0.9805, iter_time=9.65s]
Epoch 0: 12%|█▏ | 1484/12384 [3:09:29<23:21:42, 7.72s/it, loss=0.0017, acc=0.9970, iter_time=7.70s]
Epoch 0: 12%|█▏ | 1485/12384 [3:09:29<23:21:54, 7.72s/it, loss=0.0017, acc=0.9970, iter_time=7.70s]
Epoch 0: 12%|█▏ | 1485/12384 [3:09:37<23:21:54, 7.72s/it, loss=0.0021, acc=0.9939, iter_time=4.72s]
Epoch 0: 12%|█▏ | 1486/12384 [3:09:37<23:17:19, 7.69s/it, loss=0.0021, acc=0.9939, iter_time=4.72s]
Epoch 0: 12%|█▏ | 1486/12384 [3:09:45<23:17:19, 7.69s/it, loss=0.0008, acc=0.9964, iter_time=10.64s]
Epoch 0: 12%|█▏ | 1487/12384 [3:09:45<23:13:58, 7.68s/it, loss=0.0008, acc=0.9964, iter_time=10.64s]
Epoch 0: 12%|█▏ | 1487/12384 [3:09:52<23:13:58, 7.68s/it, loss=0.0022, acc=0.9957, iter_time=8.04s]
Epoch 0: 12%|█▏ | 1488/12384 [3:09:52<23:12:30, 7.67s/it, loss=0.0022, acc=0.9957, iter_time=8.04s]
Epoch 0: 12%|█▏ | 1488/12384 [3:10:00<23:12:30, 7.67s/it, loss=0.0035, acc=0.9887, iter_time=7.24s]
Epoch 0: 12%|█▏ | 1489/12384 [3:10:00<23:09:56, 7.65s/it, loss=0.0035, acc=0.9887, iter_time=7.24s]
Epoch 0: 12%|█▏ | 1489/12384 [3:10:08<23:09:56, 7.65s/it, loss=0.0028, acc=0.9943, iter_time=7.66s]
Epoch 0: 12%|█▏ | 1490/12384 [3:10:08<23:09:10, 7.65s/it, loss=0.0028, acc=0.9943, iter_time=7.66s]
Epoch 0: 12%|█▏ | 1490/12384 [3:10:15<23:09:10, 7.65s/it, loss=0.0006, acc=0.9988, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1491/12384 [3:10:15<23:06:42, 7.64s/it, loss=0.0006, acc=0.9988, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1491/12384 [3:10:23<23:06:42, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=7.60s]
Epoch 0: 12%|█▏ | 1492/12384 [3:10:23<23:06:10, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=7.60s]
Epoch 0: 12%|█▏ | 1492/12384 [3:10:31<23:06:10, 7.64s/it, loss=0.0126, acc=0.9808, iter_time=7.37s]
Epoch 0: 12%|█▏ | 1493/12384 [3:10:31<23:07:24, 7.64s/it, loss=0.0126, acc=0.9808, iter_time=7.37s]
Epoch 0: 12%|█▏ | 1493/12384 [3:10:38<23:07:24, 7.64s/it, loss=0.0022, acc=0.9956, iter_time=6.76s]
Epoch 0: 12%|█▏ | 1494/12384 [3:10:38<23:07:30, 7.64s/it, loss=0.0022, acc=0.9956, iter_time=6.76s]
Epoch 0: 12%|█▏ | 1494/12384 [3:10:46<23:07:30, 7.64s/it, loss=0.0007, acc=0.9998, iter_time=5.76s]
Epoch 0: 12%|█▏ | 1495/12384 [3:10:46<23:06:24, 7.64s/it, loss=0.0007, acc=0.9998, iter_time=5.76s]
Epoch 0: 12%|█▏ | 1495/12384 [3:10:53<23:06:24, 7.64s/it, loss=0.0030, acc=0.9960, iter_time=11.09s]
Epoch 0: 12%|█▏ | 1496/12384 [3:10:53<23:06:48, 7.64s/it, loss=0.0030, acc=0.9960, iter_time=11.09s]
Epoch 0: 12%|█▏ | 1496/12384 [3:11:01<23:06:48, 7.64s/it, loss=0.0012, acc=0.9962, iter_time=7.24s]
Epoch 0: 12%|█▏ | 1497/12384 [3:11:01<23:06:21, 7.64s/it, loss=0.0012, acc=0.9962, iter_time=7.24s]
Epoch 0: 12%|█▏ | 1497/12384 [3:11:09<23:06:21, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=6.72s]
Epoch 0: 12%|█▏ | 1498/12384 [3:11:09<23:04:51, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=6.72s]
Epoch 0: 12%|█▏ | 1498/12384 [3:11:16<23:04:51, 7.63s/it, loss=0.0013, acc=0.9961, iter_time=7.33s]
Epoch 0: 12%|█▏ | 1499/12384 [3:11:16<23:05:24, 7.64s/it, loss=0.0013, acc=0.9961, iter_time=7.33s]
Epoch 0: 12%|█▏ | 1499/12384 [3:11:24<23:05:24, 7.64s/it, loss=0.0004, acc=1.0000, iter_time=9.29s]
Epoch 0: 12%|█▏ | 1500/12384 [3:11:24<23:16:06, 7.70s/it, loss=0.0004, acc=1.0000, iter_time=9.29s]
Epoch 0: 12%|█▏ | 1500/12384 [3:11:32<23:16:06, 7.70s/it, loss=0.0019, acc=0.9970, iter_time=5.91s]
Epoch 0: 12%|█▏ | 1501/12384 [3:11:32<23:10:47, 7.67s/it, loss=0.0019, acc=0.9970, iter_time=5.91s]
Epoch 0: 12%|█▏ | 1501/12384 [3:11:39<23:10:47, 7.67s/it, loss=0.0025, acc=0.9960, iter_time=9.13s]
Epoch 0: 12%|█▏ | 1502/12384 [3:11:39<23:12:44, 7.68s/it, loss=0.0025, acc=0.9960, iter_time=9.13s]
Epoch 0: 12%|█▏ | 1502/12384 [3:11:47<23:12:44, 7.68s/it, loss=0.0012, acc=0.9977, iter_time=7.72s]
Epoch 0: 12%|█▏ | 1503/12384 [3:11:47<23:10:18, 7.67s/it, loss=0.0012, acc=0.9977, iter_time=7.72s]
Epoch 0: 12%|█▏ | 1503/12384 [3:11:55<23:10:18, 7.67s/it, loss=0.0003, acc=1.0000, iter_time=7.56s]
Epoch 0: 12%|█▏ | 1504/12384 [3:11:55<23:07:27, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=7.56s]
Epoch 0: 12%|█▏ | 1504/12384 [3:12:02<23:07:27, 7.65s/it, loss=0.0004, acc=1.0000, iter_time=7.67s]
Epoch 0: 12%|█▏ | 1505/12384 [3:12:02<23:08:35, 7.66s/it, loss=0.0004, acc=1.0000, iter_time=7.67s]
Epoch 0: 12%|█▏ | 1505/12384 [3:12:10<23:08:35, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.68s]
Epoch 0: 12%|█▏ | 1506/12384 [3:12:10<23:10:07, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=7.68s]
Epoch 0: 12%|█▏ | 1506/12384 [3:12:18<23:10:07, 7.67s/it, loss=0.0021, acc=0.9969, iter_time=4.86s]
Epoch 0: 12%|█▏ | 1507/12384 [3:12:18<23:25:05, 7.75s/it, loss=0.0021, acc=0.9969, iter_time=4.86s]
Epoch 0: 12%|█▏ | 1507/12384 [3:12:26<23:25:05, 7.75s/it, loss=0.0007, acc=0.9990, iter_time=9.26s]
Epoch 0: 12%|█▏ | 1508/12384 [3:12:26<23:17:48, 7.71s/it, loss=0.0007, acc=0.9990, iter_time=9.26s]
Epoch 0: 12%|█▏ | 1508/12384 [3:12:33<23:17:48, 7.71s/it, loss=0.0008, acc=0.9986, iter_time=9.12s]
Epoch 0: 12%|█▏ | 1509/12384 [3:12:33<23:12:32, 7.68s/it, loss=0.0008, acc=0.9986, iter_time=9.12s]
Epoch 0: 12%|█▏ | 1509/12384 [3:12:41<23:12:32, 7.68s/it, loss=0.0013, acc=0.9969, iter_time=4.76s]
Epoch 0: 12%|█▏ | 1510/12384 [3:12:41<23:09:02, 7.66s/it, loss=0.0013, acc=0.9969, iter_time=4.76s]
Epoch 0: 12%|█▏ | 1510/12384 [3:12:49<23:09:02, 7.66s/it, loss=0.0007, acc=0.9972, iter_time=10.48s]
Epoch 0: 12%|█▏ | 1511/12384 [3:12:49<23:08:10, 7.66s/it, loss=0.0007, acc=0.9972, iter_time=10.48s]
Epoch 0: 12%|█▏ | 1511/12384 [3:12:56<23:08:10, 7.66s/it, loss=0.0009, acc=0.9984, iter_time=8.06s]
Epoch 0: 12%|█▏ | 1512/12384 [3:12:56<23:08:56, 7.67s/it, loss=0.0009, acc=0.9984, iter_time=8.06s]
Epoch 0: 12%|█▏ | 1512/12384 [3:13:04<23:08:56, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=6.16s]
Epoch 0: 12%|█▏ | 1513/12384 [3:13:04<23:07:30, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=6.16s]
Epoch 0: 12%|█▏ | 1513/12384 [3:13:12<23:07:30, 7.66s/it, loss=0.0005, acc=0.9994, iter_time=8.88s]
Epoch 0: 12%|█▏ | 1514/12384 [3:13:12<23:12:22, 7.69s/it, loss=0.0005, acc=0.9994, iter_time=8.88s]
Epoch 0: 12%|█▏ | 1514/12384 [3:13:19<23:12:22, 7.69s/it, loss=0.0022, acc=0.9975, iter_time=7.63s]
Epoch 0: 12%|█▏ | 1515/12384 [3:13:19<23:08:29, 7.66s/it, loss=0.0022, acc=0.9975, iter_time=7.63s]
Epoch 0: 12%|█▏ | 1515/12384 [3:13:27<23:08:29, 7.66s/it, loss=0.0019, acc=0.9969, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1516/12384 [3:13:27<23:06:06, 7.65s/it, loss=0.0019, acc=0.9969, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1516/12384 [3:13:34<23:06:06, 7.65s/it, loss=0.0150, acc=0.9878, iter_time=7.63s]
Epoch 0: 12%|█▏ | 1517/12384 [3:13:34<23:05:12, 7.65s/it, loss=0.0150, acc=0.9878, iter_time=7.63s]
Epoch 0: 12%|█▏ | 1517/12384 [3:13:42<23:05:12, 7.65s/it, loss=0.0009, acc=0.9995, iter_time=4.04s]
Epoch 0: 12%|█▏ | 1518/12384 [3:13:42<23:05:17, 7.65s/it, loss=0.0009, acc=0.9995, iter_time=4.04s]
Epoch 0: 12%|█▏ | 1518/12384 [3:13:50<23:05:17, 7.65s/it, loss=0.0018, acc=0.9972, iter_time=11.22s]
Epoch 0: 12%|█▏ | 1519/12384 [3:13:50<23:03:27, 7.64s/it, loss=0.0018, acc=0.9972, iter_time=11.22s]
Epoch 0: 12%|█▏ | 1519/12384 [3:13:57<23:03:27, 7.64s/it, loss=0.0075, acc=0.9868, iter_time=7.63s]
Epoch 0: 12%|█▏ | 1520/12384 [3:13:57<23:04:11, 7.64s/it, loss=0.0075, acc=0.9868, iter_time=7.63s]
Epoch 0: 12%|█▏ | 1520/12384 [3:14:05<23:04:11, 7.64s/it, loss=0.0009, acc=0.9977, iter_time=7.66s]
Epoch 0: 12%|█▏ | 1521/12384 [3:14:05<23:06:29, 7.66s/it, loss=0.0009, acc=0.9977, iter_time=7.66s]
Epoch 0: 12%|█▏ | 1521/12384 [3:14:13<23:06:29, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.73s]
Epoch 0: 12%|█▏ | 1522/12384 [3:14:13<23:04:56, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.73s]
Epoch 0: 12%|█▏ | 1522/12384 [3:14:20<23:04:56, 7.65s/it, loss=0.0009, acc=0.9973, iter_time=7.64s]
Epoch 0: 12%|█▏ | 1523/12384 [3:14:20<23:04:30, 7.65s/it, loss=0.0009, acc=0.9973, iter_time=7.64s]
Epoch 0: 12%|█▏ | 1523/12384 [3:14:28<23:04:30, 7.65s/it, loss=0.0015, acc=0.9973, iter_time=5.06s]
Epoch 0: 12%|█▏ | 1524/12384 [3:14:28<23:02:57, 7.64s/it, loss=0.0015, acc=0.9973, iter_time=5.06s]
Epoch 0: 12%|█▏ | 1524/12384 [3:14:36<23:02:57, 7.64s/it, loss=0.0007, acc=0.9992, iter_time=10.18s]
Epoch 0: 12%|█▏ | 1525/12384 [3:14:36<23:03:16, 7.64s/it, loss=0.0007, acc=0.9992, iter_time=10.18s]
Epoch 0: 12%|█▏ | 1525/12384 [3:14:43<23:03:16, 7.64s/it, loss=0.0009, acc=0.9974, iter_time=7.64s]
Epoch 0: 12%|█▏ | 1526/12384 [3:14:43<23:04:36, 7.65s/it, loss=0.0009, acc=0.9974, iter_time=7.64s]
Epoch 0: 12%|█▏ | 1526/12384 [3:14:51<23:04:36, 7.65s/it, loss=0.0006, acc=1.0000, iter_time=7.67s]
Epoch 0: 12%|█▏ | 1527/12384 [3:14:51<23:02:04, 7.64s/it, loss=0.0006, acc=1.0000, iter_time=7.67s]
Epoch 0: 12%|█▏ | 1527/12384 [3:14:59<23:02:04, 7.64s/it, loss=0.0004, acc=1.0000, iter_time=8.00s]
Epoch 0: 12%|█▏ | 1528/12384 [3:14:59<23:00:12, 7.63s/it, loss=0.0004, acc=1.0000, iter_time=8.00s]
Epoch 0: 12%|█▏ | 1528/12384 [3:15:06<23:00:12, 7.63s/it, loss=0.0005, acc=0.9997, iter_time=5.68s]
Epoch 0: 12%|█▏ | 1529/12384 [3:15:06<22:58:58, 7.62s/it, loss=0.0005, acc=0.9997, iter_time=5.68s]
Epoch 0: 12%|█▏ | 1529/12384 [3:15:14<22:58:58, 7.62s/it, loss=0.0013, acc=0.9963, iter_time=7.34s]
Epoch 0: 12%|█▏ | 1530/12384 [3:15:14<23:00:16, 7.63s/it, loss=0.0013, acc=0.9963, iter_time=7.34s]
Epoch 0: 12%|█▏ | 1530/12384 [3:15:21<23:00:16, 7.63s/it, loss=0.0008, acc=0.9983, iter_time=9.45s]
Epoch 0: 12%|█▏ | 1531/12384 [3:15:21<23:02:13, 7.64s/it, loss=0.0008, acc=0.9983, iter_time=9.45s]
Epoch 0: 12%|█▏ | 1531/12384 [3:15:29<23:02:13, 7.64s/it, loss=0.0010, acc=0.9979, iter_time=5.89s]
Epoch 0: 12%|█▏ | 1532/12384 [3:15:29<23:00:17, 7.63s/it, loss=0.0010, acc=0.9979, iter_time=5.89s]
Epoch 0: 12%|█▏ | 1532/12384 [3:15:37<23:00:17, 7.63s/it, loss=0.0004, acc=0.9985, iter_time=9.64s]
Epoch 0: 12%|█▏ | 1533/12384 [3:15:37<23:17:42, 7.73s/it, loss=0.0004, acc=0.9985, iter_time=9.64s]
Epoch 0: 12%|█▏ | 1533/12384 [3:15:45<23:17:42, 7.73s/it, loss=0.0029, acc=0.9919, iter_time=7.68s]
Epoch 0: 12%|█▏ | 1534/12384 [3:15:45<23:10:12, 7.69s/it, loss=0.0029, acc=0.9919, iter_time=7.68s]
Epoch 0: 12%|█▏ | 1534/12384 [3:15:52<23:10:12, 7.69s/it, loss=0.0009, acc=0.9962, iter_time=6.68s]
Epoch 0: 12%|█▏ | 1535/12384 [3:15:52<23:05:38, 7.66s/it, loss=0.0009, acc=0.9962, iter_time=6.68s]
Epoch 0: 12%|█▏ | 1535/12384 [3:16:00<23:05:38, 7.66s/it, loss=0.0023, acc=0.9937, iter_time=8.92s]
Epoch 0: 12%|█▏ | 1536/12384 [3:16:00<23:03:56, 7.65s/it, loss=0.0023, acc=0.9937, iter_time=8.92s]
Epoch 0: 12%|█▏ | 1536/12384 [3:16:07<23:03:56, 7.65s/it, loss=0.0012, acc=1.0000, iter_time=7.24s]
Epoch 0: 12%|█▏ | 1537/12384 [3:16:07<23:03:24, 7.65s/it, loss=0.0012, acc=1.0000, iter_time=7.24s]
Epoch 0: 12%|█▏ | 1537/12384 [3:16:15<23:03:24, 7.65s/it, loss=0.0012, acc=0.9967, iter_time=7.35s]
Epoch 0: 12%|█▏ | 1538/12384 [3:16:15<23:00:34, 7.64s/it, loss=0.0012, acc=0.9967, iter_time=7.35s]
Epoch 0: 12%|█▏ | 1538/12384 [3:16:23<23:00:34, 7.64s/it, loss=0.0006, acc=0.9982, iter_time=7.90s]
Epoch 0: 12%|█▏ | 1539/12384 [3:16:23<22:59:31, 7.63s/it, loss=0.0006, acc=0.9982, iter_time=7.90s]
Epoch 0: 12%|█▏ | 1539/12384 [3:16:30<22:59:31, 7.63s/it, loss=0.0005, acc=1.0000, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1540/12384 [3:16:30<22:58:35, 7.63s/it, loss=0.0005, acc=1.0000, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1540/12384 [3:16:38<22:58:35, 7.63s/it, loss=0.0024, acc=0.9947, iter_time=7.61s]
Epoch 0: 12%|█▏ | 1541/12384 [3:16:38<22:56:39, 7.62s/it, loss=0.0024, acc=0.9947, iter_time=7.61s]
Epoch 0: 12%|█▏ | 1541/12384 [3:16:46<22:56:39, 7.62s/it, loss=0.0049, acc=0.9881, iter_time=7.60s]
Epoch 0: 12%|█▏ | 1542/12384 [3:16:46<22:56:55, 7.62s/it, loss=0.0049, acc=0.9881, iter_time=7.60s]
Epoch 0: 12%|█▏ | 1542/12384 [3:16:53<22:56:55, 7.62s/it, loss=0.0007, acc=0.9980, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1543/12384 [3:16:53<22:56:57, 7.62s/it, loss=0.0007, acc=0.9980, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1543/12384 [3:17:01<22:56:57, 7.62s/it, loss=0.0010, acc=0.9980, iter_time=8.13s]
Epoch 0: 12%|█▏ | 1544/12384 [3:17:01<23:02:32, 7.65s/it, loss=0.0010, acc=0.9980, iter_time=8.13s]
Epoch 0: 12%|█▏ | 1544/12384 [3:17:09<23:02:32, 7.65s/it, loss=0.0014, acc=0.9992, iter_time=7.23s]
Epoch 0: 12%|█▏ | 1545/12384 [3:17:09<23:02:22, 7.65s/it, loss=0.0014, acc=0.9992, iter_time=7.23s]
Epoch 0: 12%|█▏ | 1545/12384 [3:17:16<23:02:22, 7.65s/it, loss=0.0048, acc=0.9919, iter_time=7.66s]
Epoch 0: 12%|█▏ | 1546/12384 [3:17:16<23:02:57, 7.66s/it, loss=0.0048, acc=0.9919, iter_time=7.66s]
Epoch 0: 12%|█▏ | 1546/12384 [3:17:24<23:02:57, 7.66s/it, loss=0.0003, acc=0.9997, iter_time=6.71s]
Epoch 0: 12%|█▏ | 1547/12384 [3:17:24<23:01:48, 7.65s/it, loss=0.0003, acc=0.9997, iter_time=6.71s]
Epoch 0: 12%|█▏ | 1547/12384 [3:17:31<23:01:48, 7.65s/it, loss=0.0013, acc=0.9988, iter_time=8.60s]
Epoch 0: 12%|█▎ | 1548/12384 [3:17:31<23:01:00, 7.65s/it, loss=0.0013, acc=0.9988, iter_time=8.60s]
Epoch 0: 12%|█▎ | 1548/12384 [3:17:39<23:01:00, 7.65s/it, loss=0.0007, acc=0.9980, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1549/12384 [3:17:39<22:59:30, 7.64s/it, loss=0.0007, acc=0.9980, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1549/12384 [3:17:47<22:59:30, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=8.09s]
Epoch 0: 13%|█▎ | 1550/12384 [3:17:47<23:01:30, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=8.09s]
Epoch 0: 13%|█▎ | 1550/12384 [3:17:54<23:01:30, 7.65s/it, loss=0.0006, acc=0.9977, iter_time=4.15s]
Epoch 0: 13%|█▎ | 1551/12384 [3:17:54<23:01:58, 7.65s/it, loss=0.0006, acc=0.9977, iter_time=4.15s]
Epoch 0: 13%|█▎ | 1551/12384 [3:18:02<23:01:58, 7.65s/it, loss=0.0007, acc=0.9989, iter_time=11.10s]
Epoch 0: 13%|█▎ | 1552/12384 [3:18:02<23:00:29, 7.65s/it, loss=0.0007, acc=0.9989, iter_time=11.10s]
Epoch 0: 13%|█▎ | 1552/12384 [3:18:10<23:00:29, 7.65s/it, loss=0.0006, acc=0.9980, iter_time=4.62s]
Epoch 0: 13%|█▎ | 1553/12384 [3:18:10<23:00:36, 7.65s/it, loss=0.0006, acc=0.9980, iter_time=4.62s]
Epoch 0: 13%|█▎ | 1553/12384 [3:18:17<23:00:36, 7.65s/it, loss=0.0007, acc=0.9998, iter_time=7.69s]
Epoch 0: 13%|█▎ | 1554/12384 [3:18:17<23:01:50, 7.66s/it, loss=0.0007, acc=0.9998, iter_time=7.69s]
Epoch 0: 13%|█▎ | 1554/12384 [3:18:25<23:01:50, 7.66s/it, loss=0.0211, acc=0.9780, iter_time=8.81s]
Epoch 0: 13%|█▎ | 1555/12384 [3:18:25<22:59:00, 7.64s/it, loss=0.0211, acc=0.9780, iter_time=8.81s]
Epoch 0: 13%|█▎ | 1555/12384 [3:18:33<22:59:00, 7.64s/it, loss=0.0010, acc=0.9978, iter_time=9.05s]
Epoch 0: 13%|█▎ | 1556/12384 [3:18:33<22:57:38, 7.63s/it, loss=0.0010, acc=0.9978, iter_time=9.05s]
Epoch 0: 13%|█▎ | 1556/12384 [3:18:40<22:57:38, 7.63s/it, loss=0.0010, acc=0.9950, iter_time=4.84s]
Epoch 0: 13%|█▎ | 1557/12384 [3:18:40<22:55:52, 7.62s/it, loss=0.0010, acc=0.9950, iter_time=4.84s]
Epoch 0: 13%|█▎ | 1557/12384 [3:18:48<22:55:52, 7.62s/it, loss=0.0012, acc=0.9998, iter_time=7.08s]
Epoch 0: 13%|█▎ | 1558/12384 [3:18:48<22:55:40, 7.62s/it, loss=0.0012, acc=0.9998, iter_time=7.08s]
Epoch 0: 13%|█▎ | 1558/12384 [3:18:55<22:55:40, 7.62s/it, loss=0.0007, acc=0.9967, iter_time=7.53s]
Epoch 0: 13%|█▎ | 1559/12384 [3:18:55<22:56:06, 7.63s/it, loss=0.0007, acc=0.9967, iter_time=7.53s]
Epoch 0: 13%|█▎ | 1559/12384 [3:19:03<22:56:06, 7.63s/it, loss=0.0005, acc=0.9983, iter_time=11.71s]
Epoch 0: 13%|█▎ | 1560/12384 [3:19:03<23:11:11, 7.71s/it, loss=0.0005, acc=0.9983, iter_time=11.71s]
Epoch 0: 13%|█▎ | 1560/12384 [3:19:11<23:11:11, 7.71s/it, loss=0.0009, acc=0.9979, iter_time=7.21s]
Epoch 0: 13%|█▎ | 1561/12384 [3:19:11<23:06:16, 7.69s/it, loss=0.0009, acc=0.9979, iter_time=7.21s]
Epoch 0: 13%|█▎ | 1561/12384 [3:19:19<23:06:16, 7.69s/it, loss=0.0013, acc=0.9957, iter_time=5.10s]
Epoch 0: 13%|█▎ | 1562/12384 [3:19:19<23:01:29, 7.66s/it, loss=0.0013, acc=0.9957, iter_time=5.10s]
Epoch 0: 13%|█▎ | 1562/12384 [3:19:26<23:01:29, 7.66s/it, loss=0.0006, acc=0.9981, iter_time=10.14s]
Epoch 0: 13%|█▎ | 1563/12384 [3:19:26<22:59:33, 7.65s/it, loss=0.0006, acc=0.9981, iter_time=10.14s]
Epoch 0: 13%|█▎ | 1563/12384 [3:19:34<22:59:33, 7.65s/it, loss=0.0033, acc=0.9926, iter_time=4.61s]
Epoch 0: 13%|█▎ | 1564/12384 [3:19:34<22:58:37, 7.64s/it, loss=0.0033, acc=0.9926, iter_time=4.61s]
Epoch 0: 13%|█▎ | 1564/12384 [3:19:41<22:58:37, 7.64s/it, loss=0.0080, acc=0.9841, iter_time=10.64s]
Epoch 0: 13%|█▎ | 1565/12384 [3:19:41<22:56:46, 7.64s/it, loss=0.0080, acc=0.9841, iter_time=10.64s]
Epoch 0: 13%|█▎ | 1565/12384 [3:19:49<22:56:46, 7.64s/it, loss=0.0042, acc=0.9969, iter_time=7.63s]
Epoch 0: 13%|█▎ | 1566/12384 [3:19:49<22:56:44, 7.64s/it, loss=0.0042, acc=0.9969, iter_time=7.63s]
Epoch 0: 13%|█▎ | 1566/12384 [3:19:57<22:56:44, 7.64s/it, loss=0.0015, acc=0.9952, iter_time=5.84s]
Epoch 0: 13%|█▎ | 1567/12384 [3:19:57<22:55:26, 7.63s/it, loss=0.0015, acc=0.9952, iter_time=5.84s]
Epoch 0: 13%|█▎ | 1567/12384 [3:20:04<22:55:26, 7.63s/it, loss=0.0007, acc=0.9999, iter_time=9.78s]
Epoch 0: 13%|█▎ | 1568/12384 [3:20:04<22:53:18, 7.62s/it, loss=0.0007, acc=0.9999, iter_time=9.78s]
Epoch 0: 13%|█▎ | 1568/12384 [3:20:12<22:53:18, 7.62s/it, loss=0.0009, acc=0.9978, iter_time=3.86s]
Epoch 0: 13%|█▎ | 1569/12384 [3:20:12<22:56:36, 7.64s/it, loss=0.0009, acc=0.9978, iter_time=3.86s]
Epoch 0: 13%|█▎ | 1569/12384 [3:20:20<22:56:36, 7.64s/it, loss=0.0008, acc=0.9954, iter_time=9.60s]
Epoch 0: 13%|█▎ | 1570/12384 [3:20:20<22:57:19, 7.64s/it, loss=0.0008, acc=0.9954, iter_time=9.60s]
Epoch 0: 13%|█▎ | 1570/12384 [3:20:27<22:57:19, 7.64s/it, loss=0.0051, acc=0.9882, iter_time=7.57s]
Epoch 0: 13%|█▎ | 1571/12384 [3:20:27<22:57:35, 7.64s/it, loss=0.0051, acc=0.9882, iter_time=7.57s]
Epoch 0: 13%|█▎ | 1571/12384 [3:20:35<22:57:35, 7.64s/it, loss=0.0013, acc=0.9959, iter_time=9.16s]
Epoch 0: 13%|█▎ | 1572/12384 [3:20:35<22:55:31, 7.63s/it, loss=0.0013, acc=0.9959, iter_time=9.16s]
Epoch 0: 13%|█▎ | 1572/12384 [3:20:43<22:55:31, 7.63s/it, loss=0.0010, acc=0.9984, iter_time=7.62s]
Epoch 0: 13%|█▎ | 1573/12384 [3:20:43<22:53:17, 7.62s/it, loss=0.0010, acc=0.9984, iter_time=7.62s]
Epoch 0: 13%|█▎ | 1573/12384 [3:20:50<22:53:17, 7.62s/it, loss=0.0005, acc=0.9993, iter_time=4.76s]
Epoch 0: 13%|█▎ | 1574/12384 [3:20:50<22:53:55, 7.63s/it, loss=0.0005, acc=0.9993, iter_time=4.76s]
Epoch 0: 13%|█▎ | 1574/12384 [3:20:58<22:53:55, 7.63s/it, loss=0.0005, acc=0.9997, iter_time=10.49s]
Epoch 0: 13%|█▎ | 1575/12384 [3:20:58<22:56:57, 7.64s/it, loss=0.0005, acc=0.9997, iter_time=10.49s]
Epoch 0: 13%|█▎ | 1575/12384 [3:21:05<22:56:57, 7.64s/it, loss=0.0028, acc=0.9960, iter_time=8.08s]
Epoch 0: 13%|█▎ | 1576/12384 [3:21:05<22:56:33, 7.64s/it, loss=0.0028, acc=0.9960, iter_time=8.08s]
Epoch 0: 13%|█▎ | 1576/12384 [3:21:13<22:56:33, 7.64s/it, loss=0.0037, acc=0.9941, iter_time=7.23s]
Epoch 0: 13%|█▎ | 1577/12384 [3:21:13<22:56:12, 7.64s/it, loss=0.0037, acc=0.9941, iter_time=7.23s]
Epoch 0: 13%|█▎ | 1577/12384 [3:21:21<22:56:12, 7.64s/it, loss=0.0005, acc=0.9979, iter_time=7.63s]
Epoch 0: 13%|█▎ | 1578/12384 [3:21:21<22:54:41, 7.63s/it, loss=0.0005, acc=0.9979, iter_time=7.63s]
Epoch 0: 13%|█▎ | 1578/12384 [3:21:28<22:54:41, 7.63s/it, loss=0.0009, acc=0.9978, iter_time=6.66s]
Epoch 0: 13%|█▎ | 1579/12384 [3:21:28<22:53:32, 7.63s/it, loss=0.0009, acc=0.9978, iter_time=6.66s]
Epoch 0: 13%|█▎ | 1579/12384 [3:21:36<22:53:32, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=8.27s]
Epoch 0: 13%|█▎ | 1580/12384 [3:21:36<22:51:45, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=8.27s]
Epoch 0: 13%|█▎ | 1580/12384 [3:21:44<22:51:45, 7.62s/it, loss=0.0041, acc=0.9935, iter_time=6.18s]
Epoch 0: 13%|█▎ | 1581/12384 [3:21:44<22:50:30, 7.61s/it, loss=0.0041, acc=0.9935, iter_time=6.18s]
Epoch 0: 13%|█▎ | 1581/12384 [3:21:51<22:50:30, 7.61s/it, loss=0.0013, acc=0.9954, iter_time=9.33s]
Epoch 0: 13%|█▎ | 1582/12384 [3:21:51<22:51:13, 7.62s/it, loss=0.0013, acc=0.9954, iter_time=9.33s]
Epoch 0: 13%|█▎ | 1582/12384 [3:21:59<22:51:13, 7.62s/it, loss=0.0008, acc=0.9990, iter_time=7.63s]
Epoch 0: 13%|█▎ | 1583/12384 [3:21:59<22:51:47, 7.62s/it, loss=0.0008, acc=0.9990, iter_time=7.63s]
Epoch 0: 13%|█▎ | 1583/12384 [3:22:06<22:51:47, 7.62s/it, loss=0.0012, acc=0.9966, iter_time=8.01s]
Epoch 0: 13%|█▎ | 1584/12384 [3:22:06<22:52:57, 7.63s/it, loss=0.0012, acc=0.9966, iter_time=8.01s]
Epoch 0: 13%|█▎ | 1584/12384 [3:22:14<22:52:57, 7.63s/it, loss=0.0004, acc=1.0000, iter_time=7.29s]
Epoch 0: 13%|█▎ | 1585/12384 [3:22:14<22:54:10, 7.63s/it, loss=0.0004, acc=1.0000, iter_time=7.29s]
Epoch 0: 13%|█▎ | 1585/12384 [3:22:22<22:54:10, 7.63s/it, loss=0.0015, acc=0.9975, iter_time=5.60s]
Epoch 0: 13%|█▎ | 1586/12384 [3:22:22<23:11:30, 7.73s/it, loss=0.0015, acc=0.9975, iter_time=5.60s]
Epoch 0: 13%|█▎ | 1586/12384 [3:22:30<23:11:30, 7.73s/it, loss=0.0004, acc=0.9998, iter_time=9.96s]
Epoch 0: 13%|█▎ | 1587/12384 [3:22:30<23:05:37, 7.70s/it, loss=0.0004, acc=0.9998, iter_time=9.96s]
Epoch 0: 13%|█▎ | 1587/12384 [3:22:37<23:05:37, 7.70s/it, loss=0.0005, acc=0.9980, iter_time=7.70s]
Epoch 0: 13%|█▎ | 1588/12384 [3:22:37<23:04:33, 7.69s/it, loss=0.0005, acc=0.9980, iter_time=7.70s]
Epoch 0: 13%|█▎ | 1588/12384 [3:22:45<23:04:33, 7.69s/it, loss=0.0005, acc=0.9972, iter_time=6.11s]
Epoch 0: 13%|█▎ | 1589/12384 [3:22:45<23:02:00, 7.68s/it, loss=0.0005, acc=0.9972, iter_time=6.11s]
Epoch 0: 13%|█▎ | 1589/12384 [3:22:53<23:02:00, 7.68s/it, loss=0.0051, acc=0.9887, iter_time=9.14s]
Epoch 0: 13%|█▎ | 1590/12384 [3:22:53<22:57:25, 7.66s/it, loss=0.0051, acc=0.9887, iter_time=9.14s]
Epoch 0: 13%|█▎ | 1590/12384 [3:23:00<22:57:25, 7.66s/it, loss=0.0006, acc=0.9992, iter_time=7.62s]
Epoch 0: 13%|█▎ | 1591/12384 [3:23:00<23:00:08, 7.67s/it, loss=0.0006, acc=0.9992, iter_time=7.62s]
Epoch 0: 13%|█▎ | 1591/12384 [3:23:08<23:00:08, 7.67s/it, loss=0.0019, acc=0.9985, iter_time=7.65s]
Epoch 0: 13%|█▎ | 1592/12384 [3:23:08<22:57:23, 7.66s/it, loss=0.0019, acc=0.9985, iter_time=7.65s]
Epoch 0: 13%|█▎ | 1592/12384 [3:23:16<22:57:23, 7.66s/it, loss=0.0057, acc=0.9909, iter_time=7.66s]
Epoch 0: 13%|█▎ | 1593/12384 [3:23:16<22:56:01, 7.65s/it, loss=0.0057, acc=0.9909, iter_time=7.66s]
Epoch 0: 13%|█▎ | 1593/12384 [3:23:23<22:56:01, 7.65s/it, loss=0.0022, acc=0.9970, iter_time=7.64s]
Epoch 0: 13%|█▎ | 1594/12384 [3:23:23<22:54:34, 7.64s/it, loss=0.0022, acc=0.9970, iter_time=7.64s]
Epoch 0: 13%|█▎ | 1594/12384 [3:23:31<22:54:34, 7.64s/it, loss=0.0005, acc=0.9996, iter_time=5.52s]
Epoch 0: 13%|█▎ | 1595/12384 [3:23:31<22:56:24, 7.65s/it, loss=0.0005, acc=0.9996, iter_time=5.52s]
Epoch 0: 13%|█▎ | 1595/12384 [3:23:39<22:56:24, 7.65s/it, loss=0.0004, acc=1.0000, iter_time=9.78s]
Epoch 0: 13%|█▎ | 1596/12384 [3:23:39<22:54:38, 7.65s/it, loss=0.0004, acc=1.0000, iter_time=9.78s]
Epoch 0: 13%|█▎ | 1596/12384 [3:23:46<22:54:38, 7.65s/it, loss=0.0013, acc=0.9976, iter_time=7.62s]
Epoch 0: 13%|█▎ | 1597/12384 [3:23:46<22:54:46, 7.65s/it, loss=0.0013, acc=0.9976, iter_time=7.62s]
Epoch 0: 13%|█▎ | 1597/12384 [3:23:54<22:54:46, 7.65s/it, loss=0.0027, acc=0.9962, iter_time=5.05s]
Epoch 0: 13%|█▎ | 1598/12384 [3:23:54<22:52:44, 7.64s/it, loss=0.0027, acc=0.9962, iter_time=5.05s]
Epoch 0: 13%|█▎ | 1598/12384 [3:24:01<22:52:44, 7.64s/it, loss=0.0005, acc=0.9994, iter_time=7.71s]
Epoch 0: 13%|█▎ | 1599/12384 [3:24:01<22:54:51, 7.65s/it, loss=0.0005, acc=0.9994, iter_time=7.71s]
Epoch 0: 13%|█▎ | 1599/12384 [3:24:09<22:54:51, 7.65s/it, loss=0.0029, acc=0.9943, iter_time=10.60s]
Epoch 0: 13%|█▎ | 1600/12384 [3:24:09<22:53:36, 7.64s/it, loss=0.0029, acc=0.9943, iter_time=10.60s]
Epoch 0: 13%|█▎ | 1600/12384 [3:24:17<22:53:36, 7.64s/it, loss=0.0007, acc=0.9980, iter_time=7.20s]
Epoch 0: 13%|█▎ | 1601/12384 [3:24:17<22:50:58, 7.63s/it, loss=0.0007, acc=0.9980, iter_time=7.20s]
Epoch 0: 13%|█▎ | 1601/12384 [3:24:24<22:50:58, 7.63s/it, loss=0.0022, acc=0.9979, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1602/12384 [3:24:24<22:50:03, 7.62s/it, loss=0.0022, acc=0.9979, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1602/12384 [3:24:32<22:50:03, 7.62s/it, loss=0.0007, acc=0.9977, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1603/12384 [3:24:32<22:50:23, 7.63s/it, loss=0.0007, acc=0.9977, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1603/12384 [3:24:40<22:50:23, 7.63s/it, loss=0.0016, acc=0.9905, iter_time=4.61s]
Epoch 0: 13%|█▎ | 1604/12384 [3:24:40<22:59:01, 7.68s/it, loss=0.0016, acc=0.9905, iter_time=4.61s]
Epoch 0: 13%|█▎ | 1604/12384 [3:24:47<22:59:01, 7.68s/it, loss=0.0010, acc=0.9991, iter_time=10.81s]
Epoch 0: 13%|█▎ | 1605/12384 [3:24:47<22:59:29, 7.68s/it, loss=0.0010, acc=0.9991, iter_time=10.81s]
Epoch 0: 13%|█▎ | 1605/12384 [3:24:55<22:59:29, 7.68s/it, loss=0.0037, acc=0.9920, iter_time=7.69s]
Epoch 0: 13%|█▎ | 1606/12384 [3:24:55<22:58:01, 7.67s/it, loss=0.0037, acc=0.9920, iter_time=7.69s]
Epoch 0: 13%|█▎ | 1606/12384 [3:25:03<22:58:01, 7.67s/it, loss=0.0025, acc=0.9956, iter_time=7.66s]
Epoch 0: 13%|█▎ | 1607/12384 [3:25:03<22:56:18, 7.66s/it, loss=0.0025, acc=0.9956, iter_time=7.66s]
Epoch 0: 13%|█▎ | 1607/12384 [3:25:10<22:56:18, 7.66s/it, loss=0.0010, acc=0.9992, iter_time=8.02s]
Epoch 0: 13%|█▎ | 1608/12384 [3:25:10<22:55:38, 7.66s/it, loss=0.0010, acc=0.9992, iter_time=8.02s]
Epoch 0: 13%|█▎ | 1608/12384 [3:25:18<22:55:38, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.26s]
Epoch 0: 13%|█▎ | 1609/12384 [3:25:18<22:54:02, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.26s]
Epoch 0: 13%|█▎ | 1609/12384 [3:25:26<22:54:02, 7.65s/it, loss=0.0033, acc=0.9928, iter_time=7.64s]
Epoch 0: 13%|█▎ | 1610/12384 [3:25:26<22:52:26, 7.64s/it, loss=0.0033, acc=0.9928, iter_time=7.64s]
Epoch 0: 13%|█▎ | 1610/12384 [3:25:33<22:52:26, 7.64s/it, loss=0.0009, acc=0.9998, iter_time=4.09s]
Epoch 0: 13%|█▎ | 1611/12384 [3:25:33<22:52:51, 7.65s/it, loss=0.0009, acc=0.9998, iter_time=4.09s]
Epoch 0: 13%|█▎ | 1611/12384 [3:25:41<22:52:51, 7.65s/it, loss=0.0007, acc=0.9997, iter_time=11.18s]
Epoch 0: 13%|█▎ | 1612/12384 [3:25:41<22:51:08, 7.64s/it, loss=0.0007, acc=0.9997, iter_time=11.18s]
Epoch 0: 13%|█▎ | 1612/12384 [3:25:49<22:51:08, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=7.94s]
Epoch 0: 13%|█▎ | 1613/12384 [3:25:49<23:12:34, 7.76s/it, loss=0.0003, acc=1.0000, iter_time=7.94s]
Epoch 0: 13%|█▎ | 1613/12384 [3:25:57<23:12:34, 7.76s/it, loss=0.0050, acc=0.9920, iter_time=7.71s]
Epoch 0: 13%|█▎ | 1614/12384 [3:25:57<23:05:10, 7.72s/it, loss=0.0050, acc=0.9920, iter_time=7.71s]
Epoch 0: 13%|█▎ | 1614/12384 [3:26:04<23:05:10, 7.72s/it, loss=0.0006, acc=0.9984, iter_time=7.62s]
Epoch 0: 13%|█▎ | 1615/12384 [3:26:04<22:59:45, 7.69s/it, loss=0.0006, acc=0.9984, iter_time=7.62s]
Epoch 0: 13%|█▎ | 1615/12384 [3:26:12<22:59:45, 7.69s/it, loss=0.0011, acc=0.9966, iter_time=7.99s]
Epoch 0: 13%|█▎ | 1616/12384 [3:26:12<22:55:11, 7.66s/it, loss=0.0011, acc=0.9966, iter_time=7.99s]
Epoch 0: 13%|█▎ | 1616/12384 [3:26:19<22:55:11, 7.66s/it, loss=0.0033, acc=0.9960, iter_time=7.23s]
Epoch 0: 13%|█▎ | 1617/12384 [3:26:19<22:53:37, 7.65s/it, loss=0.0033, acc=0.9960, iter_time=7.23s]
Epoch 0: 13%|█▎ | 1617/12384 [3:26:27<22:53:37, 7.65s/it, loss=0.0006, acc=0.9975, iter_time=7.64s]
Epoch 0: 13%|█▎ | 1618/12384 [3:26:27<22:55:24, 7.67s/it, loss=0.0006, acc=0.9975, iter_time=7.64s]
Epoch 0: 13%|█▎ | 1618/12384 [3:26:35<22:55:24, 7.67s/it, loss=0.0003, acc=1.0000, iter_time=4.83s]
Epoch 0: 13%|█▎ | 1619/12384 [3:26:35<22:53:44, 7.66s/it, loss=0.0003, acc=1.0000, iter_time=4.83s]
Epoch 0: 13%|█▎ | 1619/12384 [3:26:42<22:53:44, 7.66s/it, loss=0.0040, acc=0.9900, iter_time=10.22s]
Epoch 0: 13%|█▎ | 1620/12384 [3:26:42<22:53:00, 7.65s/it, loss=0.0040, acc=0.9900, iter_time=10.22s]
Epoch 0: 13%|█▎ | 1620/12384 [3:26:50<22:53:00, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=4.39s]
Epoch 0: 13%|█▎ | 1621/12384 [3:26:50<22:52:43, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=4.39s]
Epoch 0: 13%|█▎ | 1621/12384 [3:26:58<22:52:43, 7.65s/it, loss=0.0013, acc=0.9965, iter_time=7.15s]
Epoch 0: 13%|█▎ | 1622/12384 [3:26:58<22:51:56, 7.65s/it, loss=0.0013, acc=0.9965, iter_time=7.15s]
Epoch 0: 13%|█▎ | 1622/12384 [3:27:05<22:51:56, 7.65s/it, loss=0.0041, acc=0.9894, iter_time=8.60s]
Epoch 0: 13%|█▎ | 1623/12384 [3:27:05<22:50:39, 7.64s/it, loss=0.0041, acc=0.9894, iter_time=8.60s]
Epoch 0: 13%|█▎ | 1623/12384 [3:27:13<22:50:39, 7.64s/it, loss=0.0009, acc=0.9983, iter_time=10.73s]
Epoch 0: 13%|█▎ | 1624/12384 [3:27:13<22:53:37, 7.66s/it, loss=0.0009, acc=0.9983, iter_time=10.73s]
Epoch 0: 13%|█▎ | 1624/12384 [3:27:21<22:53:37, 7.66s/it, loss=0.0004, acc=0.9989, iter_time=5.31s]
Epoch 0: 13%|█▎ | 1625/12384 [3:27:21<22:50:47, 7.64s/it, loss=0.0004, acc=0.9989, iter_time=5.31s]
Epoch 0: 13%|█▎ | 1625/12384 [3:27:28<22:50:47, 7.64s/it, loss=0.0005, acc=0.9993, iter_time=9.95s]
Epoch 0: 13%|█▎ | 1626/12384 [3:27:28<22:49:14, 7.64s/it, loss=0.0005, acc=0.9993, iter_time=9.95s]
Epoch 0: 13%|█▎ | 1626/12384 [3:27:36<22:49:14, 7.64s/it, loss=0.0032, acc=0.9947, iter_time=6.50s]
Epoch 0: 13%|█▎ | 1627/12384 [3:27:36<22:47:16, 7.63s/it, loss=0.0032, acc=0.9947, iter_time=6.50s]
Epoch 0: 13%|█▎ | 1627/12384 [3:27:43<22:47:16, 7.63s/it, loss=0.0011, acc=0.9979, iter_time=8.73s]
Epoch 0: 13%|█▎ | 1628/12384 [3:27:43<22:45:29, 7.62s/it, loss=0.0011, acc=0.9979, iter_time=8.73s]
Epoch 0: 13%|█▎ | 1628/12384 [3:27:51<22:45:29, 7.62s/it, loss=0.0011, acc=0.9975, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1629/12384 [3:27:51<22:44:32, 7.61s/it, loss=0.0011, acc=0.9975, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1629/12384 [3:27:59<22:44:32, 7.61s/it, loss=0.0002, acc=0.9999, iter_time=7.59s]
Epoch 0: 13%|█▎ | 1630/12384 [3:27:59<22:45:03, 7.62s/it, loss=0.0002, acc=0.9999, iter_time=7.59s]
Epoch 0: 13%|█▎ | 1630/12384 [3:28:06<22:45:03, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 13%|█▎ | 1631/12384 [3:28:06<22:45:05, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 13%|█▎ | 1631/12384 [3:28:14<22:45:05, 7.62s/it, loss=0.0061, acc=0.9873, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1632/12384 [3:28:14<22:46:33, 7.63s/it, loss=0.0061, acc=0.9873, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1632/12384 [3:28:22<22:46:33, 7.63s/it, loss=0.0006, acc=0.9977, iter_time=5.04s]
Epoch 0: 13%|█▎ | 1633/12384 [3:28:22<22:46:23, 7.63s/it, loss=0.0006, acc=0.9977, iter_time=5.04s]
Epoch 0: 13%|█▎ | 1633/12384 [3:28:29<22:46:23, 7.63s/it, loss=0.0004, acc=0.9996, iter_time=10.24s]
Epoch 0: 13%|█▎ | 1634/12384 [3:28:29<22:46:01, 7.62s/it, loss=0.0004, acc=0.9996, iter_time=10.24s]
Epoch 0: 13%|█▎ | 1634/12384 [3:28:37<22:46:01, 7.62s/it, loss=0.0006, acc=0.9991, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1635/12384 [3:28:37<22:45:36, 7.62s/it, loss=0.0006, acc=0.9991, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1635/12384 [3:28:44<22:45:36, 7.62s/it, loss=0.0010, acc=0.9962, iter_time=5.55s]
Epoch 0: 13%|█▎ | 1636/12384 [3:28:44<22:45:11, 7.62s/it, loss=0.0010, acc=0.9962, iter_time=5.55s]
Epoch 0: 13%|█▎ | 1636/12384 [3:28:52<22:45:11, 7.62s/it, loss=0.0028, acc=0.9894, iter_time=9.70s]
Epoch 0: 13%|█▎ | 1637/12384 [3:28:52<22:44:03, 7.62s/it, loss=0.0028, acc=0.9894, iter_time=9.70s]
Epoch 0: 13%|█▎ | 1637/12384 [3:29:00<22:44:03, 7.62s/it, loss=0.0014, acc=0.9971, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1638/12384 [3:29:00<22:44:45, 7.62s/it, loss=0.0014, acc=0.9971, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1638/12384 [3:29:08<22:44:45, 7.62s/it, loss=0.0010, acc=0.9967, iter_time=7.96s]
Epoch 0: 13%|█▎ | 1639/12384 [3:29:08<23:04:34, 7.73s/it, loss=0.0010, acc=0.9967, iter_time=7.96s]
Epoch 0: 13%|█▎ | 1639/12384 [3:29:15<23:04:34, 7.73s/it, loss=0.0004, acc=0.9998, iter_time=8.03s]
Epoch 0: 13%|█▎ | 1640/12384 [3:29:15<23:00:18, 7.71s/it, loss=0.0004, acc=0.9998, iter_time=8.03s]
Epoch 0: 13%|█▎ | 1640/12384 [3:29:23<23:00:18, 7.71s/it, loss=0.0013, acc=0.9970, iter_time=6.33s]
Epoch 0: 13%|█▎ | 1641/12384 [3:29:23<22:53:58, 7.67s/it, loss=0.0013, acc=0.9970, iter_time=6.33s]
Epoch 0: 13%|█▎ | 1641/12384 [3:29:30<22:53:58, 7.67s/it, loss=0.0004, acc=0.9979, iter_time=6.73s]
Epoch 0: 13%|█▎ | 1642/12384 [3:29:30<22:49:37, 7.65s/it, loss=0.0004, acc=0.9979, iter_time=6.73s]
Epoch 0: 13%|█▎ | 1642/12384 [3:29:38<22:49:37, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.34s]
Epoch 0: 13%|█▎ | 1643/12384 [3:29:38<22:47:35, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.34s]
Epoch 0: 13%|█▎ | 1643/12384 [3:29:46<22:47:35, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=5.84s]
Epoch 0: 13%|█▎ | 1644/12384 [3:29:46<22:47:35, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=5.84s]
Epoch 0: 13%|█▎ | 1644/12384 [3:29:53<22:47:35, 7.64s/it, loss=0.0009, acc=0.9970, iter_time=9.22s]
Epoch 0: 13%|█▎ | 1645/12384 [3:29:53<22:47:55, 7.64s/it, loss=0.0009, acc=0.9970, iter_time=9.22s]
Epoch 0: 13%|█▎ | 1645/12384 [3:30:01<22:47:55, 7.64s/it, loss=0.0016, acc=0.9929, iter_time=6.84s]
Epoch 0: 13%|█▎ | 1646/12384 [3:30:01<22:47:12, 7.64s/it, loss=0.0016, acc=0.9929, iter_time=6.84s]
Epoch 0: 13%|█▎ | 1646/12384 [3:30:09<22:47:12, 7.64s/it, loss=0.0028, acc=0.9952, iter_time=9.76s]
Epoch 0: 13%|█▎ | 1647/12384 [3:30:09<22:46:32, 7.64s/it, loss=0.0028, acc=0.9952, iter_time=9.76s]
Epoch 0: 13%|█▎ | 1647/12384 [3:30:16<22:46:32, 7.64s/it, loss=0.0043, acc=0.9931, iter_time=8.54s]
Epoch 0: 13%|█▎ | 1648/12384 [3:30:16<22:45:12, 7.63s/it, loss=0.0043, acc=0.9931, iter_time=8.54s]
Epoch 0: 13%|█▎ | 1648/12384 [3:30:24<22:45:12, 7.63s/it, loss=0.0085, acc=0.9804, iter_time=4.62s]
Epoch 0: 13%|█▎ | 1649/12384 [3:30:24<22:48:40, 7.65s/it, loss=0.0085, acc=0.9804, iter_time=4.62s]
Epoch 0: 13%|█▎ | 1649/12384 [3:30:32<22:48:40, 7.65s/it, loss=0.0005, acc=0.9961, iter_time=11.15s]
Epoch 0: 13%|█▎ | 1650/12384 [3:30:32<22:47:24, 7.64s/it, loss=0.0005, acc=0.9961, iter_time=11.15s]
Epoch 0: 13%|█▎ | 1650/12384 [3:30:39<22:47:24, 7.64s/it, loss=0.0027, acc=0.9919, iter_time=7.20s]
Epoch 0: 13%|█▎ | 1651/12384 [3:30:39<22:46:08, 7.64s/it, loss=0.0027, acc=0.9919, iter_time=7.20s]
Epoch 0: 13%|█▎ | 1651/12384 [3:30:47<22:46:08, 7.64s/it, loss=0.0033, acc=0.9895, iter_time=7.63s]
Epoch 0: 13%|█▎ | 1652/12384 [3:30:47<22:49:42, 7.66s/it, loss=0.0033, acc=0.9895, iter_time=7.63s]
Epoch 0: 13%|█▎ | 1652/12384 [3:30:55<22:49:42, 7.66s/it, loss=0.0012, acc=0.9998, iter_time=5.12s]
Epoch 0: 13%|█▎ | 1653/12384 [3:30:55<22:47:25, 7.65s/it, loss=0.0012, acc=0.9998, iter_time=5.12s]
Epoch 0: 13%|█▎ | 1653/12384 [3:31:02<22:47:25, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=8.16s]
Epoch 0: 13%|█▎ | 1654/12384 [3:31:02<22:45:15, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=8.16s]
Epoch 0: 13%|█▎ | 1654/12384 [3:31:10<22:45:15, 7.63s/it, loss=0.0006, acc=0.9980, iter_time=8.72s]
Epoch 0: 13%|█▎ | 1655/12384 [3:31:10<22:45:43, 7.64s/it, loss=0.0006, acc=0.9980, iter_time=8.72s]
Epoch 0: 13%|█▎ | 1655/12384 [3:31:17<22:45:43, 7.64s/it, loss=0.0014, acc=0.9987, iter_time=9.02s]
Epoch 0: 13%|█▎ | 1656/12384 [3:31:17<22:47:03, 7.65s/it, loss=0.0014, acc=0.9987, iter_time=9.02s]
Epoch 0: 13%|█▎ | 1656/12384 [3:31:25<22:47:03, 7.65s/it, loss=0.0010, acc=0.9989, iter_time=7.24s]
Epoch 0: 13%|█▎ | 1657/12384 [3:31:25<22:45:31, 7.64s/it, loss=0.0010, acc=0.9989, iter_time=7.24s]
Epoch 0: 13%|█▎ | 1657/12384 [3:31:33<22:45:31, 7.64s/it, loss=0.0026, acc=0.9958, iter_time=4.31s]
Epoch 0: 13%|█▎ | 1658/12384 [3:31:33<22:45:51, 7.64s/it, loss=0.0026, acc=0.9958, iter_time=4.31s]
Epoch 0: 13%|█▎ | 1658/12384 [3:31:40<22:45:51, 7.64s/it, loss=0.0015, acc=0.9970, iter_time=9.70s]
Epoch 0: 13%|█▎ | 1659/12384 [3:31:40<22:45:10, 7.64s/it, loss=0.0015, acc=0.9970, iter_time=9.70s]
Epoch 0: 13%|█▎ | 1659/12384 [3:31:48<22:45:10, 7.64s/it, loss=0.0010, acc=0.9990, iter_time=8.92s]
Epoch 0: 13%|█▎ | 1660/12384 [3:31:48<22:45:49, 7.64s/it, loss=0.0010, acc=0.9990, iter_time=8.92s]
Epoch 0: 13%|█▎ | 1660/12384 [3:31:56<22:45:49, 7.64s/it, loss=0.0003, acc=0.9995, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1661/12384 [3:31:56<22:45:47, 7.64s/it, loss=0.0003, acc=0.9995, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1661/12384 [3:32:03<22:45:47, 7.64s/it, loss=0.0023, acc=0.9972, iter_time=7.63s]
Epoch 0: 13%|█▎ | 1662/12384 [3:32:03<22:44:21, 7.63s/it, loss=0.0023, acc=0.9972, iter_time=7.63s]
Epoch 0: 13%|█▎ | 1662/12384 [3:32:11<22:44:21, 7.63s/it, loss=0.0004, acc=0.9986, iter_time=7.63s]
Epoch 0: 13%|█▎ | 1663/12384 [3:32:11<22:43:25, 7.63s/it, loss=0.0004, acc=0.9986, iter_time=7.63s]
Epoch 0: 13%|█▎ | 1663/12384 [3:32:18<22:43:25, 7.63s/it, loss=0.0030, acc=0.9895, iter_time=8.00s]
Epoch 0: 13%|█▎ | 1664/12384 [3:32:18<22:42:33, 7.63s/it, loss=0.0030, acc=0.9895, iter_time=8.00s]
Epoch 0: 13%|█▎ | 1664/12384 [3:32:26<22:42:33, 7.63s/it, loss=0.0007, acc=0.9980, iter_time=6.28s]
Epoch 0: 13%|█▎ | 1665/12384 [3:32:26<23:03:26, 7.74s/it, loss=0.0007, acc=0.9980, iter_time=6.28s]
Epoch 0: 13%|█▎ | 1665/12384 [3:32:34<23:03:26, 7.74s/it, loss=0.0078, acc=0.9933, iter_time=8.98s]
Epoch 0: 13%|█▎ | 1666/12384 [3:32:34<22:57:53, 7.71s/it, loss=0.0078, acc=0.9933, iter_time=8.98s]
Epoch 0: 13%|█▎ | 1666/12384 [3:32:42<22:57:53, 7.71s/it, loss=0.0013, acc=0.9975, iter_time=7.62s]
Epoch 0: 13%|█▎ | 1667/12384 [3:32:42<22:53:18, 7.69s/it, loss=0.0013, acc=0.9975, iter_time=7.62s]
Epoch 0: 13%|█▎ | 1667/12384 [3:32:49<22:53:18, 7.69s/it, loss=0.0013, acc=0.9971, iter_time=7.64s]
Epoch 0: 13%|█▎ | 1668/12384 [3:32:49<22:48:25, 7.66s/it, loss=0.0013, acc=0.9971, iter_time=7.64s]
Epoch 0: 13%|█▎ | 1668/12384 [3:32:57<22:48:25, 7.66s/it, loss=0.0027, acc=0.9915, iter_time=7.60s]
Epoch 0: 13%|█▎ | 1669/12384 [3:32:57<22:46:03, 7.65s/it, loss=0.0027, acc=0.9915, iter_time=7.60s]
Epoch 0: 13%|█▎ | 1669/12384 [3:33:05<22:46:03, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=7.63s]
Epoch 0: 13%|█▎ | 1670/12384 [3:33:05<22:43:52, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=7.63s]
Epoch 0: 13%|█▎ | 1670/12384 [3:33:12<22:43:52, 7.64s/it, loss=0.0015, acc=0.9982, iter_time=5.26s]
Epoch 0: 13%|█▎ | 1671/12384 [3:33:12<22:44:01, 7.64s/it, loss=0.0015, acc=0.9982, iter_time=5.26s]
Epoch 0: 13%|█▎ | 1671/12384 [3:33:20<22:44:01, 7.64s/it, loss=0.0023, acc=0.9957, iter_time=10.36s]
Epoch 0: 14%|█▎ | 1672/12384 [3:33:20<22:43:54, 7.64s/it, loss=0.0023, acc=0.9957, iter_time=10.36s]
Epoch 0: 14%|█▎ | 1672/12384 [3:33:27<22:43:54, 7.64s/it, loss=0.0003, acc=0.9998, iter_time=7.24s]
Epoch 0: 14%|█▎ | 1673/12384 [3:33:27<22:42:38, 7.63s/it, loss=0.0003, acc=0.9998, iter_time=7.24s]
Epoch 0: 14%|█▎ | 1673/12384 [3:33:35<22:42:38, 7.63s/it, loss=0.0028, acc=0.9923, iter_time=7.63s]
Epoch 0: 14%|█▎ | 1674/12384 [3:33:35<22:41:35, 7.63s/it, loss=0.0028, acc=0.9923, iter_time=7.63s]
Epoch 0: 14%|█▎ | 1674/12384 [3:33:43<22:41:35, 7.63s/it, loss=0.0018, acc=0.9952, iter_time=3.87s]
Epoch 0: 14%|█▎ | 1675/12384 [3:33:43<22:42:51, 7.64s/it, loss=0.0018, acc=0.9952, iter_time=3.87s]
Epoch 0: 14%|█▎ | 1675/12384 [3:33:50<22:42:51, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=8.10s]
Epoch 0: 14%|█▎ | 1676/12384 [3:33:50<22:42:13, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=8.10s]
Epoch 0: 14%|█▎ | 1676/12384 [3:33:58<22:42:13, 7.63s/it, loss=0.0006, acc=0.9981, iter_time=9.72s]
Epoch 0: 14%|█▎ | 1677/12384 [3:33:58<22:40:57, 7.63s/it, loss=0.0006, acc=0.9981, iter_time=9.72s]
Epoch 0: 14%|█▎ | 1677/12384 [3:34:06<22:40:57, 7.63s/it, loss=0.0133, acc=0.9850, iter_time=8.82s]
Epoch 0: 14%|█▎ | 1678/12384 [3:34:06<22:39:33, 7.62s/it, loss=0.0133, acc=0.9850, iter_time=8.82s]
Epoch 0: 14%|█▎ | 1678/12384 [3:34:13<22:39:33, 7.62s/it, loss=0.0004, acc=0.9999, iter_time=7.62s]
Epoch 0: 14%|█▎ | 1679/12384 [3:34:13<22:40:00, 7.62s/it, loss=0.0004, acc=0.9999, iter_time=7.62s]
Epoch 0: 14%|█▎ | 1679/12384 [3:34:21<22:40:00, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=8.02s]
Epoch 0: 14%|█▎ | 1680/12384 [3:34:21<22:40:23, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=8.02s]
Epoch 0: 14%|█▎ | 1680/12384 [3:34:28<22:40:23, 7.63s/it, loss=0.0015, acc=0.9982, iter_time=6.12s]
Epoch 0: 14%|█▎ | 1681/12384 [3:34:28<22:40:11, 7.63s/it, loss=0.0015, acc=0.9982, iter_time=6.12s]
Epoch 0: 14%|█▎ | 1681/12384 [3:34:36<22:40:11, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=8.74s]
Epoch 0: 14%|█▎ | 1682/12384 [3:34:36<22:40:36, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=8.74s]
Epoch 0: 14%|█▎ | 1682/12384 [3:34:44<22:40:36, 7.63s/it, loss=0.0003, acc=0.9987, iter_time=7.63s]
Epoch 0: 14%|█▎ | 1683/12384 [3:34:44<22:39:50, 7.62s/it, loss=0.0003, acc=0.9987, iter_time=7.63s]
Epoch 0: 14%|█▎ | 1683/12384 [3:34:51<22:39:50, 7.62s/it, loss=0.0031, acc=0.9975, iter_time=7.63s]
Epoch 0: 14%|█▎ | 1684/12384 [3:34:51<22:40:31, 7.63s/it, loss=0.0031, acc=0.9975, iter_time=7.63s]
Epoch 0: 14%|█▎ | 1684/12384 [3:34:59<22:40:31, 7.63s/it, loss=0.0008, acc=0.9973, iter_time=6.47s]
Epoch 0: 14%|█▎ | 1685/12384 [3:34:59<22:40:01, 7.63s/it, loss=0.0008, acc=0.9973, iter_time=6.47s]
Epoch 0: 14%|█▎ | 1685/12384 [3:35:07<22:40:01, 7.63s/it, loss=0.0004, acc=1.0000, iter_time=8.78s]
Epoch 0: 14%|█▎ | 1686/12384 [3:35:07<22:39:20, 7.62s/it, loss=0.0004, acc=1.0000, iter_time=8.78s]
Epoch 0: 14%|█▎ | 1686/12384 [3:35:14<22:39:20, 7.62s/it, loss=0.0015, acc=0.9972, iter_time=7.08s]
Epoch 0: 14%|█▎ | 1687/12384 [3:35:14<22:40:44, 7.63s/it, loss=0.0015, acc=0.9972, iter_time=7.08s]
Epoch 0: 14%|█▎ | 1687/12384 [3:35:22<22:40:44, 7.63s/it, loss=0.0020, acc=0.9973, iter_time=8.55s]
Epoch 0: 14%|█▎ | 1688/12384 [3:35:22<22:38:06, 7.62s/it, loss=0.0020, acc=0.9973, iter_time=8.55s]
Epoch 0: 14%|█▎ | 1688/12384 [3:35:29<22:38:06, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.22s]
Epoch 0: 14%|█▎ | 1689/12384 [3:35:29<22:37:41, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.22s]
Epoch 0: 14%|█▎ | 1689/12384 [3:35:37<22:37:41, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 14%|█▎ | 1690/12384 [3:35:37<22:39:35, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 14%|█▎ | 1690/12384 [3:35:45<22:39:35, 7.63s/it, loss=0.0016, acc=0.9976, iter_time=7.97s]
Epoch 0: 14%|█▎ | 1691/12384 [3:35:45<22:58:02, 7.73s/it, loss=0.0016, acc=0.9976, iter_time=7.97s]
Epoch 0: 14%|█▎ | 1691/12384 [3:35:53<22:58:02, 7.73s/it, loss=0.0008, acc=0.9981, iter_time=7.68s]
Epoch 0: 14%|█▎ | 1692/12384 [3:35:53<22:52:25, 7.70s/it, loss=0.0008, acc=0.9981, iter_time=7.68s]
Epoch 0: 14%|█▎ | 1692/12384 [3:36:00<22:52:25, 7.70s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 14%|█▎ | 1693/12384 [3:36:00<22:49:08, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 14%|█▎ | 1693/12384 [3:36:08<22:49:08, 7.68s/it, loss=0.0006, acc=0.9978, iter_time=7.66s]
Epoch 0: 14%|█▎ | 1694/12384 [3:36:08<22:46:06, 7.67s/it, loss=0.0006, acc=0.9978, iter_time=7.66s]
Epoch 0: 14%|█▎ | 1694/12384 [3:36:16<22:46:06, 7.67s/it, loss=0.0032, acc=0.9913, iter_time=6.12s]
Epoch 0: 14%|█▎ | 1695/12384 [3:36:16<22:45:08, 7.66s/it, loss=0.0032, acc=0.9913, iter_time=6.12s]
Epoch 0: 14%|█▎ | 1695/12384 [3:36:23<22:45:08, 7.66s/it, loss=0.0004, acc=1.0000, iter_time=9.52s]
Epoch 0: 14%|█▎ | 1696/12384 [3:36:23<22:42:45, 7.65s/it, loss=0.0004, acc=1.0000, iter_time=9.52s]
Epoch 0: 14%|█▎ | 1696/12384 [3:36:31<22:42:45, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=6.32s]
Epoch 0: 14%|█▎ | 1697/12384 [3:36:31<22:45:55, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=6.32s]
Epoch 0: 14%|█▎ | 1697/12384 [3:36:39<22:45:55, 7.67s/it, loss=0.0022, acc=0.9965, iter_time=8.32s]
Epoch 0: 14%|█▎ | 1698/12384 [3:36:39<22:42:35, 7.65s/it, loss=0.0022, acc=0.9965, iter_time=8.32s]
Epoch 0: 14%|█▎ | 1698/12384 [3:36:46<22:42:35, 7.65s/it, loss=0.0006, acc=0.9975, iter_time=7.91s]
Epoch 0: 14%|█▎ | 1699/12384 [3:36:46<22:39:54, 7.64s/it, loss=0.0006, acc=0.9975, iter_time=7.91s]
Epoch 0: 14%|█▎ | 1699/12384 [3:36:54<22:39:54, 7.64s/it, loss=0.0003, acc=0.9982, iter_time=8.03s]
Epoch 0: 14%|█▎ | 1700/12384 [3:36:54<22:39:20, 7.63s/it, loss=0.0003, acc=0.9982, iter_time=8.03s]
Epoch 0: 14%|█▎ | 1700/12384 [3:37:01<22:39:20, 7.63s/it, loss=0.0024, acc=0.9943, iter_time=7.21s]
Epoch 0: 14%|█▎ | 1701/12384 [3:37:01<22:39:27, 7.64s/it, loss=0.0024, acc=0.9943, iter_time=7.21s]
Epoch 0: 14%|█▎ | 1701/12384 [3:37:09<22:39:27, 7.64s/it, loss=0.0011, acc=0.9969, iter_time=7.66s]
Epoch 0: 14%|█▎ | 1702/12384 [3:37:09<22:39:32, 7.64s/it, loss=0.0011, acc=0.9969, iter_time=7.66s]
Epoch 0: 14%|█▎ | 1702/12384 [3:37:17<22:39:32, 7.64s/it, loss=0.0010, acc=0.9969, iter_time=7.63s]
Epoch 0: 14%|█▍ | 1703/12384 [3:37:17<22:38:23, 7.63s/it, loss=0.0010, acc=0.9969, iter_time=7.63s]
Epoch 0: 14%|█▍ | 1703/12384 [3:37:24<22:38:23, 7.63s/it, loss=0.0017, acc=0.9983, iter_time=7.57s]
Epoch 0: 14%|█▍ | 1704/12384 [3:37:24<22:37:54, 7.63s/it, loss=0.0017, acc=0.9983, iter_time=7.57s]
Epoch 0: 14%|█▍ | 1704/12384 [3:37:32<22:37:54, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.13s]
Epoch 0: 14%|█▍ | 1705/12384 [3:37:32<22:37:02, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=7.13s]
Epoch 0: 14%|█▍ | 1705/12384 [3:37:40<22:37:02, 7.62s/it, loss=0.0007, acc=0.9984, iter_time=8.16s]
Epoch 0: 14%|█▍ | 1706/12384 [3:37:40<22:35:50, 7.62s/it, loss=0.0007, acc=0.9984, iter_time=8.16s]
Epoch 0: 14%|█▍ | 1706/12384 [3:37:47<22:35:50, 7.62s/it, loss=0.0011, acc=0.9977, iter_time=7.60s]
Epoch 0: 14%|█▍ | 1707/12384 [3:37:47<22:36:40, 7.62s/it, loss=0.0011, acc=0.9977, iter_time=7.60s]
Epoch 0: 14%|█▍ | 1707/12384 [3:37:55<22:36:40, 7.62s/it, loss=0.0027, acc=0.9970, iter_time=6.14s]
Epoch 0: 14%|█▍ | 1708/12384 [3:37:55<22:34:27, 7.61s/it, loss=0.0027, acc=0.9970, iter_time=6.14s]
Epoch 0: 14%|█▍ | 1708/12384 [3:38:02<22:34:27, 7.61s/it, loss=0.0005, acc=0.9982, iter_time=7.56s]
Epoch 0: 14%|█▍ | 1709/12384 [3:38:02<22:34:25, 7.61s/it, loss=0.0005, acc=0.9982, iter_time=7.56s]
Epoch 0: 14%|█▍ | 1709/12384 [3:38:10<22:34:25, 7.61s/it, loss=0.0014, acc=0.9979, iter_time=7.70s]
Epoch 0: 14%|█▍ | 1710/12384 [3:38:10<22:39:47, 7.64s/it, loss=0.0014, acc=0.9979, iter_time=7.70s]
Epoch 0: 14%|█▍ | 1710/12384 [3:38:18<22:39:47, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=7.37s]
Epoch 0: 14%|█▍ | 1711/12384 [3:38:18<22:37:40, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.37s]
Epoch 0: 14%|█▍ | 1711/12384 [3:38:25<22:37:40, 7.63s/it, loss=0.0045, acc=0.9931, iter_time=9.78s]
Epoch 0: 14%|█▍ | 1712/12384 [3:38:25<22:41:04, 7.65s/it, loss=0.0045, acc=0.9931, iter_time=9.78s]
Epoch 0: 14%|█▍ | 1712/12384 [3:38:33<22:41:04, 7.65s/it, loss=0.0008, acc=0.9988, iter_time=7.29s]
Epoch 0: 14%|█▍ | 1713/12384 [3:38:33<22:38:24, 7.64s/it, loss=0.0008, acc=0.9988, iter_time=7.29s]
Epoch 0: 14%|█▍ | 1713/12384 [3:38:41<22:38:24, 7.64s/it, loss=0.0005, acc=0.9997, iter_time=5.36s]
Epoch 0: 14%|█▍ | 1714/12384 [3:38:41<22:39:52, 7.65s/it, loss=0.0005, acc=0.9997, iter_time=5.36s]
Epoch 0: 14%|█▍ | 1714/12384 [3:38:48<22:39:52, 7.65s/it, loss=0.0007, acc=0.9960, iter_time=9.93s]
Epoch 0: 14%|█▍ | 1715/12384 [3:38:48<22:39:56, 7.65s/it, loss=0.0007, acc=0.9960, iter_time=9.93s]
Epoch 0: 14%|█▍ | 1715/12384 [3:38:56<22:39:56, 7.65s/it, loss=0.0005, acc=0.9988, iter_time=6.22s]
Epoch 0: 14%|█▍ | 1716/12384 [3:38:56<22:40:25, 7.65s/it, loss=0.0005, acc=0.9988, iter_time=6.22s]
Epoch 0: 14%|█▍ | 1716/12384 [3:39:04<22:40:25, 7.65s/it, loss=0.0004, acc=1.0000, iter_time=9.39s]
Epoch 0: 14%|█▍ | 1717/12384 [3:39:04<22:59:14, 7.76s/it, loss=0.0004, acc=1.0000, iter_time=9.39s]
Epoch 0: 14%|█▍ | 1717/12384 [3:39:12<22:59:14, 7.76s/it, loss=0.0009, acc=0.9999, iter_time=7.71s]
Epoch 0: 14%|█▍ | 1718/12384 [3:39:12<22:52:20, 7.72s/it, loss=0.0009, acc=0.9999, iter_time=7.71s]
Epoch 0: 14%|█▍ | 1718/12384 [3:39:19<22:52:20, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=4.34s]
Epoch 0: 14%|█▍ | 1719/12384 [3:39:19<22:46:00, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=4.34s]
Epoch 0: 14%|█▍ | 1719/12384 [3:39:27<22:46:00, 7.68s/it, loss=0.0013, acc=0.9983, iter_time=11.28s]
Epoch 0: 14%|█▍ | 1720/12384 [3:39:27<22:43:02, 7.67s/it, loss=0.0013, acc=0.9983, iter_time=11.28s]
Epoch 0: 14%|█▍ | 1720/12384 [3:39:34<22:43:02, 7.67s/it, loss=0.0039, acc=0.9931, iter_time=3.73s]
Epoch 0: 14%|█▍ | 1721/12384 [3:39:34<22:40:36, 7.66s/it, loss=0.0039, acc=0.9931, iter_time=3.73s]
Epoch 0: 14%|█▍ | 1721/12384 [3:39:42<22:40:36, 7.66s/it, loss=0.0003, acc=0.9998, iter_time=9.96s]
Epoch 0: 14%|█▍ | 1722/12384 [3:39:42<22:38:37, 7.65s/it, loss=0.0003, acc=0.9998, iter_time=9.96s]
Epoch 0: 14%|█▍ | 1722/12384 [3:39:50<22:38:37, 7.65s/it, loss=0.0128, acc=0.9713, iter_time=8.82s]
Epoch 0: 14%|█▍ | 1723/12384 [3:39:50<22:38:43, 7.65s/it, loss=0.0128, acc=0.9713, iter_time=8.82s]
Epoch 0: 14%|█▍ | 1723/12384 [3:39:57<22:38:43, 7.65s/it, loss=0.0003, acc=0.9998, iter_time=7.09s]
Epoch 0: 14%|█▍ | 1724/12384 [3:39:57<22:38:47, 7.65s/it, loss=0.0003, acc=0.9998, iter_time=7.09s]
Epoch 0: 14%|█▍ | 1724/12384 [3:40:05<22:38:47, 7.65s/it, loss=0.0010, acc=1.0000, iter_time=8.19s]
Epoch 0: 14%|█▍ | 1725/12384 [3:40:05<22:36:52, 7.64s/it, loss=0.0010, acc=1.0000, iter_time=8.19s]
Epoch 0: 14%|█▍ | 1725/12384 [3:40:13<22:36:52, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=5.31s]
Epoch 0: 14%|█▍ | 1726/12384 [3:40:13<22:36:05, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=5.31s]
Epoch 0: 14%|█▍ | 1726/12384 [3:40:20<22:36:05, 7.63s/it, loss=0.0012, acc=0.9972, iter_time=10.10s]
Epoch 0: 14%|█▍ | 1727/12384 [3:40:20<22:44:06, 7.68s/it, loss=0.0012, acc=0.9972, iter_time=10.10s]
Epoch 0: 14%|█▍ | 1727/12384 [3:40:28<22:44:06, 7.68s/it, loss=0.0022, acc=0.9962, iter_time=7.84s]
Epoch 0: 14%|█▍ | 1728/12384 [3:40:28<22:54:03, 7.74s/it, loss=0.0022, acc=0.9962, iter_time=7.84s]
Epoch 0: 14%|█▍ | 1728/12384 [3:40:36<22:54:03, 7.74s/it, loss=0.0008, acc=0.9980, iter_time=5.70s]
Epoch 0: 14%|█▍ | 1729/12384 [3:40:36<22:55:51, 7.75s/it, loss=0.0008, acc=0.9980, iter_time=5.70s]
Epoch 0: 14%|█▍ | 1729/12384 [3:40:44<22:55:51, 7.75s/it, loss=0.0006, acc=0.9994, iter_time=9.84s]
Epoch 0: 14%|█▍ | 1730/12384 [3:40:44<22:54:17, 7.74s/it, loss=0.0006, acc=0.9994, iter_time=9.84s]
Epoch 0: 14%|█▍ | 1730/12384 [3:40:52<22:54:17, 7.74s/it, loss=0.0007, acc=0.9983, iter_time=7.76s]
Epoch 0: 14%|█▍ | 1731/12384 [3:40:52<22:56:12, 7.75s/it, loss=0.0007, acc=0.9983, iter_time=7.76s]
Epoch 0: 14%|█▍ | 1731/12384 [3:40:59<22:56:12, 7.75s/it, loss=0.0012, acc=0.9969, iter_time=7.76s]
Epoch 0: 14%|█▍ | 1732/12384 [3:40:59<22:58:46, 7.77s/it, loss=0.0012, acc=0.9969, iter_time=7.76s]
Epoch 0: 14%|█▍ | 1732/12384 [3:41:07<22:58:46, 7.77s/it, loss=0.0001, acc=1.0000, iter_time=7.16s]
Epoch 0: 14%|█▍ | 1733/12384 [3:41:07<23:00:06, 7.77s/it, loss=0.0001, acc=1.0000, iter_time=7.16s]
Epoch 0: 14%|█▍ | 1733/12384 [3:41:15<23:00:06, 7.77s/it, loss=0.0001, acc=0.9998, iter_time=5.34s]
Epoch 0: 14%|█▍ | 1734/12384 [3:41:15<23:01:20, 7.78s/it, loss=0.0001, acc=0.9998, iter_time=5.34s]
Epoch 0: 14%|█▍ | 1734/12384 [3:41:23<23:01:20, 7.78s/it, loss=0.0016, acc=0.9975, iter_time=8.05s]
Epoch 0: 14%|█▍ | 1735/12384 [3:41:23<23:02:09, 7.79s/it, loss=0.0016, acc=0.9975, iter_time=8.05s]
Epoch 0: 14%|█▍ | 1735/12384 [3:41:31<23:02:09, 7.79s/it, loss=0.0017, acc=0.9965, iter_time=10.99s]
Epoch 0: 14%|█▍ | 1736/12384 [3:41:31<23:01:56, 7.79s/it, loss=0.0017, acc=0.9965, iter_time=10.99s]
Epoch 0: 14%|█▍ | 1736/12384 [3:41:38<23:01:56, 7.79s/it, loss=0.0003, acc=0.9999, iter_time=7.50s]
Epoch 0: 14%|█▍ | 1737/12384 [3:41:38<23:03:27, 7.80s/it, loss=0.0003, acc=0.9999, iter_time=7.50s]
Epoch 0: 14%|█▍ | 1737/12384 [3:41:46<23:03:27, 7.80s/it, loss=0.0001, acc=1.0000, iter_time=7.75s]
Epoch 0: 14%|█▍ | 1738/12384 [3:41:46<23:04:52, 7.81s/it, loss=0.0001, acc=1.0000, iter_time=7.75s]
Epoch 0: 14%|█▍ | 1738/12384 [3:41:54<23:04:52, 7.81s/it, loss=0.0006, acc=0.9982, iter_time=7.54s]
Epoch 0: 14%|█▍ | 1739/12384 [3:41:54<23:02:54, 7.79s/it, loss=0.0006, acc=0.9982, iter_time=7.54s]
Epoch 0: 14%|█▍ | 1739/12384 [3:42:02<23:02:54, 7.79s/it, loss=0.0007, acc=0.9994, iter_time=8.07s]
Epoch 0: 14%|█▍ | 1740/12384 [3:42:02<23:03:58, 7.80s/it, loss=0.0007, acc=0.9994, iter_time=8.07s]
Epoch 0: 14%|█▍ | 1740/12384 [3:42:10<23:03:58, 7.80s/it, loss=0.0002, acc=0.9998, iter_time=7.85s]
Epoch 0: 14%|█▍ | 1741/12384 [3:42:10<23:05:46, 7.81s/it, loss=0.0002, acc=0.9998, iter_time=7.85s]
Epoch 0: 14%|█▍ | 1741/12384 [3:42:17<23:05:46, 7.81s/it, loss=0.0039, acc=0.9914, iter_time=4.48s]
Epoch 0: 14%|█▍ | 1742/12384 [3:42:17<23:02:34, 7.80s/it, loss=0.0039, acc=0.9914, iter_time=4.48s]
Epoch 0: 14%|█▍ | 1742/12384 [3:42:25<23:02:34, 7.80s/it, loss=0.0001, acc=1.0000, iter_time=9.76s]
Epoch 0: 14%|█▍ | 1743/12384 [3:42:25<23:03:44, 7.80s/it, loss=0.0001, acc=1.0000, iter_time=9.76s]
Epoch 0: 14%|█▍ | 1743/12384 [3:42:33<23:03:44, 7.80s/it, loss=0.0023, acc=0.9954, iter_time=9.54s]
Epoch 0: 14%|█▍ | 1744/12384 [3:42:33<23:25:28, 7.93s/it, loss=0.0023, acc=0.9954, iter_time=9.54s]
Epoch 0: 14%|█▍ | 1744/12384 [3:42:41<23:25:28, 7.93s/it, loss=0.0022, acc=0.9948, iter_time=7.75s]
Epoch 0: 14%|█▍ | 1745/12384 [3:42:41<23:16:25, 7.88s/it, loss=0.0022, acc=0.9948, iter_time=7.75s]
Epoch 0: 14%|█▍ | 1745/12384 [3:42:49<23:16:25, 7.88s/it, loss=0.0006, acc=0.9994, iter_time=7.85s]
Epoch 0: 14%|█▍ | 1746/12384 [3:42:49<23:12:17, 7.85s/it, loss=0.0006, acc=0.9994, iter_time=7.85s]
Epoch 0: 14%|█▍ | 1746/12384 [3:42:57<23:12:17, 7.85s/it, loss=0.0018, acc=0.9937, iter_time=7.75s]
Epoch 0: 14%|█▍ | 1747/12384 [3:42:57<23:09:45, 7.84s/it, loss=0.0018, acc=0.9937, iter_time=7.75s]
Epoch 0: 14%|█▍ | 1747/12384 [3:43:05<23:09:45, 7.84s/it, loss=0.0006, acc=0.9974, iter_time=7.83s]
Epoch 0: 14%|█▍ | 1748/12384 [3:43:05<23:08:43, 7.83s/it, loss=0.0006, acc=0.9974, iter_time=7.83s]
Epoch 0: 14%|█▍ | 1748/12384 [3:43:12<23:08:43, 7.83s/it, loss=0.0024, acc=0.9947, iter_time=7.81s]
Epoch 0: 14%|█▍ | 1749/12384 [3:43:12<23:06:45, 7.82s/it, loss=0.0024, acc=0.9947, iter_time=7.81s]
Epoch 0: 14%|█▍ | 1749/12384 [3:43:20<23:06:45, 7.82s/it, loss=0.0003, acc=0.9999, iter_time=8.27s]
Epoch 0: 14%|█▍ | 1750/12384 [3:43:20<23:06:22, 7.82s/it, loss=0.0003, acc=0.9999, iter_time=8.27s]
Epoch 0: 14%|█▍ | 1750/12384 [3:43:28<23:06:22, 7.82s/it, loss=0.0006, acc=0.9997, iter_time=7.42s]
Epoch 0: 14%|█▍ | 1751/12384 [3:43:28<23:07:47, 7.83s/it, loss=0.0006, acc=0.9997, iter_time=7.42s]
Epoch 0: 14%|█▍ | 1751/12384 [3:43:36<23:07:47, 7.83s/it, loss=0.0003, acc=0.9993, iter_time=7.79s]
Epoch 0: 14%|█▍ | 1752/12384 [3:43:36<23:06:34, 7.82s/it, loss=0.0003, acc=0.9993, iter_time=7.79s]
Epoch 0: 14%|█▍ | 1752/12384 [3:43:44<23:06:34, 7.82s/it, loss=0.0001, acc=1.0000, iter_time=7.90s]
Epoch 0: 14%|█▍ | 1753/12384 [3:43:44<23:11:13, 7.85s/it, loss=0.0001, acc=1.0000, iter_time=7.90s]
Epoch 0: 14%|█▍ | 1753/12384 [3:43:52<23:11:13, 7.85s/it, loss=0.0024, acc=0.9939, iter_time=6.94s]
Epoch 0: 14%|█▍ | 1754/12384 [3:43:52<23:28:14, 7.95s/it, loss=0.0024, acc=0.9939, iter_time=6.94s]
Epoch 0: 14%|█▍ | 1754/12384 [3:44:00<23:28:14, 7.95s/it, loss=0.0014, acc=0.9977, iter_time=8.44s]
Epoch 0: 14%|█▍ | 1755/12384 [3:44:00<23:20:30, 7.91s/it, loss=0.0014, acc=0.9977, iter_time=8.44s]
Epoch 0: 14%|█▍ | 1755/12384 [3:44:08<23:20:30, 7.91s/it, loss=0.0008, acc=0.9980, iter_time=7.78s]
Epoch 0: 14%|█▍ | 1756/12384 [3:44:08<23:14:59, 7.88s/it, loss=0.0008, acc=0.9980, iter_time=7.78s]
Epoch 0: 14%|█▍ | 1756/12384 [3:44:16<23:14:59, 7.88s/it, loss=0.0001, acc=1.0000, iter_time=8.54s]
Epoch 0: 14%|█▍ | 1757/12384 [3:44:16<23:16:59, 7.89s/it, loss=0.0001, acc=1.0000, iter_time=8.54s]
Epoch 0: 14%|█▍ | 1757/12384 [3:44:23<23:16:59, 7.89s/it, loss=0.0002, acc=1.0000, iter_time=7.28s]
Epoch 0: 14%|█▍ | 1758/12384 [3:44:23<23:12:50, 7.86s/it, loss=0.0002, acc=1.0000, iter_time=7.28s]
Epoch 0: 14%|█▍ | 1758/12384 [3:44:31<23:12:50, 7.86s/it, loss=0.0007, acc=0.9974, iter_time=8.09s]
Epoch 0: 14%|█▍ | 1759/12384 [3:44:31<23:12:35, 7.86s/it, loss=0.0007, acc=0.9974, iter_time=8.09s]
Epoch 0: 14%|█▍ | 1759/12384 [3:44:39<23:12:35, 7.86s/it, loss=0.0018, acc=0.9956, iter_time=8.11s]
Epoch 0: 14%|█▍ | 1760/12384 [3:44:39<23:09:14, 7.85s/it, loss=0.0018, acc=0.9956, iter_time=8.11s]
Epoch 0: 14%|█▍ | 1760/12384 [3:44:47<23:09:14, 7.85s/it, loss=0.0004, acc=0.9991, iter_time=5.90s]
Epoch 0: 14%|█▍ | 1761/12384 [3:44:47<23:19:35, 7.91s/it, loss=0.0004, acc=0.9991, iter_time=5.90s]
Epoch 0: 14%|█▍ | 1761/12384 [3:44:55<23:19:35, 7.91s/it, loss=0.0005, acc=0.9976, iter_time=8.25s]
Epoch 0: 14%|█▍ | 1762/12384 [3:44:55<23:12:07, 7.86s/it, loss=0.0005, acc=0.9976, iter_time=8.25s]
Epoch 0: 14%|█▍ | 1762/12384 [3:45:03<23:12:07, 7.86s/it, loss=0.0002, acc=1.0000, iter_time=9.50s]
Epoch 0: 14%|█▍ | 1763/12384 [3:45:03<23:09:11, 7.85s/it, loss=0.0002, acc=1.0000, iter_time=9.50s]
Epoch 0: 14%|█▍ | 1763/12384 [3:45:10<23:09:11, 7.85s/it, loss=0.0007, acc=0.9982, iter_time=4.94s]
Epoch 0: 14%|█▍ | 1764/12384 [3:45:10<23:08:14, 7.84s/it, loss=0.0007, acc=0.9982, iter_time=4.94s]
Epoch 0: 14%|█▍ | 1764/12384 [3:45:18<23:08:14, 7.84s/it, loss=0.0006, acc=0.9982, iter_time=10.69s]
Epoch 0: 14%|█▍ | 1765/12384 [3:45:18<23:08:06, 7.84s/it, loss=0.0006, acc=0.9982, iter_time=10.69s]
Epoch 0: 14%|█▍ | 1765/12384 [3:45:26<23:08:06, 7.84s/it, loss=0.0001, acc=1.0000, iter_time=5.71s]
Epoch 0: 14%|█▍ | 1766/12384 [3:45:26<23:06:33, 7.84s/it, loss=0.0001, acc=1.0000, iter_time=5.71s]
Epoch 0: 14%|█▍ | 1766/12384 [3:45:34<23:06:33, 7.84s/it, loss=0.0002, acc=0.9998, iter_time=9.05s]
Epoch 0: 14%|█▍ | 1767/12384 [3:45:34<23:05:36, 7.83s/it, loss=0.0002, acc=0.9998, iter_time=9.05s]
Epoch 0: 14%|█▍ | 1767/12384 [3:45:42<23:05:36, 7.83s/it, loss=0.0001, acc=1.0000, iter_time=9.10s]
Epoch 0: 14%|█▍ | 1768/12384 [3:45:42<23:08:10, 7.85s/it, loss=0.0001, acc=1.0000, iter_time=9.10s]
Epoch 0: 14%|█▍ | 1768/12384 [3:45:50<23:08:10, 7.85s/it, loss=0.0003, acc=0.9994, iter_time=6.85s]
Epoch 0: 14%|█▍ | 1769/12384 [3:45:50<23:04:41, 7.83s/it, loss=0.0003, acc=0.9994, iter_time=6.85s]
Epoch 0: 14%|█▍ | 1769/12384 [3:45:58<23:04:41, 7.83s/it, loss=0.0004, acc=0.9997, iter_time=8.80s]
Epoch 0: 14%|█▍ | 1770/12384 [3:45:58<23:24:37, 7.94s/it, loss=0.0004, acc=0.9997, iter_time=8.80s]
Epoch 0: 14%|█▍ | 1770/12384 [3:46:06<23:24:37, 7.94s/it, loss=0.0004, acc=0.9998, iter_time=7.86s]
Epoch 0: 14%|█▍ | 1771/12384 [3:46:06<23:16:48, 7.90s/it, loss=0.0004, acc=0.9998, iter_time=7.86s]
Epoch 0: 14%|█▍ | 1771/12384 [3:46:13<23:16:48, 7.90s/it, loss=0.0007, acc=0.9953, iter_time=7.87s]
Epoch 0: 14%|█▍ | 1772/12384 [3:46:13<23:17:09, 7.90s/it, loss=0.0007, acc=0.9953, iter_time=7.87s]
Epoch 0: 14%|█▍ | 1772/12384 [3:46:21<23:17:09, 7.90s/it, loss=0.0025, acc=0.9956, iter_time=7.79s]
Epoch 0: 14%|█▍ | 1773/12384 [3:46:21<23:16:44, 7.90s/it, loss=0.0025, acc=0.9956, iter_time=7.79s]
Epoch 0: 14%|█▍ | 1773/12384 [3:46:29<23:16:44, 7.90s/it, loss=0.0004, acc=1.0000, iter_time=7.95s]
Epoch 0: 14%|█▍ | 1774/12384 [3:46:29<23:12:54, 7.88s/it, loss=0.0004, acc=1.0000, iter_time=7.95s]
Epoch 0: 14%|█▍ | 1774/12384 [3:46:37<23:12:54, 7.88s/it, loss=0.0030, acc=0.9984, iter_time=6.09s]
Epoch 0: 14%|█▍ | 1775/12384 [3:46:37<23:08:46, 7.85s/it, loss=0.0030, acc=0.9984, iter_time=6.09s]
Epoch 0: 14%|█▍ | 1775/12384 [3:46:45<23:08:46, 7.85s/it, loss=0.0011, acc=0.9989, iter_time=9.50s]
Epoch 0: 14%|█▍ | 1776/12384 [3:46:45<23:07:33, 7.85s/it, loss=0.0011, acc=0.9989, iter_time=9.50s]
Epoch 0: 14%|█▍ | 1776/12384 [3:46:53<23:07:33, 7.85s/it, loss=0.0014, acc=0.9959, iter_time=7.89s]
Epoch 0: 14%|█▍ | 1777/12384 [3:46:53<23:06:48, 7.84s/it, loss=0.0014, acc=0.9959, iter_time=7.89s]
Epoch 0: 14%|█▍ | 1777/12384 [3:47:01<23:06:48, 7.84s/it, loss=0.0004, acc=1.0000, iter_time=7.80s]
Epoch 0: 14%|█▍ | 1778/12384 [3:47:01<23:08:36, 7.86s/it, loss=0.0004, acc=1.0000, iter_time=7.80s]
Epoch 0: 14%|█▍ | 1778/12384 [3:47:08<23:08:36, 7.86s/it, loss=0.0004, acc=0.9999, iter_time=7.94s]
Epoch 0: 14%|█▍ | 1779/12384 [3:47:08<23:09:00, 7.86s/it, loss=0.0004, acc=0.9999, iter_time=7.94s]
Epoch 0: 14%|█▍ | 1779/12384 [3:47:16<23:09:00, 7.86s/it, loss=0.0003, acc=0.9998, iter_time=7.16s]
Epoch 0: 14%|█▍ | 1780/12384 [3:47:16<23:04:48, 7.84s/it, loss=0.0003, acc=0.9998, iter_time=7.16s]
Epoch 0: 14%|█▍ | 1780/12384 [3:47:24<23:04:48, 7.84s/it, loss=0.0029, acc=0.9959, iter_time=8.36s]
Epoch 0: 14%|█▍ | 1781/12384 [3:47:24<23:02:08, 7.82s/it, loss=0.0029, acc=0.9959, iter_time=8.36s]
Epoch 0: 14%|█▍ | 1781/12384 [3:47:32<23:02:08, 7.82s/it, loss=0.0003, acc=0.9996, iter_time=7.17s]
Epoch 0: 14%|█▍ | 1782/12384 [3:47:32<23:00:41, 7.81s/it, loss=0.0003, acc=0.9996, iter_time=7.17s]
Epoch 0: 14%|█▍ | 1782/12384 [3:47:40<23:00:41, 7.81s/it, loss=0.0002, acc=0.9990, iter_time=8.58s]
Epoch 0: 14%|█▍ | 1783/12384 [3:47:40<23:04:46, 7.84s/it, loss=0.0002, acc=0.9990, iter_time=8.58s]
Epoch 0: 14%|█▍ | 1783/12384 [3:47:47<23:04:46, 7.84s/it, loss=0.0015, acc=0.9984, iter_time=7.61s]
Epoch 0: 14%|█▍ | 1784/12384 [3:47:47<22:55:30, 7.79s/it, loss=0.0015, acc=0.9984, iter_time=7.61s]
Epoch 0: 14%|█▍ | 1784/12384 [3:47:55<22:55:30, 7.79s/it, loss=0.0077, acc=0.9807, iter_time=7.64s]
Epoch 0: 14%|█▍ | 1785/12384 [3:47:55<22:46:32, 7.74s/it, loss=0.0077, acc=0.9807, iter_time=7.64s]
Epoch 0: 14%|█▍ | 1785/12384 [3:48:03<22:46:32, 7.74s/it, loss=0.0001, acc=1.0000, iter_time=6.46s]
Epoch 0: 14%|█▍ | 1786/12384 [3:48:03<22:41:12, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=6.46s]
Epoch 0: 14%|█▍ | 1786/12384 [3:48:10<22:41:12, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=5.22s]
Epoch 0: 14%|█▍ | 1787/12384 [3:48:10<22:38:02, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=5.22s]
Epoch 0: 14%|█▍ | 1787/12384 [3:48:18<22:38:02, 7.69s/it, loss=0.0005, acc=0.9996, iter_time=10.07s]
Epoch 0: 14%|█▍ | 1788/12384 [3:48:18<22:35:55, 7.68s/it, loss=0.0005, acc=0.9996, iter_time=10.07s]
Epoch 0: 14%|█▍ | 1788/12384 [3:48:26<22:35:55, 7.68s/it, loss=0.0015, acc=0.9947, iter_time=8.82s]
Epoch 0: 14%|█▍ | 1789/12384 [3:48:26<22:31:41, 7.65s/it, loss=0.0015, acc=0.9947, iter_time=8.82s]
Epoch 0: 14%|█▍ | 1789/12384 [3:48:33<22:31:41, 7.65s/it, loss=0.0004, acc=1.0000, iter_time=7.62s]
Epoch 0: 14%|█▍ | 1790/12384 [3:48:33<22:30:12, 7.65s/it, loss=0.0004, acc=1.0000, iter_time=7.62s]
Epoch 0: 14%|█▍ | 1790/12384 [3:48:41<22:30:12, 7.65s/it, loss=0.0006, acc=0.9992, iter_time=7.64s]
Epoch 0: 14%|█▍ | 1791/12384 [3:48:41<22:29:33, 7.64s/it, loss=0.0006, acc=0.9992, iter_time=7.64s]
Epoch 0: 14%|█▍ | 1791/12384 [3:48:48<22:29:33, 7.64s/it, loss=0.0028, acc=0.9943, iter_time=8.02s]
Epoch 0: 14%|█▍ | 1792/12384 [3:48:48<22:33:12, 7.67s/it, loss=0.0028, acc=0.9943, iter_time=8.02s]
Epoch 0: 14%|█▍ | 1792/12384 [3:48:56<22:33:12, 7.67s/it, loss=0.0006, acc=0.9999, iter_time=7.32s]
Epoch 0: 14%|█▍ | 1793/12384 [3:48:56<22:30:13, 7.65s/it, loss=0.0006, acc=0.9999, iter_time=7.32s]
Epoch 0: 14%|█▍ | 1793/12384 [3:49:04<22:30:13, 7.65s/it, loss=0.0009, acc=0.9980, iter_time=5.63s]
Epoch 0: 14%|█▍ | 1794/12384 [3:49:04<22:31:36, 7.66s/it, loss=0.0009, acc=0.9980, iter_time=5.63s]
Epoch 0: 14%|█▍ | 1794/12384 [3:49:12<22:31:36, 7.66s/it, loss=0.0004, acc=0.9986, iter_time=9.79s]
Epoch 0: 14%|█▍ | 1795/12384 [3:49:12<22:35:26, 7.68s/it, loss=0.0004, acc=0.9986, iter_time=9.79s]
Epoch 0: 14%|█▍ | 1795/12384 [3:49:19<22:35:26, 7.68s/it, loss=0.0036, acc=0.9935, iter_time=7.61s]
Epoch 0: 15%|█▍ | 1796/12384 [3:49:19<22:31:52, 7.66s/it, loss=0.0036, acc=0.9935, iter_time=7.61s]
Epoch 0: 15%|█▍ | 1796/12384 [3:49:27<22:31:52, 7.66s/it, loss=0.0019, acc=0.9972, iter_time=6.20s]
Epoch 0: 15%|█▍ | 1797/12384 [3:49:27<22:52:26, 7.78s/it, loss=0.0019, acc=0.9972, iter_time=6.20s]
Epoch 0: 15%|█▍ | 1797/12384 [3:49:35<22:52:26, 7.78s/it, loss=0.0027, acc=0.9931, iter_time=7.16s]
Epoch 0: 15%|█▍ | 1798/12384 [3:49:35<22:45:24, 7.74s/it, loss=0.0027, acc=0.9931, iter_time=7.16s]
Epoch 0: 15%|█▍ | 1798/12384 [3:49:42<22:45:24, 7.74s/it, loss=0.0003, acc=1.0000, iter_time=8.44s]
Epoch 0: 15%|█▍ | 1799/12384 [3:49:42<22:39:07, 7.70s/it, loss=0.0003, acc=1.0000, iter_time=8.44s]
Epoch 0: 15%|█▍ | 1799/12384 [3:49:50<22:39:07, 7.70s/it, loss=0.0003, acc=1.0000, iter_time=9.64s]
Epoch 0: 15%|█▍ | 1800/12384 [3:49:50<22:40:22, 7.71s/it, loss=0.0003, acc=1.0000, iter_time=9.64s]
Epoch 0: 15%|█▍ | 1800/12384 [3:49:58<22:40:22, 7.71s/it, loss=0.0003, acc=0.9998, iter_time=7.23s]
Epoch 0: 15%|█▍ | 1801/12384 [3:49:58<22:41:26, 7.72s/it, loss=0.0003, acc=0.9998, iter_time=7.23s]
Epoch 0: 15%|█▍ | 1801/12384 [3:50:06<22:41:26, 7.72s/it, loss=0.0002, acc=0.9978, iter_time=6.78s]
Epoch 0: 15%|█▍ | 1802/12384 [3:50:06<22:36:15, 7.69s/it, loss=0.0002, acc=0.9978, iter_time=6.78s]
Epoch 0: 15%|█▍ | 1802/12384 [3:50:13<22:36:15, 7.69s/it, loss=0.0006, acc=0.9969, iter_time=7.07s]
Epoch 0: 15%|█▍ | 1803/12384 [3:50:13<22:35:02, 7.68s/it, loss=0.0006, acc=0.9969, iter_time=7.07s]
Epoch 0: 15%|█▍ | 1803/12384 [3:50:21<22:35:02, 7.68s/it, loss=0.0010, acc=0.9975, iter_time=9.16s]
Epoch 0: 15%|█▍ | 1804/12384 [3:50:21<22:33:40, 7.68s/it, loss=0.0010, acc=0.9975, iter_time=9.16s]
Epoch 0: 15%|█▍ | 1804/12384 [3:50:28<22:33:40, 7.68s/it, loss=0.0005, acc=0.9983, iter_time=7.37s]
Epoch 0: 15%|█▍ | 1805/12384 [3:50:28<22:30:29, 7.66s/it, loss=0.0005, acc=0.9983, iter_time=7.37s]
Epoch 0: 15%|█▍ | 1805/12384 [3:50:36<22:30:29, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 15%|█▍ | 1806/12384 [3:50:36<22:30:26, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 15%|█▍ | 1806/12384 [3:50:44<22:30:26, 7.66s/it, loss=0.0006, acc=0.9973, iter_time=8.08s]
Epoch 0: 15%|█▍ | 1807/12384 [3:50:44<22:36:42, 7.70s/it, loss=0.0006, acc=0.9973, iter_time=8.08s]
Epoch 0: 15%|█▍ | 1807/12384 [3:50:52<22:36:42, 7.70s/it, loss=0.0022, acc=0.9913, iter_time=8.05s]
Epoch 0: 15%|█▍ | 1808/12384 [3:50:52<22:33:57, 7.68s/it, loss=0.0022, acc=0.9913, iter_time=8.05s]
Epoch 0: 15%|█▍ | 1808/12384 [3:50:59<22:33:57, 7.68s/it, loss=0.0011, acc=0.9975, iter_time=7.30s]
Epoch 0: 15%|█▍ | 1809/12384 [3:50:59<22:32:59, 7.68s/it, loss=0.0011, acc=0.9975, iter_time=7.30s]
Epoch 0: 15%|█▍ | 1809/12384 [3:51:07<22:32:59, 7.68s/it, loss=0.0002, acc=0.9998, iter_time=7.61s]
Epoch 0: 15%|█▍ | 1810/12384 [3:51:07<22:29:42, 7.66s/it, loss=0.0002, acc=0.9998, iter_time=7.61s]
Epoch 0: 15%|█▍ | 1810/12384 [3:51:14<22:29:42, 7.66s/it, loss=0.0033, acc=0.9906, iter_time=7.63s]
Epoch 0: 15%|█▍ | 1811/12384 [3:51:14<22:28:04, 7.65s/it, loss=0.0033, acc=0.9906, iter_time=7.63s]
Epoch 0: 15%|█▍ | 1811/12384 [3:51:22<22:28:04, 7.65s/it, loss=0.0009, acc=0.9976, iter_time=7.66s]
Epoch 0: 15%|█▍ | 1812/12384 [3:51:22<22:27:44, 7.65s/it, loss=0.0009, acc=0.9976, iter_time=7.66s]
Epoch 0: 15%|█▍ | 1812/12384 [3:51:30<22:27:44, 7.65s/it, loss=0.0002, acc=0.9999, iter_time=7.63s]
Epoch 0: 15%|█▍ | 1813/12384 [3:51:30<22:27:28, 7.65s/it, loss=0.0002, acc=0.9999, iter_time=7.63s]
Epoch 0: 15%|█▍ | 1813/12384 [3:51:37<22:27:28, 7.65s/it, loss=0.0015, acc=1.0000, iter_time=7.62s]
Epoch 0: 15%|█▍ | 1814/12384 [3:51:37<22:25:19, 7.64s/it, loss=0.0015, acc=1.0000, iter_time=7.62s]
Epoch 0: 15%|█▍ | 1814/12384 [3:51:45<22:25:19, 7.64s/it, loss=0.0005, acc=0.9999, iter_time=7.72s]
Epoch 0: 15%|█▍ | 1815/12384 [3:51:45<22:33:20, 7.68s/it, loss=0.0005, acc=0.9999, iter_time=7.72s]
Epoch 0: 15%|█▍ | 1815/12384 [3:51:53<22:33:20, 7.68s/it, loss=0.0013, acc=0.9975, iter_time=8.07s]
Epoch 0: 15%|█▍ | 1816/12384 [3:51:53<22:29:58, 7.66s/it, loss=0.0013, acc=0.9975, iter_time=8.07s]
Epoch 0: 15%|█▍ | 1816/12384 [3:52:00<22:29:58, 7.66s/it, loss=0.0018, acc=0.9935, iter_time=7.23s]
Epoch 0: 15%|█▍ | 1817/12384 [3:52:00<22:27:13, 7.65s/it, loss=0.0018, acc=0.9935, iter_time=7.23s]
Epoch 0: 15%|█▍ | 1817/12384 [3:52:08<22:27:13, 7.65s/it, loss=0.0002, acc=0.9998, iter_time=7.63s]
Epoch 0: 15%|█▍ | 1818/12384 [3:52:08<22:26:06, 7.64s/it, loss=0.0002, acc=0.9998, iter_time=7.63s]
Epoch 0: 15%|█▍ | 1818/12384 [3:52:16<22:26:06, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.39s]
Epoch 0: 15%|█▍ | 1819/12384 [3:52:16<22:24:22, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.39s]
Epoch 0: 15%|█▍ | 1819/12384 [3:52:23<22:24:22, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.86s]
Epoch 0: 15%|█▍ | 1820/12384 [3:52:23<22:23:22, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.86s]
Epoch 0: 15%|█▍ | 1820/12384 [3:52:31<22:23:22, 7.63s/it, loss=0.0008, acc=0.9997, iter_time=7.63s]
Epoch 0: 15%|█▍ | 1821/12384 [3:52:31<22:25:28, 7.64s/it, loss=0.0008, acc=0.9997, iter_time=7.63s]
Epoch 0: 15%|█▍ | 1821/12384 [3:52:39<22:25:28, 7.64s/it, loss=0.0005, acc=0.9979, iter_time=7.67s]
Epoch 0: 15%|█▍ | 1822/12384 [3:52:39<22:25:30, 7.64s/it, loss=0.0005, acc=0.9979, iter_time=7.67s]
Epoch 0: 15%|█▍ | 1822/12384 [3:52:47<22:25:30, 7.64s/it, loss=0.0032, acc=0.9905, iter_time=7.32s]
Epoch 0: 15%|█▍ | 1823/12384 [3:52:47<22:45:21, 7.76s/it, loss=0.0032, acc=0.9905, iter_time=7.32s]
Epoch 0: 15%|█▍ | 1823/12384 [3:52:54<22:45:21, 7.76s/it, loss=0.0001, acc=1.0000, iter_time=8.71s]
Epoch 0: 15%|█▍ | 1824/12384 [3:52:54<22:42:28, 7.74s/it, loss=0.0001, acc=1.0000, iter_time=8.71s]
Epoch 0: 15%|█▍ | 1824/12384 [3:53:02<22:42:28, 7.74s/it, loss=0.0006, acc=0.9988, iter_time=7.32s]
Epoch 0: 15%|█▍ | 1825/12384 [3:53:02<22:36:33, 7.71s/it, loss=0.0006, acc=0.9988, iter_time=7.32s]
Epoch 0: 15%|█▍ | 1825/12384 [3:53:10<22:36:33, 7.71s/it, loss=0.0020, acc=0.9928, iter_time=7.64s]
Epoch 0: 15%|█▍ | 1826/12384 [3:53:10<22:31:40, 7.68s/it, loss=0.0020, acc=0.9928, iter_time=7.64s]
Epoch 0: 15%|█▍ | 1826/12384 [3:53:17<22:31:40, 7.68s/it, loss=0.0028, acc=0.9947, iter_time=7.61s]
Epoch 0: 15%|█▍ | 1827/12384 [3:53:17<22:29:02, 7.67s/it, loss=0.0028, acc=0.9947, iter_time=7.61s]
Epoch 0: 15%|█▍ | 1827/12384 [3:53:25<22:29:02, 7.67s/it, loss=0.0008, acc=0.9974, iter_time=5.63s]
Epoch 0: 15%|█▍ | 1828/12384 [3:53:25<22:31:10, 7.68s/it, loss=0.0008, acc=0.9974, iter_time=5.63s]
Epoch 0: 15%|█▍ | 1828/12384 [3:53:33<22:31:10, 7.68s/it, loss=0.0004, acc=0.9997, iter_time=9.71s]
Epoch 0: 15%|█▍ | 1829/12384 [3:53:33<22:28:01, 7.66s/it, loss=0.0004, acc=0.9997, iter_time=9.71s]
Epoch 0: 15%|█▍ | 1829/12384 [3:53:40<22:28:01, 7.66s/it, loss=0.0006, acc=1.0000, iter_time=6.44s]
Epoch 0: 15%|█▍ | 1830/12384 [3:53:40<22:27:40, 7.66s/it, loss=0.0006, acc=1.0000, iter_time=6.44s]
Epoch 0: 15%|█▍ | 1830/12384 [3:53:48<22:27:40, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=8.96s]
Epoch 0: 15%|█▍ | 1831/12384 [3:53:48<22:30:49, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=8.96s]
Epoch 0: 15%|█▍ | 1831/12384 [3:53:56<22:30:49, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=7.57s]
Epoch 0: 15%|█▍ | 1832/12384 [3:53:56<22:27:57, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.57s]
Epoch 0: 15%|█▍ | 1832/12384 [3:54:03<22:27:57, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=6.47s]
Epoch 0: 15%|█▍ | 1833/12384 [3:54:03<22:26:22, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=6.47s]
Epoch 0: 15%|█▍ | 1833/12384 [3:54:11<22:26:22, 7.66s/it, loss=0.0003, acc=0.9999, iter_time=8.85s]
Epoch 0: 15%|█▍ | 1834/12384 [3:54:11<22:24:13, 7.64s/it, loss=0.0003, acc=0.9999, iter_time=8.85s]
Epoch 0: 15%|█▍ | 1834/12384 [3:54:18<22:24:13, 7.64s/it, loss=0.0005, acc=0.9994, iter_time=6.38s]
Epoch 0: 15%|█▍ | 1835/12384 [3:54:18<22:23:38, 7.64s/it, loss=0.0005, acc=0.9994, iter_time=6.38s]
Epoch 0: 15%|█▍ | 1835/12384 [3:54:26<22:23:38, 7.64s/it, loss=0.0016, acc=0.9992, iter_time=8.55s]
Epoch 0: 15%|█▍ | 1836/12384 [3:54:26<22:19:57, 7.62s/it, loss=0.0016, acc=0.9992, iter_time=8.55s]
Epoch 0: 15%|█▍ | 1836/12384 [3:54:34<22:19:57, 7.62s/it, loss=0.0005, acc=1.0000, iter_time=7.97s]
Epoch 0: 15%|█▍ | 1837/12384 [3:54:34<22:23:53, 7.65s/it, loss=0.0005, acc=1.0000, iter_time=7.97s]
Epoch 0: 15%|█▍ | 1837/12384 [3:54:41<22:23:53, 7.65s/it, loss=0.0013, acc=0.9972, iter_time=7.60s]
Epoch 0: 15%|█▍ | 1838/12384 [3:54:41<22:22:03, 7.64s/it, loss=0.0013, acc=0.9972, iter_time=7.60s]
Epoch 0: 15%|█▍ | 1838/12384 [3:54:49<22:22:03, 7.64s/it, loss=0.0014, acc=0.9968, iter_time=5.35s]
Epoch 0: 15%|█▍ | 1839/12384 [3:54:49<22:20:34, 7.63s/it, loss=0.0014, acc=0.9968, iter_time=5.35s]
Epoch 0: 15%|█▍ | 1839/12384 [3:54:57<22:20:34, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=9.87s]
Epoch 0: 15%|█▍ | 1840/12384 [3:54:57<22:21:24, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=9.87s]
Epoch 0: 15%|█▍ | 1840/12384 [3:55:04<22:21:24, 7.63s/it, loss=0.0005, acc=0.9995, iter_time=6.70s]
Epoch 0: 15%|█▍ | 1841/12384 [3:55:04<22:21:49, 7.64s/it, loss=0.0005, acc=0.9995, iter_time=6.70s]
Epoch 0: 15%|█▍ | 1841/12384 [3:55:12<22:21:49, 7.64s/it, loss=0.0005, acc=0.9996, iter_time=8.60s]
Epoch 0: 15%|█▍ | 1842/12384 [3:55:12<22:19:42, 7.62s/it, loss=0.0005, acc=0.9996, iter_time=8.60s]
Epoch 0: 15%|█▍ | 1842/12384 [3:55:19<22:19:42, 7.62s/it, loss=0.0021, acc=0.9944, iter_time=5.26s]
Epoch 0: 15%|█▍ | 1843/12384 [3:55:19<22:20:46, 7.63s/it, loss=0.0021, acc=0.9944, iter_time=5.26s]
Epoch 0: 15%|█▍ | 1843/12384 [3:55:27<22:20:46, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.13s]
Epoch 0: 15%|█▍ | 1844/12384 [3:55:27<22:21:45, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.13s]
Epoch 0: 15%|█▍ | 1844/12384 [3:55:35<22:21:45, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=8.42s]
Epoch 0: 15%|█▍ | 1845/12384 [3:55:35<22:20:19, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=8.42s]
Epoch 0: 15%|█▍ | 1845/12384 [3:55:44<22:20:19, 7.63s/it, loss=0.0006, acc=0.9985, iter_time=7.97s]
Epoch 0: 15%|█▍ | 1846/12384 [3:55:44<23:25:11, 8.00s/it, loss=0.0006, acc=0.9985, iter_time=7.97s]
Epoch 0: 15%|█▍ | 1846/12384 [3:55:51<23:25:11, 8.00s/it, loss=0.0019, acc=0.9927, iter_time=10.60s]
Epoch 0: 15%|█▍ | 1847/12384 [3:55:51<23:06:42, 7.90s/it, loss=0.0019, acc=0.9927, iter_time=10.60s]
Epoch 0: 15%|█▍ | 1847/12384 [3:55:59<23:06:42, 7.90s/it, loss=0.0001, acc=1.0000, iter_time=8.58s]
Epoch 0: 15%|█▍ | 1848/12384 [3:55:59<23:18:52, 7.97s/it, loss=0.0001, acc=1.0000, iter_time=8.58s]
Epoch 0: 15%|█▍ | 1848/12384 [3:56:07<23:18:52, 7.97s/it, loss=0.0002, acc=1.0000, iter_time=7.57s]
Epoch 0: 15%|█▍ | 1849/12384 [3:56:07<23:24:22, 8.00s/it, loss=0.0002, acc=1.0000, iter_time=7.57s]
Epoch 0: 15%|█▍ | 1849/12384 [3:56:15<23:24:22, 8.00s/it, loss=0.0013, acc=0.9980, iter_time=8.12s]
Epoch 0: 15%|█▍ | 1850/12384 [3:56:15<23:04:17, 7.88s/it, loss=0.0013, acc=0.9980, iter_time=8.12s]
Epoch 0: 15%|█▍ | 1850/12384 [3:56:23<23:04:17, 7.88s/it, loss=0.0005, acc=0.9987, iter_time=7.22s]
Epoch 0: 15%|█▍ | 1851/12384 [3:56:23<22:50:11, 7.81s/it, loss=0.0005, acc=0.9987, iter_time=7.22s]
Epoch 0: 15%|█▍ | 1851/12384 [3:56:30<22:50:11, 7.81s/it, loss=0.0088, acc=0.9897, iter_time=7.70s]
Epoch 0: 15%|█▍ | 1852/12384 [3:56:30<22:43:38, 7.77s/it, loss=0.0088, acc=0.9897, iter_time=7.70s]
Epoch 0: 15%|█▍ | 1852/12384 [3:56:38<22:43:38, 7.77s/it, loss=0.0016, acc=0.9961, iter_time=7.72s]
Epoch 0: 15%|█▍ | 1853/12384 [3:56:38<22:41:01, 7.75s/it, loss=0.0016, acc=0.9961, iter_time=7.72s]
Epoch 0: 15%|█▍ | 1853/12384 [3:56:46<22:41:01, 7.75s/it, loss=0.0006, acc=0.9979, iter_time=7.71s]
Epoch 0: 15%|█▍ | 1854/12384 [3:56:46<22:38:31, 7.74s/it, loss=0.0006, acc=0.9979, iter_time=7.71s]
Epoch 0: 15%|█▍ | 1854/12384 [3:56:53<22:38:31, 7.74s/it, loss=0.0009, acc=0.9983, iter_time=5.69s]
Epoch 0: 15%|█▍ | 1855/12384 [3:56:53<22:32:16, 7.71s/it, loss=0.0009, acc=0.9983, iter_time=5.69s]
Epoch 0: 15%|█▍ | 1855/12384 [3:57:01<22:32:16, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=9.47s]
Epoch 0: 15%|█▍ | 1856/12384 [3:57:01<22:26:12, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=9.47s]
Epoch 0: 15%|█▍ | 1856/12384 [3:57:09<22:26:12, 7.67s/it, loss=0.0005, acc=0.9979, iter_time=7.65s]
Epoch 0: 15%|█▍ | 1857/12384 [3:57:09<22:23:42, 7.66s/it, loss=0.0005, acc=0.9979, iter_time=7.65s]
Epoch 0: 15%|█▍ | 1857/12384 [3:57:16<22:23:42, 7.66s/it, loss=0.0003, acc=0.9993, iter_time=5.30s]
Epoch 0: 15%|█▌ | 1858/12384 [3:57:16<22:22:01, 7.65s/it, loss=0.0003, acc=0.9993, iter_time=5.30s]
Epoch 0: 15%|█▌ | 1858/12384 [3:57:24<22:22:01, 7.65s/it, loss=0.0005, acc=0.9974, iter_time=9.66s]
Epoch 0: 15%|█▌ | 1859/12384 [3:57:24<22:20:52, 7.64s/it, loss=0.0005, acc=0.9974, iter_time=9.66s]
Epoch 0: 15%|█▌ | 1859/12384 [3:57:32<22:20:52, 7.64s/it, loss=0.0010, acc=0.9964, iter_time=7.62s]
Epoch 0: 15%|█▌ | 1860/12384 [3:57:32<22:18:57, 7.63s/it, loss=0.0010, acc=0.9964, iter_time=7.62s]
Epoch 0: 15%|█▌ | 1860/12384 [3:57:39<22:18:57, 7.63s/it, loss=0.0005, acc=0.9997, iter_time=6.70s]
Epoch 0: 15%|█▌ | 1861/12384 [3:57:39<22:18:08, 7.63s/it, loss=0.0005, acc=0.9997, iter_time=6.70s]
Epoch 0: 15%|█▌ | 1861/12384 [3:57:47<22:18:08, 7.63s/it, loss=0.0065, acc=0.9889, iter_time=8.84s]
Epoch 0: 15%|█▌ | 1862/12384 [3:57:47<22:17:40, 7.63s/it, loss=0.0065, acc=0.9889, iter_time=8.84s]
Epoch 0: 15%|█▌ | 1862/12384 [3:57:54<22:17:40, 7.63s/it, loss=0.0028, acc=0.9897, iter_time=7.04s]
Epoch 0: 15%|█▌ | 1863/12384 [3:57:54<22:17:08, 7.63s/it, loss=0.0028, acc=0.9897, iter_time=7.04s]
Epoch 0: 15%|█▌ | 1863/12384 [3:58:02<22:17:08, 7.63s/it, loss=0.0004, acc=0.9998, iter_time=8.16s]
Epoch 0: 15%|█▌ | 1864/12384 [3:58:02<22:16:13, 7.62s/it, loss=0.0004, acc=0.9998, iter_time=8.16s]
Epoch 0: 15%|█▌ | 1864/12384 [3:58:10<22:16:13, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=7.76s]
Epoch 0: 15%|█▌ | 1865/12384 [3:58:10<22:20:10, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=7.76s]
Epoch 0: 15%|█▌ | 1865/12384 [3:58:17<22:20:10, 7.64s/it, loss=0.0011, acc=0.9965, iter_time=7.68s]
Epoch 0: 15%|█▌ | 1866/12384 [3:58:17<22:21:24, 7.65s/it, loss=0.0011, acc=0.9965, iter_time=7.68s]
Epoch 0: 15%|█▌ | 1866/12384 [3:58:25<22:21:24, 7.65s/it, loss=0.0008, acc=0.9974, iter_time=7.72s]
Epoch 0: 15%|█▌ | 1867/12384 [3:58:25<22:24:40, 7.67s/it, loss=0.0008, acc=0.9974, iter_time=7.72s]
Epoch 0: 15%|█▌ | 1867/12384 [3:58:33<22:24:40, 7.67s/it, loss=0.0056, acc=0.9869, iter_time=4.66s]
Epoch 0: 15%|█▌ | 1868/12384 [3:58:33<22:24:17, 7.67s/it, loss=0.0056, acc=0.9869, iter_time=4.66s]
Epoch 0: 15%|█▌ | 1868/12384 [3:58:41<22:24:17, 7.67s/it, loss=0.0013, acc=0.9977, iter_time=10.81s]
Epoch 0: 15%|█▌ | 1869/12384 [3:58:41<22:31:24, 7.71s/it, loss=0.0013, acc=0.9977, iter_time=10.81s]
Epoch 0: 15%|█▌ | 1869/12384 [3:58:48<22:31:24, 7.71s/it, loss=0.0009, acc=0.9983, iter_time=7.69s]
Epoch 0: 15%|█▌ | 1870/12384 [3:58:48<22:33:55, 7.73s/it, loss=0.0009, acc=0.9983, iter_time=7.69s]
Epoch 0: 15%|█▌ | 1870/12384 [3:58:56<22:33:55, 7.73s/it, loss=0.0006, acc=0.9995, iter_time=6.27s]
Epoch 0: 15%|█▌ | 1871/12384 [3:58:56<22:27:42, 7.69s/it, loss=0.0006, acc=0.9995, iter_time=6.27s]
Epoch 0: 15%|█▌ | 1871/12384 [3:59:04<22:27:42, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=9.53s]
Epoch 0: 15%|█▌ | 1872/12384 [3:59:04<22:29:30, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=9.53s]
Epoch 0: 15%|█▌ | 1872/12384 [3:59:11<22:29:30, 7.70s/it, loss=0.0003, acc=0.9987, iter_time=4.37s]
Epoch 0: 15%|█▌ | 1873/12384 [3:59:11<22:27:31, 7.69s/it, loss=0.0003, acc=0.9987, iter_time=4.37s]
Epoch 0: 15%|█▌ | 1873/12384 [3:59:19<22:27:31, 7.69s/it, loss=0.0008, acc=0.9980, iter_time=10.50s]
Epoch 0: 15%|█▌ | 1874/12384 [3:59:19<22:24:08, 7.67s/it, loss=0.0008, acc=0.9980, iter_time=10.50s]
Epoch 0: 15%|█▌ | 1874/12384 [3:59:27<22:24:08, 7.67s/it, loss=0.0005, acc=0.9998, iter_time=7.75s]
Epoch 0: 15%|█▌ | 1875/12384 [3:59:27<22:41:02, 7.77s/it, loss=0.0005, acc=0.9998, iter_time=7.75s]
Epoch 0: 15%|█▌ | 1875/12384 [3:59:35<22:41:02, 7.77s/it, loss=0.0013, acc=0.9948, iter_time=8.00s]
Epoch 0: 15%|█▌ | 1876/12384 [3:59:35<22:38:26, 7.76s/it, loss=0.0013, acc=0.9948, iter_time=8.00s]
Epoch 0: 15%|█▌ | 1876/12384 [3:59:42<22:38:26, 7.76s/it, loss=0.0009, acc=0.9979, iter_time=7.61s]
Epoch 0: 15%|█▌ | 1877/12384 [3:59:42<22:30:41, 7.71s/it, loss=0.0009, acc=0.9979, iter_time=7.61s]
Epoch 0: 15%|█▌ | 1877/12384 [3:59:50<22:30:41, 7.71s/it, loss=0.0002, acc=1.0000, iter_time=6.42s]
Epoch 0: 15%|█▌ | 1878/12384 [3:59:50<22:29:09, 7.71s/it, loss=0.0002, acc=1.0000, iter_time=6.42s]
Epoch 0: 15%|█▌ | 1878/12384 [3:59:58<22:29:09, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=8.87s]
Epoch 0: 15%|█▌ | 1879/12384 [3:59:58<22:26:05, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=8.87s]
Epoch 0: 15%|█▌ | 1879/12384 [4:00:05<22:26:05, 7.69s/it, loss=0.0003, acc=1.0000, iter_time=8.03s]
Epoch 0: 15%|█▌ | 1880/12384 [4:00:05<22:22:04, 7.67s/it, loss=0.0003, acc=1.0000, iter_time=8.03s]
Epoch 0: 15%|█▌ | 1880/12384 [4:00:13<22:22:04, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=7.22s]
Epoch 0: 15%|█▌ | 1881/12384 [4:00:13<22:19:20, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.22s]
Epoch 0: 15%|█▌ | 1881/12384 [4:00:20<22:19:20, 7.65s/it, loss=0.0010, acc=0.9985, iter_time=6.42s]
Epoch 0: 15%|█▌ | 1882/12384 [4:00:20<22:17:42, 7.64s/it, loss=0.0010, acc=0.9985, iter_time=6.42s]
Epoch 0: 15%|█▌ | 1882/12384 [4:00:28<22:17:42, 7.64s/it, loss=0.0019, acc=0.9958, iter_time=8.83s]
Epoch 0: 15%|█▌ | 1883/12384 [4:00:28<22:17:15, 7.64s/it, loss=0.0019, acc=0.9958, iter_time=8.83s]
Epoch 0: 15%|█▌ | 1883/12384 [4:00:36<22:17:15, 7.64s/it, loss=0.0006, acc=0.9999, iter_time=7.64s]
Epoch 0: 15%|█▌ | 1884/12384 [4:00:36<22:15:04, 7.63s/it, loss=0.0006, acc=0.9999, iter_time=7.64s]
Epoch 0: 15%|█▌ | 1884/12384 [4:00:43<22:15:04, 7.63s/it, loss=0.0012, acc=0.9973, iter_time=7.59s]
Epoch 0: 15%|█▌ | 1885/12384 [4:00:43<22:14:50, 7.63s/it, loss=0.0012, acc=0.9973, iter_time=7.59s]
Epoch 0: 15%|█▌ | 1885/12384 [4:00:51<22:14:50, 7.63s/it, loss=0.0010, acc=0.9984, iter_time=7.63s]
Epoch 0: 15%|█▌ | 1886/12384 [4:00:51<22:17:48, 7.65s/it, loss=0.0010, acc=0.9984, iter_time=7.63s]
Epoch 0: 15%|█▌ | 1886/12384 [4:00:59<22:17:48, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.80s]
Epoch 0: 15%|█▌ | 1887/12384 [4:00:59<22:26:22, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.80s]
Epoch 0: 15%|█▌ | 1887/12384 [4:01:06<22:26:22, 7.70s/it, loss=0.0003, acc=1.0000, iter_time=8.08s]
Epoch 0: 15%|█▌ | 1888/12384 [4:01:06<22:22:04, 7.67s/it, loss=0.0003, acc=1.0000, iter_time=8.08s]
Epoch 0: 15%|█▌ | 1888/12384 [4:01:14<22:22:04, 7.67s/it, loss=0.0005, acc=0.9999, iter_time=6.92s]
Epoch 0: 15%|█▌ | 1889/12384 [4:01:14<22:21:10, 7.67s/it, loss=0.0005, acc=0.9999, iter_time=6.92s]
Epoch 0: 15%|█▌ | 1889/12384 [4:01:22<22:21:10, 7.67s/it, loss=0.0008, acc=0.9991, iter_time=7.99s]
Epoch 0: 15%|█▌ | 1890/12384 [4:01:22<22:18:31, 7.65s/it, loss=0.0008, acc=0.9991, iter_time=7.99s]
Epoch 0: 15%|█▌ | 1890/12384 [4:01:29<22:18:31, 7.65s/it, loss=0.0002, acc=0.9993, iter_time=6.49s]
Epoch 0: 15%|█▌ | 1891/12384 [4:01:29<22:15:38, 7.64s/it, loss=0.0002, acc=0.9993, iter_time=6.49s]
Epoch 0: 15%|█▌ | 1891/12384 [4:01:37<22:15:38, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.69s]
Epoch 0: 15%|█▌ | 1892/12384 [4:01:37<22:15:05, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.69s]
Epoch 0: 15%|█▌ | 1892/12384 [4:01:45<22:15:05, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=6.74s]
Epoch 0: 15%|█▌ | 1893/12384 [4:01:45<22:22:16, 7.68s/it, loss=0.0003, acc=1.0000, iter_time=6.74s]
Epoch 0: 15%|█▌ | 1893/12384 [4:01:52<22:22:16, 7.68s/it, loss=0.0003, acc=0.9998, iter_time=10.67s]
Epoch 0: 15%|█▌ | 1894/12384 [4:01:52<22:18:47, 7.66s/it, loss=0.0003, acc=0.9998, iter_time=10.67s]
Epoch 0: 15%|█▌ | 1894/12384 [4:02:00<22:18:47, 7.66s/it, loss=0.0005, acc=0.9984, iter_time=7.63s]
Epoch 0: 15%|█▌ | 1895/12384 [4:02:00<22:17:55, 7.65s/it, loss=0.0005, acc=0.9984, iter_time=7.63s]
Epoch 0: 15%|█▌ | 1895/12384 [4:02:08<22:17:55, 7.65s/it, loss=0.0008, acc=0.9979, iter_time=8.05s]
Epoch 0: 15%|█▌ | 1896/12384 [4:02:08<22:18:01, 7.65s/it, loss=0.0008, acc=0.9979, iter_time=8.05s]
Epoch 0: 15%|█▌ | 1896/12384 [4:02:15<22:18:01, 7.65s/it, loss=0.0007, acc=0.9965, iter_time=7.25s]
Epoch 0: 15%|█▌ | 1897/12384 [4:02:15<22:17:06, 7.65s/it, loss=0.0007, acc=0.9965, iter_time=7.25s]
Epoch 0: 15%|█▌ | 1897/12384 [4:02:23<22:17:06, 7.65s/it, loss=0.0055, acc=0.9911, iter_time=4.79s]
Epoch 0: 15%|█▌ | 1898/12384 [4:02:23<22:14:52, 7.64s/it, loss=0.0055, acc=0.9911, iter_time=4.79s]
Epoch 0: 15%|█▌ | 1898/12384 [4:02:31<22:14:52, 7.64s/it, loss=0.0006, acc=1.0000, iter_time=8.96s]
Epoch 0: 15%|█▌ | 1899/12384 [4:02:31<22:16:15, 7.65s/it, loss=0.0006, acc=1.0000, iter_time=8.96s]
Epoch 0: 15%|█▌ | 1899/12384 [4:02:38<22:16:15, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=9.63s]
Epoch 0: 15%|█▌ | 1900/12384 [4:02:38<22:17:22, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=9.63s]
Epoch 0: 15%|█▌ | 1900/12384 [4:02:46<22:17:22, 7.65s/it, loss=0.0002, acc=0.9998, iter_time=7.48s]
Epoch 0: 15%|█▌ | 1901/12384 [4:02:46<22:32:45, 7.74s/it, loss=0.0002, acc=0.9998, iter_time=7.48s]
Epoch 0: 15%|█▌ | 1901/12384 [4:02:54<22:32:45, 7.74s/it, loss=0.0009, acc=0.9982, iter_time=4.90s]
Epoch 0: 15%|█▌ | 1902/12384 [4:02:54<22:27:06, 7.71s/it, loss=0.0009, acc=0.9982, iter_time=4.90s]
Epoch 0: 15%|█▌ | 1902/12384 [4:03:02<22:27:06, 7.71s/it, loss=0.0058, acc=0.9907, iter_time=10.42s]
Epoch 0: 15%|█▌ | 1903/12384 [4:03:02<22:25:23, 7.70s/it, loss=0.0058, acc=0.9907, iter_time=10.42s]
Epoch 0: 15%|█▌ | 1903/12384 [4:03:09<22:25:23, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=8.06s]
Epoch 0: 15%|█▌ | 1904/12384 [4:03:09<22:20:17, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=8.06s]
Epoch 0: 15%|█▌ | 1904/12384 [4:03:17<22:20:17, 7.67s/it, loss=0.0003, acc=1.0000, iter_time=7.20s]
Epoch 0: 15%|█▌ | 1905/12384 [4:03:17<22:14:56, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=7.20s]
Epoch 0: 15%|█▌ | 1905/12384 [4:03:24<22:14:56, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 15%|█▌ | 1906/12384 [4:03:24<22:13:10, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 15%|█▌ | 1906/12384 [4:03:32<22:13:10, 7.63s/it, loss=0.0033, acc=0.9937, iter_time=4.75s]
Epoch 0: 15%|█▌ | 1907/12384 [4:03:32<22:14:40, 7.64s/it, loss=0.0033, acc=0.9937, iter_time=4.75s]
Epoch 0: 15%|█▌ | 1907/12384 [4:03:40<22:14:40, 7.64s/it, loss=0.0009, acc=0.9985, iter_time=10.53s]
Epoch 0: 15%|█▌ | 1908/12384 [4:03:40<22:13:16, 7.64s/it, loss=0.0009, acc=0.9985, iter_time=10.53s]
Epoch 0: 15%|█▌ | 1908/12384 [4:03:47<22:13:16, 7.64s/it, loss=0.0089, acc=0.9913, iter_time=7.62s]
Epoch 0: 15%|█▌ | 1909/12384 [4:03:47<22:13:31, 7.64s/it, loss=0.0089, acc=0.9913, iter_time=7.62s]
Epoch 0: 15%|█▌ | 1909/12384 [4:03:55<22:13:31, 7.64s/it, loss=0.0002, acc=0.9995, iter_time=4.78s]
Epoch 0: 15%|█▌ | 1910/12384 [4:03:55<22:12:21, 7.63s/it, loss=0.0002, acc=0.9995, iter_time=4.78s]
Epoch 0: 15%|█▌ | 1910/12384 [4:04:03<22:12:21, 7.63s/it, loss=0.0007, acc=0.9994, iter_time=10.51s]
Epoch 0: 15%|█▌ | 1911/12384 [4:04:03<22:12:55, 7.64s/it, loss=0.0007, acc=0.9994, iter_time=10.51s]
Epoch 0: 15%|█▌ | 1911/12384 [4:04:10<22:12:55, 7.64s/it, loss=0.0006, acc=0.9993, iter_time=7.57s]
Epoch 0: 15%|█▌ | 1912/12384 [4:04:10<22:12:22, 7.63s/it, loss=0.0006, acc=0.9993, iter_time=7.57s]
Epoch 0: 15%|█▌ | 1912/12384 [4:04:18<22:12:22, 7.63s/it, loss=0.0007, acc=0.9965, iter_time=4.14s]
Epoch 0: 15%|█▌ | 1913/12384 [4:04:18<22:13:53, 7.64s/it, loss=0.0007, acc=0.9965, iter_time=4.14s]
Epoch 0: 15%|█▌ | 1913/12384 [4:04:25<22:13:53, 7.64s/it, loss=0.0011, acc=0.9995, iter_time=9.97s]
Epoch 0: 15%|█▌ | 1914/12384 [4:04:25<22:14:11, 7.65s/it, loss=0.0011, acc=0.9995, iter_time=9.97s]
Epoch 0: 15%|█▌ | 1914/12384 [4:04:33<22:14:11, 7.65s/it, loss=0.0031, acc=0.9896, iter_time=8.87s]
Epoch 0: 15%|█▌ | 1915/12384 [4:04:33<22:12:03, 7.63s/it, loss=0.0031, acc=0.9896, iter_time=8.87s]
Epoch 0: 15%|█▌ | 1915/12384 [4:04:41<22:12:03, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 15%|█▌ | 1916/12384 [4:04:41<22:15:18, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 15%|█▌ | 1916/12384 [4:04:48<22:15:18, 7.65s/it, loss=0.0006, acc=0.9999, iter_time=7.72s]
Epoch 0: 15%|█▌ | 1917/12384 [4:04:48<22:13:26, 7.64s/it, loss=0.0006, acc=0.9999, iter_time=7.72s]
Epoch 0: 15%|█▌ | 1917/12384 [4:04:56<22:13:26, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.12s]
Epoch 0: 15%|█▌ | 1918/12384 [4:04:56<22:11:57, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.12s]
Epoch 0: 15%|█▌ | 1918/12384 [4:05:04<22:11:57, 7.64s/it, loss=0.0014, acc=0.9978, iter_time=9.21s]
Epoch 0: 15%|█▌ | 1919/12384 [4:05:04<22:18:12, 7.67s/it, loss=0.0014, acc=0.9978, iter_time=9.21s]
Epoch 0: 15%|█▌ | 1919/12384 [4:05:11<22:18:12, 7.67s/it, loss=0.0009, acc=0.9955, iter_time=8.03s]
Epoch 0: 16%|█▌ | 1920/12384 [4:05:11<22:16:31, 7.66s/it, loss=0.0009, acc=0.9955, iter_time=8.03s]
Epoch 0: 16%|█▌ | 1920/12384 [4:05:19<22:16:31, 7.66s/it, loss=0.0006, acc=0.9974, iter_time=7.35s]
Epoch 0: 16%|█▌ | 1921/12384 [4:05:19<22:18:38, 7.68s/it, loss=0.0006, acc=0.9974, iter_time=7.35s]
Epoch 0: 16%|█▌ | 1921/12384 [4:05:27<22:18:38, 7.68s/it, loss=0.0004, acc=0.9984, iter_time=7.65s]
Epoch 0: 16%|█▌ | 1922/12384 [4:05:27<22:16:31, 7.67s/it, loss=0.0004, acc=0.9984, iter_time=7.65s]
Epoch 0: 16%|█▌ | 1922/12384 [4:05:34<22:16:31, 7.67s/it, loss=0.0010, acc=0.9977, iter_time=7.62s]
Epoch 0: 16%|█▌ | 1923/12384 [4:05:34<22:14:41, 7.66s/it, loss=0.0010, acc=0.9977, iter_time=7.62s]
Epoch 0: 16%|█▌ | 1923/12384 [4:05:42<22:14:41, 7.66s/it, loss=0.0015, acc=0.9953, iter_time=3.81s]
Epoch 0: 16%|█▌ | 1924/12384 [4:05:42<22:14:22, 7.65s/it, loss=0.0015, acc=0.9953, iter_time=3.81s]
Epoch 0: 16%|█▌ | 1924/12384 [4:05:50<22:14:22, 7.65s/it, loss=0.0015, acc=0.9976, iter_time=11.48s]
Epoch 0: 16%|█▌ | 1925/12384 [4:05:50<22:19:12, 7.68s/it, loss=0.0015, acc=0.9976, iter_time=11.48s]
Epoch 0: 16%|█▌ | 1925/12384 [4:05:57<22:19:12, 7.68s/it, loss=0.0018, acc=0.9983, iter_time=7.74s]
Epoch 0: 16%|█▌ | 1926/12384 [4:05:57<22:17:39, 7.67s/it, loss=0.0018, acc=0.9983, iter_time=7.74s]
Epoch 0: 16%|█▌ | 1926/12384 [4:06:05<22:17:39, 7.67s/it, loss=0.0007, acc=0.9996, iter_time=4.61s]
Epoch 0: 16%|█▌ | 1927/12384 [4:06:05<22:16:06, 7.67s/it, loss=0.0007, acc=0.9996, iter_time=4.61s]
Epoch 0: 16%|█▌ | 1927/12384 [4:06:13<22:16:06, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=11.38s]
Epoch 0: 16%|█▌ | 1928/12384 [4:06:13<22:30:39, 7.75s/it, loss=0.0002, acc=1.0000, iter_time=11.38s]
Epoch 0: 16%|█▌ | 1928/12384 [4:06:21<22:30:39, 7.75s/it, loss=0.0020, acc=0.9942, iter_time=7.23s]
Epoch 0: 16%|█▌ | 1929/12384 [4:06:21<22:23:05, 7.71s/it, loss=0.0020, acc=0.9942, iter_time=7.23s]
Epoch 0: 16%|█▌ | 1929/12384 [4:06:28<22:23:05, 7.71s/it, loss=0.0022, acc=0.9954, iter_time=7.64s]
Epoch 0: 16%|█▌ | 1930/12384 [4:06:28<22:19:33, 7.69s/it, loss=0.0022, acc=0.9954, iter_time=7.64s]
Epoch 0: 16%|█▌ | 1930/12384 [4:06:36<22:19:33, 7.69s/it, loss=0.0006, acc=0.9994, iter_time=7.63s]
Epoch 0: 16%|█▌ | 1931/12384 [4:06:36<22:17:43, 7.68s/it, loss=0.0006, acc=0.9994, iter_time=7.63s]
Epoch 0: 16%|█▌ | 1931/12384 [4:06:44<22:17:43, 7.68s/it, loss=0.0006, acc=0.9998, iter_time=7.35s]
Epoch 0: 16%|█▌ | 1932/12384 [4:06:44<22:14:33, 7.66s/it, loss=0.0006, acc=0.9998, iter_time=7.35s]
Epoch 0: 16%|█▌ | 1932/12384 [4:06:51<22:14:33, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.93s]
Epoch 0: 16%|█▌ | 1933/12384 [4:06:51<22:13:47, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.93s]
Epoch 0: 16%|█▌ | 1933/12384 [4:06:59<22:13:47, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.65s]
Epoch 0: 16%|█▌ | 1934/12384 [4:06:59<22:14:58, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.65s]
Epoch 0: 16%|█▌ | 1934/12384 [4:07:07<22:14:58, 7.66s/it, loss=0.0009, acc=0.9995, iter_time=7.07s]
Epoch 0: 16%|█▌ | 1935/12384 [4:07:07<22:13:37, 7.66s/it, loss=0.0009, acc=0.9995, iter_time=7.07s]
Epoch 0: 16%|█▌ | 1935/12384 [4:07:14<22:13:37, 7.66s/it, loss=0.0005, acc=1.0000, iter_time=8.62s]
Epoch 0: 16%|█▌ | 1936/12384 [4:07:14<22:15:40, 7.67s/it, loss=0.0005, acc=1.0000, iter_time=8.62s]
Epoch 0: 16%|█▌ | 1936/12384 [4:07:22<22:15:40, 7.67s/it, loss=0.0006, acc=0.9981, iter_time=6.11s]
Epoch 0: 16%|█▌ | 1937/12384 [4:07:22<22:11:57, 7.65s/it, loss=0.0006, acc=0.9981, iter_time=6.11s]
Epoch 0: 16%|█▌ | 1937/12384 [4:07:29<22:11:57, 7.65s/it, loss=0.0001, acc=0.9998, iter_time=7.60s]
Epoch 0: 16%|█▌ | 1938/12384 [4:07:29<22:10:10, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=7.60s]
Epoch 0: 16%|█▌ | 1938/12384 [4:07:37<22:10:10, 7.64s/it, loss=0.0016, acc=0.9985, iter_time=8.87s]
Epoch 0: 16%|█▌ | 1939/12384 [4:07:37<22:08:42, 7.63s/it, loss=0.0016, acc=0.9985, iter_time=8.87s]
Epoch 0: 16%|█▌ | 1939/12384 [4:07:45<22:08:42, 7.63s/it, loss=0.0006, acc=0.9991, iter_time=7.63s]
Epoch 0: 16%|█▌ | 1940/12384 [4:07:45<22:10:12, 7.64s/it, loss=0.0006, acc=0.9991, iter_time=7.63s]
Epoch 0: 16%|█▌ | 1940/12384 [4:07:52<22:10:12, 7.64s/it, loss=0.0003, acc=0.9998, iter_time=6.40s]
Epoch 0: 16%|█▌ | 1941/12384 [4:07:52<22:09:36, 7.64s/it, loss=0.0003, acc=0.9998, iter_time=6.40s]
Epoch 0: 16%|█▌ | 1941/12384 [4:08:00<22:09:36, 7.64s/it, loss=0.0019, acc=0.9960, iter_time=8.83s]
Epoch 0: 16%|█▌ | 1942/12384 [4:08:00<22:08:45, 7.64s/it, loss=0.0019, acc=0.9960, iter_time=8.83s]
Epoch 0: 16%|█▌ | 1942/12384 [4:08:08<22:08:45, 7.64s/it, loss=0.0012, acc=0.9983, iter_time=7.64s]
Epoch 0: 16%|█▌ | 1943/12384 [4:08:08<22:08:28, 7.63s/it, loss=0.0012, acc=0.9983, iter_time=7.64s]
Epoch 0: 16%|█▌ | 1943/12384 [4:08:15<22:08:28, 7.63s/it, loss=0.0018, acc=0.9950, iter_time=7.61s]
Epoch 0: 16%|█▌ | 1944/12384 [4:08:15<22:09:24, 7.64s/it, loss=0.0018, acc=0.9950, iter_time=7.61s]
Epoch 0: 16%|█▌ | 1944/12384 [4:08:23<22:09:24, 7.64s/it, loss=0.0006, acc=0.9975, iter_time=4.80s]
Epoch 0: 16%|█▌ | 1945/12384 [4:08:23<22:11:04, 7.65s/it, loss=0.0006, acc=0.9975, iter_time=4.80s]
Epoch 0: 16%|█▌ | 1945/12384 [4:08:31<22:11:04, 7.65s/it, loss=0.0016, acc=0.9941, iter_time=8.20s]
Epoch 0: 16%|█▌ | 1946/12384 [4:08:31<22:09:29, 7.64s/it, loss=0.0016, acc=0.9941, iter_time=8.20s]
Epoch 0: 16%|█▌ | 1946/12384 [4:08:38<22:09:29, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=9.94s]
Epoch 0: 16%|█▌ | 1947/12384 [4:08:38<22:08:00, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.94s]
Epoch 0: 16%|█▌ | 1947/12384 [4:08:46<22:08:00, 7.63s/it, loss=0.0028, acc=0.9932, iter_time=7.64s]
Epoch 0: 16%|█▌ | 1948/12384 [4:08:46<22:08:19, 7.64s/it, loss=0.0028, acc=0.9932, iter_time=7.64s]
Epoch 0: 16%|█▌ | 1948/12384 [4:08:53<22:08:19, 7.64s/it, loss=0.0011, acc=0.9975, iter_time=6.44s]
Epoch 0: 16%|█▌ | 1949/12384 [4:08:53<22:07:14, 7.63s/it, loss=0.0011, acc=0.9975, iter_time=6.44s]
Epoch 0: 16%|█▌ | 1949/12384 [4:09:01<22:07:14, 7.63s/it, loss=0.0010, acc=0.9976, iter_time=9.22s]
Epoch 0: 16%|█▌ | 1950/12384 [4:09:01<22:06:02, 7.63s/it, loss=0.0010, acc=0.9976, iter_time=9.22s]
Epoch 0: 16%|█▌ | 1950/12384 [4:09:09<22:06:02, 7.63s/it, loss=0.0012, acc=0.9975, iter_time=7.21s]
Epoch 0: 16%|█▌ | 1951/12384 [4:09:09<22:05:53, 7.63s/it, loss=0.0012, acc=0.9975, iter_time=7.21s]
Epoch 0: 16%|█▌ | 1951/12384 [4:09:16<22:05:53, 7.63s/it, loss=0.0020, acc=0.9984, iter_time=8.02s]
Epoch 0: 16%|█▌ | 1952/12384 [4:09:16<22:05:05, 7.62s/it, loss=0.0020, acc=0.9984, iter_time=8.02s]
Epoch 0: 16%|█▌ | 1952/12384 [4:09:24<22:05:05, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.23s]
Epoch 0: 16%|█▌ | 1953/12384 [4:09:24<22:10:12, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.23s]
Epoch 0: 16%|█▌ | 1953/12384 [4:09:32<22:10:12, 7.65s/it, loss=0.0006, acc=0.9966, iter_time=6.84s]
Epoch 0: 16%|█▌ | 1954/12384 [4:09:32<22:27:12, 7.75s/it, loss=0.0006, acc=0.9966, iter_time=6.84s]
Epoch 0: 16%|█▌ | 1954/12384 [4:09:40<22:27:12, 7.75s/it, loss=0.0016, acc=0.9979, iter_time=7.73s]
Epoch 0: 16%|█▌ | 1955/12384 [4:09:40<22:21:00, 7.72s/it, loss=0.0016, acc=0.9979, iter_time=7.73s]
Epoch 0: 16%|█▌ | 1955/12384 [4:09:47<22:21:00, 7.72s/it, loss=0.0001, acc=0.9998, iter_time=5.24s]
Epoch 0: 16%|█▌ | 1956/12384 [4:09:47<22:20:44, 7.71s/it, loss=0.0001, acc=0.9998, iter_time=5.24s]
Epoch 0: 16%|█▌ | 1956/12384 [4:09:55<22:20:44, 7.71s/it, loss=0.0005, acc=0.9980, iter_time=8.93s]
Epoch 0: 16%|█▌ | 1957/12384 [4:09:55<22:19:44, 7.71s/it, loss=0.0005, acc=0.9980, iter_time=8.93s]
Epoch 0: 16%|█▌ | 1957/12384 [4:10:03<22:19:44, 7.71s/it, loss=0.0009, acc=0.9999, iter_time=9.39s]
Epoch 0: 16%|█▌ | 1958/12384 [4:10:03<22:13:21, 7.67s/it, loss=0.0009, acc=0.9999, iter_time=9.39s]
Epoch 0: 16%|█▌ | 1958/12384 [4:10:10<22:13:21, 7.67s/it, loss=0.0110, acc=0.9852, iter_time=6.98s]
Epoch 0: 16%|█▌ | 1959/12384 [4:10:10<22:09:47, 7.65s/it, loss=0.0110, acc=0.9852, iter_time=6.98s]
Epoch 0: 16%|█▌ | 1959/12384 [4:10:18<22:09:47, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=8.80s]
Epoch 0: 16%|█▌ | 1960/12384 [4:10:18<22:09:09, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=8.80s]
Epoch 0: 16%|█▌ | 1960/12384 [4:10:26<22:09:09, 7.65s/it, loss=0.0004, acc=0.9988, iter_time=7.65s]
Epoch 0: 16%|█▌ | 1961/12384 [4:10:26<22:11:04, 7.66s/it, loss=0.0004, acc=0.9988, iter_time=7.65s]
Epoch 0: 16%|█▌ | 1961/12384 [4:10:33<22:11:04, 7.66s/it, loss=0.0009, acc=0.9980, iter_time=6.77s]
Epoch 0: 16%|█▌ | 1962/12384 [4:10:33<22:10:19, 7.66s/it, loss=0.0009, acc=0.9980, iter_time=6.77s]
Epoch 0: 16%|█▌ | 1962/12384 [4:10:41<22:10:19, 7.66s/it, loss=0.0237, acc=0.9555, iter_time=8.60s]
Epoch 0: 16%|█▌ | 1963/12384 [4:10:41<22:09:29, 7.65s/it, loss=0.0237, acc=0.9555, iter_time=8.60s]
Epoch 0: 16%|█▌ | 1963/12384 [4:10:49<22:09:29, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=4.85s]
Epoch 0: 16%|█▌ | 1964/12384 [4:10:49<22:09:08, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=4.85s]
Epoch 0: 16%|█▌ | 1964/12384 [4:10:56<22:09:08, 7.65s/it, loss=0.0012, acc=0.9981, iter_time=10.44s]
Epoch 0: 16%|█▌ | 1965/12384 [4:10:56<22:08:21, 7.65s/it, loss=0.0012, acc=0.9981, iter_time=10.44s]
Epoch 0: 16%|█▌ | 1965/12384 [4:11:04<22:08:21, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.70s]
Epoch 0: 16%|█▌ | 1966/12384 [4:11:04<22:12:08, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=7.70s]
Epoch 0: 16%|█▌ | 1966/12384 [4:11:12<22:12:08, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 16%|█▌ | 1967/12384 [4:11:12<22:13:45, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 16%|█▌ | 1967/12384 [4:11:19<22:13:45, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.74s]
Epoch 0: 16%|█▌ | 1968/12384 [4:11:19<22:13:45, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.74s]
Epoch 0: 16%|█▌ | 1968/12384 [4:11:27<22:13:45, 7.68s/it, loss=0.0007, acc=0.9980, iter_time=7.66s]
Epoch 0: 16%|█▌ | 1969/12384 [4:11:27<22:10:42, 7.67s/it, loss=0.0007, acc=0.9980, iter_time=7.66s]
Epoch 0: 16%|█▌ | 1969/12384 [4:11:35<22:10:42, 7.67s/it, loss=0.0019, acc=0.9948, iter_time=7.64s]
Epoch 0: 16%|█▌ | 1970/12384 [4:11:35<22:08:00, 7.65s/it, loss=0.0019, acc=0.9948, iter_time=7.64s]
Epoch 0: 16%|█▌ | 1970/12384 [4:11:42<22:08:00, 7.65s/it, loss=0.0022, acc=0.9961, iter_time=4.32s]
Epoch 0: 16%|█▌ | 1971/12384 [4:11:42<22:05:39, 7.64s/it, loss=0.0022, acc=0.9961, iter_time=4.32s]
Epoch 0: 16%|█▌ | 1971/12384 [4:11:50<22:05:39, 7.64s/it, loss=0.0010, acc=0.9983, iter_time=10.90s]
Epoch 0: 16%|█▌ | 1972/12384 [4:11:50<22:04:31, 7.63s/it, loss=0.0010, acc=0.9983, iter_time=10.90s]
Epoch 0: 16%|█▌ | 1972/12384 [4:11:57<22:04:31, 7.63s/it, loss=0.0008, acc=0.9980, iter_time=7.33s]
Epoch 0: 16%|█▌ | 1973/12384 [4:11:57<22:02:45, 7.62s/it, loss=0.0008, acc=0.9980, iter_time=7.33s]
Epoch 0: 16%|█▌ | 1973/12384 [4:12:05<22:02:45, 7.62s/it, loss=0.0005, acc=0.9998, iter_time=7.88s]
Epoch 0: 16%|█▌ | 1974/12384 [4:12:05<22:02:15, 7.62s/it, loss=0.0005, acc=0.9998, iter_time=7.88s]
Epoch 0: 16%|█▌ | 1974/12384 [4:12:13<22:02:15, 7.62s/it, loss=0.0036, acc=0.9948, iter_time=6.69s]
Epoch 0: 16%|█▌ | 1975/12384 [4:12:13<22:03:26, 7.63s/it, loss=0.0036, acc=0.9948, iter_time=6.69s]
Epoch 0: 16%|█▌ | 1975/12384 [4:12:20<22:03:26, 7.63s/it, loss=0.0004, acc=0.9984, iter_time=8.97s]
Epoch 0: 16%|█▌ | 1976/12384 [4:12:20<22:05:14, 7.64s/it, loss=0.0004, acc=0.9984, iter_time=8.97s]
Epoch 0: 16%|█▌ | 1976/12384 [4:12:28<22:05:14, 7.64s/it, loss=0.0004, acc=0.9994, iter_time=6.97s]
Epoch 0: 16%|█▌ | 1977/12384 [4:12:28<22:04:47, 7.64s/it, loss=0.0004, acc=0.9994, iter_time=6.97s]
Epoch 0: 16%|█▌ | 1977/12384 [4:12:36<22:04:47, 7.64s/it, loss=0.0004, acc=0.9996, iter_time=7.95s]
Epoch 0: 16%|█▌ | 1978/12384 [4:12:36<22:03:52, 7.63s/it, loss=0.0004, acc=0.9996, iter_time=7.95s]
Epoch 0: 16%|█▌ | 1978/12384 [4:12:43<22:03:52, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 16%|█▌ | 1979/12384 [4:12:43<22:03:04, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 16%|█▌ | 1979/12384 [4:12:51<22:03:04, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.61s]
Epoch 0: 16%|█▌ | 1980/12384 [4:12:51<22:04:35, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=7.61s]
Epoch 0: 16%|█▌ | 1980/12384 [4:12:59<22:04:35, 7.64s/it, loss=0.0006, acc=0.9991, iter_time=7.98s]
Epoch 0: 16%|█▌ | 1981/12384 [4:12:59<22:24:27, 7.75s/it, loss=0.0006, acc=0.9991, iter_time=7.98s]
Epoch 0: 16%|█▌ | 1981/12384 [4:13:07<22:24:27, 7.75s/it, loss=0.0004, acc=0.9991, iter_time=7.76s]
Epoch 0: 16%|█▌ | 1982/12384 [4:13:07<22:20:20, 7.73s/it, loss=0.0004, acc=0.9991, iter_time=7.76s]
Epoch 0: 16%|█▌ | 1982/12384 [4:13:14<22:20:20, 7.73s/it, loss=0.0002, acc=1.0000, iter_time=7.61s]
Epoch 0: 16%|█▌ | 1983/12384 [4:13:14<22:13:17, 7.69s/it, loss=0.0002, acc=1.0000, iter_time=7.61s]
Epoch 0: 16%|█▌ | 1983/12384 [4:13:22<22:13:17, 7.69s/it, loss=0.0002, acc=0.9998, iter_time=8.10s]
Epoch 0: 16%|█▌ | 1984/12384 [4:13:22<22:14:39, 7.70s/it, loss=0.0002, acc=0.9998, iter_time=8.10s]
Epoch 0: 16%|█▌ | 1984/12384 [4:13:29<22:14:39, 7.70s/it, loss=0.0007, acc=0.9972, iter_time=6.29s]
Epoch 0: 16%|█▌ | 1985/12384 [4:13:29<22:10:48, 7.68s/it, loss=0.0007, acc=0.9972, iter_time=6.29s]
Epoch 0: 16%|█▌ | 1985/12384 [4:13:37<22:10:48, 7.68s/it, loss=0.0004, acc=0.9997, iter_time=8.55s]
Epoch 0: 16%|█▌ | 1986/12384 [4:13:37<22:06:18, 7.65s/it, loss=0.0004, acc=0.9997, iter_time=8.55s]
Epoch 0: 16%|█▌ | 1986/12384 [4:13:45<22:06:18, 7.65s/it, loss=0.0003, acc=0.9997, iter_time=7.31s]
Epoch 0: 16%|█▌ | 1987/12384 [4:13:45<22:06:29, 7.66s/it, loss=0.0003, acc=0.9997, iter_time=7.31s]
Epoch 0: 16%|█▌ | 1987/12384 [4:13:52<22:06:29, 7.66s/it, loss=0.0005, acc=1.0000, iter_time=7.96s]
Epoch 0: 16%|█▌ | 1988/12384 [4:13:52<22:05:58, 7.65s/it, loss=0.0005, acc=1.0000, iter_time=7.96s]
Epoch 0: 16%|█▌ | 1988/12384 [4:14:00<22:05:58, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=3.67s]
Epoch 0: 16%|█▌ | 1989/12384 [4:14:00<22:05:35, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=3.67s]
Epoch 0: 16%|█▌ | 1989/12384 [4:14:08<22:05:35, 7.65s/it, loss=0.0003, acc=0.9998, iter_time=11.65s]
Epoch 0: 16%|█▌ | 1990/12384 [4:14:08<22:06:24, 7.66s/it, loss=0.0003, acc=0.9998, iter_time=11.65s]
Epoch 0: 16%|█▌ | 1990/12384 [4:14:15<22:06:24, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=6.23s]
Epoch 0: 16%|█▌ | 1991/12384 [4:14:15<22:07:12, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=6.23s]
Epoch 0: 16%|█▌ | 1991/12384 [4:14:23<22:07:12, 7.66s/it, loss=0.0002, acc=0.9998, iter_time=9.47s]
Epoch 0: 16%|█▌ | 1992/12384 [4:14:23<22:06:01, 7.66s/it, loss=0.0002, acc=0.9998, iter_time=9.47s]
Epoch 0: 16%|█▌ | 1992/12384 [4:14:31<22:06:01, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=4.13s]
Epoch 0: 16%|█▌ | 1993/12384 [4:14:31<22:04:59, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=4.13s]
Epoch 0: 16%|█▌ | 1993/12384 [4:14:38<22:04:59, 7.65s/it, loss=0.0002, acc=0.9998, iter_time=8.47s]
Epoch 0: 16%|█▌ | 1994/12384 [4:14:38<22:05:31, 7.65s/it, loss=0.0002, acc=0.9998, iter_time=8.47s]
Epoch 0: 16%|█▌ | 1994/12384 [4:14:46<22:05:31, 7.65s/it, loss=0.0002, acc=0.9998, iter_time=9.99s]
Epoch 0: 16%|█▌ | 1995/12384 [4:14:46<22:05:20, 7.65s/it, loss=0.0002, acc=0.9998, iter_time=9.99s]
Epoch 0: 16%|█▌ | 1995/12384 [4:14:54<22:05:20, 7.65s/it, loss=0.0005, acc=1.0000, iter_time=7.60s]
Epoch 0: 16%|█▌ | 1996/12384 [4:14:54<22:01:50, 7.63s/it, loss=0.0005, acc=1.0000, iter_time=7.60s]
Epoch 0: 16%|█▌ | 1996/12384 [4:15:01<22:01:50, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.64s]
Epoch 0: 16%|█▌ | 1997/12384 [4:15:01<22:01:59, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.64s]
Epoch 0: 16%|█▌ | 1997/12384 [4:15:09<22:01:59, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=4.57s]
Epoch 0: 16%|█▌ | 1998/12384 [4:15:09<22:03:39, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=4.57s]
Epoch 0: 16%|█▌ | 1998/12384 [4:15:16<22:03:39, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=10.70s]
Epoch 0: 16%|█▌ | 1999/12384 [4:15:16<22:00:35, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=10.70s]
Epoch 0: 16%|█▌ | 1999/12384 [4:15:24<22:00:35, 7.63s/it, loss=0.0004, acc=0.9998, iter_time=8.03s]
Epoch 0: 16%|█▌ | 2000/12384 [4:15:24<22:10:48, 7.69s/it, loss=0.0004, acc=0.9998, iter_time=8.03s]
Epoch 0: 16%|█▌ | 2000/12384 [4:15:32<22:10:48, 7.69s/it, loss=0.0011, acc=0.9961, iter_time=7.11s]
Epoch 0: 16%|█▌ | 2001/12384 [4:15:32<22:08:41, 7.68s/it, loss=0.0011, acc=0.9961, iter_time=7.11s]
Epoch 0: 16%|█▌ | 2001/12384 [4:15:40<22:08:41, 7.68s/it, loss=0.0001, acc=0.9998, iter_time=7.41s]
Epoch 0: 16%|█▌ | 2002/12384 [4:15:40<22:07:36, 7.67s/it, loss=0.0001, acc=0.9998, iter_time=7.41s]
Epoch 0: 16%|█▌ | 2002/12384 [4:15:47<22:07:36, 7.67s/it, loss=0.0008, acc=0.9977, iter_time=8.22s]
Epoch 0: 16%|█▌ | 2003/12384 [4:15:47<22:05:49, 7.66s/it, loss=0.0008, acc=0.9977, iter_time=8.22s]
Epoch 0: 16%|█▌ | 2003/12384 [4:15:55<22:05:49, 7.66s/it, loss=0.0028, acc=0.9974, iter_time=7.63s]
Epoch 0: 16%|█▌ | 2004/12384 [4:15:55<22:03:53, 7.65s/it, loss=0.0028, acc=0.9974, iter_time=7.63s]
Epoch 0: 16%|█▌ | 2004/12384 [4:16:02<22:03:53, 7.65s/it, loss=0.0013, acc=0.9964, iter_time=7.61s]
Epoch 0: 16%|█▌ | 2005/12384 [4:16:02<22:01:33, 7.64s/it, loss=0.0013, acc=0.9964, iter_time=7.61s]
Epoch 0: 16%|█▌ | 2005/12384 [4:16:10<22:01:33, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.89s]
Epoch 0: 16%|█▌ | 2006/12384 [4:16:10<22:13:24, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.89s]
Epoch 0: 16%|█▌ | 2006/12384 [4:16:18<22:13:24, 7.71s/it, loss=0.0004, acc=0.9995, iter_time=7.66s]
Epoch 0: 16%|█▌ | 2007/12384 [4:16:18<22:27:46, 7.79s/it, loss=0.0004, acc=0.9995, iter_time=7.66s]
Epoch 0: 16%|█▌ | 2007/12384 [4:16:26<22:27:46, 7.79s/it, loss=0.0003, acc=1.0000, iter_time=8.30s]
Epoch 0: 16%|█▌ | 2008/12384 [4:16:26<22:19:24, 7.75s/it, loss=0.0003, acc=1.0000, iter_time=8.30s]
Epoch 0: 16%|█▌ | 2008/12384 [4:16:34<22:19:24, 7.75s/it, loss=0.0008, acc=0.9988, iter_time=7.26s]
Epoch 0: 16%|█▌ | 2009/12384 [4:16:34<22:12:16, 7.70s/it, loss=0.0008, acc=0.9988, iter_time=7.26s]
Epoch 0: 16%|█▌ | 2009/12384 [4:16:41<22:12:16, 7.70s/it, loss=0.0106, acc=0.9933, iter_time=4.32s]
Epoch 0: 16%|█▌ | 2010/12384 [4:16:41<22:09:06, 7.69s/it, loss=0.0106, acc=0.9933, iter_time=4.32s]
Epoch 0: 16%|█▌ | 2010/12384 [4:16:49<22:09:06, 7.69s/it, loss=0.0006, acc=0.9983, iter_time=10.94s]
Epoch 0: 16%|█▌ | 2011/12384 [4:16:49<22:04:38, 7.66s/it, loss=0.0006, acc=0.9983, iter_time=10.94s]
Epoch 0: 16%|█▌ | 2011/12384 [4:16:56<22:04:38, 7.66s/it, loss=0.0019, acc=0.9972, iter_time=7.60s]
Epoch 0: 16%|█▌ | 2012/12384 [4:16:56<22:02:41, 7.65s/it, loss=0.0019, acc=0.9972, iter_time=7.60s]
Epoch 0: 16%|█▌ | 2012/12384 [4:17:04<22:02:41, 7.65s/it, loss=0.0006, acc=0.9987, iter_time=6.43s]
Epoch 0: 16%|█▋ | 2013/12384 [4:17:04<22:03:10, 7.66s/it, loss=0.0006, acc=0.9987, iter_time=6.43s]
Epoch 0: 16%|█▋ | 2013/12384 [4:17:12<22:03:10, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=6.24s]
Epoch 0: 16%|█▋ | 2014/12384 [4:17:12<22:01:19, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=6.24s]
Epoch 0: 16%|█▋ | 2014/12384 [4:17:19<22:01:19, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=10.40s]
Epoch 0: 16%|█▋ | 2015/12384 [4:17:19<22:07:21, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=10.40s]
Epoch 0: 16%|█▋ | 2015/12384 [4:17:27<22:07:21, 7.68s/it, loss=0.0017, acc=0.9963, iter_time=7.65s]
Epoch 0: 16%|█▋ | 2016/12384 [4:17:27<22:07:43, 7.68s/it, loss=0.0017, acc=0.9963, iter_time=7.65s]
Epoch 0: 16%|█▋ | 2016/12384 [4:17:35<22:07:43, 7.68s/it, loss=0.0007, acc=0.9967, iter_time=7.34s]
Epoch 0: 16%|█▋ | 2017/12384 [4:17:35<22:04:46, 7.67s/it, loss=0.0007, acc=0.9967, iter_time=7.34s]
Epoch 0: 16%|█▋ | 2017/12384 [4:17:42<22:04:46, 7.67s/it, loss=0.0003, acc=1.0000, iter_time=7.00s]
Epoch 0: 16%|█▋ | 2018/12384 [4:17:42<22:04:33, 7.67s/it, loss=0.0003, acc=1.0000, iter_time=7.00s]
Epoch 0: 16%|█▋ | 2018/12384 [4:17:50<22:04:33, 7.67s/it, loss=0.0019, acc=0.9958, iter_time=8.63s]
Epoch 0: 16%|█▋ | 2019/12384 [4:17:50<22:04:42, 7.67s/it, loss=0.0019, acc=0.9958, iter_time=8.63s]
Epoch 0: 16%|█▋ | 2019/12384 [4:17:58<22:04:42, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=7.64s]
Epoch 0: 16%|█▋ | 2020/12384 [4:17:58<22:04:45, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=7.64s]
Epoch 0: 16%|█▋ | 2020/12384 [4:18:05<22:04:45, 7.67s/it, loss=0.0004, acc=1.0000, iter_time=7.68s]
Epoch 0: 16%|█▋ | 2021/12384 [4:18:05<22:01:19, 7.65s/it, loss=0.0004, acc=1.0000, iter_time=7.68s]
Epoch 0: 16%|█▋ | 2021/12384 [4:18:13<22:01:19, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=4.76s]
Epoch 0: 16%|█▋ | 2022/12384 [4:18:13<22:01:05, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=4.76s]
Epoch 0: 16%|█▋ | 2022/12384 [4:18:21<22:01:05, 7.65s/it, loss=0.0002, acc=0.9990, iter_time=10.50s]
Epoch 0: 16%|█▋ | 2023/12384 [4:18:21<22:00:32, 7.65s/it, loss=0.0002, acc=0.9990, iter_time=10.50s]
Epoch 0: 16%|█▋ | 2023/12384 [4:18:28<22:00:32, 7.65s/it, loss=0.0016, acc=0.9940, iter_time=8.04s]
Epoch 0: 16%|█▋ | 2024/12384 [4:18:28<22:00:13, 7.65s/it, loss=0.0016, acc=0.9940, iter_time=8.04s]
Epoch 0: 16%|█▋ | 2024/12384 [4:18:36<22:00:13, 7.65s/it, loss=0.0006, acc=0.9985, iter_time=7.27s]
Epoch 0: 16%|█▋ | 2025/12384 [4:18:36<22:04:21, 7.67s/it, loss=0.0006, acc=0.9985, iter_time=7.27s]
Epoch 0: 16%|█▋ | 2025/12384 [4:18:44<22:04:21, 7.67s/it, loss=0.0017, acc=0.9965, iter_time=7.72s]
Epoch 0: 16%|█▋ | 2026/12384 [4:18:44<22:04:00, 7.67s/it, loss=0.0017, acc=0.9965, iter_time=7.72s]
Epoch 0: 16%|█▋ | 2026/12384 [4:18:51<22:04:00, 7.67s/it, loss=0.0033, acc=0.9953, iter_time=7.66s]
Epoch 0: 16%|█▋ | 2027/12384 [4:18:51<22:03:18, 7.67s/it, loss=0.0033, acc=0.9953, iter_time=7.66s]
Epoch 0: 16%|█▋ | 2027/12384 [4:18:59<22:03:18, 7.67s/it, loss=0.0007, acc=0.9979, iter_time=7.68s]
Epoch 0: 16%|█▋ | 2028/12384 [4:18:59<22:02:29, 7.66s/it, loss=0.0007, acc=0.9979, iter_time=7.68s]
Epoch 0: 16%|█▋ | 2028/12384 [4:19:07<22:02:29, 7.66s/it, loss=0.0007, acc=0.9980, iter_time=7.65s]
Epoch 0: 16%|█▋ | 2029/12384 [4:19:07<22:02:47, 7.66s/it, loss=0.0007, acc=0.9980, iter_time=7.65s]
Epoch 0: 16%|█▋ | 2029/12384 [4:19:14<22:02:47, 7.66s/it, loss=0.0022, acc=0.9895, iter_time=7.66s]
Epoch 0: 16%|█▋ | 2030/12384 [4:19:14<21:59:39, 7.65s/it, loss=0.0022, acc=0.9895, iter_time=7.66s]
Epoch 0: 16%|█▋ | 2030/12384 [4:19:22<21:59:39, 7.65s/it, loss=0.0003, acc=0.9979, iter_time=7.60s]
Epoch 0: 16%|█▋ | 2031/12384 [4:19:22<21:57:51, 7.64s/it, loss=0.0003, acc=0.9979, iter_time=7.60s]
Epoch 0: 16%|█▋ | 2031/12384 [4:19:30<21:57:51, 7.64s/it, loss=0.0012, acc=0.9958, iter_time=8.33s]
Epoch 0: 16%|█▋ | 2032/12384 [4:19:30<22:12:37, 7.72s/it, loss=0.0012, acc=0.9958, iter_time=8.33s]
Epoch 0: 16%|█▋ | 2032/12384 [4:19:38<22:12:37, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=3.68s]
Epoch 0: 16%|█▋ | 2033/12384 [4:19:38<22:26:28, 7.80s/it, loss=0.0001, acc=1.0000, iter_time=3.68s]
Epoch 0: 16%|█▋ | 2033/12384 [4:19:46<22:26:28, 7.80s/it, loss=0.0003, acc=0.9998, iter_time=9.83s]
Epoch 0: 16%|█▋ | 2034/12384 [4:19:46<22:19:54, 7.77s/it, loss=0.0003, acc=0.9998, iter_time=9.83s]
Epoch 0: 16%|█▋ | 2034/12384 [4:19:53<22:19:54, 7.77s/it, loss=0.0080, acc=0.9892, iter_time=9.38s]
Epoch 0: 16%|█▋ | 2035/12384 [4:19:53<22:12:00, 7.72s/it, loss=0.0080, acc=0.9892, iter_time=9.38s]
Epoch 0: 16%|█▋ | 2035/12384 [4:20:01<22:12:00, 7.72s/it, loss=0.0016, acc=0.9959, iter_time=7.31s]
Epoch 0: 16%|█▋ | 2036/12384 [4:20:01<22:08:40, 7.70s/it, loss=0.0016, acc=0.9959, iter_time=7.31s]
Epoch 0: 16%|█▋ | 2036/12384 [4:20:09<22:08:40, 7.70s/it, loss=0.0002, acc=1.0000, iter_time=6.52s]
Epoch 0: 16%|█▋ | 2037/12384 [4:20:09<22:07:42, 7.70s/it, loss=0.0002, acc=1.0000, iter_time=6.52s]
Epoch 0: 16%|█▋ | 2037/12384 [4:20:16<22:07:42, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=6.10s]
Epoch 0: 16%|█▋ | 2038/12384 [4:20:16<22:04:05, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=6.10s]
Epoch 0: 16%|█▋ | 2038/12384 [4:20:24<22:04:05, 7.68s/it, loss=0.0006, acc=0.9980, iter_time=10.83s]
Epoch 0: 16%|█▋ | 2039/12384 [4:20:24<22:09:00, 7.71s/it, loss=0.0006, acc=0.9980, iter_time=10.83s]
Epoch 0: 16%|█▋ | 2039/12384 [4:20:32<22:09:00, 7.71s/it, loss=0.0002, acc=1.0000, iter_time=7.99s]
Epoch 0: 16%|█▋ | 2040/12384 [4:20:32<22:03:05, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=7.99s]
Epoch 0: 16%|█▋ | 2040/12384 [4:20:39<22:03:05, 7.67s/it, loss=0.0014, acc=0.9969, iter_time=7.20s]
Epoch 0: 16%|█▋ | 2041/12384 [4:20:39<22:01:32, 7.67s/it, loss=0.0014, acc=0.9969, iter_time=7.20s]
Epoch 0: 16%|█▋ | 2041/12384 [4:20:47<22:01:32, 7.67s/it, loss=0.0009, acc=0.9990, iter_time=6.79s]
Epoch 0: 16%|█▋ | 2042/12384 [4:20:47<21:59:26, 7.65s/it, loss=0.0009, acc=0.9990, iter_time=6.79s]
Epoch 0: 16%|█▋ | 2042/12384 [4:20:54<21:59:26, 7.65s/it, loss=0.0007, acc=0.9980, iter_time=8.49s]
Epoch 0: 16%|█▋ | 2043/12384 [4:20:54<21:56:41, 7.64s/it, loss=0.0007, acc=0.9980, iter_time=8.49s]
Epoch 0: 16%|█▋ | 2043/12384 [4:21:02<21:56:41, 7.64s/it, loss=0.0015, acc=0.9952, iter_time=7.59s]
Epoch 0: 17%|█▋ | 2044/12384 [4:21:02<21:55:31, 7.63s/it, loss=0.0015, acc=0.9952, iter_time=7.59s]
Epoch 0: 17%|█▋ | 2044/12384 [4:21:10<21:55:31, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.34s]
Epoch 0: 17%|█▋ | 2045/12384 [4:21:10<21:57:28, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=7.34s]
Epoch 0: 17%|█▋ | 2045/12384 [4:21:17<21:57:28, 7.65s/it, loss=0.0004, acc=0.9998, iter_time=5.98s]
Epoch 0: 17%|█▋ | 2046/12384 [4:21:17<21:55:06, 7.63s/it, loss=0.0004, acc=0.9998, iter_time=5.98s]
Epoch 0: 17%|█▋ | 2046/12384 [4:21:25<21:55:06, 7.63s/it, loss=0.0002, acc=0.9986, iter_time=9.59s]
Epoch 0: 17%|█▋ | 2047/12384 [4:21:25<21:55:26, 7.64s/it, loss=0.0002, acc=0.9986, iter_time=9.59s]
Epoch 0: 17%|█▋ | 2047/12384 [4:21:33<21:55:26, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.02s]
Epoch 0: 17%|█▋ | 2048/12384 [4:21:33<21:53:39, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.02s]
Epoch 0: 17%|█▋ | 2048/12384 [4:21:40<21:53:39, 7.63s/it, loss=0.0020, acc=0.9946, iter_time=7.24s]
Epoch 0: 17%|█▋ | 2049/12384 [4:21:40<21:55:14, 7.64s/it, loss=0.0020, acc=0.9946, iter_time=7.24s]
Epoch 0: 17%|█▋ | 2049/12384 [4:21:48<21:55:14, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.11s]
Epoch 0: 17%|█▋ | 2050/12384 [4:21:48<21:57:11, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.11s]
Epoch 0: 17%|█▋ | 2050/12384 [4:21:56<21:57:11, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 0: 17%|█▋ | 2051/12384 [4:21:56<21:56:52, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 0: 17%|█▋ | 2051/12384 [4:22:03<21:56:52, 7.65s/it, loss=0.0006, acc=0.9985, iter_time=7.75s]
Epoch 0: 17%|█▋ | 2052/12384 [4:22:03<22:06:01, 7.70s/it, loss=0.0006, acc=0.9985, iter_time=7.75s]
Epoch 0: 17%|█▋ | 2052/12384 [4:22:11<22:06:01, 7.70s/it, loss=0.0001, acc=0.9995, iter_time=7.75s]
Epoch 0: 17%|█▋ | 2053/12384 [4:22:11<22:05:49, 7.70s/it, loss=0.0001, acc=0.9995, iter_time=7.75s]
Epoch 0: 17%|█▋ | 2053/12384 [4:22:19<22:05:49, 7.70s/it, loss=0.0018, acc=0.9981, iter_time=7.70s]
Epoch 0: 17%|█▋ | 2054/12384 [4:22:19<22:03:20, 7.69s/it, loss=0.0018, acc=0.9981, iter_time=7.70s]
Epoch 0: 17%|█▋ | 2054/12384 [4:22:26<22:03:20, 7.69s/it, loss=0.0010, acc=0.9964, iter_time=4.82s]
Epoch 0: 17%|█▋ | 2055/12384 [4:22:26<22:01:18, 7.68s/it, loss=0.0010, acc=0.9964, iter_time=4.82s]
Epoch 0: 17%|█▋ | 2055/12384 [4:22:34<22:01:18, 7.68s/it, loss=0.0008, acc=0.9981, iter_time=10.84s]
Epoch 0: 17%|█▋ | 2056/12384 [4:22:34<21:57:53, 7.66s/it, loss=0.0008, acc=0.9981, iter_time=10.84s]
Epoch 0: 17%|█▋ | 2056/12384 [4:22:42<21:57:53, 7.66s/it, loss=0.0001, acc=0.9999, iter_time=7.22s]
Epoch 0: 17%|█▋ | 2057/12384 [4:22:42<21:55:39, 7.64s/it, loss=0.0001, acc=0.9999, iter_time=7.22s]
Epoch 0: 17%|█▋ | 2057/12384 [4:22:49<21:55:39, 7.64s/it, loss=0.0003, acc=0.9999, iter_time=7.61s]
Epoch 0: 17%|█▋ | 2058/12384 [4:22:49<21:54:56, 7.64s/it, loss=0.0003, acc=0.9999, iter_time=7.61s]
Epoch 0: 17%|█▋ | 2058/12384 [4:22:57<21:54:56, 7.64s/it, loss=0.0124, acc=0.9792, iter_time=7.95s]
Epoch 0: 17%|█▋ | 2059/12384 [4:22:57<22:13:56, 7.75s/it, loss=0.0124, acc=0.9792, iter_time=7.95s]
Epoch 0: 17%|█▋ | 2059/12384 [4:23:05<22:13:56, 7.75s/it, loss=0.0002, acc=1.0000, iter_time=6.21s]
Epoch 0: 17%|█▋ | 2060/12384 [4:23:05<22:06:13, 7.71s/it, loss=0.0002, acc=1.0000, iter_time=6.21s]
Epoch 0: 17%|█▋ | 2060/12384 [4:23:12<22:06:13, 7.71s/it, loss=0.0168, acc=0.9786, iter_time=9.10s]
Epoch 0: 17%|█▋ | 2061/12384 [4:23:12<22:02:27, 7.69s/it, loss=0.0168, acc=0.9786, iter_time=9.10s]
Epoch 0: 17%|█▋ | 2061/12384 [4:23:20<22:02:27, 7.69s/it, loss=0.0002, acc=1.0000, iter_time=7.66s]
Epoch 0: 17%|█▋ | 2062/12384 [4:23:20<22:00:58, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=7.66s]
Epoch 0: 17%|█▋ | 2062/12384 [4:23:28<22:00:58, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 17%|█▋ | 2063/12384 [4:23:28<21:57:34, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 17%|█▋ | 2063/12384 [4:23:35<21:57:34, 7.66s/it, loss=0.0004, acc=0.9998, iter_time=7.99s]
Epoch 0: 17%|█▋ | 2064/12384 [4:23:35<21:59:06, 7.67s/it, loss=0.0004, acc=0.9998, iter_time=7.99s]
Epoch 0: 17%|█▋ | 2064/12384 [4:23:43<21:59:06, 7.67s/it, loss=0.0017, acc=0.9990, iter_time=7.31s]
Epoch 0: 17%|█▋ | 2065/12384 [4:23:43<21:56:02, 7.65s/it, loss=0.0017, acc=0.9990, iter_time=7.31s]
Epoch 0: 17%|█▋ | 2065/12384 [4:23:51<21:56:02, 7.65s/it, loss=0.0009, acc=0.9958, iter_time=7.63s]
Epoch 0: 17%|█▋ | 2066/12384 [4:23:51<21:55:53, 7.65s/it, loss=0.0009, acc=0.9958, iter_time=7.63s]
Epoch 0: 17%|█▋ | 2066/12384 [4:23:58<21:55:53, 7.65s/it, loss=0.0006, acc=0.9994, iter_time=7.64s]
Epoch 0: 17%|█▋ | 2067/12384 [4:23:58<21:54:21, 7.64s/it, loss=0.0006, acc=0.9994, iter_time=7.64s]
Epoch 0: 17%|█▋ | 2067/12384 [4:24:06<21:54:21, 7.64s/it, loss=0.0020, acc=0.9943, iter_time=7.63s]
Epoch 0: 17%|█▋ | 2068/12384 [4:24:06<21:52:42, 7.63s/it, loss=0.0020, acc=0.9943, iter_time=7.63s]
Epoch 0: 17%|█▋ | 2068/12384 [4:24:14<21:52:42, 7.63s/it, loss=0.0008, acc=0.9972, iter_time=7.61s]
Epoch 0: 17%|█▋ | 2069/12384 [4:24:14<21:52:45, 7.64s/it, loss=0.0008, acc=0.9972, iter_time=7.61s]
Epoch 0: 17%|█▋ | 2069/12384 [4:24:21<21:52:45, 7.64s/it, loss=0.0008, acc=0.9986, iter_time=7.66s]
Epoch 0: 17%|█▋ | 2070/12384 [4:24:21<21:52:55, 7.64s/it, loss=0.0008, acc=0.9986, iter_time=7.66s]
Epoch 0: 17%|█▋ | 2070/12384 [4:24:29<21:52:55, 7.64s/it, loss=0.0005, acc=0.9963, iter_time=6.70s]
Epoch 0: 17%|█▋ | 2071/12384 [4:24:29<21:52:46, 7.64s/it, loss=0.0005, acc=0.9963, iter_time=6.70s]
Epoch 0: 17%|█▋ | 2071/12384 [4:24:36<21:52:46, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.95s]
Epoch 0: 17%|█▋ | 2072/12384 [4:24:36<21:51:37, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.95s]
Epoch 0: 17%|█▋ | 2072/12384 [4:24:44<21:51:37, 7.63s/it, loss=0.0007, acc=0.9979, iter_time=7.24s]
Epoch 0: 17%|█▋ | 2073/12384 [4:24:44<21:52:08, 7.64s/it, loss=0.0007, acc=0.9979, iter_time=7.24s]
Epoch 0: 17%|█▋ | 2073/12384 [4:24:52<21:52:08, 7.64s/it, loss=0.0004, acc=1.0000, iter_time=7.63s]
Epoch 0: 17%|█▋ | 2074/12384 [4:24:52<21:50:30, 7.63s/it, loss=0.0004, acc=1.0000, iter_time=7.63s]
Epoch 0: 17%|█▋ | 2074/12384 [4:24:59<21:50:30, 7.63s/it, loss=0.0010, acc=0.9999, iter_time=7.62s]
Epoch 0: 17%|█▋ | 2075/12384 [4:24:59<21:50:29, 7.63s/it, loss=0.0010, acc=0.9999, iter_time=7.62s]
Epoch 0: 17%|█▋ | 2075/12384 [4:25:07<21:50:29, 7.63s/it, loss=0.0004, acc=1.0000, iter_time=7.63s]
Epoch 0: 17%|█▋ | 2076/12384 [4:25:07<21:49:31, 7.62s/it, loss=0.0004, acc=1.0000, iter_time=7.63s]
Epoch 0: 17%|█▋ | 2076/12384 [4:25:15<21:49:31, 7.62s/it, loss=0.0005, acc=0.9984, iter_time=7.64s]
Epoch 0: 17%|█▋ | 2077/12384 [4:25:15<21:50:56, 7.63s/it, loss=0.0005, acc=0.9984, iter_time=7.64s]
Epoch 0: 17%|█▋ | 2077/12384 [4:25:22<21:50:56, 7.63s/it, loss=0.0011, acc=0.9990, iter_time=7.62s]
Epoch 0: 17%|█▋ | 2078/12384 [4:25:22<21:49:58, 7.63s/it, loss=0.0011, acc=0.9990, iter_time=7.62s]
Epoch 0: 17%|█▋ | 2078/12384 [4:25:30<21:49:58, 7.63s/it, loss=0.0018, acc=0.9956, iter_time=7.63s]
Epoch 0: 17%|█▋ | 2079/12384 [4:25:30<21:52:03, 7.64s/it, loss=0.0018, acc=0.9956, iter_time=7.63s]
Epoch 0: 17%|█▋ | 2079/12384 [4:25:37<21:52:03, 7.64s/it, loss=0.0004, acc=1.0000, iter_time=8.04s]
Epoch 0: 17%|█▋ | 2080/12384 [4:25:37<21:50:24, 7.63s/it, loss=0.0004, acc=1.0000, iter_time=8.04s]
Epoch 0: 17%|█▋ | 2080/12384 [4:25:45<21:50:24, 7.63s/it, loss=0.0006, acc=0.9966, iter_time=7.21s]
Epoch 0: 17%|█▋ | 2081/12384 [4:25:45<21:54:14, 7.65s/it, loss=0.0006, acc=0.9966, iter_time=7.21s]
Epoch 0: 17%|█▋ | 2081/12384 [4:25:53<21:54:14, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=6.17s]
Epoch 0: 17%|█▋ | 2082/12384 [4:25:53<21:52:49, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=6.17s]
Epoch 0: 17%|█▋ | 2082/12384 [4:26:00<21:52:49, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=9.15s]
Epoch 0: 17%|█▋ | 2083/12384 [4:26:00<21:53:07, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=9.15s]
Epoch 0: 17%|█▋ | 2083/12384 [4:26:08<21:53:07, 7.65s/it, loss=0.0006, acc=0.9991, iter_time=7.68s]
Epoch 0: 17%|█▋ | 2084/12384 [4:26:08<21:53:54, 7.65s/it, loss=0.0006, acc=0.9991, iter_time=7.68s]
Epoch 0: 17%|█▋ | 2084/12384 [4:26:16<21:53:54, 7.65s/it, loss=0.0054, acc=0.9774, iter_time=6.48s]
Epoch 0: 17%|█▋ | 2085/12384 [4:26:16<22:10:00, 7.75s/it, loss=0.0054, acc=0.9774, iter_time=6.48s]
Epoch 0: 17%|█▋ | 2085/12384 [4:26:24<22:10:00, 7.75s/it, loss=0.0002, acc=0.9998, iter_time=8.55s]
Epoch 0: 17%|█▋ | 2086/12384 [4:26:24<22:01:45, 7.70s/it, loss=0.0002, acc=0.9998, iter_time=8.55s]
Epoch 0: 17%|█▋ | 2086/12384 [4:26:31<22:01:45, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=8.18s]
Epoch 0: 17%|█▋ | 2087/12384 [4:26:31<21:59:05, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=8.18s]
Epoch 0: 17%|█▋ | 2087/12384 [4:26:39<21:59:05, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 0: 17%|█▋ | 2088/12384 [4:26:39<21:57:50, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 0: 17%|█▋ | 2088/12384 [4:26:47<21:57:50, 7.68s/it, loss=0.0004, acc=0.9984, iter_time=7.05s]
Epoch 0: 17%|█▋ | 2089/12384 [4:26:47<21:55:16, 7.67s/it, loss=0.0004, acc=0.9984, iter_time=7.05s]
Epoch 0: 17%|█▋ | 2089/12384 [4:26:54<21:55:16, 7.67s/it, loss=0.0004, acc=0.9984, iter_time=8.25s]
Epoch 0: 17%|█▋ | 2090/12384 [4:26:54<21:54:53, 7.66s/it, loss=0.0004, acc=0.9984, iter_time=8.25s]
Epoch 0: 17%|█▋ | 2090/12384 [4:27:02<21:54:53, 7.66s/it, loss=0.0007, acc=0.9988, iter_time=4.59s]
Epoch 0: 17%|█▋ | 2091/12384 [4:27:02<21:52:36, 7.65s/it, loss=0.0007, acc=0.9988, iter_time=4.59s]
Epoch 0: 17%|█▋ | 2091/12384 [4:27:10<21:52:36, 7.65s/it, loss=0.0008, acc=0.9981, iter_time=7.64s]
Epoch 0: 17%|█▋ | 2092/12384 [4:27:10<21:54:39, 7.66s/it, loss=0.0008, acc=0.9981, iter_time=7.64s]
Epoch 0: 17%|█▋ | 2092/12384 [4:27:17<21:54:39, 7.66s/it, loss=0.0010, acc=0.9992, iter_time=10.51s]
Epoch 0: 17%|█▋ | 2093/12384 [4:27:17<21:53:19, 7.66s/it, loss=0.0010, acc=0.9992, iter_time=10.51s]
Epoch 0: 17%|█▋ | 2093/12384 [4:27:25<21:53:19, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.86s]
Epoch 0: 17%|█▋ | 2094/12384 [4:27:25<21:50:49, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.86s]
Epoch 0: 17%|█▋ | 2094/12384 [4:27:33<21:50:49, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=5.83s]
Epoch 0: 17%|█▋ | 2095/12384 [4:27:33<21:51:15, 7.65s/it, loss=0.0001, acc=0.9998, iter_time=5.83s]
Epoch 0: 17%|█▋ | 2095/12384 [4:27:40<21:51:15, 7.65s/it, loss=0.0012, acc=0.9955, iter_time=9.43s]
Epoch 0: 17%|█▋ | 2096/12384 [4:27:40<21:51:13, 7.65s/it, loss=0.0012, acc=0.9955, iter_time=9.43s]
Epoch 0: 17%|█▋ | 2096/12384 [4:27:48<21:51:13, 7.65s/it, loss=0.0053, acc=0.9871, iter_time=7.65s]
Epoch 0: 17%|█▋ | 2097/12384 [4:27:48<21:48:55, 7.63s/it, loss=0.0053, acc=0.9871, iter_time=7.65s]
Epoch 0: 17%|█▋ | 2097/12384 [4:27:55<21:48:55, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.01s]
Epoch 0: 17%|█▋ | 2098/12384 [4:27:55<21:49:28, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=5.01s]
Epoch 0: 17%|█▋ | 2098/12384 [4:28:03<21:49:28, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=10.26s]
Epoch 0: 17%|█▋ | 2099/12384 [4:28:03<21:48:05, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=10.26s]
Epoch 0: 17%|█▋ | 2099/12384 [4:28:11<21:48:05, 7.63s/it, loss=0.0025, acc=0.9951, iter_time=8.00s]
Epoch 0: 17%|█▋ | 2100/12384 [4:28:11<21:46:24, 7.62s/it, loss=0.0025, acc=0.9951, iter_time=8.00s]
Epoch 0: 17%|█▋ | 2100/12384 [4:28:18<21:46:24, 7.62s/it, loss=0.0016, acc=0.9949, iter_time=7.22s]
Epoch 0: 17%|█▋ | 2101/12384 [4:28:18<21:47:21, 7.63s/it, loss=0.0016, acc=0.9949, iter_time=7.22s]
Epoch 0: 17%|█▋ | 2101/12384 [4:28:26<21:47:21, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 17%|█▋ | 2102/12384 [4:28:26<21:47:15, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 17%|█▋ | 2102/12384 [4:28:34<21:47:15, 7.63s/it, loss=0.0004, acc=0.9988, iter_time=7.62s]
Epoch 0: 17%|█▋ | 2103/12384 [4:28:34<21:47:19, 7.63s/it, loss=0.0004, acc=0.9988, iter_time=7.62s]
Epoch 0: 17%|█▋ | 2103/12384 [4:28:41<21:47:19, 7.63s/it, loss=0.0020, acc=0.9977, iter_time=7.62s]
Epoch 0: 17%|█▋ | 2104/12384 [4:28:41<21:48:25, 7.64s/it, loss=0.0020, acc=0.9977, iter_time=7.62s]
Epoch 0: 17%|█▋ | 2104/12384 [4:28:49<21:48:25, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.01s]
Epoch 0: 17%|█▋ | 2105/12384 [4:28:49<21:46:15, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.01s]
Epoch 0: 17%|█▋ | 2105/12384 [4:28:56<21:46:15, 7.62s/it, loss=0.0004, acc=0.9997, iter_time=8.24s]
Epoch 0: 17%|█▋ | 2106/12384 [4:28:56<21:45:51, 7.62s/it, loss=0.0004, acc=0.9997, iter_time=8.24s]
Epoch 0: 17%|█▋ | 2106/12384 [4:29:04<21:45:51, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 17%|█▋ | 2107/12384 [4:29:04<21:46:43, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 17%|█▋ | 2107/12384 [4:29:12<21:46:43, 7.63s/it, loss=0.0007, acc=0.9978, iter_time=7.67s]
Epoch 0: 17%|█▋ | 2108/12384 [4:29:12<21:48:01, 7.64s/it, loss=0.0007, acc=0.9978, iter_time=7.67s]
Epoch 0: 17%|█▋ | 2108/12384 [4:29:19<21:48:01, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.39s]
Epoch 0: 17%|█▋ | 2109/12384 [4:29:19<21:49:49, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.39s]
Epoch 0: 17%|█▋ | 2109/12384 [4:29:27<21:49:49, 7.65s/it, loss=0.0010, acc=0.9992, iter_time=6.73s]
Epoch 0: 17%|█▋ | 2110/12384 [4:29:27<21:47:58, 7.64s/it, loss=0.0010, acc=0.9992, iter_time=6.73s]
Epoch 0: 17%|█▋ | 2110/12384 [4:29:35<21:47:58, 7.64s/it, loss=0.0007, acc=0.9998, iter_time=6.99s]
Epoch 0: 17%|█▋ | 2111/12384 [4:29:35<21:46:22, 7.63s/it, loss=0.0007, acc=0.9998, iter_time=6.99s]
Epoch 0: 17%|█▋ | 2111/12384 [4:29:43<21:46:22, 7.63s/it, loss=0.0005, acc=0.9983, iter_time=9.87s]
Epoch 0: 17%|█▋ | 2112/12384 [4:29:43<22:04:32, 7.74s/it, loss=0.0005, acc=0.9983, iter_time=9.87s]
Epoch 0: 17%|█▋ | 2112/12384 [4:29:50<22:04:32, 7.74s/it, loss=0.0002, acc=1.0000, iter_time=7.53s]
Epoch 0: 17%|█▋ | 2113/12384 [4:29:50<21:58:25, 7.70s/it, loss=0.0002, acc=1.0000, iter_time=7.53s]
Epoch 0: 17%|█▋ | 2113/12384 [4:29:58<21:58:25, 7.70s/it, loss=0.0001, acc=0.9999, iter_time=7.65s]
Epoch 0: 17%|█▋ | 2114/12384 [4:29:58<21:56:59, 7.69s/it, loss=0.0001, acc=0.9999, iter_time=7.65s]
Epoch 0: 17%|█▋ | 2114/12384 [4:30:06<21:56:59, 7.69s/it, loss=0.0002, acc=0.9983, iter_time=7.46s]
Epoch 0: 17%|█▋ | 2115/12384 [4:30:06<21:54:41, 7.68s/it, loss=0.0002, acc=0.9983, iter_time=7.46s]
Epoch 0: 17%|█▋ | 2115/12384 [4:30:13<21:54:41, 7.68s/it, loss=0.0002, acc=0.9999, iter_time=7.96s]
Epoch 0: 17%|█▋ | 2116/12384 [4:30:13<21:55:33, 7.69s/it, loss=0.0002, acc=0.9999, iter_time=7.96s]
Epoch 0: 17%|█▋ | 2116/12384 [4:30:21<21:55:33, 7.69s/it, loss=0.0005, acc=0.9994, iter_time=5.71s]
Epoch 0: 17%|█▋ | 2117/12384 [4:30:21<21:52:44, 7.67s/it, loss=0.0005, acc=0.9994, iter_time=5.71s]
Epoch 0: 17%|█▋ | 2117/12384 [4:30:29<21:52:44, 7.67s/it, loss=0.0022, acc=0.9939, iter_time=9.58s]
Epoch 0: 17%|█▋ | 2118/12384 [4:30:29<21:51:47, 7.67s/it, loss=0.0022, acc=0.9939, iter_time=9.58s]
Epoch 0: 17%|█▋ | 2118/12384 [4:30:36<21:51:47, 7.67s/it, loss=0.0004, acc=0.9987, iter_time=5.66s]
Epoch 0: 17%|█▋ | 2119/12384 [4:30:36<21:49:33, 7.65s/it, loss=0.0004, acc=0.9987, iter_time=5.66s]
Epoch 0: 17%|█▋ | 2119/12384 [4:30:44<21:49:33, 7.65s/it, loss=0.0003, acc=0.9986, iter_time=9.53s]
Epoch 0: 17%|█▋ | 2120/12384 [4:30:44<21:47:46, 7.64s/it, loss=0.0003, acc=0.9986, iter_time=9.53s]
Epoch 0: 17%|█▋ | 2120/12384 [4:30:52<21:47:46, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.77s]
Epoch 0: 17%|█▋ | 2121/12384 [4:30:52<21:50:59, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.77s]
Epoch 0: 17%|█▋ | 2121/12384 [4:30:59<21:50:59, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 17%|█▋ | 2122/12384 [4:30:59<21:48:18, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 17%|█▋ | 2122/12384 [4:31:07<21:48:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 17%|█▋ | 2123/12384 [4:31:07<21:47:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 17%|█▋ | 2123/12384 [4:31:14<21:47:19, 7.64s/it, loss=0.0005, acc=0.9995, iter_time=5.65s]
Epoch 0: 17%|█▋ | 2124/12384 [4:31:14<21:46:57, 7.64s/it, loss=0.0005, acc=0.9995, iter_time=5.65s]
Epoch 0: 17%|█▋ | 2124/12384 [4:31:22<21:46:57, 7.64s/it, loss=0.0008, acc=0.9982, iter_time=9.69s]
Epoch 0: 17%|█▋ | 2125/12384 [4:31:22<21:47:46, 7.65s/it, loss=0.0008, acc=0.9982, iter_time=9.69s]
Epoch 0: 17%|█▋ | 2125/12384 [4:31:30<21:47:46, 7.65s/it, loss=0.0004, acc=0.9972, iter_time=7.69s]
Epoch 0: 17%|█▋ | 2126/12384 [4:31:30<21:50:25, 7.66s/it, loss=0.0004, acc=0.9972, iter_time=7.69s]
Epoch 0: 17%|█▋ | 2126/12384 [4:31:37<21:50:25, 7.66s/it, loss=0.0022, acc=0.9934, iter_time=7.72s]
Epoch 0: 17%|█▋ | 2127/12384 [4:31:37<21:50:50, 7.67s/it, loss=0.0022, acc=0.9934, iter_time=7.72s]
Epoch 0: 17%|█▋ | 2127/12384 [4:31:45<21:50:50, 7.67s/it, loss=0.0006, acc=0.9980, iter_time=8.14s]
Epoch 0: 17%|█▋ | 2128/12384 [4:31:45<21:56:56, 7.70s/it, loss=0.0006, acc=0.9980, iter_time=8.14s]
Epoch 0: 17%|█▋ | 2128/12384 [4:31:53<21:56:56, 7.70s/it, loss=0.0002, acc=1.0000, iter_time=7.32s]
Epoch 0: 17%|█▋ | 2129/12384 [4:31:53<21:57:06, 7.71s/it, loss=0.0002, acc=1.0000, iter_time=7.32s]
Epoch 0: 17%|█▋ | 2129/12384 [4:32:01<21:57:06, 7.71s/it, loss=0.0002, acc=1.0000, iter_time=7.72s]
Epoch 0: 17%|█▋ | 2130/12384 [4:32:01<21:57:19, 7.71s/it, loss=0.0002, acc=1.0000, iter_time=7.72s]
Epoch 0: 17%|█▋ | 2130/12384 [4:32:08<21:57:19, 7.71s/it, loss=0.0002, acc=1.0000, iter_time=7.73s]
Epoch 0: 17%|█▋ | 2131/12384 [4:32:08<21:58:32, 7.72s/it, loss=0.0002, acc=1.0000, iter_time=7.73s]
Epoch 0: 17%|█▋ | 2131/12384 [4:32:16<21:58:32, 7.72s/it, loss=0.0020, acc=0.9962, iter_time=7.69s]
Epoch 0: 17%|█▋ | 2132/12384 [4:32:16<21:56:54, 7.71s/it, loss=0.0020, acc=0.9962, iter_time=7.69s]
Epoch 0: 17%|█▋ | 2132/12384 [4:32:24<21:56:54, 7.71s/it, loss=0.0003, acc=0.9997, iter_time=7.72s]
Epoch 0: 17%|█▋ | 2133/12384 [4:32:24<21:57:27, 7.71s/it, loss=0.0003, acc=0.9997, iter_time=7.72s]
Epoch 0: 17%|█▋ | 2133/12384 [4:32:31<21:57:27, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=6.48s]
Epoch 0: 17%|█▋ | 2134/12384 [4:32:31<21:54:34, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=6.48s]
Epoch 0: 17%|█▋ | 2134/12384 [4:32:39<21:54:34, 7.70s/it, loss=0.0013, acc=0.9968, iter_time=8.85s]
Epoch 0: 17%|█▋ | 2135/12384 [4:32:39<21:53:44, 7.69s/it, loss=0.0013, acc=0.9968, iter_time=8.85s]
Epoch 0: 17%|█▋ | 2135/12384 [4:32:47<21:53:44, 7.69s/it, loss=0.0007, acc=0.9997, iter_time=7.56s]
Epoch 0: 17%|█▋ | 2136/12384 [4:32:47<21:49:32, 7.67s/it, loss=0.0007, acc=0.9997, iter_time=7.56s]
Epoch 0: 17%|█▋ | 2136/12384 [4:32:54<21:49:32, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=5.86s]
Epoch 0: 17%|█▋ | 2137/12384 [4:32:54<21:47:18, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=5.86s]
Epoch 0: 17%|█▋ | 2137/12384 [4:33:02<21:47:18, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=9.75s]
Epoch 0: 17%|█▋ | 2138/12384 [4:33:02<22:05:33, 7.76s/it, loss=0.0002, acc=1.0000, iter_time=9.75s]
Epoch 0: 17%|█▋ | 2138/12384 [4:33:10<22:05:33, 7.76s/it, loss=0.0002, acc=0.9996, iter_time=4.08s]
Epoch 0: 17%|█▋ | 2139/12384 [4:33:10<22:00:06, 7.73s/it, loss=0.0002, acc=0.9996, iter_time=4.08s]
Epoch 0: 17%|█▋ | 2139/12384 [4:33:18<22:00:06, 7.73s/it, loss=0.0002, acc=1.0000, iter_time=11.35s]
Epoch 0: 17%|█▋ | 2140/12384 [4:33:18<21:57:12, 7.72s/it, loss=0.0002, acc=1.0000, iter_time=11.35s]
Epoch 0: 17%|█▋ | 2140/12384 [4:33:25<21:57:12, 7.72s/it, loss=0.0003, acc=0.9999, iter_time=7.74s]
Epoch 0: 17%|█▋ | 2141/12384 [4:33:25<21:58:41, 7.72s/it, loss=0.0003, acc=0.9999, iter_time=7.74s]
Epoch 0: 17%|█▋ | 2141/12384 [4:33:33<21:58:41, 7.72s/it, loss=0.0023, acc=0.9967, iter_time=7.72s]
Epoch 0: 17%|█▋ | 2142/12384 [4:33:33<21:58:18, 7.72s/it, loss=0.0023, acc=0.9967, iter_time=7.72s]
Epoch 0: 17%|█▋ | 2142/12384 [4:33:41<21:58:18, 7.72s/it, loss=0.0001, acc=0.9998, iter_time=4.81s]
Epoch 0: 17%|█▋ | 2143/12384 [4:33:41<21:53:26, 7.70s/it, loss=0.0001, acc=0.9998, iter_time=4.81s]
Epoch 0: 17%|█▋ | 2143/12384 [4:33:49<21:53:26, 7.70s/it, loss=0.0003, acc=0.9989, iter_time=10.90s]
Epoch 0: 17%|█▋ | 2144/12384 [4:33:49<21:53:16, 7.69s/it, loss=0.0003, acc=0.9989, iter_time=10.90s]
Epoch 0: 17%|█▋ | 2144/12384 [4:33:56<21:53:16, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.18s]
Epoch 0: 17%|█▋ | 2145/12384 [4:33:56<21:48:31, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.18s]
Epoch 0: 17%|█▋ | 2145/12384 [4:34:04<21:48:31, 7.67s/it, loss=0.0027, acc=0.9913, iter_time=10.71s]
Epoch 0: 17%|█▋ | 2146/12384 [4:34:04<21:48:30, 7.67s/it, loss=0.0027, acc=0.9913, iter_time=10.71s]
Epoch 0: 17%|█▋ | 2146/12384 [4:34:11<21:48:30, 7.67s/it, loss=0.0004, acc=0.9996, iter_time=7.61s]
Epoch 0: 17%|█▋ | 2147/12384 [4:34:11<21:45:39, 7.65s/it, loss=0.0004, acc=0.9996, iter_time=7.61s]
Epoch 0: 17%|█▋ | 2147/12384 [4:34:19<21:45:39, 7.65s/it, loss=0.0005, acc=0.9993, iter_time=7.61s]
Epoch 0: 17%|█▋ | 2148/12384 [4:34:19<21:43:07, 7.64s/it, loss=0.0005, acc=0.9993, iter_time=7.61s]
Epoch 0: 17%|█▋ | 2148/12384 [4:34:27<21:43:07, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.58s]
Epoch 0: 17%|█▋ | 2149/12384 [4:34:27<21:42:26, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.58s]
Epoch 0: 17%|█▋ | 2149/12384 [4:34:34<21:42:26, 7.64s/it, loss=0.0005, acc=0.9998, iter_time=8.09s]
Epoch 0: 17%|█▋ | 2150/12384 [4:34:34<21:43:07, 7.64s/it, loss=0.0005, acc=0.9998, iter_time=8.09s]
Epoch 0: 17%|█▋ | 2150/12384 [4:34:42<21:43:07, 7.64s/it, loss=0.0004, acc=0.9994, iter_time=7.21s]
Epoch 0: 17%|█▋ | 2151/12384 [4:34:42<21:42:54, 7.64s/it, loss=0.0004, acc=0.9994, iter_time=7.21s]
Epoch 0: 17%|█▋ | 2151/12384 [4:34:50<21:42:54, 7.64s/it, loss=0.0005, acc=0.9976, iter_time=7.60s]
Epoch 0: 17%|█▋ | 2152/12384 [4:34:50<21:41:46, 7.63s/it, loss=0.0005, acc=0.9976, iter_time=7.60s]
Epoch 0: 17%|█▋ | 2152/12384 [4:34:57<21:41:46, 7.63s/it, loss=0.0013, acc=0.9983, iter_time=7.65s]
Epoch 0: 17%|█▋ | 2153/12384 [4:34:57<21:41:52, 7.63s/it, loss=0.0013, acc=0.9983, iter_time=7.65s]
Epoch 0: 17%|█▋ | 2153/12384 [4:35:05<21:41:52, 7.63s/it, loss=0.0007, acc=0.9977, iter_time=6.48s]
Epoch 0: 17%|█▋ | 2154/12384 [4:35:05<21:41:19, 7.63s/it, loss=0.0007, acc=0.9977, iter_time=6.48s]
Epoch 0: 17%|█▋ | 2154/12384 [4:35:12<21:41:19, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=6.78s]
Epoch 0: 17%|█▋ | 2155/12384 [4:35:12<21:40:52, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=6.78s]
Epoch 0: 17%|█▋ | 2155/12384 [4:35:20<21:40:52, 7.63s/it, loss=0.0007, acc=0.9982, iter_time=9.82s]
Epoch 0: 17%|█▋ | 2156/12384 [4:35:20<21:48:46, 7.68s/it, loss=0.0007, acc=0.9982, iter_time=9.82s]
Epoch 0: 17%|█▋ | 2156/12384 [4:35:28<21:48:46, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.70s]
Epoch 0: 17%|█▋ | 2157/12384 [4:35:28<21:50:02, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.70s]
Epoch 0: 17%|█▋ | 2157/12384 [4:35:36<21:50:02, 7.69s/it, loss=0.0007, acc=0.9963, iter_time=7.71s]
Epoch 0: 17%|█▋ | 2158/12384 [4:35:36<21:50:40, 7.69s/it, loss=0.0007, acc=0.9963, iter_time=7.71s]
Epoch 0: 17%|█▋ | 2158/12384 [4:35:43<21:50:40, 7.69s/it, loss=0.0032, acc=0.9922, iter_time=7.67s]
Epoch 0: 17%|█▋ | 2159/12384 [4:35:43<21:49:26, 7.68s/it, loss=0.0032, acc=0.9922, iter_time=7.67s]
Epoch 0: 17%|█▋ | 2159/12384 [4:35:51<21:49:26, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=8.17s]
Epoch 0: 17%|█▋ | 2160/12384 [4:35:51<21:54:20, 7.71s/it, loss=0.0002, acc=1.0000, iter_time=8.17s]
Epoch 0: 17%|█▋ | 2160/12384 [4:35:59<21:54:20, 7.71s/it, loss=0.0006, acc=0.9963, iter_time=7.34s]
Epoch 0: 17%|█▋ | 2161/12384 [4:35:59<21:55:04, 7.72s/it, loss=0.0006, acc=0.9963, iter_time=7.34s]
Epoch 0: 17%|█▋ | 2161/12384 [4:36:07<21:55:04, 7.72s/it, loss=0.0006, acc=0.9978, iter_time=7.71s]
Epoch 0: 17%|█▋ | 2162/12384 [4:36:07<21:54:00, 7.71s/it, loss=0.0006, acc=0.9978, iter_time=7.71s]
Epoch 0: 17%|█▋ | 2162/12384 [4:36:14<21:54:00, 7.71s/it, loss=0.0021, acc=0.9954, iter_time=6.98s]
Epoch 0: 17%|█▋ | 2163/12384 [4:36:14<21:55:18, 7.72s/it, loss=0.0021, acc=0.9954, iter_time=6.98s]
Epoch 0: 17%|█▋ | 2163/12384 [4:36:22<21:55:18, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=8.35s]
Epoch 0: 17%|█▋ | 2164/12384 [4:36:22<21:51:15, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=8.35s]
Epoch 0: 17%|█▋ | 2164/12384 [4:36:30<21:51:15, 7.70s/it, loss=0.0004, acc=1.0000, iter_time=7.68s]
Epoch 0: 17%|█▋ | 2165/12384 [4:36:30<22:05:42, 7.78s/it, loss=0.0004, acc=1.0000, iter_time=7.68s]
Epoch 0: 17%|█▋ | 2165/12384 [4:36:38<22:05:42, 7.78s/it, loss=0.0001, acc=1.0000, iter_time=8.06s]
Epoch 0: 17%|█▋ | 2166/12384 [4:36:38<22:03:57, 7.77s/it, loss=0.0001, acc=1.0000, iter_time=8.06s]
Epoch 0: 17%|█▋ | 2166/12384 [4:36:45<22:03:57, 7.77s/it, loss=0.0001, acc=1.0000, iter_time=7.82s]
Epoch 0: 17%|█▋ | 2167/12384 [4:36:45<22:03:38, 7.77s/it, loss=0.0001, acc=1.0000, iter_time=7.82s]
Epoch 0: 17%|█▋ | 2167/12384 [4:36:53<22:03:38, 7.77s/it, loss=0.0005, acc=0.9996, iter_time=7.57s]
Epoch 0: 18%|█▊ | 2168/12384 [4:36:53<21:56:24, 7.73s/it, loss=0.0005, acc=0.9996, iter_time=7.57s]
Epoch 0: 18%|█▊ | 2168/12384 [4:37:01<21:56:24, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 0: 18%|█▊ | 2169/12384 [4:37:01<21:51:14, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 0: 18%|█▊ | 2169/12384 [4:37:08<21:51:14, 7.70s/it, loss=0.0004, acc=0.9979, iter_time=8.27s]
Epoch 0: 18%|█▊ | 2170/12384 [4:37:08<21:48:22, 7.69s/it, loss=0.0004, acc=0.9979, iter_time=8.27s]
Epoch 0: 18%|█▊ | 2170/12384 [4:37:16<21:48:22, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 18%|█▊ | 2171/12384 [4:37:16<21:44:58, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 18%|█▊ | 2171/12384 [4:37:24<21:44:58, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=5.87s]
Epoch 0: 18%|█▊ | 2172/12384 [4:37:24<21:44:49, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=5.87s]
Epoch 0: 18%|█▊ | 2172/12384 [4:37:31<21:44:49, 7.67s/it, loss=0.0012, acc=0.9960, iter_time=9.09s]
Epoch 0: 18%|█▊ | 2173/12384 [4:37:31<21:44:14, 7.66s/it, loss=0.0012, acc=0.9960, iter_time=9.09s]
Epoch 0: 18%|█▊ | 2173/12384 [4:37:39<21:44:14, 7.66s/it, loss=0.0015, acc=0.9965, iter_time=7.96s]
Epoch 0: 18%|█▊ | 2174/12384 [4:37:39<21:40:47, 7.64s/it, loss=0.0015, acc=0.9965, iter_time=7.96s]
Epoch 0: 18%|█▊ | 2174/12384 [4:37:46<21:40:47, 7.64s/it, loss=0.0004, acc=0.9998, iter_time=4.82s]
Epoch 0: 18%|█▊ | 2175/12384 [4:37:46<21:38:52, 7.63s/it, loss=0.0004, acc=0.9998, iter_time=4.82s]
Epoch 0: 18%|█▊ | 2175/12384 [4:37:54<21:38:52, 7.63s/it, loss=0.0006, acc=0.9989, iter_time=10.78s]
Epoch 0: 18%|█▊ | 2176/12384 [4:37:54<21:42:44, 7.66s/it, loss=0.0006, acc=0.9989, iter_time=10.78s]
Epoch 0: 18%|█▊ | 2176/12384 [4:38:02<21:42:44, 7.66s/it, loss=0.0002, acc=0.9999, iter_time=7.33s]
Epoch 0: 18%|█▊ | 2177/12384 [4:38:02<21:46:22, 7.68s/it, loss=0.0002, acc=0.9999, iter_time=7.33s]
Epoch 0: 18%|█▊ | 2177/12384 [4:38:10<21:46:22, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=7.74s]
Epoch 0: 18%|█▊ | 2178/12384 [4:38:10<21:50:10, 7.70s/it, loss=0.0002, acc=1.0000, iter_time=7.74s]
Epoch 0: 18%|█▊ | 2178/12384 [4:38:17<21:50:10, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=6.53s]
Epoch 0: 18%|█▊ | 2179/12384 [4:38:17<21:47:28, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=6.53s]
Epoch 0: 18%|█▊ | 2179/12384 [4:38:25<21:47:28, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=8.56s]
Epoch 0: 18%|█▊ | 2180/12384 [4:38:25<21:43:43, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=8.56s]
Epoch 0: 18%|█▊ | 2180/12384 [4:38:33<21:43:43, 7.67s/it, loss=0.0001, acc=0.9993, iter_time=6.42s]
Epoch 0: 18%|█▊ | 2181/12384 [4:38:33<21:43:53, 7.67s/it, loss=0.0001, acc=0.9993, iter_time=6.42s]
Epoch 0: 18%|█▊ | 2181/12384 [4:38:40<21:43:53, 7.67s/it, loss=0.0004, acc=0.9977, iter_time=9.15s]
Epoch 0: 18%|█▊ | 2182/12384 [4:38:40<21:39:51, 7.64s/it, loss=0.0004, acc=0.9977, iter_time=9.15s]
Epoch 0: 18%|█▊ | 2182/12384 [4:38:48<21:39:51, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 18%|█▊ | 2183/12384 [4:38:48<21:39:58, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 18%|█▊ | 2183/12384 [4:38:55<21:39:58, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 18%|█▊ | 2184/12384 [4:38:55<21:38:03, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 18%|█▊ | 2184/12384 [4:39:03<21:38:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.28s]
Epoch 0: 18%|█▊ | 2185/12384 [4:39:03<21:40:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.28s]
Epoch 0: 18%|█▊ | 2185/12384 [4:39:11<21:40:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.07s]
Epoch 0: 18%|█▊ | 2186/12384 [4:39:11<21:40:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.07s]
Epoch 0: 18%|█▊ | 2186/12384 [4:39:18<21:40:27, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.68s]
Epoch 0: 18%|█▊ | 2187/12384 [4:39:18<21:40:42, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.68s]
Epoch 0: 18%|█▊ | 2187/12384 [4:39:26<21:40:42, 7.65s/it, loss=0.0001, acc=0.9999, iter_time=7.34s]
Epoch 0: 18%|█▊ | 2188/12384 [4:39:26<21:37:58, 7.64s/it, loss=0.0001, acc=0.9999, iter_time=7.34s]
Epoch 0: 18%|█▊ | 2188/12384 [4:39:34<21:37:58, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=7.93s]
Epoch 0: 18%|█▊ | 2189/12384 [4:39:34<21:38:05, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=7.93s]
Epoch 0: 18%|█▊ | 2189/12384 [4:39:42<21:38:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 18%|█▊ | 2190/12384 [4:39:42<21:54:50, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 18%|█▊ | 2190/12384 [4:39:50<21:54:50, 7.74s/it, loss=0.0004, acc=0.9997, iter_time=7.70s]
Epoch 0: 18%|█▊ | 2191/12384 [4:39:50<22:08:02, 7.82s/it, loss=0.0004, acc=0.9997, iter_time=7.70s]
Epoch 0: 18%|█▊ | 2191/12384 [4:39:57<22:08:02, 7.82s/it, loss=0.0001, acc=1.0000, iter_time=8.30s]
Epoch 0: 18%|█▊ | 2192/12384 [4:39:57<21:57:58, 7.76s/it, loss=0.0001, acc=1.0000, iter_time=8.30s]
Epoch 0: 18%|█▊ | 2192/12384 [4:40:05<21:57:58, 7.76s/it, loss=0.0007, acc=0.9980, iter_time=7.22s]
Epoch 0: 18%|█▊ | 2193/12384 [4:40:05<21:50:08, 7.71s/it, loss=0.0007, acc=0.9980, iter_time=7.22s]
Epoch 0: 18%|█▊ | 2193/12384 [4:40:13<21:50:08, 7.71s/it, loss=0.0011, acc=0.9981, iter_time=7.73s]
Epoch 0: 18%|█▊ | 2194/12384 [4:40:13<21:50:29, 7.72s/it, loss=0.0011, acc=0.9981, iter_time=7.73s]
Epoch 0: 18%|█▊ | 2194/12384 [4:40:20<21:50:29, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=7.37s]
Epoch 0: 18%|█▊ | 2195/12384 [4:40:20<21:46:19, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.37s]
Epoch 0: 18%|█▊ | 2195/12384 [4:40:28<21:46:19, 7.69s/it, loss=0.0003, acc=0.9998, iter_time=8.00s]
Epoch 0: 18%|█▊ | 2196/12384 [4:40:28<21:48:29, 7.71s/it, loss=0.0003, acc=0.9998, iter_time=8.00s]
Epoch 0: 18%|█▊ | 2196/12384 [4:40:36<21:48:29, 7.71s/it, loss=0.0006, acc=0.9979, iter_time=7.38s]
Epoch 0: 18%|█▊ | 2197/12384 [4:40:36<21:46:45, 7.70s/it, loss=0.0006, acc=0.9979, iter_time=7.38s]
Epoch 0: 18%|█▊ | 2197/12384 [4:40:43<21:46:45, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 0: 18%|█▊ | 2198/12384 [4:40:43<21:43:46, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 0: 18%|█▊ | 2198/12384 [4:40:51<21:43:46, 7.68s/it, loss=0.0016, acc=0.9944, iter_time=9.44s]
Epoch 0: 18%|█▊ | 2199/12384 [4:40:51<21:43:20, 7.68s/it, loss=0.0016, acc=0.9944, iter_time=9.44s]
Epoch 0: 18%|█▊ | 2199/12384 [4:40:59<21:43:20, 7.68s/it, loss=0.0012, acc=0.9976, iter_time=8.11s]
Epoch 0: 18%|█▊ | 2200/12384 [4:40:59<21:44:59, 7.69s/it, loss=0.0012, acc=0.9976, iter_time=8.11s]
Epoch 0: 18%|█▊ | 2200/12384 [4:41:06<21:44:59, 7.69s/it, loss=0.0014, acc=0.9973, iter_time=7.21s]
Epoch 0: 18%|█▊ | 2201/12384 [4:41:06<21:44:30, 7.69s/it, loss=0.0014, acc=0.9973, iter_time=7.21s]
Epoch 0: 18%|█▊ | 2201/12384 [4:41:14<21:44:30, 7.69s/it, loss=0.0003, acc=1.0000, iter_time=6.56s]
Epoch 0: 18%|█▊ | 2202/12384 [4:41:14<21:39:51, 7.66s/it, loss=0.0003, acc=1.0000, iter_time=6.56s]
Epoch 0: 18%|█▊ | 2202/12384 [4:41:22<21:39:51, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 0: 18%|█▊ | 2203/12384 [4:41:22<21:39:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 0: 18%|█▊ | 2203/12384 [4:41:29<21:39:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 18%|█▊ | 2204/12384 [4:41:29<21:39:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 18%|█▊ | 2204/12384 [4:41:37<21:39:33, 7.66s/it, loss=0.0005, acc=0.9973, iter_time=9.95s]
Epoch 0: 18%|█▊ | 2205/12384 [4:41:37<21:35:58, 7.64s/it, loss=0.0005, acc=0.9973, iter_time=9.95s]
Epoch 0: 18%|█▊ | 2205/12384 [4:41:45<21:35:58, 7.64s/it, loss=0.0030, acc=0.9909, iter_time=7.67s]
Epoch 0: 18%|█▊ | 2206/12384 [4:41:45<21:37:03, 7.65s/it, loss=0.0030, acc=0.9909, iter_time=7.67s]
Epoch 0: 18%|█▊ | 2206/12384 [4:41:52<21:37:03, 7.65s/it, loss=0.0005, acc=0.9997, iter_time=7.60s]
Epoch 0: 18%|█▊ | 2207/12384 [4:41:52<21:40:48, 7.67s/it, loss=0.0005, acc=0.9997, iter_time=7.60s]
Epoch 0: 18%|█▊ | 2207/12384 [4:42:00<21:40:48, 7.67s/it, loss=0.0014, acc=0.9955, iter_time=8.14s]
Epoch 0: 18%|█▊ | 2208/12384 [4:42:00<21:40:57, 7.67s/it, loss=0.0014, acc=0.9955, iter_time=8.14s]
Epoch 0: 18%|█▊ | 2208/12384 [4:42:08<21:40:57, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=5.47s]
Epoch 0: 18%|█▊ | 2209/12384 [4:42:08<21:36:39, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=5.47s]
Epoch 0: 18%|█▊ | 2209/12384 [4:42:15<21:36:39, 7.65s/it, loss=0.0006, acc=0.9974, iter_time=6.36s]
Epoch 0: 18%|█▊ | 2210/12384 [4:42:15<21:36:30, 7.65s/it, loss=0.0006, acc=0.9974, iter_time=6.36s]
Epoch 0: 18%|█▊ | 2210/12384 [4:42:23<21:36:30, 7.65s/it, loss=0.0007, acc=0.9986, iter_time=10.68s]
Epoch 0: 18%|█▊ | 2211/12384 [4:42:23<21:36:44, 7.65s/it, loss=0.0007, acc=0.9986, iter_time=10.68s]
Epoch 0: 18%|█▊ | 2211/12384 [4:42:31<21:36:44, 7.65s/it, loss=0.0003, acc=0.9997, iter_time=7.63s]
Epoch 0: 18%|█▊ | 2212/12384 [4:42:31<21:37:47, 7.66s/it, loss=0.0003, acc=0.9997, iter_time=7.63s]
Epoch 0: 18%|█▊ | 2212/12384 [4:42:38<21:37:47, 7.66s/it, loss=0.0005, acc=0.9996, iter_time=7.71s]
Epoch 0: 18%|█▊ | 2213/12384 [4:42:38<21:36:29, 7.65s/it, loss=0.0005, acc=0.9996, iter_time=7.71s]
Epoch 0: 18%|█▊ | 2213/12384 [4:42:46<21:36:29, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=6.67s]
Epoch 0: 18%|█▊ | 2214/12384 [4:42:46<21:34:42, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=6.67s]
Epoch 0: 18%|█▊ | 2214/12384 [4:42:54<21:34:42, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.88s]
Epoch 0: 18%|█▊ | 2215/12384 [4:42:54<21:49:18, 7.73s/it, loss=0.0001, acc=1.0000, iter_time=8.88s]
Epoch 0: 18%|█▊ | 2215/12384 [4:43:01<21:49:18, 7.73s/it, loss=0.0009, acc=0.9983, iter_time=8.01s]
Epoch 0: 18%|█▊ | 2216/12384 [4:43:01<21:44:36, 7.70s/it, loss=0.0009, acc=0.9983, iter_time=8.01s]
Epoch 0: 18%|█▊ | 2216/12384 [4:43:09<21:44:36, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=6.32s]
Epoch 0: 18%|█▊ | 2217/12384 [4:43:09<21:55:17, 7.76s/it, loss=0.0001, acc=1.0000, iter_time=6.32s]
Epoch 0: 18%|█▊ | 2217/12384 [4:43:17<21:55:17, 7.76s/it, loss=0.0009, acc=0.9967, iter_time=6.73s]
Epoch 0: 18%|█▊ | 2218/12384 [4:43:17<21:48:50, 7.72s/it, loss=0.0009, acc=0.9967, iter_time=6.73s]
Epoch 0: 18%|█▊ | 2218/12384 [4:43:25<21:48:50, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=8.77s]
Epoch 0: 18%|█▊ | 2219/12384 [4:43:25<21:44:53, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=8.77s]
Epoch 0: 18%|█▊ | 2219/12384 [4:43:32<21:44:53, 7.70s/it, loss=0.0004, acc=1.0000, iter_time=5.84s]
Epoch 0: 18%|█▊ | 2220/12384 [4:43:32<21:40:11, 7.68s/it, loss=0.0004, acc=1.0000, iter_time=5.84s]
Epoch 0: 18%|█▊ | 2220/12384 [4:43:40<21:40:11, 7.68s/it, loss=0.0004, acc=0.9984, iter_time=7.37s]
Epoch 0: 18%|█▊ | 2221/12384 [4:43:40<21:39:00, 7.67s/it, loss=0.0004, acc=0.9984, iter_time=7.37s]
Epoch 0: 18%|█▊ | 2221/12384 [4:43:47<21:39:00, 7.67s/it, loss=0.0001, acc=0.9998, iter_time=8.32s]
Epoch 0: 18%|█▊ | 2222/12384 [4:43:47<21:35:13, 7.65s/it, loss=0.0001, acc=0.9998, iter_time=8.32s]
Epoch 0: 18%|█▊ | 2222/12384 [4:43:55<21:35:13, 7.65s/it, loss=0.0007, acc=0.9979, iter_time=9.00s]
Epoch 0: 18%|█▊ | 2223/12384 [4:43:55<21:34:17, 7.64s/it, loss=0.0007, acc=0.9979, iter_time=9.00s]
Epoch 0: 18%|█▊ | 2223/12384 [4:44:03<21:34:17, 7.64s/it, loss=0.0005, acc=1.0000, iter_time=8.93s]
Epoch 0: 18%|█▊ | 2224/12384 [4:44:03<21:32:19, 7.63s/it, loss=0.0005, acc=1.0000, iter_time=8.93s]
Epoch 0: 18%|█▊ | 2224/12384 [4:44:10<21:32:19, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.24s]
Epoch 0: 18%|█▊ | 2225/12384 [4:44:10<21:30:39, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=7.24s]
Epoch 0: 18%|█▊ | 2225/12384 [4:44:18<21:30:39, 7.62s/it, loss=0.0005, acc=0.9984, iter_time=6.77s]
Epoch 0: 18%|█▊ | 2226/12384 [4:44:18<21:31:37, 7.63s/it, loss=0.0005, acc=0.9984, iter_time=6.77s]
Epoch 0: 18%|█▊ | 2226/12384 [4:44:26<21:31:37, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.51s]
Epoch 0: 18%|█▊ | 2227/12384 [4:44:26<21:32:23, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.51s]
Epoch 0: 18%|█▊ | 2227/12384 [4:44:33<21:32:23, 7.63s/it, loss=0.0003, acc=0.9998, iter_time=6.41s]
Epoch 0: 18%|█▊ | 2228/12384 [4:44:33<21:30:06, 7.62s/it, loss=0.0003, acc=0.9998, iter_time=6.41s]
Epoch 0: 18%|█▊ | 2228/12384 [4:44:41<21:30:06, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.43s]
Epoch 0: 18%|█▊ | 2229/12384 [4:44:41<21:32:32, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=5.43s]
Epoch 0: 18%|█▊ | 2229/12384 [4:44:48<21:32:32, 7.64s/it, loss=0.0005, acc=0.9975, iter_time=7.29s]
Epoch 0: 18%|█▊ | 2230/12384 [4:44:48<21:30:19, 7.62s/it, loss=0.0005, acc=0.9975, iter_time=7.29s]
Epoch 0: 18%|█▊ | 2230/12384 [4:44:56<21:30:19, 7.62s/it, loss=0.0006, acc=0.9988, iter_time=11.35s]
Epoch 0: 18%|█▊ | 2231/12384 [4:44:56<21:29:02, 7.62s/it, loss=0.0006, acc=0.9988, iter_time=11.35s]
Epoch 0: 18%|█▊ | 2231/12384 [4:45:04<21:29:02, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.56s]
Epoch 0: 18%|█▊ | 2232/12384 [4:45:04<21:29:15, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.56s]
Epoch 0: 18%|█▊ | 2232/12384 [4:45:11<21:29:15, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 18%|█▊ | 2233/12384 [4:45:11<21:30:28, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 18%|█▊ | 2233/12384 [4:45:19<21:30:28, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.22s]
Epoch 0: 18%|█▊ | 2234/12384 [4:45:19<21:31:07, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.22s]
Epoch 0: 18%|█▊ | 2234/12384 [4:45:26<21:31:07, 7.63s/it, loss=0.0007, acc=0.9986, iter_time=9.10s]
Epoch 0: 18%|█▊ | 2235/12384 [4:45:26<21:29:50, 7.63s/it, loss=0.0007, acc=0.9986, iter_time=9.10s]
Epoch 0: 18%|█▊ | 2235/12384 [4:45:34<21:29:50, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.10s]
Epoch 0: 18%|█▊ | 2236/12384 [4:45:34<21:29:50, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.10s]
Epoch 0: 18%|█▊ | 2236/12384 [4:45:42<21:29:50, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.12s]
Epoch 0: 18%|█▊ | 2237/12384 [4:45:42<21:29:56, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.12s]
Epoch 0: 18%|█▊ | 2237/12384 [4:45:49<21:29:56, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 18%|█▊ | 2238/12384 [4:45:49<21:28:40, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 18%|█▊ | 2238/12384 [4:45:57<21:28:40, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 18%|█▊ | 2239/12384 [4:45:57<21:30:23, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 18%|█▊ | 2239/12384 [4:46:05<21:30:23, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=8.07s]
Epoch 0: 18%|█▊ | 2240/12384 [4:46:05<21:33:58, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=8.07s]
Epoch 0: 18%|█▊ | 2240/12384 [4:46:13<21:33:58, 7.65s/it, loss=0.0004, acc=0.9985, iter_time=7.55s]
Epoch 0: 18%|█▊ | 2241/12384 [4:46:13<21:44:06, 7.71s/it, loss=0.0004, acc=0.9985, iter_time=7.55s]
Epoch 0: 18%|█▊ | 2241/12384 [4:46:20<21:44:06, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 18%|█▊ | 2242/12384 [4:46:20<21:39:20, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 18%|█▊ | 2242/12384 [4:46:28<21:39:20, 7.69s/it, loss=0.0002, acc=1.0000, iter_time=4.26s]
Epoch 0: 18%|█▊ | 2243/12384 [4:46:28<21:54:36, 7.78s/it, loss=0.0002, acc=1.0000, iter_time=4.26s]
Epoch 0: 18%|█▊ | 2243/12384 [4:46:36<21:54:36, 7.78s/it, loss=0.0005, acc=0.9990, iter_time=8.81s]
Epoch 0: 18%|█▊ | 2244/12384 [4:46:36<21:48:11, 7.74s/it, loss=0.0005, acc=0.9990, iter_time=8.81s]
Epoch 0: 18%|█▊ | 2244/12384 [4:46:43<21:48:11, 7.74s/it, loss=0.0002, acc=1.0000, iter_time=7.64s]
Epoch 0: 18%|█▊ | 2245/12384 [4:46:43<21:41:26, 7.70s/it, loss=0.0002, acc=1.0000, iter_time=7.64s]
Epoch 0: 18%|█▊ | 2245/12384 [4:46:51<21:41:26, 7.70s/it, loss=0.0001, acc=0.9998, iter_time=10.15s]
Epoch 0: 18%|█▊ | 2246/12384 [4:46:51<21:37:38, 7.68s/it, loss=0.0001, acc=0.9998, iter_time=10.15s]
Epoch 0: 18%|█▊ | 2246/12384 [4:46:59<21:37:38, 7.68s/it, loss=0.0066, acc=0.9912, iter_time=5.38s]
Epoch 0: 18%|█▊ | 2247/12384 [4:46:59<21:32:38, 7.65s/it, loss=0.0066, acc=0.9912, iter_time=5.38s]
Epoch 0: 18%|█▊ | 2247/12384 [4:47:06<21:32:38, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=9.81s]
Epoch 0: 18%|█▊ | 2248/12384 [4:47:06<21:31:43, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=9.81s]
Epoch 0: 18%|█▊ | 2248/12384 [4:47:14<21:31:43, 7.65s/it, loss=0.0009, acc=0.9975, iter_time=5.89s]
Epoch 0: 18%|█▊ | 2249/12384 [4:47:14<21:28:42, 7.63s/it, loss=0.0009, acc=0.9975, iter_time=5.89s]
Epoch 0: 18%|█▊ | 2249/12384 [4:47:22<21:28:42, 7.63s/it, loss=0.0020, acc=0.9934, iter_time=9.76s]
Epoch 0: 18%|█▊ | 2250/12384 [4:47:22<21:27:40, 7.62s/it, loss=0.0020, acc=0.9934, iter_time=9.76s]
Epoch 0: 18%|█▊ | 2250/12384 [4:47:29<21:27:40, 7.62s/it, loss=0.0006, acc=0.9995, iter_time=7.20s]
Epoch 0: 18%|█▊ | 2251/12384 [4:47:29<21:26:48, 7.62s/it, loss=0.0006, acc=0.9995, iter_time=7.20s]
Epoch 0: 18%|█▊ | 2251/12384 [4:47:37<21:26:48, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.50s]
Epoch 0: 18%|█▊ | 2252/12384 [4:47:37<21:26:24, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.50s]
Epoch 0: 18%|█▊ | 2252/12384 [4:47:44<21:26:24, 7.62s/it, loss=0.0002, acc=0.9983, iter_time=7.16s]
Epoch 0: 18%|█▊ | 2253/12384 [4:47:44<21:28:18, 7.63s/it, loss=0.0002, acc=0.9983, iter_time=7.16s]
Epoch 0: 18%|█▊ | 2253/12384 [4:47:52<21:28:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.23s]
Epoch 0: 18%|█▊ | 2254/12384 [4:47:52<21:28:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.23s]
Epoch 0: 18%|█▊ | 2254/12384 [4:48:00<21:28:44, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 18%|█▊ | 2255/12384 [4:48:00<21:29:32, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 18%|█▊ | 2255/12384 [4:48:07<21:29:32, 7.64s/it, loss=0.0003, acc=0.9988, iter_time=7.63s]
Epoch 0: 18%|█▊ | 2256/12384 [4:48:07<21:29:38, 7.64s/it, loss=0.0003, acc=0.9988, iter_time=7.63s]
Epoch 0: 18%|█▊ | 2256/12384 [4:48:15<21:29:38, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.67s]
Epoch 0: 18%|█▊ | 2257/12384 [4:48:15<21:29:50, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.67s]
Epoch 0: 18%|█▊ | 2257/12384 [4:48:23<21:29:50, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=5.60s]
Epoch 0: 18%|█▊ | 2258/12384 [4:48:23<21:29:59, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=5.60s]
Epoch 0: 18%|█▊ | 2258/12384 [4:48:30<21:29:59, 7.64s/it, loss=0.0007, acc=0.9986, iter_time=8.48s]
Epoch 0: 18%|█▊ | 2259/12384 [4:48:30<21:29:52, 7.64s/it, loss=0.0007, acc=0.9986, iter_time=8.48s]
Epoch 0: 18%|█▊ | 2259/12384 [4:48:38<21:29:52, 7.64s/it, loss=0.0001, acc=0.9999, iter_time=8.86s]
Epoch 0: 18%|█▊ | 2260/12384 [4:48:38<21:32:33, 7.66s/it, loss=0.0001, acc=0.9999, iter_time=8.86s]
Epoch 0: 18%|█▊ | 2260/12384 [4:48:46<21:32:33, 7.66s/it, loss=0.0004, acc=0.9980, iter_time=7.10s]
Epoch 0: 18%|█▊ | 2261/12384 [4:48:46<21:29:07, 7.64s/it, loss=0.0004, acc=0.9980, iter_time=7.10s]
Epoch 0: 18%|█▊ | 2261/12384 [4:48:53<21:29:07, 7.64s/it, loss=0.0016, acc=0.9958, iter_time=8.20s]
Epoch 0: 18%|█▊ | 2262/12384 [4:48:53<21:30:14, 7.65s/it, loss=0.0016, acc=0.9958, iter_time=8.20s]
Epoch 0: 18%|█▊ | 2262/12384 [4:49:01<21:30:14, 7.65s/it, loss=0.0007, acc=0.9979, iter_time=7.67s]
Epoch 0: 18%|█▊ | 2263/12384 [4:49:01<21:28:34, 7.64s/it, loss=0.0007, acc=0.9979, iter_time=7.67s]
Epoch 0: 18%|█▊ | 2263/12384 [4:49:09<21:28:34, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 18%|█▊ | 2264/12384 [4:49:09<21:30:08, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 18%|█▊ | 2264/12384 [4:49:16<21:30:08, 7.65s/it, loss=0.0011, acc=0.9992, iter_time=7.64s]
Epoch 0: 18%|█▊ | 2265/12384 [4:49:16<21:29:26, 7.65s/it, loss=0.0011, acc=0.9992, iter_time=7.64s]
Epoch 0: 18%|█▊ | 2265/12384 [4:49:24<21:29:26, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.79s]
Epoch 0: 18%|█▊ | 2266/12384 [4:49:24<21:36:01, 7.69s/it, loss=0.0002, acc=1.0000, iter_time=7.79s]
Epoch 0: 18%|█▊ | 2266/12384 [4:49:32<21:36:01, 7.69s/it, loss=0.0004, acc=1.0000, iter_time=7.97s]
Epoch 0: 18%|█▊ | 2267/12384 [4:49:32<21:47:48, 7.76s/it, loss=0.0004, acc=1.0000, iter_time=7.97s]
Epoch 0: 18%|█▊ | 2267/12384 [4:49:40<21:47:48, 7.76s/it, loss=0.0003, acc=0.9999, iter_time=7.63s]
Epoch 0: 18%|█▊ | 2268/12384 [4:49:40<21:42:53, 7.73s/it, loss=0.0003, acc=0.9999, iter_time=7.63s]
Epoch 0: 18%|█▊ | 2268/12384 [4:49:47<21:42:53, 7.73s/it, loss=0.0001, acc=1.0000, iter_time=7.67s]
Epoch 0: 18%|█▊ | 2269/12384 [4:49:47<21:55:18, 7.80s/it, loss=0.0001, acc=1.0000, iter_time=7.67s]
Epoch 0: 18%|█▊ | 2269/12384 [4:49:55<21:55:18, 7.80s/it, loss=0.0002, acc=1.0000, iter_time=7.97s]
Epoch 0: 18%|█▊ | 2270/12384 [4:49:55<21:47:44, 7.76s/it, loss=0.0002, acc=1.0000, iter_time=7.97s]
Epoch 0: 18%|█▊ | 2270/12384 [4:50:03<21:47:44, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 18%|█▊ | 2271/12384 [4:50:03<21:42:31, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 18%|█▊ | 2271/12384 [4:50:11<21:42:31, 7.73s/it, loss=0.0003, acc=0.9994, iter_time=8.14s]
Epoch 0: 18%|█▊ | 2272/12384 [4:50:11<21:42:18, 7.73s/it, loss=0.0003, acc=0.9994, iter_time=8.14s]
Epoch 0: 18%|█▊ | 2272/12384 [4:50:18<21:42:18, 7.73s/it, loss=0.0004, acc=0.9979, iter_time=5.46s]
Epoch 0: 18%|█▊ | 2273/12384 [4:50:18<21:38:59, 7.71s/it, loss=0.0004, acc=0.9979, iter_time=5.46s]
Epoch 0: 18%|█▊ | 2273/12384 [4:50:26<21:38:59, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=9.45s]
Epoch 0: 18%|█▊ | 2274/12384 [4:50:26<21:34:56, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=9.45s]
Epoch 0: 18%|█▊ | 2274/12384 [4:50:33<21:34:56, 7.69s/it, loss=0.0010, acc=0.9974, iter_time=7.64s]
Epoch 0: 18%|█▊ | 2275/12384 [4:50:33<21:33:07, 7.68s/it, loss=0.0010, acc=0.9974, iter_time=7.64s]
Epoch 0: 18%|█▊ | 2275/12384 [4:50:41<21:33:07, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.68s]
Epoch 0: 18%|█▊ | 2276/12384 [4:50:41<21:31:07, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.68s]
Epoch 0: 18%|█▊ | 2276/12384 [4:50:49<21:31:07, 7.66s/it, loss=0.0016, acc=0.9981, iter_time=7.63s]
Epoch 0: 18%|█▊ | 2277/12384 [4:50:49<21:29:50, 7.66s/it, loss=0.0016, acc=0.9981, iter_time=7.63s]
Epoch 0: 18%|█▊ | 2277/12384 [4:50:56<21:29:50, 7.66s/it, loss=0.0013, acc=0.9951, iter_time=7.61s]
Epoch 0: 18%|█▊ | 2278/12384 [4:50:56<21:34:00, 7.68s/it, loss=0.0013, acc=0.9951, iter_time=7.61s]
Epoch 0: 18%|█▊ | 2278/12384 [4:51:04<21:34:00, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=4.68s]
Epoch 0: 18%|█▊ | 2279/12384 [4:51:04<21:29:43, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=4.68s]
Epoch 0: 18%|█▊ | 2279/12384 [4:51:12<21:29:43, 7.66s/it, loss=0.0035, acc=0.9906, iter_time=11.05s]
Epoch 0: 18%|█▊ | 2280/12384 [4:51:12<21:29:42, 7.66s/it, loss=0.0035, acc=0.9906, iter_time=11.05s]
Epoch 0: 18%|█▊ | 2280/12384 [4:51:19<21:29:42, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=5.82s]
Epoch 0: 18%|█▊ | 2281/12384 [4:51:19<21:27:37, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=5.82s]
Epoch 0: 18%|█▊ | 2281/12384 [4:51:27<21:27:37, 7.65s/it, loss=0.0004, acc=0.9998, iter_time=9.15s]
Epoch 0: 18%|█▊ | 2282/12384 [4:51:27<21:28:55, 7.66s/it, loss=0.0004, acc=0.9998, iter_time=9.15s]
Epoch 0: 18%|█▊ | 2282/12384 [4:51:35<21:28:55, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=6.68s]
Epoch 0: 18%|█▊ | 2283/12384 [4:51:35<21:27:38, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=6.68s]
Epoch 0: 18%|█▊ | 2283/12384 [4:51:42<21:27:38, 7.65s/it, loss=0.0005, acc=0.9997, iter_time=8.57s]
Epoch 0: 18%|█▊ | 2284/12384 [4:51:42<21:26:06, 7.64s/it, loss=0.0005, acc=0.9997, iter_time=8.57s]
Epoch 0: 18%|█▊ | 2284/12384 [4:51:50<21:26:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 18%|█▊ | 2285/12384 [4:51:50<21:24:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 18%|█▊ | 2285/12384 [4:51:58<21:24:48, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 18%|█▊ | 2286/12384 [4:51:58<21:23:37, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 18%|█▊ | 2286/12384 [4:52:05<21:23:37, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 18%|█▊ | 2287/12384 [4:52:05<21:23:10, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 18%|█▊ | 2287/12384 [4:52:13<21:23:10, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=8.00s]
Epoch 0: 18%|█▊ | 2288/12384 [4:52:13<21:27:05, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=8.00s]
Epoch 0: 18%|█▊ | 2288/12384 [4:52:20<21:27:05, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.32s]
Epoch 0: 18%|█▊ | 2289/12384 [4:52:20<21:25:36, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.32s]
Epoch 0: 18%|█▊ | 2289/12384 [4:52:28<21:25:36, 7.64s/it, loss=0.0002, acc=0.9998, iter_time=7.62s]
Epoch 0: 18%|█▊ | 2290/12384 [4:52:28<21:26:02, 7.64s/it, loss=0.0002, acc=0.9998, iter_time=7.62s]
Epoch 0: 18%|█▊ | 2290/12384 [4:52:36<21:26:02, 7.64s/it, loss=0.0002, acc=0.9984, iter_time=7.65s]
Epoch 0: 18%|█▊ | 2291/12384 [4:52:36<21:24:03, 7.63s/it, loss=0.0002, acc=0.9984, iter_time=7.65s]
Epoch 0: 18%|█▊ | 2291/12384 [4:52:43<21:24:03, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 19%|█▊ | 2292/12384 [4:52:43<21:25:58, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 19%|█▊ | 2292/12384 [4:52:51<21:25:58, 7.65s/it, loss=0.0006, acc=0.9990, iter_time=7.93s]
Epoch 0: 19%|█▊ | 2293/12384 [4:52:51<21:36:59, 7.71s/it, loss=0.0006, acc=0.9990, iter_time=7.93s]
Epoch 0: 19%|█▊ | 2293/12384 [4:52:59<21:36:59, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=5.29s]
Epoch 0: 19%|█▊ | 2294/12384 [4:52:59<21:33:13, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=5.29s]
Epoch 0: 19%|█▊ | 2294/12384 [4:53:07<21:33:13, 7.69s/it, loss=0.0012, acc=0.9977, iter_time=7.86s]
Epoch 0: 19%|█▊ | 2295/12384 [4:53:07<21:30:13, 7.67s/it, loss=0.0012, acc=0.9977, iter_time=7.86s]
Epoch 0: 19%|█▊ | 2295/12384 [4:53:15<21:30:13, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=10.01s]
Epoch 0: 19%|█▊ | 2296/12384 [4:53:15<21:44:10, 7.76s/it, loss=0.0001, acc=1.0000, iter_time=10.01s]
Epoch 0: 19%|█▊ | 2296/12384 [4:53:22<21:44:10, 7.76s/it, loss=0.0015, acc=0.9934, iter_time=5.40s]
Epoch 0: 19%|█▊ | 2297/12384 [4:53:22<21:43:18, 7.75s/it, loss=0.0015, acc=0.9934, iter_time=5.40s]
Epoch 0: 19%|█▊ | 2297/12384 [4:53:30<21:43:18, 7.75s/it, loss=0.0018, acc=0.9982, iter_time=10.10s]
Epoch 0: 19%|█▊ | 2298/12384 [4:53:30<21:40:11, 7.73s/it, loss=0.0018, acc=0.9982, iter_time=10.10s]
Epoch 0: 19%|█▊ | 2298/12384 [4:53:38<21:40:11, 7.73s/it, loss=0.0024, acc=0.9969, iter_time=7.60s]
Epoch 0: 19%|█▊ | 2299/12384 [4:53:38<21:33:48, 7.70s/it, loss=0.0024, acc=0.9969, iter_time=7.60s]
Epoch 0: 19%|█▊ | 2299/12384 [4:53:45<21:33:48, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=8.08s]
Epoch 0: 19%|█▊ | 2300/12384 [4:53:45<21:33:06, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=8.08s]
Epoch 0: 19%|█▊ | 2300/12384 [4:53:53<21:33:06, 7.69s/it, loss=0.0001, acc=0.9999, iter_time=7.22s]
Epoch 0: 19%|█▊ | 2301/12384 [4:53:53<21:29:27, 7.67s/it, loss=0.0001, acc=0.9999, iter_time=7.22s]
Epoch 0: 19%|█▊ | 2301/12384 [4:54:00<21:29:27, 7.67s/it, loss=0.0015, acc=0.9954, iter_time=7.63s]
Epoch 0: 19%|█▊ | 2302/12384 [4:54:00<21:27:41, 7.66s/it, loss=0.0015, acc=0.9954, iter_time=7.63s]
Epoch 0: 19%|█▊ | 2302/12384 [4:54:08<21:27:41, 7.66s/it, loss=0.0020, acc=0.9975, iter_time=5.92s]
Epoch 0: 19%|█▊ | 2303/12384 [4:54:08<21:27:25, 7.66s/it, loss=0.0020, acc=0.9975, iter_time=5.92s]
Epoch 0: 19%|█▊ | 2303/12384 [4:54:16<21:27:25, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=9.34s]
Epoch 0: 19%|█▊ | 2304/12384 [4:54:16<21:25:57, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=9.34s]
Epoch 0: 19%|█▊ | 2304/12384 [4:54:23<21:25:57, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=5.61s]
Epoch 0: 19%|█▊ | 2305/12384 [4:54:23<21:25:43, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=5.61s]
Epoch 0: 19%|█▊ | 2305/12384 [4:54:31<21:25:43, 7.65s/it, loss=0.0004, acc=0.9980, iter_time=9.09s]
Epoch 0: 19%|█▊ | 2306/12384 [4:54:31<21:25:05, 7.65s/it, loss=0.0004, acc=0.9980, iter_time=9.09s]
Epoch 0: 19%|█▊ | 2306/12384 [4:54:39<21:25:05, 7.65s/it, loss=0.0006, acc=0.9979, iter_time=5.26s]
Epoch 0: 19%|█▊ | 2307/12384 [4:54:39<21:24:44, 7.65s/it, loss=0.0006, acc=0.9979, iter_time=5.26s]
Epoch 0: 19%|█▊ | 2307/12384 [4:54:46<21:24:44, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.35s]
Epoch 0: 19%|█▊ | 2308/12384 [4:54:46<21:22:42, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.35s]
Epoch 0: 19%|█▊ | 2308/12384 [4:54:54<21:22:42, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=10.90s]
Epoch 0: 19%|█▊ | 2309/12384 [4:54:54<21:27:07, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=10.90s]
Epoch 0: 19%|█▊ | 2309/12384 [4:55:02<21:27:07, 7.67s/it, loss=0.0016, acc=0.9974, iter_time=6.88s]
Epoch 0: 19%|█▊ | 2310/12384 [4:55:02<21:25:48, 7.66s/it, loss=0.0016, acc=0.9974, iter_time=6.88s]
Epoch 0: 19%|█▊ | 2310/12384 [4:55:09<21:25:48, 7.66s/it, loss=0.0003, acc=1.0000, iter_time=8.61s]
Epoch 0: 19%|█▊ | 2311/12384 [4:55:09<21:31:32, 7.69s/it, loss=0.0003, acc=1.0000, iter_time=8.61s]
Epoch 0: 19%|█▊ | 2311/12384 [4:55:17<21:31:32, 7.69s/it, loss=0.0003, acc=1.0000, iter_time=8.12s]
Epoch 0: 19%|█▊ | 2312/12384 [4:55:17<21:30:30, 7.69s/it, loss=0.0003, acc=1.0000, iter_time=8.12s]
Epoch 0: 19%|█▊ | 2312/12384 [4:55:25<21:30:30, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.35s]
Epoch 0: 19%|█▊ | 2313/12384 [4:55:25<21:33:02, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.35s]
Epoch 0: 19%|█▊ | 2313/12384 [4:55:33<21:33:02, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=6.77s]
Epoch 0: 19%|█▊ | 2314/12384 [4:55:33<21:28:22, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=6.77s]
Epoch 0: 19%|█▊ | 2314/12384 [4:55:40<21:28:22, 7.68s/it, loss=0.0019, acc=0.9907, iter_time=7.54s]
Epoch 0: 19%|█▊ | 2315/12384 [4:55:40<21:25:45, 7.66s/it, loss=0.0019, acc=0.9907, iter_time=7.54s]
Epoch 0: 19%|█▊ | 2315/12384 [4:55:48<21:25:45, 7.66s/it, loss=0.0008, acc=0.9979, iter_time=6.53s]
Epoch 0: 19%|█▊ | 2316/12384 [4:55:48<21:24:27, 7.65s/it, loss=0.0008, acc=0.9979, iter_time=6.53s]
Epoch 0: 19%|█▊ | 2316/12384 [4:55:55<21:24:27, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 19%|█▊ | 2317/12384 [4:55:55<21:24:17, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 19%|█▊ | 2317/12384 [4:56:03<21:24:17, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=6.51s]
Epoch 0: 19%|█▊ | 2318/12384 [4:56:03<21:23:30, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=6.51s]
Epoch 0: 19%|█▊ | 2318/12384 [4:56:11<21:23:30, 7.65s/it, loss=0.0004, acc=0.9988, iter_time=7.80s]
Epoch 0: 19%|█▊ | 2319/12384 [4:56:11<21:24:04, 7.65s/it, loss=0.0004, acc=0.9988, iter_time=7.80s]
Epoch 0: 19%|█▊ | 2319/12384 [4:56:18<21:24:04, 7.65s/it, loss=0.0008, acc=0.9978, iter_time=10.66s]
Epoch 0: 19%|█▊ | 2320/12384 [4:56:18<21:22:23, 7.65s/it, loss=0.0008, acc=0.9978, iter_time=10.66s]
Epoch 0: 19%|█▊ | 2320/12384 [4:56:26<21:22:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 19%|█▊ | 2321/12384 [4:56:26<21:19:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 19%|█▊ | 2321/12384 [4:56:34<21:19:55, 7.63s/it, loss=0.0013, acc=0.9958, iter_time=7.65s]
Epoch 0: 19%|█▉ | 2322/12384 [4:56:34<21:37:44, 7.74s/it, loss=0.0013, acc=0.9958, iter_time=7.65s]
Epoch 0: 19%|█▉ | 2322/12384 [4:56:42<21:37:44, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 0: 19%|█▉ | 2323/12384 [4:56:42<21:33:08, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 0: 19%|█▉ | 2323/12384 [4:56:49<21:33:08, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=9.71s]
Epoch 0: 19%|█▉ | 2324/12384 [4:56:49<21:28:52, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=9.71s]
Epoch 0: 19%|█▉ | 2324/12384 [4:56:57<21:28:52, 7.69s/it, loss=0.0005, acc=0.9998, iter_time=7.65s]
Epoch 0: 19%|█▉ | 2325/12384 [4:56:57<21:27:37, 7.68s/it, loss=0.0005, acc=0.9998, iter_time=7.65s]
Epoch 0: 19%|█▉ | 2325/12384 [4:57:05<21:27:37, 7.68s/it, loss=0.0008, acc=0.9973, iter_time=7.64s]
Epoch 0: 19%|█▉ | 2326/12384 [4:57:05<21:24:47, 7.66s/it, loss=0.0008, acc=0.9973, iter_time=7.64s]
Epoch 0: 19%|█▉ | 2326/12384 [4:57:12<21:24:47, 7.66s/it, loss=0.0002, acc=0.9998, iter_time=7.64s]
Epoch 0: 19%|█▉ | 2327/12384 [4:57:12<21:23:06, 7.66s/it, loss=0.0002, acc=0.9998, iter_time=7.64s]
Epoch 0: 19%|█▉ | 2327/12384 [4:57:20<21:23:06, 7.66s/it, loss=0.0011, acc=0.9985, iter_time=8.04s]
Epoch 0: 19%|█▉ | 2328/12384 [4:57:20<21:21:41, 7.65s/it, loss=0.0011, acc=0.9985, iter_time=8.04s]
Epoch 0: 19%|█▉ | 2328/12384 [4:57:27<21:21:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.74s]
Epoch 0: 19%|█▉ | 2329/12384 [4:57:27<21:19:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.74s]
Epoch 0: 19%|█▉ | 2329/12384 [4:57:35<21:19:25, 7.63s/it, loss=0.0002, acc=0.9999, iter_time=9.09s]
Epoch 0: 19%|█▉ | 2330/12384 [4:57:35<21:19:03, 7.63s/it, loss=0.0002, acc=0.9999, iter_time=9.09s]
Epoch 0: 19%|█▉ | 2330/12384 [4:57:43<21:19:03, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 19%|█▉ | 2331/12384 [4:57:43<21:20:29, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 19%|█▉ | 2331/12384 [4:57:50<21:20:29, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 19%|█▉ | 2332/12384 [4:57:50<21:19:35, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 19%|█▉ | 2332/12384 [4:57:58<21:19:35, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.71s]
Epoch 0: 19%|█▉ | 2333/12384 [4:57:58<21:17:19, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.71s]
Epoch 0: 19%|█▉ | 2333/12384 [4:58:06<21:17:19, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=6.44s]
Epoch 0: 19%|█▉ | 2334/12384 [4:58:06<21:17:23, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=6.44s]
Epoch 0: 19%|█▉ | 2334/12384 [4:58:13<21:17:23, 7.63s/it, loss=0.0017, acc=0.9957, iter_time=9.73s]
Epoch 0: 19%|█▉ | 2335/12384 [4:58:13<21:18:50, 7.64s/it, loss=0.0017, acc=0.9957, iter_time=9.73s]
Epoch 0: 19%|█▉ | 2335/12384 [4:58:21<21:18:50, 7.64s/it, loss=0.0010, acc=0.9963, iter_time=8.04s]
Epoch 0: 19%|█▉ | 2336/12384 [4:58:21<21:17:24, 7.63s/it, loss=0.0010, acc=0.9963, iter_time=8.04s]
Epoch 0: 19%|█▉ | 2336/12384 [4:58:28<21:17:24, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=4.90s]
Epoch 0: 19%|█▉ | 2337/12384 [4:58:28<21:16:46, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=4.90s]
Epoch 0: 19%|█▉ | 2337/12384 [4:58:36<21:16:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 0: 19%|█▉ | 2338/12384 [4:58:36<21:15:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 0: 19%|█▉ | 2338/12384 [4:58:44<21:15:05, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 19%|█▉ | 2339/12384 [4:58:44<21:15:33, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 19%|█▉ | 2339/12384 [4:58:51<21:15:33, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=7.66s]
Epoch 0: 19%|█▉ | 2340/12384 [4:58:51<21:19:30, 7.64s/it, loss=0.0002, acc=0.9998, iter_time=7.66s]
Epoch 0: 19%|█▉ | 2340/12384 [4:58:59<21:19:30, 7.64s/it, loss=0.0006, acc=0.9978, iter_time=5.57s]
Epoch 0: 19%|█▉ | 2341/12384 [4:58:59<21:18:57, 7.64s/it, loss=0.0006, acc=0.9978, iter_time=5.57s]
Epoch 0: 19%|█▉ | 2341/12384 [4:59:07<21:18:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.20s]
Epoch 0: 19%|█▉ | 2342/12384 [4:59:07<21:18:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.20s]
Epoch 0: 19%|█▉ | 2342/12384 [4:59:14<21:18:42, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=11.16s]
Epoch 0: 19%|█▉ | 2343/12384 [4:59:14<21:18:15, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=11.16s]
Epoch 0: 19%|█▉ | 2343/12384 [4:59:22<21:18:15, 7.64s/it, loss=0.0004, acc=0.9991, iter_time=7.74s]
Epoch 0: 19%|█▉ | 2344/12384 [4:59:22<21:16:49, 7.63s/it, loss=0.0004, acc=0.9991, iter_time=7.74s]
Epoch 0: 19%|█▉ | 2344/12384 [4:59:30<21:16:49, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.51s]
Epoch 0: 19%|█▉ | 2345/12384 [4:59:30<21:17:13, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.51s]
Epoch 0: 19%|█▉ | 2345/12384 [4:59:37<21:17:13, 7.63s/it, loss=0.0011, acc=0.9975, iter_time=5.13s]
Epoch 0: 19%|█▉ | 2346/12384 [4:59:37<21:19:06, 7.65s/it, loss=0.0011, acc=0.9975, iter_time=5.13s]
Epoch 0: 19%|█▉ | 2346/12384 [4:59:45<21:19:06, 7.65s/it, loss=0.0004, acc=0.9974, iter_time=9.63s]
Epoch 0: 19%|█▉ | 2347/12384 [4:59:45<21:19:09, 7.65s/it, loss=0.0004, acc=0.9974, iter_time=9.63s]
Epoch 0: 19%|█▉ | 2347/12384 [4:59:53<21:19:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 0: 19%|█▉ | 2348/12384 [4:59:53<21:21:40, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 0: 19%|█▉ | 2348/12384 [5:00:00<21:21:40, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.67s]
Epoch 0: 19%|█▉ | 2349/12384 [5:00:00<21:36:16, 7.75s/it, loss=0.0002, acc=1.0000, iter_time=7.67s]
Epoch 0: 19%|█▉ | 2349/12384 [5:00:08<21:36:16, 7.75s/it, loss=0.0005, acc=0.9976, iter_time=8.32s]
Epoch 0: 19%|█▉ | 2350/12384 [5:00:08<21:30:21, 7.72s/it, loss=0.0005, acc=0.9976, iter_time=8.32s]
Epoch 0: 19%|█▉ | 2350/12384 [5:00:16<21:30:21, 7.72s/it, loss=0.0011, acc=0.9984, iter_time=7.22s]
Epoch 0: 19%|█▉ | 2351/12384 [5:00:16<21:28:06, 7.70s/it, loss=0.0011, acc=0.9984, iter_time=7.22s]
Epoch 0: 19%|█▉ | 2351/12384 [5:00:23<21:28:06, 7.70s/it, loss=0.0005, acc=0.9995, iter_time=8.07s]
Epoch 0: 19%|█▉ | 2352/12384 [5:00:23<21:25:13, 7.69s/it, loss=0.0005, acc=0.9995, iter_time=8.07s]
Epoch 0: 19%|█▉ | 2352/12384 [5:00:31<21:25:13, 7.69s/it, loss=0.0004, acc=0.9984, iter_time=3.07s]
Epoch 0: 19%|█▉ | 2353/12384 [5:00:31<21:21:58, 7.67s/it, loss=0.0004, acc=0.9984, iter_time=3.07s]
Epoch 0: 19%|█▉ | 2353/12384 [5:00:39<21:21:58, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=11.81s]
Epoch 0: 19%|█▉ | 2354/12384 [5:00:39<21:20:24, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=11.81s]
Epoch 0: 19%|█▉ | 2354/12384 [5:00:46<21:20:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 19%|█▉ | 2355/12384 [5:00:46<21:18:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 19%|█▉ | 2355/12384 [5:00:54<21:18:20, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 19%|█▉ | 2356/12384 [5:00:54<21:18:51, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 19%|█▉ | 2356/12384 [5:01:02<21:18:51, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.67s]
Epoch 0: 19%|█▉ | 2357/12384 [5:01:02<21:19:08, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.67s]
Epoch 0: 19%|█▉ | 2357/12384 [5:01:09<21:19:08, 7.65s/it, loss=0.0001, acc=0.9998, iter_time=4.61s]
Epoch 0: 19%|█▉ | 2358/12384 [5:01:09<21:18:45, 7.65s/it, loss=0.0001, acc=0.9998, iter_time=4.61s]
Epoch 0: 19%|█▉ | 2358/12384 [5:01:17<21:18:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 0: 19%|█▉ | 2359/12384 [5:01:17<21:17:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 0: 19%|█▉ | 2359/12384 [5:01:25<21:17:27, 7.65s/it, loss=0.0005, acc=0.9979, iter_time=7.60s]
Epoch 0: 19%|█▉ | 2360/12384 [5:01:25<21:16:47, 7.64s/it, loss=0.0005, acc=0.9979, iter_time=7.60s]
Epoch 0: 19%|█▉ | 2360/12384 [5:01:32<21:16:47, 7.64s/it, loss=0.0011, acc=0.9974, iter_time=7.65s]
Epoch 0: 19%|█▉ | 2361/12384 [5:01:32<21:16:42, 7.64s/it, loss=0.0011, acc=0.9974, iter_time=7.65s]
Epoch 0: 19%|█▉ | 2361/12384 [5:01:40<21:16:42, 7.64s/it, loss=0.0004, acc=1.0000, iter_time=7.65s]
Epoch 0: 19%|█▉ | 2362/12384 [5:01:40<21:16:44, 7.64s/it, loss=0.0004, acc=1.0000, iter_time=7.65s]
Epoch 0: 19%|█▉ | 2362/12384 [5:01:48<21:16:44, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 19%|█▉ | 2363/12384 [5:01:48<21:17:19, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 19%|█▉ | 2363/12384 [5:01:55<21:17:19, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.06s]
Epoch 0: 19%|█▉ | 2364/12384 [5:01:55<21:15:27, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.06s]
Epoch 0: 19%|█▉ | 2364/12384 [5:02:03<21:15:27, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.21s]
Epoch 0: 19%|█▉ | 2365/12384 [5:02:03<21:13:19, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.21s]
Epoch 0: 19%|█▉ | 2365/12384 [5:02:10<21:13:19, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 19%|█▉ | 2366/12384 [5:02:10<21:12:07, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 19%|█▉ | 2366/12384 [5:02:18<21:12:07, 7.62s/it, loss=0.0003, acc=0.9982, iter_time=4.48s]
Epoch 0: 19%|█▉ | 2367/12384 [5:02:18<21:12:28, 7.62s/it, loss=0.0003, acc=0.9982, iter_time=4.48s]
Epoch 0: 19%|█▉ | 2367/12384 [5:02:26<21:12:28, 7.62s/it, loss=0.0005, acc=0.9990, iter_time=11.14s]
Epoch 0: 19%|█▉ | 2368/12384 [5:02:26<21:12:17, 7.62s/it, loss=0.0005, acc=0.9990, iter_time=11.14s]
Epoch 0: 19%|█▉ | 2368/12384 [5:02:33<21:12:17, 7.62s/it, loss=0.0020, acc=0.9976, iter_time=7.25s]
Epoch 0: 19%|█▉ | 2369/12384 [5:02:33<21:12:20, 7.62s/it, loss=0.0020, acc=0.9976, iter_time=7.25s]
Epoch 0: 19%|█▉ | 2369/12384 [5:02:41<21:12:20, 7.62s/it, loss=0.0001, acc=0.9997, iter_time=7.64s]
Epoch 0: 19%|█▉ | 2370/12384 [5:02:41<21:14:17, 7.64s/it, loss=0.0001, acc=0.9997, iter_time=7.64s]
Epoch 0: 19%|█▉ | 2370/12384 [5:02:49<21:14:17, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 19%|█▉ | 2371/12384 [5:02:49<21:14:42, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 19%|█▉ | 2371/12384 [5:02:56<21:14:42, 7.64s/it, loss=0.0007, acc=0.9982, iter_time=5.65s]
Epoch 0: 19%|█▉ | 2372/12384 [5:02:56<21:13:50, 7.63s/it, loss=0.0007, acc=0.9982, iter_time=5.65s]
Epoch 0: 19%|█▉ | 2372/12384 [5:03:04<21:13:50, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.93s]
Epoch 0: 19%|█▉ | 2373/12384 [5:03:04<21:27:51, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=9.93s]
Epoch 0: 19%|█▉ | 2373/12384 [5:03:12<21:27:51, 7.72s/it, loss=0.0003, acc=1.0000, iter_time=7.63s]
Epoch 0: 19%|█▉ | 2374/12384 [5:03:12<21:25:48, 7.71s/it, loss=0.0003, acc=1.0000, iter_time=7.63s]
Epoch 0: 19%|█▉ | 2374/12384 [5:03:20<21:25:48, 7.71s/it, loss=0.0001, acc=0.9999, iter_time=6.51s]
Epoch 0: 19%|█▉ | 2375/12384 [5:03:20<21:41:27, 7.80s/it, loss=0.0001, acc=0.9999, iter_time=6.51s]
Epoch 0: 19%|█▉ | 2375/12384 [5:03:27<21:41:27, 7.80s/it, loss=0.0003, acc=1.0000, iter_time=9.15s]
Epoch 0: 19%|█▉ | 2376/12384 [5:03:27<21:33:40, 7.76s/it, loss=0.0003, acc=1.0000, iter_time=9.15s]
Epoch 0: 19%|█▉ | 2376/12384 [5:03:35<21:33:40, 7.76s/it, loss=0.0012, acc=0.9973, iter_time=5.66s]
Epoch 0: 19%|█▉ | 2377/12384 [5:03:35<21:28:43, 7.73s/it, loss=0.0012, acc=0.9973, iter_time=5.66s]
Epoch 0: 19%|█▉ | 2377/12384 [5:03:43<21:28:43, 7.73s/it, loss=0.0004, acc=0.9995, iter_time=9.66s]
Epoch 0: 19%|█▉ | 2378/12384 [5:03:43<21:25:21, 7.71s/it, loss=0.0004, acc=0.9995, iter_time=9.66s]
Epoch 0: 19%|█▉ | 2378/12384 [5:03:50<21:25:21, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 0: 19%|█▉ | 2379/12384 [5:03:50<21:25:01, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 0: 19%|█▉ | 2379/12384 [5:03:58<21:25:01, 7.71s/it, loss=0.0003, acc=0.9986, iter_time=6.77s]
Epoch 0: 19%|█▉ | 2380/12384 [5:03:58<21:21:22, 7.69s/it, loss=0.0003, acc=0.9986, iter_time=6.77s]
Epoch 0: 19%|█▉ | 2380/12384 [5:04:06<21:21:22, 7.69s/it, loss=0.0003, acc=0.9997, iter_time=8.58s]
Epoch 0: 19%|█▉ | 2381/12384 [5:04:06<21:19:21, 7.67s/it, loss=0.0003, acc=0.9997, iter_time=8.58s]
Epoch 0: 19%|█▉ | 2381/12384 [5:04:13<21:19:21, 7.67s/it, loss=0.0001, acc=0.9998, iter_time=6.43s]
Epoch 0: 19%|█▉ | 2382/12384 [5:04:13<21:17:16, 7.66s/it, loss=0.0001, acc=0.9998, iter_time=6.43s]
Epoch 0: 19%|█▉ | 2382/12384 [5:04:21<21:17:16, 7.66s/it, loss=0.0006, acc=0.9998, iter_time=8.84s]
Epoch 0: 19%|█▉ | 2383/12384 [5:04:21<21:19:30, 7.68s/it, loss=0.0006, acc=0.9998, iter_time=8.84s]
Epoch 0: 19%|█▉ | 2383/12384 [5:04:29<21:19:30, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 0: 19%|█▉ | 2384/12384 [5:04:29<21:17:18, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 0: 19%|█▉ | 2384/12384 [5:04:36<21:17:18, 7.66s/it, loss=0.0006, acc=0.9991, iter_time=5.70s]
Epoch 0: 19%|█▉ | 2385/12384 [5:04:36<21:16:13, 7.66s/it, loss=0.0006, acc=0.9991, iter_time=5.70s]
Epoch 0: 19%|█▉ | 2385/12384 [5:04:44<21:16:13, 7.66s/it, loss=0.0002, acc=0.9998, iter_time=9.16s]
Epoch 0: 19%|█▉ | 2386/12384 [5:04:44<21:17:23, 7.67s/it, loss=0.0002, acc=0.9998, iter_time=9.16s]
Epoch 0: 19%|█▉ | 2386/12384 [5:04:52<21:17:23, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.72s]
Epoch 0: 19%|█▉ | 2387/12384 [5:04:52<21:15:19, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.72s]
Epoch 0: 19%|█▉ | 2387/12384 [5:04:59<21:15:19, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 19%|█▉ | 2388/12384 [5:04:59<21:17:02, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 19%|█▉ | 2388/12384 [5:05:07<21:17:02, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=4.89s]
Epoch 0: 19%|█▉ | 2389/12384 [5:05:07<21:17:19, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=4.89s]
Epoch 0: 19%|█▉ | 2389/12384 [5:05:15<21:17:19, 7.67s/it, loss=0.0002, acc=0.9992, iter_time=10.45s]
Epoch 0: 19%|█▉ | 2390/12384 [5:05:15<21:15:34, 7.66s/it, loss=0.0002, acc=0.9992, iter_time=10.45s]
Epoch 0: 19%|█▉ | 2390/12384 [5:05:22<21:15:34, 7.66s/it, loss=0.0031, acc=0.9921, iter_time=7.65s]
Epoch 0: 19%|█▉ | 2391/12384 [5:05:22<21:14:20, 7.65s/it, loss=0.0031, acc=0.9921, iter_time=7.65s]
Epoch 0: 19%|█▉ | 2391/12384 [5:05:30<21:14:20, 7.65s/it, loss=0.0002, acc=0.9998, iter_time=8.01s]
Epoch 0: 19%|█▉ | 2392/12384 [5:05:30<21:14:03, 7.65s/it, loss=0.0002, acc=0.9998, iter_time=8.01s]
Epoch 0: 19%|█▉ | 2392/12384 [5:05:38<21:14:03, 7.65s/it, loss=0.0006, acc=0.9998, iter_time=7.26s]
Epoch 0: 19%|█▉ | 2393/12384 [5:05:38<21:12:35, 7.64s/it, loss=0.0006, acc=0.9998, iter_time=7.26s]
Epoch 0: 19%|█▉ | 2393/12384 [5:05:45<21:12:35, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 19%|█▉ | 2394/12384 [5:05:45<21:12:33, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 19%|█▉ | 2394/12384 [5:05:53<21:12:33, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 19%|█▉ | 2395/12384 [5:05:53<21:12:25, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 19%|█▉ | 2395/12384 [5:06:00<21:12:25, 7.64s/it, loss=0.0002, acc=0.9995, iter_time=7.64s]
Epoch 0: 19%|█▉ | 2396/12384 [5:06:00<21:09:57, 7.63s/it, loss=0.0002, acc=0.9995, iter_time=7.64s]
Epoch 0: 19%|█▉ | 2396/12384 [5:06:08<21:09:57, 7.63s/it, loss=0.0004, acc=0.9988, iter_time=7.61s]
Epoch 0: 19%|█▉ | 2397/12384 [5:06:08<21:13:30, 7.65s/it, loss=0.0004, acc=0.9988, iter_time=7.61s]
Epoch 0: 19%|█▉ | 2397/12384 [5:06:16<21:13:30, 7.65s/it, loss=0.0006, acc=0.9976, iter_time=7.70s]
Epoch 0: 19%|█▉ | 2398/12384 [5:06:16<21:11:57, 7.64s/it, loss=0.0006, acc=0.9976, iter_time=7.70s]
Epoch 0: 19%|█▉ | 2398/12384 [5:06:24<21:11:57, 7.64s/it, loss=0.0002, acc=0.9995, iter_time=7.93s]
Epoch 0: 19%|█▉ | 2399/12384 [5:06:24<21:25:51, 7.73s/it, loss=0.0002, acc=0.9995, iter_time=7.93s]
Epoch 0: 19%|█▉ | 2399/12384 [5:06:31<21:25:51, 7.73s/it, loss=0.0007, acc=0.9974, iter_time=8.05s]
Epoch 0: 19%|█▉ | 2400/12384 [5:06:31<21:21:59, 7.70s/it, loss=0.0007, acc=0.9974, iter_time=8.05s]
Epoch 0: 19%|█▉ | 2400/12384 [5:06:39<21:21:59, 7.70s/it, loss=0.0004, acc=0.9981, iter_time=7.24s]
Epoch 0: 19%|█▉ | 2401/12384 [5:06:39<21:31:55, 7.76s/it, loss=0.0004, acc=0.9981, iter_time=7.24s]
Epoch 0: 19%|█▉ | 2401/12384 [5:06:47<21:31:55, 7.76s/it, loss=0.0009, acc=0.9955, iter_time=7.88s]
Epoch 0: 19%|█▉ | 2402/12384 [5:06:47<21:25:44, 7.73s/it, loss=0.0009, acc=0.9955, iter_time=7.88s]
Epoch 0: 19%|█▉ | 2402/12384 [5:06:55<21:25:44, 7.73s/it, loss=0.0007, acc=0.9995, iter_time=7.71s]
Epoch 0: 19%|█▉ | 2403/12384 [5:06:55<21:23:01, 7.71s/it, loss=0.0007, acc=0.9995, iter_time=7.71s]
Epoch 0: 19%|█▉ | 2403/12384 [5:07:02<21:23:01, 7.71s/it, loss=0.0003, acc=0.9994, iter_time=7.64s]
Epoch 0: 19%|█▉ | 2404/12384 [5:07:02<21:19:19, 7.69s/it, loss=0.0003, acc=0.9994, iter_time=7.64s]
Epoch 0: 19%|█▉ | 2404/12384 [5:07:10<21:19:19, 7.69s/it, loss=0.0005, acc=0.9985, iter_time=7.62s]
Epoch 0: 19%|█▉ | 2405/12384 [5:07:10<21:17:47, 7.68s/it, loss=0.0005, acc=0.9985, iter_time=7.62s]
Epoch 0: 19%|█▉ | 2405/12384 [5:07:18<21:17:47, 7.68s/it, loss=0.0001, acc=0.9999, iter_time=7.77s]
Epoch 0: 19%|█▉ | 2406/12384 [5:07:18<21:19:30, 7.69s/it, loss=0.0001, acc=0.9999, iter_time=7.77s]
Epoch 0: 19%|█▉ | 2406/12384 [5:07:25<21:19:30, 7.69s/it, loss=0.0004, acc=0.9978, iter_time=7.61s]
Epoch 0: 19%|█▉ | 2407/12384 [5:07:25<21:16:22, 7.68s/it, loss=0.0004, acc=0.9978, iter_time=7.61s]
Epoch 0: 19%|█▉ | 2407/12384 [5:07:33<21:16:22, 7.68s/it, loss=0.0013, acc=0.9973, iter_time=7.61s]
Epoch 0: 19%|█▉ | 2408/12384 [5:07:33<21:14:15, 7.66s/it, loss=0.0013, acc=0.9973, iter_time=7.61s]
Epoch 0: 19%|█▉ | 2408/12384 [5:07:40<21:14:15, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 19%|█▉ | 2409/12384 [5:07:40<21:11:45, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 19%|█▉ | 2409/12384 [5:07:48<21:11:45, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=4.05s]
Epoch 0: 19%|█▉ | 2410/12384 [5:07:48<21:09:10, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=4.05s]
Epoch 0: 19%|█▉ | 2410/12384 [5:07:56<21:09:10, 7.63s/it, loss=0.0008, acc=0.9971, iter_time=9.10s]
Epoch 0: 19%|█▉ | 2411/12384 [5:07:56<21:09:24, 7.64s/it, loss=0.0008, acc=0.9971, iter_time=9.10s]
Epoch 0: 19%|█▉ | 2411/12384 [5:08:03<21:09:24, 7.64s/it, loss=0.0008, acc=0.9982, iter_time=9.72s]
Epoch 0: 19%|█▉ | 2412/12384 [5:08:03<21:08:46, 7.63s/it, loss=0.0008, acc=0.9982, iter_time=9.72s]
Epoch 0: 19%|█▉ | 2412/12384 [5:08:11<21:08:46, 7.63s/it, loss=0.0010, acc=0.9971, iter_time=7.65s]
Epoch 0: 19%|█▉ | 2413/12384 [5:08:11<21:10:42, 7.65s/it, loss=0.0010, acc=0.9971, iter_time=7.65s]
Epoch 0: 19%|█▉ | 2413/12384 [5:08:19<21:10:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 0: 19%|█▉ | 2414/12384 [5:08:19<21:10:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 0: 19%|█▉ | 2414/12384 [5:08:26<21:10:11, 7.64s/it, loss=0.0004, acc=0.9998, iter_time=8.28s]
Epoch 0: 20%|█▉ | 2415/12384 [5:08:26<21:08:49, 7.64s/it, loss=0.0004, acc=0.9998, iter_time=8.28s]
Epoch 0: 20%|█▉ | 2415/12384 [5:08:34<21:08:49, 7.64s/it, loss=0.0007, acc=0.9951, iter_time=8.02s]
Epoch 0: 20%|█▉ | 2416/12384 [5:08:34<21:10:04, 7.64s/it, loss=0.0007, acc=0.9951, iter_time=8.02s]
Epoch 0: 20%|█▉ | 2416/12384 [5:08:42<21:10:04, 7.64s/it, loss=0.0003, acc=0.9987, iter_time=7.27s]
Epoch 0: 20%|█▉ | 2417/12384 [5:08:42<21:09:44, 7.64s/it, loss=0.0003, acc=0.9987, iter_time=7.27s]
Epoch 0: 20%|█▉ | 2417/12384 [5:08:49<21:09:44, 7.64s/it, loss=0.0006, acc=0.9966, iter_time=7.65s]
Epoch 0: 20%|█▉ | 2418/12384 [5:08:49<21:08:45, 7.64s/it, loss=0.0006, acc=0.9966, iter_time=7.65s]
Epoch 0: 20%|█▉ | 2418/12384 [5:08:57<21:08:45, 7.64s/it, loss=0.0004, acc=0.9995, iter_time=7.63s]
Epoch 0: 20%|█▉ | 2419/12384 [5:08:57<21:08:47, 7.64s/it, loss=0.0004, acc=0.9995, iter_time=7.63s]
Epoch 0: 20%|█▉ | 2419/12384 [5:09:04<21:08:47, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 20%|█▉ | 2420/12384 [5:09:04<21:08:52, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 20%|█▉ | 2420/12384 [5:09:12<21:08:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 0: 20%|█▉ | 2421/12384 [5:09:12<21:07:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 0: 20%|█▉ | 2421/12384 [5:09:20<21:07:05, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=8.24s]
Epoch 0: 20%|█▉ | 2422/12384 [5:09:20<21:06:08, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=8.24s]
Epoch 0: 20%|█▉ | 2422/12384 [5:09:27<21:06:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.61s]
Epoch 0: 20%|█▉ | 2423/12384 [5:09:27<21:06:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.61s]
Epoch 0: 20%|█▉ | 2423/12384 [5:09:35<21:06:18, 7.63s/it, loss=0.0008, acc=0.9979, iter_time=10.62s]
Epoch 0: 20%|█▉ | 2424/12384 [5:09:35<21:06:42, 7.63s/it, loss=0.0008, acc=0.9979, iter_time=10.62s]
Epoch 0: 20%|█▉ | 2424/12384 [5:09:43<21:06:42, 7.63s/it, loss=0.0018, acc=0.9978, iter_time=7.94s]
Epoch 0: 20%|█▉ | 2425/12384 [5:09:43<21:18:53, 7.70s/it, loss=0.0018, acc=0.9978, iter_time=7.94s]
Epoch 0: 20%|█▉ | 2425/12384 [5:09:51<21:18:53, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 20%|█▉ | 2426/12384 [5:09:51<21:16:04, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 20%|█▉ | 2426/12384 [5:09:58<21:16:04, 7.69s/it, loss=0.0006, acc=0.9998, iter_time=7.67s]
Epoch 0: 20%|█▉ | 2427/12384 [5:09:58<21:27:08, 7.76s/it, loss=0.0006, acc=0.9998, iter_time=7.67s]
Epoch 0: 20%|█▉ | 2427/12384 [5:10:06<21:27:08, 7.76s/it, loss=0.0023, acc=0.9939, iter_time=4.86s]
Epoch 0: 20%|█▉ | 2428/12384 [5:10:06<21:20:31, 7.72s/it, loss=0.0023, acc=0.9939, iter_time=4.86s]
Epoch 0: 20%|█▉ | 2428/12384 [5:10:14<21:20:31, 7.72s/it, loss=0.0001, acc=0.9999, iter_time=10.63s]
Epoch 0: 20%|█▉ | 2429/12384 [5:10:14<21:15:59, 7.69s/it, loss=0.0001, acc=0.9999, iter_time=10.63s]
Epoch 0: 20%|█▉ | 2429/12384 [5:10:21<21:15:59, 7.69s/it, loss=0.0003, acc=0.9980, iter_time=7.64s]
Epoch 0: 20%|█▉ | 2430/12384 [5:10:21<21:11:56, 7.67s/it, loss=0.0003, acc=0.9980, iter_time=7.64s]
Epoch 0: 20%|█▉ | 2430/12384 [5:10:29<21:11:56, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 20%|█▉ | 2431/12384 [5:10:29<21:12:05, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 20%|█▉ | 2431/12384 [5:10:37<21:12:05, 7.67s/it, loss=0.0079, acc=0.9976, iter_time=7.66s]
Epoch 0: 20%|█▉ | 2432/12384 [5:10:37<21:12:10, 7.67s/it, loss=0.0079, acc=0.9976, iter_time=7.66s]
Epoch 0: 20%|█▉ | 2432/12384 [5:10:44<21:12:10, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 20%|█▉ | 2433/12384 [5:10:44<21:09:26, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 20%|█▉ | 2433/12384 [5:10:52<21:09:26, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.65s]
Epoch 0: 20%|█▉ | 2434/12384 [5:10:52<21:07:02, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.65s]
Epoch 0: 20%|█▉ | 2434/12384 [5:11:00<21:07:02, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.61s]
Epoch 0: 20%|█▉ | 2435/12384 [5:11:00<21:07:01, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.61s]
Epoch 0: 20%|█▉ | 2435/12384 [5:11:07<21:07:01, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=7.63s]
Epoch 0: 20%|█▉ | 2436/12384 [5:11:07<21:06:38, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=7.63s]
Epoch 0: 20%|█▉ | 2436/12384 [5:11:15<21:06:38, 7.64s/it, loss=0.0007, acc=0.9977, iter_time=7.67s]
Epoch 0: 20%|█▉ | 2437/12384 [5:11:15<21:07:45, 7.65s/it, loss=0.0007, acc=0.9977, iter_time=7.67s]
Epoch 0: 20%|█▉ | 2437/12384 [5:11:22<21:07:45, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 20%|█▉ | 2438/12384 [5:11:22<21:06:35, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 20%|█▉ | 2438/12384 [5:11:30<21:06:35, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 20%|█▉ | 2439/12384 [5:11:30<21:10:38, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 20%|█▉ | 2439/12384 [5:11:38<21:10:38, 7.67s/it, loss=0.0003, acc=1.0000, iter_time=7.68s]
Epoch 0: 20%|█▉ | 2440/12384 [5:11:38<21:08:08, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=7.68s]
Epoch 0: 20%|█▉ | 2440/12384 [5:11:45<21:08:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 20%|█▉ | 2441/12384 [5:11:45<21:06:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 20%|█▉ | 2441/12384 [5:11:53<21:06:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 0: 20%|█▉ | 2442/12384 [5:11:53<21:03:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 0: 20%|█▉ | 2442/12384 [5:12:01<21:03:53, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.43s]
Epoch 0: 20%|█▉ | 2443/12384 [5:12:01<21:05:43, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.43s]
Epoch 0: 20%|█▉ | 2443/12384 [5:12:08<21:05:43, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=9.44s]
Epoch 0: 20%|█▉ | 2444/12384 [5:12:08<21:04:25, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=9.44s]
Epoch 0: 20%|█▉ | 2444/12384 [5:12:16<21:04:25, 7.63s/it, loss=0.0002, acc=0.9998, iter_time=7.63s]
Epoch 0: 20%|█▉ | 2445/12384 [5:12:16<21:04:14, 7.63s/it, loss=0.0002, acc=0.9998, iter_time=7.63s]
Epoch 0: 20%|█▉ | 2445/12384 [5:12:24<21:04:14, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 20%|█▉ | 2446/12384 [5:12:24<21:05:38, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 20%|█▉ | 2446/12384 [5:12:31<21:05:38, 7.64s/it, loss=0.0006, acc=0.9975, iter_time=6.82s]
Epoch 0: 20%|█▉ | 2447/12384 [5:12:31<21:06:19, 7.65s/it, loss=0.0006, acc=0.9975, iter_time=6.82s]
Epoch 0: 20%|█▉ | 2447/12384 [5:12:39<21:06:19, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=8.86s]
Epoch 0: 20%|█▉ | 2448/12384 [5:12:39<21:05:14, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=8.86s]
Epoch 0: 20%|█▉ | 2448/12384 [5:12:46<21:05:14, 7.64s/it, loss=0.0003, acc=0.9990, iter_time=7.25s]
Epoch 0: 20%|█▉ | 2449/12384 [5:12:46<21:03:58, 7.63s/it, loss=0.0003, acc=0.9990, iter_time=7.25s]
Epoch 0: 20%|█▉ | 2449/12384 [5:12:54<21:03:58, 7.63s/it, loss=0.0042, acc=0.9888, iter_time=8.03s]
Epoch 0: 20%|█▉ | 2450/12384 [5:12:54<21:04:11, 7.64s/it, loss=0.0042, acc=0.9888, iter_time=8.03s]
Epoch 0: 20%|█▉ | 2450/12384 [5:13:02<21:04:11, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.51s]
Epoch 0: 20%|█▉ | 2451/12384 [5:13:02<21:17:09, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.51s]
Epoch 0: 20%|█▉ | 2451/12384 [5:13:10<21:17:09, 7.71s/it, loss=0.0007, acc=0.9985, iter_time=5.50s]
Epoch 0: 20%|█▉ | 2452/12384 [5:13:10<21:13:46, 7.69s/it, loss=0.0007, acc=0.9985, iter_time=5.50s]
Epoch 0: 20%|█▉ | 2452/12384 [5:13:18<21:13:46, 7.69s/it, loss=0.0003, acc=1.0000, iter_time=9.18s]
Epoch 0: 20%|█▉ | 2453/12384 [5:13:18<21:29:35, 7.79s/it, loss=0.0003, acc=1.0000, iter_time=9.18s]
Epoch 0: 20%|█▉ | 2453/12384 [5:13:25<21:29:35, 7.79s/it, loss=0.0001, acc=1.0000, iter_time=8.60s]
Epoch 0: 20%|█▉ | 2454/12384 [5:13:25<21:21:05, 7.74s/it, loss=0.0001, acc=1.0000, iter_time=8.60s]
Epoch 0: 20%|█▉ | 2454/12384 [5:13:33<21:21:05, 7.74s/it, loss=0.0007, acc=0.9981, iter_time=5.55s]
Epoch 0: 20%|█▉ | 2455/12384 [5:13:33<21:16:27, 7.71s/it, loss=0.0007, acc=0.9981, iter_time=5.55s]
Epoch 0: 20%|█▉ | 2455/12384 [5:13:41<21:16:27, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 0: 20%|█▉ | 2456/12384 [5:13:41<21:13:46, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 0: 20%|█▉ | 2456/12384 [5:13:48<21:13:46, 7.70s/it, loss=0.0002, acc=1.0000, iter_time=7.68s]
Epoch 0: 20%|█▉ | 2457/12384 [5:13:48<21:11:05, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=7.68s]
Epoch 0: 20%|█▉ | 2457/12384 [5:13:56<21:11:05, 7.68s/it, loss=0.0009, acc=0.9953, iter_time=5.84s]
Epoch 0: 20%|█▉ | 2458/12384 [5:13:56<21:09:59, 7.68s/it, loss=0.0009, acc=0.9953, iter_time=5.84s]
Epoch 0: 20%|█▉ | 2458/12384 [5:14:04<21:09:59, 7.68s/it, loss=0.0002, acc=0.9987, iter_time=9.48s]
Epoch 0: 20%|█▉ | 2459/12384 [5:14:04<21:08:29, 7.67s/it, loss=0.0002, acc=0.9987, iter_time=9.48s]
Epoch 0: 20%|█▉ | 2459/12384 [5:14:11<21:08:29, 7.67s/it, loss=0.0002, acc=0.9998, iter_time=7.68s]
Epoch 0: 20%|█▉ | 2460/12384 [5:14:11<21:08:24, 7.67s/it, loss=0.0002, acc=0.9998, iter_time=7.68s]
Epoch 0: 20%|█▉ | 2460/12384 [5:14:19<21:08:24, 7.67s/it, loss=0.0001, acc=0.9996, iter_time=7.64s]
Epoch 0: 20%|█▉ | 2461/12384 [5:14:19<21:06:19, 7.66s/it, loss=0.0001, acc=0.9996, iter_time=7.64s]
Epoch 0: 20%|█▉ | 2461/12384 [5:14:27<21:06:19, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 20%|█▉ | 2462/12384 [5:14:27<21:09:18, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 20%|█▉ | 2462/12384 [5:14:34<21:09:18, 7.68s/it, loss=0.0013, acc=0.9985, iter_time=7.41s]
Epoch 0: 20%|█▉ | 2463/12384 [5:14:34<21:07:06, 7.66s/it, loss=0.0013, acc=0.9985, iter_time=7.41s]
Epoch 0: 20%|█▉ | 2463/12384 [5:14:42<21:07:06, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.94s]
Epoch 0: 20%|█▉ | 2464/12384 [5:14:42<21:07:27, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.94s]
Epoch 0: 20%|█▉ | 2464/12384 [5:14:50<21:07:27, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=5.86s]
Epoch 0: 20%|█▉ | 2465/12384 [5:14:50<21:05:24, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=5.86s]
Epoch 0: 20%|█▉ | 2465/12384 [5:14:57<21:05:24, 7.65s/it, loss=0.0003, acc=0.9985, iter_time=9.44s]
Epoch 0: 20%|█▉ | 2466/12384 [5:14:57<21:05:20, 7.65s/it, loss=0.0003, acc=0.9985, iter_time=9.44s]
Epoch 0: 20%|█▉ | 2466/12384 [5:15:05<21:05:20, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=4.60s]
Epoch 0: 20%|█▉ | 2467/12384 [5:15:05<21:05:36, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=4.60s]
Epoch 0: 20%|█▉ | 2467/12384 [5:15:12<21:05:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.95s]
Epoch 0: 20%|█▉ | 2468/12384 [5:15:12<21:05:46, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.95s]
Epoch 0: 20%|█▉ | 2468/12384 [5:15:20<21:05:46, 7.66s/it, loss=0.0003, acc=1.0000, iter_time=9.42s]
Epoch 0: 20%|█▉ | 2469/12384 [5:15:20<21:03:07, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=9.42s]
Epoch 0: 20%|█▉ | 2469/12384 [5:15:28<21:03:07, 7.64s/it, loss=0.0004, acc=0.9992, iter_time=7.70s]
Epoch 0: 20%|█▉ | 2470/12384 [5:15:28<21:05:39, 7.66s/it, loss=0.0004, acc=0.9992, iter_time=7.70s]
Epoch 0: 20%|█▉ | 2470/12384 [5:15:35<21:05:39, 7.66s/it, loss=0.0005, acc=0.9977, iter_time=7.61s]
Epoch 0: 20%|█▉ | 2471/12384 [5:15:35<21:04:22, 7.65s/it, loss=0.0005, acc=0.9977, iter_time=7.61s]
Epoch 0: 20%|█▉ | 2471/12384 [5:15:43<21:04:22, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.01s]
Epoch 0: 20%|█▉ | 2472/12384 [5:15:43<21:03:46, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.01s]
Epoch 0: 20%|█▉ | 2472/12384 [5:15:51<21:03:46, 7.65s/it, loss=0.0004, acc=1.0000, iter_time=7.27s]
Epoch 0: 20%|█▉ | 2473/12384 [5:15:51<21:02:11, 7.64s/it, loss=0.0004, acc=1.0000, iter_time=7.27s]
Epoch 0: 20%|█▉ | 2473/12384 [5:15:58<21:02:11, 7.64s/it, loss=0.0009, acc=0.9980, iter_time=7.62s]
Epoch 0: 20%|█▉ | 2474/12384 [5:15:58<21:01:32, 7.64s/it, loss=0.0009, acc=0.9980, iter_time=7.62s]
Epoch 0: 20%|█▉ | 2474/12384 [5:16:06<21:01:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 0: 20%|█▉ | 2475/12384 [5:16:06<21:02:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 0: 20%|█▉ | 2475/12384 [5:16:14<21:02:21, 7.64s/it, loss=0.0001, acc=0.9995, iter_time=9.18s]
Epoch 0: 20%|█▉ | 2476/12384 [5:16:14<21:04:05, 7.65s/it, loss=0.0001, acc=0.9995, iter_time=9.18s]
Epoch 0: 20%|█▉ | 2476/12384 [5:16:21<21:04:05, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.69s]
Epoch 0: 20%|██ | 2477/12384 [5:16:21<21:07:01, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=7.69s]
Epoch 0: 20%|██ | 2477/12384 [5:16:29<21:07:01, 7.67s/it, loss=0.0003, acc=1.0000, iter_time=4.68s]
Epoch 0: 20%|██ | 2478/12384 [5:16:29<21:05:01, 7.66s/it, loss=0.0003, acc=1.0000, iter_time=4.68s]
Epoch 0: 20%|██ | 2478/12384 [5:16:37<21:05:01, 7.66s/it, loss=0.0011, acc=0.9960, iter_time=10.66s]
Epoch 0: 20%|██ | 2479/12384 [5:16:37<21:03:07, 7.65s/it, loss=0.0011, acc=0.9960, iter_time=10.66s]
Epoch 0: 20%|██ | 2479/12384 [5:16:45<21:03:07, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=8.11s]
Epoch 0: 20%|██ | 2480/12384 [5:16:45<21:22:33, 7.77s/it, loss=0.0003, acc=1.0000, iter_time=8.11s]
Epoch 0: 20%|██ | 2480/12384 [5:16:52<21:22:33, 7.77s/it, loss=0.0006, acc=0.9970, iter_time=7.60s]
Epoch 0: 20%|██ | 2481/12384 [5:16:52<21:19:33, 7.75s/it, loss=0.0006, acc=0.9970, iter_time=7.60s]
Epoch 0: 20%|██ | 2481/12384 [5:17:00<21:19:33, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 20%|██ | 2482/12384 [5:17:00<21:14:43, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 20%|██ | 2482/12384 [5:17:08<21:14:43, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=4.30s]
Epoch 0: 20%|██ | 2483/12384 [5:17:08<21:11:58, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=4.30s]
Epoch 0: 20%|██ | 2483/12384 [5:17:15<21:11:58, 7.71s/it, loss=0.0051, acc=0.9972, iter_time=10.43s]
Epoch 0: 20%|██ | 2484/12384 [5:17:15<21:12:11, 7.71s/it, loss=0.0051, acc=0.9972, iter_time=10.43s]
Epoch 0: 20%|██ | 2484/12384 [5:17:23<21:12:11, 7.71s/it, loss=0.0002, acc=1.0000, iter_time=5.54s]
Epoch 0: 20%|██ | 2485/12384 [5:17:23<21:07:36, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=5.54s]
Epoch 0: 20%|██ | 2485/12384 [5:17:31<21:07:36, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=10.40s]
Epoch 0: 20%|██ | 2486/12384 [5:17:31<21:04:14, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=10.40s]
Epoch 0: 20%|██ | 2486/12384 [5:17:38<21:04:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 20%|██ | 2487/12384 [5:17:38<21:02:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 20%|██ | 2487/12384 [5:17:46<21:02:04, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 20%|██ | 2488/12384 [5:17:46<21:00:35, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 20%|██ | 2488/12384 [5:17:54<21:00:35, 7.64s/it, loss=0.0003, acc=0.9991, iter_time=7.66s]
Epoch 0: 20%|██ | 2489/12384 [5:17:54<21:02:02, 7.65s/it, loss=0.0003, acc=0.9991, iter_time=7.66s]
Epoch 0: 20%|██ | 2489/12384 [5:18:01<21:02:02, 7.65s/it, loss=0.0012, acc=0.9982, iter_time=6.48s]
Epoch 0: 20%|██ | 2490/12384 [5:18:01<21:00:49, 7.65s/it, loss=0.0012, acc=0.9982, iter_time=6.48s]
Epoch 0: 20%|██ | 2490/12384 [5:18:09<21:00:49, 7.65s/it, loss=0.0002, acc=0.9992, iter_time=8.83s]
Epoch 0: 20%|██ | 2491/12384 [5:18:09<21:04:05, 7.67s/it, loss=0.0002, acc=0.9992, iter_time=8.83s]
Epoch 0: 20%|██ | 2491/12384 [5:18:17<21:04:05, 7.67s/it, loss=0.0001, acc=0.9998, iter_time=7.71s]
Epoch 0: 20%|██ | 2492/12384 [5:18:17<21:01:27, 7.65s/it, loss=0.0001, acc=0.9998, iter_time=7.71s]
Epoch 0: 20%|██ | 2492/12384 [5:18:24<21:01:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 20%|██ | 2493/12384 [5:18:24<20:59:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 20%|██ | 2493/12384 [5:18:32<20:59:40, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=5.81s]
Epoch 0: 20%|██ | 2494/12384 [5:18:32<20:59:40, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=5.81s]
Epoch 0: 20%|██ | 2494/12384 [5:18:39<20:59:40, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=9.45s]
Epoch 0: 20%|██ | 2495/12384 [5:18:39<20:59:16, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=9.45s]
Epoch 0: 20%|██ | 2495/12384 [5:18:47<20:59:16, 7.64s/it, loss=0.0004, acc=0.9982, iter_time=8.03s]
Epoch 0: 20%|██ | 2496/12384 [5:18:47<20:58:48, 7.64s/it, loss=0.0004, acc=0.9982, iter_time=8.03s]
Epoch 0: 20%|██ | 2496/12384 [5:18:55<20:58:48, 7.64s/it, loss=0.0005, acc=0.9987, iter_time=7.23s]
Epoch 0: 20%|██ | 2497/12384 [5:18:55<20:58:25, 7.64s/it, loss=0.0005, acc=0.9987, iter_time=7.23s]
Epoch 0: 20%|██ | 2497/12384 [5:19:02<20:58:25, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=4.32s]
Epoch 0: 20%|██ | 2498/12384 [5:19:02<20:58:05, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=4.32s]
Epoch 0: 20%|██ | 2498/12384 [5:19:10<20:58:05, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=9.15s]
Epoch 0: 20%|██ | 2499/12384 [5:19:10<20:56:45, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=9.15s]
Epoch 0: 20%|██ | 2499/12384 [5:19:18<20:56:45, 7.63s/it, loss=0.0012, acc=0.9991, iter_time=9.83s]
Epoch 0: 20%|██ | 2500/12384 [5:19:18<21:06:46, 7.69s/it, loss=0.0012, acc=0.9991, iter_time=9.83s]
Epoch 0: 20%|██ | 2500/12384 [5:19:25<21:06:46, 7.69s/it, loss=0.0013, acc=0.9951, iter_time=5.15s]
Epoch 0: 20%|██ | 2501/12384 [5:19:25<21:04:06, 7.67s/it, loss=0.0013, acc=0.9951, iter_time=5.15s]
Epoch 0: 20%|██ | 2501/12384 [5:19:33<21:04:06, 7.67s/it, loss=0.0009, acc=1.0000, iter_time=9.89s]
Epoch 0: 20%|██ | 2502/12384 [5:19:33<21:01:38, 7.66s/it, loss=0.0009, acc=1.0000, iter_time=9.89s]
Epoch 0: 20%|██ | 2502/12384 [5:19:41<21:01:38, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.66s]
Epoch 0: 20%|██ | 2503/12384 [5:19:41<21:02:29, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=7.66s]
Epoch 0: 20%|██ | 2503/12384 [5:19:48<21:02:29, 7.67s/it, loss=0.0005, acc=0.9997, iter_time=8.02s]
Epoch 0: 20%|██ | 2504/12384 [5:19:48<21:01:25, 7.66s/it, loss=0.0005, acc=0.9997, iter_time=8.02s]
Epoch 0: 20%|██ | 2504/12384 [5:19:56<21:01:25, 7.66s/it, loss=0.0008, acc=0.9976, iter_time=7.25s]
Epoch 0: 20%|██ | 2505/12384 [5:19:56<20:58:29, 7.64s/it, loss=0.0008, acc=0.9976, iter_time=7.25s]
Epoch 0: 20%|██ | 2505/12384 [5:20:04<20:58:29, 7.64s/it, loss=0.0004, acc=0.9990, iter_time=7.04s]
Epoch 0: 20%|██ | 2506/12384 [5:20:04<21:14:29, 7.74s/it, loss=0.0004, acc=0.9990, iter_time=7.04s]
Epoch 0: 20%|██ | 2506/12384 [5:20:12<21:14:29, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 0: 20%|██ | 2507/12384 [5:20:12<21:08:20, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 0: 20%|██ | 2507/12384 [5:20:19<21:08:20, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=6.99s]
Epoch 0: 20%|██ | 2508/12384 [5:20:19<21:09:16, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=6.99s]
Epoch 0: 20%|██ | 2508/12384 [5:20:27<21:09:16, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=8.38s]
Epoch 0: 20%|██ | 2509/12384 [5:20:27<21:05:24, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=8.38s]
Epoch 0: 20%|██ | 2509/12384 [5:20:35<21:05:24, 7.69s/it, loss=0.0048, acc=0.9965, iter_time=7.61s]
Epoch 0: 20%|██ | 2510/12384 [5:20:35<21:01:22, 7.66s/it, loss=0.0048, acc=0.9965, iter_time=7.61s]
Epoch 0: 20%|██ | 2510/12384 [5:20:42<21:01:22, 7.66s/it, loss=0.0004, acc=0.9995, iter_time=4.75s]
Epoch 0: 20%|██ | 2511/12384 [5:20:42<21:00:02, 7.66s/it, loss=0.0004, acc=0.9995, iter_time=4.75s]
Epoch 0: 20%|██ | 2511/12384 [5:20:50<21:00:02, 7.66s/it, loss=0.0002, acc=0.9997, iter_time=10.56s]
Epoch 0: 20%|██ | 2512/12384 [5:20:50<21:03:11, 7.68s/it, loss=0.0002, acc=0.9997, iter_time=10.56s]
Epoch 0: 20%|██ | 2512/12384 [5:20:58<21:03:11, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.68s]
Epoch 0: 20%|██ | 2513/12384 [5:20:58<20:59:57, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.68s]
Epoch 0: 20%|██ | 2513/12384 [5:21:05<20:59:57, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=4.55s]
Epoch 0: 20%|██ | 2514/12384 [5:21:05<20:54:06, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.55s]
Epoch 0: 20%|██ | 2514/12384 [5:21:13<20:54:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.62s]
Epoch 0: 20%|██ | 2515/12384 [5:21:13<20:54:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.62s]
Epoch 0: 20%|██ | 2515/12384 [5:21:20<20:54:14, 7.63s/it, loss=0.0003, acc=0.9997, iter_time=6.72s]
Epoch 0: 20%|██ | 2516/12384 [5:21:20<20:53:12, 7.62s/it, loss=0.0003, acc=0.9997, iter_time=6.72s]
Epoch 0: 20%|██ | 2516/12384 [5:21:28<20:53:12, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.50s]
Epoch 0: 20%|██ | 2517/12384 [5:21:28<20:52:26, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.50s]
Epoch 0: 20%|██ | 2517/12384 [5:21:36<20:52:26, 7.62s/it, loss=0.0010, acc=0.9984, iter_time=7.62s]
Epoch 0: 20%|██ | 2518/12384 [5:21:36<20:52:20, 7.62s/it, loss=0.0010, acc=0.9984, iter_time=7.62s]
Epoch 0: 20%|██ | 2518/12384 [5:21:43<20:52:20, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 20%|██ | 2519/12384 [5:21:43<20:52:57, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 20%|██ | 2519/12384 [5:21:51<20:52:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 0: 20%|██ | 2520/12384 [5:21:51<20:55:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 0: 20%|██ | 2520/12384 [5:21:58<20:55:25, 7.64s/it, loss=0.0003, acc=0.9986, iter_time=7.27s]
Epoch 0: 20%|██ | 2521/12384 [5:21:58<20:55:17, 7.64s/it, loss=0.0003, acc=0.9986, iter_time=7.27s]
Epoch 0: 20%|██ | 2521/12384 [5:22:06<20:55:17, 7.64s/it, loss=0.0004, acc=1.0000, iter_time=7.62s]
Epoch 0: 20%|██ | 2522/12384 [5:22:06<20:54:50, 7.63s/it, loss=0.0004, acc=1.0000, iter_time=7.62s]
Epoch 0: 20%|██ | 2522/12384 [5:22:14<20:54:50, 7.63s/it, loss=0.0043, acc=0.9953, iter_time=7.64s]
Epoch 0: 20%|██ | 2523/12384 [5:22:14<20:54:26, 7.63s/it, loss=0.0043, acc=0.9953, iter_time=7.64s]
Epoch 0: 20%|██ | 2523/12384 [5:22:21<20:54:26, 7.63s/it, loss=0.0003, acc=0.9990, iter_time=7.62s]
Epoch 0: 20%|██ | 2524/12384 [5:22:21<20:54:32, 7.63s/it, loss=0.0003, acc=0.9990, iter_time=7.62s]
Epoch 0: 20%|██ | 2524/12384 [5:22:29<20:54:32, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 20%|██ | 2525/12384 [5:22:29<20:54:18, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 20%|██ | 2525/12384 [5:22:37<20:54:18, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=4.25s]
Epoch 0: 20%|██ | 2526/12384 [5:22:37<20:55:08, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=4.25s]
Epoch 0: 20%|██ | 2526/12384 [5:22:44<20:55:08, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=11.04s]
Epoch 0: 20%|██ | 2527/12384 [5:22:44<20:54:59, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=11.04s]
Epoch 0: 20%|██ | 2527/12384 [5:22:52<20:54:59, 7.64s/it, loss=0.0002, acc=0.9998, iter_time=8.03s]
Epoch 0: 20%|██ | 2528/12384 [5:22:52<20:55:31, 7.64s/it, loss=0.0002, acc=0.9998, iter_time=8.03s]
Epoch 0: 20%|██ | 2528/12384 [5:23:00<20:55:31, 7.64s/it, loss=0.0057, acc=0.9915, iter_time=3.24s]
Epoch 0: 20%|██ | 2529/12384 [5:23:00<20:57:11, 7.65s/it, loss=0.0057, acc=0.9915, iter_time=3.24s]
Epoch 0: 20%|██ | 2529/12384 [5:23:07<20:57:11, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=8.43s]
Epoch 0: 20%|██ | 2530/12384 [5:23:07<20:55:18, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=8.43s]
Epoch 0: 20%|██ | 2530/12384 [5:23:15<20:55:18, 7.64s/it, loss=0.0011, acc=0.9967, iter_time=10.90s]
Epoch 0: 20%|██ | 2531/12384 [5:23:15<20:57:22, 7.66s/it, loss=0.0011, acc=0.9967, iter_time=10.90s]
Epoch 0: 20%|██ | 2531/12384 [5:23:23<20:57:22, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.68s]
Epoch 0: 20%|██ | 2532/12384 [5:23:23<20:56:03, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.68s]
Epoch 0: 20%|██ | 2532/12384 [5:23:31<20:56:03, 7.65s/it, loss=0.0019, acc=0.9966, iter_time=4.54s]
Epoch 0: 20%|██ | 2533/12384 [5:23:31<21:13:13, 7.75s/it, loss=0.0019, acc=0.9966, iter_time=4.54s]
Epoch 0: 20%|██ | 2533/12384 [5:23:38<21:13:13, 7.75s/it, loss=0.0002, acc=1.0000, iter_time=11.09s]
Epoch 0: 20%|██ | 2534/12384 [5:23:38<21:05:53, 7.71s/it, loss=0.0002, acc=1.0000, iter_time=11.09s]
Epoch 0: 20%|██ | 2534/12384 [5:23:46<21:05:53, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=5.30s]
Epoch 0: 20%|██ | 2535/12384 [5:23:46<21:02:10, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=5.30s]
Epoch 0: 20%|██ | 2535/12384 [5:23:54<21:02:10, 7.69s/it, loss=0.0024, acc=0.9950, iter_time=10.35s]
Epoch 0: 20%|██ | 2536/12384 [5:23:54<21:00:53, 7.68s/it, loss=0.0024, acc=0.9950, iter_time=10.35s]
Epoch 0: 20%|██ | 2536/12384 [5:24:01<21:00:53, 7.68s/it, loss=0.0005, acc=0.9998, iter_time=6.69s]
Epoch 0: 20%|██ | 2537/12384 [5:24:01<20:58:51, 7.67s/it, loss=0.0005, acc=0.9998, iter_time=6.69s]
Epoch 0: 20%|██ | 2537/12384 [5:24:09<20:58:51, 7.67s/it, loss=0.0003, acc=0.9999, iter_time=8.21s]
Epoch 0: 20%|██ | 2538/12384 [5:24:09<20:55:14, 7.65s/it, loss=0.0003, acc=0.9999, iter_time=8.21s]
Epoch 0: 20%|██ | 2538/12384 [5:24:16<20:55:14, 7.65s/it, loss=0.0007, acc=0.9980, iter_time=5.36s]
Epoch 0: 21%|██ | 2539/12384 [5:24:16<20:53:43, 7.64s/it, loss=0.0007, acc=0.9980, iter_time=5.36s]
Epoch 0: 21%|██ | 2539/12384 [5:24:24<20:53:43, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=9.59s]
Epoch 0: 21%|██ | 2540/12384 [5:24:24<20:54:15, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=9.59s]
Epoch 0: 21%|██ | 2540/12384 [5:24:32<20:54:15, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.95s]
Epoch 0: 21%|██ | 2541/12384 [5:24:32<20:52:28, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.95s]
Epoch 0: 21%|██ | 2541/12384 [5:24:39<20:52:28, 7.63s/it, loss=0.0005, acc=0.9985, iter_time=7.67s]
Epoch 0: 21%|██ | 2542/12384 [5:24:39<20:56:55, 7.66s/it, loss=0.0005, acc=0.9985, iter_time=7.67s]
Epoch 0: 21%|██ | 2542/12384 [5:24:47<20:56:55, 7.66s/it, loss=0.0006, acc=0.9998, iter_time=7.70s]
Epoch 0: 21%|██ | 2543/12384 [5:24:47<20:56:32, 7.66s/it, loss=0.0006, acc=0.9998, iter_time=7.70s]
Epoch 0: 21%|██ | 2543/12384 [5:24:55<20:56:32, 7.66s/it, loss=0.0021, acc=0.9942, iter_time=7.57s]
Epoch 0: 21%|██ | 2544/12384 [5:24:55<20:54:25, 7.65s/it, loss=0.0021, acc=0.9942, iter_time=7.57s]
Epoch 0: 21%|██ | 2544/12384 [5:25:02<20:54:25, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 21%|██ | 2545/12384 [5:25:02<20:54:17, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 21%|██ | 2545/12384 [5:25:10<20:54:17, 7.65s/it, loss=0.0066, acc=0.9922, iter_time=6.14s]
Epoch 0: 21%|██ | 2546/12384 [5:25:10<20:52:14, 7.64s/it, loss=0.0066, acc=0.9922, iter_time=6.14s]
Epoch 0: 21%|██ | 2546/12384 [5:25:18<20:52:14, 7.64s/it, loss=0.0003, acc=0.9986, iter_time=9.14s]
Epoch 0: 21%|██ | 2547/12384 [5:25:18<20:51:21, 7.63s/it, loss=0.0003, acc=0.9986, iter_time=9.14s]
Epoch 0: 21%|██ | 2547/12384 [5:25:25<20:51:21, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.58s]
Epoch 0: 21%|██ | 2548/12384 [5:25:25<20:51:04, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.58s]
Epoch 0: 21%|██ | 2548/12384 [5:25:33<20:51:04, 7.63s/it, loss=0.0015, acc=0.9976, iter_time=7.66s]
Epoch 0: 21%|██ | 2549/12384 [5:25:33<20:52:19, 7.64s/it, loss=0.0015, acc=0.9976, iter_time=7.66s]
Epoch 0: 21%|██ | 2549/12384 [5:25:40<20:52:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 0: 21%|██ | 2550/12384 [5:25:40<20:51:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 0: 21%|██ | 2550/12384 [5:25:48<20:51:45, 7.64s/it, loss=0.0002, acc=0.9997, iter_time=7.22s]
Epoch 0: 21%|██ | 2551/12384 [5:25:48<20:52:42, 7.64s/it, loss=0.0002, acc=0.9997, iter_time=7.22s]
Epoch 0: 21%|██ | 2551/12384 [5:25:56<20:52:42, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.03s]
Epoch 0: 21%|██ | 2552/12384 [5:25:56<20:50:03, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.03s]
Epoch 0: 21%|██ | 2552/12384 [5:26:03<20:50:03, 7.63s/it, loss=0.0004, acc=0.9994, iter_time=6.04s]
Epoch 0: 21%|██ | 2553/12384 [5:26:03<20:54:59, 7.66s/it, loss=0.0004, acc=0.9994, iter_time=6.04s]
Epoch 0: 21%|██ | 2553/12384 [5:26:11<20:54:59, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.97s]
Epoch 0: 21%|██ | 2554/12384 [5:26:11<20:52:48, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.97s]
Epoch 0: 21%|██ | 2554/12384 [5:26:19<20:52:48, 7.65s/it, loss=0.0009, acc=0.9967, iter_time=8.57s]
Epoch 0: 21%|██ | 2555/12384 [5:26:19<20:55:17, 7.66s/it, loss=0.0009, acc=0.9967, iter_time=8.57s]
Epoch 0: 21%|██ | 2555/12384 [5:26:26<20:55:17, 7.66s/it, loss=0.0003, acc=1.0000, iter_time=7.40s]
Epoch 0: 21%|██ | 2556/12384 [5:26:26<20:52:11, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=7.40s]
Epoch 0: 21%|██ | 2556/12384 [5:26:34<20:52:11, 7.64s/it, loss=0.0003, acc=0.9986, iter_time=7.88s]
Epoch 0: 21%|██ | 2557/12384 [5:26:34<20:49:48, 7.63s/it, loss=0.0003, acc=0.9986, iter_time=7.88s]
Epoch 0: 21%|██ | 2557/12384 [5:26:42<20:49:48, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.66s]
Epoch 0: 21%|██ | 2558/12384 [5:26:42<20:51:44, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.66s]
Epoch 0: 21%|██ | 2558/12384 [5:26:50<20:51:44, 7.64s/it, loss=0.0003, acc=0.9987, iter_time=7.65s]
Epoch 0: 21%|██ | 2559/12384 [5:26:50<21:08:22, 7.75s/it, loss=0.0003, acc=0.9987, iter_time=7.65s]
Epoch 0: 21%|██ | 2559/12384 [5:26:57<21:08:22, 7.75s/it, loss=0.0001, acc=1.0000, iter_time=7.89s]
Epoch 0: 21%|██ | 2560/12384 [5:26:57<21:01:44, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.89s]
Epoch 0: 21%|██ | 2560/12384 [5:27:05<21:01:44, 7.71s/it, loss=0.0012, acc=0.9972, iter_time=7.66s]
Epoch 0: 21%|██ | 2561/12384 [5:27:05<20:59:56, 7.70s/it, loss=0.0012, acc=0.9972, iter_time=7.66s]
Epoch 0: 21%|██ | 2561/12384 [5:27:12<20:59:56, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 0: 21%|██ | 2562/12384 [5:27:12<20:54:37, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 0: 21%|██ | 2562/12384 [5:27:20<20:54:37, 7.66s/it, loss=0.0006, acc=0.9979, iter_time=7.01s]
Epoch 0: 21%|██ | 2563/12384 [5:27:20<20:53:33, 7.66s/it, loss=0.0006, acc=0.9979, iter_time=7.01s]
Epoch 0: 21%|██ | 2563/12384 [5:27:28<20:53:33, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=8.24s]
Epoch 0: 21%|██ | 2564/12384 [5:27:28<20:52:31, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=8.24s]
Epoch 0: 21%|██ | 2564/12384 [5:27:35<20:52:31, 7.65s/it, loss=0.0009, acc=0.9979, iter_time=7.31s]
Epoch 0: 21%|██ | 2565/12384 [5:27:35<20:51:49, 7.65s/it, loss=0.0009, acc=0.9979, iter_time=7.31s]
Epoch 0: 21%|██ | 2565/12384 [5:27:43<20:51:49, 7.65s/it, loss=0.0021, acc=0.9964, iter_time=7.97s]
Epoch 0: 21%|██ | 2566/12384 [5:27:43<20:49:39, 7.64s/it, loss=0.0021, acc=0.9964, iter_time=7.97s]
Epoch 0: 21%|██ | 2566/12384 [5:27:51<20:49:39, 7.64s/it, loss=0.0001, acc=0.9999, iter_time=7.62s]
Epoch 0: 21%|██ | 2567/12384 [5:27:51<20:49:13, 7.64s/it, loss=0.0001, acc=0.9999, iter_time=7.62s]
Epoch 0: 21%|██ | 2567/12384 [5:27:58<20:49:13, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.03s]
Epoch 0: 21%|██ | 2568/12384 [5:27:58<20:52:32, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=8.03s]
Epoch 0: 21%|██ | 2568/12384 [5:28:06<20:52:32, 7.66s/it, loss=0.0002, acc=0.9998, iter_time=7.28s]
Epoch 0: 21%|██ | 2569/12384 [5:28:06<20:51:19, 7.65s/it, loss=0.0002, acc=0.9998, iter_time=7.28s]
Epoch 0: 21%|██ | 2569/12384 [5:28:14<20:51:19, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=6.17s]
Epoch 0: 21%|██ | 2570/12384 [5:28:14<20:53:56, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=6.17s]
Epoch 0: 21%|██ | 2570/12384 [5:28:21<20:53:56, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=8.24s]
Epoch 0: 21%|██ | 2571/12384 [5:28:21<20:51:54, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.24s]
Epoch 0: 21%|██ | 2571/12384 [5:28:29<20:51:54, 7.65s/it, loss=0.0003, acc=0.9998, iter_time=7.36s]
Epoch 0: 21%|██ | 2572/12384 [5:28:29<20:52:06, 7.66s/it, loss=0.0003, acc=0.9998, iter_time=7.36s]
Epoch 0: 21%|██ | 2572/12384 [5:28:37<20:52:06, 7.66s/it, loss=0.0004, acc=0.9994, iter_time=8.86s]
Epoch 0: 21%|██ | 2573/12384 [5:28:37<20:48:37, 7.64s/it, loss=0.0004, acc=0.9994, iter_time=8.86s]
Epoch 0: 21%|██ | 2573/12384 [5:28:44<20:48:37, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 21%|██ | 2574/12384 [5:28:44<20:49:43, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 21%|██ | 2574/12384 [5:28:52<20:49:43, 7.64s/it, loss=0.0316, acc=0.9499, iter_time=7.64s]
Epoch 0: 21%|██ | 2575/12384 [5:28:52<20:48:15, 7.64s/it, loss=0.0316, acc=0.9499, iter_time=7.64s]
Epoch 0: 21%|██ | 2575/12384 [5:28:59<20:48:15, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.00s]
Epoch 0: 21%|██ | 2576/12384 [5:28:59<20:48:45, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.00s]
Epoch 0: 21%|██ | 2576/12384 [5:29:07<20:48:45, 7.64s/it, loss=0.0002, acc=0.9987, iter_time=7.00s]
Epoch 0: 21%|██ | 2577/12384 [5:29:07<20:51:46, 7.66s/it, loss=0.0002, acc=0.9987, iter_time=7.00s]
Epoch 0: 21%|██ | 2577/12384 [5:29:15<20:51:46, 7.66s/it, loss=0.0002, acc=0.9990, iter_time=7.96s]
Epoch 0: 21%|██ | 2578/12384 [5:29:15<20:50:48, 7.65s/it, loss=0.0002, acc=0.9990, iter_time=7.96s]
Epoch 0: 21%|██ | 2578/12384 [5:29:22<20:50:48, 7.65s/it, loss=0.0003, acc=0.9986, iter_time=7.64s]
Epoch 0: 21%|██ | 2579/12384 [5:29:22<20:48:32, 7.64s/it, loss=0.0003, acc=0.9986, iter_time=7.64s]
Epoch 0: 21%|██ | 2579/12384 [5:29:30<20:48:32, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 21%|██ | 2580/12384 [5:29:30<20:48:54, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 21%|██ | 2580/12384 [5:29:38<20:48:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 0: 21%|██ | 2581/12384 [5:29:38<20:49:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 0: 21%|██ | 2581/12384 [5:29:45<20:49:10, 7.65s/it, loss=0.0001, acc=0.9999, iter_time=9.44s]
Epoch 0: 21%|██ | 2582/12384 [5:29:45<20:48:38, 7.64s/it, loss=0.0001, acc=0.9999, iter_time=9.44s]
Epoch 0: 21%|██ | 2582/12384 [5:29:53<20:48:38, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.08s]
Epoch 0: 21%|██ | 2583/12384 [5:29:53<20:50:22, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.08s]
Epoch 0: 21%|██ | 2583/12384 [5:30:01<20:50:22, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.64s]
Epoch 0: 21%|██ | 2584/12384 [5:30:01<20:51:37, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=8.64s]
Epoch 0: 21%|██ | 2584/12384 [5:30:09<20:51:37, 7.66s/it, loss=0.0051, acc=0.9949, iter_time=7.32s]
Epoch 0: 21%|██ | 2585/12384 [5:30:09<21:07:25, 7.76s/it, loss=0.0051, acc=0.9949, iter_time=7.32s]
Epoch 0: 21%|██ | 2585/12384 [5:30:16<21:07:25, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 0: 21%|██ | 2586/12384 [5:30:16<20:59:52, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 0: 21%|██ | 2586/12384 [5:30:24<20:59:52, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 0: 21%|██ | 2587/12384 [5:30:24<20:55:41, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 0: 21%|██ | 2587/12384 [5:30:32<20:55:41, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 21%|██ | 2588/12384 [5:30:32<20:54:36, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 21%|██ | 2588/12384 [5:30:39<20:54:36, 7.68s/it, loss=0.0016, acc=0.9970, iter_time=7.67s]
Epoch 0: 21%|██ | 2589/12384 [5:30:39<20:52:42, 7.67s/it, loss=0.0016, acc=0.9970, iter_time=7.67s]
Epoch 0: 21%|██ | 2589/12384 [5:30:47<20:52:42, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.41s]
Epoch 0: 21%|██ | 2590/12384 [5:30:47<20:48:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.41s]
Epoch 0: 21%|██ | 2590/12384 [5:30:55<20:48:22, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.86s]
Epoch 0: 21%|██ | 2591/12384 [5:30:55<20:47:50, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.86s]
Epoch 0: 21%|██ | 2591/12384 [5:31:02<20:47:50, 7.65s/it, loss=0.0003, acc=0.9997, iter_time=8.01s]
Epoch 0: 21%|██ | 2592/12384 [5:31:02<20:47:17, 7.64s/it, loss=0.0003, acc=0.9997, iter_time=8.01s]
Epoch 0: 21%|██ | 2592/12384 [5:31:10<20:47:17, 7.64s/it, loss=0.0005, acc=0.9989, iter_time=7.25s]
Epoch 0: 21%|██ | 2593/12384 [5:31:10<20:47:45, 7.65s/it, loss=0.0005, acc=0.9989, iter_time=7.25s]
Epoch 0: 21%|██ | 2593/12384 [5:31:17<20:47:45, 7.65s/it, loss=0.0004, acc=0.9995, iter_time=7.65s]
Epoch 0: 21%|██ | 2594/12384 [5:31:17<20:49:26, 7.66s/it, loss=0.0004, acc=0.9995, iter_time=7.65s]
Epoch 0: 21%|██ | 2594/12384 [5:31:25<20:49:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=3.83s]
Epoch 0: 21%|██ | 2595/12384 [5:31:25<20:49:45, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=3.83s]
Epoch 0: 21%|██ | 2595/12384 [5:31:33<20:49:45, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=10.01s]
Epoch 0: 21%|██ | 2596/12384 [5:31:33<20:49:14, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=10.01s]
Epoch 0: 21%|██ | 2596/12384 [5:31:40<20:49:14, 7.66s/it, loss=0.0005, acc=0.9974, iter_time=7.37s]
Epoch 0: 21%|██ | 2597/12384 [5:31:40<20:48:47, 7.66s/it, loss=0.0005, acc=0.9974, iter_time=7.37s]
Epoch 0: 21%|██ | 2597/12384 [5:31:48<20:48:47, 7.66s/it, loss=0.0004, acc=0.9977, iter_time=9.43s]
Epoch 0: 21%|██ | 2598/12384 [5:31:48<20:51:00, 7.67s/it, loss=0.0004, acc=0.9977, iter_time=9.43s]
Epoch 0: 21%|██ | 2598/12384 [5:31:56<20:51:00, 7.67s/it, loss=0.0007, acc=0.9971, iter_time=7.71s]
Epoch 0: 21%|██ | 2599/12384 [5:31:56<20:49:39, 7.66s/it, loss=0.0007, acc=0.9971, iter_time=7.71s]
Epoch 0: 21%|██ | 2599/12384 [5:32:03<20:49:39, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=8.07s]
Epoch 0: 21%|██ | 2600/12384 [5:32:03<20:48:37, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=8.07s]
Epoch 0: 21%|██ | 2600/12384 [5:32:11<20:48:37, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=6.35s]
Epoch 0: 21%|██ | 2601/12384 [5:32:11<20:47:43, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=6.35s]
Epoch 0: 21%|██ | 2601/12384 [5:32:19<20:47:43, 7.65s/it, loss=0.0006, acc=0.9975, iter_time=8.49s]
Epoch 0: 21%|██ | 2602/12384 [5:32:19<20:50:00, 7.67s/it, loss=0.0006, acc=0.9975, iter_time=8.49s]
Epoch 0: 21%|██ | 2602/12384 [5:32:26<20:50:00, 7.67s/it, loss=0.0021, acc=0.9964, iter_time=7.71s]
Epoch 0: 21%|██ | 2603/12384 [5:32:26<20:46:27, 7.65s/it, loss=0.0021, acc=0.9964, iter_time=7.71s]
Epoch 0: 21%|██ | 2603/12384 [5:32:34<20:46:27, 7.65s/it, loss=0.0008, acc=0.9979, iter_time=7.62s]
Epoch 0: 21%|██ | 2604/12384 [5:32:34<20:48:24, 7.66s/it, loss=0.0008, acc=0.9979, iter_time=7.62s]
Epoch 0: 21%|██ | 2604/12384 [5:32:42<20:48:24, 7.66s/it, loss=0.0002, acc=0.9991, iter_time=7.67s]
Epoch 0: 21%|██ | 2605/12384 [5:32:42<20:47:33, 7.65s/it, loss=0.0002, acc=0.9991, iter_time=7.67s]
Epoch 0: 21%|██ | 2605/12384 [5:32:49<20:47:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 21%|██ | 2606/12384 [5:32:49<20:44:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 21%|██ | 2606/12384 [5:32:57<20:44:43, 7.64s/it, loss=0.0004, acc=0.9998, iter_time=7.62s]
Epoch 0: 21%|██ | 2607/12384 [5:32:57<20:44:52, 7.64s/it, loss=0.0004, acc=0.9998, iter_time=7.62s]
Epoch 0: 21%|██ | 2607/12384 [5:33:05<20:44:52, 7.64s/it, loss=0.0005, acc=0.9983, iter_time=8.05s]
Epoch 0: 21%|██ | 2608/12384 [5:33:05<20:45:16, 7.64s/it, loss=0.0005, acc=0.9983, iter_time=8.05s]
Epoch 0: 21%|██ | 2608/12384 [5:33:12<20:45:16, 7.64s/it, loss=0.0017, acc=0.9954, iter_time=5.96s]
Epoch 0: 21%|██ | 2609/12384 [5:33:12<20:43:21, 7.63s/it, loss=0.0017, acc=0.9954, iter_time=5.96s]
Epoch 0: 21%|██ | 2609/12384 [5:33:20<20:43:21, 7.63s/it, loss=0.0006, acc=0.9992, iter_time=8.87s]
Epoch 0: 21%|██ | 2610/12384 [5:33:20<20:42:49, 7.63s/it, loss=0.0006, acc=0.9992, iter_time=8.87s]
Epoch 0: 21%|██ | 2610/12384 [5:33:28<20:42:49, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=5.64s]
Epoch 0: 21%|██ | 2611/12384 [5:33:28<20:58:12, 7.72s/it, loss=0.0001, acc=0.9998, iter_time=5.64s]
Epoch 0: 21%|██ | 2611/12384 [5:33:35<20:58:12, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=9.93s]
Epoch 0: 21%|██ | 2612/12384 [5:33:35<20:53:25, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=9.93s]
Epoch 0: 21%|██ | 2612/12384 [5:33:43<20:53:25, 7.70s/it, loss=0.0006, acc=0.9986, iter_time=7.63s]
Epoch 0: 21%|██ | 2613/12384 [5:33:43<20:48:39, 7.67s/it, loss=0.0006, acc=0.9986, iter_time=7.63s]
Epoch 0: 21%|██ | 2613/12384 [5:33:51<20:48:39, 7.67s/it, loss=0.0001, acc=0.9998, iter_time=7.29s]
Epoch 0: 21%|██ | 2614/12384 [5:33:51<20:46:16, 7.65s/it, loss=0.0001, acc=0.9998, iter_time=7.29s]
Epoch 0: 21%|██ | 2614/12384 [5:33:58<20:46:16, 7.65s/it, loss=0.0001, acc=0.9998, iter_time=7.94s]
Epoch 0: 21%|██ | 2615/12384 [5:33:58<20:45:22, 7.65s/it, loss=0.0001, acc=0.9998, iter_time=7.94s]
Epoch 0: 21%|██ | 2615/12384 [5:34:06<20:45:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 21%|██ | 2616/12384 [5:34:06<20:47:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 21%|██ | 2616/12384 [5:34:14<20:47:09, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.30s]
Epoch 0: 21%|██ | 2617/12384 [5:34:14<20:46:16, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.30s]
Epoch 0: 21%|██ | 2617/12384 [5:34:21<20:46:16, 7.66s/it, loss=0.0006, acc=0.9983, iter_time=5.57s]
Epoch 0: 21%|██ | 2618/12384 [5:34:21<20:45:22, 7.65s/it, loss=0.0006, acc=0.9983, iter_time=5.57s]
Epoch 0: 21%|██ | 2618/12384 [5:34:29<20:45:22, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=9.71s]
Epoch 0: 21%|██ | 2619/12384 [5:34:29<20:45:30, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=9.71s]
Epoch 0: 21%|██ | 2619/12384 [5:34:37<20:45:30, 7.65s/it, loss=0.0024, acc=0.9961, iter_time=7.66s]
Epoch 0: 21%|██ | 2620/12384 [5:34:37<20:43:49, 7.64s/it, loss=0.0024, acc=0.9961, iter_time=7.66s]
Epoch 0: 21%|██ | 2620/12384 [5:34:44<20:43:49, 7.64s/it, loss=0.0013, acc=0.9957, iter_time=7.67s]
Epoch 0: 21%|██ | 2621/12384 [5:34:44<20:44:01, 7.65s/it, loss=0.0013, acc=0.9957, iter_time=7.67s]
Epoch 0: 21%|██ | 2621/12384 [5:34:52<20:44:01, 7.65s/it, loss=0.0006, acc=0.9996, iter_time=7.59s]
Epoch 0: 21%|██ | 2622/12384 [5:34:52<20:43:45, 7.64s/it, loss=0.0006, acc=0.9996, iter_time=7.59s]
Epoch 0: 21%|██ | 2622/12384 [5:35:00<20:43:45, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.75s]
Epoch 0: 21%|██ | 2623/12384 [5:35:00<20:46:10, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.75s]
Epoch 0: 21%|██ | 2623/12384 [5:35:07<20:46:10, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=8.06s]
Epoch 0: 21%|██ | 2624/12384 [5:35:07<20:46:39, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=8.06s]
Epoch 0: 21%|██ | 2624/12384 [5:35:15<20:46:39, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.50s]
Epoch 0: 21%|██ | 2625/12384 [5:35:15<20:43:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.50s]
Epoch 0: 21%|██ | 2625/12384 [5:35:22<20:43:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 0: 21%|██ | 2626/12384 [5:35:22<20:43:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 0: 21%|██ | 2626/12384 [5:35:30<20:43:49, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=10.55s]
Epoch 0: 21%|██ | 2627/12384 [5:35:30<20:44:17, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=10.55s]
Epoch 0: 21%|██ | 2627/12384 [5:35:38<20:44:17, 7.65s/it, loss=0.0001, acc=0.9998, iter_time=7.30s]
Epoch 0: 21%|██ | 2628/12384 [5:35:38<20:44:52, 7.66s/it, loss=0.0001, acc=0.9998, iter_time=7.30s]
Epoch 0: 21%|██ | 2628/12384 [5:35:45<20:44:52, 7.66s/it, loss=0.0003, acc=1.0000, iter_time=5.80s]
Epoch 0: 21%|██ | 2629/12384 [5:35:45<20:44:23, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=5.80s]
Epoch 0: 21%|██ | 2629/12384 [5:35:53<20:44:23, 7.65s/it, loss=0.0006, acc=0.9990, iter_time=10.39s]
Epoch 0: 21%|██ | 2630/12384 [5:35:53<20:41:27, 7.64s/it, loss=0.0006, acc=0.9990, iter_time=10.39s]
Epoch 0: 21%|██ | 2630/12384 [5:36:01<20:41:27, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 21%|██ | 2631/12384 [5:36:01<20:41:00, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 21%|██ | 2631/12384 [5:36:08<20:41:00, 7.63s/it, loss=0.0009, acc=0.9979, iter_time=7.61s]
Epoch 0: 21%|██▏ | 2632/12384 [5:36:08<20:41:45, 7.64s/it, loss=0.0009, acc=0.9979, iter_time=7.61s]
Epoch 0: 21%|██▏ | 2632/12384 [5:36:16<20:41:45, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.33s]
Epoch 0: 21%|██▏ | 2633/12384 [5:36:16<20:39:26, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.33s]
Epoch 0: 21%|██▏ | 2633/12384 [5:36:24<20:39:26, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.29s]
Epoch 0: 21%|██▏ | 2634/12384 [5:36:24<20:42:11, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.29s]
Epoch 0: 21%|██▏ | 2634/12384 [5:36:31<20:42:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 0: 21%|██▏ | 2635/12384 [5:36:31<20:42:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 0: 21%|██▏ | 2635/12384 [5:36:39<20:42:15, 7.65s/it, loss=0.0039, acc=0.9901, iter_time=7.95s]
Epoch 0: 21%|██▏ | 2636/12384 [5:36:39<20:54:16, 7.72s/it, loss=0.0039, acc=0.9901, iter_time=7.95s]
Epoch 0: 21%|██▏ | 2636/12384 [5:36:47<20:54:16, 7.72s/it, loss=0.0008, acc=0.9986, iter_time=7.64s]
Epoch 0: 21%|██▏ | 2637/12384 [5:36:47<21:05:35, 7.79s/it, loss=0.0008, acc=0.9986, iter_time=7.64s]
Epoch 0: 21%|██▏ | 2637/12384 [5:36:55<21:05:35, 7.79s/it, loss=0.0009, acc=0.9998, iter_time=6.10s]
Epoch 0: 21%|██▏ | 2638/12384 [5:36:55<20:56:44, 7.74s/it, loss=0.0009, acc=0.9998, iter_time=6.10s]
Epoch 0: 21%|██▏ | 2638/12384 [5:37:02<20:56:44, 7.74s/it, loss=0.0081, acc=0.9851, iter_time=9.43s]
Epoch 0: 21%|██▏ | 2639/12384 [5:37:02<20:52:45, 7.71s/it, loss=0.0081, acc=0.9851, iter_time=9.43s]
Epoch 0: 21%|██▏ | 2639/12384 [5:37:10<20:52:45, 7.71s/it, loss=0.0010, acc=0.9975, iter_time=8.04s]
Epoch 0: 21%|██▏ | 2640/12384 [5:37:10<20:48:40, 7.69s/it, loss=0.0010, acc=0.9975, iter_time=8.04s]
Epoch 0: 21%|██▏ | 2640/12384 [5:37:16<20:48:40, 7.69s/it, loss=0.0029, acc=0.9933, iter_time=4.04s]
Epoch 0: 21%|██▏ | 2641/12384 [5:37:16<19:39:46, 7.27s/it, loss=0.0029, acc=0.9933, iter_time=4.04s]
Epoch 0: 21%|██▏ | 2641/12384 [5:37:24<19:39:46, 7.27s/it, loss=0.0002, acc=0.9999, iter_time=9.51s]
Epoch 0: 21%|██▏ | 2642/12384 [5:37:24<20:00:36, 7.39s/it, loss=0.0002, acc=0.9999, iter_time=9.51s]
Epoch 0: 21%|██▏ | 2642/12384 [5:37:32<20:00:36, 7.39s/it, loss=0.0053, acc=0.9917, iter_time=7.68s]
Epoch 0: 21%|██▏ | 2643/12384 [5:37:32<20:11:03, 7.46s/it, loss=0.0053, acc=0.9917, iter_time=7.68s]
Epoch 0: 21%|██▏ | 2643/12384 [5:37:39<20:11:03, 7.46s/it, loss=0.0003, acc=0.9998, iter_time=4.99s]
Epoch 0: 21%|██▏ | 2644/12384 [5:37:39<20:22:37, 7.53s/it, loss=0.0003, acc=0.9998, iter_time=4.99s]
Epoch 0: 21%|██▏ | 2644/12384 [5:37:47<20:22:37, 7.53s/it, loss=0.0003, acc=1.0000, iter_time=10.31s]
Epoch 0: 21%|██▏ | 2645/12384 [5:37:47<20:32:35, 7.59s/it, loss=0.0003, acc=1.0000, iter_time=10.31s]
Epoch 0: 21%|██▏ | 2645/12384 [5:37:55<20:32:35, 7.59s/it, loss=0.0003, acc=1.0000, iter_time=7.75s]
Epoch 0: 21%|██▏ | 2646/12384 [5:37:55<20:35:56, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=7.75s]
Epoch 0: 21%|██▏ | 2646/12384 [5:38:02<20:35:56, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.67s]
Epoch 0: 21%|██▏ | 2647/12384 [5:38:02<20:35:31, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.67s]
Epoch 0: 21%|██▏ | 2647/12384 [5:38:10<20:35:31, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 0: 21%|██▏ | 2648/12384 [5:38:10<20:35:53, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 0: 21%|██▏ | 2648/12384 [5:38:18<20:35:53, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=5.46s]
Epoch 0: 21%|██▏ | 2649/12384 [5:38:18<20:36:42, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=5.46s]
Epoch 0: 21%|██▏ | 2649/12384 [5:38:25<20:36:42, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=9.87s]
Epoch 0: 21%|██▏ | 2650/12384 [5:38:25<20:38:40, 7.64s/it, loss=0.0002, acc=0.9998, iter_time=9.87s]
Epoch 0: 21%|██▏ | 2650/12384 [5:38:33<20:38:40, 7.64s/it, loss=0.0002, acc=0.9988, iter_time=7.21s]
Epoch 0: 21%|██▏ | 2651/12384 [5:38:33<20:39:33, 7.64s/it, loss=0.0002, acc=0.9988, iter_time=7.21s]
Epoch 0: 21%|██▏ | 2651/12384 [5:38:41<20:39:33, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 0: 21%|██▏ | 2652/12384 [5:38:41<20:40:24, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 0: 21%|██▏ | 2652/12384 [5:38:48<20:40:24, 7.65s/it, loss=0.0005, acc=0.9992, iter_time=4.52s]
Epoch 0: 21%|██▏ | 2653/12384 [5:38:48<20:42:17, 7.66s/it, loss=0.0005, acc=0.9992, iter_time=4.52s]
Epoch 0: 21%|██▏ | 2653/12384 [5:38:56<20:42:17, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 0: 21%|██▏ | 2654/12384 [5:38:56<20:41:53, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 0: 21%|██▏ | 2654/12384 [5:39:04<20:41:53, 7.66s/it, loss=0.0010, acc=0.9981, iter_time=8.59s]
Epoch 0: 21%|██▏ | 2655/12384 [5:39:04<20:44:28, 7.67s/it, loss=0.0010, acc=0.9981, iter_time=8.59s]
Epoch 0: 21%|██▏ | 2655/12384 [5:39:11<20:44:28, 7.67s/it, loss=0.0005, acc=0.9998, iter_time=8.10s]
Epoch 0: 21%|██▏ | 2656/12384 [5:39:11<20:44:17, 7.67s/it, loss=0.0005, acc=0.9998, iter_time=8.10s]
Epoch 0: 21%|██▏ | 2656/12384 [5:39:19<20:44:17, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.30s]
Epoch 0: 21%|██▏ | 2657/12384 [5:39:19<20:43:01, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.30s]
Epoch 0: 21%|██▏ | 2657/12384 [5:39:27<20:43:01, 7.67s/it, loss=0.0008, acc=0.9978, iter_time=7.63s]
Epoch 0: 21%|██▏ | 2658/12384 [5:39:27<20:39:27, 7.65s/it, loss=0.0008, acc=0.9978, iter_time=7.63s]
Epoch 0: 21%|██▏ | 2658/12384 [5:39:34<20:39:27, 7.65s/it, loss=0.0001, acc=0.9997, iter_time=7.60s]
Epoch 0: 21%|██▏ | 2659/12384 [5:39:34<20:36:36, 7.63s/it, loss=0.0001, acc=0.9997, iter_time=7.60s]
Epoch 0: 21%|██▏ | 2659/12384 [5:39:42<20:36:36, 7.63s/it, loss=0.0024, acc=0.9961, iter_time=7.60s]
Epoch 0: 21%|██▏ | 2660/12384 [5:39:42<20:36:01, 7.63s/it, loss=0.0024, acc=0.9961, iter_time=7.60s]
Epoch 0: 21%|██▏ | 2660/12384 [5:39:49<20:36:01, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.63s]
Epoch 0: 21%|██▏ | 2661/12384 [5:39:49<20:37:34, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.63s]
Epoch 0: 21%|██▏ | 2661/12384 [5:39:57<20:37:34, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.68s]
Epoch 0: 21%|██▏ | 2662/12384 [5:39:57<20:37:24, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.68s]
Epoch 0: 21%|██▏ | 2662/12384 [5:40:05<20:37:24, 7.64s/it, loss=0.0002, acc=0.9993, iter_time=5.26s]
Epoch 0: 22%|██▏ | 2663/12384 [5:40:05<20:36:35, 7.63s/it, loss=0.0002, acc=0.9993, iter_time=5.26s]
Epoch 0: 22%|██▏ | 2663/12384 [5:40:13<20:36:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.30s]
Epoch 0: 22%|██▏ | 2664/12384 [5:40:13<20:54:06, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=10.30s]
Epoch 0: 22%|██▏ | 2664/12384 [5:40:20<20:54:06, 7.74s/it, loss=0.0003, acc=0.9996, iter_time=7.66s]
Epoch 0: 22%|██▏ | 2665/12384 [5:40:20<20:47:29, 7.70s/it, loss=0.0003, acc=0.9996, iter_time=7.66s]
Epoch 0: 22%|██▏ | 2665/12384 [5:40:28<20:47:29, 7.70s/it, loss=0.0001, acc=0.9993, iter_time=7.62s]
Epoch 0: 22%|██▏ | 2666/12384 [5:40:28<20:42:43, 7.67s/it, loss=0.0001, acc=0.9993, iter_time=7.62s]
Epoch 0: 22%|██▏ | 2666/12384 [5:40:35<20:42:43, 7.67s/it, loss=0.0012, acc=0.9973, iter_time=7.58s]
Epoch 0: 22%|██▏ | 2667/12384 [5:40:35<20:38:59, 7.65s/it, loss=0.0012, acc=0.9973, iter_time=7.58s]
Epoch 0: 22%|██▏ | 2667/12384 [5:40:43<20:38:59, 7.65s/it, loss=0.0001, acc=0.9999, iter_time=7.63s]
Epoch 0: 22%|██▏ | 2668/12384 [5:40:43<20:38:26, 7.65s/it, loss=0.0001, acc=0.9999, iter_time=7.63s]
Epoch 0: 22%|██▏ | 2668/12384 [5:40:51<20:38:26, 7.65s/it, loss=0.0020, acc=0.9934, iter_time=7.62s]
Epoch 0: 22%|██▏ | 2669/12384 [5:40:51<20:36:01, 7.63s/it, loss=0.0020, acc=0.9934, iter_time=7.62s]
Epoch 0: 22%|██▏ | 2669/12384 [5:40:58<20:36:01, 7.63s/it, loss=0.0002, acc=0.9998, iter_time=7.60s]
Epoch 0: 22%|██▏ | 2670/12384 [5:40:58<20:34:17, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=7.60s]
Epoch 0: 22%|██▏ | 2670/12384 [5:41:06<20:34:17, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.88s]
Epoch 0: 22%|██▏ | 2671/12384 [5:41:06<20:35:20, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.88s]
Epoch 0: 22%|██▏ | 2671/12384 [5:41:14<20:35:20, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=9.77s]
Epoch 0: 22%|██▏ | 2672/12384 [5:41:14<20:36:50, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=9.77s]
Epoch 0: 22%|██▏ | 2672/12384 [5:41:21<20:36:50, 7.64s/it, loss=0.0005, acc=1.0000, iter_time=5.47s]
Epoch 0: 22%|██▏ | 2673/12384 [5:41:21<20:36:02, 7.64s/it, loss=0.0005, acc=1.0000, iter_time=5.47s]
Epoch 0: 22%|██▏ | 2673/12384 [5:41:29<20:36:02, 7.64s/it, loss=0.0002, acc=0.9995, iter_time=8.49s]
Epoch 0: 22%|██▏ | 2674/12384 [5:41:29<20:35:32, 7.63s/it, loss=0.0002, acc=0.9995, iter_time=8.49s]
Epoch 0: 22%|██▏ | 2674/12384 [5:41:36<20:35:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 0: 22%|██▏ | 2675/12384 [5:41:36<20:34:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 0: 22%|██▏ | 2675/12384 [5:41:44<20:34:13, 7.63s/it, loss=0.0004, acc=0.9971, iter_time=4.80s]
Epoch 0: 22%|██▏ | 2676/12384 [5:41:44<20:37:23, 7.65s/it, loss=0.0004, acc=0.9971, iter_time=4.80s]
Epoch 0: 22%|██▏ | 2676/12384 [5:41:52<20:37:23, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=9.57s]
Epoch 0: 22%|██▏ | 2677/12384 [5:41:52<20:36:33, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=9.57s]
Epoch 0: 22%|██▏ | 2677/12384 [5:41:59<20:36:33, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=5.80s]
Epoch 0: 22%|██▏ | 2678/12384 [5:41:59<20:34:50, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.80s]
Epoch 0: 22%|██▏ | 2678/12384 [5:42:07<20:34:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 0: 22%|██▏ | 2679/12384 [5:42:07<20:36:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 0: 22%|██▏ | 2679/12384 [5:42:15<20:36:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 0: 22%|██▏ | 2680/12384 [5:42:15<20:36:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 0: 22%|██▏ | 2680/12384 [5:42:22<20:36:27, 7.65s/it, loss=0.0022, acc=0.9950, iter_time=7.25s]
Epoch 0: 22%|██▏ | 2681/12384 [5:42:22<20:34:18, 7.63s/it, loss=0.0022, acc=0.9950, iter_time=7.25s]
Epoch 0: 22%|██▏ | 2681/12384 [5:42:30<20:34:18, 7.63s/it, loss=0.0006, acc=0.9991, iter_time=6.68s]
Epoch 0: 22%|██▏ | 2682/12384 [5:42:30<20:34:02, 7.63s/it, loss=0.0006, acc=0.9991, iter_time=6.68s]
Epoch 0: 22%|██▏ | 2682/12384 [5:42:38<20:34:02, 7.63s/it, loss=0.0002, acc=0.9996, iter_time=8.56s]
Epoch 0: 22%|██▏ | 2683/12384 [5:42:38<20:34:19, 7.63s/it, loss=0.0002, acc=0.9996, iter_time=8.56s]
Epoch 0: 22%|██▏ | 2683/12384 [5:42:45<20:34:19, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.73s]
Epoch 0: 22%|██▏ | 2684/12384 [5:42:45<20:37:28, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.73s]
Epoch 0: 22%|██▏ | 2684/12384 [5:42:53<20:37:28, 7.65s/it, loss=0.0001, acc=0.9999, iter_time=7.03s]
Epoch 0: 22%|██▏ | 2685/12384 [5:42:53<20:39:17, 7.67s/it, loss=0.0001, acc=0.9999, iter_time=7.03s]
Epoch 0: 22%|██▏ | 2685/12384 [5:43:01<20:39:17, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=8.27s]
Epoch 0: 22%|██▏ | 2686/12384 [5:43:01<20:38:04, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=8.27s]
Epoch 0: 22%|██▏ | 2686/12384 [5:43:08<20:38:04, 7.66s/it, loss=0.0005, acc=0.9985, iter_time=7.68s]
Epoch 0: 22%|██▏ | 2687/12384 [5:43:08<20:38:29, 7.66s/it, loss=0.0005, acc=0.9985, iter_time=7.68s]
Epoch 0: 22%|██▏ | 2687/12384 [5:43:16<20:38:29, 7.66s/it, loss=0.0007, acc=0.9991, iter_time=7.63s]
Epoch 0: 22%|██▏ | 2688/12384 [5:43:16<20:37:55, 7.66s/it, loss=0.0007, acc=0.9991, iter_time=7.63s]
Epoch 0: 22%|██▏ | 2688/12384 [5:43:24<20:37:55, 7.66s/it, loss=0.0002, acc=0.9998, iter_time=7.64s]
Epoch 0: 22%|██▏ | 2689/12384 [5:43:24<20:35:14, 7.64s/it, loss=0.0002, acc=0.9998, iter_time=7.64s]
Epoch 0: 22%|██▏ | 2689/12384 [5:43:32<20:35:14, 7.64s/it, loss=0.0004, acc=0.9998, iter_time=5.11s]
Epoch 0: 22%|██▏ | 2690/12384 [5:43:32<20:51:44, 7.75s/it, loss=0.0004, acc=0.9998, iter_time=5.11s]
Epoch 0: 22%|██▏ | 2690/12384 [5:43:39<20:51:44, 7.75s/it, loss=0.0001, acc=1.0000, iter_time=6.53s]
Epoch 0: 22%|██▏ | 2691/12384 [5:43:39<20:47:21, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=6.53s]
Epoch 0: 22%|██▏ | 2691/12384 [5:43:47<20:47:21, 7.72s/it, loss=0.0022, acc=0.9954, iter_time=11.64s]
Epoch 0: 22%|██▏ | 2692/12384 [5:43:47<20:41:36, 7.69s/it, loss=0.0022, acc=0.9954, iter_time=11.64s]
Epoch 0: 22%|██▏ | 2692/12384 [5:43:55<20:41:36, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 22%|██▏ | 2693/12384 [5:43:55<20:40:58, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 22%|██▏ | 2693/12384 [5:44:02<20:40:58, 7.68s/it, loss=0.0002, acc=0.9998, iter_time=6.82s]
Epoch 0: 22%|██▏ | 2694/12384 [5:44:02<20:38:19, 7.67s/it, loss=0.0002, acc=0.9998, iter_time=6.82s]
Epoch 0: 22%|██▏ | 2694/12384 [5:44:10<20:38:19, 7.67s/it, loss=0.0003, acc=0.9998, iter_time=7.93s]
Epoch 0: 22%|██▏ | 2695/12384 [5:44:10<20:35:11, 7.65s/it, loss=0.0003, acc=0.9998, iter_time=7.93s]
Epoch 0: 22%|██▏ | 2695/12384 [5:44:17<20:35:11, 7.65s/it, loss=0.0004, acc=0.9991, iter_time=8.55s]
Epoch 0: 22%|██▏ | 2696/12384 [5:44:17<20:35:01, 7.65s/it, loss=0.0004, acc=0.9991, iter_time=8.55s]
Epoch 0: 22%|██▏ | 2696/12384 [5:44:25<20:35:01, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=4.00s]
Epoch 0: 22%|██▏ | 2697/12384 [5:44:25<20:33:10, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=4.00s]
Epoch 0: 22%|██▏ | 2697/12384 [5:44:33<20:33:10, 7.64s/it, loss=0.0003, acc=0.9998, iter_time=8.09s]
Epoch 0: 22%|██▏ | 2698/12384 [5:44:33<20:35:25, 7.65s/it, loss=0.0003, acc=0.9998, iter_time=8.09s]
Epoch 0: 22%|██▏ | 2698/12384 [5:44:40<20:35:25, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.93s]
Epoch 0: 22%|██▏ | 2699/12384 [5:44:40<20:33:51, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.93s]
Epoch 0: 22%|██▏ | 2699/12384 [5:44:48<20:33:51, 7.64s/it, loss=0.0048, acc=0.9951, iter_time=10.57s]
Epoch 0: 22%|██▏ | 2700/12384 [5:44:48<20:32:35, 7.64s/it, loss=0.0048, acc=0.9951, iter_time=10.57s]
Epoch 0: 22%|██▏ | 2700/12384 [5:44:56<20:32:35, 7.64s/it, loss=0.0002, acc=0.9996, iter_time=7.21s]
Epoch 0: 22%|██▏ | 2701/12384 [5:44:56<20:32:01, 7.63s/it, loss=0.0002, acc=0.9996, iter_time=7.21s]
Epoch 0: 22%|██▏ | 2701/12384 [5:45:03<20:32:01, 7.63s/it, loss=0.0002, acc=0.9999, iter_time=7.64s]
Epoch 0: 22%|██▏ | 2702/12384 [5:45:03<20:32:50, 7.64s/it, loss=0.0002, acc=0.9999, iter_time=7.64s]
Epoch 0: 22%|██▏ | 2702/12384 [5:45:11<20:32:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.42s]
Epoch 0: 22%|██▏ | 2703/12384 [5:45:11<20:30:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.42s]
Epoch 0: 22%|██▏ | 2703/12384 [5:45:18<20:30:38, 7.63s/it, loss=0.0015, acc=0.9963, iter_time=7.82s]
Epoch 0: 22%|██▏ | 2704/12384 [5:45:18<20:32:14, 7.64s/it, loss=0.0015, acc=0.9963, iter_time=7.82s]
Epoch 0: 22%|██▏ | 2704/12384 [5:45:26<20:32:14, 7.64s/it, loss=0.0001, acc=0.9988, iter_time=4.81s]
Epoch 0: 22%|██▏ | 2705/12384 [5:45:26<20:32:37, 7.64s/it, loss=0.0001, acc=0.9988, iter_time=4.81s]
Epoch 0: 22%|██▏ | 2705/12384 [5:45:34<20:32:37, 7.64s/it, loss=0.0008, acc=1.0000, iter_time=10.48s]
Epoch 0: 22%|██▏ | 2706/12384 [5:45:34<20:31:07, 7.63s/it, loss=0.0008, acc=1.0000, iter_time=10.48s]
Epoch 0: 22%|██▏ | 2706/12384 [5:45:41<20:31:07, 7.63s/it, loss=0.0004, acc=0.9990, iter_time=7.64s]
Epoch 0: 22%|██▏ | 2707/12384 [5:45:41<20:31:50, 7.64s/it, loss=0.0004, acc=0.9990, iter_time=7.64s]
Epoch 0: 22%|██▏ | 2707/12384 [5:45:49<20:31:50, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.65s]
Epoch 0: 22%|██▏ | 2708/12384 [5:45:49<20:32:40, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.65s]
Epoch 0: 22%|██▏ | 2708/12384 [5:45:57<20:32:40, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 0: 22%|██▏ | 2709/12384 [5:45:57<20:32:49, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 0: 22%|██▏ | 2709/12384 [5:46:04<20:32:49, 7.65s/it, loss=0.0002, acc=0.9992, iter_time=7.12s]
Epoch 0: 22%|██▏ | 2710/12384 [5:46:04<20:32:08, 7.64s/it, loss=0.0002, acc=0.9992, iter_time=7.12s]
Epoch 0: 22%|██▏ | 2710/12384 [5:46:12<20:32:08, 7.64s/it, loss=0.0063, acc=0.9969, iter_time=5.11s]
Epoch 0: 22%|██▏ | 2711/12384 [5:46:12<20:34:46, 7.66s/it, loss=0.0063, acc=0.9969, iter_time=5.11s]
Epoch 0: 22%|██▏ | 2711/12384 [5:46:20<20:34:46, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.85s]
Epoch 0: 22%|██▏ | 2712/12384 [5:46:20<20:32:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.85s]
Epoch 0: 22%|██▏ | 2712/12384 [5:46:27<20:32:41, 7.65s/it, loss=0.0001, acc=0.9998, iter_time=5.30s]
Epoch 0: 22%|██▏ | 2713/12384 [5:46:27<20:38:36, 7.68s/it, loss=0.0001, acc=0.9998, iter_time=5.30s]
Epoch 0: 22%|██▏ | 2713/12384 [5:46:35<20:38:36, 7.68s/it, loss=0.0005, acc=0.9962, iter_time=6.73s]
Epoch 0: 22%|██▏ | 2714/12384 [5:46:35<20:36:39, 7.67s/it, loss=0.0005, acc=0.9962, iter_time=6.73s]
Epoch 0: 22%|██▏ | 2714/12384 [5:46:43<20:36:39, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=10.89s]
Epoch 0: 22%|██▏ | 2715/12384 [5:46:43<20:34:54, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=10.89s]
Epoch 0: 22%|██▏ | 2715/12384 [5:46:50<20:34:54, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.12s]
Epoch 0: 22%|██▏ | 2716/12384 [5:46:50<20:32:41, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.12s]
Epoch 0: 22%|██▏ | 2716/12384 [5:46:58<20:32:41, 7.65s/it, loss=0.0003, acc=0.9999, iter_time=7.33s]
Epoch 0: 22%|██▏ | 2717/12384 [5:46:58<20:47:40, 7.74s/it, loss=0.0003, acc=0.9999, iter_time=7.33s]
Epoch 0: 22%|██▏ | 2717/12384 [5:47:06<20:47:40, 7.74s/it, loss=0.0003, acc=0.9991, iter_time=8.79s]
Epoch 0: 22%|██▏ | 2718/12384 [5:47:06<20:42:23, 7.71s/it, loss=0.0003, acc=0.9991, iter_time=8.79s]
Epoch 0: 22%|██▏ | 2718/12384 [5:47:14<20:42:23, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 22%|██▏ | 2719/12384 [5:47:14<20:38:47, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 22%|██▏ | 2719/12384 [5:47:21<20:38:47, 7.69s/it, loss=0.0004, acc=0.9978, iter_time=8.03s]
Epoch 0: 22%|██▏ | 2720/12384 [5:47:21<20:36:57, 7.68s/it, loss=0.0004, acc=0.9978, iter_time=8.03s]W0310 14:09:33.982000 62051 site-packages/torch/distributed/elastic/agent/server/api.py:725] Received 15 death signal, shutting down workers
+W0310 14:09:33.986000 62051 site-packages/torch/distributed/elastic/multiprocessing/api.py:908] Sending process 62184 closing signal SIGTERM
+W0310 14:09:33.987000 62051 site-packages/torch/distributed/elastic/multiprocessing/api.py:908] Sending process 62185 closing signal SIGTERM
+W0310 14:09:33.987000 62051 site-packages/torch/distributed/elastic/multiprocessing/api.py:908] Sending process 62186 closing signal SIGTERM
+W0310 14:09:33.987000 62051 site-packages/torch/distributed/elastic/multiprocessing/api.py:908] Sending process 62187 closing signal SIGTERM
+W0310 14:09:33.987000 62051 site-packages/torch/distributed/elastic/multiprocessing/api.py:908] Sending process 62188 closing signal SIGTERM
+W0310 14:09:33.988000 62051 site-packages/torch/distributed/elastic/multiprocessing/api.py:908] Sending process 62189 closing signal SIGTERM
+W0310 14:09:33.988000 62051 site-packages/torch/distributed/elastic/multiprocessing/api.py:908] Sending process 62190 closing signal SIGTERM
+W0310 14:09:33.988000 62051 site-packages/torch/distributed/elastic/multiprocessing/api.py:908] Sending process 62191 closing signal SIGTERM
+Traceback (most recent call last):
+ File "", line 198, in _run_module_as_main
+ File "", line 88, in _run_code
+ File "/workspace/hanrui/specforge/lib/python3.11/site-packages/torch/distributed/run.py", line 940, in
+ main()
+ File "/workspace/hanrui/specforge/lib/python3.11/site-packages/torch/distributed/elastic/multiprocessing/errors/__init__.py", line 357, in wrapper
+ return f(*args, **kwargs)
+ ^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/specforge/lib/python3.11/site-packages/torch/distributed/run.py", line 936, in main
+ run(args)
+ File "/workspace/hanrui/specforge/lib/python3.11/site-packages/torch/distributed/run.py", line 927, in run
+ elastic_launch(
+ File "/workspace/hanrui/specforge/lib/python3.11/site-packages/torch/distributed/launcher/api.py", line 156, in __call__
+ return launch_agent(self._config, self._entrypoint, list(args))
+ ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/specforge/lib/python3.11/site-packages/torch/distributed/launcher/api.py", line 284, in launch_agent
+ result = agent.run()
+ ^^^^^^^^^^^
+ File "/workspace/hanrui/specforge/lib/python3.11/site-packages/torch/distributed/elastic/metrics/api.py", line 138, in wrapper
+ result = f(*args, **kwargs)
+ ^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/specforge/lib/python3.11/site-packages/torch/distributed/elastic/agent/server/api.py", line 717, in run
+ result = self._invoke_run(role)
+ ^^^^^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/specforge/lib/python3.11/site-packages/torch/distributed/elastic/agent/server/api.py", line 881, in _invoke_run
+ time.sleep(monitor_interval)
+ File "/workspace/hanrui/specforge/lib/python3.11/site-packages/torch/distributed/elastic/multiprocessing/api.py", line 85, in _terminate_process_handler
+ raise SignalException(f"Process {os.getpid()} got signal: {sigval}", sigval=sigval)
+torch.distributed.elastic.multiprocessing.api.SignalException: Process 62051 got signal: 15
diff --git a/syxin_old/dflash_8gpu_03-31-14:16.log b/syxin_old/dflash_8gpu_03-31-14:16.log
new file mode 100644
index 0000000000000000000000000000000000000000..82631e5647773ba5130bffbfa7ec734992aba86d
--- /dev/null
+++ b/syxin_old/dflash_8gpu_03-31-14:16.log
@@ -0,0 +1,198 @@
+nohup: ignoring input
+WARNING:__main__:
+*****************************************
+Setting OMP_NUM_THREADS environment variable for each process to be 1 in default, to avoid your system being overloaded, please further tune the variable for optimal performance in your application as needed.
+*****************************************
+Traceback (most recent call last):
+ File "/workspace/hanrui/syxin_old/Specforge/scripts/train_dflash.py", line 24, in
+ from specforge.args import SGLangBackendArgs, TrackerArgs
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/__init__.py", line 1, in
+ from .core import * # noqa
+ ^^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/core/__init__.py", line 1, in
+ from .dflash import OnlineDFlashModel, create_dflash_loss_mask
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/core/dflash.py", line 11, in
+ from specforge.modeling.draft.dflash import DFlashDraftModel
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/modeling/__init__.py", line 2, in
+ from .auto import AutoDraftModelConfig, AutoEagle3DraftModel
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/modeling/auto.py", line 21, in
+ from .draft.llama3_eagle import LlamaForCausalLMEagle3
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/__init__.py", line 8, in
+ from .llama3_eagle import LlamaForCausalLMEagle3
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py", line 9, in
+ from torch.nn.attention.flex_attention import create_block_mask, flex_attention
+ModuleNotFoundError: No module named 'torch.nn.attention.flex_attention'
+Traceback (most recent call last):
+ File "/workspace/hanrui/syxin_old/Specforge/scripts/train_dflash.py", line 24, in
+ from specforge.args import SGLangBackendArgs, TrackerArgs
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/__init__.py", line 1, in
+ from .core import * # noqa
+ ^^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/core/__init__.py", line 1, in
+ from .dflash import OnlineDFlashModel, create_dflash_loss_mask
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/core/dflash.py", line 11, in
+ from specforge.modeling.draft.dflash import DFlashDraftModel
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/modeling/__init__.py", line 2, in
+ from .auto import AutoDraftModelConfig, AutoEagle3DraftModel
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/modeling/auto.py", line 21, in
+ from .draft.llama3_eagle import LlamaForCausalLMEagle3
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/__init__.py", line 8, in
+ from .llama3_eagle import LlamaForCausalLMEagle3
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py", line 9, in
+ from torch.nn.attention.flex_attention import create_block_mask, flex_attention
+ModuleNotFoundError: No module named 'torch.nn.attention.flex_attention'
+Traceback (most recent call last):
+ File "/workspace/hanrui/syxin_old/Specforge/scripts/train_dflash.py", line 24, in
+ from specforge.args import SGLangBackendArgs, TrackerArgs
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/__init__.py", line 1, in
+ from .core import * # noqa
+ ^^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/core/__init__.py", line 1, in
+ from .dflash import OnlineDFlashModel, create_dflash_loss_mask
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/core/dflash.py", line 11, in
+ from specforge.modeling.draft.dflash import DFlashDraftModel
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/modeling/__init__.py", line 2, in
+ from .auto import AutoDraftModelConfig, AutoEagle3DraftModel
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/modeling/auto.py", line 21, in
+ from .draft.llama3_eagle import LlamaForCausalLMEagle3
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/__init__.py", line 8, in
+ from .llama3_eagle import LlamaForCausalLMEagle3
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py", line 9, in
+ from torch.nn.attention.flex_attention import create_block_mask, flex_attention
+ModuleNotFoundError: No module named 'torch.nn.attention.flex_attention'
+Traceback (most recent call last):
+ File "/workspace/hanrui/syxin_old/Specforge/scripts/train_dflash.py", line 24, in
+ from specforge.args import SGLangBackendArgs, TrackerArgs
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/__init__.py", line 1, in
+ from .core import * # noqa
+ ^^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/core/__init__.py", line 1, in
+ from .dflash import OnlineDFlashModel, create_dflash_loss_mask
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/core/dflash.py", line 11, in
+ from specforge.modeling.draft.dflash import DFlashDraftModel
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/modeling/__init__.py", line 2, in
+ from .auto import AutoDraftModelConfig, AutoEagle3DraftModel
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/modeling/auto.py", line 21, in
+ from .draft.llama3_eagle import LlamaForCausalLMEagle3
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/__init__.py", line 8, in
+ from .llama3_eagle import LlamaForCausalLMEagle3
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py", line 9, in
+ from torch.nn.attention.flex_attention import create_block_mask, flex_attention
+ModuleNotFoundError: No module named 'torch.nn.attention.flex_attention'
+Traceback (most recent call last):
+ File "/workspace/hanrui/syxin_old/Specforge/scripts/train_dflash.py", line 24, in
+ from specforge.args import SGLangBackendArgs, TrackerArgs
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/__init__.py", line 1, in
+ from .core import * # noqa
+ ^^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/core/__init__.py", line 1, in
+ from .dflash import OnlineDFlashModel, create_dflash_loss_mask
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/core/dflash.py", line 11, in
+ from specforge.modeling.draft.dflash import DFlashDraftModel
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/modeling/__init__.py", line 2, in
+ from .auto import AutoDraftModelConfig, AutoEagle3DraftModel
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/modeling/auto.py", line 21, in
+ from .draft.llama3_eagle import LlamaForCausalLMEagle3
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/__init__.py", line 8, in
+ from .llama3_eagle import LlamaForCausalLMEagle3
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py", line 9, in
+ from torch.nn.attention.flex_attention import create_block_mask, flex_attention
+ModuleNotFoundError: No module named 'torch.nn.attention.flex_attention'
+Traceback (most recent call last):
+ File "/workspace/hanrui/syxin_old/Specforge/scripts/train_dflash.py", line 24, in
+ from specforge.args import SGLangBackendArgs, TrackerArgs
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/__init__.py", line 1, in
+ from .core import * # noqa
+ ^^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/core/__init__.py", line 1, in
+ from .dflash import OnlineDFlashModel, create_dflash_loss_mask
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/core/dflash.py", line 11, in
+ from specforge.modeling.draft.dflash import DFlashDraftModel
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/modeling/__init__.py", line 2, in
+ from .auto import AutoDraftModelConfig, AutoEagle3DraftModel
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/modeling/auto.py", line 21, in
+ from .draft.llama3_eagle import LlamaForCausalLMEagle3
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/__init__.py", line 8, in
+ from .llama3_eagle import LlamaForCausalLMEagle3
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py", line 9, in
+ from torch.nn.attention.flex_attention import create_block_mask, flex_attention
+ModuleNotFoundError: No module named 'torch.nn.attention.flex_attention'
+Traceback (most recent call last):
+ File "/workspace/hanrui/syxin_old/Specforge/scripts/train_dflash.py", line 24, in
+ from specforge.args import SGLangBackendArgs, TrackerArgs
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/__init__.py", line 1, in
+ from .core import * # noqa
+ ^^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/core/__init__.py", line 1, in
+ from .dflash import OnlineDFlashModel, create_dflash_loss_mask
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/core/dflash.py", line 11, in
+ from specforge.modeling.draft.dflash import DFlashDraftModel
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/modeling/__init__.py", line 2, in
+ from .auto import AutoDraftModelConfig, AutoEagle3DraftModel
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/modeling/auto.py", line 21, in
+ from .draft.llama3_eagle import LlamaForCausalLMEagle3
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/__init__.py", line 8, in
+ from .llama3_eagle import LlamaForCausalLMEagle3
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py", line 9, in
+ from torch.nn.attention.flex_attention import create_block_mask, flex_attention
+ModuleNotFoundError: No module named 'torch.nn.attention.flex_attention'
+Traceback (most recent call last):
+ File "/workspace/hanrui/syxin_old/Specforge/scripts/train_dflash.py", line 24, in
+ from specforge.args import SGLangBackendArgs, TrackerArgs
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/__init__.py", line 1, in
+ from .core import * # noqa
+ ^^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/core/__init__.py", line 1, in
+ from .dflash import OnlineDFlashModel, create_dflash_loss_mask
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/core/dflash.py", line 11, in
+ from specforge.modeling.draft.dflash import DFlashDraftModel
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/modeling/__init__.py", line 2, in
+ from .auto import AutoDraftModelConfig, AutoEagle3DraftModel
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/modeling/auto.py", line 21, in
+ from .draft.llama3_eagle import LlamaForCausalLMEagle3
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/__init__.py", line 8, in
+ from .llama3_eagle import LlamaForCausalLMEagle3
+ File "/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py", line 9, in
+ from torch.nn.attention.flex_attention import create_block_mask, flex_attention
+ModuleNotFoundError: No module named 'torch.nn.attention.flex_attention'
+W0331 14:16:59.909000 140326032656192 torch/distributed/elastic/multiprocessing/api.py:858] Sending process 1035 closing signal SIGTERM
+W0331 14:16:59.909000 140326032656192 torch/distributed/elastic/multiprocessing/api.py:858] Sending process 1036 closing signal SIGTERM
+W0331 14:16:59.910000 140326032656192 torch/distributed/elastic/multiprocessing/api.py:858] Sending process 1038 closing signal SIGTERM
+W0331 14:16:59.910000 140326032656192 torch/distributed/elastic/multiprocessing/api.py:858] Sending process 1039 closing signal SIGTERM
+W0331 14:16:59.911000 140326032656192 torch/distributed/elastic/multiprocessing/api.py:858] Sending process 1040 closing signal SIGTERM
+W0331 14:16:59.911000 140326032656192 torch/distributed/elastic/multiprocessing/api.py:858] Sending process 1041 closing signal SIGTERM
+W0331 14:16:59.912000 140326032656192 torch/distributed/elastic/multiprocessing/api.py:858] Sending process 1042 closing signal SIGTERM
+E0331 14:17:00.577000 140326032656192 torch/distributed/elastic/multiprocessing/api.py:833] failed (exitcode: 1) local_rank: 2 (pid: 1037) of binary: /workspace/miniconda3/envs/dflash/bin/python3
+Traceback (most recent call last):
+ File "", line 198, in _run_module_as_main
+ File "", line 88, in _run_code
+ File "/workspace/miniconda3/envs/dflash/lib/python3.11/site-packages/torch/distributed/run.py", line 905, in
+ main()
+ File "/workspace/miniconda3/envs/dflash/lib/python3.11/site-packages/torch/distributed/elastic/multiprocessing/errors/__init__.py", line 348, in wrapper
+ return f(*args, **kwargs)
+ ^^^^^^^^^^^^^^^^^^
+ File "/workspace/miniconda3/envs/dflash/lib/python3.11/site-packages/torch/distributed/run.py", line 901, in main
+ run(args)
+ File "/workspace/miniconda3/envs/dflash/lib/python3.11/site-packages/torch/distributed/run.py", line 892, in run
+ elastic_launch(
+ File "/workspace/miniconda3/envs/dflash/lib/python3.11/site-packages/torch/distributed/launcher/api.py", line 133, in __call__
+ return launch_agent(self._config, self._entrypoint, list(args))
+ ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+ File "/workspace/miniconda3/envs/dflash/lib/python3.11/site-packages/torch/distributed/launcher/api.py", line 264, in launch_agent
+ raise ChildFailedError(
+torch.distributed.elastic.multiprocessing.errors.ChildFailedError:
+============================================================
+/workspace/hanrui/syxin_old/Specforge/scripts/train_dflash.py FAILED
+------------------------------------------------------------
+Failures:
+
+------------------------------------------------------------
+Root Cause (first observed failure):
+[0]:
+ time : 2026-03-31_14:16:59
+ host : job-006ce80a7c47-20260302193512-5cd88f7cfc-mlbh9
+ rank : 2 (local_rank: 2)
+ exitcode : 1 (pid: 1037)
+ error_file:
+ traceback : To enable traceback see: https://pytorch.org/docs/stable/elastic/errors.html
+============================================================
diff --git a/syxin_old/dflash_lora_changelog.md b/syxin_old/dflash_lora_changelog.md
new file mode 100644
index 0000000000000000000000000000000000000000..09cdba4e72c1d91eff75bb1a974f2784f2bfca65
--- /dev/null
+++ b/syxin_old/dflash_lora_changelog.md
@@ -0,0 +1,232 @@
+# DFlash LoRA 全部改动记录
+
+## 概述
+
+为了让 Qwen3-8B DFlash LoRA 训练在 2×H100 上跑通(解决 OOM),共新增/修改了 **5 个文件,1084 行代码**。改动分为两大阶段:基础搭建 + OOM 修复。
+
+---
+
+## 新增文件清单
+
+| 文件 | 行数 | 用途 |
+|------|------|------|
+| `specforge/core/dflash_lora.py` | 453 | 训练 wrapper(OnlineDFlashLoRAModel) |
+| `specforge/modeling/draft/dflash_lora.py` | 141 | LoRA draft 模型(DFlashLoRADraftModel) |
+| `scripts/train_dflash_lora.py` | 449 | 训练入口脚本 |
+| `scripts/run_train_dflash_lora.sh` | 31 | 启动 shell 脚本 |
+| `configs/qwen3-8b-dflash-lora.json` | 10 | LoRA 配置文件 |
+
+---
+
+## Step 1 完成过程
+
+### 1.1 分析现有代码
+
+首先分析了非 LoRA 版 `train_dflash.py` 的完整流程:
+
+```
+input_ids → target_model.generate_dflash_data() → hidden_states
+ → OnlineDFlashModel.forward():
+ 1. 截断到 block 边界
+ 2. prepare_noise_input(): anchor 保留,其余 → MASK
+ 3. embed_tokens(noise_input_ids) → noise_embedding
+ 4. 构建 DFlash attention mask
+ 5. draft_model(noise_embedding, target_hidden, mask)
+ 6. lm_head(hidden) → logits → CE loss
+```
+
+非 LoRA 版使用独立的小型 draft model + 冻结 target model 提取 hidden states。
+
+### 1.2 确定 LoRA 版设计差异
+
+| 方面 | 非 LoRA 版 (`train_dflash.py`) | LoRA 版 (`train_dflash_lora.py`) |
+|------|------|------|
+| Draft model | 自定义小模型 (1-10 层) | Qwen3-8B + PEFT LoRA |
+| Target model | 冻结大模型提取 hidden states | 无需 — 模型用自身表征 |
+| Attention | 自定义 Qwen3DFlashAttention,KV = [ctx, noise] concat | 标准 HF attention + DFlash mask |
+| KV 结构 | Q_LEN = noise_len, KV_LEN = 2×noise_len | Q_LEN = KV_LEN = seq_len |
+| 可训练参数 | 全部 draft model 参数 | 仅 LoRA (q/k/v/o_proj) |
+
+### 1.3 新建 LoRA 版三个核心文件
+
+#### `specforge/modeling/draft/dflash_lora.py` — DFlashLoRADraftModel
+
+- `from_pretrained()`: 加载 Qwen3-8B,注入 PEFT LoRA,支持 `attn_implementation` 参数
+- `forward()`: 标准 HF forward,支持 `output_hidden_states` 参数(chunked loss 需要)
+- `get_lm_head()`: 穿透 PEFT 层级获取 lm_head 引用
+- `gradient_checkpointing_enable()`: 代理到底层模型
+- `save_pretrained()`: 仅保存 LoRA adapter 权重
+
+#### `specforge/core/dflash_lora.py` — OnlineDFlashLoRAModel
+
+- `prepare_noise_input()`: context 部分保持不变,block 部分只保留 anchor,其余替换为 MASK
+- `build_dflash_full_attn_mask_fast()`: 向量化构建 4D additive mask `[bsz, 1, seq, seq]`
+- `_compute_loss_weights()`: context + anchor 权重为 0,非 anchor 权重为 1(或 decay)
+- `_full_lm_loss()`: 标准 CE loss 路径
+- `_compute_accuracy()`: block-wise acceptance rate(累积正确预测长度 / block 非 anchor 长度)
+- `forward()`: 完整训练 forward pass
+
+LoRA 版 mask 规则:
+- context token i → 因果注意力 (j ≤ i)
+- block token i (属于 block b) → 所有 context + 同 block 内双向注意力
+
+#### `scripts/train_dflash_lora.py` — 训练脚本
+
+- 参数解析:model/lora/dataset/training/output/distributed/tracker 7 组参数
+- `build_model()`: 加载模型 + 注入 LoRA + 包装 OnlineDFlashLoRAModel
+- `build_dataloader()`: 复用 `build_eagle3_dataset` 和 `prepare_dp_dataloaders`
+- FSDP 包装 + BF16Optimizer
+- 训练循环:forward → backward → accumulation → optimizer step
+- checkpoint 保存/恢复
+
+---
+
+## OOM 修复改动(4 项)
+
+### 改动 1: FSDP FULL_SHARD (ZeRO-3)
+
+**问题**: `SHARD_GRAD_OP` (ZeRO-2) 每卡持有完整 Qwen3-8B 参数 (~16GB bf16)
+
+**修复**: `train_dflash_lora.py:362`
+```python
+# 之前
+sharding_strategy=ShardingStrategy.SHARD_GRAD_OP
+# 之后
+sharding_strategy=ShardingStrategy.FULL_SHARD
+```
+
+**效果**: 参数跨卡分片,每卡省 ~8-12GB
+
+### 改动 2: batch_size=1 + accumulation_steps=8
+
+**问题**: `batch_size=2` 时峰值显存过高
+
+**修复**: `run_train_dflash_lora.sh`
+```bash
+--batch-size 1 \
+--accumulation-steps 8 \
+```
+
+**效果**: 等效 global batch size 不变,峰值显存减半
+
+### 改动 3: flex_attention + BlockMask 替换 4D additive mask
+
+**问题**: SDPA 不支持 4D additive mask → fallback 到 math backend → 每层 materialize 完整 `[bsz, 32heads, 2048, 2048]` attention scores
+
+**修复**: 从非 LoRA 版 `dflash.py` 移植 `_get_or_create_block_mask()` 方法,适配 LoRA 场景
+
+涉及文件:
+
+1. **`specforge/core/dflash_lora.py`**
+ - `__init__()`: 添加 `attention_backend` 参数(默认 `"flex_attention"`),BlockMask 缓存字段
+ - 新增 `_get_or_create_block_mask()`: 用 `create_block_mask()` 构建 BlockMask(块稀疏表示,不 materialize 稠密 `[seq, seq]` mask,显存开销可忽略)
+ - `forward()`: 根据 `attention_backend` 选择 BlockMask 或 additive mask
+
+2. **`specforge/modeling/draft/dflash_lora.py`**
+ - `from_pretrained()`: 当 backend 为 flex_attention 时,传 `attn_implementation="flex_attention"` 给 HuggingFace
+
+3. **`scripts/train_dflash_lora.py`**
+ - `parse_args()`: `--attention-backend` 参数 (`flex_attention` | `additive`)
+ - `build_model()`: 根据 backend 选择 `attn_implementation`
+
+BlockMask mask function(LoRA 版):
+```python
+def dflash_lora_mask_fn(b, h, q_idx, kv_idx):
+ # Context query: 标准因果
+ is_q_ctx = q_idx < context_len
+ ctx_visible = is_q_ctx & (kv_idx <= q_idx)
+
+ # Block query: 全部 context + 同 block 双向
+ is_q_block = q_idx >= context_len
+ is_k_ctx = kv_idx < context_len
+ q_block_id = (q_idx - context_len) // block_size
+ k_block_id = (kv_idx - context_len) // block_size
+ block_attend_ctx = is_q_block & is_k_ctx
+ block_attend_same = is_q_block & (~is_k_ctx) & (q_block_id == k_block_id)
+
+ return ctx_visible | (block_attend_ctx | block_attend_same)
+```
+
+**验证**: 手动逐元素对比 BlockMask 和 additive mask 输出,三组测试 (context_len=4/0, seq=12/16/64) pattern 完全一致。
+
+**效果**: 不再 fallback 到 SDPA math backend,省去 `[bsz, heads, seq, seq]` attention scores 显存
+
+### 改动 4: chunked cross-entropy loss
+
+**问题**: `[bsz, 2048, 151936]` bf16 logits 每样本 ≈ 0.6GB(bsz=2,或转 fp32 计算 CE 时 ≈ 1.18GB),加梯度 ~2.4GB+
+
+**修复**: 从非 LoRA 版 `dflash.py:419-478` 移植 chunked loss
+
+涉及文件:
+
+1. **`specforge/core/dflash_lora.py`**
+ - `__init__()`: 添加 `lm_head_chunk_size` 参数(默认 0 = 不启用)
+ - 新增 `_chunked_lm_loss()`: 分 chunk 过 lm_head + CE loss + gradient checkpointing
+ - 提取 `_full_lm_loss()`: 原始非 chunked 路径
+ - `forward()`: `lm_head_chunk_size > 0` 时走 chunked 路径
+
+2. **`specforge/modeling/draft/dflash_lora.py`**
+ - `forward()`: 新增 `output_hidden_states` 参数,True 时返回 last hidden state 而非 logits
+ - `get_lm_head()`: 穿透 PEFT 层级返回 `base_model.lm_head` 引用
+
+3. **`scripts/train_dflash_lora.py`**
+ - `parse_args()`: `--lm-head-chunk-size` 参数(默认 0,推荐 256)
+ - `build_model()`: 传递到 OnlineDFlashLoRAModel
+
+Chunked loss 核心逻辑:
+```python
+# 分 chunk 计算,每 chunk 用 gradient checkpointing(backward 时重算 logits,不存储)
+for start in range(0, effective_len, chunk_size):
+ end = min(start + chunk_size, effective_len)
+ chunk_loss, chunk_weight = grad_checkpoint(
+ _chunk_ce, # lm_head + CE
+ hidden[:, start:end, :], # 只取当前 chunk
+ input_ids[:, start:end],
+ combined_mask[:, start:end],
+ use_reentrant=False,
+ )
+ total_loss += chunk_loss
+ total_weight += chunk_weight
+loss = total_loss / total_weight
+```
+
+**效果**: logits 峰值显存从 `O(seq_len × vocab_size)` 降至 `O(chunk_size × vocab_size)`,256 chunk → ~150MB vs 1.18GB
+
+---
+
+## 当前训练命令
+
+```bash
+bash scripts/run_train_dflash_lora.sh 2 # 2 = GPU 数量(在仓库根目录执行)
+```
+
+对应完整参数:
+```bash
+torchrun --nproc_per_node 2 scripts/train_dflash_lora.py \
+ --model-path /workspace/Qwen3-8B \
+ --train-data-path /workspace/hanrui/datasets/Nemotron-CodeAlpaca-qwen3-8b-800K \
+ --output-dir outputs/qwen3-8b-dflash-lora \
+ --lora-config configs/qwen3-8b-dflash-lora.json \
+ --block-size 16 \
+ --max-length 2048 \
+ --batch-size 1 \
+ --num-epochs 3 \
+ --learning-rate 2e-4 \
+ --accumulation-steps 8 \
+ --loss-decay-gamma 7 \
+ --attention-backend flex_attention \
+ --lm-head-chunk-size 256 \
+ --gradient-checkpointing \
+ --chat-template qwen \
+ --log-interval 50 \
+ --save-interval 500
+```
+
+---
+
+## 待验证
+
+- [ ] 跑 `bash scripts/run_train_dflash_lora.sh 2` 确认不再 OOM
+- [ ] 确认无 SDPA math fallback warning
+- [ ] 观察 GPU 显存峰值
+- [ ] 确认 loss 下降和 accuracy 上升趋势正常
diff --git a/syxin_old/eval_accepted_length.md b/syxin_old/eval_accepted_length.md
new file mode 100644
index 0000000000000000000000000000000000000000..5e9b4426efc43c8630650db25d5c7b060410cd56
--- /dev/null
+++ b/syxin_old/eval_accepted_length.md
@@ -0,0 +1,217 @@
+# DFlash-LoRA-Inject 评测:Accepted Length & Accuracy
+
+## 为什么不能用 sglang 在线评测?
+
+DFlash-LoRA-Inject 的推理需要**逐层注入 target 模型的 hidden states** 到 draft 模型中,
+这是 LoRA-Inject 训练时的核心机制。但 sglang 不支持这种推理模式:
+
+| sglang 算法 | 问题 |
+|---|---|
+| `STANDALONE` | 把 draft 当独立自回归模型跑,**完全忽略 layer injection**。merged 模型 ≈ 原始 Qwen3-8B,accept_length 恒 ≈ 4.7,跟 LoRA 训没训没关系 |
+| `DFLASH` | 期望 DFlash-b16 架构(5 层 + fc + hidden_norm),跟 LoRA-Inject(36 层全模型)结构不匹配 |
+
+因此必须**离线评测**:加载 target + draft 两个模型,手动实现带 layer injection 的 speculative decoding 循环。
+
+---
+
+## 基本信息
+
+| 项目 | 路径 / 值 |
+|---|---|
+| conda 环境 | `spec` |
+| 基座模型(target) | `/workspace/models/Qwen3-8B` |
+| 训练输出(最终 ckpt) | `.../outputs/qwen3-8b-dflash-lora-inject/epoch_3_step_1400` |
+| 合并后 draft 模型 | `.../outputs/qwen3-8b-dflash-lora-inject-merged` |
+| 评测脚本 | `/workspace/hanrui/syxin_old/eval_dflash_lora_inject.py` |
+| 本地数据集 | `/workspace/hanrui/datasets/{humaneval,mtbench,gsm8k}` |
+| 结果输出目录 | `/workspace/hanrui/syxin_old/Specforge/benchmarks/results/` |
+| GPU | 8 × H100 80GB(单卡即可,需 ~32GB 加载两个 8B 模型) |
+
+---
+
+## Step 1:合并 LoRA 权重
+
+LoRA-Inject 训练只保存 adapter 权重,评测时需要完整模型。
+
+```bash
+conda activate spec
+
+python3 -c "
+from peft import PeftModel
+from transformers import AutoModelForCausalLM, AutoTokenizer
+import torch, os
+
+BASE = '/workspace/models/Qwen3-8B'
+ADAPTER = '/workspace/hanrui/syxin_old/Specforge/outputs/qwen3-8b-dflash-lora-inject/epoch_3_step_1400'
+MERGED = '/workspace/hanrui/syxin_old/Specforge/outputs/qwen3-8b-dflash-lora-inject-merged'
+
+if os.path.exists(MERGED):
+ print(f'[skip] Merged model already exists: {MERGED}')
+else:
+ print('[1/4] Loading base model to CPU ...')
+ model = AutoModelForCausalLM.from_pretrained(BASE, torch_dtype=torch.bfloat16, device_map='cpu')
+ print('[2/4] Loading LoRA adapter ...')
+ model = PeftModel.from_pretrained(model, ADAPTER)
+ print('[3/4] Merging weights ...')
+ model = model.merge_and_unload()
+ print('[4/4] Saving merged model ...')
+ os.makedirs(MERGED, exist_ok=True)
+ model.save_pretrained(MERGED, safe_serialization=True)
+ AutoTokenizer.from_pretrained(BASE).save_pretrained(MERGED)
+ print(f'Done. Merged model saved to: {MERGED}')
+"
+```
+
+> 耗时约 3–5 分钟,CPU 内存占用 ≈ 16 GB。已存在则自动跳过。
+
+---
+
+## Step 2:离线评测 accepted length
+
+**不需要启动 sglang server**,直接跑:
+
+### 全部 Bench(推荐)
+
+```bash
+bash /workspace/hanrui/syxin_old/run_bench_dflash.sh
+```
+
+### 单独跑 / 快速测试
+
+```bash
+# 只跑 HumanEval
+bash /workspace/hanrui/syxin_old/run_bench_dflash.sh humaneval
+
+# 快速测试(每个 bench 20 条)
+bash /workspace/hanrui/syxin_old/run_bench_dflash.sh --quick
+
+# 指定 checkpoint
+bash /workspace/hanrui/syxin_old/run_bench_dflash.sh --ckpt epoch_0_step_1000
+
+# 组合
+bash /workspace/hanrui/syxin_old/run_bench_dflash.sh humaneval gsm8k --quick
+```
+
+### 或者直接调 Python
+
+```bash
+conda activate spec
+
+python3 /workspace/hanrui/syxin_old/eval_dflash_lora_inject.py \
+ --benchmarks humaneval mtbench gsm8k \
+ --block-size 16 \
+ --max-new-tokens 512 \
+ --temperature 0.0
+```
+
+---
+
+## 结果文件说明
+
+结果保存在 `results/` 下,文件名示例:
+```
+dflash_lora_inject_offline_epoch_3_step_1400_20260314_150000.json
+```
+
+```json
+{
+ "model": "dflash-lora-inject/epoch_3_step_1400",
+ "block_size": 16,
+ "humaneval": {
+ "avg_accept_length": 3.42,
+ "total_tokens": 28500,
+ "latency": 120.5,
+ "throughput": 236.5,
+ "num_samples": 164,
+ "num_verify_rounds": 8320
+ },
+ "mtbench": { ... },
+ "gsm8k": { ... }
+}
+```
+
+| 字段 | 含义 |
+|---|---|
+| `avg_accept_length` | **核心指标**:平均每次 verify 接受的 token 数(含 injection)。越高越好,`1.0` = draft 完全无效 |
+| `total_tokens` | 总生成 token 数 |
+| `throughput` | tokens/s,即 `total_tokens / latency`(`latency` 为总耗时,单位秒;离线评测,不含 batching 优化) |
+| `num_verify_rounds` | 总验证轮数 |
+
+---
+
+## 对比 baseline
+
+对比未经 LoRA 训练的原始 Qwen3-8B 当 draft 的 accept_length:
+
+```bash
+python3 /workspace/hanrui/syxin_old/eval_dflash_lora_inject.py \
+ --merged-path /workspace/models/Qwen3-8B \
+ --benchmarks humaneval mtbench gsm8k \
+ --num-samples 50
+```
+
+> 这会用原始 Qwen3-8B 同时当 target 和 draft(带 injection),
+> 对比 LoRA 训练前后 accept_length 是否有提升。
+
+---
+
+## 如何测其他 checkpoint
+
+```bash
+# 方法 1:直接加载 adapter(自动 merge,不保存)
+python3 /workspace/hanrui/syxin_old/eval_dflash_lora_inject.py \
+ --ckpt epoch_0_step_1000 \
+ --benchmarks humaneval --num-samples 50
+
+# 方法 2:预先 merge 到不同目录
+python3 -c "
+from peft import PeftModel
+from transformers import AutoModelForCausalLM, AutoTokenizer
+import torch, os
+BASE = '/workspace/models/Qwen3-8B'
+ADAPTER = '/workspace/hanrui/syxin_old/Specforge/outputs/qwen3-8b-dflash-lora-inject/epoch_0_step_1000'
+MERGED = '/workspace/hanrui/syxin_old/Specforge/outputs/qwen3-8b-dflash-lora-inject-merged-epoch_0_step_1000'
+model = AutoModelForCausalLM.from_pretrained(BASE, torch_dtype=torch.bfloat16, device_map='cpu')
+model = PeftModel.from_pretrained(model, ADAPTER).merge_and_unload()
+os.makedirs(MERGED, exist_ok=True)
+model.save_pretrained(MERGED, safe_serialization=True)
+AutoTokenizer.from_pretrained(BASE).save_pretrained(MERGED)
+"
+
+python3 /workspace/hanrui/syxin_old/eval_dflash_lora_inject.py \
+ --merged-path /workspace/hanrui/syxin_old/Specforge/outputs/qwen3-8b-dflash-lora-inject-merged-epoch_0_step_1000 \
+ --benchmarks humaneval --num-samples 50
+```
+
+可用 checkpoint:`epoch_0_step_500` / `epoch_0_step_1000` / `epoch_0_step_1400` / `epoch_2_step_34500` / `epoch_2_step_35000` / `epoch_3_step_1400`
+
+---
+
+## 常见问题
+
+### Q1:accept_length 和 STANDALONE 模式下差不多(都 ≈ 4.7)
+
+这说明 layer injection 没有真正起作用。检查:
+- 评测脚本确实用的是 `eval_dflash_lora_inject.py`(离线),不是 sglang bench
+- merged 模型确实是 LoRA-Inject 版本(不是原始 Qwen3-8B)
+
+### Q2:OOM(单卡放不下两个 8B 模型)
+
+两个 bf16 的 Qwen3-8B ≈ 32GB,单卡 H100 80GB 够用。如果 OOM:
+- 检查是否有其他进程占用显存
+- 减小 `--max-new-tokens`(试 256)
+- 减小 `--num-samples`
+
+### Q3:数据集下载失败(无外网)
+
+评测脚本优先读本地文件:
+
+| bench | 本地文件 |
+|---|---|
+| GSM8K | `/workspace/hanrui/datasets/gsm8k/test.jsonl` |
+| MT-Bench | `/workspace/hanrui/datasets/mtbench/question.jsonl` |
+| HumanEval | `/workspace/hanrui/datasets/humaneval/test.jsonl` |
+
+---
+
+*基座:`/workspace/models/Qwen3-8B` | 最终 ckpt:`epoch_3_step_1400` | block_size:16*
diff --git a/syxin_old/eval_gsm8k_humaneval_mtbench_new.log b/syxin_old/eval_gsm8k_humaneval_mtbench_new.log
new file mode 100644
index 0000000000000000000000000000000000000000..aca9cbb4567a3e10c9e5d2327d5e6e28e5602e7f
--- /dev/null
+++ b/syxin_old/eval_gsm8k_humaneval_mtbench_new.log
@@ -0,0 +1,81 @@
+nohup: ignoring input
+WARNING:__main__:
+*****************************************
+Setting OMP_NUM_THREADS environment variable for each process to be 1 in default, to avoid your system being overloaded, please further tune the variable for optimal performance in your application as needed.
+*****************************************
+[W324 12:29:41.005805214 Utils.hpp:135] Warning: Environment variable NCCL_ASYNC_ERROR_HANDLING is deprecated; use TORCH_NCCL_ASYNC_ERROR_HANDLING instead (function operator())
+[W324 12:29:41.007112364 Utils.hpp:135] Warning: Environment variable NCCL_ASYNC_ERROR_HANDLING is deprecated; use TORCH_NCCL_ASYNC_ERROR_HANDLING instead (function operator())
+[W324 12:29:41.020081383 Utils.hpp:135] Warning: Environment variable NCCL_ASYNC_ERROR_HANDLING is deprecated; use TORCH_NCCL_ASYNC_ERROR_HANDLING instead (function operator())
+[W324 12:29:42.479819786 Utils.hpp:135] Warning: Environment variable NCCL_ASYNC_ERROR_HANDLING is deprecated; use TORCH_NCCL_ASYNC_ERROR_HANDLING instead (function operator())
+[W324 12:29:42.817874158 Utils.hpp:135] Warning: Environment variable NCCL_ASYNC_ERROR_HANDLING is deprecated; use TORCH_NCCL_ASYNC_ERROR_HANDLING instead (function operator())
+[W324 12:29:42.995464317 Utils.hpp:135] Warning: Environment variable NCCL_ASYNC_ERROR_HANDLING is deprecated; use TORCH_NCCL_ASYNC_ERROR_HANDLING instead (function operator())
+[W324 12:29:42.004907907 Utils.hpp:135] Warning: Environment variable NCCL_ASYNC_ERROR_HANDLING is deprecated; use TORCH_NCCL_ASYNC_ERROR_HANDLING instead (function operator())
+[W324 12:29:42.007805771 Utils.hpp:135] Warning: Environment variable NCCL_ASYNC_ERROR_HANDLING is deprecated; use TORCH_NCCL_ASYNC_ERROR_HANDLING instead (function operator())
+`torch_dtype` is deprecated! Use `dtype` instead!
+`torch_dtype` is deprecated! Use `dtype` instead!
+`torch_dtype` is deprecated! Use `dtype` instead!
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]Running on 8 GPU(s)
+Using attn_implementation: target=flash_attention_2, draft=sdpa
+Loading target model: /workspace/models/Qwen3-8B
+`torch_dtype` is deprecated! Use `dtype` instead!
+`torch_dtype` is deprecated! Use `dtype` instead!
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]`torch_dtype` is deprecated! Use `dtype` instead!
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]`torch_dtype` is deprecated! Use `dtype` instead!
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]`torch_dtype` is deprecated! Use `dtype` instead!
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:11, 2.81s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:11, 2.87s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:11, 2.84s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:11, 2.77s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:11, 2.83s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:11, 2.79s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:11, 2.88s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:11, 2.88s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:08, 2.77s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:08, 2.80s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:08, 2.78s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:08, 2.67s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:08, 2.73s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:08, 2.69s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:08, 2.81s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:08, 2.81s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:08<00:05, 2.79s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:08<00:05, 2.80s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:08<00:05, 2.80s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:07<00:05, 2.64s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:08<00:05, 2.71s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:08<00:05, 2.74s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:08<00:05, 2.80s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:08<00:05, 2.80s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:10<00:02, 2.53s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:10<00:02, 2.54s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:10<00:02, 2.54s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:10<00:02, 2.40s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 1.92s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 2.27s/it]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 1.92s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 2.27s/it]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 1.92s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 2.27s/it]
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 80%|████████ | 4/5 [00:10<00:02, 2.49s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:10<00:02, 2.50s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 1.79s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 2.14s/it]
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 80%|████████ | 4/5 [00:10<00:02, 2.56s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:10<00:02, 2.57s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 1.87s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 1.88s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 2.21s/it]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 2.23s/it]
+Loading base + LoRA adapter: /workspace/hanrui/syxin_old/Specforge/outputs/qwen3-8b-dflash-lora-inject/epoch_3_step_4644
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 1.91s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 2.28s/it]
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 1.91s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 2.27s/it]
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:11, 2.76s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:11, 2.80s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:11, 2.81s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:10, 2.75s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:11, 2.84s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:11, 2.84s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:11, 2.81s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:11, 2.82s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:07, 2.64s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:08, 2.69s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:08, 2.76s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:07, 2.64s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:08, 2.75s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:08, 2.75s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:08, 2.76s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:08, 2.76s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:07<00:05, 2.58s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:08<00:05, 2.65s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:07<00:05, 2.63s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:08<00:05, 2.77s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:08<00:05, 2.77s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:08<00:05, 2.77s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:08<00:05, 2.77s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:09<00:02, 2.31s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:08<00:05, 2.77s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:09<00:02, 2.38s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:09<00:02, 2.37s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 1.70s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 2.07s/it]
+
Loading checkpoint shards: 80%|████████ | 4/5 [00:10<00:02, 2.55s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 1.77s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 2.13s/it]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 1.78s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 2.13s/it]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 1.89s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 2.25s/it]
+
Loading checkpoint shards: 80%|████████ | 4/5 [00:10<00:02, 2.51s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:10<00:02, 2.51s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:10<00:02, 2.58s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:10<00:02, 2.54s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 1.88s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 1.88s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 2.24s/it]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 2.24s/it]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 1.94s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 1.92s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 2.28s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 2.26s/it]
+
+
+============================================================
+Benchmark: gsm8k (8 GPUs)
+============================================================
+Total 128 samples, distributed across 8 GPUs
+
[GPU0] gsm8k: 0%| | 0/16 [00:00, ?sample/s]
[GPU0] gsm8k: 0%| | 0/16 [00:09, ?sample/s, accept_len=4.00]
[GPU0] gsm8k: 6%|▋ | 1/16 [00:09<02:29, 9.94s/sample, accept_len=4.00]
[GPU0] gsm8k: 6%|▋ | 1/16 [00:24<02:29, 9.94s/sample, accept_len=4.11]
[GPU0] gsm8k: 12%|█▎ | 2/16 [00:24<02:59, 12.81s/sample, accept_len=4.11]
[GPU0] gsm8k: 12%|█▎ | 2/16 [00:36<02:59, 12.81s/sample, accept_len=4.10]
[GPU0] gsm8k: 19%|█▉ | 3/16 [00:36<02:38, 12.16s/sample, accept_len=4.10]
[GPU0] gsm8k: 19%|█▉ | 3/16 [00:54<02:38, 12.16s/sample, accept_len=4.17]
[GPU0] gsm8k: 25%|██▌ | 4/16 [00:54<02:53, 14.42s/sample, accept_len=4.17]
[GPU0] gsm8k: 25%|██▌ | 4/16 [01:05<02:53, 14.42s/sample, accept_len=4.22]
[GPU0] gsm8k: 31%|███▏ | 5/16 [01:05<02:28, 13.46s/sample, accept_len=4.22]
[GPU0] gsm8k: 31%|███▏ | 5/16 [01:12<02:28, 13.46s/sample, accept_len=4.18]
[GPU0] gsm8k: 38%|███▊ | 6/16 [01:12<01:53, 11.31s/sample, accept_len=4.18]
[GPU0] gsm8k: 38%|███▊ | 6/16 [01:27<01:53, 11.31s/sample, accept_len=4.17]
[GPU0] gsm8k: 44%|████▍ | 7/16 [01:27<01:50, 12.32s/sample, accept_len=4.17]
[GPU0] gsm8k: 44%|████▍ | 7/16 [01:38<01:50, 12.32s/sample, accept_len=4.12]
[GPU0] gsm8k: 50%|█████ | 8/16 [01:38<01:35, 11.99s/sample, accept_len=4.12]
[GPU0] gsm8k: 50%|█████ | 8/16 [01:52<01:35, 11.99s/sample, accept_len=4.03]
[GPU0] gsm8k: 56%|█████▋ | 9/16 [01:52<01:27, 12.47s/sample, accept_len=4.03]
[GPU0] gsm8k: 56%|█████▋ | 9/16 [02:03<01:27, 12.47s/sample, accept_len=3.93]
[GPU0] gsm8k: 62%|██████▎ | 10/16 [02:03<01:11, 11.98s/sample, accept_len=3.93]
[GPU0] gsm8k: 62%|██████▎ | 10/16 [02:13<01:11, 11.98s/sample, accept_len=3.91]
[GPU0] gsm8k: 69%|██████▉ | 11/16 [02:13<00:57, 11.44s/sample, accept_len=3.91]
[GPU0] gsm8k: 69%|██████▉ | 11/16 [02:30<00:57, 11.44s/sample, accept_len=3.78]
[GPU0] gsm8k: 75%|███████▌ | 12/16 [02:30<00:52, 13.10s/sample, accept_len=3.78]
[GPU0] gsm8k: 75%|███████▌ | 12/16 [02:40<00:52, 13.10s/sample, accept_len=3.78]
[GPU0] gsm8k: 81%|████████▏ | 13/16 [02:40<00:36, 12.17s/sample, accept_len=3.78]
[GPU0] gsm8k: 81%|████████▏ | 13/16 [02:50<00:36, 12.17s/sample, accept_len=3.82]
[GPU0] gsm8k: 88%|████████▊ | 14/16 [02:50<00:23, 11.55s/sample, accept_len=3.82]
[GPU0] gsm8k: 88%|████████▊ | 14/16 [02:56<00:23, 11.55s/sample, accept_len=3.84]
[GPU0] gsm8k: 94%|█████████▍| 15/16 [02:56<00:09, 9.98s/sample, accept_len=3.84]
[GPU0] gsm8k: 94%|█████████▍| 15/16 [03:12<00:09, 9.98s/sample, accept_len=3.90]
[GPU0] gsm8k: 100%|██████████| 16/16 [03:12<00:00, 11.82s/sample, accept_len=3.90]
[GPU0] gsm8k: 100%|██████████| 16/16 [03:12<00:00, 12.04s/sample, accept_len=3.90]
+/workspace/miniconda3/envs/dflash/lib/python3.11/site-packages/torch/storage.py:414: FutureWarning: You are using `torch.load` with `weights_only=False` (the current default value), which uses the default pickle module implicitly. It is possible to construct malicious pickle data which will execute arbitrary code during unpickling (See https://github.com/pytorch/pytorch/blob/main/SECURITY.md#untrusted-models for more details). In a future release, the default value for `weights_only` will be flipped to `True`. This limits the functions that could be executed during unpickling. Arbitrary objects will no longer be allowed to be loaded via this mode unless they are explicitly allowlisted by the user via `torch.serialization.add_safe_globals`. We recommend you start setting `weights_only=True` for any use case where you don't have full control of the loaded file. Please open an issue on GitHub for any issues related to this experimental feature.
+ return torch.load(io.BytesIO(b))
+
+gsm8k Results:
+ Decoding speedup: 1.99x
+ Average Acceptance length: 3.92
+ Acceptance length histogram: ['0.0%', '5.9%', '17.9%', '24.6%', '19.7%', '14.0%', '8.2%', '4.5%', '2.6%', '1.5%', '0.6%', '0.3%', '0.2%', '0.1%', '0.0%', '0.0%', '0.0%']
+ Num responses: 128
+
+============================================================
+Benchmark: humaneval (8 GPUs)
+============================================================
+Total 164 samples, distributed across 8 GPUs
+
[GPU0] humaneval: 0%| | 0/21 [00:00, ?sample/s]
[GPU0] humaneval: 0%| | 0/21 [00:24, ?sample/s, accept_len=3.49]
[GPU0] humaneval: 5%|▍ | 1/21 [00:24<08:17, 24.85s/sample, accept_len=3.49]
[GPU0] humaneval: 5%|▍ | 1/21 [00:37<08:17, 24.85s/sample, accept_len=3.68]
[GPU0] humaneval: 10%|▉ | 2/21 [00:37<05:34, 17.62s/sample, accept_len=3.68]
[GPU0] humaneval: 10%|▉ | 2/21 [00:51<05:34, 17.62s/sample, accept_len=3.67]
[GPU0] humaneval: 14%|█▍ | 3/21 [00:51<04:44, 15.82s/sample, accept_len=3.67]
[GPU0] humaneval: 14%|█▍ | 3/21 [01:08<04:44, 15.82s/sample, accept_len=3.63]
[GPU0] humaneval: 19%|█▉ | 4/21 [01:08<04:39, 16.47s/sample, accept_len=3.63]
[GPU0] humaneval: 19%|█▉ | 4/21 [01:49<04:39, 16.47s/sample, accept_len=3.60]
[GPU0] humaneval: 24%|██▍ | 5/21 [01:49<06:42, 25.18s/sample, accept_len=3.60]
[GPU0] humaneval: 24%|██▍ | 5/21 [02:14<06:42, 25.18s/sample, accept_len=3.59]
[GPU0] humaneval: 29%|██▊ | 6/21 [02:14<06:19, 25.28s/sample, accept_len=3.59]
[GPU0] humaneval: 29%|██▊ | 6/21 [02:26<06:19, 25.28s/sample, accept_len=3.60]
[GPU0] humaneval: 33%|███▎ | 7/21 [02:26<04:50, 20.74s/sample, accept_len=3.60]
[GPU0] humaneval: 33%|███▎ | 7/21 [02:40<04:50, 20.74s/sample, accept_len=3.63]
[GPU0] humaneval: 38%|███▊ | 8/21 [02:40<04:02, 18.67s/sample, accept_len=3.63]
[GPU0] humaneval: 38%|███▊ | 8/21 [03:09<04:02, 18.67s/sample, accept_len=3.67]
[GPU0] humaneval: 43%|████▎ | 9/21 [03:09<04:22, 21.89s/sample, accept_len=3.67]
[GPU0] humaneval: 43%|████▎ | 9/21 [03:31<04:22, 21.89s/sample, accept_len=3.83]
[GPU0] humaneval: 48%|████▊ | 10/21 [03:31<04:01, 21.96s/sample, accept_len=3.83]
[GPU0] humaneval: 48%|████▊ | 10/21 [03:49<04:01, 21.96s/sample, accept_len=3.83]
[GPU0] humaneval: 52%|█████▏ | 11/21 [03:49<03:28, 20.82s/sample, accept_len=3.83]
[GPU0] humaneval: 52%|█████▏ | 11/21 [04:14<03:28, 20.82s/sample, accept_len=3.92]
[GPU0] humaneval: 57%|█████▋ | 12/21 [04:14<03:17, 22.00s/sample, accept_len=3.92]
[GPU0] humaneval: 57%|█████▋ | 12/21 [04:38<03:17, 22.00s/sample, accept_len=3.90]
[GPU0] humaneval: 62%|██████▏ | 13/21 [04:38<03:00, 22.59s/sample, accept_len=3.90]
[GPU0] humaneval: 62%|██████▏ | 13/21 [04:58<03:00, 22.59s/sample, accept_len=3.92]
[GPU0] humaneval: 67%|██████▋ | 14/21 [04:58<02:32, 21.76s/sample, accept_len=3.92]
[GPU0] humaneval: 67%|██████▋ | 14/21 [05:16<02:32, 21.76s/sample, accept_len=3.74]
[GPU0] humaneval: 71%|███████▏ | 15/21 [05:16<02:04, 20.71s/sample, accept_len=3.74]
[GPU0] humaneval: 71%|███████▏ | 15/21 [05:38<02:04, 20.71s/sample, accept_len=3.90]
[GPU0] humaneval: 76%|███████▌ | 16/21 [05:38<01:45, 21.02s/sample, accept_len=3.90]
[GPU0] humaneval: 76%|███████▌ | 16/21 [06:02<01:45, 21.02s/sample, accept_len=3.82]
[GPU0] humaneval: 81%|████████ | 17/21 [06:02<01:28, 22.15s/sample, accept_len=3.82]
[GPU0] humaneval: 81%|████████ | 17/21 [06:25<01:28, 22.15s/sample, accept_len=3.88]
[GPU0] humaneval: 86%|████████▌ | 18/21 [06:25<01:06, 22.22s/sample, accept_len=3.88]
[GPU0] humaneval: 86%|████████▌ | 18/21 [06:43<01:06, 22.22s/sample, accept_len=3.96]
[GPU0] humaneval: 90%|█████████ | 19/21 [06:43<00:42, 21.05s/sample, accept_len=3.96]
[GPU0] humaneval: 90%|█████████ | 19/21 [07:00<00:42, 21.05s/sample, accept_len=4.03]
[GPU0] humaneval: 95%|█████████▌| 20/21 [07:00<00:19, 19.77s/sample, accept_len=4.03]
[GPU0] humaneval: 95%|█████████▌| 20/21 [07:27<00:19, 19.77s/sample, accept_len=3.92]
[GPU0] humaneval: 100%|██████████| 21/21 [07:27<00:00, 21.86s/sample, accept_len=3.92]
[GPU0] humaneval: 100%|██████████| 21/21 [07:27<00:00, 21.29s/sample, accept_len=3.92]
+
+humaneval Results:
+ Decoding speedup: 1.81x
+ Average Acceptance length: 3.74
+ Acceptance length histogram: ['0.0%', '7.7%', '21.4%', '23.6%', '18.6%', '12.1%', '7.5%', '4.4%', '2.3%', '1.4%', '0.6%', '0.3%', '0.1%', '0.0%', '0.0%', '0.0%', '0.0%']
+ Num responses: 164
+
+============================================================
+Benchmark: mt-bench (8 GPUs)
+============================================================
+Total 80 samples, distributed across 8 GPUs
+
[GPU0] mt-bench: 0%| | 0/10 [00:00, ?sample/s]
[GPU0] mt-bench: 0%| | 0/10 [01:30, ?sample/s, accept_len=2.68]
[GPU0] mt-bench: 10%|█ | 1/10 [01:30<13:34, 90.47s/sample, accept_len=2.68]
[GPU0] mt-bench: 10%|█ | 1/10 [01:46<13:34, 90.47s/sample, accept_len=2.74]
[GPU0] mt-bench: 20%|██ | 2/10 [01:46<06:14, 46.87s/sample, accept_len=2.74]
[GPU0] mt-bench: 20%|██ | 2/10 [03:44<06:14, 46.87s/sample, accept_len=2.88]
[GPU0] mt-bench: 30%|███ | 3/10 [03:44<09:14, 79.21s/sample, accept_len=2.88]
[GPU0] mt-bench: 30%|███ | 3/10 [05:45<09:14, 79.21s/sample, accept_len=3.22]
[GPU0] mt-bench: 40%|████ | 4/10 [05:45<09:34, 95.83s/sample, accept_len=3.22]
[GPU0] mt-bench: 40%|████ | 4/10 [06:20<09:34, 95.83s/sample, accept_len=3.62]
[GPU0] mt-bench: 50%|█████ | 5/10 [06:20<06:09, 73.90s/sample, accept_len=3.62]
[GPU0] mt-bench: 50%|█████ | 5/10 [07:34<06:09, 73.90s/sample, accept_len=3.58]
[GPU0] mt-bench: 60%|██████ | 6/10 [07:34<04:55, 73.89s/sample, accept_len=3.58]
[GPU0] mt-bench: 60%|██████ | 6/10 [09:12<04:55, 73.89s/sample, accept_len=3.47]
[GPU0] mt-bench: 70%|███████ | 7/10 [09:12<04:05, 81.85s/sample, accept_len=3.47]
[GPU0] mt-bench: 70%|███████ | 7/10 [09:16<04:05, 81.85s/sample, accept_len=3.87]
[GPU0] mt-bench: 80%|████████ | 8/10 [09:16<01:53, 56.90s/sample, accept_len=3.87]
[GPU0] mt-bench: 80%|████████ | 8/10 [10:06<01:53, 56.90s/sample, accept_len=3.69]
[GPU0] mt-bench: 90%|█████████ | 9/10 [10:06<00:54, 54.87s/sample, accept_len=3.69]
[GPU0] mt-bench: 90%|█████████ | 9/10 [13:09<00:54, 54.87s/sample, accept_len=3.24]
[GPU0] mt-bench: 100%|██████████| 10/10 [13:09<00:00, 94.36s/sample, accept_len=3.24]
[GPU0] mt-bench: 100%|██████████| 10/10 [13:09<00:00, 78.96s/sample, accept_len=3.24]
+
+mt-bench Results:
+ Decoding speedup: 1.36x
+ Average Acceptance length: 3.32
+ Acceptance length histogram: ['0.0%', '10.6%', '32.2%', '26.4%', '15.8%', '7.5%', '4.0%', '1.8%', '0.9%', '0.5%', '0.2%', '0.1%', '0.0%', '0.0%', '0.0%', '0.0%', '0.0%']
+ Num responses: 160
+
+Results saved to: /workspace/hanrui/syxin_old/Specforge/benchmarks/results/dflash_lora_inject_offline_epoch_3_step_4644_20260324_125735.json
diff --git a/syxin_old/eval_lora_inject.log b/syxin_old/eval_lora_inject.log
new file mode 100644
index 0000000000000000000000000000000000000000..4f302a5dc99d026fb883b0a6fcaf4f1c07e2d39e
--- /dev/null
+++ b/syxin_old/eval_lora_inject.log
@@ -0,0 +1,202 @@
+nohup: ignoring input
+WARNING:__main__:
+*****************************************
+Setting OMP_NUM_THREADS environment variable for each process to be 1 in default, to avoid your system being overloaded, please further tune the variable for optimal performance in your application as needed.
+*****************************************
+`torch_dtype` is deprecated! Use `dtype` instead!
+`torch_dtype` is deprecated! Use `dtype` instead!
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]`torch_dtype` is deprecated! Use `dtype` instead!
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]Running on 8 GPU(s)
+Using attn_implementation: target=flash_attention_2, draft=sdpa
+Loading target model: /workspace/models/Qwen3-8B
+`torch_dtype` is deprecated! Use `dtype` instead!
+`torch_dtype` is deprecated! Use `dtype` instead!
+`torch_dtype` is deprecated! Use `dtype` instead!
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]`torch_dtype` is deprecated! Use `dtype` instead!
+`torch_dtype` is deprecated! Use `dtype` instead!
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:10, 2.55s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:10, 2.55s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:09, 2.41s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:10, 2.56s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:10, 2.50s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:10, 2.55s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:10, 2.50s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:10, 2.64s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:07, 2.54s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:07, 2.54s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:04<00:07, 2.37s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:07, 2.63s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:07, 2.58s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:07, 2.61s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:07, 2.62s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:07, 2.66s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:07<00:05, 2.58s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:07<00:05, 2.58s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:07<00:04, 2.45s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:07<00:05, 2.62s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:07<00:05, 2.63s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:07<00:05, 2.60s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:07<00:05, 2.62s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:07<00:05, 2.62s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:09<00:02, 2.36s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:09<00:02, 2.43s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:09<00:02, 2.43s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 1.86s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 1.86s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 2.15s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 1.81s/it]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 2.15s/it]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 2.07s/it]
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 80%|████████ | 4/5 [00:10<00:02, 2.43s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:10<00:02, 2.49s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:10<00:02, 2.48s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:10<00:02, 2.49s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:10<00:02, 2.47s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 1.89s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 1.88s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 1.88s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 2.19s/it]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 2.17s/it]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 2.18s/it]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 1.85s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 2.17s/it]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 1.89s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 2.19s/it]
+Loading base + LoRA adapter: /workspace/hanrui/syxin/Specforge/outputs/qwen3-8b-sft-32gpu-v3/epoch_0_step_2500
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:11, 2.80s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:11, 2.80s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:11, 2.80s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:11, 2.78s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:11, 2.77s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:11, 2.78s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:11, 2.79s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:11, 2.79s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:08, 2.83s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:08, 2.83s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:08, 2.83s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:08, 2.84s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:08, 2.83s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:08, 2.84s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:08, 2.84s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:08, 2.84s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:08<00:05, 2.81s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:08<00:05, 2.81s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:08<00:05, 2.81s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:08<00:05, 2.79s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:08<00:05, 2.78s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:08<00:05, 2.79s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:08<00:05, 2.79s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:08<00:05, 2.79s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:10<00:02, 2.58s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:10<00:02, 2.58s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:10<00:02, 2.58s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 1.95s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 1.95s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 1.95s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 2.30s/it]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 2.30s/it]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 2.30s/it]
+
Loading checkpoint shards: 80%|████████ | 4/5 [00:10<00:02, 2.57s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:10<00:02, 2.57s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:10<00:02, 2.57s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:10<00:02, 2.57s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:10<00:02, 2.58s/it]/workspace/miniconda3/envs/dflash/lib/python3.11/site-packages/peft/peft_model.py:598: UserWarning: Found missing adapter keys while loading the checkpoint: ['base_model.model.model.layers.0.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.o_proj.lora_A.default.weight', 
'base_model.model.model.layers.2.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.q_proj.lora_B.default.weight', 
'base_model.model.model.layers.6.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.v_proj.lora_A.default.weight', 
'base_model.model.model.layers.9.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.o_proj.lora_A.default.weight', 
'base_model.model.model.layers.12.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.q_proj.lora_A.default.weight', 
'base_model.model.model.layers.16.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.k_proj.lora_A.default.weight', 
'base_model.model.model.layers.19.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.v_proj.lora_A.default.weight', 
'base_model.model.model.layers.22.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.o_proj.lora_A.default.weight', 
'base_model.model.model.layers.25.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.q_proj.lora_A.default.weight', 
'base_model.model.model.layers.29.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.k_proj.lora_A.default.weight', 
'base_model.model.model.layers.32.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.v_proj.lora_A.default.weight', 
'base_model.model.model.layers.35.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.o_proj.lora_B.default.weight'].
+ warnings.warn(warn_message)
+/workspace/miniconda3/envs/dflash/lib/python3.11/site-packages/peft/peft_model.py:598: UserWarning: Found missing adapter keys while loading the checkpoint: ['base_model.model.model.layers.0.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.3.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.k_proj.lora_A.default.weight', 
'base_model.model.model.layers.6.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.9.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.13.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.q_proj.lora_B.default.weight', 
'base_model.model.model.layers.16.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.k_proj.lora_B.default.weight', 
'base_model.model.model.layers.19.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.22.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.26.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.q_proj.lora_B.default.weight', 
'base_model.model.model.layers.29.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.k_proj.lora_B.default.weight', 
'base_model.model.model.layers.32.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.35.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.o_proj.lora_B.default.weight'].
+ warnings.warn(warn_message)
+/workspace/miniconda3/envs/dflash/lib/python3.11/site-packages/peft/peft_model.py:598: UserWarning: Found missing adapter keys while loading the checkpoint: ['base_model.model.model.layers.0.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.3.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.k_proj.lora_A.default.weight', 
'base_model.model.model.layers.6.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.9.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.13.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.q_proj.lora_B.default.weight', 
'base_model.model.model.layers.16.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.k_proj.lora_B.default.weight', 
'base_model.model.model.layers.19.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.22.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.26.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.q_proj.lora_B.default.weight', 
'base_model.model.model.layers.29.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.k_proj.lora_B.default.weight', 
'base_model.model.model.layers.32.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.35.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.o_proj.lora_B.default.weight'].
+ warnings.warn(warn_message)
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 1.95s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 1.95s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 1.95s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 2.29s/it]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 2.29s/it]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 2.29s/it]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 1.95s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 1.95s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 2.29s/it]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 2.29s/it]
+Using the latest cached version of the dataset since openai/openai_humaneval couldn't be found on the Hugging Face Hub (offline mode is enabled).
+Found the latest cached dataset configuration 'openai_humaneval' at /workspace/hanrui/datasets/openai___openai_humaneval/openai_humaneval/0.0.0/7dce6050a7d6d172f3cc5c32aa97f52fa1a2e544 (last modified on Tue Mar 17 17:01:06 2026).
+Using the latest cached version of the dataset since openai/openai_humaneval couldn't be found on the Hugging Face Hub (offline mode is enabled).
+Found the latest cached dataset configuration 'openai_humaneval' at /workspace/hanrui/datasets/openai___openai_humaneval/openai_humaneval/0.0.0/7dce6050a7d6d172f3cc5c32aa97f52fa1a2e544 (last modified on Tue Mar 17 17:01:06 2026).
+Using the latest cached version of the dataset since openai/openai_humaneval couldn't be found on the Hugging Face Hub (offline mode is enabled).
+Found the latest cached dataset configuration 'openai_humaneval' at /workspace/hanrui/datasets/openai___openai_humaneval/openai_humaneval/0.0.0/7dce6050a7d6d172f3cc5c32aa97f52fa1a2e544 (last modified on Tue Mar 17 17:01:06 2026).
+/workspace/miniconda3/envs/dflash/lib/python3.11/site-packages/peft/peft_model.py:598: UserWarning: Found missing adapter keys while loading the checkpoint: ['base_model.model.model.layers.0.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.3.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.k_proj.lora_A.default.weight', 
'base_model.model.model.layers.6.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.9.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.13.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.q_proj.lora_B.default.weight', 
'base_model.model.model.layers.16.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.k_proj.lora_B.default.weight', 
'base_model.model.model.layers.19.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.22.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.26.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.q_proj.lora_B.default.weight', 
'base_model.model.model.layers.29.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.k_proj.lora_B.default.weight', 
'base_model.model.model.layers.32.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.35.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.o_proj.lora_B.default.weight'].
+ warnings.warn(warn_message)
+/workspace/miniconda3/envs/dflash/lib/python3.11/site-packages/peft/peft_model.py:598: UserWarning: Found missing adapter keys while loading the checkpoint: ['base_model.model.model.layers.0.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.3.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.k_proj.lora_A.default.weight', 
'base_model.model.model.layers.6.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.9.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.13.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.q_proj.lora_B.default.weight', 
'base_model.model.model.layers.16.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.k_proj.lora_B.default.weight', 
'base_model.model.model.layers.19.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.22.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.26.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.q_proj.lora_B.default.weight', 
'base_model.model.model.layers.29.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.k_proj.lora_B.default.weight', 
'base_model.model.model.layers.32.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.35.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.o_proj.lora_B.default.weight'].
+ warnings.warn(warn_message)
+/workspace/miniconda3/envs/dflash/lib/python3.11/site-packages/peft/peft_model.py:598: UserWarning: Found missing adapter keys while loading the checkpoint: ['base_model.model.model.layers.0.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.3.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.k_proj.lora_A.default.weight', 
'base_model.model.model.layers.6.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.9.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.13.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.q_proj.lora_B.default.weight', 
'base_model.model.model.layers.16.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.k_proj.lora_B.default.weight', 
'base_model.model.model.layers.19.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.22.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.26.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.q_proj.lora_B.default.weight', 
'base_model.model.model.layers.29.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.k_proj.lora_B.default.weight', 
'base_model.model.model.layers.32.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.35.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.o_proj.lora_B.default.weight'].
+ warnings.warn(warn_message)
+/workspace/miniconda3/envs/dflash/lib/python3.11/site-packages/peft/peft_model.py:598: UserWarning: Found missing adapter keys while loading the checkpoint: ['base_model.model.model.layers.0.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.3.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.k_proj.lora_A.default.weight', 
'base_model.model.model.layers.6.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.9.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.13.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.q_proj.lora_B.default.weight', 
'base_model.model.model.layers.16.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.k_proj.lora_B.default.weight', 
'base_model.model.model.layers.19.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.22.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.26.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.q_proj.lora_B.default.weight', 
'base_model.model.model.layers.29.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.k_proj.lora_B.default.weight', 
'base_model.model.model.layers.32.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.35.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.o_proj.lora_B.default.weight'].
+ warnings.warn(warn_message)
+/workspace/miniconda3/envs/dflash/lib/python3.11/site-packages/peft/peft_model.py:598: UserWarning: Found missing adapter keys while loading the checkpoint: ['base_model.model.model.layers.0.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.3.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.k_proj.lora_A.default.weight', 
'base_model.model.model.layers.6.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.9.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.13.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.q_proj.lora_B.default.weight', 
'base_model.model.model.layers.16.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.k_proj.lora_B.default.weight', 
'base_model.model.model.layers.19.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.22.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.26.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.q_proj.lora_B.default.weight', 
'base_model.model.model.layers.29.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.k_proj.lora_B.default.weight', 
'base_model.model.model.layers.32.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.35.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.o_proj.lora_B.default.weight'].
+ warnings.warn(warn_message)
+
+============================================================
+Benchmark: humaneval (8 GPUs)
+============================================================
+Using the latest cached version of the dataset since openai/openai_humaneval couldn't be found on the Hugging Face Hub (offline mode is enabled).
+Found the latest cached dataset configuration 'openai_humaneval' at /workspace/hanrui/datasets/openai___openai_humaneval/openai_humaneval/0.0.0/7dce6050a7d6d172f3cc5c32aa97f52fa1a2e544 (last modified on Tue Mar 17 17:01:06 2026).
+Total 164 samples, distributed across 8 GPUs
+
[GPU0] humaneval: 0%| | 0/21 [00:00, ?sample/s]Using the latest cached version of the dataset since openai/openai_humaneval couldn't be found on the Hugging Face Hub (offline mode is enabled).
+Found the latest cached dataset configuration 'openai_humaneval' at /workspace/hanrui/datasets/openai___openai_humaneval/openai_humaneval/0.0.0/7dce6050a7d6d172f3cc5c32aa97f52fa1a2e544 (last modified on Tue Mar 17 17:01:06 2026).
+Using the latest cached version of the dataset since openai/openai_humaneval couldn't be found on the Hugging Face Hub (offline mode is enabled).
+Found the latest cached dataset configuration 'openai_humaneval' at /workspace/hanrui/datasets/openai___openai_humaneval/openai_humaneval/0.0.0/7dce6050a7d6d172f3cc5c32aa97f52fa1a2e544 (last modified on Tue Mar 17 17:01:06 2026).
+Using the latest cached version of the dataset since openai/openai_humaneval couldn't be found on the Hugging Face Hub (offline mode is enabled).
+Found the latest cached dataset configuration 'openai_humaneval' at /workspace/hanrui/datasets/openai___openai_humaneval/openai_humaneval/0.0.0/7dce6050a7d6d172f3cc5c32aa97f52fa1a2e544 (last modified on Tue Mar 17 17:01:06 2026).
+Using the latest cached version of the dataset since openai/openai_humaneval couldn't be found on the Hugging Face Hub (offline mode is enabled).
+Found the latest cached dataset configuration 'openai_humaneval' at /workspace/hanrui/datasets/openai___openai_humaneval/openai_humaneval/0.0.0/7dce6050a7d6d172f3cc5c32aa97f52fa1a2e544 (last modified on Tue Mar 17 17:01:06 2026).
+
[GPU0] humaneval: 0%| | 0/21 [00:33, ?sample/s, accept_len=2.01]
[GPU0] humaneval: 5%|▍ | 1/21 [00:33<11:17, 33.86s/sample, accept_len=2.01]
[GPU0] humaneval: 5%|▍ | 1/21 [00:51<11:17, 33.86s/sample, accept_len=1.98]
[GPU0] humaneval: 10%|▉ | 2/21 [00:51<07:40, 24.25s/sample, accept_len=1.98]
[GPU0] humaneval: 10%|▉ | 2/21 [01:07<07:40, 24.25s/sample, accept_len=1.99]
[GPU0] humaneval: 14%|█▍ | 3/21 [01:07<06:07, 20.43s/sample, accept_len=1.99]
[GPU0] humaneval: 14%|█▍ | 3/21 [01:30<06:07, 20.43s/sample, accept_len=1.98]
[GPU0] humaneval: 19%|█▉ | 4/21 [01:30<06:09, 21.71s/sample, accept_len=1.98]
[GPU0] humaneval: 19%|█▉ | 4/21 [02:26<06:09, 21.71s/sample, accept_len=1.98]
[GPU0] humaneval: 24%|██▍ | 5/21 [02:26<09:00, 33.81s/sample, accept_len=1.98]
[GPU0] humaneval: 24%|██▍ | 5/21 [02:59<09:00, 33.81s/sample, accept_len=1.98]
[GPU0] humaneval: 29%|██▊ | 6/21 [02:59<08:22, 33.53s/sample, accept_len=1.98]
[GPU0] humaneval: 29%|██▊ | 6/21 [03:14<08:22, 33.53s/sample, accept_len=1.99]
[GPU0] humaneval: 33%|███▎ | 7/21 [03:14<06:27, 27.67s/sample, accept_len=1.99]
[GPU0] humaneval: 33%|███▎ | 7/21 [03:34<06:27, 27.67s/sample, accept_len=1.97]
[GPU0] humaneval: 38%|███▊ | 8/21 [03:34<05:26, 25.11s/sample, accept_len=1.97]
[GPU0] humaneval: 38%|███▊ | 8/21 [04:15<05:26, 25.11s/sample, accept_len=1.99]
[GPU0] humaneval: 43%|████▎ | 9/21 [04:15<06:01, 30.13s/sample, accept_len=1.99]
[GPU0] humaneval: 43%|████▎ | 9/21 [04:46<06:01, 30.13s/sample, accept_len=2.00]
[GPU0] humaneval: 48%|████▊ | 10/21 [04:46<05:34, 30.39s/sample, accept_len=2.00]
[GPU0] humaneval: 48%|████▊ | 10/21 [05:10<05:34, 30.39s/sample, accept_len=1.99]
[GPU0] humaneval: 52%|█████▏ | 11/21 [05:10<04:43, 28.38s/sample, accept_len=1.99]
[GPU0] humaneval: 52%|█████▏ | 11/21 [05:45<04:43, 28.38s/sample, accept_len=2.00]
[GPU0] humaneval: 57%|█████▋ | 12/21 [05:45<04:32, 30.28s/sample, accept_len=2.00]
[GPU0] humaneval: 57%|█████▋ | 12/21 [06:16<04:32, 30.28s/sample, accept_len=2.02]
[GPU0] humaneval: 62%|██████▏ | 13/21 [06:16<04:05, 30.73s/sample, accept_len=2.02]
[GPU0] humaneval: 62%|██████▏ | 13/21 [06:44<04:05, 30.73s/sample, accept_len=2.00]
[GPU0] humaneval: 67%|██████▋ | 14/21 [06:44<03:28, 29.78s/sample, accept_len=2.00]
[GPU0] humaneval: 67%|██████▋ | 14/21 [07:06<03:28, 29.78s/sample, accept_len=1.99]
[GPU0] humaneval: 71%|███████▏ | 15/21 [07:06<02:45, 27.61s/sample, accept_len=1.99]
[GPU0] humaneval: 71%|███████▏ | 15/21 [07:37<02:45, 27.61s/sample, accept_len=2.00]
[GPU0] humaneval: 76%|███████▌ | 16/21 [07:37<02:22, 28.51s/sample, accept_len=2.00]
[GPU0] humaneval: 76%|███████▌ | 16/21 [08:11<02:22, 28.51s/sample, accept_len=1.98]
[GPU0] humaneval: 81%|████████ | 17/21 [08:11<02:01, 30.28s/sample, accept_len=1.98]
[GPU0] humaneval: 81%|████████ | 17/21 [08:42<02:01, 30.28s/sample, accept_len=1.98]
[GPU0] humaneval: 86%|████████▌ | 18/21 [08:42<01:31, 30.45s/sample, accept_len=1.98]
[GPU0] humaneval: 86%|████████▌ | 18/21 [09:08<01:31, 30.45s/sample, accept_len=1.98]
[GPU0] humaneval: 90%|█████████ | 19/21 [09:08<00:58, 29.06s/sample, accept_len=1.98]
[GPU0] humaneval: 90%|█████████ | 19/21 [09:31<00:58, 29.06s/sample, accept_len=1.99]
[GPU0] humaneval: 95%|█████████▌| 20/21 [09:31<00:27, 27.07s/sample, accept_len=1.99]
[GPU0] humaneval: 95%|█████████▌| 20/21 [10:07<00:27, 27.07s/sample, accept_len=1.97]
[GPU0] humaneval: 100%|██████████| 21/21 [10:07<00:00, 29.75s/sample, accept_len=1.97]
[GPU0] humaneval: 100%|██████████| 21/21 [10:07<00:00, 28.91s/sample, accept_len=1.97]
+Using the latest cached version of the dataset since openai/gsm8k couldn't be found on the Hugging Face Hub (offline mode is enabled).
+Using the latest cached version of the dataset since openai/gsm8k couldn't be found on the Hugging Face Hub (offline mode is enabled).
+Using the latest cached version of the dataset since openai/gsm8k couldn't be found on the Hugging Face Hub (offline mode is enabled).
+Using the latest cached version of the dataset since openai/gsm8k couldn't be found on the Hugging Face Hub (offline mode is enabled).
+Using the latest cached version of the dataset since openai/gsm8k couldn't be found on the Hugging Face Hub (offline mode is enabled).
+Found the latest cached dataset configuration 'main' at /workspace/hanrui/datasets/openai___gsm8k/main/0.0.0/cc7b047b6e5bb11b4f1af84efc572db110a51b3c (last modified on Tue Mar 17 13:17:15 2026).
+Using the latest cached version of the dataset since openai/gsm8k couldn't be found on the Hugging Face Hub (offline mode is enabled).
+/workspace/miniconda3/envs/dflash/lib/python3.11/site-packages/torch/storage.py:414: FutureWarning: You are using `torch.load` with `weights_only=False` (the current default value), which uses the default pickle module implicitly. It is possible to construct malicious pickle data which will execute arbitrary code during unpickling (See https://github.com/pytorch/pytorch/blob/main/SECURITY.md#untrusted-models for more details). In a future release, the default value for `weights_only` will be flipped to `True`. This limits the functions that could be executed during unpickling. Arbitrary objects will no longer be allowed to be loaded via this mode unless they are explicitly allowlisted by the user via `torch.serialization.add_safe_globals`. We recommend you start setting `weights_only=True` for any use case where you don't have full control of the loaded file. Please open an issue on GitHub for any issues related to this experimental feature.
+ return torch.load(io.BytesIO(b))
+Found the latest cached dataset configuration 'main' at /workspace/hanrui/datasets/openai___gsm8k/main/0.0.0/cc7b047b6e5bb11b4f1af84efc572db110a51b3c (last modified on Tue Mar 17 13:17:15 2026).
+Found the latest cached dataset configuration 'main' at /workspace/hanrui/datasets/openai___gsm8k/main/0.0.0/cc7b047b6e5bb11b4f1af84efc572db110a51b3c (last modified on Tue Mar 17 13:17:15 2026).
+Using the latest cached version of the dataset since openai/gsm8k couldn't be found on the Hugging Face Hub (offline mode is enabled).
+Found the latest cached dataset configuration 'main' at /workspace/hanrui/datasets/openai___gsm8k/main/0.0.0/cc7b047b6e5bb11b4f1af84efc572db110a51b3c (last modified on Tue Mar 17 13:17:15 2026).
+Found the latest cached dataset configuration 'main' at /workspace/hanrui/datasets/openai___gsm8k/main/0.0.0/cc7b047b6e5bb11b4f1af84efc572db110a51b3c (last modified on Tue Mar 17 13:17:15 2026).
+Found the latest cached dataset configuration 'main' at /workspace/hanrui/datasets/openai___gsm8k/main/0.0.0/cc7b047b6e5bb11b4f1af84efc572db110a51b3c (last modified on Tue Mar 17 13:17:15 2026).
+Found the latest cached dataset configuration 'main' at /workspace/hanrui/datasets/openai___gsm8k/main/0.0.0/cc7b047b6e5bb11b4f1af84efc572db110a51b3c (last modified on Tue Mar 17 13:17:15 2026).
+
+humaneval Results:
+ Decoding speedup: 0.97x
+ Average Acceptance length: 2.00
+ Acceptance length histogram: ['0.0%', '9.9%', '80.7%', '9.2%', '0.2%', '0.0%', '0.0%', '0.0%', '0.0%', '0.0%', '0.0%', '0.0%', '0.0%', '0.0%', '0.0%', '0.0%', '0.0%']
+ Num responses: 164
+
+============================================================
+Benchmark: gsm8k (8 GPUs)
+============================================================
+Using the latest cached version of the dataset since openai/gsm8k couldn't be found on the Hugging Face Hub (offline mode is enabled).
+Found the latest cached dataset configuration 'main' at /workspace/hanrui/datasets/openai___gsm8k/main/0.0.0/cc7b047b6e5bb11b4f1af84efc572db110a51b3c (last modified on Tue Mar 17 13:17:15 2026).
+Total 128 samples, distributed across 8 GPUs
+
[GPU0] gsm8k: 0%| | 0/16 [00:00, ?sample/s]
[GPU0] gsm8k: 0%| | 0/16 [00:13, ?sample/s, accept_len=1.98]
[GPU0] gsm8k: 6%|▋ | 1/16 [00:13<03:21, 13.42s/sample, accept_len=1.98]
[GPU0] gsm8k: 6%|▋ | 1/16 [00:34<03:21, 13.42s/sample, accept_len=2.01]
[GPU0] gsm8k: 12%|█▎ | 2/16 [00:34<04:08, 17.77s/sample, accept_len=2.01]
[GPU0] gsm8k: 12%|█▎ | 2/16 [00:49<04:08, 17.77s/sample, accept_len=2.02]
[GPU0] gsm8k: 19%|█▉ | 3/16 [00:49<03:38, 16.82s/sample, accept_len=2.02]
[GPU0] gsm8k: 19%|█▉ | 3/16 [01:15<03:38, 16.82s/sample, accept_len=2.01]
[GPU0] gsm8k: 25%|██▌ | 4/16 [01:15<04:04, 20.37s/sample, accept_len=2.01]
[GPU0] gsm8k: 25%|██▌ | 4/16 [01:32<04:04, 20.37s/sample, accept_len=2.02]
[GPU0] gsm8k: 31%|███▏ | 5/16 [01:32<03:28, 18.96s/sample, accept_len=2.02]
[GPU0] gsm8k: 31%|███▏ | 5/16 [01:41<03:28, 18.96s/sample, accept_len=2.03]
[GPU0] gsm8k: 38%|███▊ | 6/16 [01:41<02:37, 15.76s/sample, accept_len=2.03]
[GPU0] gsm8k: 38%|███▊ | 6/16 [02:01<02:37, 15.76s/sample, accept_len=2.04]
[GPU0] gsm8k: 44%|████▍ | 7/16 [02:01<02:33, 17.04s/sample, accept_len=2.04]
[GPU0] gsm8k: 44%|████▍ | 7/16 [02:16<02:33, 17.04s/sample, accept_len=2.07]
[GPU0] gsm8k: 50%|█████ | 8/16 [02:16<02:11, 16.45s/sample, accept_len=2.07]
[GPU0] gsm8k: 50%|█████ | 8/16 [02:35<02:11, 16.45s/sample, accept_len=2.08]
[GPU0] gsm8k: 56%|█████▋ | 9/16 [02:35<01:59, 17.06s/sample, accept_len=2.08]
[GPU0] gsm8k: 56%|█████▋ | 9/16 [02:49<01:59, 17.06s/sample, accept_len=2.08]
[GPU0] gsm8k: 62%|██████▎ | 10/16 [02:49<01:38, 16.38s/sample, accept_len=2.08]
[GPU0] gsm8k: 62%|██████▎ | 10/16 [03:03<01:38, 16.38s/sample, accept_len=2.07]
[GPU0] gsm8k: 69%|██████▉ | 11/16 [03:03<01:18, 15.65s/sample, accept_len=2.07]
[GPU0] gsm8k: 69%|██████▉ | 11/16 [03:25<01:18, 15.65s/sample, accept_len=2.07]
[GPU0] gsm8k: 75%|███████▌ | 12/16 [03:25<01:10, 17.60s/sample, accept_len=2.07]
[GPU0] gsm8k: 75%|███████▌ | 12/16 [03:39<01:10, 17.60s/sample, accept_len=2.05]
[GPU0] gsm8k: 81%|████████▏ | 13/16 [03:39<00:49, 16.38s/sample, accept_len=2.05]
[GPU0] gsm8k: 81%|████████▏ | 13/16 [03:54<00:49, 16.38s/sample, accept_len=2.05]
[GPU0] gsm8k: 88%|████████▊ | 14/16 [03:54<00:31, 15.84s/sample, accept_len=2.05]
[GPU0] gsm8k: 88%|████████▊ | 14/16 [04:02<00:31, 15.84s/sample, accept_len=2.04]
[GPU0] gsm8k: 94%|█████████▍| 15/16 [04:02<00:13, 13.68s/sample, accept_len=2.04]
[GPU0] gsm8k: 94%|█████████▍| 15/16 [04:25<00:13, 13.68s/sample, accept_len=2.05]
[GPU0] gsm8k: 100%|██████████| 16/16 [04:25<00:00, 16.29s/sample, accept_len=2.05]
[GPU0] gsm8k: 100%|██████████| 16/16 [04:25<00:00, 16.57s/sample, accept_len=2.05]
+Using the latest cached version of the dataset since HuggingFaceH4/mt_bench_prompts couldn't be found on the Hugging Face Hub (offline mode is enabled).
+Using the latest cached version of the dataset since HuggingFaceH4/mt_bench_prompts couldn't be found on the Hugging Face Hub (offline mode is enabled).
+Using the latest cached version of the dataset since HuggingFaceH4/mt_bench_prompts couldn't be found on the Hugging Face Hub (offline mode is enabled).
+Found the latest cached dataset configuration 'default' at /workspace/hanrui/datasets/HuggingFaceH4___mt_bench_prompts/default/0.0.0/e3a795c5e9a82ee40611c416b8a7786c73198991 (last modified on Tue Mar 17 13:17:15 2026).
+Found the latest cached dataset configuration 'default' at /workspace/hanrui/datasets/HuggingFaceH4___mt_bench_prompts/default/0.0.0/e3a795c5e9a82ee40611c416b8a7786c73198991 (last modified on Tue Mar 17 13:17:15 2026).
+Found the latest cached dataset configuration 'default' at /workspace/hanrui/datasets/HuggingFaceH4___mt_bench_prompts/default/0.0.0/e3a795c5e9a82ee40611c416b8a7786c73198991 (last modified on Tue Mar 17 13:17:15 2026).
+Using the latest cached version of the dataset since HuggingFaceH4/mt_bench_prompts couldn't be found on the Hugging Face Hub (offline mode is enabled).
+Found the latest cached dataset configuration 'default' at /workspace/hanrui/datasets/HuggingFaceH4___mt_bench_prompts/default/0.0.0/e3a795c5e9a82ee40611c416b8a7786c73198991 (last modified on Tue Mar 17 13:17:15 2026).
+Using the latest cached version of the dataset since HuggingFaceH4/mt_bench_prompts couldn't be found on the Hugging Face Hub (offline mode is enabled).
+Using the latest cached version of the dataset since HuggingFaceH4/mt_bench_prompts couldn't be found on the Hugging Face Hub (offline mode is enabled).
+Using the latest cached version of the dataset since HuggingFaceH4/mt_bench_prompts couldn't be found on the Hugging Face Hub (offline mode is enabled).
+Found the latest cached dataset configuration 'default' at /workspace/hanrui/datasets/HuggingFaceH4___mt_bench_prompts/default/0.0.0/e3a795c5e9a82ee40611c416b8a7786c73198991 (last modified on Tue Mar 17 13:17:15 2026).
+Found the latest cached dataset configuration 'default' at /workspace/hanrui/datasets/HuggingFaceH4___mt_bench_prompts/default/0.0.0/e3a795c5e9a82ee40611c416b8a7786c73198991 (last modified on Tue Mar 17 13:17:15 2026).
+Found the latest cached dataset configuration 'default' at /workspace/hanrui/datasets/HuggingFaceH4___mt_bench_prompts/default/0.0.0/e3a795c5e9a82ee40611c416b8a7786c73198991 (last modified on Tue Mar 17 13:17:15 2026).
+
+gsm8k Results:
+ Decoding speedup: 1.03x
+ Average Acceptance length: 2.04
+ Acceptance length histogram: ['0.0%', '7.2%', '82.7%', '9.8%', '0.3%', '0.0%', '0.0%', '0.0%', '0.0%', '0.0%', '0.0%', '0.0%', '0.0%', '0.0%', '0.0%', '0.0%', '0.0%']
+ Num responses: 128
+
+============================================================
+Benchmark: mt-bench (8 GPUs)
+============================================================
+Using the latest cached version of the dataset since HuggingFaceH4/mt_bench_prompts couldn't be found on the Hugging Face Hub (offline mode is enabled).
+Found the latest cached dataset configuration 'default' at /workspace/hanrui/datasets/HuggingFaceH4___mt_bench_prompts/default/0.0.0/e3a795c5e9a82ee40611c416b8a7786c73198991 (last modified on Tue Mar 17 13:17:15 2026).
+Total 80 samples, distributed across 8 GPUs
+
[GPU0] mt-bench: 0%| | 0/10 [00:00, ?sample/s]
[GPU0] mt-bench: 0%| | 0/10 [03:54, ?sample/s, accept_len=1.94]
[GPU0] mt-bench: 10%|█ | 1/10 [03:54<35:07, 234.14s/sample, accept_len=1.94]
[GPU0] mt-bench: 10%|█ | 1/10 [04:12<35:07, 234.14s/sample, accept_len=1.92]
[GPU0] mt-bench: 20%|██ | 2/10 [04:12<14:19, 107.42s/sample, accept_len=1.92]
[GPU0] mt-bench: 20%|██ | 2/10 [06:25<14:19, 107.42s/sample, accept_len=1.93]
[GPU0] mt-bench: 30%|███ | 3/10 [06:25<13:53, 119.12s/sample, accept_len=1.93]
[GPU0] mt-bench: 30%|███ | 3/10 [10:01<13:53, 119.12s/sample, accept_len=1.94]
[GPU0] mt-bench: 40%|████ | 4/10 [10:01<15:43, 157.27s/sample, accept_len=1.94]
[GPU0] mt-bench: 40%|████ | 4/10 [10:40<15:43, 157.27s/sample, accept_len=2.02]
[GPU0] mt-bench: 50%|█████ | 5/10 [10:40<09:32, 114.42s/sample, accept_len=2.02]
[GPU0] mt-bench: 50%|█████ | 5/10 [12:13<09:32, 114.42s/sample, accept_len=2.03]
[GPU0] mt-bench: 60%|██████ | 6/10 [12:13<07:09, 107.35s/sample, accept_len=2.03]
[GPU0] mt-bench: 60%|██████ | 6/10 [15:15<07:09, 107.35s/sample, accept_len=2.02]
[GPU0] mt-bench: 70%|███████ | 7/10 [15:15<06:34, 131.53s/sample, accept_len=2.02]
[GPU0] mt-bench: 70%|███████ | 7/10 [15:19<06:34, 131.53s/sample, accept_len=2.04]
[GPU0] mt-bench: 80%|████████ | 8/10 [15:19<03:02, 91.21s/sample, accept_len=2.04]
[GPU0] mt-bench: 80%|████████ | 8/10 [16:23<03:02, 91.21s/sample, accept_len=2.04]
[GPU0] mt-bench: 90%|█████████ | 9/10 [16:23<01:22, 82.67s/sample, accept_len=2.04][rank7]:[E317 17:45:58.085400661 ProcessGroupNCCL.cpp:607] [Rank 7] Watchdog caught collective operation timeout: WorkNCCL(SeqNum=5, OpType=ALLGATHER, NumelIn=1, NumelOut=8, Timeout(ms)=600000) ran for 600058 milliseconds before timing out.
+[rank7]:[E317 17:45:58.085551647 ProcessGroupNCCL.cpp:1664] [PG 0 (default_pg) Rank 7] Exception (either an error or timeout) detected by watchdog at work: 5, last enqueued NCCL work: 5, last completed NCCL work: 4.
+[rank7]:[E317 17:45:59.795122977 ProcessGroupNCCL.cpp:1709] [PG 0 (default_pg) Rank 7] Timeout at NCCL work: 5, last enqueued NCCL work: 5, last completed NCCL work: 4.
+[rank7]:[E317 17:45:59.795159380 ProcessGroupNCCL.cpp:621] [Rank 7] Some NCCL operations have failed or timed out. Due to the asynchronous nature of CUDA kernels, subsequent GPU operations might run on corrupted/incomplete data.
+[rank7]:[E317 17:45:59.795168045 ProcessGroupNCCL.cpp:627] [Rank 7] To avoid data inconsistency, we are taking the entire process down.
+[rank7]:[E317 17:45:59.796632516 ProcessGroupNCCL.cpp:1515] [PG 0 (default_pg) Rank 7] Process group watchdog thread terminated with exception: [Rank 7] Watchdog caught collective operation timeout: WorkNCCL(SeqNum=5, OpType=ALLGATHER, NumelIn=1, NumelOut=8, Timeout(ms)=600000) ran for 600058 milliseconds before timing out.
+Exception raised from checkTimeout at ../torch/csrc/distributed/c10d/ProcessGroupNCCL.cpp:609 (most recent call first):
+frame #0: c10::Error::Error(c10::SourceLocation, std::string) + 0x96 (0x7f4b87177f86 in /workspace/miniconda3/envs/dflash/lib/python3.11/site-packages/torch/lib/libc10.so)
+frame #1: c10d::ProcessGroupNCCL::WorkNCCL::checkTimeout(std::optional > >) + 0x1d2 (0x7f4b393738d2 in /workspace/miniconda3/envs/dflash/lib/python3.11/site-packages/torch/lib/libtorch_cuda.so)
+frame #2: c10d::ProcessGroupNCCL::watchdogHandler() + 0x233 (0x7f4b3937a313 in /workspace/miniconda3/envs/dflash/lib/python3.11/site-packages/torch/lib/libtorch_cuda.so)
+frame #3: c10d::ProcessGroupNCCL::ncclCommWatchdog() + 0x10c (0x7f4b3937c6fc in /workspace/miniconda3/envs/dflash/lib/python3.11/site-packages/torch/lib/libtorch_cuda.so)
+frame #4: + 0xdf0e6 (0x7f4b8a6970e6 in /workspace/miniconda3/envs/dflash/bin/../lib/libstdc++.so.6)
+frame #5: + 0x891f5 (0x7f4b8cf991f5 in /usr/lib/x86_64-linux-gnu/libc.so.6)
+frame #6: + 0x1098dc (0x7f4b8d0198dc in /usr/lib/x86_64-linux-gnu/libc.so.6)
+
+terminate called after throwing an instance of 'c10::DistBackendError'
+ what(): [PG 0 (default_pg) Rank 7] Process group watchdog thread terminated with exception: [Rank 7] Watchdog caught collective operation timeout: WorkNCCL(SeqNum=5, OpType=ALLGATHER, NumelIn=1, NumelOut=8, Timeout(ms)=600000) ran for 600058 milliseconds before timing out.
+Exception raised from checkTimeout at ../torch/csrc/distributed/c10d/ProcessGroupNCCL.cpp:609 (most recent call first):
+frame #0: c10::Error::Error(c10::SourceLocation, std::string) + 0x96 (0x7f4b87177f86 in /workspace/miniconda3/envs/dflash/lib/python3.11/site-packages/torch/lib/libc10.so)
+frame #1: c10d::ProcessGroupNCCL::WorkNCCL::checkTimeout(std::optional > >) + 0x1d2 (0x7f4b393738d2 in /workspace/miniconda3/envs/dflash/lib/python3.11/site-packages/torch/lib/libtorch_cuda.so)
+frame #2: c10d::ProcessGroupNCCL::watchdogHandler() + 0x233 (0x7f4b3937a313 in /workspace/miniconda3/envs/dflash/lib/python3.11/site-packages/torch/lib/libtorch_cuda.so)
+frame #3: c10d::ProcessGroupNCCL::ncclCommWatchdog() + 0x10c (0x7f4b3937c6fc in /workspace/miniconda3/envs/dflash/lib/python3.11/site-packages/torch/lib/libtorch_cuda.so)
+frame #4: + 0xdf0e6 (0x7f4b8a6970e6 in /workspace/miniconda3/envs/dflash/bin/../lib/libstdc++.so.6)
+frame #5: + 0x891f5 (0x7f4b8cf991f5 in /usr/lib/x86_64-linux-gnu/libc.so.6)
+frame #6: + 0x1098dc (0x7f4b8d0198dc in /usr/lib/x86_64-linux-gnu/libc.so.6)
+
+Exception raised from ncclCommWatchdog at ../torch/csrc/distributed/c10d/ProcessGroupNCCL.cpp:1521 (most recent call first):
+frame #0: c10::Error::Error(c10::SourceLocation, std::string) + 0x96 (0x7f4b87177f86 in /workspace/miniconda3/envs/dflash/lib/python3.11/site-packages/torch/lib/libc10.so)
+frame #1: + 0xe5aa84 (0x7f4b39005a84 in /workspace/miniconda3/envs/dflash/lib/python3.11/site-packages/torch/lib/libtorch_cuda.so)
+frame #2: + 0xdf0e6 (0x7f4b8a6970e6 in /workspace/miniconda3/envs/dflash/bin/../lib/libstdc++.so.6)
+frame #3: + 0x891f5 (0x7f4b8cf991f5 in /usr/lib/x86_64-linux-gnu/libc.so.6)
+frame #4: + 0x1098dc (0x7f4b8d0198dc in /usr/lib/x86_64-linux-gnu/libc.so.6)
+
+W0317 17:45:59.989000 140168604448576 torch/distributed/elastic/multiprocessing/api.py:858] Sending process 1141 closing signal SIGTERM
+W0317 17:45:59.989000 140168604448576 torch/distributed/elastic/multiprocessing/api.py:858] Sending process 1142 closing signal SIGTERM
+W0317 17:45:59.990000 140168604448576 torch/distributed/elastic/multiprocessing/api.py:858] Sending process 1143 closing signal SIGTERM
+W0317 17:45:59.990000 140168604448576 torch/distributed/elastic/multiprocessing/api.py:858] Sending process 1144 closing signal SIGTERM
+W0317 17:45:59.991000 140168604448576 torch/distributed/elastic/multiprocessing/api.py:858] Sending process 1145 closing signal SIGTERM
+W0317 17:45:59.991000 140168604448576 torch/distributed/elastic/multiprocessing/api.py:858] Sending process 1146 closing signal SIGTERM
+W0317 17:45:59.991000 140168604448576 torch/distributed/elastic/multiprocessing/api.py:858] Sending process 1147 closing signal SIGTERM
+E0317 17:46:03.310000 140168604448576 torch/distributed/elastic/multiprocessing/api.py:833] failed (exitcode: -6) local_rank: 7 (pid: 1148) of binary: /workspace/miniconda3/envs/dflash/bin/python3
+Traceback (most recent call last):
+ File "", line 198, in _run_module_as_main
+ File "", line 88, in _run_code
+ File "/workspace/miniconda3/envs/dflash/lib/python3.11/site-packages/torch/distributed/run.py", line 905, in
+ main()
+ File "/workspace/miniconda3/envs/dflash/lib/python3.11/site-packages/torch/distributed/elastic/multiprocessing/errors/__init__.py", line 348, in wrapper
+ return f(*args, **kwargs)
+ ^^^^^^^^^^^^^^^^^^
+ File "/workspace/miniconda3/envs/dflash/lib/python3.11/site-packages/torch/distributed/run.py", line 901, in main
+ run(args)
+ File "/workspace/miniconda3/envs/dflash/lib/python3.11/site-packages/torch/distributed/run.py", line 892, in run
+ elastic_launch(
+ File "/workspace/miniconda3/envs/dflash/lib/python3.11/site-packages/torch/distributed/launcher/api.py", line 133, in __call__
+ return launch_agent(self._config, self._entrypoint, list(args))
+ ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+ File "/workspace/miniconda3/envs/dflash/lib/python3.11/site-packages/torch/distributed/launcher/api.py", line 264, in launch_agent
+ raise ChildFailedError(
+torch.distributed.elastic.multiprocessing.errors.ChildFailedError:
+============================================================
+/workspace/hanrui/syxin_old/eval_dflash_lora_inject.py FAILED
+------------------------------------------------------------
+Failures:
+
+------------------------------------------------------------
+Root Cause (first observed failure):
+[0]:
+ time : 2026-03-17_17:45:59
+ host : job-006ce80a7c47-20260302193512-5dcd4c9bbd-l5mjm
+ rank : 7 (local_rank: 7)
+ exitcode : -6 (pid: 1148)
+ error_file:
+ traceback : Signal 6 (SIGABRT) received by PID 1148
+============================================================
diff --git a/syxin_old/eval_mtbench.log b/syxin_old/eval_mtbench.log
new file mode 100644
index 0000000000000000000000000000000000000000..ba9fa6a10c17cd6c878851c96a45847174686ee7
--- /dev/null
+++ b/syxin_old/eval_mtbench.log
@@ -0,0 +1,89 @@
+nohup: ignoring input
+WARNING:__main__:
+*****************************************
+Setting OMP_NUM_THREADS environment variable for each process to be 1 in default, to avoid your system being overloaded, please further tune the variable for optimal performance in your application as needed.
+*****************************************
+[W319 15:58:37.877946322 Utils.hpp:135] Warning: Environment variable NCCL_ASYNC_ERROR_HANDLING is deprecated; use TORCH_NCCL_ASYNC_ERROR_HANDLING instead (function operator())
+`torch_dtype` is deprecated! Use `dtype` instead!
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s][W319 15:58:37.467988233 Utils.hpp:135] Warning: Environment variable NCCL_ASYNC_ERROR_HANDLING is deprecated; use TORCH_NCCL_ASYNC_ERROR_HANDLING instead (function operator())
+[W319 15:58:37.642464172 Utils.hpp:135] Warning: Environment variable NCCL_ASYNC_ERROR_HANDLING is deprecated; use TORCH_NCCL_ASYNC_ERROR_HANDLING instead (function operator())
+[W319 15:58:37.710061711 Utils.hpp:135] Warning: Environment variable NCCL_ASYNC_ERROR_HANDLING is deprecated; use TORCH_NCCL_ASYNC_ERROR_HANDLING instead (function operator())
+[W319 15:58:38.798998313 Utils.hpp:135] Warning: Environment variable NCCL_ASYNC_ERROR_HANDLING is deprecated; use TORCH_NCCL_ASYNC_ERROR_HANDLING instead (function operator())
+[W319 15:58:38.847226543 Utils.hpp:135] Warning: Environment variable NCCL_ASYNC_ERROR_HANDLING is deprecated; use TORCH_NCCL_ASYNC_ERROR_HANDLING instead (function operator())
+[W319 15:58:38.857628240 Utils.hpp:135] Warning: Environment variable NCCL_ASYNC_ERROR_HANDLING is deprecated; use TORCH_NCCL_ASYNC_ERROR_HANDLING instead (function operator())
+[W319 15:58:38.865435885 Utils.hpp:135] Warning: Environment variable NCCL_ASYNC_ERROR_HANDLING is deprecated; use TORCH_NCCL_ASYNC_ERROR_HANDLING instead (function operator())
+Running on 8 GPU(s)
+Using attn_implementation: target=flash_attention_2, draft=sdpa
+Loading target model: /workspace/models/Qwen3-8B
+`torch_dtype` is deprecated! Use `dtype` instead!
+`torch_dtype` is deprecated! Use `dtype` instead!
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]`torch_dtype` is deprecated! Use `dtype` instead!
+`torch_dtype` is deprecated! Use `dtype` instead!
+`torch_dtype` is deprecated! Use `dtype` instead!
+`torch_dtype` is deprecated! Use `dtype` instead!
+`torch_dtype` is deprecated! Use `dtype` instead!
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:09, 2.26s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:09, 2.39s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:09, 2.37s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:09, 2.37s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:09, 2.35s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:04<00:06, 2.21s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:10, 2.67s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:10, 2.67s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:10, 2.67s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:04<00:07, 2.51s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:06<00:04, 2.13s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:07, 2.64s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:07, 2.65s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:08, 2.76s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:08, 2.80s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:08, 2.80s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:08, 2.81s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:08<00:01, 1.93s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:07<00:04, 2.41s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:08<00:00, 1.52s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:08<00:00, 1.78s/it]
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 60%|██████ | 3/5 [00:07<00:05, 2.64s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:07<00:05, 2.65s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:07<00:05, 2.68s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:08<00:05, 2.73s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:08<00:05, 2.72s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:08<00:02, 2.13s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:08<00:05, 2.79s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:08, 2.07s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:09<00:00, 1.58s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:09<00:00, 1.92s/it]
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 80%|████████ | 4/5 [00:09<00:02, 2.44s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:09<00:02, 2.44s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:10<00:02, 2.42s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:10<00:02, 2.51s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:10<00:02, 2.51s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:10<00:02, 2.61s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 1.87s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 1.87s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 1.86s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 2.16s/it]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 2.17s/it]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 2.18s/it]
+Loading base + LoRA adapter: /workspace/hanrui/syxin/Specforge/outputs/qwen3-8b-sft-32gpu-v3/epoch_3_step_9288
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 40%|████ | 2/5 [00:04<00:06, 2.08s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:08, 2.07s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 1.89s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 1.89s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 2.23s/it]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 2.23s/it]
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 1.95s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 2.29s/it]
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 60%|██████ | 3/5 [00:06<00:04, 2.13s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:04<00:06, 2.09s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:11, 2.82s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:11, 2.82s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:11, 2.83s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:10, 2.67s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:10, 2.67s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:11, 2.84s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:08<00:02, 2.03s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:06<00:04, 2.06s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:08<00:00, 1.55s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:08<00:00, 1.79s/it]
+
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:08, 2.88s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:08, 2.88s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:08, 2.94s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:08, 2.76s/it]/workspace/miniconda3/envs/dflash/lib/python3.11/site-packages/peft/peft_model.py:598: UserWarning: Found missing adapter keys while loading the checkpoint: ['base_model.model.model.layers.0.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.3.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.k_proj.lora_A.default.weight', 
'base_model.model.model.layers.6.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.9.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.13.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.q_proj.lora_B.default.weight', 
'base_model.model.model.layers.16.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.k_proj.lora_B.default.weight', 
'base_model.model.model.layers.19.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.22.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.26.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.q_proj.lora_B.default.weight', 
'base_model.model.model.layers.29.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.k_proj.lora_B.default.weight', 
'base_model.model.model.layers.32.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.35.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.o_proj.lora_B.default.weight'].
+ warnings.warn(warn_message)
+
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:08, 2.85s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:07<00:01, 1.92s/it]Using the latest cached version of the dataset since HuggingFaceH4/mt_bench_prompts couldn't be found on the Hugging Face Hub (offline mode is enabled).
+Found the latest cached dataset configuration 'default' at /workspace/hanrui/datasets/HuggingFaceH4___mt_bench_prompts/default/0.0.0/e3a795c5e9a82ee40611c416b8a7786c73198991 (last modified on Tue Mar 17 13:17:15 2026).
+
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:08, 2.90s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:08<00:00, 1.46s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:08<00:00, 1.71s/it]
+/workspace/miniconda3/envs/dflash/lib/python3.11/site-packages/peft/peft_model.py:598: UserWarning: Found missing adapter keys while loading the checkpoint: ['base_model.model.model.layers.0.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.3.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.k_proj.lora_A.default.weight', 
'base_model.model.model.layers.6.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.9.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.13.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.q_proj.lora_B.default.weight', 
'base_model.model.model.layers.16.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.k_proj.lora_B.default.weight', 
'base_model.model.model.layers.19.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.22.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.26.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.q_proj.lora_B.default.weight', 
'base_model.model.model.layers.29.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.k_proj.lora_B.default.weight', 
'base_model.model.model.layers.32.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.35.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.o_proj.lora_B.default.weight'].
+ warnings.warn(warn_message)
+Using the latest cached version of the dataset since HuggingFaceH4/mt_bench_prompts couldn't be found on the Hugging Face Hub (offline mode is enabled).
+Found the latest cached dataset configuration 'default' at /workspace/hanrui/datasets/HuggingFaceH4___mt_bench_prompts/default/0.0.0/e3a795c5e9a82ee40611c416b8a7786c73198991 (last modified on Tue Mar 17 13:17:15 2026).
+
Loading checkpoint shards: 60%|██████ | 3/5 [00:08<00:05, 2.67s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:08<00:05, 2.69s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:08<00:05, 2.81s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:08<00:05, 2.81s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:08<00:05, 2.85s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:08<00:05, 2.79s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:10<00:02, 2.61s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:10<00:02, 2.54s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:10<00:02, 2.61s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:10<00:02, 2.53s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:10<00:02, 2.65s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:10<00:02, 2.57s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 1.96s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 1.90s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 1.91s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 2.31s/it]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 2.24s/it]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 2.24s/it]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 1.96s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 2.31s/it]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 2.00s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 2.35s/it]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 1.92s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:11<00:00, 2.29s/it]
+/workspace/miniconda3/envs/dflash/lib/python3.11/site-packages/peft/peft_model.py:598: UserWarning: Found missing adapter keys while loading the checkpoint: ['base_model.model.model.layers.0.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.3.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.k_proj.lora_A.default.weight', 
'base_model.model.model.layers.6.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.9.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.13.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.q_proj.lora_B.default.weight', 
'base_model.model.model.layers.16.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.k_proj.lora_B.default.weight', 
'base_model.model.model.layers.19.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.22.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.26.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.q_proj.lora_B.default.weight', 
'base_model.model.model.layers.29.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.k_proj.lora_B.default.weight', 
'base_model.model.model.layers.32.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.35.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.o_proj.lora_B.default.weight'].
+ warnings.warn(warn_message)
+/workspace/miniconda3/envs/dflash/lib/python3.11/site-packages/peft/peft_model.py:598: UserWarning: Found missing adapter keys while loading the checkpoint: ['base_model.model.model.layers.0.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.3.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.k_proj.lora_A.default.weight', 
'base_model.model.model.layers.6.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.9.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.13.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.q_proj.lora_B.default.weight', 
'base_model.model.model.layers.16.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.k_proj.lora_B.default.weight', 
'base_model.model.model.layers.19.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.22.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.26.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.q_proj.lora_B.default.weight', 
'base_model.model.model.layers.29.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.k_proj.lora_B.default.weight', 
'base_model.model.model.layers.32.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.35.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.o_proj.lora_B.default.weight'].
+ warnings.warn(warn_message)
+/workspace/miniconda3/envs/dflash/lib/python3.11/site-packages/peft/peft_model.py:598: UserWarning: Found missing adapter keys while loading the checkpoint: ['base_model.model.model.layers.0.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.3.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.k_proj.lora_A.default.weight', 
'base_model.model.model.layers.6.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.9.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.13.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.q_proj.lora_B.default.weight', 
'base_model.model.model.layers.16.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.k_proj.lora_B.default.weight', 
'base_model.model.model.layers.19.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.22.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.26.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.q_proj.lora_B.default.weight', 
'base_model.model.model.layers.29.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.k_proj.lora_B.default.weight', 
'base_model.model.model.layers.32.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.35.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.o_proj.lora_B.default.weight'].
+ warnings.warn(warn_message)
+/workspace/miniconda3/envs/dflash/lib/python3.11/site-packages/peft/peft_model.py:598: UserWarning: Found missing adapter keys while loading the checkpoint: ['base_model.model.model.layers.0.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.3.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.k_proj.lora_A.default.weight', 
'base_model.model.model.layers.6.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.9.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.13.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.q_proj.lora_B.default.weight', 
'base_model.model.model.layers.16.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.k_proj.lora_B.default.weight', 
'base_model.model.model.layers.19.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.22.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.26.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.q_proj.lora_B.default.weight', 
'base_model.model.model.layers.29.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.k_proj.lora_B.default.weight', 
'base_model.model.model.layers.32.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.35.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.o_proj.lora_B.default.weight'].
+ warnings.warn(warn_message)
+/workspace/miniconda3/envs/dflash/lib/python3.11/site-packages/peft/peft_model.py:598: UserWarning: Found missing adapter keys while loading the checkpoint: ['base_model.model.model.layers.0.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.3.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.k_proj.lora_A.default.weight', 
'base_model.model.model.layers.6.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.9.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.13.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.q_proj.lora_B.default.weight', 
'base_model.model.model.layers.16.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.k_proj.lora_B.default.weight', 
'base_model.model.model.layers.19.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.22.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.26.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.q_proj.lora_B.default.weight', 
'base_model.model.model.layers.29.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.k_proj.lora_B.default.weight', 
'base_model.model.model.layers.32.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.35.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.o_proj.lora_B.default.weight'].
+ warnings.warn(warn_message)
+/workspace/miniconda3/envs/dflash/lib/python3.11/site-packages/peft/peft_model.py:598: UserWarning: Found missing adapter keys while loading the checkpoint: ['base_model.model.model.layers.0.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.0.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.0.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.1.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.1.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.2.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.2.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.3.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.3.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.3.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.4.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.4.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.5.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.5.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.k_proj.lora_A.default.weight', 
'base_model.model.model.layers.6.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.6.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.6.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.7.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.7.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.8.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.8.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.9.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.9.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.9.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.10.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.10.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.11.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.11.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.12.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.12.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.13.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.13.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.13.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.14.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.14.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.15.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.15.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.q_proj.lora_B.default.weight', 
'base_model.model.model.layers.16.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.16.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.16.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.17.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.17.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.18.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.18.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.k_proj.lora_B.default.weight', 
'base_model.model.model.layers.19.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.19.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.19.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.20.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.20.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.21.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.21.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.22.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.22.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.22.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.23.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.23.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.24.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.24.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.25.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.25.self_attn.o_proj.lora_B.default.weight', 
'base_model.model.model.layers.26.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.26.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.26.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.27.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.27.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.28.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.28.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.q_proj.lora_B.default.weight', 
'base_model.model.model.layers.29.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.29.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.29.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.30.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.30.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.31.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.31.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.k_proj.lora_B.default.weight', 
'base_model.model.model.layers.32.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.32.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.32.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.33.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.33.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.v_proj.lora_B.default.weight', 'base_model.model.model.layers.34.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.34.self_attn.o_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.q_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.q_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.k_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.k_proj.lora_B.default.weight', 'base_model.model.model.layers.35.self_attn.v_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.v_proj.lora_B.default.weight', 
'base_model.model.model.layers.35.self_attn.o_proj.lora_A.default.weight', 'base_model.model.model.layers.35.self_attn.o_proj.lora_B.default.weight'].
+ warnings.warn(warn_message)
+Using the latest cached version of the dataset since HuggingFaceH4/mt_bench_prompts couldn't be found on the Hugging Face Hub (offline mode is enabled).
+Found the latest cached dataset configuration 'default' at /workspace/hanrui/datasets/HuggingFaceH4___mt_bench_prompts/default/0.0.0/e3a795c5e9a82ee40611c416b8a7786c73198991 (last modified on Tue Mar 17 13:17:15 2026).
+
+============================================================
+Benchmark: mt-bench (8 GPUs)
+============================================================
+Using the latest cached version of the dataset since HuggingFaceH4/mt_bench_prompts couldn't be found on the Hugging Face Hub (offline mode is enabled).
+Found the latest cached dataset configuration 'default' at /workspace/hanrui/datasets/HuggingFaceH4___mt_bench_prompts/default/0.0.0/e3a795c5e9a82ee40611c416b8a7786c73198991 (last modified on Tue Mar 17 13:17:15 2026).
+Total 80 samples, distributed across 8 GPUs
+
[GPU0] mt-bench: 0%| | 0/10 [00:00, ?sample/s]Using the latest cached version of the dataset since HuggingFaceH4/mt_bench_prompts couldn't be found on the Hugging Face Hub (offline mode is enabled).
+Found the latest cached dataset configuration 'default' at /workspace/hanrui/datasets/HuggingFaceH4___mt_bench_prompts/default/0.0.0/e3a795c5e9a82ee40611c416b8a7786c73198991 (last modified on Tue Mar 17 13:17:15 2026).
+Using the latest cached version of the dataset since HuggingFaceH4/mt_bench_prompts couldn't be found on the Hugging Face Hub (offline mode is enabled).
+Found the latest cached dataset configuration 'default' at /workspace/hanrui/datasets/HuggingFaceH4___mt_bench_prompts/default/0.0.0/e3a795c5e9a82ee40611c416b8a7786c73198991 (last modified on Tue Mar 17 13:17:15 2026).
+Using the latest cached version of the dataset since HuggingFaceH4/mt_bench_prompts couldn't be found on the Hugging Face Hub (offline mode is enabled).
+Found the latest cached dataset configuration 'default' at /workspace/hanrui/datasets/HuggingFaceH4___mt_bench_prompts/default/0.0.0/e3a795c5e9a82ee40611c416b8a7786c73198991 (last modified on Tue Mar 17 13:17:15 2026).
+Using the latest cached version of the dataset since HuggingFaceH4/mt_bench_prompts couldn't be found on the Hugging Face Hub (offline mode is enabled).
+Found the latest cached dataset configuration 'default' at /workspace/hanrui/datasets/HuggingFaceH4___mt_bench_prompts/default/0.0.0/e3a795c5e9a82ee40611c416b8a7786c73198991 (last modified on Tue Mar 17 13:17:15 2026).
+
[GPU0] mt-bench: 0%| | 0/10 [03:57, ?sample/s, accept_len=1.94]
[GPU0] mt-bench: 10%|█ | 1/10 [03:57<35:41, 237.92s/sample, accept_len=1.94]
[GPU0] mt-bench: 10%|█ | 1/10 [04:17<35:41, 237.92s/sample, accept_len=1.92]
[GPU0] mt-bench: 20%|██ | 2/10 [04:17<14:35, 109.46s/sample, accept_len=1.92]
[GPU0] mt-bench: 20%|██ | 2/10 [06:34<14:35, 109.46s/sample, accept_len=1.93]
[GPU0] mt-bench: 30%|███ | 3/10 [06:34<14:13, 121.99s/sample, accept_len=1.93]
[GPU0] mt-bench: 30%|███ | 3/10 [10:15<14:13, 121.99s/sample, accept_len=1.94]
[GPU0] mt-bench: 40%|████ | 4/10 [10:15<16:06, 161.14s/sample, accept_len=1.94]
[GPU0] mt-bench: 40%|████ | 4/10 [10:55<16:06, 161.14s/sample, accept_len=2.02]
[GPU0] mt-bench: 50%|█████ | 5/10 [10:55<09:46, 117.34s/sample, accept_len=2.02]
[GPU0] mt-bench: 50%|█████ | 5/10 [12:30<09:46, 117.34s/sample, accept_len=2.03]
[GPU0] mt-bench: 60%|██████ | 6/10 [12:30<07:19, 109.92s/sample, accept_len=2.03]
[GPU0] mt-bench: 60%|██████ | 6/10 [15:35<07:19, 109.92s/sample, accept_len=2.02]
[GPU0] mt-bench: 70%|███████ | 7/10 [15:35<06:43, 134.35s/sample, accept_len=2.02]
[GPU0] mt-bench: 70%|███████ | 7/10 [15:40<06:43, 134.35s/sample, accept_len=2.04]
[GPU0] mt-bench: 80%|████████ | 8/10 [15:40<03:06, 93.16s/sample, accept_len=2.04]
[GPU0] mt-bench: 80%|████████ | 8/10 [16:45<03:06, 93.16s/sample, accept_len=2.04]
[GPU0] mt-bench: 90%|█████████ | 9/10 [16:45<01:24, 84.48s/sample, accept_len=2.04]
[GPU0] mt-bench: 90%|█████████ | 9/10 [20:11<01:24, 84.48s/sample, accept_len=2.02]
[GPU0] mt-bench: 100%|██████████| 10/10 [20:11<00:00, 122.05s/sample, accept_len=2.02]
[GPU0] mt-bench: 100%|██████████| 10/10 [20:11<00:00, 121.19s/sample, accept_len=2.02]
+/workspace/miniconda3/envs/dflash/lib/python3.11/site-packages/torch/storage.py:414: FutureWarning: You are using `torch.load` with `weights_only=False` (the current default value), which uses the default pickle module implicitly. It is possible to construct malicious pickle data which will execute arbitrary code during unpickling (See https://github.com/pytorch/pytorch/blob/main/SECURITY.md#untrusted-models for more details). In a future release, the default value for `weights_only` will be flipped to `True`. This limits the functions that could be executed during unpickling. Arbitrary objects will no longer be allowed to be loaded via this mode unless they are explicitly allowlisted by the user via `torch.serialization.add_safe_globals`. We recommend you start setting `weights_only=True` for any use case where you don't have full control of the loaded file. Please open an issue on GitHub for any issues related to this experimental feature.
+ return torch.load(io.BytesIO(b))
+
+mt-bench Results:
+ Decoding speedup: 0.85x
+ Average Acceptance length: 1.96
+ Acceptance length histogram: ['0.0%', '13.2%', '77.5%', '9.0%', '0.3%', '0.0%', '0.0%', '0.0%', '0.0%', '0.0%', '0.0%', '0.0%', '0.0%', '0.0%', '0.0%', '0.0%', '0.0%']
+ Num responses: 160
+
+Results saved to: /workspace/hanrui/syxin_old/Specforge/benchmarks/results/dflash_lora_inject_offline_epoch_3_step_9288_20260319_161930.json
diff --git a/syxin_old/run_bench.sh b/syxin_old/run_bench.sh
new file mode 100644
index 0000000000000000000000000000000000000000..9164e86a1863415ce07f659233ff65cff7840615
--- /dev/null
+++ b/syxin_old/run_bench.sh
@@ -0,0 +1,68 @@
+#!/bin/bash
+# Step 3: Run HumanEval / MT-Bench / GSM8K benchmarks.
+# Run AFTER start_server.sh is up.
+# Usage:
+#   bash run_bench.sh                 # all three benches, full dataset
+#   bash run_bench.sh humaneval       # only humaneval
+#   bash run_bench.sh mtbench gsm8k   # pick any subset
+
+set -eo pipefail  # pipefail: a bench_eagle3.py failure must not be masked by the trailing `tee`
+
+INTRANET_IP=10.1.1.131
+PORT=30000
+BASE_MODEL=/workspace/models/Qwen3-8B
+MERGED=/workspace/hanrui/syxin_old/Specforge/outputs/qwen3-8b-dflash-lora-merged
+BENCH_DIR=/workspace/hanrui/syxin_old/Specforge/benchmarks
+RESULT_DIR="$BENCH_DIR/results"
+
+# ---- sanity check ----
+echo "Checking server at http://$INTRANET_IP:$PORT ..."
+curl -sf "http://$INTRANET_IP:$PORT/v1/models" > /dev/null || {
+    echo "[ERROR] Server not reachable. Start it first: bash start_server.sh"
+    exit 1
+}
+echo "Server OK."
+
+mkdir -p "$RESULT_DIR"
+cd "$BENCH_DIR"
+export PYTHONPATH="/workspace/hanrui/syxin_old/Specforge:$PYTHONPATH"
+
+# ---- decide which benches to run ----
+TARGETS=("$@")
+if [ ${#TARGETS[@]} -eq 0 ]; then
+    TARGETS=(humaneval mtbench gsm8k)
+fi
+
+BENCH_ARGS=()  # one "name:num_samples" entry per selected bench, kept as an array to avoid word-splitting tricks
+for t in "${TARGETS[@]}"; do
+    case "$t" in
+        humaneval) BENCH_ARGS+=("humaneval:164") ;;
+        mtbench)   BENCH_ARGS+=("mtbench:80") ;;
+        gsm8k)     BENCH_ARGS+=("gsm8k:1319") ;;
+        *)
+            echo "[ERROR] Unknown bench: $t (choices: humaneval mtbench gsm8k)"
+            exit 1
+            ;;
+    esac
+done
+
+TIMESTAMP=$(date +%Y%m%d_%H%M%S)
+echo "Running: ${BENCH_ARGS[*]}"
+echo "Results -> $RESULT_DIR"
+echo ""
+
+python3 bench_eagle3.py \
+    --model-path "$BASE_MODEL" \
+    --speculative-draft-model-path "$MERGED" \
+    --host "$INTRANET_IP" \
+    --port "$PORT" \
+    --config-list "16,4,1,4" \
+    --benchmark-list "${BENCH_ARGS[@]}" \
+    --output-dir "$RESULT_DIR" \
+    --name "dflash_lora_${TIMESTAMP}" \
+    --skip-launch-server \
+    2>&1 | tee "$RESULT_DIR/bench_${TIMESTAMP}.log"
+
+echo ""
+echo "Done. Latest result files:"
+ls -lht "$RESULT_DIR"/*.jsonl 2>/dev/null | head -5 || true  # listing is informational; no matches must not fail the run
diff --git a/syxin_old/run_eval.sh b/syxin_old/run_eval.sh
new file mode 100644
index 0000000000000000000000000000000000000000..83b46a9e26bf09da6e537969ba79662b7829264f
--- /dev/null
+++ b/syxin_old/run_eval.sh
@@ -0,0 +1,7 @@
+#!/bin/bash
+export NCCL_TIMEOUT=1800000
+export TORCH_NCCL_BLOCKING_WAIT=0
+export NCCL_ASYNC_ERROR_HANDLING=1
+/workspace/miniconda3/envs/dflash/bin/python3 -m torch.distributed.run --standalone --nproc_per_node 8 /workspace/hanrui/syxin_old/eval_dflash_lora_inject.py \
+ --ckpt epoch_3_step_4644 \
+ --datasets gsm8k humaneval mt-bench
diff --git a/syxin_old/run_random_anchor_64gpu.sh b/syxin_old/run_random_anchor_64gpu.sh
new file mode 100644
index 0000000000000000000000000000000000000000..4702301611c5c1d68cc6a6c7d4a80565dcb119f3
--- /dev/null
+++ b/syxin_old/run_random_anchor_64gpu.sh
@@ -0,0 +1,31 @@
+#!/bin/bash
+export JOB_NAME='qwen3-8b-sft'
+export GPU_NUMS=64
+export TRAIN_SCRIPT='/workspace/hanrui/syxin_old/launch_train_random_anchor.py'
+export WORK_DIR='/workspace/hanrui/syxin_old/Specforge'
+
+if [ $GPU_NUMS -lt 8 ]; then
+ export NNODES=1
+ export GPU_NUMS_PER_NODE=$GPU_NUMS
+else
+ export NNODES=$((GPU_NUMS/8))
+ export GPU_NUMS_PER_NODE=8
+fi
+
+# 使用 spec 环境的 northjob
+/workspace/miniconda3/envs/spec/bin/northjob \
+create \
+--job-type train \
+--nproc-per-node $GPU_NUMS_PER_NODE \
+--gpu-per-node $GPU_NUMS_PER_NODE \
+--nnodes $NNODES \
+--k8s-priority 3 \
+--k8s-queue bg-agentic-coding \
+--k8s-namespace bg-agentic-coding \
+--k8s-pvc-name i-xinsiyang-y4zy0sik0a \
+--k8s-pvc-mount-path /workspace \
+--k8s-no-reclaim \
+--k8s-images harbor.local.clusters/bp/megatron-bplm:25.03_fp8.ibgda.qwen3.next.fix_triton.fix_te.hf457.qwen3_vl \
+--job-name $JOB_NAME \
+--workspace $WORK_DIR \
+$TRAIN_SCRIPT $GPU_NUMS_PER_NODE
diff --git a/syxin_old/run_train_dflash_direct_inject.sh b/syxin_old/run_train_dflash_direct_inject.sh
new file mode 100644
index 0000000000000000000000000000000000000000..de7facae55444c8bdb6d4aeca56029cc169cdad8
--- /dev/null
+++ b/syxin_old/run_train_dflash_direct_inject.sh
@@ -0,0 +1,56 @@
+#!/bin/bash
+# Single-node DFlash direct-inject training: runs scripts/train_dflash.py under torch.distributed.run.
+# Usage: run_train_dflash_direct_inject.sh [NUM_GPUS] [OUTPUT_DIR] [extra train_dflash.py args...]
+set -euo pipefail
+
+ROOT_DIR=/workspace/hanrui/syxin_old/Specforge
+NUM_GPUS=8
+OUTPUT_DIR="$ROOT_DIR/outputs/qwen3-8b-dflash-direct-inject"
+# Both positionals are optional. A leading "-" marks the start of the pass-through options, so
+# "script.sh --num-epochs 1" keeps the defaults instead of storing the flag in NUM_GPUS.
+if [[ $# -ge 1 && "${1:0:1}" != "-" ]]; then NUM_GPUS=$1; shift; fi
+if [[ $# -ge 1 && "${1:0:1}" != "-" ]]; then OUTPUT_DIR=$1; shift; fi
+EXTRA_ARGS=("$@")
+
+export TORCHINDUCTOR_CACHE_DIR="$ROOT_DIR/cache/compiled_kernels"
+export SPECFORGE_DATA_NUM_PROC=16
+export PYTORCH_CUDA_ALLOC_CONF=expandable_segments:True
+export PYTORCH_ALLOC_CONF=expandable_segments:True
+export PYTHONPATH="$ROOT_DIR:${PYTHONPATH:-}"
+DEFAULT_SPECFORGE_PY=/workspace/hanrui/specforge/bin/python3
+# A PYTHON_BIN set by the caller wins; otherwise use the project interpreter when it is executable.
+if [[ -z "${PYTHON_BIN:-}" ]]; then
+    if [[ -x "$DEFAULT_SPECFORGE_PY" ]]; then
+        PYTHON_BIN="$DEFAULT_SPECFORGE_PY"
+    else
+        PYTHON_BIN=python3
+    fi
+fi
+
+cd "$ROOT_DIR"
+
+# ${EXTRA_ARGS[@]+...} expands to nothing for an empty array; bash < 4.4 aborts on a plain expansion under `set -u`.
+$PYTHON_BIN -m torch.distributed.run \
+    --standalone \
+    --nproc_per_node "$NUM_GPUS" \
+    scripts/train_dflash.py \
+    --target-model-path /workspace/models/Qwen3-8B \
+    --target-model-backend sglang \
+    --train-data-path /workspace/hanrui/datasets/Nemotron-CodeAlpaca-qwen3-8b-800K \
+    --output-dir "$OUTPUT_DIR" \
+    --block-size 16 \
+    --num-draft-layers 36 \
+    --attention-backend flex_attention \
+    --max-length 2048 \
+    --batch-size 1 \
+    --accumulation-steps 8 \
+    --num-epochs 3 \
+    --learning-rate 6e-4 \
+    --loss-decay-gamma 7 \
+    --lm-head-chunk-size 256 \
+    --gradient-checkpointing \
+    --chat-template qwen \
+    --log-interval 50 \
+    --save-interval 500 \
+    --cache-dir "$ROOT_DIR/cache" \
+    ${EXTRA_ARGS[@]+"${EXTRA_ARGS[@]}"}
diff --git a/syxin_old/run_train_multinode_dflash.sh b/syxin_old/run_train_multinode_dflash.sh
new file mode 100644
index 0000000000000000000000000000000000000000..fa67cc7f6c12a003f3224a3adc2e6295c15ef00f
--- /dev/null
+++ b/syxin_old/run_train_multinode_dflash.sh
@@ -0,0 +1,76 @@
+#!/bin/bash
+set -euo pipefail
+
+# Multi-node version of the train_dflash.py training script.
+# Mirrors the logic of run_train_dflash_8gpu.sh, adapted to the northjob multi-node environment.
+# effective batch = 64 x 4 x 2 = 512, same as the 8-GPU version.
+# Usage: run_train_multinode_dflash.sh [NUM_GPUS] [OUTPUT_DIR] [extra train_dflash.py args...]
+
+ROOT_DIR=/workspace/hanrui/syxin_old/Specforge
+CACHE_DIR=/tmp/specforge_cache
+OUTPUT_DIR="$ROOT_DIR/outputs/qwen3-8b-dflash-official-64gpu"
+
+# Parse arguments
+# Both positionals are optional. A leading "-" marks the start of the pass-through options, so
+# "script.sh --num-epochs 1" keeps the defaults instead of storing the flag in NUM_GPUS.
+# NUM_GPUS is still accepted as the first positional, but nothing below reads it.
+NUM_GPUS=8
+if [[ $# -ge 1 && "${1:0:1}" != "-" ]]; then NUM_GPUS=$1; shift; fi
+if [[ $# -ge 1 && "${1:0:1}" != "-" ]]; then OUTPUT_DIR=$1; shift; fi
+EXTRA_ARGS=("$@")
+
+# Environment variables
+# The HF datasets cache, HF home and inductor kernel cache are all placed under $CACHE_DIR.
+export PYTHONPATH="$ROOT_DIR:${PYTHONPATH:-}"
+export HF_DATASETS_CACHE="$CACHE_DIR/hf_datasets"
+export HF_HOME="$CACHE_DIR/hf_home"
+export TORCHINDUCTOR_CACHE_DIR="$CACHE_DIR/compiled_kernels"
+export PYTORCH_CUDA_ALLOC_CONF=expandable_segments:True
+export PYTORCH_ALLOC_CONF=expandable_segments:True
+export SPECFORGE_DATA_NUM_PROC=16
+
+# Python binary
+DEFAULT_SPECFORGE_PY=/workspace/miniconda3/envs/spec/bin/python3
+if [[ -z "${PYTHON_BIN:-}" ]]; then
+    if [[ -x "$DEFAULT_SPECFORGE_PY" ]]; then
+        PYTHON_BIN="$DEFAULT_SPECFORGE_PY"
+    else
+        PYTHON_BIN=python3
+    fi
+fi
+
+cd "$ROOT_DIR"
+
+# northjob has already set the distributed environment variables via torchrun.
+# Run the training script directly; do not launch torch.distributed.run again.
+# ${EXTRA_ARGS[@]+...} expands to nothing for an empty array; bash < 4.4 aborts on a plain expansion under `set -u`.
+$PYTHON_BIN scripts/train_dflash.py \
+    --target-model-path /workspace/models/Qwen3-8B \
+    --target-model-backend hf \
+    --draft-config-path "$ROOT_DIR/configs/qwen3-8b-dflash.json" \
+    --attention-backend sdpa \
+    --trust-remote-code \
+    \
+    --train-data-path /workspace/hanrui/datasets/Nemotron-CodeAlpaca-qwen3-8b-800K \
+    --chat-template qwen \
+    --max-length 3072 \
+    --dataloader-num-workers 4 \
+    \
+    --num-epochs 2 \
+    --batch-size 4 \
+    --accumulation-steps 2 \
+    --learning-rate 6e-4 \
+    --warmup-ratio 0.04 \
+    --max-grad-norm 1.0 \
+    --loss-decay-gamma 7 \
+    --random-anchor \
+    --num-anchors 512 \
+    --gradient-checkpointing \
+    \
+    --lm-head-chunk-size 256 \
+    \
+    --output-dir "$OUTPUT_DIR" \
+    --cache-dir "$CACHE_DIR" \
+    --log-interval 50 \
+    --save-interval 500 \
+    ${EXTRA_ARGS[@]+"${EXTRA_ARGS[@]}"}
diff --git a/syxin_old/run_train_qwen3_8b_sft_32gpu.sh b/syxin_old/run_train_qwen3_8b_sft_32gpu.sh
new file mode 100644
index 0000000000000000000000000000000000000000..d617ec44ece15524dadaec908f9d054797fa6d75
--- /dev/null
+++ b/syxin_old/run_train_qwen3_8b_sft_32gpu.sh
@@ -0,0 +1,66 @@
+#!/bin/bash
+set -euo pipefail
+
+ROOT_DIR=/workspace/hanrui/syxin_old/Specforge
+NUM_GPUS=8
+OUTPUT_DIR=$ROOT_DIR/outputs/qwen3-8b-sft-32gpu-v2
+CACHE_DIR=/tmp/specforge_cache_sft
+
+# Parse arguments
+if [[ $# -ge 1 ]]; then
+ NUM_GPUS=$1
+ shift
+fi
+if [[ $# -ge 1 && "${1:0:1}" != "-" ]]; then
+ OUTPUT_DIR=$1
+ shift
+fi
+EXTRA_ARGS=("$@")
+
+# Environment variables
+export TORCHINDUCTOR_CACHE_DIR=/tmp/specforge_cache_sft/compiled_kernels
+export SPECFORGE_DATA_NUM_PROC=16
+export PYTORCH_CUDA_ALLOC_CONF=expandable_segments:True
+export PYTORCH_ALLOC_CONF=expandable_segments:True
+export PYTHONPATH="$ROOT_DIR:${PYTHONPATH:-}"
+export HF_DATASETS_CACHE=/tmp/specforge_cache_sft/hf_datasets
+export HF_HOME=/tmp/specforge_cache_sft/hf_home
+
+# Python binary
+DEFAULT_SPECFORGE_PY=/workspace/hanrui/specforge/bin/python3
+if [[ -z "${PYTHON_BIN:-}" ]]; then
+ if [[ -x "$DEFAULT_SPECFORGE_PY" ]]; then
+ PYTHON_BIN="$DEFAULT_SPECFORGE_PY"
+ else
+ PYTHON_BIN=python3
+ fi
+fi
+
+cd $ROOT_DIR
+
+# northjob 已经通过 torchrun 启动了分布式,这里直接运行训练脚本
+$PYTHON_BIN $ROOT_DIR/scripts/train_dflash_lora_inject.py \
+ --target-model-path /workspace/models/Qwen3-8B \
+ --target-model-backend hf \
+ --train-data-path /workspace/hanrui/datasets/Nemotron-CodeAlpaca-qwen3-8b-800K \
+ --output-dir $OUTPUT_DIR \
+ --block-size 16 \
+ --attention-backend additive \
+ --attn-implementation sdpa \
+ --max-length 2048 \
+ --batch-size 8 \
+ --accumulation-steps 8 \
+ --num-epochs 3 \
+ --learning-rate 5e-5 \
+ --loss-decay-gamma 7 \
+ --gradient-checkpointing \
+ --chat-template qwen \
+ --log-interval 50 \
+ --save-interval 500 \
+ --cache-dir $CACHE_DIR \
+ --lora-rank 32 \
+ --lora-alpha 64 \
+ --lora-dropout 0.1 \
+ --trust-remote-code \
+ --dataloader-num-workers 0 \
+ "${EXTRA_ARGS[@]}"
diff --git a/syxin_old/server.log b/syxin_old/server.log
new file mode 100644
index 0000000000000000000000000000000000000000..8de27bf5c7527cdaf2e01d5d86545a6d1828f236
--- /dev/null
+++ b/syxin_old/server.log
@@ -0,0 +1,186 @@
+/workspace/hanrui/sglang/python/sglang/launch_server.py:51: UserWarning: 'python -m sglang.launch_server' is still supported, but 'sglang serve' is the recommended entrypoint.
+ Example: sglang serve --model-path [options]
+ warnings.warn(
+[2026-03-07 15:24:13] INFO server_args.py:2048: Attention backend not specified. Use fa3 backend by default.
+[2026-03-07 15:24:13] WARNING server_args.py:2629: Max running requests is reset to 48 for speculative decoding. You can override this by explicitly setting --max-running-requests.
+[2026-03-07 15:24:13] WARNING server_args.py:2650: Overlap scheduler is disabled when spec v2 is off or using unsupported speculative algorithm. You can set env SGLANG_ENABLE_SPEC_V2=True to enable the experimental overlap scheduler.
+[2026-03-07 15:24:13] WARNING server_args.py:2712: speculative_num_draft_tokens is adjusted to speculative_num_steps + 1 when speculative_eagle_topk == 1
+[2026-03-07 15:24:14] server_args=ServerArgs(model_path='/workspace/models/Qwen3-8B', tokenizer_path='/workspace/models/Qwen3-8B', tokenizer_mode='auto', tokenizer_worker_num=1, skip_tokenizer_init=False, load_format='auto', model_loader_extra_config='{}', trust_remote_code=True, context_length=None, is_embedding=False, enable_multimodal=None, revision=None, model_impl='auto', host='10.233.100.123', port=30000, fastapi_root_path='', grpc_mode=False, skip_server_warmup=False, warmups=None, nccl_port=None, checkpoint_engine_wait_weights_before_ready=False, ssl_keyfile=None, ssl_certfile=None, ssl_ca_certs=None, ssl_keyfile_password=None, enable_ssl_refresh=False, dtype='bfloat16', quantization=None, quantization_param_path=None, kv_cache_dtype='auto', enable_fp32_lm_head=False, modelopt_quant=None, modelopt_checkpoint_restore_path=None, modelopt_checkpoint_save_path=None, modelopt_export_path=None, quantize_and_serve=False, rl_quant_profile=None, mem_fraction_static=0.8, max_running_requests=48, max_queued_requests=None, max_total_tokens=None, chunked_prefill_size=8192, enable_dynamic_chunking=False, max_prefill_tokens=16384, prefill_max_requests=None, schedule_policy='fcfs', enable_priority_scheduling=False, disable_priority_preemption=False, default_priority_value=None, abort_on_priority_when_disabled=False, schedule_low_priority_values_first=False, priority_scheduling_preemption_threshold=10, schedule_conservativeness=1.0, page_size=1, swa_full_tokens_ratio=0.8, disable_hybrid_swa_memory=False, radix_eviction_policy='lru', enable_prefill_delayer=False, prefill_delayer_max_delay_passes=30, prefill_delayer_token_usage_low_watermark=None, prefill_delayer_forward_passes_buckets=None, prefill_delayer_wait_seconds_buckets=None, device='cuda', tp_size=4, pp_size=1, pp_max_micro_batch_size=None, pp_async_batch_depth=0, stream_interval=1, stream_output=False, enable_streaming_session=False, random_seed=551181117, constrained_json_whitespace_pattern=None, 
constrained_json_disable_any_whitespace=False, watchdog_timeout=300, soft_watchdog_timeout=None, dist_timeout=None, download_dir=None, model_checksum=None, base_gpu_id=0, gpu_id_step=1, sleep_on_idle=False, use_ray=False, custom_sigquit_handler=None, log_level='info', log_level_http=None, log_requests=False, log_requests_level=2, log_requests_format='text', log_requests_target=None, uvicorn_access_log_exclude_prefixes=[], crash_dump_folder=None, show_time_cost=False, enable_metrics=False, enable_metrics_for_all_schedulers=False, tokenizer_metrics_custom_labels_header='x-custom-labels', tokenizer_metrics_allowed_custom_labels=None, extra_metric_labels=None, bucket_time_to_first_token=None, bucket_inter_token_latency=None, bucket_e2e_request_latency=None, collect_tokens_histogram=False, prompt_tokens_buckets=None, generation_tokens_buckets=None, gc_warning_threshold_secs=0.0, decode_log_interval=40, enable_request_time_stats_logging=False, kv_events_config=None, enable_trace=False, otlp_traces_endpoint='localhost:4317', export_metrics_to_file=False, export_metrics_to_file_dir=None, api_key=None, admin_api_key=None, served_model_name='/workspace/models/Qwen3-8B', weight_version='default', chat_template=None, hf_chat_template_name=None, completion_template=None, file_storage_path='sglang_storage', enable_cache_report=False, reasoning_parser=None, tool_call_parser=None, tool_server=None, sampling_defaults='model', dp_size=1, load_balance_method='round_robin', attn_cp_size=1, moe_dp_size=1, dist_init_addr=None, nnodes=1, node_rank=0, json_model_override_args='{}', preferred_sampling_params=None, enable_lora=None, enable_lora_overlap_loading=None, max_lora_rank=None, lora_target_modules=None, lora_paths=None, max_loaded_loras=None, max_loras_per_batch=8, lora_eviction_policy='lru', lora_backend='csgmv', max_lora_chunk_size=16, attention_backend='fa3', decode_attention_backend=None, prefill_attention_backend=None, sampling_backend='flashinfer', grammar_backend='xgrammar', 
mm_attention_backend=None, fp8_gemm_runner_backend='auto', fp4_gemm_runner_backend='flashinfer_cutlass', nsa_prefill_backend=None, nsa_decode_backend=None, disable_flashinfer_autotune=False, mamba_backend='triton', speculative_algorithm='STANDALONE', speculative_draft_model_path='/workspace/hanrui/syxin_old/Specforge/outputs/qwen3-8b-dflash-lora-merged', speculative_draft_model_revision='main', speculative_draft_load_format=None, speculative_num_steps=4, speculative_eagle_topk=1, speculative_num_draft_tokens=5, speculative_accept_threshold_single=1.0, speculative_accept_threshold_acc=1.0, speculative_token_map=None, speculative_attention_mode='prefill', speculative_draft_attention_backend=None, speculative_moe_runner_backend='auto', speculative_moe_a2a_backend=None, speculative_draft_model_quantization=None, speculative_ngram_min_match_window_size=1, speculative_ngram_max_match_window_size=12, speculative_ngram_min_bfs_breadth=1, speculative_ngram_max_bfs_breadth=10, speculative_ngram_match_type='BFS', speculative_ngram_branch_length=18, speculative_ngram_capacity=10000000, enable_multi_layer_eagle=False, ep_size=1, moe_a2a_backend='none', moe_runner_backend='auto', flashinfer_mxfp4_moe_precision='default', enable_flashinfer_allreduce_fusion=False, enable_aiter_allreduce_fusion=False, deepep_mode='auto', ep_num_redundant_experts=0, ep_dispatch_algorithm=None, init_expert_location='trivial', enable_eplb=False, eplb_algorithm='auto', eplb_rebalance_num_iterations=1000, eplb_rebalance_layers_per_chunk=None, eplb_min_rebalancing_utilization_threshold=1.0, expert_distribution_recorder_mode=None, expert_distribution_recorder_buffer_size=1000, enable_expert_distribution_metrics=False, deepep_config=None, moe_dense_tp_size=None, elastic_ep_backend=None, enable_elastic_expert_backup=False, mooncake_ib_device=None, max_mamba_cache_size=None, mamba_ssm_dtype=None, mamba_full_memory_ratio=0.9, mamba_scheduler_strategy='no_buffer', mamba_track_interval=256, 
linear_attn_backend='triton', linear_attn_decode_backend=None, linear_attn_prefill_backend=None, enable_hierarchical_cache=False, hicache_ratio=2.0, hicache_size=0, hicache_write_policy='write_through', hicache_io_backend='kernel', hicache_mem_layout='layer_first', disable_hicache_numa_detect=False, hicache_storage_backend=None, hicache_storage_prefetch_policy='best_effort', hicache_storage_backend_extra_config=None, hierarchical_sparse_attention_extra_config=None, enable_lmcache=False, kt_weight_path=None, kt_method='AMXINT4', kt_cpuinfer=None, kt_threadpool_count=2, kt_num_gpu_experts=None, kt_max_deferred_experts_per_token=None, dllm_algorithm=None, dllm_algorithm_config=None, enable_double_sparsity=False, ds_channel_config_path=None, ds_heavy_channel_num=32, ds_heavy_token_num=256, ds_heavy_channel_type='qk', ds_sparse_decode_threshold=4096, cpu_offload_gb=0, offload_group_size=-1, offload_num_in_group=1, offload_prefetch_step=1, offload_mode='cpu', multi_item_scoring_delimiter=None, disable_radix_cache=False, cuda_graph_max_bs=512, cuda_graph_bs=[1, 2, 3, 4, 5, 6, 7, 8, 10, 12, 14, 16, 18, 20, 22, 24, 26, 28, 30, 32, 40, 44, 48, 52, 56, 60, 64, 72, 80, 88, 96, 104, 112, 120, 128, 136, 144, 152, 160, 168, 176, 184, 192, 200, 208, 216, 224, 232, 240, 248, 256, 272, 288, 304, 320, 336, 352, 368, 384, 400, 416, 432, 448, 464, 480, 496, 512], disable_cuda_graph=False, disable_cuda_graph_padding=False, enable_profile_cuda_graph=False, enable_cudagraph_gc=False, enable_layerwise_nvtx_marker=False, enable_nccl_nvls=False, enable_symm_mem=False, disable_flashinfer_cutlass_moe_fp4_allgather=False, enable_tokenizer_batch_encode=False, disable_tokenizer_batch_decode=False, disable_outlines_disk_cache=False, disable_custom_all_reduce=False, enable_mscclpp=False, enable_torch_symm_mem=False, disable_overlap_schedule=True, enable_mixed_chunk=False, enable_dp_attention=False, enable_dp_lm_head=False, enable_two_batch_overlap=False, enable_single_batch_overlap=False, 
tbo_token_distribution_threshold=0.48, enable_torch_compile=False, disable_piecewise_cuda_graph=True, enforce_piecewise_cuda_graph=False, enable_torch_compile_debug_mode=False, torch_compile_max_bs=32, piecewise_cuda_graph_max_tokens=8192, piecewise_cuda_graph_tokens=[4, 8, 12, 16, 20, 24, 28, 32, 48, 64, 80, 96, 112, 128, 144, 160, 176, 192, 208, 224, 240, 256, 288, 320, 352, 384, 416, 448, 480, 512, 576, 640, 704, 768, 832, 896, 960, 1024, 1280, 1536, 1792, 2048, 2304, 2560, 2816, 3072, 3328, 3584, 3840, 4096, 4608, 5120, 5632, 6144, 6656, 7168, 7680, 8192], piecewise_cuda_graph_compiler='eager', torchao_config='', enable_nan_detection=False, enable_p2p_check=False, triton_attention_reduce_in_fp32=False, triton_attention_num_kv_splits=8, triton_attention_split_tile_size=None, num_continuous_decode_steps=1, delete_ckpt_after_loading=False, enable_memory_saver=False, enable_weights_cpu_backup=False, enable_draft_weights_cpu_backup=False, allow_auto_truncate=False, enable_custom_logit_processor=False, flashinfer_mla_disable_ragged=False, disable_shared_experts_fusion=False, disable_chunked_prefix_cache=False, disable_fast_image_processor=False, keep_mm_feature_on_device=False, enable_return_hidden_states=False, enable_return_routed_experts=False, scheduler_recv_interval=1, numa_node=None, enable_deterministic_inference=False, rl_on_policy_target=None, enable_attn_tp_input_scattered=False, enable_nsa_prefill_context_parallel=False, nsa_prefill_cp_mode='round-robin-split', enable_fused_qk_norm_rope=False, enable_precise_embedding_interpolation=False, enable_fused_moe_sum_all_reduce=False, enable_dynamic_batch_tokenizer=False, dynamic_batch_tokenizer_batch_size=32, dynamic_batch_tokenizer_batch_timeout=0.002, debug_tensor_dump_output_folder=None, debug_tensor_dump_layers=None, debug_tensor_dump_input_file=None, debug_tensor_dump_inject=False, disaggregation_mode='null', disaggregation_transfer_backend='mooncake', disaggregation_bootstrap_port=8998, 
disaggregation_ib_device=None, disaggregation_decode_enable_offload_kvcache=False, num_reserved_decode_tokens=512, disaggregation_decode_polling_interval=1, encoder_only=False, language_only=False, encoder_transfer_backend='zmq_to_scheduler', encoder_urls=[], enable_adaptive_dispatch_to_encoder=False, custom_weight_loader=[], weight_loader_disable_mmap=False, remote_instance_weight_loader_seed_instance_ip=None, remote_instance_weight_loader_seed_instance_service_port=None, remote_instance_weight_loader_send_weights_group_ports=None, remote_instance_weight_loader_backend='nccl', remote_instance_weight_loader_start_seed_via_transfer_engine=False, enable_pdmux=False, pdmux_config_path=None, sm_group_num=8, mm_max_concurrent_calls=32, mm_per_request_timeout=10.0, enable_broadcast_mm_inputs_process=False, enable_prefix_mm_cache=False, mm_enable_dp_encoder=False, mm_process_config={}, limit_mm_data_per_request=None, enable_mm_global_cache=False, decrypted_config_file=None, decrypted_draft_config_file=None, forward_hooks=None)
+[2026-03-07 15:24:15] Using default HuggingFace chat template with detected content format: string
+[2026-03-07 15:24:25 TP2] Mamba selective_state_update backend initialized: triton
+[2026-03-07 15:24:25 TP2] Init torch distributed begin.
+[2026-03-07 15:24:26 TP0] Mamba selective_state_update backend initialized: triton
+[2026-03-07 15:24:26 TP0] Init torch distributed begin.
+[2026-03-07 15:24:26 TP3] Mamba selective_state_update backend initialized: triton
+[2026-03-07 15:24:26 TP1] Mamba selective_state_update backend initialized: triton
+[2026-03-07 15:24:26 TP3] Init torch distributed begin.
+[2026-03-07 15:24:26 TP1] Init torch distributed begin.
+[Gloo] Rank 1 is connected to 3 peer ranks. Expected number of connected peer ranks is : 3
+[Gloo] Rank 0 is connected to 3 peer ranks. Expected number of connected peer ranks is : 3
+[Gloo] Rank 3 is connected to 3 peer ranks. Expected number of connected peer ranks is : 3
+[Gloo] Rank 2 is connected to 3 peer ranks. Expected number of connected peer ranks is : 3
+[Gloo] Rank 0 is connected to 3 peer ranks. Expected number of connected peer ranks is : 3
+[Gloo] Rank 2 is connected to 3 peer ranks. Expected number of connected peer ranks is : 3
+[Gloo] Rank 1 is connected to 3 peer ranks. Expected number of connected peer ranks is : 3
+[Gloo] Rank 3 is connected to 3 peer ranks. Expected number of connected peer ranks is : 3
+[2026-03-07 15:24:27 TP0] sglang is using nccl==2.27.5
+[2026-03-07 15:24:29 TP0] Scheduler hit an exception: Traceback (most recent call last):
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/scheduler.py", line 3239, in run_scheduler_process
+ scheduler = Scheduler(
+ ^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/scheduler.py", line 365, in __init__
+ self.init_model_worker()
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/scheduler.py", line 561, in init_model_worker
+ self.init_tp_model_worker()
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/scheduler.py", line 519, in init_tp_model_worker
+ self.tp_worker = TpModelWorker(
+ ^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/tp_worker.py", line 258, in __init__
+ self._init_model_runner()
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/tp_worker.py", line 341, in _init_model_runner
+ self._model_runner = ModelRunner(
+ ^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/model_executor/model_runner.py", line 395, in __init__
+ pre_model_load_memory = self.init_torch_distributed()
+ ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/model_executor/model_runner.py", line 813, in init_torch_distributed
+ initialize_model_parallel(
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/parallel_state.py", line 1764, in initialize_model_parallel
+ _TP = init_model_parallel_group(
+ ^^^^^^^^^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/parallel_state.py", line 1450, in init_model_parallel_group
+ return GroupCoordinator(
+ ^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/parallel_state.py", line 357, in __init__
+ self.pynccl_comm = PyNcclCommunicator(
+ ^^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/device_communicators/pynccl.py", line 113, in __init__
+ self.comm: ncclComm_t = self.nccl.ncclCommInitRank(
+ ^^^^^^^^^^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/device_communicators/pynccl_wrapper.py", line 401, in ncclCommInitRank
+ self.NCCL_CHECK(
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/device_communicators/pynccl_wrapper.py", line 376, in NCCL_CHECK
+ raise RuntimeError(f"NCCL error: {error_str}")
+RuntimeError: NCCL error: unhandled system error (run with NCCL_DEBUG=INFO for details)
+
+[2026-03-07 15:24:29] Received sigquit from a child process. It usually means the child failed.
+[2026-03-07 15:24:29 TP2] Scheduler hit an exception: Traceback (most recent call last):
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/scheduler.py", line 3239, in run_scheduler_process
+ scheduler = Scheduler(
+ ^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/scheduler.py", line 365, in __init__
+ self.init_model_worker()
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/scheduler.py", line 561, in init_model_worker
+ self.init_tp_model_worker()
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/scheduler.py", line 519, in init_tp_model_worker
+ self.tp_worker = TpModelWorker(
+ ^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/tp_worker.py", line 258, in __init__
+ self._init_model_runner()
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/tp_worker.py", line 341, in _init_model_runner
+ self._model_runner = ModelRunner(
+ ^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/model_executor/model_runner.py", line 395, in __init__
+ pre_model_load_memory = self.init_torch_distributed()
+ ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/model_executor/model_runner.py", line 813, in init_torch_distributed
+ initialize_model_parallel(
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/parallel_state.py", line 1764, in initialize_model_parallel
+ _TP = init_model_parallel_group(
+ ^^^^^^^^^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/parallel_state.py", line 1450, in init_model_parallel_group
+ return GroupCoordinator(
+ ^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/parallel_state.py", line 357, in __init__
+ self.pynccl_comm = PyNcclCommunicator(
+ ^^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/device_communicators/pynccl.py", line 113, in __init__
+ self.comm: ncclComm_t = self.nccl.ncclCommInitRank(
+ ^^^^^^^^^^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/device_communicators/pynccl_wrapper.py", line 401, in ncclCommInitRank
+ self.NCCL_CHECK(
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/device_communicators/pynccl_wrapper.py", line 376, in NCCL_CHECK
+ raise RuntimeError(f"NCCL error: {error_str}")
+RuntimeError: NCCL error: unhandled system error (run with NCCL_DEBUG=INFO for details)
+
+[2026-03-07 15:24:29 TP1] Scheduler hit an exception: Traceback (most recent call last):
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/scheduler.py", line 3239, in run_scheduler_process
+ scheduler = Scheduler(
+ ^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/scheduler.py", line 365, in __init__
+ self.init_model_worker()
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/scheduler.py", line 561, in init_model_worker
+ self.init_tp_model_worker()
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/scheduler.py", line 519, in init_tp_model_worker
+ self.tp_worker = TpModelWorker(
+ ^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/tp_worker.py", line 258, in __init__
+ self._init_model_runner()
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/tp_worker.py", line 341, in _init_model_runner
+ self._model_runner = ModelRunner(
+ ^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/model_executor/model_runner.py", line 395, in __init__
+ pre_model_load_memory = self.init_torch_distributed()
+ ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/model_executor/model_runner.py", line 813, in init_torch_distributed
+ initialize_model_parallel(
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/parallel_state.py", line 1764, in initialize_model_parallel
+ _TP = init_model_parallel_group(
+ ^^^^^^^^^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/parallel_state.py", line 1450, in init_model_parallel_group
+ return GroupCoordinator(
+ ^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/parallel_state.py", line 357, in __init__
+ self.pynccl_comm = PyNcclCommunicator(
+ ^^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/device_communicators/pynccl.py", line 113, in __init__
+ self.comm: ncclComm_t = self.nccl.ncclCommInitRank(
+ ^^^^^^^^^^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/device_communicators/pynccl_wrapper.py", line 401, in ncclCommInitRank
+ self.NCCL_CHECK(
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/device_communicators/pynccl_wrapper.py", line 376, in NCCL_CHECK
+ raise RuntimeError(f"NCCL error: {error_str}")
+RuntimeError: NCCL error: unhandled system error (run with NCCL_DEBUG=INFO for details)
+
+[2026-03-07 15:24:29] Received sigquit from a child process. It usually means the child failed.
+[2026-03-07 15:24:29] Received sigquit from a child process. It usually means the child failed.
+[2026-03-07 15:24:29 TP3] Scheduler hit an exception: Traceback (most recent call last):
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/scheduler.py", line 3239, in run_scheduler_process
+ scheduler = Scheduler(
+ ^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/scheduler.py", line 365, in __init__
+ self.init_model_worker()
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/scheduler.py", line 561, in init_model_worker
+ self.init_tp_model_worker()
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/scheduler.py", line 519, in init_tp_model_worker
+ self.tp_worker = TpModelWorker(
+ ^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/tp_worker.py", line 258, in __init__
+ self._init_model_runner()
+ File "/workspace/hanrui/sglang/python/sglang/srt/managers/tp_worker.py", line 341, in _init_model_runner
+ self._model_runner = ModelRunner(
+ ^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/model_executor/model_runner.py", line 395, in __init__
+ pre_model_load_memory = self.init_torch_distributed()
+ ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/model_executor/model_runner.py", line 813, in init_torch_distributed
+ initialize_model_parallel(
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/parallel_state.py", line 1764, in initialize_model_parallel
+ _TP = init_model_parallel_group(
+ ^^^^^^^^^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/parallel_state.py", line 1450, in init_model_parallel_group
+ return GroupCoordinator(
+ ^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/parallel_state.py", line 357, in __init__
+ self.pynccl_comm = PyNcclCommunicator(
+ ^^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/device_communicators/pynccl.py", line 113, in __init__
+ self.comm: ncclComm_t = self.nccl.ncclCommInitRank(
+ ^^^^^^^^^^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/device_communicators/pynccl_wrapper.py", line 401, in ncclCommInitRank
+ self.NCCL_CHECK(
+ File "/workspace/hanrui/sglang/python/sglang/srt/distributed/device_communicators/pynccl_wrapper.py", line 376, in NCCL_CHECK
+ raise RuntimeError(f"NCCL error: {error_str}")
+RuntimeError: NCCL error: unhandled system error (run with NCCL_DEBUG=INFO for details)
+
+[2026-03-07 15:24:29] Received sigquit from a child process. It usually means the child failed.
diff --git a/syxin_old/step1.md b/syxin_old/step1.md
new file mode 100644
index 0000000000000000000000000000000000000000..76984c1000dac6765c033cca50a23deb199fe06d
--- /dev/null
+++ b/syxin_old/step1.md
@@ -0,0 +1,139 @@
+Now I have a complete picture. Here's the full analysis and proposed plan.
+
+ ---
+ Current Logic of train_dflash.py
+
+ This script trains a small, standalone DFlash draft model (1–10 transformer layers) that learns to predict token blocks in parallel,
+ guided by hidden states extracted from a frozen target model.
+
+ Architecture (two separate models)
+
+ 1. Target model (frozen, e.g. Qwen3-8B/32B) — runs a full forward pass to produce hidden states at selected layers.
+ 2. Draft model (DFlashDraftModel, ~1–10 layers) — a lightweight Qwen3-based decoder that takes noise embeddings + target hidden states
+ and predicts the block tokens.
+ 3. Target embed_tokens + lm_head — loaded separately via TargetEmbeddingsAndHead to avoid duplicating the full target model in memory.
+
+ Key locations
+
+ ┌──────────────────────────┬────────────────────────────────────┬───────────────────────────────────────────────────────┐
+ │ Component │ File │ Lines │
+ ├──────────────────────────┼────────────────────────────────────┼───────────────────────────────────────────────────────┤
+ │ Model init │ scripts/train_dflash.py │ build_models() L254–311 │
+ ├──────────────────────────┼────────────────────────────────────┼───────────────────────────────────────────────────────┤
+ │ Target hidden extraction │ scripts/train_dflash.py │ L644–647 (target_model.generate_dflash_data) │
+ ├──────────────────────────┼────────────────────────────────────┼───────────────────────────────────────────────────────┤
+ │ Forward pass │ specforge/core/dflash.py │ OnlineDFlashModel.forward() L243–332 │
+ ├──────────────────────────┼────────────────────────────────────┼───────────────────────────────────────────────────────┤
+ │ Loss calculation │ specforge/core/dflash.py │ _full_lm_loss() L382–417, _chunked_lm_loss() L419–478 │
+ ├──────────────────────────┼────────────────────────────────────┼───────────────────────────────────────────────────────┤
+ │ Loss mask │ specforge/core/dflash.py │ create_dflash_loss_mask() L481–509 │
+ ├──────────────────────────┼────────────────────────────────────┼───────────────────────────────────────────────────────┤
+ │ Draft model architecture │ specforge/modeling/draft/dflash.py │ DFlashDraftModel L212–266 │
+ ├──────────────────────────┼────────────────────────────────────┼───────────────────────────────────────────────────────┤
+ │ DFlash attention │ specforge/modeling/draft/dflash.py │ Qwen3DFlashAttention L42–134 │
+ └──────────────────────────┴────────────────────────────────────┴───────────────────────────────────────────────────────┘
+
+ Forward pass flow (per training step)
+
+ input_ids, attention_mask, loss_mask → target_model.generate_dflash_data()
+ ↓
+ hidden_states (from target layers [1,9,17,25,33])
+ ↓
+ OnlineDFlashModel.forward():
+ 1. Truncate to block boundary
+ 2. prepare_noise_input(): anchor tokens kept, rest → MASK
+ 3. embed_tokens(noise_input_ids) → noise_embedding
+ 4. Build DFlash attention mask (flex_attention or additive)
+ 5. draft_model(noise_embedding, target_hidden, mask)
+ 6. lm_head(hidden) → logits
+ 7. CE loss on non-anchor positions (weighted by loss_mask × decay)
+
+ The draft model's custom Qwen3DFlashAttention concatenates [context_hidden, noise_hidden] as KV, with queries only from noise tokens. The
+ attention mask enforces that block tokens see the context of all preceding blocks and attend bidirectionally within their own block.
+
+ ---
+ What already exists: train_dflash_lora.py
+
+ Interestingly, the repo already has a LoRA variant at scripts/train_dflash_lora.py with its own model (DFlashLoRADraftModel) and wrapper
+ (OnlineDFlashLoRAModel). This is exactly the approach you described — Qwen3-8B + LoRA, no separate target model, 1-step diffusion
+ training. The key differences from train_dflash.py:
+
+ ┌─────────────────┬─────────────────────────────────────────────────────────────┬────────────────────────────────────────────────────┐
+ │ Aspect │ train_dflash.py │ train_dflash_lora.py │
+ ├─────────────────┼─────────────────────────────────────────────────────────────┼────────────────────────────────────────────────────┤
+ │ Draft model │ Small custom DFlashDraftModel (1–10 layers) │ Full Qwen3-8B + LoRA adapters │
+ ├─────────────────┼─────────────────────────────────────────────────────────────┼────────────────────────────────────────────────────┤
+ │ Target model │ Separate frozen model for hidden state extraction │ None — model uses its own representations │
+ ├─────────────────┼─────────────────────────────────────────────────────────────┼────────────────────────────────────────────────────┤
+ │ Attention │ Custom Qwen3DFlashAttention (Q from noise, KV from [ctx, │ Standard HF attention with 4D additive DFlash mask │
+ │ │ noise]) │ │
+ ├─────────────────┼─────────────────────────────────────────────────────────────┼────────────────────────────────────────────────────┤
+ │ Forward │ draft_model(noise_emb, target_hidden, mask) │ model(noise_input_ids, 4d_mask, position_ids) → │
+ │ │ │ logits │
+ ├─────────────────┼─────────────────────────────────────────────────────────────┼────────────────────────────────────────────────────┤
+ │ Trainable │ All draft model params │ Only LoRA (q/k/v/o_proj), base frozen │
+ │ params │ │ │
+ ├─────────────────┼─────────────────────────────────────────────────────────────┼────────────────────────────────────────────────────┤
+ │ FSDP strategy │ SHARD_GRAD_OP │ FULL_SHARD │
+ └─────────────────┴─────────────────────────────────────────────────────────────┴────────────────────────────────────────────────────┘
+
+ ---
+ Proposed Modification Plan
+
+ Since train_dflash_lora.py already implements the core idea, the plan focuses on what's missing or needs improvement to make it a proper
+ "1-step dLLM draft model" for your research:
+
+ Phase 1: Validate and extend the existing LoRA pipeline
+
+ 1. Add MLP to LoRA targets — The current config only targets q_proj, k_proj, v_proj, o_proj. For stronger 1-step diffusion capability,
+ add gate_proj, up_proj, down_proj to lora_target_modules. This gives the model more capacity to learn the non-autoregressive distribution
+ shift.
+ 2. Add multi-step noise schedule support — Currently the training is strictly 1-step (all non-anchors → MASK). For a proper diffusion/AR
+ fusion, add an option for a noise schedule where a fraction of block tokens are revealed (not just the anchor), controlled by a
+ noise_ratio parameter. This would modify prepare_noise_input() in OnlineDFlashLoRAModel:
+ # Instead of: all non-anchor → MASK
+ # Allow: randomly keep some non-anchor tokens with probability (1 - noise_ratio)
+ 3. Add configurable context_len strategy — Currently context_len=0 treats the whole sequence as blocks. Add a --context-ratio arg that
+ dynamically sets context_len as a fraction of the sequence, so the model learns to condition on varying amounts of AR-decoded prefix.
+
+ Phase 2: Training logic improvements
+
+ 4. Add KL divergence loss — In addition to CE loss against ground truth, add an optional KL loss against the base model's AR distribution
+ (teacher forcing). This regularizes the LoRA model to stay close to the original Qwen3-8B distribution. Modify
+ OnlineDFlashLoRAModel.forward():
+ # Compute base model logits (no_grad, no LoRA) as teacher
+ # KL(draft_logits || teacher_logits) on block positions
+ # total_loss = ce_loss + kl_weight * kl_loss
+ 5. Add evaluation with speculative decoding metrics — The current accuracy metric is block-wise acceptance rate. Add an eval loop that
+ actually runs speculative decoding (draft → verify) to measure real speedup, using the LoRA model as the drafter and the base model (with
+ LoRA disabled) as the verifier.
+
+ Phase 3: Integration with train_dflash.py style features
+
+ 6. Port random anchor sampling — train_dflash.py has --random-anchor (L147–156) which samples diverse anchor positions per sequence. This
+ is missing from the LoRA variant and would improve training diversity. Port _sample_anchor_positions and _build_blocks_from_anchors from
+ OnlineDFlashModel to OnlineDFlashLoRAModel.
+ 7. Port chunked lm_head — The LoRA variant materializes full [bsz, seq_len, vocab_size] logits. For Qwen3-8B's 152K vocab, this is ~1.2GB
+ per sample at seq_len=2048 in fp32 (~0.6GB in bf16). Port the _chunked_lm_loss from OnlineDFlashModel for memory efficiency.
+ 8. Add tensor parallelism support — The LoRA script currently forces tp_size=1. For Qwen3-8B on multi-GPU setups, add TP support to shard
+ the base model across GPUs while keeping LoRA params on each rank.
+
+ Minimal starting point
+
+ If you want to just get training running immediately, the existing train_dflash_lora.py + configs/qwen3-8b-dflash-lora.json should work
+ out of the box:
+
+ torchrun --nproc_per_node=4 scripts/train_dflash_lora.py \
+ --model-path Qwen/Qwen3-8B \
+ --lora-config configs/qwen3-8b-dflash-lora.json \
+ --train-data-path /path/to/data.jsonl \
+ --output-dir ./outputs/qwen3-8b-dflash-lora \
+ --block-size 16 \
+ --gradient-checkpointing \
+ --learning-rate 2e-4 \
+ --batch-size 1 \
+ --max-length 2048 \
+ --num-epochs 3
+
+ Want me to start implementing any of these phases? I'd suggest starting with Phase 1 (noise schedule + MLP targets) since that's the most
+ impactful for the diffusion/AR fusion research angle.
\ No newline at end of file
diff --git a/syxin_old/test_indist_tau.py b/syxin_old/test_indist_tau.py
new file mode 100644
index 0000000000000000000000000000000000000000..ecea421cadada3f9e6c6d0952a6c2e195593d880
--- /dev/null
+++ b/syxin_old/test_indist_tau.py
@@ -0,0 +1,162 @@
+#!/usr/bin/env python3
+"""Quick test: run spec_generate_inject on training-distribution data (8 GPU).
+Checks whether τ on in-distribution data matches the theoretical τ (~6) implied by the training accuracy (~33%).
+
+Usage:
+ /workspace/miniconda3/envs/dflash/bin/python3 -m torch.distributed.run \
+ --standalone --nproc_per_node 8 /workspace/hanrui/syxin_old/test_indist_tau.py
+"""
+import os, sys, random, warnings
+from itertools import chain
+import numpy as np
+import torch
+import torch.distributed as dist
+from transformers import AutoModelForCausalLM, AutoTokenizer
+from peft import PeftModel
+from tqdm import tqdm
+
+# Reuse spec_generate_inject from eval script
+sys.path.insert(0, "/workspace/hanrui/syxin_old")
+from eval_dflash_lora_inject import spec_generate_inject, MASK_TOKEN_ID, BLOCK_SIZE
+
+# Config: hard-coded paths and generation settings read by main().
+BASE_MODEL = "/workspace/models/Qwen3-8B"  # Tokenizer + target model; also the base for the adapter fallback.
+MERGED_PATH = "/workspace/hanrui/syxin_old/Specforge/outputs/qwen3-8b-dflash-lora-inject-merged"  # Preferred draft checkpoint; used only if this directory exists.
+ADAPTER_PATH = "/workspace/hanrui/syxin_old/Specforge/outputs/qwen3-8b-dflash-lora-inject/epoch_3_step_4644"  # LoRA adapter loaded when MERGED_PATH is missing.
+TRAIN_DATA = "/workspace/hanrui/datasets/Nemotron-CodeAlpaca-qwen3-8b-800K"  # Passed to datasets.load_dataset (split="train", streaming).
+NUM_SAMPLES = 80  # Examples kept after shuffling; 3x this many are read from the stream first.
+MAX_NEW_TOKENS = 512  # Forwarded as max_new_tokens to spec_generate_inject.
+TEMPERATURE = 0.0  # Forwarded as temperature; presumably 0.0 means greedy decoding - TODO confirm in spec_generate_inject.
+
+
+def dist_init():  # Initialise the default NCCL process group, but only when RANK is set in the environment.
+    if "RANK" not in os.environ:
+        return  # RANK unset: leave torch.distributed uninitialised.
+    dist.init_process_group(backend="nccl", init_method="env://")  # Rendezvous settings come from environment variables.
+
+def rank(): return int(os.environ.get("RANK", 0))  # Rank from the RANK env var; 0 when it is unset.
+def world(): return int(os.environ.get("WORLD_SIZE", 1))  # Process count from the WORLD_SIZE env var; 1 when it is unset.
+def local(): return int(os.environ.get("LOCAL_RANK", 0))  # Local rank from the LOCAL_RANK env var (used as the CUDA device index); 0 when unset.
+def is_main(): return rank() == 0  # True only on the process whose rank() is 0.
+
+def print0(*a, **kw):  # print() wrapper that emits only on rank 0; arguments are forwarded unchanged.
+    if is_main(): print(*a, **kw)
+
+
+def main():  # Run speculative decoding on training-set prompts (sharded by rank) and report mean acceptance length on rank 0.
+    random.seed(0); np.random.seed(0); torch.manual_seed(0); torch.cuda.manual_seed_all(0)  # Same fixed seed in every process.
+
+    dist_init()
+    torch.cuda.set_device(local())  # Bind this process to the GPU indexed by LOCAL_RANK.
+    device = torch.device(f"cuda:{local()}")
+
+    print0(f"Running on {world()} GPU(s)")
+
+    tokenizer = AutoTokenizer.from_pretrained(BASE_MODEL, trust_remote_code=True)
+    stop_token_ids = [tokenizer.eos_token_id]  # Only EOS is passed as a stop token.
+
+    print0("Loading target model...")
+    target_model = AutoModelForCausalLM.from_pretrained(
+        BASE_MODEL, torch_dtype=torch.bfloat16,
+        attn_implementation="sdpa", device_map=device, trust_remote_code=True,
+    )
+    target_model.eval()
+
+    print0("Loading draft model...")
+    if os.path.isdir(MERGED_PATH):  # Prefer an already-merged checkpoint when the directory exists.
+        draft_model = AutoModelForCausalLM.from_pretrained(
+            MERGED_PATH, torch_dtype=torch.bfloat16,
+            attn_implementation="sdpa", device_map=device, trust_remote_code=True,
+        )
+    else:  # Fallback: load the base model, attach the adapter, then merge it.
+        print0(f"Merged not found, loading base + adapter from {ADAPTER_PATH}")
+        draft_model = AutoModelForCausalLM.from_pretrained(
+            BASE_MODEL, torch_dtype=torch.bfloat16,
+            attn_implementation="sdpa", device_map=device, trust_remote_code=True,
+        )
+        draft_model = PeftModel.from_pretrained(draft_model, ADAPTER_PATH)
+        draft_model = draft_model.merge_and_unload()  # Keep the model returned by PEFT's merge_and_unload().
+    draft_model.eval()
+
+    # Stream the training set and read only its first records (no full download to disk)
+    print0(f"Loading training data (streaming, {NUM_SAMPLES} samples)...")
+    from datasets import load_dataset  # Imported here rather than at module top.
+    ds_stream = load_dataset(TRAIN_DATA, split="train", streaming=True)
+    candidates = []
+    for ex in ds_stream:
+        candidates.append(ex)
+        if len(candidates) >= NUM_SAMPLES * 3:  # Stop after 3x NUM_SAMPLES records; NOTE(review): pool is the head of the stream only.
+            break
+    random.shuffle(candidates)  # Uses the `random` module seeded with 0 above.
+    candidates = candidates[:NUM_SAMPLES]
+
+    # Shard samples across processes: this rank takes indices rank(), rank()+world(), ...
+    my_indices = list(range(rank(), len(candidates), world()))
+    results = []  # One list of acceptance lengths per processed sample.
+
+    iterator = tqdm(my_indices, desc=f"[GPU{rank()}]", disable=not is_main())  # Progress bar shown on rank 0 only.
+    for idx in iterator:
+        ex = candidates[idx]
+        conversations = ex["conversations"]
+        messages = []
+        for turn in conversations:  # Build the prompt from non-empty system turns plus the first user turn.
+            if turn["role"] == "system" and turn["content"]:
+                messages.append({"role": "system", "content": turn["content"]})
+            elif turn["role"] == "user":
+                messages.append({"role": "user", "content": turn["content"]})
+                break  # Later turns are ignored.
+
+        if not any(m["role"] == "user" for m in messages):
+            continue  # No user turn found: skip this example.
+
+        input_text = tokenizer.apply_chat_template(
+            messages, tokenize=False, add_generation_prompt=True,
+            enable_thinking=False,  # Presumably disables the template's thinking mode - TODO confirm for this tokenizer.
+        )
+        input_ids = tokenizer.encode(input_text, return_tensors="pt").to(device)
+        if input_ids.shape[1] > 1024:
+            continue  # Skip prompts longer than 1024 tokens.
+
+        result = spec_generate_inject(
+            target_model=target_model, draft_model=draft_model,
+            input_ids=input_ids, max_new_tokens=MAX_NEW_TOKENS,
+            block_size=BLOCK_SIZE, mask_token_id=MASK_TOKEN_ID,
+            temperature=TEMPERATURE, stop_token_ids=stop_token_ids,
+        )
+
+        if result.acceptance_lengths:  # Samples with no recorded acceptance lengths are dropped.
+            avg_tau = np.mean(result.acceptance_lengths)
+            results.append(result.acceptance_lengths)
+            if is_main():
+                iterator.set_postfix(tau=f"{avg_tau:.2f}")  # Shows the latest sample's mean, not a running average.
+
+    # Gather every rank's per-sample lists onto rank 0
+    if dist.is_initialized():
+        if is_main():
+            gathered = [None] * world()  # One receive slot per rank.
+            dist.gather_object(results, gathered, dst=0)
+            all_results = list(chain(*gathered))  # Flatten per-rank lists into one list of per-sample lists.
+        else:
+            dist.gather_object(results, dst=0)  # Other ranks only send.
+            all_results = None
+    else:
+        all_results = results  # Process group not initialised: use local results directly.
+
+    if is_main() and all_results:  # NOTE(review): no dist.destroy_process_group() call appears before main() returns.
+        all_accept_lens = list(chain(*all_results))  # Every decode step from every sample.
+        overall_tau = np.mean(all_accept_lens)  # Mean over decode steps, so samples with more steps weigh more.
+        per_sample_tau = [np.mean(r) for r in all_results]  # Each sample's mean, later averaged with equal weight.
+        print(f"\n{'='*60}")
+        print(f"In-distribution τ = {overall_tau:.2f}")
+        print(f" Per-sample mean τ = {np.mean(per_sample_tau):.2f}")
+        print(f" N = {len(all_results)} samples, {len(all_accept_lens)} decode steps")
+        print(f"{'='*60}")
+        print(f"\nComparison:")  # The figures printed below are hard-coded literals, not computed in this script.
+        print(f" Training accuracy ~33% → theoretical τ ≈ 6")
+        print(f" GSM8K eval τ = 3.92")
+        print(f" HumanEval eval τ = 3.74")
+        print(f" MT-Bench eval τ = 3.32")
+
+
+if __name__ == "__main__":  # Run main() only when this file is executed as a script.
+    main()
diff --git a/syxin_old/train_dflash_lora_inject.log b/syxin_old/train_dflash_lora_inject.log
new file mode 100644
index 0000000000000000000000000000000000000000..4af7e198d9564fd7ae69e8eef1d792a3fdedcb10
--- /dev/null
+++ b/syxin_old/train_dflash_lora_inject.log
@@ -0,0 +1,105 @@
+nohup: ignoring input
+
+*****************************************
+Setting OMP_NUM_THREADS environment variable for each process to be 1 in default, to avoid your system being overloaded, please further tune the variable for optimal performance in your application as needed.
+*****************************************
+Set TORCH_CUDA_ARCH_LIST to 9.0
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+Set TORCH_CUDA_ARCH_LIST to 9.0
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+Set TORCH_CUDA_ARCH_LIST to 9.0
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+Set TORCH_CUDA_ARCH_LIST to 9.0
+Set TORCH_CUDA_ARCH_LIST to 9.0
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+Set TORCH_CUDA_ARCH_LIST to 9.0
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+Set TORCH_CUDA_ARCH_LIST to 9.0
+Set TORCH_CUDA_ARCH_LIST to 9.0
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+`torch_dtype` is deprecated! Use `dtype` instead!
+`torch_dtype` is deprecated! Use `dtype` instead!
+`torch_dtype` is deprecated! Use `dtype` instead!
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+`torch_dtype` is deprecated! Use `dtype` instead!
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+`torch_dtype` is deprecated! Use `dtype` instead!
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+`torch_dtype` is deprecated! Use `dtype` instead!
+`torch_dtype` is deprecated! Use `dtype` instead!
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+`torch_dtype` is deprecated! Use `dtype` instead!
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 20%|██ | 1/5 [00:14<00:57, 14.33s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:14<00:57, 14.44s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:14<00:57, 14.38s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:14<00:57, 14.38s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:14<00:57, 14.38s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:14<00:57, 14.40s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:14<00:57, 14.40s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:14<00:57, 14.40s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:29<00:43, 14.57s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:29<00:43, 14.64s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:29<00:43, 14.65s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:29<00:44, 14.67s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:29<00:44, 14.67s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:29<00:43, 14.65s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:29<00:43, 14.64s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:29<00:43, 14.64s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:42<00:28, 14.18s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:42<00:28, 14.23s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:42<00:28, 14.25s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:42<00:28, 14.23s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:42<00:28, 14.23s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:42<00:28, 14.23s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:42<00:28, 14.23s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:43<00:28, 14.24s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:54<00:13, 13.12s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:54<00:13, 13.16s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:54<00:13, 13.15s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:54<00:13, 13.16s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:54<00:13, 13.15s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:54<00:13, 13.18s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:54<00:13, 13.16s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:54<00:13, 13.17s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:58<00:00, 9.89s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:58<00:00, 11.71s/it]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:58<00:00, 9.90s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:58<00:00, 9.89s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:58<00:00, 9.89s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:58<00:00, 9.90s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:58<00:00, 11.73s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:58<00:00, 9.90s/it]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:58<00:00, 11.71s/it]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:58<00:00, 11.71s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:58<00:00, 11.72s/it]
+
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:58<00:00, 11.71s/it]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:58<00:00, 9.90s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:58<00:00, 9.91s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:58<00:00, 11.72s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:58<00:00, 11.72s/it]
+
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 133.79it/s]
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 141.08it/s]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 139.70it/s]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 138.93it/s]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 139.16it/s]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 137.91it/s]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 141.85it/s]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 142.03it/s]
+trainable params: 15,335,424 || all params: 8,206,070,784 || trainable%: 0.1869
+trainable params: 15,335,424 || all params: 8,206,070,784 || trainable%: 0.1869
+trainable params: 15,335,424 || all params: 8,206,070,784 || trainable%: 0.1869
+trainable params: 15,335,424 || all params: 8,206,070,784 || trainable%: 0.1869
+trainable params: 15,335,424 || all params: 8,206,070,784 || trainable%: 0.1869
+trainable params: 15,335,424 || all params: 8,206,070,784 || trainable%: 0.1869trainable params: 15,335,424 || all params: 8,206,070,784 || trainable%: 0.1869trainable params: 15,335,424 || all params: 8,206,070,784 || trainable%: 0.1869
+
+
+dataset is cached at /tmp/specforge_cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkl
+/workspace/hanrui/specforge/lib/python3.11/site-packages/torch/distributed/distributed_c10d.py:4876: UserWarning: barrier(): using the device under current context. You can specify `device_id` in `init_process_group` to mute this warning.
+ warnings.warn( # warn only once
+[rank0]:[W310 14:11:14.955842453 ProcessGroupNCCL.cpp:5072] Guessing device ID based on global rank. This can cause a hang if rank to GPU mapping is heterogeneous. You can specify device_id in init_process_group()
+dataset is cached at /tmp/specforge_cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkl
+dataset is cached at /tmp/specforge_cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkldataset is cached at /tmp/specforge_cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkl
+
+dataset is cached at /tmp/specforge_cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkl
+dataset is cached at /tmp/specforge_cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkl
+dataset is cached at /tmp/specforge_cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkl
+dataset is cached at /tmp/specforge_cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkl
+
Epoch 0: 0%| | 0/12384 [00:00, ?it/s]
Epoch 0: 0%| | 0/12384 [00:08, ?it/s, loss=11.4616, acc=0.0002, iter_time=7.92s]
Epoch 0: 0%| | 1/12384 [00:08<28:43:37, 8.35s/it, loss=11.4616, acc=0.0002, iter_time=7.92s]
Epoch 0: 0%| | 1/12384 [00:15<28:43:37, 8.35s/it, loss=10.6726, acc=0.0003, iter_time=6.45s]
Epoch 0: 0%| | 2/12384 [00:15<27:16:28, 7.93s/it, loss=10.6726, acc=0.0003, iter_time=6.45s]
Epoch 0: 0%| | 2/12384 [00:23<27:16:28, 7.93s/it, loss=10.4985, acc=0.0011, iter_time=8.83s]
Epoch 0: 0%| | 3/12384 [00:23<26:49:06, 7.80s/it, loss=10.4985, acc=0.0011, iter_time=8.83s]
Epoch 0: 0%| | 3/12384 [00:31<26:49:06, 7.80s/it, loss=12.4512, acc=0.0002, iter_time=4.59s]
Epoch 0: 0%| | 4/12384 [00:31<26:35:32, 7.73s/it, loss=12.4512, acc=0.0002, iter_time=4.59s]
Epoch 0: 0%| | 4/12384 [00:38<26:35:32, 7.73s/it, loss=10.6913, acc=0.0007, iter_time=10.67s]
Epoch 0: 0%| | 5/12384 [00:38<26:31:19, 7.71s/it, loss=10.6913, acc=0.0007, iter_time=10.67s]
Epoch 0: 0%| | 5/12384 [00:46<26:31:19, 7.71s/it, loss=10.7935, acc=0.0006, iter_time=7.68s]
Epoch 0: 0%| | 6/12384 [00:46<26:24:50, 7.68s/it, loss=10.7935, acc=0.0006, iter_time=7.68s]
Epoch 0: 0%| | 6/12384 [00:54<26:24:50, 7.68s/it, loss=12.5651, acc=0.0002, iter_time=7.66s]
Epoch 0: 0%| | 7/12384 [00:55<27:51:06, 8.10s/it, loss=12.5651, acc=0.0002, iter_time=7.66s]
Epoch 0: 0%| | 7/12384 [01:03<27:51:06, 8.10s/it, loss=11.6807, acc=0.0003, iter_time=9.57s]
Epoch 0: 0%| | 8/12384 [01:03<27:33:41, 8.02s/it, loss=11.6807, acc=0.0003, iter_time=9.57s]
Epoch 0: 0%| | 8/12384 [01:10<27:33:41, 8.02s/it, loss=11.3781, acc=0.0005, iter_time=4.95s]
Epoch 0: 0%| | 9/12384 [01:10<27:07:50, 7.89s/it, loss=11.3781, acc=0.0005, iter_time=4.95s]
Epoch 0: 0%| | 9/12384 [01:19<27:07:50, 7.89s/it, loss=10.5337, acc=0.0003, iter_time=10.22s]
Epoch 0: 0%| | 10/12384 [01:19<28:17:39, 8.23s/it, loss=10.5337, acc=0.0003, iter_time=10.22s]
Epoch 0: 0%| | 10/12384 [01:27<28:17:39, 8.23s/it, loss=11.6155, acc=0.0004, iter_time=8.66s]
Epoch 0: 0%| | 11/12384 [01:27<27:40:25, 8.05s/it, loss=11.6155, acc=0.0004, iter_time=8.66s]
Epoch 0: 0%| | 11/12384 [01:35<27:40:25, 8.05s/it, loss=11.2007, acc=0.0002, iter_time=7.63s]
Epoch 0: 0%| | 12/12384 [01:35<27:12:13, 7.92s/it, loss=11.2007, acc=0.0002, iter_time=7.63s]
Epoch 0: 0%| | 12/12384 [01:42<27:12:13, 7.92s/it, loss=11.8506, acc=0.0011, iter_time=5.00s]
Epoch 0: 0%| | 13/12384 [01:42<26:53:01, 7.82s/it, loss=11.8506, acc=0.0011, iter_time=5.00s]
Epoch 0: 0%| | 13/12384 [01:50<26:53:01, 7.82s/it, loss=12.6669, acc=0.0004, iter_time=8.51s]
Epoch 0: 0%| | 14/12384 [01:50<26:40:21, 7.76s/it, loss=12.6669, acc=0.0004, iter_time=8.51s]
Epoch 0: 0%| | 14/12384 [01:58<26:40:21, 7.76s/it, loss=11.3247, acc=0.0002, iter_time=9.33s]
Epoch 0: 0%| | 15/12384 [01:58<26:31:55, 7.72s/it, loss=11.3247, acc=0.0002, iter_time=9.33s]
Epoch 0: 0%| | 15/12384 [02:05<26:31:55, 7.72s/it, loss=12.2029, acc=0.0000, iter_time=7.57s]
Epoch 0: 0%| | 16/12384 [02:05<26:24:10, 7.69s/it, loss=12.2029, acc=0.0000, iter_time=7.57s]
Epoch 0: 0%| | 16/12384 [02:13<26:24:10, 7.69s/it, loss=10.7728, acc=0.0003, iter_time=6.47s]
Epoch 0: 0%| | 17/12384 [02:13<26:20:17, 7.67s/it, loss=10.7728, acc=0.0003, iter_time=6.47s]
Epoch 0: 0%| | 17/12384 [02:20<26:20:17, 7.67s/it, loss=10.9697, acc=0.0001, iter_time=8.83s]
Epoch 0: 0%| | 18/12384 [02:20<26:17:02, 7.65s/it, loss=10.9697, acc=0.0001, iter_time=8.83s]
Epoch 0: 0%| | 18/12384 [02:28<26:17:02, 7.65s/it, loss=11.0639, acc=0.0002, iter_time=6.39s]
Epoch 0: 0%| | 19/12384 [02:28<26:17:41, 7.66s/it, loss=11.0639, acc=0.0002, iter_time=6.39s]
Epoch 0: 0%| | 19/12384 [02:36<26:17:41, 7.66s/it, loss=10.9894, acc=0.0011, iter_time=8.89s]
Epoch 0: 0%| | 20/12384 [02:36<26:17:04, 7.65s/it, loss=10.9894, acc=0.0011, iter_time=8.89s]
Epoch 0: 0%| | 20/12384 [02:43<26:17:04, 7.65s/it, loss=11.2999, acc=0.0000, iter_time=7.64s]
Epoch 0: 0%| | 21/12384 [02:43<26:13:37, 7.64s/it, loss=11.2999, acc=0.0000, iter_time=7.64s]
Epoch 0: 0%| | 21/12384 [02:51<26:13:37, 7.64s/it, loss=10.9248, acc=0.0007, iter_time=7.60s]
Epoch 0: 0%| | 22/12384 [02:51<26:12:19, 7.63s/it, loss=10.9248, acc=0.0007, iter_time=7.60s]
Epoch 0: 0%| | 22/12384 [02:59<26:12:19, 7.63s/it, loss=11.6886, acc=0.0004, iter_time=7.63s]
Epoch 0: 0%| | 23/12384 [02:59<26:10:42, 7.62s/it, loss=11.6886, acc=0.0004, iter_time=7.63s]
Epoch 0: 0%| | 23/12384 [03:06<26:10:42, 7.62s/it, loss=10.1440, acc=0.0008, iter_time=7.97s]
Epoch 0: 0%| | 24/12384 [03:06<26:09:29, 7.62s/it, loss=10.1440, acc=0.0008, iter_time=7.97s]
Epoch 0: 0%| | 24/12384 [03:14<26:09:29, 7.62s/it, loss=11.4346, acc=0.0007, iter_time=7.23s]
Epoch 0: 0%| | 25/12384 [03:14<26:08:22, 7.61s/it, loss=11.4346, acc=0.0007, iter_time=7.23s]
Epoch 0: 0%| | 25/12384 [03:21<26:08:22, 7.61s/it, loss=11.4066, acc=0.0004, iter_time=7.60s]
Epoch 0: 0%| | 26/12384 [03:21<26:07:20, 7.61s/it, loss=11.4066, acc=0.0004, iter_time=7.60s]
Epoch 0: 0%| | 26/12384 [03:29<26:07:20, 7.61s/it, loss=11.0379, acc=0.0009, iter_time=7.59s]
Epoch 0: 0%| | 27/12384 [03:29<26:05:48, 7.60s/it, loss=11.0379, acc=0.0009, iter_time=7.59s]
Epoch 0: 0%| | 27/12384 [03:37<26:05:48, 7.60s/it, loss=13.4660, acc=0.0000, iter_time=4.31s]
Epoch 0: 0%| | 28/12384 [03:37<26:07:08, 7.61s/it, loss=13.4660, acc=0.0000, iter_time=4.31s]
Epoch 0: 0%| | 28/12384 [03:44<26:07:08, 7.61s/it, loss=10.7066, acc=0.0000, iter_time=10.92s]
Epoch 0: 0%| | 29/12384 [03:44<26:09:12, 7.62s/it, loss=10.7066, acc=0.0000, iter_time=10.92s]
Epoch 0: 0%| | 29/12384 [03:52<26:09:12, 7.62s/it, loss=10.6313, acc=0.0007, iter_time=7.01s]
Epoch 0: 0%| | 30/12384 [03:52<26:08:45, 7.62s/it, loss=10.6313, acc=0.0007, iter_time=7.01s]
Epoch 0: 0%| | 30/12384 [03:59<26:08:45, 7.62s/it, loss=10.6740, acc=0.0005, iter_time=8.24s]
Epoch 0: 0%| | 31/12384 [03:59<26:09:23, 7.62s/it, loss=10.6740, acc=0.0005, iter_time=8.24s]
Epoch 0: 0%| | 31/12384 [04:07<26:09:23, 7.62s/it, loss=11.1384, acc=0.0004, iter_time=8.11s]
Epoch 0: 0%| | 32/12384 [04:07<26:15:35, 7.65s/it, loss=11.1384, acc=0.0004, iter_time=8.11s]
Epoch 0: 0%| | 32/12384 [04:15<26:15:35, 7.65s/it, loss=11.0637, acc=0.0006, iter_time=7.26s]
Epoch 0: 0%| | 33/12384 [04:15<26:13:39, 7.64s/it, loss=11.0637, acc=0.0006, iter_time=7.26s]
Epoch 0: 0%| | 33/12384 [04:22<26:13:39, 7.64s/it, loss=10.9383, acc=0.0015, iter_time=7.62s]
Epoch 0: 0%| | 34/12384 [04:22<26:11:32, 7.64s/it, loss=10.9383, acc=0.0015, iter_time=7.62s]
Epoch 0: 0%| | 34/12384 [04:30<26:11:32, 7.64s/it, loss=11.5278, acc=0.0016, iter_time=5.89s]
Epoch 0: 0%| | 35/12384 [04:30<26:11:41, 7.64s/it, loss=11.5278, acc=0.0016, iter_time=5.89s]
Epoch 0: 0%| | 35/12384 [04:38<26:11:41, 7.64s/it, loss=10.9104, acc=0.0004, iter_time=9.68s]
Epoch 0: 0%| | 36/12384 [04:38<26:30:08, 7.73s/it, loss=10.9104, acc=0.0004, iter_time=9.68s]
Epoch 0: 0%| | 36/12384 [04:46<26:30:08, 7.73s/it, loss=12.0855, acc=0.0006, iter_time=7.65s]
Epoch 0: 0%| | 37/12384 [04:46<26:43:56, 7.79s/it, loss=12.0855, acc=0.0006, iter_time=7.65s]
Epoch 0: 0%| | 37/12384 [04:54<26:43:56, 7.79s/it, loss=12.0048, acc=0.0010, iter_time=3.98s]
Epoch 0: 0%| | 38/12384 [04:54<26:35:41, 7.75s/it, loss=12.0048, acc=0.0010, iter_time=3.98s]
Epoch 0: 0%| | 38/12384 [05:01<26:35:41, 7.75s/it, loss=11.0767, acc=0.0005, iter_time=11.60s]
Epoch 0: 0%| | 39/12384 [05:01<26:28:09, 7.72s/it, loss=11.0767, acc=0.0005, iter_time=11.60s]
Epoch 0: 0%| | 39/12384 [05:09<26:28:09, 7.72s/it, loss=11.2619, acc=0.0001, iter_time=8.01s]
Epoch 0: 0%| | 40/12384 [05:09<26:20:58, 7.68s/it, loss=11.2619, acc=0.0001, iter_time=8.01s]
Epoch 0: 0%| | 40/12384 [05:17<26:20:58, 7.68s/it, loss=10.6736, acc=0.0005, iter_time=7.23s]
Epoch 0: 0%| | 41/12384 [05:17<26:17:47, 7.67s/it, loss=10.6736, acc=0.0005, iter_time=7.23s]
Epoch 0: 0%| | 41/12384 [05:24<26:17:47, 7.67s/it, loss=10.2685, acc=0.0005, iter_time=7.64s]
Epoch 0: 0%| | 42/12384 [05:24<26:13:42, 7.65s/it, loss=10.2685, acc=0.0005, iter_time=7.64s]
Epoch 0: 0%| | 42/12384 [05:32<26:13:42, 7.65s/it, loss=11.5057, acc=0.0001, iter_time=7.02s]
Epoch 0: 0%| | 43/12384 [05:32<26:12:05, 7.64s/it, loss=11.5057, acc=0.0001, iter_time=7.02s]
Epoch 0: 0%| | 43/12384 [05:39<26:12:05, 7.64s/it, loss=11.4146, acc=0.0005, iter_time=8.20s]
Epoch 0: 0%| | 44/12384 [05:39<26:09:31, 7.63s/it, loss=11.4146, acc=0.0005, iter_time=8.20s]
Epoch 0: 0%| | 44/12384 [05:47<26:09:31, 7.63s/it, loss=11.8327, acc=0.0000, iter_time=7.61s]
Epoch 0: 0%| | 45/12384 [05:47<26:09:00, 7.63s/it, loss=11.8327, acc=0.0000, iter_time=7.61s]
Epoch 0: 0%| | 45/12384 [05:55<26:09:00, 7.63s/it, loss=12.4940, acc=0.0009, iter_time=4.74s]
Epoch 0: 0%| | 46/12384 [05:55<26:07:01, 7.62s/it, loss=12.4940, acc=0.0009, iter_time=4.74s]
Epoch 0: 0%| | 46/12384 [06:02<26:07:01, 7.62s/it, loss=10.7219, acc=0.0009, iter_time=10.46s]
Epoch 0: 0%| | 47/12384 [06:02<26:05:45, 7.61s/it, loss=10.7219, acc=0.0009, iter_time=10.46s]
Epoch 0: 0%| | 47/12384 [06:10<26:05:45, 7.61s/it, loss=11.5296, acc=0.0005, iter_time=8.01s]
Epoch 0: 0%| | 48/12384 [06:10<26:04:55, 7.61s/it, loss=11.5296, acc=0.0005, iter_time=8.01s]
Epoch 0: 0%| | 48/12384 [06:17<26:04:55, 7.61s/it, loss=12.5215, acc=0.0004, iter_time=5.45s]
Epoch 0: 0%| | 49/12384 [06:17<26:08:27, 7.63s/it, loss=12.5215, acc=0.0004, iter_time=5.45s]
Epoch 0: 0%| | 49/12384 [06:25<26:08:27, 7.63s/it, loss=12.3765, acc=0.0006, iter_time=9.84s]
Epoch 0: 0%| | 50/12384 [06:25<26:07:12, 7.62s/it, loss=12.3765, acc=0.0006, iter_time=9.84s]
Epoch 0: 0%| | 50/12384 [06:33<26:07:12, 7.62s/it, loss=11.2575, acc=0.0005, iter_time=4.61s]
Epoch 0: 0%| | 51/12384 [06:33<26:07:42, 7.63s/it, loss=11.2575, acc=0.0005, iter_time=4.61s]
Epoch 0: 0%| | 51/12384 [06:40<26:07:42, 7.63s/it, loss=12.6789, acc=0.0005, iter_time=9.59s]
Epoch 0: 0%| | 52/12384 [06:40<26:07:14, 7.63s/it, loss=12.6789, acc=0.0005, iter_time=9.59s]
Epoch 0: 0%| | 52/12384 [06:48<26:07:14, 7.63s/it, loss=11.2759, acc=0.0006, iter_time=8.30s]
Epoch 0: 0%| | 53/12384 [06:48<26:07:22, 7.63s/it, loss=11.2759, acc=0.0006, iter_time=8.30s]
Epoch 0: 0%| | 53/12384 [06:56<26:07:22, 7.63s/it, loss=12.0094, acc=0.0004, iter_time=4.82s]
Epoch 0: 0%| | 54/12384 [06:56<26:05:27, 7.62s/it, loss=12.0094, acc=0.0004, iter_time=4.82s]
Epoch 0: 0%| | 54/12384 [07:03<26:05:27, 7.62s/it, loss=12.1372, acc=0.0006, iter_time=10.42s]
Epoch 0: 0%| | 55/12384 [07:03<26:06:51, 7.63s/it, loss=12.1372, acc=0.0006, iter_time=10.42s]
Epoch 0: 0%| | 55/12384 [07:11<26:06:51, 7.63s/it, loss=10.7949, acc=0.0001, iter_time=8.00s]
Epoch 0: 0%| | 56/12384 [07:11<26:11:18, 7.65s/it, loss=10.7949, acc=0.0001, iter_time=8.00s]
Epoch 0: 0%| | 56/12384 [07:19<26:11:18, 7.65s/it, loss=11.5858, acc=0.0005, iter_time=6.44s]
Epoch 0: 0%| | 57/12384 [07:19<26:11:14, 7.65s/it, loss=11.5858, acc=0.0005, iter_time=6.44s]
Epoch 0: 0%| | 57/12384 [07:26<26:11:14, 7.65s/it, loss=14.1049, acc=0.0005, iter_time=5.19s]
Epoch 0: 0%| | 58/12384 [07:26<26:10:11, 7.64s/it, loss=14.1049, acc=0.0005, iter_time=5.19s]
Epoch 0: 0%| | 58/12384 [07:34<26:10:11, 7.64s/it, loss=10.7898, acc=0.0008, iter_time=10.94s]
Epoch 0: 0%| | 59/12384 [07:34<26:09:02, 7.64s/it, loss=10.7898, acc=0.0008, iter_time=10.94s]
Epoch 0: 0%| | 59/12384 [07:41<26:09:02, 7.64s/it, loss=10.9025, acc=0.0003, iter_time=7.65s]
Epoch 0: 0%| | 60/12384 [07:41<26:07:16, 7.63s/it, loss=10.9025, acc=0.0003, iter_time=7.65s]
Epoch 0: 0%| | 60/12384 [07:49<26:07:16, 7.63s/it, loss=11.4171, acc=0.0004, iter_time=6.66s]
Epoch 0: 0%| | 61/12384 [07:49<26:08:20, 7.64s/it, loss=11.4171, acc=0.0004, iter_time=6.66s]
Epoch 0: 0%| | 61/12384 [07:57<26:08:20, 7.64s/it, loss=13.1503, acc=0.0002, iter_time=7.13s]
Epoch 0: 1%| | 62/12384 [07:57<26:27:30, 7.73s/it, loss=13.1503, acc=0.0002, iter_time=7.13s]
Epoch 0: 1%| | 62/12384 [08:05<26:27:30, 7.73s/it, loss=10.5598, acc=0.0006, iter_time=9.41s]
Epoch 0: 1%| | 63/12384 [08:05<26:19:16, 7.69s/it, loss=10.5598, acc=0.0006, iter_time=9.41s]
Epoch 0: 1%| | 63/12384 [08:12<26:19:16, 7.69s/it, loss=11.2138, acc=0.0007, iter_time=7.69s]
Epoch 0: 1%| | 64/12384 [08:12<26:15:54, 7.67s/it, loss=11.2138, acc=0.0007, iter_time=7.69s]
Epoch 0: 1%| | 64/12384 [08:20<26:15:54, 7.67s/it, loss=11.6299, acc=0.0006, iter_time=6.99s]
Epoch 0: 1%| | 65/12384 [08:20<26:13:51, 7.67s/it, loss=11.6299, acc=0.0006, iter_time=6.99s]
Epoch 0: 1%| | 65/12384 [08:27<26:13:51, 7.67s/it, loss=11.6998, acc=0.0006, iter_time=8.20s]
Epoch 0: 1%| | 66/12384 [08:27<26:10:27, 7.65s/it, loss=11.6998, acc=0.0006, iter_time=8.20s]
Epoch 0: 1%| | 66/12384 [08:35<26:10:27, 7.65s/it, loss=11.1124, acc=0.0009, iter_time=7.65s]
Epoch 0: 1%| | 67/12384 [08:35<26:09:40, 7.65s/it, loss=11.1124, acc=0.0009, iter_time=7.65s]
Epoch 0: 1%| | 67/12384 [08:43<26:09:40, 7.65s/it, loss=10.5870, acc=0.0003, iter_time=7.60s]
Epoch 0: 1%| | 68/12384 [08:43<26:06:52, 7.63s/it, loss=10.5870, acc=0.0003, iter_time=7.60s]
Epoch 0: 1%| | 68/12384 [08:50<26:06:52, 7.63s/it, loss=12.2968, acc=0.0002, iter_time=6.40s]
Epoch 0: 1%| | 69/12384 [08:50<26:07:45, 7.64s/it, loss=12.2968, acc=0.0002, iter_time=6.40s]
Epoch 0: 1%| | 69/12384 [08:58<26:07:45, 7.64s/it, loss=10.6622, acc=0.0003, iter_time=8.85s]
Epoch 0: 1%| | 70/12384 [08:58<26:07:55, 7.64s/it, loss=10.6622, acc=0.0003, iter_time=8.85s]
Epoch 0: 1%| | 70/12384 [09:06<26:07:55, 7.64s/it, loss=10.8811, acc=0.0005, iter_time=7.65s]
Epoch 0: 1%| | 71/12384 [09:06<26:07:24, 7.64s/it, loss=10.8811, acc=0.0005, iter_time=7.65s]
Epoch 0: 1%| | 71/12384 [09:13<26:07:24, 7.64s/it, loss=10.7392, acc=0.0006, iter_time=8.02s]
Epoch 0: 1%| | 72/12384 [09:13<26:05:47, 7.63s/it, loss=10.7392, acc=0.0006, iter_time=8.02s]
Epoch 0: 1%| | 72/12384 [09:21<26:05:47, 7.63s/it, loss=12.1961, acc=0.0007, iter_time=5.12s]
Epoch 0: 1%| | 73/12384 [09:21<26:08:08, 7.64s/it, loss=12.1961, acc=0.0007, iter_time=5.12s]
Epoch 0: 1%| | 73/12384 [09:29<26:08:08, 7.64s/it, loss=10.5526, acc=0.0004, iter_time=9.75s]
Epoch 0: 1%| | 74/12384 [09:29<26:06:34, 7.64s/it, loss=10.5526, acc=0.0004, iter_time=9.75s]
Epoch 0: 1%| | 74/12384 [09:36<26:06:34, 7.64s/it, loss=10.1922, acc=0.0006, iter_time=7.65s]
Epoch 0: 1%| | 75/12384 [09:36<26:08:22, 7.64s/it, loss=10.1922, acc=0.0006, iter_time=7.65s]
Epoch 0: 1%| | 75/12384 [09:44<26:08:22, 7.64s/it, loss=11.6403, acc=0.0000, iter_time=7.01s]
Epoch 0: 1%| | 76/12384 [09:44<26:05:04, 7.63s/it, loss=11.6403, acc=0.0000, iter_time=7.01s]
Epoch 0: 1%| | 76/12384 [09:51<26:05:04, 7.63s/it, loss=10.9350, acc=0.0004, iter_time=7.31s]
Epoch 0: 1%| | 77/12384 [09:51<26:03:29, 7.62s/it, loss=10.9350, acc=0.0004, iter_time=7.31s]
Epoch 0: 1%| | 77/12384 [09:59<26:03:29, 7.62s/it, loss=11.0107, acc=0.0003, iter_time=8.51s]
Epoch 0: 1%| | 78/12384 [09:59<26:01:53, 7.62s/it, loss=11.0107, acc=0.0003, iter_time=8.51s]
Epoch 0: 1%| | 78/12384 [10:07<26:01:53, 7.62s/it, loss=10.8719, acc=0.0004, iter_time=7.61s]
Epoch 0: 1%| | 79/12384 [10:07<26:01:22, 7.61s/it, loss=10.8719, acc=0.0004, iter_time=7.61s]
Epoch 0: 1%| | 79/12384 [10:14<26:01:22, 7.61s/it, loss=11.3606, acc=0.0013, iter_time=7.57s]
Epoch 0: 1%| | 80/12384 [10:14<26:01:58, 7.62s/it, loss=11.3606, acc=0.0013, iter_time=7.57s]
Epoch 0: 1%| | 80/12384 [10:22<26:01:58, 7.62s/it, loss=12.4500, acc=0.0004, iter_time=4.84s]
Epoch 0: 1%| | 81/12384 [10:22<26:01:47, 7.62s/it, loss=12.4500, acc=0.0004, iter_time=4.84s]
Epoch 0: 1%| | 81/12384 [10:29<26:01:47, 7.62s/it, loss=11.2265, acc=0.0006, iter_time=10.42s]
Epoch 0: 1%| | 82/12384 [10:29<26:01:16, 7.61s/it, loss=11.2265, acc=0.0006, iter_time=10.42s]
Epoch 0: 1%| | 82/12384 [10:37<26:01:16, 7.61s/it, loss=11.5241, acc=0.0009, iter_time=7.62s]
Epoch 0: 1%| | 83/12384 [10:37<25:59:49, 7.61s/it, loss=11.5241, acc=0.0009, iter_time=7.62s]
Epoch 0: 1%| | 83/12384 [10:45<25:59:49, 7.61s/it, loss=11.2920, acc=0.0005, iter_time=7.29s]
Epoch 0: 1%| | 84/12384 [10:45<26:01:26, 7.62s/it, loss=11.2920, acc=0.0005, iter_time=7.29s]
Epoch 0: 1%| | 84/12384 [10:52<26:01:26, 7.62s/it, loss=10.4827, acc=0.0003, iter_time=7.95s]
Epoch 0: 1%| | 85/12384 [10:52<26:01:02, 7.62s/it, loss=10.4827, acc=0.0003, iter_time=7.95s]
Epoch 0: 1%| | 85/12384 [11:00<26:01:02, 7.62s/it, loss=10.6120, acc=0.0000, iter_time=7.60s]
Epoch 0: 1%| | 86/12384 [11:00<26:00:28, 7.61s/it, loss=10.6120, acc=0.0000, iter_time=7.60s]
Epoch 0: 1%| | 86/12384 [11:08<26:00:28, 7.61s/it, loss=10.8524, acc=0.0007, iter_time=7.62s]
Epoch 0: 1%| | 87/12384 [11:08<26:00:45, 7.62s/it, loss=10.8524, acc=0.0007, iter_time=7.62s]
Epoch 0: 1%| | 87/12384 [11:15<26:00:45, 7.62s/it, loss=11.2721, acc=0.0003, iter_time=8.02s]
Epoch 0: 1%| | 88/12384 [11:15<26:00:34, 7.62s/it, loss=11.2721, acc=0.0003, iter_time=8.02s]
Epoch 0: 1%| | 88/12384 [11:23<26:00:34, 7.62s/it, loss=11.2253, acc=0.0007, iter_time=5.75s]
Epoch 0: 1%| | 89/12384 [11:23<26:20:59, 7.72s/it, loss=11.2253, acc=0.0007, iter_time=5.75s]
Epoch 0: 1%| | 89/12384 [11:31<26:20:59, 7.72s/it, loss=11.0977, acc=0.0007, iter_time=9.41s]
Epoch 0: 1%| | 90/12384 [11:31<26:14:47, 7.69s/it, loss=11.0977, acc=0.0007, iter_time=9.41s]
Epoch 0: 1%| | 90/12384 [11:38<26:14:47, 7.69s/it, loss=10.9589, acc=0.0001, iter_time=7.65s]
Epoch 0: 1%| | 91/12384 [11:38<26:10:44, 7.67s/it, loss=10.9589, acc=0.0001, iter_time=7.65s]
Epoch 0: 1%| | 91/12384 [11:46<26:10:44, 7.67s/it, loss=10.6815, acc=0.0009, iter_time=7.59s]
Epoch 0: 1%| | 92/12384 [11:46<26:07:41, 7.65s/it, loss=10.6815, acc=0.0009, iter_time=7.59s]
Epoch 0: 1%| | 92/12384 [11:54<26:07:41, 7.65s/it, loss=12.3931, acc=0.0003, iter_time=5.90s]
Epoch 0: 1%| | 93/12384 [11:54<26:05:34, 7.64s/it, loss=12.3931, acc=0.0003, iter_time=5.90s]
Epoch 0: 1%| | 93/12384 [12:01<26:05:34, 7.64s/it, loss=10.8815, acc=0.0004, iter_time=9.38s]
Epoch 0: 1%| | 94/12384 [12:01<26:05:19, 7.64s/it, loss=10.8815, acc=0.0004, iter_time=9.38s]
Epoch 0: 1%| | 94/12384 [12:09<26:05:19, 7.64s/it, loss=12.1400, acc=0.0006, iter_time=6.18s]
Epoch 0: 1%| | 95/12384 [12:09<26:03:45, 7.63s/it, loss=12.1400, acc=0.0006, iter_time=6.18s]
Epoch 0: 1%| | 95/12384 [12:16<26:03:45, 7.63s/it, loss=12.2851, acc=0.0003, iter_time=9.01s]
Epoch 0: 1%| | 96/12384 [12:16<26:02:36, 7.63s/it, loss=12.2851, acc=0.0003, iter_time=9.01s]
Epoch 0: 1%| | 96/12384 [12:24<26:02:36, 7.63s/it, loss=12.4757, acc=0.0002, iter_time=4.84s]
Epoch 0: 1%| | 97/12384 [12:24<26:03:13, 7.63s/it, loss=12.4757, acc=0.0002, iter_time=4.84s]
Epoch 0: 1%| | 97/12384 [12:32<26:03:13, 7.63s/it, loss=11.9545, acc=0.0002, iter_time=10.46s]
Epoch 0: 1%| | 98/12384 [12:32<26:00:56, 7.62s/it, loss=11.9545, acc=0.0002, iter_time=10.46s]
Epoch 0: 1%| | 98/12384 [12:39<26:00:56, 7.62s/it, loss=10.9790, acc=0.0004, iter_time=7.61s]
Epoch 0: 1%| | 99/12384 [12:39<26:00:48, 7.62s/it, loss=10.9790, acc=0.0004, iter_time=7.61s]
Epoch 0: 1%| | 99/12384 [12:47<26:00:48, 7.62s/it, loss=10.7841, acc=0.0000, iter_time=8.01s]
Epoch 0: 1%| | 100/12384 [12:47<25:59:42, 7.62s/it, loss=10.7841, acc=0.0000, iter_time=8.01s]
Epoch 0: 1%| | 100/12384 [12:55<25:59:42, 7.62s/it, loss=11.4378, acc=0.0003, iter_time=7.21s]
Epoch 0: 1%| | 101/12384 [12:55<25:59:07, 7.62s/it, loss=11.4378, acc=0.0003, iter_time=7.21s]
Epoch 0: 1%| | 101/12384 [13:02<25:59:07, 7.62s/it, loss=11.4611, acc=0.0003, iter_time=7.60s]
Epoch 0: 1%| | 102/12384 [13:02<25:58:42, 7.61s/it, loss=11.4611, acc=0.0003, iter_time=7.60s]
Epoch 0: 1%| | 102/12384 [13:10<25:58:42, 7.61s/it, loss=11.0371, acc=0.0003, iter_time=7.65s]
Epoch 0: 1%| | 103/12384 [13:10<25:59:00, 7.62s/it, loss=11.0371, acc=0.0003, iter_time=7.65s]
Epoch 0: 1%| | 103/12384 [13:17<25:59:00, 7.62s/it, loss=11.2041, acc=0.0004, iter_time=8.03s]
Epoch 0: 1%| | 104/12384 [13:17<26:00:48, 7.63s/it, loss=11.2041, acc=0.0004, iter_time=8.03s]
Epoch 0: 1%| | 104/12384 [13:25<26:00:48, 7.63s/it, loss=12.3050, acc=0.0006, iter_time=4.88s]
Epoch 0: 1%| | 105/12384 [13:25<26:00:20, 7.62s/it, loss=12.3050, acc=0.0006, iter_time=4.88s]
Epoch 0: 1%| | 105/12384 [13:33<26:00:20, 7.62s/it, loss=10.6289, acc=0.0004, iter_time=9.07s]
Epoch 0: 1%| | 106/12384 [13:33<26:04:00, 7.64s/it, loss=10.6289, acc=0.0004, iter_time=9.07s]
Epoch 0: 1%| | 106/12384 [13:40<26:04:00, 7.64s/it, loss=11.4028, acc=0.0003, iter_time=8.58s]
Epoch 0: 1%| | 107/12384 [13:40<26:09:01, 7.67s/it, loss=11.4028, acc=0.0003, iter_time=8.58s]
Epoch 0: 1%| | 107/12384 [13:48<26:09:01, 7.67s/it, loss=10.5002, acc=0.0008, iter_time=7.73s]
Epoch 0: 1%| | 108/12384 [13:48<26:05:12, 7.65s/it, loss=10.5002, acc=0.0008, iter_time=7.73s]
Epoch 0: 1%| | 108/12384 [13:56<26:05:12, 7.65s/it, loss=10.0314, acc=0.0009, iter_time=7.62s]
Epoch 0: 1%| | 109/12384 [13:56<26:03:52, 7.64s/it, loss=10.0314, acc=0.0009, iter_time=7.62s]
Epoch 0: 1%| | 109/12384 [14:03<26:03:52, 7.64s/it, loss=10.4425, acc=0.0003, iter_time=7.61s]
Epoch 0: 1%| | 110/12384 [14:03<26:01:06, 7.63s/it, loss=10.4425, acc=0.0003, iter_time=7.61s]
Epoch 0: 1%| | 110/12384 [14:11<26:01:06, 7.63s/it, loss=11.6140, acc=0.0005, iter_time=7.70s]
Epoch 0: 1%| | 111/12384 [14:11<26:05:44, 7.65s/it, loss=11.6140, acc=0.0005, iter_time=7.70s]
Epoch 0: 1%| | 111/12384 [14:19<26:05:44, 7.65s/it, loss=11.2666, acc=0.0000, iter_time=8.00s]
Epoch 0: 1%| | 112/12384 [14:19<26:03:37, 7.64s/it, loss=11.2666, acc=0.0000, iter_time=8.00s]
Epoch 0: 1%| | 112/12384 [14:26<26:03:37, 7.64s/it, loss=11.4732, acc=0.0005, iter_time=5.10s]
Epoch 0: 1%| | 113/12384 [14:26<26:00:29, 7.63s/it, loss=11.4732, acc=0.0005, iter_time=5.10s]
Epoch 0: 1%| | 113/12384 [14:34<26:00:29, 7.63s/it, loss=11.8465, acc=0.0004, iter_time=6.20s]
Epoch 0: 1%| | 114/12384 [14:34<25:57:26, 7.62s/it, loss=11.8465, acc=0.0004, iter_time=6.20s]
Epoch 0: 1%| | 114/12384 [14:41<25:57:26, 7.62s/it, loss=11.5433, acc=0.0006, iter_time=7.81s]
Epoch 0: 1%| | 115/12384 [14:41<25:57:11, 7.62s/it, loss=11.5433, acc=0.0006, iter_time=7.81s]
Epoch 0: 1%| | 115/12384 [14:49<25:57:11, 7.62s/it, loss=11.3701, acc=0.0004, iter_time=10.93s]
Epoch 0: 1%| | 116/12384 [14:49<26:19:34, 7.73s/it, loss=11.3701, acc=0.0004, iter_time=10.93s]
Epoch 0: 1%| | 116/12384 [14:57<26:19:34, 7.73s/it, loss=10.0672, acc=0.0009, iter_time=8.00s]
Epoch 0: 1%| | 117/12384 [14:57<26:13:07, 7.69s/it, loss=10.0672, acc=0.0009, iter_time=8.00s]
Epoch 0: 1%| | 117/12384 [15:05<26:13:07, 7.69s/it, loss=10.2971, acc=0.0002, iter_time=7.58s]
Epoch 0: 1%| | 118/12384 [15:05<26:08:30, 7.67s/it, loss=10.2971, acc=0.0002, iter_time=7.58s]
Epoch 0: 1%| | 118/12384 [15:12<26:08:30, 7.67s/it, loss=11.7278, acc=0.0002, iter_time=6.43s]
Epoch 0: 1%| | 119/12384 [15:12<26:05:23, 7.66s/it, loss=11.7278, acc=0.0002, iter_time=6.43s]
Epoch 0: 1%| | 119/12384 [15:20<26:05:23, 7.66s/it, loss=9.5484, acc=0.0020, iter_time=9.22s]
Epoch 0: 1%| | 120/12384 [15:20<26:02:54, 7.65s/it, loss=9.5484, acc=0.0020, iter_time=9.22s]
Epoch 0: 1%| | 120/12384 [15:28<26:02:54, 7.65s/it, loss=11.3585, acc=0.0003, iter_time=7.24s]
Epoch 0: 1%| | 121/12384 [15:28<26:00:32, 7.64s/it, loss=11.3585, acc=0.0003, iter_time=7.24s]
Epoch 0: 1%| | 121/12384 [15:35<26:00:32, 7.64s/it, loss=10.2829, acc=0.0015, iter_time=7.62s]
Epoch 0: 1%| | 122/12384 [15:35<25:59:56, 7.63s/it, loss=10.2829, acc=0.0015, iter_time=7.62s]
Epoch 0: 1%| | 122/12384 [15:43<25:59:56, 7.63s/it, loss=11.4828, acc=0.0000, iter_time=4.04s]
Epoch 0: 1%| | 123/12384 [15:43<25:58:02, 7.62s/it, loss=11.4828, acc=0.0000, iter_time=4.04s]
Epoch 0: 1%| | 123/12384 [15:50<25:58:02, 7.62s/it, loss=10.4930, acc=0.0008, iter_time=11.16s]
Epoch 0: 1%| | 124/12384 [15:50<25:56:40, 7.62s/it, loss=10.4930, acc=0.0008, iter_time=11.16s]
Epoch 0: 1%| | 124/12384 [15:58<25:56:40, 7.62s/it, loss=10.7814, acc=0.0002, iter_time=7.63s]
Epoch 0: 1%| | 125/12384 [15:58<25:55:20, 7.61s/it, loss=10.7814, acc=0.0002, iter_time=7.63s]
Epoch 0: 1%| | 125/12384 [16:06<25:55:20, 7.61s/it, loss=11.1825, acc=0.0004, iter_time=3.98s]
Epoch 0: 1%| | 126/12384 [16:06<26:00:15, 7.64s/it, loss=11.1825, acc=0.0004, iter_time=3.98s]
Epoch 0: 1%| | 126/12384 [16:13<26:00:15, 7.64s/it, loss=9.8605, acc=0.0010, iter_time=11.32s]
Epoch 0: 1%| | 127/12384 [16:13<25:58:58, 7.63s/it, loss=9.8605, acc=0.0010, iter_time=11.32s]
Epoch 0: 1%| | 127/12384 [16:21<25:58:58, 7.63s/it, loss=9.6568, acc=0.0017, iter_time=8.00s]
Epoch 0: 1%| | 128/12384 [16:21<25:58:26, 7.63s/it, loss=9.6568, acc=0.0017, iter_time=8.00s]
Epoch 0: 1%| | 128/12384 [16:28<25:58:26, 7.63s/it, loss=9.7294, acc=0.0003, iter_time=7.23s]
Epoch 0: 1%| | 129/12384 [16:28<25:57:21, 7.62s/it, loss=9.7294, acc=0.0003, iter_time=7.23s]
Epoch 0: 1%| | 129/12384 [16:36<25:57:21, 7.62s/it, loss=11.0125, acc=0.0008, iter_time=4.04s]
Epoch 0: 1%| | 130/12384 [16:36<25:56:17, 7.62s/it, loss=11.0125, acc=0.0008, iter_time=4.04s]
Epoch 0: 1%| | 130/12384 [16:44<25:56:17, 7.62s/it, loss=10.1296, acc=0.0012, iter_time=11.19s]
Epoch 0: 1%| | 131/12384 [16:44<25:56:05, 7.62s/it, loss=10.1296, acc=0.0012, iter_time=11.19s]
Epoch 0: 1%| | 131/12384 [16:51<25:56:05, 7.62s/it, loss=10.1372, acc=0.0007, iter_time=7.61s]
Epoch 0: 1%| | 132/12384 [16:51<25:55:28, 7.62s/it, loss=10.1372, acc=0.0007, iter_time=7.61s]
Epoch 0: 1%| | 132/12384 [16:59<25:55:28, 7.62s/it, loss=11.0524, acc=0.0005, iter_time=7.63s]
Epoch 0: 1%| | 133/12384 [16:59<25:55:34, 7.62s/it, loss=11.0524, acc=0.0005, iter_time=7.63s]
Epoch 0: 1%| | 133/12384 [17:07<25:55:34, 7.62s/it, loss=10.4664, acc=0.0001, iter_time=7.63s]
Epoch 0: 1%| | 134/12384 [17:07<25:56:00, 7.62s/it, loss=10.4664, acc=0.0001, iter_time=7.63s]
Epoch 0: 1%| | 134/12384 [17:14<25:56:00, 7.62s/it, loss=10.1932, acc=0.0002, iter_time=7.59s]
Epoch 0: 1%| | 135/12384 [17:14<25:53:51, 7.61s/it, loss=10.1932, acc=0.0002, iter_time=7.59s]
Epoch 0: 1%| | 135/12384 [17:22<25:53:51, 7.61s/it, loss=10.0629, acc=0.0014, iter_time=8.00s]
Epoch 0: 1%| | 136/12384 [17:22<25:53:48, 7.61s/it, loss=10.0629, acc=0.0014, iter_time=8.00s]
Epoch 0: 1%| | 136/12384 [17:29<25:53:48, 7.61s/it, loss=9.8734, acc=0.0004, iter_time=7.20s]
Epoch 0: 1%| | 137/12384 [17:29<25:54:19, 7.61s/it, loss=9.8734, acc=0.0004, iter_time=7.20s]
Epoch 0: 1%| | 137/12384 [17:37<25:54:19, 7.61s/it, loss=9.8371, acc=0.0002, iter_time=7.64s]
Epoch 0: 1%| | 138/12384 [17:37<25:57:14, 7.63s/it, loss=9.8371, acc=0.0002, iter_time=7.64s]
Epoch 0: 1%| | 138/12384 [17:45<25:57:14, 7.63s/it, loss=11.1795, acc=0.0004, iter_time=5.40s]
Epoch 0: 1%| | 139/12384 [17:45<25:54:51, 7.62s/it, loss=11.1795, acc=0.0004, iter_time=5.40s]
Epoch 0: 1%| | 139/12384 [17:52<25:54:51, 7.62s/it, loss=10.2292, acc=0.0009, iter_time=9.87s]
Epoch 0: 1%| | 140/12384 [17:52<25:55:35, 7.62s/it, loss=10.2292, acc=0.0009, iter_time=9.87s]
Epoch 0: 1%| | 140/12384 [18:00<25:55:35, 7.62s/it, loss=9.6422, acc=0.0007, iter_time=7.61s]
Epoch 0: 1%| | 141/12384 [18:00<25:54:59, 7.62s/it, loss=9.6422, acc=0.0007, iter_time=7.61s]
Epoch 0: 1%| | 141/12384 [18:08<25:54:59, 7.62s/it, loss=9.4567, acc=0.0005, iter_time=7.97s]
Epoch 0: 1%| | 142/12384 [18:08<26:15:02, 7.72s/it, loss=9.4567, acc=0.0005, iter_time=7.97s]
Epoch 0: 1%| | 142/12384 [18:15<26:15:02, 7.72s/it, loss=10.2324, acc=0.0003, iter_time=7.61s]
Epoch 0: 1%| | 143/12384 [18:15<26:08:21, 7.69s/it, loss=10.2324, acc=0.0003, iter_time=7.61s]
Epoch 0: 1%| | 143/12384 [18:23<26:08:21, 7.69s/it, loss=10.6632, acc=0.0008, iter_time=7.99s]
Epoch 0: 1%| | 144/12384 [18:23<26:03:11, 7.66s/it, loss=10.6632, acc=0.0008, iter_time=7.99s]
Epoch 0: 1%| | 144/12384 [18:31<26:03:11, 7.66s/it, loss=10.3803, acc=0.0003, iter_time=5.69s]
Epoch 0: 1%| | 145/12384 [18:31<26:00:16, 7.65s/it, loss=10.3803, acc=0.0003, iter_time=5.69s]
Epoch 0: 1%| | 145/12384 [18:38<26:00:16, 7.65s/it, loss=10.4196, acc=0.0005, iter_time=7.04s]
Epoch 0: 1%| | 146/12384 [18:38<25:58:28, 7.64s/it, loss=10.4196, acc=0.0005, iter_time=7.04s]
Epoch 0: 1%| | 146/12384 [18:46<25:58:28, 7.64s/it, loss=10.2963, acc=0.0005, iter_time=9.72s]
Epoch 0: 1%| | 147/12384 [18:46<25:59:32, 7.65s/it, loss=10.2963, acc=0.0005, iter_time=9.72s]
Epoch 0: 1%| | 147/12384 [18:54<25:59:32, 7.65s/it, loss=10.8822, acc=0.0004, iter_time=5.57s]
Epoch 0: 1%| | 148/12384 [18:54<25:56:15, 7.63s/it, loss=10.8822, acc=0.0004, iter_time=5.57s]
Epoch 0: 1%| | 148/12384 [19:01<25:56:15, 7.63s/it, loss=9.8738, acc=0.0004, iter_time=9.70s]
Epoch 0: 1%| | 149/12384 [19:01<25:56:42, 7.63s/it, loss=9.8738, acc=0.0004, iter_time=9.70s]
Epoch 0: 1%| | 149/12384 [19:09<25:56:42, 7.63s/it, loss=9.4181, acc=0.0008, iter_time=8.04s]
Epoch 0: 1%| | 150/12384 [19:09<25:55:19, 7.63s/it, loss=9.4181, acc=0.0008, iter_time=8.04s]
Epoch 0: 1%| | 150/12384 [19:16<25:55:19, 7.63s/it, loss=9.5931, acc=0.0012, iter_time=7.22s]
Epoch 0: 1%| | 151/12384 [19:16<25:55:08, 7.63s/it, loss=9.5931, acc=0.0012, iter_time=7.22s]
Epoch 0: 1%| | 151/12384 [19:24<25:55:08, 7.63s/it, loss=10.0816, acc=0.0001, iter_time=8.01s]
Epoch 0: 1%| | 152/12384 [19:24<25:53:38, 7.62s/it, loss=10.0816, acc=0.0001, iter_time=8.01s]
Epoch 0: 1%| | 152/12384 [19:32<25:53:38, 7.62s/it, loss=10.7061, acc=0.0000, iter_time=5.11s]
Epoch 0: 1%| | 153/12384 [19:32<25:52:31, 7.62s/it, loss=10.7061, acc=0.0000, iter_time=5.11s]
Epoch 0: 1%| | 153/12384 [19:39<25:52:31, 7.62s/it, loss=11.3992, acc=0.0005, iter_time=7.15s]
Epoch 0: 1%| | 154/12384 [19:39<25:50:59, 7.61s/it, loss=11.3992, acc=0.0005, iter_time=7.15s]
Epoch 0: 1%| | 154/12384 [19:47<25:50:59, 7.61s/it, loss=9.8613, acc=0.0006, iter_time=9.54s]
Epoch 0: 1%|▏ | 155/12384 [19:47<25:50:05, 7.61s/it, loss=9.8613, acc=0.0006, iter_time=9.54s]
Epoch 0: 1%|▏ | 155/12384 [19:54<25:50:05, 7.61s/it, loss=9.9140, acc=0.0012, iter_time=4.82s]
Epoch 0: 1%|▏ | 156/12384 [19:54<25:49:53, 7.60s/it, loss=9.9140, acc=0.0012, iter_time=4.82s]
Epoch 0: 1%|▏ | 156/12384 [20:02<25:49:53, 7.60s/it, loss=10.2191, acc=0.0009, iter_time=10.07s]
Epoch 0: 1%|▏ | 157/12384 [20:02<25:49:54, 7.61s/it, loss=10.2191, acc=0.0009, iter_time=10.07s]
Epoch 0: 1%|▏ | 157/12384 [20:10<25:49:54, 7.61s/it, loss=8.8124, acc=0.0006, iter_time=8.53s]
Epoch 0: 1%|▏ | 158/12384 [20:10<25:49:12, 7.60s/it, loss=8.8124, acc=0.0006, iter_time=8.53s]
Epoch 0: 1%|▏ | 158/12384 [20:17<25:49:12, 7.60s/it, loss=9.9854, acc=0.0003, iter_time=7.60s]
Epoch 0: 1%|▏ | 159/12384 [20:17<25:49:43, 7.61s/it, loss=9.9854, acc=0.0003, iter_time=7.60s]
Epoch 0: 1%|▏ | 159/12384 [20:25<25:49:43, 7.61s/it, loss=10.0365, acc=0.0004, iter_time=8.01s]
Epoch 0: 1%|▏ | 160/12384 [20:25<25:50:15, 7.61s/it, loss=10.0365, acc=0.0004, iter_time=8.01s]
Epoch 0: 1%|▏ | 160/12384 [20:33<25:50:15, 7.61s/it, loss=10.1688, acc=0.0002, iter_time=4.42s]
Epoch 0: 1%|▏ | 161/12384 [20:33<25:51:42, 7.62s/it, loss=10.1688, acc=0.0002, iter_time=4.42s]
Epoch 0: 1%|▏ | 161/12384 [20:40<25:51:42, 7.62s/it, loss=9.5088, acc=0.0001, iter_time=9.57s]
Epoch 0: 1%|▏ | 162/12384 [20:40<25:51:06, 7.61s/it, loss=9.5088, acc=0.0001, iter_time=9.57s]
Epoch 0: 1%|▏ | 162/12384 [20:48<25:51:06, 7.61s/it, loss=10.1466, acc=0.0009, iter_time=8.47s]
Epoch 0: 1%|▏ | 163/12384 [20:48<25:51:49, 7.62s/it, loss=10.1466, acc=0.0009, iter_time=8.47s]
Epoch 0: 1%|▏ | 163/12384 [20:55<25:51:49, 7.62s/it, loss=9.8549, acc=0.0006, iter_time=5.58s]
Epoch 0: 1%|▏ | 164/12384 [20:55<25:52:35, 7.62s/it, loss=9.8549, acc=0.0006, iter_time=5.58s]
Epoch 0: 1%|▏ | 164/12384 [21:03<25:52:35, 7.62s/it, loss=9.5383, acc=0.0011, iter_time=8.15s]
Epoch 0: 1%|▏ | 165/12384 [21:03<25:50:41, 7.61s/it, loss=9.5383, acc=0.0011, iter_time=8.15s]
Epoch 0: 1%|▏ | 165/12384 [21:11<25:50:41, 7.61s/it, loss=10.1700, acc=0.0001, iter_time=7.59s]
Epoch 0: 1%|▏ | 166/12384 [21:11<25:50:49, 7.62s/it, loss=10.1700, acc=0.0001, iter_time=7.59s]
Epoch 0: 1%|▏ | 166/12384 [21:19<25:50:49, 7.62s/it, loss=9.0799, acc=0.0002, iter_time=9.48s]
Epoch 0: 1%|▏ | 167/12384 [21:19<26:11:59, 7.72s/it, loss=9.0799, acc=0.0002, iter_time=9.48s]
Epoch 0: 1%|▏ | 167/12384 [21:26<26:11:59, 7.72s/it, loss=10.0764, acc=0.0000, iter_time=7.59s]
Epoch 0: 1%|▏ | 168/12384 [21:26<26:05:14, 7.69s/it, loss=10.0764, acc=0.0000, iter_time=7.59s]
Epoch 0: 1%|▏ | 168/12384 [21:34<26:05:14, 7.69s/it, loss=9.7896, acc=0.0004, iter_time=4.79s]
Epoch 0: 1%|▏ | 169/12384 [21:34<25:58:41, 7.66s/it, loss=9.7896, acc=0.0004, iter_time=4.79s]
Epoch 0: 1%|▏ | 169/12384 [21:41<25:58:41, 7.66s/it, loss=11.7126, acc=0.0006, iter_time=7.66s]
Epoch 0: 1%|▏ | 170/12384 [21:41<25:56:37, 7.65s/it, loss=11.7126, acc=0.0006, iter_time=7.66s]
Epoch 0: 1%|▏ | 170/12384 [21:49<25:56:37, 7.65s/it, loss=9.3127, acc=0.0011, iter_time=10.42s]
Epoch 0: 1%|▏ | 171/12384 [21:49<25:58:07, 7.65s/it, loss=9.3127, acc=0.0011, iter_time=10.42s]
Epoch 0: 1%|▏ | 171/12384 [21:57<25:58:07, 7.65s/it, loss=9.5550, acc=0.0008, iter_time=7.12s]
Epoch 0: 1%|▏ | 172/12384 [21:57<25:59:57, 7.66s/it, loss=9.5550, acc=0.0008, iter_time=7.12s]
Epoch 0: 1%|▏ | 172/12384 [22:04<25:59:57, 7.66s/it, loss=8.9660, acc=0.0003, iter_time=8.23s]
Epoch 0: 1%|▏ | 173/12384 [22:04<25:56:31, 7.65s/it, loss=8.9660, acc=0.0003, iter_time=8.23s]
Epoch 0: 1%|▏ | 173/12384 [22:12<25:56:31, 7.65s/it, loss=11.1203, acc=0.0010, iter_time=6.43s]
Epoch 0: 1%|▏ | 174/12384 [22:12<25:53:30, 7.63s/it, loss=11.1203, acc=0.0010, iter_time=6.43s]
Epoch 0: 1%|▏ | 174/12384 [22:20<25:53:30, 7.63s/it, loss=9.4668, acc=0.0002, iter_time=7.01s]
Epoch 0: 1%|▏ | 175/12384 [22:20<25:52:02, 7.63s/it, loss=9.4668, acc=0.0002, iter_time=7.01s]
Epoch 0: 1%|▏ | 175/12384 [22:27<25:52:02, 7.63s/it, loss=9.2470, acc=0.0005, iter_time=9.78s]
Epoch 0: 1%|▏ | 176/12384 [22:27<25:50:51, 7.62s/it, loss=9.2470, acc=0.0005, iter_time=9.78s]
Epoch 0: 1%|▏ | 176/12384 [22:35<25:50:51, 7.62s/it, loss=9.1590, acc=0.0007, iter_time=7.22s]
Epoch 0: 1%|▏ | 177/12384 [22:35<25:49:37, 7.62s/it, loss=9.1590, acc=0.0007, iter_time=7.22s]
Epoch 0: 1%|▏ | 177/12384 [22:42<25:49:37, 7.62s/it, loss=9.4669, acc=0.0010, iter_time=5.80s]
Epoch 0: 1%|▏ | 178/12384 [22:42<25:47:19, 7.61s/it, loss=9.4669, acc=0.0010, iter_time=5.80s]
Epoch 0: 1%|▏ | 178/12384 [22:50<25:47:19, 7.61s/it, loss=9.2095, acc=0.0009, iter_time=9.37s]
Epoch 0: 1%|▏ | 179/12384 [22:50<25:48:30, 7.61s/it, loss=9.2095, acc=0.0009, iter_time=9.37s]
Epoch 0: 1%|▏ | 179/12384 [22:58<25:48:30, 7.61s/it, loss=9.3064, acc=0.0003, iter_time=7.63s]
Epoch 0: 1%|▏ | 180/12384 [22:58<25:48:06, 7.61s/it, loss=9.3064, acc=0.0003, iter_time=7.63s]
Epoch 0: 1%|▏ | 180/12384 [23:05<25:48:06, 7.61s/it, loss=9.2088, acc=0.0019, iter_time=7.62s]
Epoch 0: 1%|▏ | 181/12384 [23:05<25:47:39, 7.61s/it, loss=9.2088, acc=0.0019, iter_time=7.62s]
Epoch 0: 1%|▏ | 181/12384 [23:13<25:47:39, 7.61s/it, loss=9.0347, acc=0.0000, iter_time=5.51s]
Epoch 0: 1%|▏ | 182/12384 [23:13<25:48:15, 7.61s/it, loss=9.0347, acc=0.0000, iter_time=5.51s]
Epoch 0: 1%|▏ | 182/12384 [23:20<25:48:15, 7.61s/it, loss=8.9292, acc=0.0003, iter_time=7.97s]
Epoch 0: 1%|▏ | 183/12384 [23:20<25:48:41, 7.62s/it, loss=8.9292, acc=0.0003, iter_time=7.97s]
Epoch 0: 1%|▏ | 183/12384 [23:28<25:48:41, 7.62s/it, loss=9.0322, acc=0.0004, iter_time=9.73s]
Epoch 0: 1%|▏ | 184/12384 [23:28<25:48:52, 7.62s/it, loss=9.0322, acc=0.0004, iter_time=9.73s]
Epoch 0: 1%|▏ | 184/12384 [23:36<25:48:52, 7.62s/it, loss=9.1662, acc=0.0003, iter_time=7.25s]
Epoch 0: 1%|▏ | 185/12384 [23:36<25:50:14, 7.62s/it, loss=9.1662, acc=0.0003, iter_time=7.25s]
Epoch 0: 1%|▏ | 185/12384 [23:43<25:50:14, 7.62s/it, loss=8.8746, acc=0.0000, iter_time=4.39s]
Epoch 0: 2%|▏ | 186/12384 [23:43<25:54:35, 7.65s/it, loss=8.8746, acc=0.0000, iter_time=4.39s]
Epoch 0: 2%|▏ | 186/12384 [23:51<25:54:35, 7.65s/it, loss=8.9561, acc=0.0007, iter_time=10.96s]
Epoch 0: 2%|▏ | 187/12384 [23:51<25:52:37, 7.64s/it, loss=8.9561, acc=0.0007, iter_time=10.96s]
Epoch 0: 2%|▏ | 187/12384 [23:59<25:52:37, 7.64s/it, loss=8.7833, acc=0.0015, iter_time=7.62s]
Epoch 0: 2%|▏ | 188/12384 [23:59<25:54:46, 7.65s/it, loss=8.7833, acc=0.0015, iter_time=7.62s]
Epoch 0: 2%|▏ | 188/12384 [24:06<25:54:46, 7.65s/it, loss=9.0253, acc=0.0021, iter_time=5.94s]
Epoch 0: 2%|▏ | 189/12384 [24:06<25:51:40, 7.63s/it, loss=9.0253, acc=0.0021, iter_time=5.94s]
Epoch 0: 2%|▏ | 189/12384 [24:14<25:51:40, 7.63s/it, loss=9.4630, acc=0.0007, iter_time=9.02s]
Epoch 0: 2%|▏ | 190/12384 [24:14<25:51:09, 7.63s/it, loss=9.4630, acc=0.0007, iter_time=9.02s]
Epoch 0: 2%|▏ | 190/12384 [24:22<25:51:09, 7.63s/it, loss=8.8498, acc=0.0006, iter_time=7.92s]
Epoch 0: 2%|▏ | 191/12384 [24:22<25:47:52, 7.62s/it, loss=8.8498, acc=0.0006, iter_time=7.92s]
Epoch 0: 2%|▏ | 191/12384 [24:29<25:47:52, 7.62s/it, loss=9.3568, acc=0.0002, iter_time=7.55s]
Epoch 0: 2%|▏ | 192/12384 [24:29<25:47:53, 7.62s/it, loss=9.3568, acc=0.0002, iter_time=7.55s]
Epoch 0: 2%|▏ | 192/12384 [24:37<25:47:53, 7.62s/it, loss=8.7064, acc=0.0008, iter_time=8.01s]
Epoch 0: 2%|▏ | 193/12384 [24:37<26:09:22, 7.72s/it, loss=8.7064, acc=0.0008, iter_time=8.01s]
Epoch 0: 2%|▏ | 193/12384 [24:45<26:09:22, 7.72s/it, loss=9.0487, acc=0.0007, iter_time=7.65s]
Epoch 0: 2%|▏ | 194/12384 [24:45<26:04:38, 7.70s/it, loss=9.0487, acc=0.0007, iter_time=7.65s]
Epoch 0: 2%|▏ | 194/12384 [24:52<26:04:38, 7.70s/it, loss=9.0839, acc=0.0005, iter_time=5.53s]
Epoch 0: 2%|▏ | 195/12384 [24:52<25:59:26, 7.68s/it, loss=9.0839, acc=0.0005, iter_time=5.53s]
Epoch 0: 2%|▏ | 195/12384 [25:00<25:59:26, 7.68s/it, loss=8.1845, acc=0.0004, iter_time=9.71s]
Epoch 0: 2%|▏ | 196/12384 [25:00<25:54:10, 7.65s/it, loss=8.1845, acc=0.0004, iter_time=9.71s]
Epoch 0: 2%|▏ | 196/12384 [25:08<25:54:10, 7.65s/it, loss=8.0781, acc=0.0012, iter_time=7.69s]
Epoch 0: 2%|▏ | 197/12384 [25:08<25:56:08, 7.66s/it, loss=8.0781, acc=0.0012, iter_time=7.69s]
Epoch 0: 2%|▏ | 197/12384 [25:15<25:56:08, 7.66s/it, loss=8.8953, acc=0.0010, iter_time=7.39s]
Epoch 0: 2%|▏ | 198/12384 [25:15<26:02:32, 7.69s/it, loss=8.8953, acc=0.0010, iter_time=7.39s]
Epoch 0: 2%|▏ | 198/12384 [25:23<26:02:32, 7.69s/it, loss=9.0396, acc=0.0004, iter_time=7.96s]
Epoch 0: 2%|▏ | 199/12384 [25:23<25:56:17, 7.66s/it, loss=9.0396, acc=0.0004, iter_time=7.96s]
Epoch 0: 2%|▏ | 199/12384 [25:31<25:56:17, 7.66s/it, loss=9.1129, acc=0.0009, iter_time=8.02s]
Epoch 0: 2%|▏ | 200/12384 [25:31<25:53:56, 7.65s/it, loss=9.1129, acc=0.0009, iter_time=8.02s]
Epoch 0: 2%|▏ | 200/12384 [25:38<25:53:56, 7.65s/it, loss=8.4465, acc=0.0007, iter_time=6.25s]
Epoch 0: 2%|▏ | 201/12384 [25:38<25:51:29, 7.64s/it, loss=8.4465, acc=0.0007, iter_time=6.25s]
Epoch 0: 2%|▏ | 201/12384 [25:46<25:51:29, 7.64s/it, loss=8.7059, acc=0.0011, iter_time=8.56s]
Epoch 0: 2%|▏ | 202/12384 [25:46<25:49:30, 7.63s/it, loss=8.7059, acc=0.0011, iter_time=8.56s]
Epoch 0: 2%|▏ | 202/12384 [25:53<25:49:30, 7.63s/it, loss=8.5992, acc=0.0011, iter_time=7.63s]
Epoch 0: 2%|▏ | 203/12384 [25:53<25:48:30, 7.63s/it, loss=8.5992, acc=0.0011, iter_time=7.63s]
Epoch 0: 2%|▏ | 203/12384 [26:01<25:48:30, 7.63s/it, loss=8.7102, acc=0.0012, iter_time=7.30s]
Epoch 0: 2%|▏ | 204/12384 [26:01<25:46:32, 7.62s/it, loss=8.7102, acc=0.0012, iter_time=7.30s]
Epoch 0: 2%|▏ | 204/12384 [26:09<25:46:32, 7.62s/it, loss=8.7894, acc=0.0019, iter_time=6.98s]
Epoch 0: 2%|▏ | 205/12384 [26:09<25:46:09, 7.62s/it, loss=8.7894, acc=0.0019, iter_time=6.98s]
Epoch 0: 2%|▏ | 205/12384 [26:16<25:46:09, 7.62s/it, loss=9.4527, acc=0.0002, iter_time=5.51s]
Epoch 0: 2%|▏ | 206/12384 [26:16<25:47:22, 7.62s/it, loss=9.4527, acc=0.0002, iter_time=5.51s]
Epoch 0: 2%|▏ | 206/12384 [26:24<25:47:22, 7.62s/it, loss=8.4351, acc=0.0012, iter_time=10.66s]
Epoch 0: 2%|▏ | 207/12384 [26:24<25:45:33, 7.62s/it, loss=8.4351, acc=0.0012, iter_time=10.66s]
Epoch 0: 2%|▏ | 207/12384 [26:32<25:45:33, 7.62s/it, loss=8.3410, acc=0.0008, iter_time=7.53s]
Epoch 0: 2%|▏ | 208/12384 [26:32<25:44:22, 7.61s/it, loss=8.3410, acc=0.0008, iter_time=7.53s]
Epoch 0: 2%|▏ | 208/12384 [26:39<25:44:22, 7.61s/it, loss=8.4003, acc=0.0017, iter_time=5.92s]
Epoch 0: 2%|▏ | 209/12384 [26:39<25:43:12, 7.61s/it, loss=8.4003, acc=0.0017, iter_time=5.92s]
Epoch 0: 2%|▏ | 209/12384 [26:47<25:43:12, 7.61s/it, loss=8.1942, acc=0.0015, iter_time=6.05s]
Epoch 0: 2%|▏ | 210/12384 [26:47<25:42:56, 7.60s/it, loss=8.1942, acc=0.0015, iter_time=6.05s]
Epoch 0: 2%|▏ | 210/12384 [26:54<25:42:56, 7.60s/it, loss=8.5600, acc=0.0008, iter_time=10.88s]
Epoch 0: 2%|▏ | 211/12384 [26:54<25:43:20, 7.61s/it, loss=8.5600, acc=0.0008, iter_time=10.88s]
Epoch 0: 2%|▏ | 211/12384 [27:02<25:43:20, 7.61s/it, loss=8.1708, acc=0.0016, iter_time=7.62s]
Epoch 0: 2%|▏ | 212/12384 [27:02<25:43:44, 7.61s/it, loss=8.1708, acc=0.0016, iter_time=7.62s]
Epoch 0: 2%|▏ | 212/12384 [27:10<25:43:44, 7.61s/it, loss=8.1449, acc=0.0007, iter_time=7.62s]
Epoch 0: 2%|▏ | 213/12384 [27:10<25:42:50, 7.61s/it, loss=8.1449, acc=0.0007, iter_time=7.62s]
Epoch 0: 2%|▏ | 213/12384 [27:17<25:42:50, 7.61s/it, loss=8.5393, acc=0.0014, iter_time=4.30s]
Epoch 0: 2%|▏ | 214/12384 [27:17<25:42:27, 7.60s/it, loss=8.5393, acc=0.0014, iter_time=4.30s]
Epoch 0: 2%|▏ | 214/12384 [27:25<25:42:27, 7.60s/it, loss=8.1967, acc=0.0009, iter_time=10.90s]
Epoch 0: 2%|▏ | 215/12384 [27:25<25:41:34, 7.60s/it, loss=8.1967, acc=0.0009, iter_time=10.90s]
Epoch 0: 2%|▏ | 215/12384 [27:32<25:41:34, 7.60s/it, loss=9.2189, acc=0.0004, iter_time=7.56s]
Epoch 0: 2%|▏ | 216/12384 [27:32<25:42:09, 7.60s/it, loss=9.2189, acc=0.0004, iter_time=7.56s]
Epoch 0: 2%|▏ | 216/12384 [27:40<25:42:09, 7.60s/it, loss=8.2695, acc=0.0009, iter_time=4.80s]
Epoch 0: 2%|▏ | 217/12384 [27:40<25:42:56, 7.61s/it, loss=8.2695, acc=0.0009, iter_time=4.80s]
Epoch 0: 2%|▏ | 217/12384 [27:48<25:42:56, 7.61s/it, loss=7.8203, acc=0.0006, iter_time=8.23s]
Epoch 0: 2%|▏ | 218/12384 [27:48<25:45:37, 7.62s/it, loss=7.8203, acc=0.0006, iter_time=8.23s]
Epoch 0: 2%|▏ | 218/12384 [27:56<25:45:37, 7.62s/it, loss=8.0925, acc=0.0007, iter_time=10.25s]
Epoch 0: 2%|▏ | 219/12384 [27:56<26:06:18, 7.73s/it, loss=8.0925, acc=0.0007, iter_time=10.25s]
Epoch 0: 2%|▏ | 219/12384 [28:03<26:06:18, 7.73s/it, loss=8.1302, acc=0.0021, iter_time=7.64s]
Epoch 0: 2%|▏ | 220/12384 [28:03<25:58:52, 7.69s/it, loss=8.1302, acc=0.0021, iter_time=7.64s]
Epoch 0: 2%|▏ | 220/12384 [28:11<25:58:52, 7.69s/it, loss=7.9559, acc=0.0017, iter_time=7.61s]
Epoch 0: 2%|▏ | 221/12384 [28:11<25:53:52, 7.67s/it, loss=7.9559, acc=0.0017, iter_time=7.61s]
Epoch 0: 2%|▏ | 221/12384 [28:18<25:53:52, 7.67s/it, loss=8.0055, acc=0.0012, iter_time=7.60s]
Epoch 0: 2%|▏ | 222/12384 [28:18<25:51:18, 7.65s/it, loss=8.0055, acc=0.0012, iter_time=7.60s]
Epoch 0: 2%|▏ | 222/12384 [28:26<25:51:18, 7.65s/it, loss=8.2762, acc=0.0003, iter_time=7.62s]
Epoch 0: 2%|▏ | 223/12384 [28:26<25:49:22, 7.64s/it, loss=8.2762, acc=0.0003, iter_time=7.62s]
Epoch 0: 2%|▏ | 223/12384 [28:34<25:49:22, 7.64s/it, loss=8.1733, acc=0.0003, iter_time=8.02s]
Epoch 0: 2%|▏ | 224/12384 [28:34<25:48:10, 7.64s/it, loss=8.1733, acc=0.0003, iter_time=8.02s]
Epoch 0: 2%|▏ | 224/12384 [28:41<25:48:10, 7.64s/it, loss=8.0469, acc=0.0007, iter_time=7.25s]
Epoch 0: 2%|▏ | 225/12384 [28:41<25:47:04, 7.63s/it, loss=8.0469, acc=0.0007, iter_time=7.25s]
Epoch 0: 2%|▏ | 225/12384 [28:49<25:47:04, 7.63s/it, loss=7.5721, acc=0.0013, iter_time=7.63s]
Epoch 0: 2%|▏ | 226/12384 [28:49<25:46:18, 7.63s/it, loss=7.5721, acc=0.0013, iter_time=7.63s]
Epoch 0: 2%|▏ | 226/12384 [28:57<25:46:18, 7.63s/it, loss=8.4092, acc=0.0011, iter_time=6.10s]
Epoch 0: 2%|▏ | 227/12384 [28:57<25:44:58, 7.63s/it, loss=8.4092, acc=0.0011, iter_time=6.10s]
Epoch 0: 2%|▏ | 227/12384 [29:04<25:44:58, 7.63s/it, loss=8.6103, acc=0.0008, iter_time=9.11s]
Epoch 0: 2%|▏ | 228/12384 [29:04<25:43:04, 7.62s/it, loss=8.6103, acc=0.0008, iter_time=9.11s]
Epoch 0: 2%|▏ | 228/12384 [29:12<25:43:04, 7.62s/it, loss=7.8254, acc=0.0010, iter_time=7.62s]
Epoch 0: 2%|▏ | 229/12384 [29:12<25:43:22, 7.62s/it, loss=7.8254, acc=0.0010, iter_time=7.62s]
Epoch 0: 2%|▏ | 229/12384 [29:19<25:43:22, 7.62s/it, loss=8.3213, acc=0.0004, iter_time=7.60s]
Epoch 0: 2%|▏ | 230/12384 [29:19<25:42:10, 7.61s/it, loss=8.3213, acc=0.0004, iter_time=7.60s]
Epoch 0: 2%|▏ | 230/12384 [29:27<25:42:10, 7.61s/it, loss=7.7028, acc=0.0012, iter_time=7.60s]
Epoch 0: 2%|▏ | 231/12384 [29:27<25:41:10, 7.61s/it, loss=7.7028, acc=0.0012, iter_time=7.60s]
Epoch 0: 2%|▏ | 231/12384 [29:35<25:41:10, 7.61s/it, loss=7.7464, acc=0.0008, iter_time=7.98s]
Epoch 0: 2%|▏ | 232/12384 [29:35<25:41:33, 7.61s/it, loss=7.7464, acc=0.0008, iter_time=7.98s]
Epoch 0: 2%|▏ | 232/12384 [29:42<25:41:33, 7.61s/it, loss=7.7255, acc=0.0011, iter_time=7.24s]
Epoch 0: 2%|▏ | 233/12384 [29:42<25:41:24, 7.61s/it, loss=7.7255, acc=0.0011, iter_time=7.24s]
Epoch 0: 2%|▏ | 233/12384 [29:50<25:41:24, 7.61s/it, loss=7.4921, acc=0.0031, iter_time=7.37s]
Epoch 0: 2%|▏ | 234/12384 [29:50<25:43:31, 7.62s/it, loss=7.4921, acc=0.0031, iter_time=7.37s]
Epoch 0: 2%|▏ | 234/12384 [29:57<25:43:31, 7.62s/it, loss=7.4017, acc=0.0012, iter_time=7.88s]
Epoch 0: 2%|▏ | 235/12384 [29:57<25:42:08, 7.62s/it, loss=7.4017, acc=0.0012, iter_time=7.88s]
Epoch 0: 2%|▏ | 235/12384 [30:05<25:42:08, 7.62s/it, loss=7.7226, acc=0.0014, iter_time=7.61s]
Epoch 0: 2%|▏ | 236/12384 [30:05<25:41:06, 7.61s/it, loss=7.7226, acc=0.0014, iter_time=7.61s]
Epoch 0: 2%|▏ | 236/12384 [30:13<25:41:06, 7.61s/it, loss=7.8968, acc=0.0015, iter_time=4.29s]
Epoch 0: 2%|▏ | 237/12384 [30:13<25:41:28, 7.61s/it, loss=7.8968, acc=0.0015, iter_time=4.29s]
Epoch 0: 2%|▏ | 237/12384 [30:20<25:41:28, 7.61s/it, loss=7.7653, acc=0.0008, iter_time=9.73s]
Epoch 0: 2%|▏ | 238/12384 [30:20<25:41:26, 7.61s/it, loss=7.7653, acc=0.0008, iter_time=9.73s]
Epoch 0: 2%|▏ | 238/12384 [30:28<25:41:26, 7.61s/it, loss=7.4441, acc=0.0005, iter_time=8.81s]
Epoch 0: 2%|▏ | 239/12384 [30:28<25:41:40, 7.62s/it, loss=7.4441, acc=0.0005, iter_time=8.81s]
Epoch 0: 2%|▏ | 239/12384 [30:36<25:41:40, 7.62s/it, loss=7.7818, acc=0.0017, iter_time=7.72s]
Epoch 0: 2%|▏ | 240/12384 [30:36<25:41:15, 7.61s/it, loss=7.7818, acc=0.0017, iter_time=7.72s]
Epoch 0: 2%|▏ | 240/12384 [30:43<25:41:15, 7.61s/it, loss=7.3092, acc=0.0016, iter_time=7.51s]
Epoch 0: 2%|▏ | 241/12384 [30:43<25:41:55, 7.62s/it, loss=7.3092, acc=0.0016, iter_time=7.51s]
Epoch 0: 2%|▏ | 241/12384 [30:51<25:41:55, 7.62s/it, loss=7.3285, acc=0.0004, iter_time=7.62s]
Epoch 0: 2%|▏ | 242/12384 [30:51<25:41:39, 7.62s/it, loss=7.3285, acc=0.0004, iter_time=7.62s]
Epoch 0: 2%|▏ | 242/12384 [30:58<25:41:39, 7.62s/it, loss=7.2497, acc=0.0021, iter_time=5.08s]
Epoch 0: 2%|▏ | 243/12384 [30:58<25:41:46, 7.62s/it, loss=7.2497, acc=0.0021, iter_time=5.08s]
Epoch 0: 2%|▏ | 243/12384 [31:06<25:41:46, 7.62s/it, loss=7.8699, acc=0.0010, iter_time=10.18s]
Epoch 0: 2%|▏ | 244/12384 [31:06<25:41:38, 7.62s/it, loss=7.8699, acc=0.0010, iter_time=10.18s]
Epoch 0: 2%|▏ | 244/12384 [31:14<25:41:38, 7.62s/it, loss=7.1896, acc=0.0005, iter_time=6.50s]
Epoch 0: 2%|▏ | 245/12384 [31:14<26:03:25, 7.73s/it, loss=7.1896, acc=0.0005, iter_time=6.50s]
Epoch 0: 2%|▏ | 245/12384 [31:22<26:03:25, 7.73s/it, loss=7.3709, acc=0.0019, iter_time=9.09s]
Epoch 0: 2%|▏ | 246/12384 [31:22<25:58:01, 7.70s/it, loss=7.3709, acc=0.0019, iter_time=9.09s]
Epoch 0: 2%|▏ | 246/12384 [31:29<25:58:01, 7.70s/it, loss=7.8744, acc=0.0013, iter_time=7.64s]
Epoch 0: 2%|▏ | 247/12384 [31:29<25:53:01, 7.68s/it, loss=7.8744, acc=0.0013, iter_time=7.64s]
Epoch 0: 2%|▏ | 247/12384 [31:37<25:53:01, 7.68s/it, loss=7.2414, acc=0.0013, iter_time=7.58s]
Epoch 0: 2%|▏ | 248/12384 [31:37<25:49:33, 7.66s/it, loss=7.2414, acc=0.0013, iter_time=7.58s]
Epoch 0: 2%|▏ | 248/12384 [31:44<25:49:33, 7.66s/it, loss=7.3171, acc=0.0023, iter_time=7.36s]
Epoch 0: 2%|▏ | 249/12384 [31:44<25:47:31, 7.65s/it, loss=7.3171, acc=0.0023, iter_time=7.36s]
Epoch 0: 2%|▏ | 249/12384 [31:52<25:47:31, 7.65s/it, loss=7.6077, acc=0.0017, iter_time=8.38s]
Epoch 0: 2%|▏ | 250/12384 [31:52<25:47:53, 7.65s/it, loss=7.6077, acc=0.0017, iter_time=8.38s]
Epoch 0: 2%|▏ | 250/12384 [32:00<25:47:53, 7.65s/it, loss=7.2557, acc=0.0007, iter_time=7.23s]
Epoch 0: 2%|▏ | 251/12384 [32:00<25:46:13, 7.65s/it, loss=7.2557, acc=0.0007, iter_time=7.23s]
Epoch 0: 2%|▏ | 251/12384 [32:07<25:46:13, 7.65s/it, loss=7.6219, acc=0.0037, iter_time=7.60s]
Epoch 0: 2%|▏ | 252/12384 [32:07<25:43:47, 7.63s/it, loss=7.6219, acc=0.0037, iter_time=7.60s]
Epoch 0: 2%|▏ | 252/12384 [32:15<25:43:47, 7.63s/it, loss=7.3821, acc=0.0010, iter_time=7.63s]
Epoch 0: 2%|▏ | 253/12384 [32:15<25:41:50, 7.63s/it, loss=7.3821, acc=0.0010, iter_time=7.63s]
Epoch 0: 2%|▏ | 253/12384 [32:23<25:41:50, 7.63s/it, loss=7.3558, acc=0.0023, iter_time=7.60s]
Epoch 0: 2%|▏ | 254/12384 [32:23<25:40:58, 7.62s/it, loss=7.3558, acc=0.0023, iter_time=7.60s]
Epoch 0: 2%|▏ | 254/12384 [32:30<25:40:58, 7.62s/it, loss=7.2150, acc=0.0005, iter_time=7.63s]
Epoch 0: 2%|▏ | 255/12384 [32:30<25:40:46, 7.62s/it, loss=7.2150, acc=0.0005, iter_time=7.63s]
Epoch 0: 2%|▏ | 255/12384 [32:38<25:40:46, 7.62s/it, loss=7.7335, acc=0.0030, iter_time=8.01s]
Epoch 0: 2%|▏ | 256/12384 [32:38<25:40:48, 7.62s/it, loss=7.7335, acc=0.0030, iter_time=8.01s]
Epoch 0: 2%|▏ | 256/12384 [32:46<25:40:48, 7.62s/it, loss=7.2011, acc=0.0032, iter_time=7.31s]
Epoch 0: 2%|▏ | 257/12384 [32:46<25:45:35, 7.65s/it, loss=7.2011, acc=0.0032, iter_time=7.31s]
Epoch 0: 2%|▏ | 257/12384 [32:53<25:45:35, 7.65s/it, loss=7.1936, acc=0.0010, iter_time=4.09s]
Epoch 0: 2%|▏ | 258/12384 [32:53<25:41:55, 7.63s/it, loss=7.1936, acc=0.0010, iter_time=4.09s]
Epoch 0: 2%|▏ | 258/12384 [33:01<25:41:55, 7.63s/it, loss=7.2091, acc=0.0023, iter_time=8.49s]
Epoch 0: 2%|▏ | 259/12384 [33:01<25:44:24, 7.64s/it, loss=7.2091, acc=0.0023, iter_time=8.49s]
Epoch 0: 2%|▏ | 259/12384 [33:08<25:44:24, 7.64s/it, loss=7.0181, acc=0.0028, iter_time=8.86s]
Epoch 0: 2%|▏ | 260/12384 [33:08<25:41:36, 7.63s/it, loss=7.0181, acc=0.0028, iter_time=8.86s]
Epoch 0: 2%|▏ | 260/12384 [33:16<25:41:36, 7.63s/it, loss=6.9521, acc=0.0031, iter_time=9.03s]
Epoch 0: 2%|▏ | 261/12384 [33:16<25:41:04, 7.63s/it, loss=6.9521, acc=0.0031, iter_time=9.03s]
Epoch 0: 2%|▏ | 261/12384 [33:24<25:41:04, 7.63s/it, loss=7.0568, acc=0.0019, iter_time=7.63s]
Epoch 0: 2%|▏ | 262/12384 [33:24<25:40:38, 7.63s/it, loss=7.0568, acc=0.0019, iter_time=7.63s]
Epoch 0: 2%|▏ | 262/12384 [33:31<25:40:38, 7.63s/it, loss=7.2068, acc=0.0025, iter_time=7.62s]
Epoch 0: 2%|▏ | 263/12384 [33:31<25:43:03, 7.64s/it, loss=7.2068, acc=0.0025, iter_time=7.62s]
Epoch 0: 2%|▏ | 263/12384 [33:39<25:43:03, 7.64s/it, loss=7.3054, acc=0.0012, iter_time=8.03s]
Epoch 0: 2%|▏ | 264/12384 [33:39<25:39:58, 7.62s/it, loss=7.3054, acc=0.0012, iter_time=8.03s]
Epoch 0: 2%|▏ | 264/12384 [33:47<25:39:58, 7.62s/it, loss=7.0947, acc=0.0027, iter_time=7.20s]
Epoch 0: 2%|▏ | 265/12384 [33:47<25:40:44, 7.63s/it, loss=7.0947, acc=0.0027, iter_time=7.20s]
Epoch 0: 2%|▏ | 265/12384 [33:54<25:40:44, 7.63s/it, loss=6.9332, acc=0.0029, iter_time=5.57s]
Epoch 0: 2%|▏ | 266/12384 [33:54<25:40:32, 7.63s/it, loss=6.9332, acc=0.0029, iter_time=5.57s]
Epoch 0: 2%|▏ | 266/12384 [34:02<25:40:32, 7.63s/it, loss=6.8398, acc=0.0025, iter_time=9.71s]
Epoch 0: 2%|▏ | 267/12384 [34:02<25:39:43, 7.62s/it, loss=6.8398, acc=0.0025, iter_time=9.71s]
Epoch 0: 2%|▏ | 267/12384 [34:09<25:39:43, 7.62s/it, loss=7.1971, acc=0.0026, iter_time=5.55s]
Epoch 0: 2%|▏ | 268/12384 [34:09<25:38:02, 7.62s/it, loss=7.1971, acc=0.0026, iter_time=5.55s]
Epoch 0: 2%|▏ | 268/12384 [34:17<25:38:02, 7.62s/it, loss=7.0218, acc=0.0014, iter_time=7.66s]
Epoch 0: 2%|▏ | 269/12384 [34:17<25:36:22, 7.61s/it, loss=7.0218, acc=0.0014, iter_time=7.66s]
Epoch 0: 2%|▏ | 269/12384 [34:25<25:36:22, 7.61s/it, loss=6.9738, acc=0.0023, iter_time=9.57s]
Epoch 0: 2%|▏ | 270/12384 [34:25<25:36:18, 7.61s/it, loss=6.9738, acc=0.0023, iter_time=9.57s]
Epoch 0: 2%|▏ | 270/12384 [34:32<25:36:18, 7.61s/it, loss=7.2857, acc=0.0023, iter_time=7.61s]
Epoch 0: 2%|▏ | 271/12384 [34:32<25:38:55, 7.62s/it, loss=7.2857, acc=0.0023, iter_time=7.61s]
Epoch 0: 2%|▏ | 271/12384 [34:40<25:38:55, 7.62s/it, loss=7.3402, acc=0.0024, iter_time=8.04s]
Epoch 0: 2%|▏ | 272/12384 [34:40<26:04:00, 7.75s/it, loss=7.3402, acc=0.0024, iter_time=8.04s]
Epoch 0: 2%|▏ | 272/12384 [34:48<26:04:00, 7.75s/it, loss=6.7737, acc=0.0021, iter_time=7.66s]
Epoch 0: 2%|▏ | 273/12384 [34:48<25:55:07, 7.70s/it, loss=6.7737, acc=0.0021, iter_time=7.66s]
Epoch 0: 2%|▏ | 273/12384 [34:55<25:55:07, 7.70s/it, loss=6.9054, acc=0.0030, iter_time=7.59s]
Epoch 0: 2%|▏ | 274/12384 [34:55<25:47:58, 7.67s/it, loss=6.9054, acc=0.0030, iter_time=7.59s]
Epoch 0: 2%|▏ | 274/12384 [35:03<25:47:58, 7.67s/it, loss=6.9787, acc=0.0025, iter_time=7.61s]
Epoch 0: 2%|▏ | 275/12384 [35:03<25:44:12, 7.65s/it, loss=6.9787, acc=0.0025, iter_time=7.61s]
Epoch 0: 2%|▏ | 275/12384 [35:11<25:44:12, 7.65s/it, loss=7.3321, acc=0.0043, iter_time=7.60s]
Epoch 0: 2%|▏ | 276/12384 [35:11<25:42:26, 7.64s/it, loss=7.3321, acc=0.0043, iter_time=7.60s]
Epoch 0: 2%|▏ | 276/12384 [35:18<25:42:26, 7.64s/it, loss=6.9456, acc=0.0037, iter_time=7.61s]
Epoch 0: 2%|▏ | 277/12384 [35:18<25:40:17, 7.63s/it, loss=6.9456, acc=0.0037, iter_time=7.61s]
Epoch 0: 2%|▏ | 277/12384 [35:26<25:40:17, 7.63s/it, loss=6.8192, acc=0.0020, iter_time=7.61s]
Epoch 0: 2%|▏ | 278/12384 [35:26<25:41:23, 7.64s/it, loss=6.8192, acc=0.0020, iter_time=7.61s]
Epoch 0: 2%|▏ | 278/12384 [35:34<25:41:23, 7.64s/it, loss=6.8747, acc=0.0022, iter_time=7.67s]
Epoch 0: 2%|▏ | 279/12384 [35:34<25:41:17, 7.64s/it, loss=6.8747, acc=0.0022, iter_time=7.67s]
Epoch 0: 2%|▏ | 279/12384 [35:41<25:41:17, 7.64s/it, loss=7.0972, acc=0.0034, iter_time=7.74s]
Epoch 0: 2%|▏ | 280/12384 [35:41<25:39:15, 7.63s/it, loss=7.0972, acc=0.0034, iter_time=7.74s]
Epoch 0: 2%|▏ | 280/12384 [35:49<25:39:15, 7.63s/it, loss=7.0766, acc=0.0040, iter_time=7.47s]
Epoch 0: 2%|▏ | 281/12384 [35:49<25:38:00, 7.62s/it, loss=7.0766, acc=0.0040, iter_time=7.47s]
Epoch 0: 2%|▏ | 281/12384 [35:56<25:38:00, 7.62s/it, loss=6.6613, acc=0.0049, iter_time=7.01s]
Epoch 0: 2%|▏ | 282/12384 [35:56<25:36:47, 7.62s/it, loss=6.6613, acc=0.0049, iter_time=7.01s]
Epoch 0: 2%|▏ | 282/12384 [36:04<25:36:47, 7.62s/it, loss=7.0218, acc=0.0014, iter_time=5.92s]
Epoch 0: 2%|▏ | 283/12384 [36:04<25:36:00, 7.62s/it, loss=7.0218, acc=0.0014, iter_time=5.92s]
Epoch 0: 2%|▏ | 283/12384 [36:12<25:36:00, 7.62s/it, loss=6.9400, acc=0.0038, iter_time=9.91s]
Epoch 0: 2%|▏ | 284/12384 [36:12<25:35:35, 7.61s/it, loss=6.9400, acc=0.0038, iter_time=9.91s]
Epoch 0: 2%|▏ | 284/12384 [36:19<25:35:35, 7.61s/it, loss=7.3453, acc=0.0021, iter_time=7.62s]
Epoch 0: 2%|▏ | 285/12384 [36:19<25:34:29, 7.61s/it, loss=7.3453, acc=0.0021, iter_time=7.62s]
Epoch 0: 2%|▏ | 285/12384 [36:27<25:34:29, 7.61s/it, loss=6.8005, acc=0.0029, iter_time=7.59s]
Epoch 0: 2%|▏ | 286/12384 [36:27<25:34:10, 7.61s/it, loss=6.8005, acc=0.0029, iter_time=7.59s]
Epoch 0: 2%|▏ | 286/12384 [36:34<25:34:10, 7.61s/it, loss=6.7767, acc=0.0041, iter_time=7.61s]
Epoch 0: 2%|▏ | 287/12384 [36:34<25:33:33, 7.61s/it, loss=6.7767, acc=0.0041, iter_time=7.61s]
Epoch 0: 2%|▏ | 287/12384 [36:42<25:33:33, 7.61s/it, loss=7.3385, acc=0.0036, iter_time=7.98s]
Epoch 0: 2%|▏ | 288/12384 [36:42<25:34:34, 7.61s/it, loss=7.3385, acc=0.0036, iter_time=7.98s]
Epoch 0: 2%|▏ | 288/12384 [36:50<25:34:34, 7.61s/it, loss=6.7447, acc=0.0030, iter_time=6.94s]
Epoch 0: 2%|▏ | 289/12384 [36:50<25:33:41, 7.61s/it, loss=6.7447, acc=0.0030, iter_time=6.94s]
Epoch 0: 2%|▏ | 289/12384 [36:57<25:33:41, 7.61s/it, loss=6.3976, acc=0.0030, iter_time=7.93s]
Epoch 0: 2%|▏ | 290/12384 [36:57<25:35:48, 7.62s/it, loss=6.3976, acc=0.0030, iter_time=7.93s]
Epoch 0: 2%|▏ | 290/12384 [37:05<25:35:48, 7.62s/it, loss=6.7188, acc=0.0074, iter_time=7.60s]
Epoch 0: 2%|▏ | 291/12384 [37:05<25:35:20, 7.62s/it, loss=6.7188, acc=0.0074, iter_time=7.60s]
Epoch 0: 2%|▏ | 291/12384 [37:13<25:35:20, 7.62s/it, loss=6.7773, acc=0.0036, iter_time=7.63s]
Epoch 0: 2%|▏ | 292/12384 [37:13<25:35:30, 7.62s/it, loss=6.7773, acc=0.0036, iter_time=7.63s]
Epoch 0: 2%|▏ | 292/12384 [37:20<25:35:30, 7.62s/it, loss=6.5078, acc=0.0038, iter_time=7.65s]
Epoch 0: 2%|▏ | 293/12384 [37:20<25:35:38, 7.62s/it, loss=6.5078, acc=0.0038, iter_time=7.65s]
Epoch 0: 2%|▏ | 293/12384 [37:28<25:35:38, 7.62s/it, loss=6.6936, acc=0.0027, iter_time=5.04s]
Epoch 0: 2%|▏ | 294/12384 [37:28<25:34:47, 7.62s/it, loss=6.6936, acc=0.0027, iter_time=5.04s]
Epoch 0: 2%|▏ | 294/12384 [37:35<25:34:47, 7.62s/it, loss=6.3950, acc=0.0052, iter_time=8.06s]
Epoch 0: 2%|▏ | 295/12384 [37:35<25:32:53, 7.61s/it, loss=6.3950, acc=0.0052, iter_time=8.06s]
Epoch 0: 2%|▏ | 295/12384 [37:43<25:32:53, 7.61s/it, loss=6.7578, acc=0.0028, iter_time=9.65s]
Epoch 0: 2%|▏ | 296/12384 [37:43<25:33:48, 7.61s/it, loss=6.7578, acc=0.0028, iter_time=9.65s]
Epoch 0: 2%|▏ | 296/12384 [37:51<25:33:48, 7.61s/it, loss=6.1198, acc=0.0040, iter_time=7.66s]
Epoch 0: 2%|▏ | 297/12384 [37:51<25:33:16, 7.61s/it, loss=6.1198, acc=0.0040, iter_time=7.66s]
Epoch 0: 2%|▏ | 297/12384 [37:59<25:33:16, 7.61s/it, loss=7.0963, acc=0.0038, iter_time=7.94s]
Epoch 0: 2%|▏ | 298/12384 [37:59<25:54:06, 7.72s/it, loss=7.0963, acc=0.0038, iter_time=7.94s]
Epoch 0: 2%|▏ | 298/12384 [38:06<25:54:06, 7.72s/it, loss=6.2475, acc=0.0037, iter_time=7.04s]
Epoch 0: 2%|▏ | 299/12384 [38:06<25:48:57, 7.69s/it, loss=6.2475, acc=0.0037, iter_time=7.04s]
Epoch 0: 2%|▏ | 299/12384 [38:14<25:48:57, 7.69s/it, loss=6.3536, acc=0.0050, iter_time=8.63s]
Epoch 0: 2%|▏ | 300/12384 [38:14<25:44:31, 7.67s/it, loss=6.3536, acc=0.0050, iter_time=8.63s]
Epoch 0: 2%|▏ | 300/12384 [38:21<25:44:31, 7.67s/it, loss=5.8288, acc=0.0066, iter_time=4.62s]
Epoch 0: 2%|▏ | 301/12384 [38:21<25:41:24, 7.65s/it, loss=5.8288, acc=0.0066, iter_time=4.62s]
Epoch 0: 2%|▏ | 301/12384 [38:29<25:41:24, 7.65s/it, loss=6.3084, acc=0.0032, iter_time=10.22s]
Epoch 0: 2%|▏ | 302/12384 [38:29<25:39:26, 7.64s/it, loss=6.3084, acc=0.0032, iter_time=10.22s]
Epoch 0: 2%|▏ | 302/12384 [38:37<25:39:26, 7.64s/it, loss=6.6379, acc=0.0032, iter_time=5.58s]
Epoch 0: 2%|▏ | 303/12384 [38:37<25:36:05, 7.63s/it, loss=6.6379, acc=0.0032, iter_time=5.58s]
Epoch 0: 2%|▏ | 303/12384 [38:44<25:36:05, 7.63s/it, loss=6.8155, acc=0.0037, iter_time=10.02s]
Epoch 0: 2%|▏ | 304/12384 [38:44<25:36:50, 7.63s/it, loss=6.8155, acc=0.0037, iter_time=10.02s]
Epoch 0: 2%|▏ | 304/12384 [38:52<25:36:50, 7.63s/it, loss=5.8002, acc=0.0080, iter_time=4.19s]
Epoch 0: 2%|▏ | 305/12384 [38:52<25:35:19, 7.63s/it, loss=5.8002, acc=0.0080, iter_time=4.19s]
Epoch 0: 2%|▏ | 305/12384 [39:00<25:35:19, 7.63s/it, loss=6.6646, acc=0.0053, iter_time=10.67s]
Epoch 0: 2%|▏ | 306/12384 [39:00<25:34:52, 7.62s/it, loss=6.6646, acc=0.0053, iter_time=10.67s]
Epoch 0: 2%|▏ | 306/12384 [39:07<25:34:52, 7.62s/it, loss=6.6740, acc=0.0038, iter_time=5.31s]
Epoch 0: 2%|▏ | 307/12384 [39:07<25:32:20, 7.61s/it, loss=6.6740, acc=0.0038, iter_time=5.31s]
Epoch 0: 2%|▏ | 307/12384 [39:15<25:32:20, 7.61s/it, loss=6.4498, acc=0.0060, iter_time=9.90s]
Epoch 0: 2%|▏ | 308/12384 [39:15<25:32:20, 7.61s/it, loss=6.4498, acc=0.0060, iter_time=9.90s]
Epoch 0: 2%|▏ | 308/12384 [39:22<25:32:20, 7.61s/it, loss=6.1424, acc=0.0047, iter_time=4.75s]
Epoch 0: 2%|▏ | 309/12384 [39:22<25:31:14, 7.61s/it, loss=6.1424, acc=0.0047, iter_time=4.75s]
Epoch 0: 2%|▏ | 309/12384 [39:30<25:31:14, 7.61s/it, loss=5.9922, acc=0.0045, iter_time=6.95s]
Epoch 0: 3%|▎ | 310/12384 [39:30<25:31:36, 7.61s/it, loss=5.9922, acc=0.0045, iter_time=6.95s]
Epoch 0: 3%|▎ | 310/12384 [39:38<25:31:36, 7.61s/it, loss=6.0709, acc=0.0058, iter_time=11.11s]
Epoch 0: 3%|▎ | 311/12384 [39:38<25:31:29, 7.61s/it, loss=6.0709, acc=0.0058, iter_time=11.11s]
Epoch 0: 3%|▎ | 311/12384 [39:45<25:31:29, 7.61s/it, loss=6.5126, acc=0.0035, iter_time=7.75s]
Epoch 0: 3%|▎ | 312/12384 [39:45<25:35:06, 7.63s/it, loss=6.5126, acc=0.0035, iter_time=7.75s]
Epoch 0: 3%|▎ | 312/12384 [39:53<25:35:06, 7.63s/it, loss=5.6130, acc=0.0070, iter_time=5.02s]
Epoch 0: 3%|▎ | 313/12384 [39:53<25:34:35, 7.63s/it, loss=5.6130, acc=0.0070, iter_time=5.02s]
Epoch 0: 3%|▎ | 313/12384 [40:01<25:34:35, 7.63s/it, loss=6.2546, acc=0.0051, iter_time=10.16s]
Epoch 0: 3%|▎ | 314/12384 [40:01<25:35:55, 7.64s/it, loss=6.2546, acc=0.0051, iter_time=10.16s]
Epoch 0: 3%|▎ | 314/12384 [40:08<25:35:55, 7.64s/it, loss=5.9705, acc=0.0077, iter_time=5.66s]
Epoch 0: 3%|▎ | 315/12384 [40:08<25:37:48, 7.65s/it, loss=5.9705, acc=0.0077, iter_time=5.66s]
Epoch 0: 3%|▎ | 315/12384 [40:16<25:37:48, 7.65s/it, loss=6.4452, acc=0.0053, iter_time=9.66s]
Epoch 0: 3%|▎ | 316/12384 [40:16<25:36:39, 7.64s/it, loss=6.4452, acc=0.0053, iter_time=9.66s]
Epoch 0: 3%|▎ | 316/12384 [40:23<25:36:39, 7.64s/it, loss=5.5123, acc=0.0078, iter_time=5.34s]
Epoch 0: 3%|▎ | 317/12384 [40:23<25:35:31, 7.64s/it, loss=5.5123, acc=0.0078, iter_time=5.34s]
Epoch 0: 3%|▎ | 317/12384 [40:31<25:35:31, 7.64s/it, loss=5.9085, acc=0.0053, iter_time=9.90s]
Epoch 0: 3%|▎ | 318/12384 [40:31<25:37:28, 7.65s/it, loss=5.9085, acc=0.0053, iter_time=9.90s]
Epoch 0: 3%|▎ | 318/12384 [40:39<25:37:28, 7.65s/it, loss=5.7049, acc=0.0059, iter_time=4.80s]
Epoch 0: 3%|▎ | 319/12384 [40:39<25:37:33, 7.65s/it, loss=5.7049, acc=0.0059, iter_time=4.80s]
Epoch 0: 3%|▎ | 319/12384 [40:46<25:37:33, 7.65s/it, loss=6.1760, acc=0.0074, iter_time=10.51s]
Epoch 0: 3%|▎ | 320/12384 [40:46<25:37:15, 7.65s/it, loss=6.1760, acc=0.0074, iter_time=10.51s]
Epoch 0: 3%|▎ | 320/12384 [40:54<25:37:15, 7.65s/it, loss=5.7460, acc=0.0067, iter_time=7.68s]
Epoch 0: 3%|▎ | 321/12384 [40:54<25:35:53, 7.64s/it, loss=5.7460, acc=0.0067, iter_time=7.68s]
Epoch 0: 3%|▎ | 321/12384 [41:02<25:35:53, 7.64s/it, loss=5.8593, acc=0.0101, iter_time=4.79s]
Epoch 0: 3%|▎ | 322/12384 [41:02<25:32:30, 7.62s/it, loss=5.8593, acc=0.0101, iter_time=4.79s]
Epoch 0: 3%|▎ | 322/12384 [41:09<25:32:30, 7.62s/it, loss=6.2380, acc=0.0057, iter_time=10.39s]
Epoch 0: 3%|▎ | 323/12384 [41:09<25:31:45, 7.62s/it, loss=6.2380, acc=0.0057, iter_time=10.39s]
Epoch 0: 3%|▎ | 323/12384 [41:17<25:31:45, 7.62s/it, loss=5.9155, acc=0.0102, iter_time=7.32s]
Epoch 0: 3%|▎ | 324/12384 [41:17<25:33:00, 7.63s/it, loss=5.9155, acc=0.0102, iter_time=7.32s]
Epoch 0: 3%|▎ | 324/12384 [41:25<25:33:00, 7.63s/it, loss=5.6637, acc=0.0062, iter_time=8.30s]
Epoch 0: 3%|▎ | 325/12384 [41:25<25:52:25, 7.72s/it, loss=5.6637, acc=0.0062, iter_time=8.30s]
Epoch 0: 3%|▎ | 325/12384 [41:32<25:52:25, 7.72s/it, loss=5.8483, acc=0.0070, iter_time=7.61s]
Epoch 0: 3%|▎ | 326/12384 [41:32<25:45:57, 7.69s/it, loss=5.8483, acc=0.0070, iter_time=7.61s]
Epoch 0: 3%|▎ | 326/12384 [41:40<25:45:57, 7.69s/it, loss=5.6499, acc=0.0069, iter_time=7.61s]
Epoch 0: 3%|▎ | 327/12384 [41:40<25:41:30, 7.67s/it, loss=5.6499, acc=0.0069, iter_time=7.61s]
Epoch 0: 3%|▎ | 327/12384 [41:48<25:41:30, 7.67s/it, loss=5.8533, acc=0.0057, iter_time=8.03s]
Epoch 0: 3%|▎ | 328/12384 [41:48<25:37:56, 7.65s/it, loss=5.8533, acc=0.0057, iter_time=8.03s]
Epoch 0: 3%|▎ | 328/12384 [41:55<25:37:56, 7.65s/it, loss=5.3488, acc=0.0093, iter_time=7.21s]
Epoch 0: 3%|▎ | 329/12384 [41:55<25:37:23, 7.65s/it, loss=5.3488, acc=0.0093, iter_time=7.21s]
Epoch 0: 3%|▎ | 329/12384 [42:03<25:37:23, 7.65s/it, loss=5.3455, acc=0.0087, iter_time=7.66s]
Epoch 0: 3%|▎ | 330/12384 [42:03<25:34:46, 7.64s/it, loss=5.3455, acc=0.0087, iter_time=7.66s]
Epoch 0: 3%|▎ | 330/12384 [42:11<25:34:46, 7.64s/it, loss=5.8478, acc=0.0066, iter_time=7.60s]
Epoch 0: 3%|▎ | 331/12384 [42:11<25:31:43, 7.62s/it, loss=5.8478, acc=0.0066, iter_time=7.60s]
Epoch 0: 3%|▎ | 331/12384 [42:18<25:31:43, 7.62s/it, loss=5.9462, acc=0.0068, iter_time=7.60s]
Epoch 0: 3%|▎ | 332/12384 [42:18<25:30:13, 7.62s/it, loss=5.9462, acc=0.0068, iter_time=7.60s]
Epoch 0: 3%|▎ | 332/12384 [42:26<25:30:13, 7.62s/it, loss=5.4071, acc=0.0106, iter_time=7.62s]
Epoch 0: 3%|▎ | 333/12384 [42:26<25:31:03, 7.62s/it, loss=5.4071, acc=0.0106, iter_time=7.62s]
Epoch 0: 3%|▎ | 333/12384 [42:33<25:31:03, 7.62s/it, loss=5.3136, acc=0.0103, iter_time=5.01s]
Epoch 0: 3%|▎ | 334/12384 [42:33<25:31:28, 7.63s/it, loss=5.3136, acc=0.0103, iter_time=5.01s]
Epoch 0: 3%|▎ | 334/12384 [42:41<25:31:28, 7.63s/it, loss=5.3291, acc=0.0075, iter_time=10.24s]
Epoch 0: 3%|▎ | 335/12384 [42:41<25:30:20, 7.62s/it, loss=5.3291, acc=0.0075, iter_time=10.24s]
Epoch 0: 3%|▎ | 335/12384 [42:49<25:30:20, 7.62s/it, loss=5.7864, acc=0.0084, iter_time=8.02s]
Epoch 0: 3%|▎ | 336/12384 [42:49<25:30:32, 7.62s/it, loss=5.7864, acc=0.0084, iter_time=8.02s]
Epoch 0: 3%|▎ | 336/12384 [42:56<25:30:32, 7.62s/it, loss=5.7995, acc=0.0072, iter_time=7.22s]
Epoch 0: 3%|▎ | 337/12384 [42:56<25:35:12, 7.65s/it, loss=5.7995, acc=0.0072, iter_time=7.22s]
Epoch 0: 3%|▎ | 337/12384 [43:04<25:35:12, 7.65s/it, loss=6.0975, acc=0.0071, iter_time=7.70s]
Epoch 0: 3%|▎ | 338/12384 [43:04<25:37:02, 7.66s/it, loss=6.0975, acc=0.0071, iter_time=7.70s]
Epoch 0: 3%|▎ | 338/12384 [43:12<25:37:02, 7.66s/it, loss=5.6665, acc=0.0068, iter_time=7.70s]
Epoch 0: 3%|▎ | 339/12384 [43:12<25:35:07, 7.65s/it, loss=5.6665, acc=0.0068, iter_time=7.70s]
Epoch 0: 3%|▎ | 339/12384 [43:19<25:35:07, 7.65s/it, loss=5.7335, acc=0.0093, iter_time=5.84s]
Epoch 0: 3%|▎ | 340/12384 [43:19<25:34:28, 7.64s/it, loss=5.7335, acc=0.0093, iter_time=5.84s]
Epoch 0: 3%|▎ | 340/12384 [43:27<25:34:28, 7.64s/it, loss=5.4921, acc=0.0104, iter_time=9.40s]
Epoch 0: 3%|▎ | 341/12384 [43:27<25:33:24, 7.64s/it, loss=5.4921, acc=0.0104, iter_time=9.40s]
Epoch 0: 3%|▎ | 341/12384 [43:35<25:33:24, 7.64s/it, loss=5.7705, acc=0.0058, iter_time=7.65s]
Epoch 0: 3%|▎ | 342/12384 [43:35<25:34:18, 7.64s/it, loss=5.7705, acc=0.0058, iter_time=7.65s]
Epoch 0: 3%|▎ | 342/12384 [43:42<25:34:18, 7.64s/it, loss=5.6818, acc=0.0080, iter_time=7.65s]
Epoch 0: 3%|▎ | 343/12384 [43:42<25:32:12, 7.63s/it, loss=5.6818, acc=0.0080, iter_time=7.65s]
Epoch 0: 3%|▎ | 343/12384 [43:50<25:32:12, 7.63s/it, loss=5.4836, acc=0.0111, iter_time=7.99s]
Epoch 0: 3%|▎ | 344/12384 [43:50<25:29:46, 7.62s/it, loss=5.4836, acc=0.0111, iter_time=7.99s]
Epoch 0: 3%|▎ | 344/12384 [43:57<25:29:46, 7.62s/it, loss=5.6669, acc=0.0124, iter_time=7.21s]
Epoch 0: 3%|▎ | 345/12384 [43:57<25:30:59, 7.63s/it, loss=5.6669, acc=0.0124, iter_time=7.21s]
Epoch 0: 3%|▎ | 345/12384 [44:05<25:30:59, 7.63s/it, loss=5.4490, acc=0.0080, iter_time=7.65s]
Epoch 0: 3%|▎ | 346/12384 [44:05<25:29:32, 7.62s/it, loss=5.4490, acc=0.0080, iter_time=7.65s]
Epoch 0: 3%|▎ | 346/12384 [44:13<25:29:32, 7.62s/it, loss=5.3377, acc=0.0114, iter_time=7.63s]
Epoch 0: 3%|▎ | 347/12384 [44:13<25:29:05, 7.62s/it, loss=5.3377, acc=0.0114, iter_time=7.63s]
Epoch 0: 3%|▎ | 347/12384 [44:20<25:29:05, 7.62s/it, loss=5.9492, acc=0.0055, iter_time=7.61s]
Epoch 0: 3%|▎ | 348/12384 [44:20<25:28:33, 7.62s/it, loss=5.9492, acc=0.0055, iter_time=7.61s]
Epoch 0: 3%|▎ | 348/12384 [44:28<25:28:33, 7.62s/it, loss=5.5126, acc=0.0067, iter_time=7.59s]
Epoch 0: 3%|▎ | 349/12384 [44:28<25:26:54, 7.61s/it, loss=5.5126, acc=0.0067, iter_time=7.59s]
Epoch 0: 3%|▎ | 349/12384 [44:35<25:26:54, 7.61s/it, loss=5.4042, acc=0.0112, iter_time=8.00s]
Epoch 0: 3%|▎ | 350/12384 [44:35<25:26:16, 7.61s/it, loss=5.4042, acc=0.0112, iter_time=8.00s]
Epoch 0: 3%|▎ | 350/12384 [44:43<25:26:16, 7.61s/it, loss=5.0055, acc=0.0098, iter_time=7.59s]
Epoch 0: 3%|▎ | 351/12384 [44:43<25:49:19, 7.73s/it, loss=5.0055, acc=0.0098, iter_time=7.59s]
Epoch 0: 3%|▎ | 351/12384 [44:51<25:49:19, 7.73s/it, loss=4.9367, acc=0.0127, iter_time=7.55s]
Epoch 0: 3%|▎ | 352/12384 [44:51<25:41:34, 7.69s/it, loss=4.9367, acc=0.0127, iter_time=7.55s]
Epoch 0: 3%|▎ | 352/12384 [44:59<25:41:34, 7.69s/it, loss=5.2550, acc=0.0144, iter_time=7.68s]
Epoch 0: 3%|▎ | 353/12384 [44:59<25:37:18, 7.67s/it, loss=5.2550, acc=0.0144, iter_time=7.68s]
Epoch 0: 3%|▎ | 353/12384 [45:06<25:37:18, 7.67s/it, loss=4.6456, acc=0.0174, iter_time=7.61s]
Epoch 0: 3%|▎ | 354/12384 [45:06<25:33:35, 7.65s/it, loss=4.6456, acc=0.0174, iter_time=7.61s]
Epoch 0: 3%|▎ | 354/12384 [45:14<25:33:35, 7.65s/it, loss=4.7150, acc=0.0128, iter_time=7.60s]
Epoch 0: 3%|▎ | 355/12384 [45:14<25:33:30, 7.65s/it, loss=4.7150, acc=0.0128, iter_time=7.60s]
Epoch 0: 3%|▎ | 355/12384 [45:22<25:33:30, 7.65s/it, loss=5.1594, acc=0.0104, iter_time=3.61s]
Epoch 0: 3%|▎ | 356/12384 [45:22<25:37:23, 7.67s/it, loss=5.1594, acc=0.0104, iter_time=3.61s]
Epoch 0: 3%|▎ | 356/12384 [45:29<25:37:23, 7.67s/it, loss=5.1750, acc=0.0101, iter_time=11.74s]
Epoch 0: 3%|▎ | 357/12384 [45:29<25:33:23, 7.65s/it, loss=5.1750, acc=0.0101, iter_time=11.74s]
Epoch 0: 3%|▎ | 357/12384 [45:37<25:33:23, 7.65s/it, loss=5.2103, acc=0.0132, iter_time=7.60s]
Epoch 0: 3%|▎ | 358/12384 [45:37<25:31:17, 7.64s/it, loss=5.2103, acc=0.0132, iter_time=7.60s]
Epoch 0: 3%|▎ | 358/12384 [45:45<25:31:17, 7.64s/it, loss=5.5444, acc=0.0121, iter_time=7.68s]
Epoch 0: 3%|▎ | 359/12384 [45:45<25:31:53, 7.64s/it, loss=5.5444, acc=0.0121, iter_time=7.68s]
Epoch 0: 3%|▎ | 359/12384 [45:52<25:31:53, 7.64s/it, loss=4.6944, acc=0.0179, iter_time=7.55s]
Epoch 0: 3%|▎ | 360/12384 [45:52<25:29:21, 7.63s/it, loss=4.6944, acc=0.0179, iter_time=7.55s]
Epoch 0: 3%|▎ | 360/12384 [46:00<25:29:21, 7.63s/it, loss=5.2815, acc=0.0146, iter_time=7.65s]
Epoch 0: 3%|▎ | 361/12384 [46:00<25:26:45, 7.62s/it, loss=5.2815, acc=0.0146, iter_time=7.65s]
Epoch 0: 3%|▎ | 361/12384 [46:07<25:26:45, 7.62s/it, loss=4.4691, acc=0.0205, iter_time=5.53s]
Epoch 0: 3%|▎ | 362/12384 [46:07<25:27:31, 7.62s/it, loss=4.4691, acc=0.0205, iter_time=5.53s]
Epoch 0: 3%|▎ | 362/12384 [46:15<25:27:31, 7.62s/it, loss=4.8074, acc=0.0239, iter_time=9.72s]
Epoch 0: 3%|▎ | 363/12384 [46:15<25:28:06, 7.63s/it, loss=4.8074, acc=0.0239, iter_time=9.72s]
Epoch 0: 3%|▎ | 363/12384 [46:23<25:28:06, 7.63s/it, loss=4.4950, acc=0.0185, iter_time=7.63s]
Epoch 0: 3%|▎ | 364/12384 [46:23<25:28:08, 7.63s/it, loss=4.4950, acc=0.0185, iter_time=7.63s]
Epoch 0: 3%|▎ | 364/12384 [46:30<25:28:08, 7.63s/it, loss=5.0366, acc=0.0109, iter_time=7.66s]
Epoch 0: 3%|▎ | 365/12384 [46:30<25:28:06, 7.63s/it, loss=5.0366, acc=0.0109, iter_time=7.66s]
Epoch 0: 3%|▎ | 365/12384 [46:38<25:28:06, 7.63s/it, loss=4.6967, acc=0.0150, iter_time=7.63s]
Epoch 0: 3%|▎ | 366/12384 [46:38<25:30:47, 7.64s/it, loss=4.6967, acc=0.0150, iter_time=7.63s]
Epoch 0: 3%|▎ | 366/12384 [46:46<25:30:47, 7.64s/it, loss=4.7908, acc=0.0161, iter_time=7.66s]
Epoch 0: 3%|▎ | 367/12384 [46:46<25:29:06, 7.63s/it, loss=4.7908, acc=0.0161, iter_time=7.66s]
Epoch 0: 3%|▎ | 367/12384 [46:53<25:29:06, 7.63s/it, loss=4.8590, acc=0.0198, iter_time=7.55s]
Epoch 0: 3%|▎ | 368/12384 [46:53<25:27:24, 7.63s/it, loss=4.8590, acc=0.0198, iter_time=7.55s]
Epoch 0: 3%|▎ | 368/12384 [47:01<25:27:24, 7.63s/it, loss=4.6134, acc=0.0147, iter_time=7.65s]
Epoch 0: 3%|▎ | 369/12384 [47:01<25:27:43, 7.63s/it, loss=4.6134, acc=0.0147, iter_time=7.65s]
Epoch 0: 3%|▎ | 369/12384 [47:08<25:27:43, 7.63s/it, loss=4.9901, acc=0.0128, iter_time=7.63s]
Epoch 0: 3%|▎ | 370/12384 [47:08<25:26:37, 7.62s/it, loss=4.9901, acc=0.0128, iter_time=7.63s]
Epoch 0: 3%|▎ | 370/12384 [47:16<25:26:37, 7.62s/it, loss=4.8866, acc=0.0132, iter_time=7.64s]
Epoch 0: 3%|▎ | 371/12384 [47:16<25:25:57, 7.62s/it, loss=4.8866, acc=0.0132, iter_time=7.64s]
Epoch 0: 3%|▎ | 371/12384 [47:24<25:25:57, 7.62s/it, loss=4.9946, acc=0.0124, iter_time=7.61s]
Epoch 0: 3%|▎ | 372/12384 [47:24<25:24:57, 7.62s/it, loss=4.9946, acc=0.0124, iter_time=7.61s]
Epoch 0: 3%|▎ | 372/12384 [47:31<25:24:57, 7.62s/it, loss=4.9886, acc=0.0133, iter_time=7.63s]
Epoch 0: 3%|▎ | 373/12384 [47:31<25:25:41, 7.62s/it, loss=4.9886, acc=0.0133, iter_time=7.63s]
Epoch 0: 3%|▎ | 373/12384 [47:39<25:25:41, 7.62s/it, loss=4.7238, acc=0.0206, iter_time=4.29s]
Epoch 0: 3%|▎ | 374/12384 [47:39<25:25:52, 7.62s/it, loss=4.7238, acc=0.0206, iter_time=4.29s]
Epoch 0: 3%|▎ | 374/12384 [47:47<25:25:52, 7.62s/it, loss=5.1229, acc=0.0122, iter_time=10.95s]
Epoch 0: 3%|▎ | 375/12384 [47:47<25:27:39, 7.63s/it, loss=5.1229, acc=0.0122, iter_time=10.95s]
Epoch 0: 3%|▎ | 375/12384 [47:54<25:27:39, 7.63s/it, loss=5.1174, acc=0.0135, iter_time=8.04s]
Epoch 0: 3%|▎ | 376/12384 [47:54<25:27:22, 7.63s/it, loss=5.1174, acc=0.0135, iter_time=8.04s]
Epoch 0: 3%|▎ | 376/12384 [48:02<25:27:22, 7.63s/it, loss=5.0234, acc=0.0115, iter_time=7.55s]
Epoch 0: 3%|▎ | 377/12384 [48:02<25:44:43, 7.72s/it, loss=5.0234, acc=0.0115, iter_time=7.55s]
Epoch 0: 3%|▎ | 377/12384 [48:10<25:44:43, 7.72s/it, loss=4.2413, acc=0.0260, iter_time=4.33s]
Epoch 0: 3%|▎ | 378/12384 [48:10<25:36:09, 7.68s/it, loss=4.2413, acc=0.0260, iter_time=4.33s]
Epoch 0: 3%|▎ | 378/12384 [48:17<25:36:09, 7.68s/it, loss=4.5985, acc=0.0186, iter_time=10.21s]
Epoch 0: 3%|▎ | 379/12384 [48:17<25:34:08, 7.67s/it, loss=4.5985, acc=0.0186, iter_time=10.21s]
Epoch 0: 3%|▎ | 379/12384 [48:25<25:34:08, 7.67s/it, loss=5.0600, acc=0.0156, iter_time=7.41s]
Epoch 0: 3%|▎ | 380/12384 [48:25<25:30:53, 7.65s/it, loss=5.0600, acc=0.0156, iter_time=7.41s]
Epoch 0: 3%|▎ | 380/12384 [48:33<25:30:53, 7.65s/it, loss=4.7221, acc=0.0148, iter_time=8.50s]
Epoch 0: 3%|▎ | 381/12384 [48:33<25:29:00, 7.64s/it, loss=4.7221, acc=0.0148, iter_time=8.50s]
Epoch 0: 3%|▎ | 381/12384 [48:40<25:29:00, 7.64s/it, loss=4.8478, acc=0.0155, iter_time=7.61s]
Epoch 0: 3%|▎ | 382/12384 [48:40<25:27:40, 7.64s/it, loss=4.8478, acc=0.0155, iter_time=7.61s]
Epoch 0: 3%|▎ | 382/12384 [48:48<25:27:40, 7.64s/it, loss=4.2736, acc=0.0191, iter_time=7.62s]
Epoch 0: 3%|▎ | 383/12384 [48:48<25:27:55, 7.64s/it, loss=4.2736, acc=0.0191, iter_time=7.62s]
Epoch 0: 3%|▎ | 383/12384 [48:55<25:27:55, 7.64s/it, loss=4.7019, acc=0.0203, iter_time=8.04s]
Epoch 0: 3%|▎ | 384/12384 [48:55<25:25:58, 7.63s/it, loss=4.7019, acc=0.0203, iter_time=8.04s]
Epoch 0: 3%|▎ | 384/12384 [49:03<25:25:58, 7.63s/it, loss=4.2788, acc=0.0248, iter_time=7.28s]
Epoch 0: 3%|▎ | 385/12384 [49:03<25:28:41, 7.64s/it, loss=4.2788, acc=0.0248, iter_time=7.28s]
Epoch 0: 3%|▎ | 385/12384 [49:11<25:28:41, 7.64s/it, loss=4.4542, acc=0.0242, iter_time=7.61s]
Epoch 0: 3%|▎ | 386/12384 [49:11<25:26:02, 7.63s/it, loss=4.4542, acc=0.0242, iter_time=7.61s]
Epoch 0: 3%|▎ | 386/12384 [49:18<25:26:02, 7.63s/it, loss=4.2838, acc=0.0280, iter_time=6.74s]
Epoch 0: 3%|▎ | 387/12384 [49:18<25:24:25, 7.62s/it, loss=4.2838, acc=0.0280, iter_time=6.74s]
Epoch 0: 3%|▎ | 387/12384 [49:26<25:24:25, 7.62s/it, loss=4.1713, acc=0.0223, iter_time=8.47s]
Epoch 0: 3%|▎ | 388/12384 [49:26<25:25:46, 7.63s/it, loss=4.1713, acc=0.0223, iter_time=8.47s]
Epoch 0: 3%|▎ | 388/12384 [49:34<25:25:46, 7.63s/it, loss=4.2651, acc=0.0206, iter_time=7.65s]
Epoch 0: 3%|▎ | 389/12384 [49:34<25:30:41, 7.66s/it, loss=4.2651, acc=0.0206, iter_time=7.65s]
Epoch 0: 3%|▎ | 389/12384 [49:41<25:30:41, 7.66s/it, loss=4.3558, acc=0.0296, iter_time=7.42s]
Epoch 0: 3%|▎ | 390/12384 [49:41<25:26:14, 7.64s/it, loss=4.3558, acc=0.0296, iter_time=7.42s]
Epoch 0: 3%|▎ | 390/12384 [49:49<25:26:14, 7.64s/it, loss=4.5466, acc=0.0197, iter_time=7.89s]
Epoch 0: 3%|▎ | 391/12384 [49:49<25:24:47, 7.63s/it, loss=4.5466, acc=0.0197, iter_time=7.89s]
Epoch 0: 3%|▎ | 391/12384 [49:56<25:24:47, 7.63s/it, loss=4.4060, acc=0.0168, iter_time=8.00s]
Epoch 0: 3%|▎ | 392/12384 [49:56<25:25:04, 7.63s/it, loss=4.4060, acc=0.0168, iter_time=8.00s]
Epoch 0: 3%|▎ | 392/12384 [50:04<25:25:04, 7.63s/it, loss=4.1032, acc=0.0200, iter_time=7.24s]
Epoch 0: 3%|▎ | 393/12384 [50:04<25:23:56, 7.63s/it, loss=4.1032, acc=0.0200, iter_time=7.24s]
Epoch 0: 3%|▎ | 393/12384 [50:12<25:23:56, 7.63s/it, loss=4.2513, acc=0.0246, iter_time=6.80s]
Epoch 0: 3%|▎ | 394/12384 [50:12<25:24:57, 7.63s/it, loss=4.2513, acc=0.0246, iter_time=6.80s]
Epoch 0: 3%|▎ | 394/12384 [50:19<25:24:57, 7.63s/it, loss=4.0354, acc=0.0292, iter_time=5.42s]
Epoch 0: 3%|▎ | 395/12384 [50:19<25:26:21, 7.64s/it, loss=4.0354, acc=0.0292, iter_time=5.42s]
Epoch 0: 3%|▎ | 395/12384 [50:27<25:26:21, 7.64s/it, loss=4.0350, acc=0.0261, iter_time=10.70s]
Epoch 0: 3%|▎ | 396/12384 [50:27<25:25:40, 7.64s/it, loss=4.0350, acc=0.0261, iter_time=10.70s]
Epoch 0: 3%|▎ | 396/12384 [50:35<25:25:40, 7.64s/it, loss=3.8220, acc=0.0275, iter_time=7.60s]
Epoch 0: 3%|▎ | 397/12384 [50:35<25:22:25, 7.62s/it, loss=3.8220, acc=0.0275, iter_time=7.60s]
Epoch 0: 3%|▎ | 397/12384 [50:42<25:22:25, 7.62s/it, loss=4.3688, acc=0.0204, iter_time=7.62s]
Epoch 0: 3%|▎ | 398/12384 [50:42<25:24:10, 7.63s/it, loss=4.3688, acc=0.0204, iter_time=7.62s]
Epoch 0: 3%|▎ | 398/12384 [50:50<25:24:10, 7.63s/it, loss=3.7476, acc=0.0247, iter_time=6.44s]
Epoch 0: 3%|▎ | 399/12384 [50:50<25:21:44, 7.62s/it, loss=3.7476, acc=0.0247, iter_time=6.44s]
Epoch 0: 3%|▎ | 399/12384 [50:57<25:21:44, 7.62s/it, loss=4.3552, acc=0.0242, iter_time=9.19s]
Epoch 0: 3%|▎ | 400/12384 [50:57<25:21:01, 7.62s/it, loss=4.3552, acc=0.0242, iter_time=9.19s]
Epoch 0: 3%|▎ | 400/12384 [51:05<25:21:01, 7.62s/it, loss=3.7937, acc=0.0266, iter_time=7.19s]
Epoch 0: 3%|▎ | 401/12384 [51:05<25:19:33, 7.61s/it, loss=3.7937, acc=0.0266, iter_time=7.19s]
Epoch 0: 3%|▎ | 401/12384 [51:13<25:19:33, 7.61s/it, loss=4.2323, acc=0.0224, iter_time=7.61s]
Epoch 0: 3%|▎ | 402/12384 [51:13<25:20:13, 7.61s/it, loss=4.2323, acc=0.0224, iter_time=7.61s]
Epoch 0: 3%|▎ | 402/12384 [51:21<25:20:13, 7.61s/it, loss=3.9382, acc=0.0295, iter_time=7.98s]
Epoch 0: 3%|▎ | 403/12384 [51:21<25:40:52, 7.72s/it, loss=3.9382, acc=0.0295, iter_time=7.98s]
Epoch 0: 3%|▎ | 403/12384 [51:28<25:40:52, 7.72s/it, loss=4.2452, acc=0.0229, iter_time=6.69s]
Epoch 0: 3%|▎ | 404/12384 [51:28<25:36:10, 7.69s/it, loss=4.2452, acc=0.0229, iter_time=6.69s]
Epoch 0: 3%|▎ | 404/12384 [51:36<25:36:10, 7.69s/it, loss=3.7493, acc=0.0288, iter_time=7.10s]
Epoch 0: 3%|▎ | 405/12384 [51:36<25:35:10, 7.69s/it, loss=3.7493, acc=0.0288, iter_time=7.10s]
Epoch 0: 3%|▎ | 405/12384 [51:44<25:35:10, 7.69s/it, loss=3.5714, acc=0.0382, iter_time=7.12s]
Epoch 0: 3%|▎ | 406/12384 [51:44<25:30:21, 7.67s/it, loss=3.5714, acc=0.0382, iter_time=7.12s]
Epoch 0: 3%|▎ | 406/12384 [51:51<25:30:21, 7.67s/it, loss=4.2235, acc=0.0191, iter_time=9.62s]
Epoch 0: 3%|▎ | 407/12384 [51:51<25:28:42, 7.66s/it, loss=4.2235, acc=0.0191, iter_time=9.62s]
Epoch 0: 3%|▎ | 407/12384 [51:59<25:28:42, 7.66s/it, loss=3.8109, acc=0.0302, iter_time=8.02s]
Epoch 0: 3%|▎ | 408/12384 [51:59<25:27:07, 7.65s/it, loss=3.8109, acc=0.0302, iter_time=8.02s]
Epoch 0: 3%|▎ | 408/12384 [52:06<25:27:07, 7.65s/it, loss=3.6993, acc=0.0338, iter_time=7.24s]
Epoch 0: 3%|▎ | 409/12384 [52:06<25:24:56, 7.64s/it, loss=3.6993, acc=0.0338, iter_time=7.24s]
Epoch 0: 3%|▎ | 409/12384 [52:14<25:24:56, 7.64s/it, loss=3.5757, acc=0.0314, iter_time=7.63s]
Epoch 0: 3%|▎ | 410/12384 [52:14<25:29:17, 7.66s/it, loss=3.5757, acc=0.0314, iter_time=7.63s]
Epoch 0: 3%|▎ | 410/12384 [52:22<25:29:17, 7.66s/it, loss=3.8747, acc=0.0277, iter_time=7.71s]
Epoch 0: 3%|▎ | 411/12384 [52:22<25:28:27, 7.66s/it, loss=3.8747, acc=0.0277, iter_time=7.71s]
Epoch 0: 3%|▎ | 411/12384 [52:29<25:28:27, 7.66s/it, loss=3.5088, acc=0.0345, iter_time=7.07s]
Epoch 0: 3%|▎ | 412/12384 [52:29<25:27:59, 7.66s/it, loss=3.5088, acc=0.0345, iter_time=7.07s]
Epoch 0: 3%|▎ | 412/12384 [52:37<25:27:59, 7.66s/it, loss=3.2465, acc=0.0367, iter_time=4.62s]
Epoch 0: 3%|▎ | 413/12384 [52:37<25:24:32, 7.64s/it, loss=3.2465, acc=0.0367, iter_time=4.62s]
Epoch 0: 3%|▎ | 413/12384 [52:45<25:24:32, 7.64s/it, loss=2.8895, acc=0.0576, iter_time=8.37s]
Epoch 0: 3%|▎ | 414/12384 [52:45<25:23:05, 7.63s/it, loss=2.8895, acc=0.0576, iter_time=8.37s]
Epoch 0: 3%|▎ | 414/12384 [52:52<25:23:05, 7.63s/it, loss=3.6638, acc=0.0276, iter_time=10.47s]
Epoch 0: 3%|▎ | 415/12384 [52:52<25:20:43, 7.62s/it, loss=3.6638, acc=0.0276, iter_time=10.47s]
Epoch 0: 3%|▎ | 415/12384 [53:00<25:20:43, 7.62s/it, loss=3.8815, acc=0.0317, iter_time=7.99s]
Epoch 0: 3%|▎ | 416/12384 [53:00<25:21:52, 7.63s/it, loss=3.8815, acc=0.0317, iter_time=7.99s]
Epoch 0: 3%|▎ | 416/12384 [53:08<25:21:52, 7.63s/it, loss=3.2567, acc=0.0427, iter_time=4.48s]
Epoch 0: 3%|▎ | 417/12384 [53:08<25:24:43, 7.64s/it, loss=3.2567, acc=0.0427, iter_time=4.48s]
Epoch 0: 3%|▎ | 417/12384 [53:15<25:24:43, 7.64s/it, loss=3.5078, acc=0.0293, iter_time=10.46s]
Epoch 0: 3%|▎ | 418/12384 [53:15<25:27:19, 7.66s/it, loss=3.5078, acc=0.0293, iter_time=10.46s]
Epoch 0: 3%|▎ | 418/12384 [53:23<25:27:19, 7.66s/it, loss=3.0900, acc=0.0372, iter_time=7.68s]
Epoch 0: 3%|▎ | 419/12384 [53:23<25:25:13, 7.65s/it, loss=3.0900, acc=0.0372, iter_time=7.68s]
Epoch 0: 3%|▎ | 419/12384 [53:31<25:25:13, 7.65s/it, loss=3.4927, acc=0.0377, iter_time=7.65s]
Epoch 0: 3%|▎ | 420/12384 [53:31<25:24:40, 7.65s/it, loss=3.4927, acc=0.0377, iter_time=7.65s]
Epoch 0: 3%|▎ | 420/12384 [53:38<25:24:40, 7.65s/it, loss=3.4465, acc=0.0396, iter_time=7.65s]
Epoch 0: 3%|▎ | 421/12384 [53:38<25:23:32, 7.64s/it, loss=3.4465, acc=0.0396, iter_time=7.65s]
Epoch 0: 3%|▎ | 421/12384 [53:46<25:23:32, 7.64s/it, loss=3.3145, acc=0.0347, iter_time=7.60s]
Epoch 0: 3%|▎ | 422/12384 [53:46<25:20:53, 7.63s/it, loss=3.3145, acc=0.0347, iter_time=7.60s]
Epoch 0: 3%|▎ | 422/12384 [53:53<25:20:53, 7.63s/it, loss=3.3241, acc=0.0352, iter_time=6.65s]
Epoch 0: 3%|▎ | 423/12384 [53:53<25:20:29, 7.63s/it, loss=3.3241, acc=0.0352, iter_time=6.65s]
Epoch 0: 3%|▎ | 423/12384 [54:01<25:20:29, 7.63s/it, loss=3.2751, acc=0.0368, iter_time=8.55s]
Epoch 0: 3%|▎ | 424/12384 [54:01<25:21:08, 7.63s/it, loss=3.2751, acc=0.0368, iter_time=8.55s]
Epoch 0: 3%|▎ | 424/12384 [54:09<25:21:08, 7.63s/it, loss=3.0368, acc=0.0447, iter_time=7.64s]
Epoch 0: 3%|▎ | 425/12384 [54:09<25:20:16, 7.63s/it, loss=3.0368, acc=0.0447, iter_time=7.64s]
Epoch 0: 3%|▎ | 425/12384 [54:16<25:20:16, 7.63s/it, loss=3.0443, acc=0.0398, iter_time=7.65s]
Epoch 0: 3%|▎ | 426/12384 [54:16<25:21:23, 7.63s/it, loss=3.0443, acc=0.0398, iter_time=7.65s]
Epoch 0: 3%|▎ | 426/12384 [54:24<25:21:23, 7.63s/it, loss=3.2301, acc=0.0384, iter_time=7.73s]
Epoch 0: 3%|▎ | 427/12384 [54:24<25:25:29, 7.65s/it, loss=3.2301, acc=0.0384, iter_time=7.73s]
Epoch 0: 3%|▎ | 427/12384 [54:32<25:25:29, 7.65s/it, loss=3.2365, acc=0.0331, iter_time=7.62s]
Epoch 0: 3%|▎ | 428/12384 [54:32<25:22:52, 7.64s/it, loss=3.2365, acc=0.0331, iter_time=7.62s]
Epoch 0: 3%|▎ | 428/12384 [54:40<25:22:52, 7.64s/it, loss=3.1299, acc=0.0454, iter_time=5.61s]
Epoch 0: 3%|▎ | 429/12384 [54:40<25:41:59, 7.74s/it, loss=3.1299, acc=0.0454, iter_time=5.61s]
Epoch 0: 3%|▎ | 429/12384 [54:47<25:41:59, 7.74s/it, loss=2.9860, acc=0.0458, iter_time=9.94s]
Epoch 0: 3%|▎ | 430/12384 [54:47<25:34:39, 7.70s/it, loss=2.9860, acc=0.0458, iter_time=9.94s]
Epoch 0: 3%|▎ | 430/12384 [54:55<25:34:39, 7.70s/it, loss=3.1382, acc=0.0419, iter_time=7.63s]
Epoch 0: 3%|▎ | 431/12384 [54:55<25:32:47, 7.69s/it, loss=3.1382, acc=0.0419, iter_time=7.63s]
Epoch 0: 3%|▎ | 431/12384 [55:03<25:32:47, 7.69s/it, loss=3.2816, acc=0.0410, iter_time=8.05s]
Epoch 0: 3%|▎ | 432/12384 [55:03<25:28:53, 7.68s/it, loss=3.2816, acc=0.0410, iter_time=8.05s]
Epoch 0: 3%|▎ | 432/12384 [55:10<25:28:53, 7.68s/it, loss=3.0645, acc=0.0497, iter_time=7.25s]
Epoch 0: 3%|▎ | 433/12384 [55:10<25:26:43, 7.66s/it, loss=3.0645, acc=0.0497, iter_time=7.25s]
Epoch 0: 3%|▎ | 433/12384 [55:18<25:26:43, 7.66s/it, loss=3.4913, acc=0.0414, iter_time=7.67s]
Epoch 0: 4%|▎ | 434/12384 [55:18<25:23:56, 7.65s/it, loss=3.4913, acc=0.0414, iter_time=7.67s]
Epoch 0: 4%|▎ | 434/12384 [55:25<25:23:56, 7.65s/it, loss=3.1578, acc=0.0391, iter_time=7.62s]
Epoch 0: 4%|▎ | 435/12384 [55:25<25:21:39, 7.64s/it, loss=3.1578, acc=0.0391, iter_time=7.62s]
Epoch 0: 4%|▎ | 435/12384 [55:33<25:21:39, 7.64s/it, loss=2.9039, acc=0.0442, iter_time=7.60s]
Epoch 0: 4%|▎ | 436/12384 [55:33<25:18:53, 7.63s/it, loss=2.9039, acc=0.0442, iter_time=7.60s]
Epoch 0: 4%|▎ | 436/12384 [55:41<25:18:53, 7.63s/it, loss=2.8473, acc=0.0499, iter_time=7.60s]
Epoch 0: 4%|▎ | 437/12384 [55:41<25:18:18, 7.63s/it, loss=2.8473, acc=0.0499, iter_time=7.60s]
Epoch 0: 4%|▎ | 437/12384 [55:48<25:18:18, 7.63s/it, loss=2.5499, acc=0.0715, iter_time=4.31s]
Epoch 0: 4%|▎ | 438/12384 [55:48<25:18:42, 7.63s/it, loss=2.5499, acc=0.0715, iter_time=4.31s]
Epoch 0: 4%|▎ | 438/12384 [55:56<25:18:42, 7.63s/it, loss=3.1874, acc=0.0472, iter_time=10.91s]
Epoch 0: 4%|▎ | 439/12384 [55:56<25:16:25, 7.62s/it, loss=3.1874, acc=0.0472, iter_time=10.91s]
Epoch 0: 4%|▎ | 439/12384 [56:03<25:16:25, 7.62s/it, loss=3.7267, acc=0.0346, iter_time=8.00s]
Epoch 0: 4%|▎ | 440/12384 [56:03<25:15:48, 7.61s/it, loss=3.7267, acc=0.0346, iter_time=8.00s]
Epoch 0: 4%|▎ | 440/12384 [56:11<25:15:48, 7.61s/it, loss=2.6213, acc=0.0567, iter_time=4.87s]
Epoch 0: 4%|▎ | 441/12384 [56:11<25:15:27, 7.61s/it, loss=2.6213, acc=0.0567, iter_time=4.87s]
Epoch 0: 4%|▎ | 441/12384 [56:19<25:15:27, 7.61s/it, loss=2.8995, acc=0.0430, iter_time=9.97s]
Epoch 0: 4%|▎ | 442/12384 [56:19<25:16:08, 7.62s/it, loss=2.8995, acc=0.0430, iter_time=9.97s]
Epoch 0: 4%|▎ | 442/12384 [56:26<25:16:08, 7.62s/it, loss=2.9259, acc=0.0582, iter_time=5.05s]
Epoch 0: 4%|▎ | 443/12384 [56:26<25:17:59, 7.63s/it, loss=2.9259, acc=0.0582, iter_time=5.05s]
Epoch 0: 4%|▎ | 443/12384 [56:34<25:17:59, 7.63s/it, loss=3.0748, acc=0.0482, iter_time=9.93s]
Epoch 0: 4%|▎ | 444/12384 [56:34<25:16:15, 7.62s/it, loss=3.0748, acc=0.0482, iter_time=9.93s]
Epoch 0: 4%|▎ | 444/12384 [56:42<25:16:15, 7.62s/it, loss=2.9716, acc=0.0498, iter_time=7.88s]
Epoch 0: 4%|▎ | 445/12384 [56:42<25:14:42, 7.61s/it, loss=2.9716, acc=0.0498, iter_time=7.88s]
Epoch 0: 4%|▎ | 445/12384 [56:49<25:14:42, 7.61s/it, loss=2.7518, acc=0.0540, iter_time=7.61s]
Epoch 0: 4%|▎ | 446/12384 [56:49<25:13:56, 7.61s/it, loss=2.7518, acc=0.0540, iter_time=7.61s]
Epoch 0: 4%|▎ | 446/12384 [56:57<25:13:56, 7.61s/it, loss=3.1282, acc=0.0490, iter_time=7.60s]
Epoch 0: 4%|▎ | 447/12384 [56:57<25:13:32, 7.61s/it, loss=3.1282, acc=0.0490, iter_time=7.60s]
Epoch 0: 4%|▎ | 447/12384 [57:04<25:13:32, 7.61s/it, loss=2.8421, acc=0.0526, iter_time=7.55s]
Epoch 0: 4%|▎ | 448/12384 [57:04<25:13:24, 7.61s/it, loss=2.8421, acc=0.0526, iter_time=7.55s]
Epoch 0: 4%|▎ | 448/12384 [57:12<25:13:24, 7.61s/it, loss=2.3614, acc=0.0661, iter_time=7.65s]
Epoch 0: 4%|▎ | 449/12384 [57:12<25:13:11, 7.61s/it, loss=2.3614, acc=0.0661, iter_time=7.65s]
Epoch 0: 4%|▎ | 449/12384 [57:20<25:13:11, 7.61s/it, loss=2.8640, acc=0.0625, iter_time=8.01s]
Epoch 0: 4%|▎ | 450/12384 [57:20<25:12:50, 7.61s/it, loss=2.8640, acc=0.0625, iter_time=8.01s]
Epoch 0: 4%|▎ | 450/12384 [57:27<25:12:50, 7.61s/it, loss=2.6807, acc=0.0533, iter_time=7.20s]
Epoch 0: 4%|▎ | 451/12384 [57:27<25:13:52, 7.61s/it, loss=2.6807, acc=0.0533, iter_time=7.20s]
Epoch 0: 4%|▎ | 451/12384 [57:35<25:13:52, 7.61s/it, loss=2.7574, acc=0.0650, iter_time=7.65s]
Epoch 0: 4%|▎ | 452/12384 [57:35<25:14:25, 7.62s/it, loss=2.7574, acc=0.0650, iter_time=7.65s]
Epoch 0: 4%|▎ | 452/12384 [57:42<25:14:25, 7.62s/it, loss=2.5684, acc=0.0499, iter_time=7.31s]
Epoch 0: 4%|▎ | 453/12384 [57:42<25:15:21, 7.62s/it, loss=2.5684, acc=0.0499, iter_time=7.31s]
Epoch 0: 4%|▎ | 453/12384 [57:50<25:15:21, 7.62s/it, loss=2.9275, acc=0.0412, iter_time=7.95s]
Epoch 0: 4%|▎ | 454/12384 [57:50<25:14:58, 7.62s/it, loss=2.9275, acc=0.0412, iter_time=7.95s]
Epoch 0: 4%|▎ | 454/12384 [57:58<25:14:58, 7.62s/it, loss=2.5883, acc=0.0616, iter_time=7.61s]
Epoch 0: 4%|▎ | 455/12384 [57:58<25:17:37, 7.63s/it, loss=2.5883, acc=0.0616, iter_time=7.61s]
Epoch 0: 4%|▎ | 455/12384 [58:06<25:17:37, 7.63s/it, loss=2.7614, acc=0.0706, iter_time=8.39s]
Epoch 0: 4%|▎ | 456/12384 [58:06<25:36:31, 7.73s/it, loss=2.7614, acc=0.0706, iter_time=8.39s]
Epoch 0: 4%|▎ | 456/12384 [58:13<25:36:31, 7.73s/it, loss=2.6479, acc=0.0569, iter_time=7.24s]
Epoch 0: 4%|▎ | 457/12384 [58:13<25:30:33, 7.70s/it, loss=2.6479, acc=0.0569, iter_time=7.24s]
Epoch 0: 4%|▎ | 457/12384 [58:21<25:30:33, 7.70s/it, loss=2.1883, acc=0.0812, iter_time=5.27s]
Epoch 0: 4%|▎ | 458/12384 [58:21<25:31:00, 7.70s/it, loss=2.1883, acc=0.0812, iter_time=5.27s]
Epoch 0: 4%|▎ | 458/12384 [58:29<25:31:00, 7.70s/it, loss=2.3805, acc=0.0605, iter_time=10.05s]
Epoch 0: 4%|▎ | 459/12384 [58:29<25:26:05, 7.68s/it, loss=2.3805, acc=0.0605, iter_time=10.05s]
Epoch 0: 4%|▎ | 459/12384 [58:36<25:26:05, 7.68s/it, loss=2.1740, acc=0.0653, iter_time=7.63s]
Epoch 0: 4%|▎ | 460/12384 [58:36<25:21:08, 7.65s/it, loss=2.1740, acc=0.0653, iter_time=7.63s]
Epoch 0: 4%|▎ | 460/12384 [58:44<25:21:08, 7.65s/it, loss=2.9239, acc=0.0425, iter_time=7.61s]
Epoch 0: 4%|▎ | 461/12384 [58:44<25:19:13, 7.65s/it, loss=2.9239, acc=0.0425, iter_time=7.61s]
Epoch 0: 4%|▎ | 461/12384 [58:52<25:19:13, 7.65s/it, loss=2.4065, acc=0.0625, iter_time=7.63s]
Epoch 0: 4%|▎ | 462/12384 [58:52<25:19:55, 7.65s/it, loss=2.4065, acc=0.0625, iter_time=7.63s]
Epoch 0: 4%|▎ | 462/12384 [58:59<25:19:55, 7.65s/it, loss=2.2045, acc=0.0711, iter_time=5.10s]
Epoch 0: 4%|▎ | 463/12384 [58:59<25:20:46, 7.65s/it, loss=2.2045, acc=0.0711, iter_time=5.10s]
Epoch 0: 4%|▎ | 463/12384 [59:07<25:20:46, 7.65s/it, loss=2.6987, acc=0.0551, iter_time=10.60s]
Epoch 0: 4%|▎ | 464/12384 [59:07<25:23:44, 7.67s/it, loss=2.6987, acc=0.0551, iter_time=10.60s]
Epoch 0: 4%|▎ | 464/12384 [59:15<25:23:44, 7.67s/it, loss=2.0229, acc=0.0816, iter_time=4.25s]
Epoch 0: 4%|▍ | 465/12384 [59:15<25:20:25, 7.65s/it, loss=2.0229, acc=0.0816, iter_time=4.25s]
Epoch 0: 4%|▍ | 465/12384 [59:22<25:20:25, 7.65s/it, loss=2.1349, acc=0.0808, iter_time=8.87s]
Epoch 0: 4%|▍ | 466/12384 [59:22<25:19:06, 7.65s/it, loss=2.1349, acc=0.0808, iter_time=8.87s]
Epoch 0: 4%|▍ | 466/12384 [59:30<25:19:06, 7.65s/it, loss=1.8659, acc=0.0879, iter_time=7.18s]
Epoch 0: 4%|▍ | 467/12384 [59:30<25:18:34, 7.65s/it, loss=1.8659, acc=0.0879, iter_time=7.18s]
Epoch 0: 4%|▍ | 467/12384 [59:37<25:18:34, 7.65s/it, loss=2.3690, acc=0.0590, iter_time=9.92s]
Epoch 0: 4%|▍ | 468/12384 [59:37<25:16:30, 7.64s/it, loss=2.3690, acc=0.0590, iter_time=9.92s]
Epoch 0: 4%|▍ | 468/12384 [59:45<25:16:30, 7.64s/it, loss=2.5095, acc=0.0757, iter_time=7.60s]
Epoch 0: 4%|▍ | 469/12384 [59:45<25:14:16, 7.63s/it, loss=2.5095, acc=0.0757, iter_time=7.60s]
Epoch 0: 4%|▍ | 469/12384 [59:53<25:14:16, 7.63s/it, loss=2.3407, acc=0.0611, iter_time=7.61s]
Epoch 0: 4%|▍ | 470/12384 [59:53<25:13:19, 7.62s/it, loss=2.3407, acc=0.0611, iter_time=7.61s]
Epoch 0: 4%|▍ | 470/12384 [1:00:00<25:13:19, 7.62s/it, loss=2.4194, acc=0.0613, iter_time=7.59s]
Epoch 0: 4%|▍ | 471/12384 [1:00:00<25:12:40, 7.62s/it, loss=2.4194, acc=0.0613, iter_time=7.59s]
Epoch 0: 4%|▍ | 471/12384 [1:00:08<25:12:40, 7.62s/it, loss=2.3377, acc=0.0702, iter_time=7.56s]
Epoch 0: 4%|▍ | 472/12384 [1:00:08<25:11:31, 7.61s/it, loss=2.3377, acc=0.0702, iter_time=7.56s]
Epoch 0: 4%|▍ | 472/12384 [1:00:15<25:11:31, 7.61s/it, loss=2.0761, acc=0.0801, iter_time=7.67s]
Epoch 0: 4%|▍ | 473/12384 [1:00:15<25:11:33, 7.61s/it, loss=2.0761, acc=0.0801, iter_time=7.67s]
Epoch 0: 4%|▍ | 473/12384 [1:00:23<25:11:33, 7.61s/it, loss=1.9358, acc=0.0912, iter_time=6.75s]
Epoch 0: 4%|▍ | 474/12384 [1:00:23<25:12:33, 7.62s/it, loss=1.9358, acc=0.0912, iter_time=6.75s]
Epoch 0: 4%|▍ | 474/12384 [1:00:31<25:12:33, 7.62s/it, loss=1.9073, acc=0.0842, iter_time=7.90s]
Epoch 0: 4%|▍ | 475/12384 [1:00:31<25:10:54, 7.61s/it, loss=1.9073, acc=0.0842, iter_time=7.90s]
Epoch 0: 4%|▍ | 475/12384 [1:00:38<25:10:54, 7.61s/it, loss=2.1782, acc=0.0658, iter_time=8.19s]
Epoch 0: 4%|▍ | 476/12384 [1:00:38<25:12:04, 7.62s/it, loss=2.1782, acc=0.0658, iter_time=8.19s]
Epoch 0: 4%|▍ | 476/12384 [1:00:46<25:12:04, 7.62s/it, loss=2.6810, acc=0.0632, iter_time=5.05s]
Epoch 0: 4%|▍ | 477/12384 [1:00:46<25:18:12, 7.65s/it, loss=2.6810, acc=0.0632, iter_time=5.05s]
Epoch 0: 4%|▍ | 477/12384 [1:00:54<25:18:12, 7.65s/it, loss=2.1881, acc=0.0752, iter_time=10.31s]
Epoch 0: 4%|▍ | 478/12384 [1:00:54<25:17:19, 7.65s/it, loss=2.1881, acc=0.0752, iter_time=10.31s]
Epoch 0: 4%|▍ | 478/12384 [1:01:01<25:17:19, 7.65s/it, loss=2.0383, acc=0.0787, iter_time=7.66s]
Epoch 0: 4%|▍ | 479/12384 [1:01:01<25:16:02, 7.64s/it, loss=2.0383, acc=0.0787, iter_time=7.66s]
Epoch 0: 4%|▍ | 479/12384 [1:01:09<25:16:02, 7.64s/it, loss=2.1226, acc=0.0653, iter_time=7.98s]
Epoch 0: 4%|▍ | 480/12384 [1:01:09<25:14:05, 7.63s/it, loss=2.1226, acc=0.0653, iter_time=7.98s]
Epoch 0: 4%|▍ | 480/12384 [1:01:17<25:14:05, 7.63s/it, loss=1.8728, acc=0.0937, iter_time=5.68s]
Epoch 0: 4%|▍ | 481/12384 [1:01:17<25:14:32, 7.63s/it, loss=1.8728, acc=0.0937, iter_time=5.68s]
Epoch 0: 4%|▍ | 481/12384 [1:01:25<25:14:32, 7.63s/it, loss=1.7137, acc=0.1056, iter_time=6.45s]
Epoch 0: 4%|▍ | 482/12384 [1:01:25<25:33:13, 7.73s/it, loss=1.7137, acc=0.1056, iter_time=6.45s]
Epoch 0: 4%|▍ | 482/12384 [1:01:32<25:33:13, 7.73s/it, loss=1.8815, acc=0.1097, iter_time=7.86s]
Epoch 0: 4%|▍ | 483/12384 [1:01:32<25:29:43, 7.71s/it, loss=1.8815, acc=0.1097, iter_time=7.86s]
Epoch 0: 4%|▍ | 483/12384 [1:01:40<25:29:43, 7.71s/it, loss=1.8511, acc=0.0913, iter_time=9.31s]
Epoch 0: 4%|▍ | 484/12384 [1:01:40<25:24:42, 7.69s/it, loss=1.8511, acc=0.0913, iter_time=9.31s]
Epoch 0: 4%|▍ | 484/12384 [1:01:47<25:24:42, 7.69s/it, loss=2.3645, acc=0.0781, iter_time=8.82s]
Epoch 0: 4%|▍ | 485/12384 [1:01:47<25:21:29, 7.67s/it, loss=2.3645, acc=0.0781, iter_time=8.82s]
Epoch 0: 4%|▍ | 485/12384 [1:01:55<25:21:29, 7.67s/it, loss=2.0252, acc=0.0707, iter_time=7.65s]
Epoch 0: 4%|▍ | 486/12384 [1:01:55<25:18:21, 7.66s/it, loss=2.0252, acc=0.0707, iter_time=7.65s]
Epoch 0: 4%|▍ | 486/12384 [1:02:03<25:18:21, 7.66s/it, loss=1.8400, acc=0.0926, iter_time=7.59s]
Epoch 0: 4%|▍ | 487/12384 [1:02:03<25:13:57, 7.64s/it, loss=1.8400, acc=0.0926, iter_time=7.59s]
Epoch 0: 4%|▍ | 487/12384 [1:02:10<25:13:57, 7.64s/it, loss=2.3608, acc=0.0671, iter_time=7.98s]
Epoch 0: 4%|▍ | 488/12384 [1:02:10<25:14:44, 7.64s/it, loss=2.3608, acc=0.0671, iter_time=7.98s]
Epoch 0: 4%|▍ | 488/12384 [1:02:18<25:14:44, 7.64s/it, loss=1.8955, acc=0.1027, iter_time=7.28s]
Epoch 0: 4%|▍ | 489/12384 [1:02:18<25:12:44, 7.63s/it, loss=1.8955, acc=0.1027, iter_time=7.28s]
Epoch 0: 4%|▍ | 489/12384 [1:02:26<25:12:44, 7.63s/it, loss=1.8594, acc=0.0871, iter_time=7.61s]
Epoch 0: 4%|▍ | 490/12384 [1:02:26<25:12:17, 7.63s/it, loss=1.8594, acc=0.0871, iter_time=7.61s]
Epoch 0: 4%|▍ | 490/12384 [1:02:33<25:12:17, 7.63s/it, loss=1.9777, acc=0.1014, iter_time=7.63s]
Epoch 0: 4%|▍ | 491/12384 [1:02:33<25:12:56, 7.63s/it, loss=1.9777, acc=0.1014, iter_time=7.63s]
Epoch 0: 4%|▍ | 491/12384 [1:02:41<25:12:56, 7.63s/it, loss=1.5701, acc=0.1003, iter_time=7.73s]
Epoch 0: 4%|▍ | 492/12384 [1:02:41<25:17:21, 7.66s/it, loss=1.5701, acc=0.1003, iter_time=7.73s]
Epoch 0: 4%|▍ | 492/12384 [1:02:49<25:17:21, 7.66s/it, loss=1.7921, acc=0.0975, iter_time=7.64s]
Epoch 0: 4%|▍ | 493/12384 [1:02:49<25:15:31, 7.65s/it, loss=1.7921, acc=0.0975, iter_time=7.64s]
Epoch 0: 4%|▍ | 493/12384 [1:02:56<25:15:31, 7.65s/it, loss=2.1800, acc=0.0715, iter_time=7.60s]
Epoch 0: 4%|▍ | 494/12384 [1:02:56<25:14:05, 7.64s/it, loss=2.1800, acc=0.0715, iter_time=7.60s]
Epoch 0: 4%|▍ | 494/12384 [1:03:04<25:14:05, 7.64s/it, loss=2.0812, acc=0.0773, iter_time=7.62s]
Epoch 0: 4%|▍ | 495/12384 [1:03:04<25:14:40, 7.64s/it, loss=2.0812, acc=0.0773, iter_time=7.62s]
Epoch 0: 4%|▍ | 495/12384 [1:03:11<25:14:40, 7.64s/it, loss=2.2030, acc=0.0776, iter_time=8.11s]
Epoch 0: 4%|▍ | 496/12384 [1:03:11<25:15:53, 7.65s/it, loss=2.2030, acc=0.0776, iter_time=8.11s]
Epoch 0: 4%|▍ | 496/12384 [1:03:19<25:15:53, 7.65s/it, loss=1.7504, acc=0.1286, iter_time=6.94s]
Epoch 0: 4%|▍ | 497/12384 [1:03:19<25:13:57, 7.64s/it, loss=1.7504, acc=0.1286, iter_time=6.94s]
Epoch 0: 4%|▍ | 497/12384 [1:03:27<25:13:57, 7.64s/it, loss=1.7378, acc=0.0863, iter_time=7.88s]
Epoch 0: 4%|▍ | 498/12384 [1:03:27<25:11:48, 7.63s/it, loss=1.7378, acc=0.0863, iter_time=7.88s]
Epoch 0: 4%|▍ | 498/12384 [1:03:34<25:11:48, 7.63s/it, loss=2.2853, acc=0.0859, iter_time=7.62s]
Epoch 0: 4%|▍ | 499/12384 [1:03:34<25:09:41, 7.62s/it, loss=2.2853, acc=0.0859, iter_time=7.62s]
Epoch 0: 4%|▍ | 499/12384 [1:03:42<25:09:41, 7.62s/it, loss=1.5631, acc=0.0978, iter_time=8.00s]
Epoch 0: 4%|▍ | 500/12384 [1:03:42<25:23:23, 7.69s/it, loss=1.5631, acc=0.0978, iter_time=8.00s]
Epoch 0: 4%|▍ | 500/12384 [1:03:50<25:23:23, 7.69s/it, loss=1.9879, acc=0.0980, iter_time=7.48s]
Epoch 0: 4%|▍ | 501/12384 [1:03:50<25:19:23, 7.67s/it, loss=1.9879, acc=0.0980, iter_time=7.48s]
Epoch 0: 4%|▍ | 501/12384 [1:03:57<25:19:23, 7.67s/it, loss=1.5320, acc=0.1144, iter_time=6.74s]
Epoch 0: 4%|▍ | 502/12384 [1:03:57<25:18:44, 7.67s/it, loss=1.5320, acc=0.1144, iter_time=6.74s]
Epoch 0: 4%|▍ | 502/12384 [1:04:05<25:18:44, 7.67s/it, loss=1.6257, acc=0.0942, iter_time=7.59s]
Epoch 0: 4%|▍ | 503/12384 [1:04:05<25:16:58, 7.66s/it, loss=1.6257, acc=0.0942, iter_time=7.59s]
Epoch 0: 4%|▍ | 503/12384 [1:04:13<25:16:58, 7.66s/it, loss=1.4932, acc=0.1111, iter_time=8.52s]
Epoch 0: 4%|▍ | 504/12384 [1:04:13<25:13:36, 7.64s/it, loss=1.4932, acc=0.1111, iter_time=8.52s]
Epoch 0: 4%|▍ | 504/12384 [1:04:20<25:13:36, 7.64s/it, loss=1.7782, acc=0.0995, iter_time=7.66s]
Epoch 0: 4%|▍ | 505/12384 [1:04:20<25:11:13, 7.63s/it, loss=1.7782, acc=0.0995, iter_time=7.66s]
Epoch 0: 4%|▍ | 505/12384 [1:04:28<25:11:13, 7.63s/it, loss=1.6812, acc=0.1112, iter_time=7.60s]
Epoch 0: 4%|▍ | 506/12384 [1:04:28<25:09:57, 7.63s/it, loss=1.6812, acc=0.1112, iter_time=7.60s]
Epoch 0: 4%|▍ | 506/12384 [1:04:36<25:09:57, 7.63s/it, loss=1.5152, acc=0.1154, iter_time=7.62s]
Epoch 0: 4%|▍ | 507/12384 [1:04:36<25:09:26, 7.63s/it, loss=1.5152, acc=0.1154, iter_time=7.62s]
Epoch 0: 4%|▍ | 507/12384 [1:04:43<25:09:26, 7.63s/it, loss=1.5246, acc=0.1014, iter_time=7.64s]
Epoch 0: 4%|▍ | 508/12384 [1:04:43<25:09:40, 7.63s/it, loss=1.5246, acc=0.1014, iter_time=7.64s]
Epoch 0: 4%|▍ | 508/12384 [1:04:51<25:09:40, 7.63s/it, loss=1.5045, acc=0.1239, iter_time=7.98s]
Epoch 0: 4%|▍ | 509/12384 [1:04:51<25:30:11, 7.73s/it, loss=1.5045, acc=0.1239, iter_time=7.98s]
Epoch 0: 4%|▍ | 509/12384 [1:04:59<25:30:11, 7.73s/it, loss=1.8039, acc=0.1163, iter_time=7.60s]
Epoch 0: 4%|▍ | 510/12384 [1:04:59<25:22:06, 7.69s/it, loss=1.8039, acc=0.1163, iter_time=7.60s]
Epoch 0: 4%|▍ | 510/12384 [1:05:06<25:22:06, 7.69s/it, loss=1.6832, acc=0.1060, iter_time=7.61s]
Epoch 0: 4%|▍ | 511/12384 [1:05:06<25:18:05, 7.67s/it, loss=1.6832, acc=0.1060, iter_time=7.61s]
Epoch 0: 4%|▍ | 511/12384 [1:05:14<25:18:05, 7.67s/it, loss=1.4026, acc=0.1389, iter_time=7.70s]
Epoch 0: 4%|▍ | 512/12384 [1:05:14<25:16:10, 7.66s/it, loss=1.4026, acc=0.1389, iter_time=7.70s]
Epoch 0: 4%|▍ | 512/12384 [1:05:22<25:16:10, 7.66s/it, loss=1.4026, acc=0.1326, iter_time=7.57s]
Epoch 0: 4%|▍ | 513/12384 [1:05:22<25:12:52, 7.65s/it, loss=1.4026, acc=0.1326, iter_time=7.57s]
Epoch 0: 4%|▍ | 513/12384 [1:05:29<25:12:52, 7.65s/it, loss=1.3706, acc=0.1561, iter_time=7.61s]
Epoch 0: 4%|▍ | 514/12384 [1:05:29<25:11:47, 7.64s/it, loss=1.3706, acc=0.1561, iter_time=7.61s]
Epoch 0: 4%|▍ | 514/12384 [1:05:37<25:11:47, 7.64s/it, loss=1.1810, acc=0.1485, iter_time=7.62s]
Epoch 0: 4%|▍ | 515/12384 [1:05:37<25:10:56, 7.64s/it, loss=1.1810, acc=0.1485, iter_time=7.62s]
Epoch 0: 4%|▍ | 515/12384 [1:05:45<25:10:56, 7.64s/it, loss=1.4294, acc=0.1398, iter_time=5.37s]
Epoch 0: 4%|▍ | 516/12384 [1:05:45<25:10:32, 7.64s/it, loss=1.4294, acc=0.1398, iter_time=5.37s]
Epoch 0: 4%|▍ | 516/12384 [1:05:52<25:10:32, 7.64s/it, loss=1.4812, acc=0.1189, iter_time=7.63s]
Epoch 0: 4%|▍ | 517/12384 [1:05:52<25:09:51, 7.63s/it, loss=1.4812, acc=0.1189, iter_time=7.63s]
Epoch 0: 4%|▍ | 517/12384 [1:06:00<25:09:51, 7.63s/it, loss=1.3486, acc=0.1673, iter_time=7.62s]
Epoch 0: 4%|▍ | 518/12384 [1:06:00<25:07:33, 7.62s/it, loss=1.3486, acc=0.1673, iter_time=7.62s]
Epoch 0: 4%|▍ | 518/12384 [1:06:07<25:07:33, 7.62s/it, loss=1.5645, acc=0.1115, iter_time=9.86s]
Epoch 0: 4%|▍ | 519/12384 [1:06:07<25:07:26, 7.62s/it, loss=1.5645, acc=0.1115, iter_time=9.86s]
Epoch 0: 4%|▍ | 519/12384 [1:06:15<25:07:26, 7.62s/it, loss=1.2986, acc=0.1397, iter_time=8.05s]
Epoch 0: 4%|▍ | 520/12384 [1:06:15<25:07:43, 7.63s/it, loss=1.2986, acc=0.1397, iter_time=8.05s]
Epoch 0: 4%|▍ | 520/12384 [1:06:23<25:07:43, 7.63s/it, loss=1.3660, acc=0.1134, iter_time=6.34s]
Epoch 0: 4%|▍ | 521/12384 [1:06:23<25:08:53, 7.63s/it, loss=1.3660, acc=0.1134, iter_time=6.34s]
Epoch 0: 4%|▍ | 521/12384 [1:06:30<25:08:53, 7.63s/it, loss=1.2057, acc=0.1543, iter_time=8.53s]
Epoch 0: 4%|▍ | 522/12384 [1:06:30<25:08:12, 7.63s/it, loss=1.2057, acc=0.1543, iter_time=8.53s]
Epoch 0: 4%|▍ | 522/12384 [1:06:38<25:08:12, 7.63s/it, loss=1.2758, acc=0.1470, iter_time=7.61s]
Epoch 0: 4%|▍ | 523/12384 [1:06:38<25:06:10, 7.62s/it, loss=1.2758, acc=0.1470, iter_time=7.61s]
Epoch 0: 4%|▍ | 523/12384 [1:06:46<25:06:10, 7.62s/it, loss=1.2106, acc=0.1270, iter_time=5.81s]
Epoch 0: 4%|▍ | 524/12384 [1:06:46<25:08:49, 7.63s/it, loss=1.2106, acc=0.1270, iter_time=5.81s]
Epoch 0: 4%|▍ | 524/12384 [1:06:53<25:08:49, 7.63s/it, loss=1.4548, acc=0.1425, iter_time=8.60s]
Epoch 0: 4%|▍ | 525/12384 [1:06:53<25:13:12, 7.66s/it, loss=1.4548, acc=0.1425, iter_time=8.60s]
Epoch 0: 4%|▍ | 525/12384 [1:07:01<25:13:12, 7.66s/it, loss=1.0490, acc=0.1899, iter_time=7.63s]
Epoch 0: 4%|▍ | 526/12384 [1:07:01<25:12:16, 7.65s/it, loss=1.0490, acc=0.1899, iter_time=7.63s]
Epoch 0: 4%|▍ | 526/12384 [1:07:08<25:12:16, 7.65s/it, loss=1.2715, acc=0.1341, iter_time=8.59s]
Epoch 0: 4%|▍ | 527/12384 [1:07:08<25:09:06, 7.64s/it, loss=1.2715, acc=0.1341, iter_time=8.59s]
Epoch 0: 4%|▍ | 527/12384 [1:07:16<25:09:06, 7.64s/it, loss=1.2496, acc=0.1371, iter_time=8.03s]
Epoch 0: 4%|▍ | 528/12384 [1:07:16<25:09:57, 7.64s/it, loss=1.2496, acc=0.1371, iter_time=8.03s]
Epoch 0: 4%|▍ | 528/12384 [1:07:24<25:09:57, 7.64s/it, loss=1.0451, acc=0.2323, iter_time=5.68s]
Epoch 0: 4%|▍ | 529/12384 [1:07:24<25:07:57, 7.63s/it, loss=1.0451, acc=0.2323, iter_time=5.68s]
Epoch 0: 4%|▍ | 529/12384 [1:07:31<25:07:57, 7.63s/it, loss=1.1173, acc=0.1597, iter_time=8.53s]
Epoch 0: 4%|▍ | 530/12384 [1:07:31<25:05:31, 7.62s/it, loss=1.1173, acc=0.1597, iter_time=8.53s]
Epoch 0: 4%|▍ | 530/12384 [1:07:39<25:05:31, 7.62s/it, loss=1.1128, acc=0.1946, iter_time=7.27s]
Epoch 0: 4%|▍ | 531/12384 [1:07:39<25:03:40, 7.61s/it, loss=1.1128, acc=0.1946, iter_time=7.27s]
Epoch 0: 4%|▍ | 531/12384 [1:07:47<25:03:40, 7.61s/it, loss=1.1996, acc=0.1418, iter_time=8.55s]
Epoch 0: 4%|▍ | 532/12384 [1:07:47<25:08:55, 7.64s/it, loss=1.1996, acc=0.1418, iter_time=8.55s]
Epoch 0: 4%|▍ | 532/12384 [1:07:54<25:08:55, 7.64s/it, loss=1.0982, acc=0.1792, iter_time=6.58s]
Epoch 0: 4%|▍ | 533/12384 [1:07:54<25:07:03, 7.63s/it, loss=1.0982, acc=0.1792, iter_time=6.58s]
Epoch 0: 4%|▍ | 533/12384 [1:08:02<25:07:03, 7.63s/it, loss=1.1806, acc=0.1673, iter_time=8.72s]
Epoch 0: 4%|▍ | 534/12384 [1:08:02<25:06:54, 7.63s/it, loss=1.1806, acc=0.1673, iter_time=8.72s]
Epoch 0: 4%|▍ | 534/12384 [1:08:10<25:06:54, 7.63s/it, loss=1.3007, acc=0.1542, iter_time=7.14s]
Epoch 0: 4%|▍ | 535/12384 [1:08:10<25:27:33, 7.74s/it, loss=1.3007, acc=0.1542, iter_time=7.14s]
Epoch 0: 4%|▍ | 535/12384 [1:08:17<25:27:33, 7.74s/it, loss=1.3142, acc=0.1642, iter_time=8.44s]
Epoch 0: 4%|▍ | 536/12384 [1:08:17<25:20:34, 7.70s/it, loss=1.3142, acc=0.1642, iter_time=8.44s]
Epoch 0: 4%|▍ | 536/12384 [1:08:25<25:20:34, 7.70s/it, loss=1.0738, acc=0.1843, iter_time=7.65s]
Epoch 0: 4%|▍ | 537/12384 [1:08:25<25:15:31, 7.68s/it, loss=1.0738, acc=0.1843, iter_time=7.65s]
Epoch 0: 4%|▍ | 537/12384 [1:08:33<25:15:31, 7.68s/it, loss=0.9641, acc=0.2415, iter_time=7.03s]
Epoch 0: 4%|▍ | 538/12384 [1:08:33<25:12:05, 7.66s/it, loss=0.9641, acc=0.2415, iter_time=7.03s]
Epoch 0: 4%|▍ | 538/12384 [1:08:40<25:12:05, 7.66s/it, loss=1.1022, acc=0.1791, iter_time=8.20s]
Epoch 0: 4%|▍ | 539/12384 [1:08:40<25:08:33, 7.64s/it, loss=1.1022, acc=0.1791, iter_time=8.20s]
Epoch 0: 4%|▍ | 539/12384 [1:08:48<25:08:33, 7.64s/it, loss=1.0274, acc=0.1949, iter_time=7.65s]
Epoch 0: 4%|▍ | 540/12384 [1:08:48<25:07:58, 7.64s/it, loss=1.0274, acc=0.1949, iter_time=7.65s]
Epoch 0: 4%|▍ | 540/12384 [1:08:56<25:07:58, 7.64s/it, loss=1.0623, acc=0.2338, iter_time=5.80s]
Epoch 0: 4%|▍ | 541/12384 [1:08:56<25:12:11, 7.66s/it, loss=1.0623, acc=0.2338, iter_time=5.80s]
Epoch 0: 4%|▍ | 541/12384 [1:09:03<25:12:11, 7.66s/it, loss=1.0341, acc=0.2291, iter_time=9.51s]
Epoch 0: 4%|▍ | 542/12384 [1:09:03<25:09:20, 7.65s/it, loss=1.0341, acc=0.2291, iter_time=9.51s]
Epoch 0: 4%|▍ | 542/12384 [1:09:11<25:09:20, 7.65s/it, loss=1.2094, acc=0.1707, iter_time=7.63s]
Epoch 0: 4%|▍ | 543/12384 [1:09:11<25:07:26, 7.64s/it, loss=1.2094, acc=0.1707, iter_time=7.63s]
Epoch 0: 4%|▍ | 543/12384 [1:09:18<25:07:26, 7.64s/it, loss=1.0553, acc=0.1781, iter_time=8.01s]
Epoch 0: 4%|▍ | 544/12384 [1:09:18<25:06:29, 7.63s/it, loss=1.0553, acc=0.1781, iter_time=8.01s]
Epoch 0: 4%|▍ | 544/12384 [1:09:26<25:06:29, 7.63s/it, loss=0.9190, acc=0.2209, iter_time=3.87s]
Epoch 0: 4%|▍ | 545/12384 [1:09:26<25:07:30, 7.64s/it, loss=0.9190, acc=0.2209, iter_time=3.87s]
Epoch 0: 4%|▍ | 545/12384 [1:09:34<25:07:30, 7.64s/it, loss=1.3884, acc=0.1503, iter_time=10.99s]
Epoch 0: 4%|▍ | 546/12384 [1:09:34<25:05:31, 7.63s/it, loss=1.3884, acc=0.1503, iter_time=10.99s]
Epoch 0: 4%|▍ | 546/12384 [1:09:41<25:05:31, 7.63s/it, loss=0.8358, acc=0.2316, iter_time=7.63s]
Epoch 0: 4%|▍ | 547/12384 [1:09:41<25:03:58, 7.62s/it, loss=0.8358, acc=0.2316, iter_time=7.63s]
Epoch 0: 4%|▍ | 547/12384 [1:09:49<25:03:58, 7.62s/it, loss=1.1356, acc=0.1741, iter_time=7.31s]
Epoch 0: 4%|▍ | 548/12384 [1:09:49<25:04:11, 7.63s/it, loss=1.1356, acc=0.1741, iter_time=7.31s]
Epoch 0: 4%|▍ | 548/12384 [1:09:57<25:04:11, 7.63s/it, loss=1.0155, acc=0.2051, iter_time=7.94s]
Epoch 0: 4%|▍ | 549/12384 [1:09:57<25:04:27, 7.63s/it, loss=1.0155, acc=0.2051, iter_time=7.94s]
Epoch 0: 4%|▍ | 549/12384 [1:10:04<25:04:27, 7.63s/it, loss=1.0704, acc=0.2173, iter_time=8.04s]
Epoch 0: 4%|▍ | 550/12384 [1:10:04<25:04:24, 7.63s/it, loss=1.0704, acc=0.2173, iter_time=8.04s]
Epoch 0: 4%|▍ | 550/12384 [1:10:12<25:04:24, 7.63s/it, loss=0.9250, acc=0.2215, iter_time=5.12s]
Epoch 0: 4%|▍ | 551/12384 [1:10:12<25:02:36, 7.62s/it, loss=0.9250, acc=0.2215, iter_time=5.12s]
Epoch 0: 4%|▍ | 551/12384 [1:10:19<25:02:36, 7.62s/it, loss=0.9213, acc=0.2145, iter_time=10.09s]
Epoch 0: 4%|▍ | 552/12384 [1:10:19<25:03:25, 7.62s/it, loss=0.9213, acc=0.2145, iter_time=10.09s]
Epoch 0: 4%|▍ | 552/12384 [1:10:27<25:03:25, 7.62s/it, loss=0.8215, acc=0.2492, iter_time=7.28s]
Epoch 0: 4%|▍ | 553/12384 [1:10:27<25:05:11, 7.63s/it, loss=0.8215, acc=0.2492, iter_time=7.28s]
Epoch 0: 4%|▍ | 553/12384 [1:10:35<25:05:11, 7.63s/it, loss=1.0849, acc=0.2338, iter_time=7.62s]
Epoch 0: 4%|▍ | 554/12384 [1:10:35<25:03:28, 7.63s/it, loss=1.0849, acc=0.2338, iter_time=7.62s]
Epoch 0: 4%|▍ | 554/12384 [1:10:42<25:03:28, 7.63s/it, loss=0.9731, acc=0.2144, iter_time=7.31s]
Epoch 0: 4%|▍ | 555/12384 [1:10:42<25:01:26, 7.62s/it, loss=0.9731, acc=0.2144, iter_time=7.31s]
Epoch 0: 4%|▍ | 555/12384 [1:10:50<25:01:26, 7.62s/it, loss=0.7430, acc=0.2805, iter_time=5.56s]
Epoch 0: 4%|▍ | 556/12384 [1:10:50<25:02:05, 7.62s/it, loss=0.7430, acc=0.2805, iter_time=5.56s]
Epoch 0: 4%|▍ | 556/12384 [1:10:58<25:02:05, 7.62s/it, loss=0.8999, acc=0.2453, iter_time=9.96s]
Epoch 0: 4%|▍ | 557/12384 [1:10:58<25:01:57, 7.62s/it, loss=0.8999, acc=0.2453, iter_time=9.96s]
Epoch 0: 4%|▍ | 557/12384 [1:11:05<25:01:57, 7.62s/it, loss=0.8742, acc=0.2299, iter_time=7.61s]
Epoch 0: 5%|▍ | 558/12384 [1:11:05<25:02:26, 7.62s/it, loss=0.8742, acc=0.2299, iter_time=7.61s]
Epoch 0: 5%|▍ | 558/12384 [1:11:13<25:02:26, 7.62s/it, loss=0.8946, acc=0.2639, iter_time=7.62s]
Epoch 0: 5%|▍ | 559/12384 [1:11:13<25:02:41, 7.62s/it, loss=0.8946, acc=0.2639, iter_time=7.62s]
Epoch 0: 5%|▍ | 559/12384 [1:11:21<25:02:41, 7.62s/it, loss=0.7925, acc=0.2735, iter_time=7.64s]
Epoch 0: 5%|▍ | 560/12384 [1:11:21<25:05:43, 7.64s/it, loss=0.7925, acc=0.2735, iter_time=7.64s]
Epoch 0: 5%|▍ | 560/12384 [1:11:28<25:05:43, 7.64s/it, loss=0.7928, acc=0.3094, iter_time=8.03s]
Epoch 0: 5%|▍ | 561/12384 [1:11:28<25:24:59, 7.74s/it, loss=0.7928, acc=0.3094, iter_time=8.03s]
Epoch 0: 5%|▍ | 561/12384 [1:11:36<25:24:59, 7.74s/it, loss=0.6651, acc=0.3165, iter_time=7.66s]
Epoch 0: 5%|▍ | 562/12384 [1:11:36<25:18:52, 7.71s/it, loss=0.6651, acc=0.3165, iter_time=7.66s]
Epoch 0: 5%|▍ | 562/12384 [1:11:44<25:18:52, 7.71s/it, loss=0.7884, acc=0.2710, iter_time=7.03s]
Epoch 0: 5%|▍ | 563/12384 [1:11:44<25:13:15, 7.68s/it, loss=0.7884, acc=0.2710, iter_time=7.03s]
Epoch 0: 5%|▍ | 563/12384 [1:11:51<25:13:15, 7.68s/it, loss=0.6573, acc=0.3580, iter_time=6.39s]
Epoch 0: 5%|▍ | 564/12384 [1:11:51<25:10:16, 7.67s/it, loss=0.6573, acc=0.3580, iter_time=6.39s]
Epoch 0: 5%|▍ | 564/12384 [1:11:59<25:10:16, 7.67s/it, loss=0.6049, acc=0.3428, iter_time=7.32s]
Epoch 0: 5%|▍ | 565/12384 [1:11:59<25:06:22, 7.65s/it, loss=0.6049, acc=0.3428, iter_time=7.32s]
Epoch 0: 5%|▍ | 565/12384 [1:12:07<25:06:22, 7.65s/it, loss=0.7711, acc=0.2828, iter_time=9.72s]
Epoch 0: 5%|▍ | 566/12384 [1:12:07<25:05:29, 7.64s/it, loss=0.7711, acc=0.2828, iter_time=9.72s]
Epoch 0: 5%|▍ | 566/12384 [1:12:14<25:05:29, 7.64s/it, loss=0.6675, acc=0.3612, iter_time=3.87s]
Epoch 0: 5%|▍ | 567/12384 [1:12:14<25:03:08, 7.63s/it, loss=0.6675, acc=0.3612, iter_time=3.87s]
Epoch 0: 5%|▍ | 567/12384 [1:12:22<25:03:08, 7.63s/it, loss=0.8658, acc=0.2541, iter_time=11.74s]
Epoch 0: 5%|▍ | 568/12384 [1:12:22<25:04:40, 7.64s/it, loss=0.8658, acc=0.2541, iter_time=11.74s]
Epoch 0: 5%|▍ | 568/12384 [1:12:30<25:04:40, 7.64s/it, loss=0.5568, acc=0.4313, iter_time=5.19s]
Epoch 0: 5%|▍ | 569/12384 [1:12:30<25:04:49, 7.64s/it, loss=0.5568, acc=0.4313, iter_time=5.19s]
Epoch 0: 5%|▍ | 569/12384 [1:12:37<25:04:49, 7.64s/it, loss=0.6657, acc=0.3456, iter_time=9.72s]
Epoch 0: 5%|▍ | 570/12384 [1:12:37<25:02:18, 7.63s/it, loss=0.6657, acc=0.3456, iter_time=9.72s]
Epoch 0: 5%|▍ | 570/12384 [1:12:45<25:02:18, 7.63s/it, loss=0.6790, acc=0.3148, iter_time=7.60s]
Epoch 0: 5%|▍ | 571/12384 [1:12:45<24:59:50, 7.62s/it, loss=0.6790, acc=0.3148, iter_time=7.60s]
Epoch 0: 5%|▍ | 571/12384 [1:12:52<24:59:50, 7.62s/it, loss=0.6821, acc=0.3241, iter_time=6.15s]
Epoch 0: 5%|▍ | 572/12384 [1:12:52<24:59:18, 7.62s/it, loss=0.6821, acc=0.3241, iter_time=6.15s]
Epoch 0: 5%|▍ | 572/12384 [1:13:00<24:59:18, 7.62s/it, loss=0.6189, acc=0.3369, iter_time=9.05s]
Epoch 0: 5%|▍ | 573/12384 [1:13:00<24:57:34, 7.61s/it, loss=0.6189, acc=0.3369, iter_time=9.05s]
Epoch 0: 5%|▍ | 573/12384 [1:13:08<24:57:34, 7.61s/it, loss=0.6918, acc=0.3116, iter_time=7.61s]
Epoch 0: 5%|▍ | 574/12384 [1:13:08<24:58:42, 7.61s/it, loss=0.6918, acc=0.3116, iter_time=7.61s]
Epoch 0: 5%|▍ | 574/12384 [1:13:15<24:58:42, 7.61s/it, loss=0.6950, acc=0.2795, iter_time=7.62s]
Epoch 0: 5%|▍ | 575/12384 [1:13:15<24:58:58, 7.62s/it, loss=0.6950, acc=0.2795, iter_time=7.62s]
Epoch 0: 5%|▍ | 575/12384 [1:13:23<24:58:58, 7.62s/it, loss=0.7175, acc=0.2974, iter_time=8.02s]
Epoch 0: 5%|▍ | 576/12384 [1:13:23<24:58:50, 7.62s/it, loss=0.7175, acc=0.2974, iter_time=8.02s]
Epoch 0: 5%|▍ | 576/12384 [1:13:30<24:58:50, 7.62s/it, loss=0.7201, acc=0.3191, iter_time=6.00s]
Epoch 0: 5%|▍ | 577/12384 [1:13:30<24:59:51, 7.62s/it, loss=0.7201, acc=0.3191, iter_time=6.00s]
Epoch 0: 5%|▍ | 577/12384 [1:13:38<24:59:51, 7.62s/it, loss=0.5478, acc=0.3998, iter_time=5.48s]
Epoch 0: 5%|▍ | 578/12384 [1:13:38<24:59:56, 7.62s/it, loss=0.5478, acc=0.3998, iter_time=5.48s]
Epoch 0: 5%|▍ | 578/12384 [1:13:46<24:59:56, 7.62s/it, loss=0.5959, acc=0.4250, iter_time=8.22s]
Epoch 0: 5%|▍ | 579/12384 [1:13:46<25:03:06, 7.64s/it, loss=0.5959, acc=0.4250, iter_time=8.22s]
Epoch 0: 5%|▍ | 579/12384 [1:13:53<25:03:06, 7.64s/it, loss=0.5690, acc=0.3461, iter_time=10.46s]
Epoch 0: 5%|▍ | 580/12384 [1:13:53<25:01:19, 7.63s/it, loss=0.5690, acc=0.3461, iter_time=10.46s]
Epoch 0: 5%|▍ | 580/12384 [1:14:01<25:01:19, 7.63s/it, loss=0.5498, acc=0.4017, iter_time=7.58s]
Epoch 0: 5%|▍ | 581/12384 [1:14:01<24:59:15, 7.62s/it, loss=0.5498, acc=0.4017, iter_time=7.58s]
Epoch 0: 5%|▍ | 581/12384 [1:14:09<24:59:15, 7.62s/it, loss=0.6157, acc=0.3405, iter_time=7.63s]
Epoch 0: 5%|▍ | 582/12384 [1:14:09<25:00:35, 7.63s/it, loss=0.6157, acc=0.3405, iter_time=7.63s]
Epoch 0: 5%|▍ | 582/12384 [1:14:16<25:00:35, 7.63s/it, loss=0.7109, acc=0.3274, iter_time=7.63s]
Epoch 0: 5%|▍ | 583/12384 [1:14:16<24:58:35, 7.62s/it, loss=0.7109, acc=0.3274, iter_time=7.63s]
Epoch 0: 5%|▍ | 583/12384 [1:14:24<24:58:35, 7.62s/it, loss=0.6712, acc=0.3274, iter_time=8.01s]
Epoch 0: 5%|▍ | 584/12384 [1:14:24<24:59:13, 7.62s/it, loss=0.6712, acc=0.3274, iter_time=8.01s]
Epoch 0: 5%|▍ | 584/12384 [1:14:31<24:59:13, 7.62s/it, loss=0.6787, acc=0.3461, iter_time=6.94s]
Epoch 0: 5%|▍ | 585/12384 [1:14:31<24:59:22, 7.62s/it, loss=0.6787, acc=0.3461, iter_time=6.94s]
Epoch 0: 5%|▍ | 585/12384 [1:14:39<24:59:22, 7.62s/it, loss=0.5954, acc=0.4031, iter_time=7.91s]
Epoch 0: 5%|▍ | 586/12384 [1:14:39<24:56:42, 7.61s/it, loss=0.5954, acc=0.4031, iter_time=7.91s]
Epoch 0: 5%|▍ | 586/12384 [1:14:47<24:56:42, 7.61s/it, loss=0.3957, acc=0.5013, iter_time=5.41s]
Epoch 0: 5%|▍ | 587/12384 [1:14:47<25:18:35, 7.72s/it, loss=0.3957, acc=0.5013, iter_time=5.41s]
Epoch 0: 5%|▍ | 587/12384 [1:14:55<25:18:35, 7.72s/it, loss=0.5949, acc=0.3541, iter_time=10.18s]
Epoch 0: 5%|▍ | 588/12384 [1:14:55<25:12:43, 7.69s/it, loss=0.5949, acc=0.3541, iter_time=10.18s]
Epoch 0: 5%|▍ | 588/12384 [1:15:02<25:12:43, 7.69s/it, loss=0.4972, acc=0.4393, iter_time=7.61s]
Epoch 0: 5%|▍ | 589/12384 [1:15:02<25:07:34, 7.67s/it, loss=0.4972, acc=0.4393, iter_time=7.61s]
Epoch 0: 5%|▍ | 589/12384 [1:15:10<25:07:34, 7.67s/it, loss=0.5481, acc=0.4159, iter_time=7.32s]
Epoch 0: 5%|▍ | 590/12384 [1:15:10<25:05:02, 7.66s/it, loss=0.5481, acc=0.4159, iter_time=7.32s]
Epoch 0: 5%|▍ | 590/12384 [1:15:17<25:05:02, 7.66s/it, loss=0.5105, acc=0.4439, iter_time=7.92s]
Epoch 0: 5%|▍ | 591/12384 [1:15:17<25:02:00, 7.64s/it, loss=0.5105, acc=0.4439, iter_time=7.92s]
Epoch 0: 5%|▍ | 591/12384 [1:15:25<25:02:00, 7.64s/it, loss=0.5195, acc=0.4352, iter_time=7.57s]
Epoch 0: 5%|▍ | 592/12384 [1:15:25<25:00:38, 7.64s/it, loss=0.5195, acc=0.4352, iter_time=7.57s]
Epoch 0: 5%|▍ | 592/12384 [1:15:33<25:00:38, 7.64s/it, loss=0.4510, acc=0.4830, iter_time=5.93s]
Epoch 0: 5%|▍ | 593/12384 [1:15:33<24:59:17, 7.63s/it, loss=0.4510, acc=0.4830, iter_time=5.93s]
Epoch 0: 5%|▍ | 593/12384 [1:15:40<24:59:17, 7.63s/it, loss=0.4679, acc=0.4683, iter_time=6.20s]
Epoch 0: 5%|▍ | 594/12384 [1:15:40<24:58:53, 7.63s/it, loss=0.4679, acc=0.4683, iter_time=6.20s]
Epoch 0: 5%|▍ | 594/12384 [1:15:48<24:58:53, 7.63s/it, loss=0.3771, acc=0.4850, iter_time=9.74s]
Epoch 0: 5%|▍ | 595/12384 [1:15:48<24:59:10, 7.63s/it, loss=0.3771, acc=0.4850, iter_time=9.74s]
Epoch 0: 5%|▍ | 595/12384 [1:15:56<24:59:10, 7.63s/it, loss=0.6307, acc=0.4445, iter_time=8.67s]
Epoch 0: 5%|▍ | 596/12384 [1:15:56<24:58:36, 7.63s/it, loss=0.6307, acc=0.4445, iter_time=8.67s]
Epoch 0: 5%|▍ | 596/12384 [1:16:03<24:58:36, 7.63s/it, loss=0.4217, acc=0.5000, iter_time=7.71s]
Epoch 0: 5%|▍ | 597/12384 [1:16:03<25:02:34, 7.65s/it, loss=0.4217, acc=0.5000, iter_time=7.71s]
Epoch 0: 5%|▍ | 597/12384 [1:16:11<25:02:34, 7.65s/it, loss=0.4723, acc=0.4528, iter_time=7.03s]
Epoch 0: 5%|▍ | 598/12384 [1:16:11<25:01:09, 7.64s/it, loss=0.4723, acc=0.4528, iter_time=7.03s]
Epoch 0: 5%|▍ | 598/12384 [1:16:19<25:01:09, 7.64s/it, loss=0.4469, acc=0.4722, iter_time=8.33s]
Epoch 0: 5%|▍ | 599/12384 [1:16:19<25:05:52, 7.67s/it, loss=0.4469, acc=0.4722, iter_time=8.33s]
Epoch 0: 5%|▍ | 599/12384 [1:16:26<25:05:52, 7.67s/it, loss=0.4552, acc=0.4872, iter_time=8.02s]
Epoch 0: 5%|▍ | 600/12384 [1:16:26<25:03:41, 7.66s/it, loss=0.4552, acc=0.4872, iter_time=8.02s]
Epoch 0: 5%|▍ | 600/12384 [1:16:34<25:03:41, 7.66s/it, loss=0.3595, acc=0.5681, iter_time=7.20s]
Epoch 0: 5%|▍ | 601/12384 [1:16:34<25:00:03, 7.64s/it, loss=0.3595, acc=0.5681, iter_time=7.20s]
Epoch 0: 5%|▍ | 601/12384 [1:16:41<25:00:03, 7.64s/it, loss=0.3609, acc=0.5647, iter_time=4.75s]
Epoch 0: 5%|▍ | 602/12384 [1:16:41<24:58:07, 7.63s/it, loss=0.3609, acc=0.5647, iter_time=4.75s]
Epoch 0: 5%|▍ | 602/12384 [1:16:49<24:58:07, 7.63s/it, loss=0.4165, acc=0.4867, iter_time=10.46s]
Epoch 0: 5%|▍ | 603/12384 [1:16:49<24:57:00, 7.62s/it, loss=0.4165, acc=0.4867, iter_time=10.46s]
Epoch 0: 5%|▍ | 603/12384 [1:16:57<24:57:00, 7.62s/it, loss=0.3329, acc=0.5583, iter_time=7.63s]
Epoch 0: 5%|▍ | 604/12384 [1:16:57<24:57:40, 7.63s/it, loss=0.3329, acc=0.5583, iter_time=7.63s]
Epoch 0: 5%|▍ | 604/12384 [1:17:04<24:57:40, 7.63s/it, loss=0.3727, acc=0.6073, iter_time=6.43s]
Epoch 0: 5%|▍ | 605/12384 [1:17:04<24:56:31, 7.62s/it, loss=0.3727, acc=0.6073, iter_time=6.43s]
Epoch 0: 5%|▍ | 605/12384 [1:17:12<24:56:31, 7.62s/it, loss=0.4353, acc=0.5041, iter_time=8.80s]
Epoch 0: 5%|▍ | 606/12384 [1:17:12<24:55:38, 7.62s/it, loss=0.4353, acc=0.5041, iter_time=8.80s]
Epoch 0: 5%|▍ | 606/12384 [1:17:20<24:55:38, 7.62s/it, loss=0.3878, acc=0.5552, iter_time=7.61s]
Epoch 0: 5%|▍ | 607/12384 [1:17:20<24:56:49, 7.63s/it, loss=0.3878, acc=0.5552, iter_time=7.61s]
Epoch 0: 5%|▍ | 607/12384 [1:17:27<24:56:49, 7.63s/it, loss=0.4017, acc=0.5565, iter_time=7.63s]
Epoch 0: 5%|▍ | 608/12384 [1:17:27<24:58:56, 7.64s/it, loss=0.4017, acc=0.5565, iter_time=7.63s]
Epoch 0: 5%|▍ | 608/12384 [1:17:35<24:58:56, 7.64s/it, loss=0.3317, acc=0.5880, iter_time=7.65s]
Epoch 0: 5%|▍ | 609/12384 [1:17:35<24:56:06, 7.62s/it, loss=0.3317, acc=0.5880, iter_time=7.65s]
Epoch 0: 5%|▍ | 609/12384 [1:17:42<24:56:06, 7.62s/it, loss=0.4519, acc=0.5520, iter_time=4.08s]
Epoch 0: 5%|▍ | 610/12384 [1:17:42<24:56:05, 7.62s/it, loss=0.4519, acc=0.5520, iter_time=4.08s]
Epoch 0: 5%|▍ | 610/12384 [1:17:50<24:56:05, 7.62s/it, loss=0.3435, acc=0.5490, iter_time=11.14s]
Epoch 0: 5%|▍ | 611/12384 [1:17:50<24:55:35, 7.62s/it, loss=0.3435, acc=0.5490, iter_time=11.14s]
Epoch 0: 5%|▍ | 611/12384 [1:17:58<24:55:35, 7.62s/it, loss=0.2755, acc=0.6547, iter_time=7.69s]
Epoch 0: 5%|▍ | 612/12384 [1:17:58<24:58:16, 7.64s/it, loss=0.2755, acc=0.6547, iter_time=7.69s]
Epoch 0: 5%|▍ | 612/12384 [1:18:06<24:58:16, 7.64s/it, loss=0.3744, acc=0.5785, iter_time=7.95s]
Epoch 0: 5%|▍ | 613/12384 [1:18:06<25:16:26, 7.73s/it, loss=0.3744, acc=0.5785, iter_time=7.95s]
Epoch 0: 5%|▍ | 613/12384 [1:18:13<25:16:26, 7.73s/it, loss=0.3048, acc=0.5805, iter_time=6.67s]
Epoch 0: 5%|▍ | 614/12384 [1:18:13<25:09:52, 7.70s/it, loss=0.3048, acc=0.5805, iter_time=6.67s]
Epoch 0: 5%|▍ | 614/12384 [1:18:21<25:09:52, 7.70s/it, loss=0.3549, acc=0.5883, iter_time=5.78s]
Epoch 0: 5%|▍ | 615/12384 [1:18:21<25:04:59, 7.67s/it, loss=0.3549, acc=0.5883, iter_time=5.78s]
Epoch 0: 5%|▍ | 615/12384 [1:18:29<25:04:59, 7.67s/it, loss=0.2801, acc=0.6477, iter_time=10.87s]
Epoch 0: 5%|▍ | 616/12384 [1:18:29<25:05:43, 7.68s/it, loss=0.2801, acc=0.6477, iter_time=10.87s]
Epoch 0: 5%|▍ | 616/12384 [1:18:36<25:05:43, 7.68s/it, loss=0.3853, acc=0.5475, iter_time=7.20s]
Epoch 0: 5%|▍ | 617/12384 [1:18:36<25:00:20, 7.65s/it, loss=0.3853, acc=0.5475, iter_time=7.20s]
Epoch 0: 5%|▍ | 617/12384 [1:18:44<25:00:20, 7.65s/it, loss=0.2466, acc=0.6661, iter_time=5.80s]
Epoch 0: 5%|▍ | 618/12384 [1:18:44<24:59:16, 7.65s/it, loss=0.2466, acc=0.6661, iter_time=5.80s]
Epoch 0: 5%|▍ | 618/12384 [1:18:52<24:59:16, 7.65s/it, loss=0.3300, acc=0.6636, iter_time=9.45s]
Epoch 0: 5%|▍ | 619/12384 [1:18:52<24:59:15, 7.65s/it, loss=0.3300, acc=0.6636, iter_time=9.45s]
Epoch 0: 5%|▍ | 619/12384 [1:18:59<24:59:15, 7.65s/it, loss=0.3192, acc=0.5931, iter_time=7.65s]
Epoch 0: 5%|▌ | 620/12384 [1:18:59<24:56:42, 7.63s/it, loss=0.3192, acc=0.5931, iter_time=7.65s]
Epoch 0: 5%|▌ | 620/12384 [1:19:07<24:56:42, 7.63s/it, loss=0.2891, acc=0.6302, iter_time=7.60s]
Epoch 0: 5%|▌ | 621/12384 [1:19:07<24:55:28, 7.63s/it, loss=0.2891, acc=0.6302, iter_time=7.60s]
Epoch 0: 5%|▌ | 621/12384 [1:19:14<24:55:28, 7.63s/it, loss=0.2765, acc=0.6749, iter_time=7.62s]
Epoch 0: 5%|▌ | 622/12384 [1:19:14<24:55:28, 7.63s/it, loss=0.2765, acc=0.6749, iter_time=7.62s]
Epoch 0: 5%|▌ | 622/12384 [1:19:22<24:55:28, 7.63s/it, loss=0.2860, acc=0.6268, iter_time=7.62s]
Epoch 0: 5%|▌ | 623/12384 [1:19:22<24:55:29, 7.63s/it, loss=0.2860, acc=0.6268, iter_time=7.62s]
Epoch 0: 5%|▌ | 623/12384 [1:19:30<24:55:29, 7.63s/it, loss=0.2743, acc=0.6085, iter_time=8.03s]
Epoch 0: 5%|▌ | 624/12384 [1:19:30<24:58:00, 7.64s/it, loss=0.2743, acc=0.6085, iter_time=8.03s]
Epoch 0: 5%|▌ | 624/12384 [1:19:37<24:58:00, 7.64s/it, loss=0.3086, acc=0.5790, iter_time=7.30s]
Epoch 0: 5%|▌ | 625/12384 [1:19:37<24:58:40, 7.65s/it, loss=0.3086, acc=0.5790, iter_time=7.30s]
Epoch 0: 5%|▌ | 625/12384 [1:19:45<24:58:40, 7.65s/it, loss=0.2277, acc=0.7522, iter_time=4.04s]
Epoch 0: 5%|▌ | 626/12384 [1:19:45<24:56:33, 7.64s/it, loss=0.2277, acc=0.7522, iter_time=4.04s]
Epoch 0: 5%|▌ | 626/12384 [1:19:53<24:56:33, 7.64s/it, loss=0.2726, acc=0.6821, iter_time=11.19s]
Epoch 0: 5%|▌ | 627/12384 [1:19:53<24:56:15, 7.64s/it, loss=0.2726, acc=0.6821, iter_time=11.19s]
Epoch 0: 5%|▌ | 627/12384 [1:20:00<24:56:15, 7.64s/it, loss=0.2736, acc=0.6190, iter_time=7.63s]
Epoch 0: 5%|▌ | 628/12384 [1:20:00<24:53:31, 7.62s/it, loss=0.2736, acc=0.6190, iter_time=7.63s]
Epoch 0: 5%|▌ | 628/12384 [1:20:08<24:53:31, 7.62s/it, loss=0.2692, acc=0.6231, iter_time=7.60s]
Epoch 0: 5%|▌ | 629/12384 [1:20:08<24:53:11, 7.62s/it, loss=0.2692, acc=0.6231, iter_time=7.60s]
Epoch 0: 5%|▌ | 629/12384 [1:20:15<24:53:11, 7.62s/it, loss=0.3091, acc=0.6119, iter_time=7.65s]
Epoch 0: 5%|▌ | 630/12384 [1:20:15<24:54:08, 7.63s/it, loss=0.3091, acc=0.6119, iter_time=7.65s]
Epoch 0: 5%|▌ | 630/12384 [1:20:23<24:54:08, 7.63s/it, loss=0.2454, acc=0.6875, iter_time=7.60s]
Epoch 0: 5%|▌ | 631/12384 [1:20:23<24:53:49, 7.63s/it, loss=0.2454, acc=0.6875, iter_time=7.60s]
Epoch 0: 5%|▌ | 631/12384 [1:20:31<24:53:49, 7.63s/it, loss=0.3181, acc=0.5758, iter_time=8.02s]
Epoch 0: 5%|▌ | 632/12384 [1:20:31<24:54:42, 7.63s/it, loss=0.3181, acc=0.5758, iter_time=8.02s]
Epoch 0: 5%|▌ | 632/12384 [1:20:38<24:54:42, 7.63s/it, loss=0.2353, acc=0.6825, iter_time=7.26s]
Epoch 0: 5%|▌ | 633/12384 [1:20:38<24:54:11, 7.63s/it, loss=0.2353, acc=0.6825, iter_time=7.26s]
Epoch 0: 5%|▌ | 633/12384 [1:20:46<24:54:11, 7.63s/it, loss=0.2374, acc=0.6985, iter_time=7.63s]
Epoch 0: 5%|▌ | 634/12384 [1:20:46<24:54:02, 7.63s/it, loss=0.2374, acc=0.6985, iter_time=7.63s]
Epoch 0: 5%|▌ | 634/12384 [1:20:54<24:54:02, 7.63s/it, loss=0.2306, acc=0.6765, iter_time=7.62s]
Epoch 0: 5%|▌ | 635/12384 [1:20:54<24:54:11, 7.63s/it, loss=0.2306, acc=0.6765, iter_time=7.62s]
Epoch 0: 5%|▌ | 635/12384 [1:21:01<24:54:11, 7.63s/it, loss=0.1760, acc=0.7782, iter_time=7.64s]
Epoch 0: 5%|▌ | 636/12384 [1:21:01<24:55:33, 7.64s/it, loss=0.1760, acc=0.7782, iter_time=7.64s]
Epoch 0: 5%|▌ | 636/12384 [1:21:09<24:55:33, 7.64s/it, loss=0.1989, acc=0.7082, iter_time=7.66s]
Epoch 0: 5%|▌ | 637/12384 [1:21:09<24:54:22, 7.63s/it, loss=0.1989, acc=0.7082, iter_time=7.66s]
Epoch 0: 5%|▌ | 637/12384 [1:21:16<24:54:22, 7.63s/it, loss=0.2891, acc=0.6458, iter_time=7.59s]
Epoch 0: 5%|▌ | 638/12384 [1:21:16<24:53:03, 7.63s/it, loss=0.2891, acc=0.6458, iter_time=7.59s]
Epoch 0: 5%|▌ | 638/12384 [1:21:24<24:53:03, 7.63s/it, loss=0.2284, acc=0.6844, iter_time=7.63s]
Epoch 0: 5%|▌ | 639/12384 [1:21:24<24:54:25, 7.63s/it, loss=0.2284, acc=0.6844, iter_time=7.63s]
Epoch 0: 5%|▌ | 639/12384 [1:21:32<24:54:25, 7.63s/it, loss=0.2104, acc=0.7344, iter_time=7.96s]
Epoch 0: 5%|▌ | 640/12384 [1:21:32<25:14:01, 7.74s/it, loss=0.2104, acc=0.7344, iter_time=7.96s]
Epoch 0: 5%|▌ | 640/12384 [1:21:40<25:14:01, 7.74s/it, loss=0.2158, acc=0.6910, iter_time=7.66s]
Epoch 0: 5%|▌ | 641/12384 [1:21:40<25:12:03, 7.73s/it, loss=0.2158, acc=0.6910, iter_time=7.66s]
Epoch 0: 5%|▌ | 641/12384 [1:21:47<25:12:03, 7.73s/it, loss=0.1842, acc=0.7450, iter_time=7.72s]
Epoch 0: 5%|▌ | 642/12384 [1:21:47<25:05:16, 7.69s/it, loss=0.1842, acc=0.7450, iter_time=7.72s]
Epoch 0: 5%|▌ | 642/12384 [1:21:55<25:05:16, 7.69s/it, loss=0.2026, acc=0.7683, iter_time=6.66s]
Epoch 0: 5%|▌ | 643/12384 [1:21:55<25:00:55, 7.67s/it, loss=0.2026, acc=0.7683, iter_time=6.66s]
Epoch 0: 5%|▌ | 643/12384 [1:22:03<25:00:55, 7.67s/it, loss=0.1983, acc=0.7110, iter_time=8.55s]
Epoch 0: 5%|▌ | 644/12384 [1:22:03<24:58:22, 7.66s/it, loss=0.1983, acc=0.7110, iter_time=8.55s]
Epoch 0: 5%|▌ | 644/12384 [1:22:10<24:58:22, 7.66s/it, loss=0.1784, acc=0.7248, iter_time=7.65s]
Epoch 0: 5%|▌ | 645/12384 [1:22:10<24:57:46, 7.66s/it, loss=0.1784, acc=0.7248, iter_time=7.65s]
Epoch 0: 5%|▌ | 645/12384 [1:22:18<24:57:46, 7.66s/it, loss=0.1878, acc=0.7608, iter_time=7.65s]
Epoch 0: 5%|▌ | 646/12384 [1:22:18<24:55:50, 7.65s/it, loss=0.1878, acc=0.7608, iter_time=7.65s]
Epoch 0: 5%|▌ | 646/12384 [1:22:26<24:55:50, 7.65s/it, loss=0.1741, acc=0.7487, iter_time=7.61s]
Epoch 0: 5%|▌ | 647/12384 [1:22:26<24:54:07, 7.64s/it, loss=0.1741, acc=0.7487, iter_time=7.61s]
Epoch 0: 5%|▌ | 647/12384 [1:22:33<24:54:07, 7.64s/it, loss=0.1593, acc=0.7560, iter_time=7.99s]
Epoch 0: 5%|▌ | 648/12384 [1:22:33<24:50:56, 7.62s/it, loss=0.1593, acc=0.7560, iter_time=7.99s]
Epoch 0: 5%|▌ | 648/12384 [1:22:41<24:50:56, 7.62s/it, loss=0.1457, acc=0.7830, iter_time=7.22s]
Epoch 0: 5%|▌ | 649/12384 [1:22:41<24:50:07, 7.62s/it, loss=0.1457, acc=0.7830, iter_time=7.22s]
Epoch 0: 5%|▌ | 649/12384 [1:22:48<24:50:07, 7.62s/it, loss=0.5472, acc=0.6766, iter_time=8.09s]
Epoch 0: 5%|▌ | 650/12384 [1:22:48<24:54:13, 7.64s/it, loss=0.5472, acc=0.6766, iter_time=8.09s]
Epoch 0: 5%|▌ | 650/12384 [1:22:56<24:54:13, 7.64s/it, loss=0.1702, acc=0.7698, iter_time=7.23s]
Epoch 0: 5%|▌ | 651/12384 [1:22:56<24:58:10, 7.66s/it, loss=0.1702, acc=0.7698, iter_time=7.23s]
Epoch 0: 5%|▌ | 651/12384 [1:23:04<24:58:10, 7.66s/it, loss=0.1583, acc=0.7757, iter_time=7.71s]
Epoch 0: 5%|▌ | 652/12384 [1:23:04<24:56:24, 7.65s/it, loss=0.1583, acc=0.7757, iter_time=7.71s]
Epoch 0: 5%|▌ | 652/12384 [1:23:11<24:56:24, 7.65s/it, loss=0.2294, acc=0.7074, iter_time=7.64s]
Epoch 0: 5%|▌ | 653/12384 [1:23:11<24:54:14, 7.64s/it, loss=0.2294, acc=0.7074, iter_time=7.64s]
Epoch 0: 5%|▌ | 653/12384 [1:23:19<24:54:14, 7.64s/it, loss=0.1887, acc=0.7309, iter_time=4.91s]
Epoch 0: 5%|▌ | 654/12384 [1:23:19<24:55:45, 7.65s/it, loss=0.1887, acc=0.7309, iter_time=4.91s]
Epoch 0: 5%|▌ | 654/12384 [1:23:27<24:55:45, 7.65s/it, loss=0.1997, acc=0.7227, iter_time=10.36s]
Epoch 0: 5%|▌ | 655/12384 [1:23:27<24:53:39, 7.64s/it, loss=0.1997, acc=0.7227, iter_time=10.36s]
Epoch 0: 5%|▌ | 655/12384 [1:23:34<24:53:39, 7.64s/it, loss=0.1883, acc=0.7143, iter_time=8.01s]
Epoch 0: 5%|▌ | 656/12384 [1:23:34<24:56:41, 7.66s/it, loss=0.1883, acc=0.7143, iter_time=8.01s]
Epoch 0: 5%|▌ | 656/12384 [1:23:42<24:56:41, 7.66s/it, loss=0.1850, acc=0.7220, iter_time=7.31s]
Epoch 0: 5%|▌ | 657/12384 [1:23:42<24:54:15, 7.65s/it, loss=0.1850, acc=0.7220, iter_time=7.31s]
Epoch 0: 5%|▌ | 657/12384 [1:23:50<24:54:15, 7.65s/it, loss=0.1589, acc=0.7959, iter_time=7.60s]
Epoch 0: 5%|▌ | 658/12384 [1:23:50<24:51:19, 7.63s/it, loss=0.1589, acc=0.7959, iter_time=7.60s]
Epoch 0: 5%|▌ | 658/12384 [1:23:57<24:51:19, 7.63s/it, loss=0.1804, acc=0.7430, iter_time=7.63s]
Epoch 0: 5%|▌ | 659/12384 [1:23:57<24:50:51, 7.63s/it, loss=0.1804, acc=0.7430, iter_time=7.63s]
Epoch 0: 5%|▌ | 659/12384 [1:24:05<24:50:51, 7.63s/it, loss=0.1689, acc=0.7517, iter_time=6.64s]
Epoch 0: 5%|▌ | 660/12384 [1:24:05<24:49:57, 7.63s/it, loss=0.1689, acc=0.7517, iter_time=6.64s]
Epoch 0: 5%|▌ | 660/12384 [1:24:12<24:49:57, 7.63s/it, loss=0.1542, acc=0.7555, iter_time=8.60s]
Epoch 0: 5%|▌ | 661/12384 [1:24:12<24:49:37, 7.62s/it, loss=0.1542, acc=0.7555, iter_time=8.60s]
Epoch 0: 5%|▌ | 661/12384 [1:24:20<24:49:37, 7.62s/it, loss=0.1465, acc=0.7940, iter_time=7.61s]
Epoch 0: 5%|▌ | 662/12384 [1:24:20<24:50:38, 7.63s/it, loss=0.1465, acc=0.7940, iter_time=7.61s]
Epoch 0: 5%|▌ | 662/12384 [1:24:28<24:50:38, 7.63s/it, loss=0.2699, acc=0.7406, iter_time=4.85s]
Epoch 0: 5%|▌ | 663/12384 [1:24:28<24:50:10, 7.63s/it, loss=0.2699, acc=0.7406, iter_time=4.85s]
Epoch 0: 5%|▌ | 663/12384 [1:24:35<24:50:10, 7.63s/it, loss=0.1460, acc=0.7966, iter_time=10.34s]
Epoch 0: 5%|▌ | 664/12384 [1:24:35<24:48:23, 7.62s/it, loss=0.1460, acc=0.7966, iter_time=10.34s]
Epoch 0: 5%|▌ | 664/12384 [1:24:43<24:48:23, 7.62s/it, loss=0.2011, acc=0.7543, iter_time=7.66s]
Epoch 0: 5%|▌ | 665/12384 [1:24:43<24:47:21, 7.62s/it, loss=0.2011, acc=0.7543, iter_time=7.66s]
Epoch 0: 5%|▌ | 665/12384 [1:24:51<24:47:21, 7.62s/it, loss=0.1033, acc=0.8417, iter_time=7.97s]
Epoch 0: 5%|▌ | 666/12384 [1:24:51<25:07:31, 7.72s/it, loss=0.1033, acc=0.8417, iter_time=7.97s]
Epoch 0: 5%|▌ | 666/12384 [1:24:58<25:07:31, 7.72s/it, loss=0.1325, acc=0.8130, iter_time=4.24s]
Epoch 0: 5%|▌ | 667/12384 [1:24:58<25:00:41, 7.68s/it, loss=0.1325, acc=0.8130, iter_time=4.24s]
Epoch 0: 5%|▌ | 667/12384 [1:25:06<25:00:41, 7.68s/it, loss=0.1301, acc=0.8045, iter_time=10.98s]
Epoch 0: 5%|▌ | 668/12384 [1:25:06<24:57:19, 7.67s/it, loss=0.1301, acc=0.8045, iter_time=10.98s]
Epoch 0: 5%|▌ | 668/12384 [1:25:14<24:57:19, 7.67s/it, loss=0.0870, acc=0.8850, iter_time=7.61s]
Epoch 0: 5%|▌ | 669/12384 [1:25:14<24:53:58, 7.65s/it, loss=0.0870, acc=0.8850, iter_time=7.61s]
Epoch 0: 5%|▌ | 669/12384 [1:25:21<24:53:58, 7.65s/it, loss=0.1284, acc=0.8570, iter_time=5.55s]
Epoch 0: 5%|▌ | 670/12384 [1:25:21<24:51:27, 7.64s/it, loss=0.1284, acc=0.8570, iter_time=5.55s]
Epoch 0: 5%|▌ | 670/12384 [1:25:29<24:51:27, 7.64s/it, loss=0.1239, acc=0.8027, iter_time=9.45s]
Epoch 0: 5%|▌ | 671/12384 [1:25:29<24:48:41, 7.63s/it, loss=0.1239, acc=0.8027, iter_time=9.45s]
Epoch 0: 5%|▌ | 671/12384 [1:25:37<24:48:41, 7.63s/it, loss=0.1621, acc=0.7987, iter_time=7.77s]
Epoch 0: 5%|▌ | 672/12384 [1:25:37<24:47:36, 7.62s/it, loss=0.1621, acc=0.7987, iter_time=7.77s]
Epoch 0: 5%|▌ | 672/12384 [1:25:44<24:47:36, 7.62s/it, loss=0.1057, acc=0.8301, iter_time=6.71s]
Epoch 0: 5%|▌ | 673/12384 [1:25:44<24:45:45, 7.61s/it, loss=0.1057, acc=0.8301, iter_time=6.71s]
Epoch 0: 5%|▌ | 673/12384 [1:25:52<24:45:45, 7.61s/it, loss=0.1210, acc=0.8217, iter_time=5.03s]
Epoch 0: 5%|▌ | 674/12384 [1:25:52<24:44:23, 7.61s/it, loss=0.1210, acc=0.8217, iter_time=5.03s]
Epoch 0: 5%|▌ | 674/12384 [1:25:59<24:44:23, 7.61s/it, loss=0.1094, acc=0.8175, iter_time=11.12s]
Epoch 0: 5%|▌ | 675/12384 [1:25:59<24:45:14, 7.61s/it, loss=0.1094, acc=0.8175, iter_time=11.12s]
Epoch 0: 5%|▌ | 675/12384 [1:26:07<24:45:14, 7.61s/it, loss=0.1182, acc=0.8119, iter_time=7.63s]
Epoch 0: 5%|▌ | 676/12384 [1:26:07<24:46:54, 7.62s/it, loss=0.1182, acc=0.8119, iter_time=7.63s]
Epoch 0: 5%|▌ | 676/12384 [1:26:15<24:46:54, 7.62s/it, loss=0.1030, acc=0.8589, iter_time=7.62s]
Epoch 0: 5%|▌ | 677/12384 [1:26:15<24:45:25, 7.61s/it, loss=0.1030, acc=0.8589, iter_time=7.62s]
Epoch 0: 5%|▌ | 677/12384 [1:26:22<24:45:25, 7.61s/it, loss=0.1066, acc=0.8447, iter_time=7.60s]
Epoch 0: 5%|▌ | 678/12384 [1:26:22<24:45:09, 7.61s/it, loss=0.1066, acc=0.8447, iter_time=7.60s]
Epoch 0: 5%|▌ | 678/12384 [1:26:30<24:45:09, 7.61s/it, loss=0.2320, acc=0.7491, iter_time=5.89s]
Epoch 0: 5%|▌ | 679/12384 [1:26:30<24:48:34, 7.63s/it, loss=0.2320, acc=0.7491, iter_time=5.89s]
Epoch 0: 5%|▌ | 679/12384 [1:26:37<24:48:34, 7.63s/it, loss=0.1286, acc=0.8239, iter_time=9.36s]
Epoch 0: 5%|▌ | 680/12384 [1:26:37<24:48:24, 7.63s/it, loss=0.1286, acc=0.8239, iter_time=9.36s]
Epoch 0: 5%|▌ | 680/12384 [1:26:45<24:48:24, 7.63s/it, loss=0.1085, acc=0.8316, iter_time=7.74s]
Epoch 0: 5%|▌ | 681/12384 [1:26:45<24:51:48, 7.65s/it, loss=0.1085, acc=0.8316, iter_time=7.74s]
Epoch 0: 5%|▌ | 681/12384 [1:26:53<24:51:48, 7.65s/it, loss=0.1281, acc=0.8363, iter_time=4.83s]
Epoch 0: 6%|▌ | 682/12384 [1:26:53<24:48:47, 7.63s/it, loss=0.1281, acc=0.8363, iter_time=4.83s]
Epoch 0: 6%|▌ | 682/12384 [1:27:00<24:48:47, 7.63s/it, loss=0.1252, acc=0.7980, iter_time=10.37s]
Epoch 0: 6%|▌ | 683/12384 [1:27:00<24:47:03, 7.63s/it, loss=0.1252, acc=0.7980, iter_time=10.37s]
Epoch 0: 6%|▌ | 683/12384 [1:27:08<24:47:03, 7.63s/it, loss=0.1029, acc=0.8516, iter_time=6.39s]
Epoch 0: 6%|▌ | 684/12384 [1:27:08<24:46:05, 7.62s/it, loss=0.1029, acc=0.8516, iter_time=6.39s]
Epoch 0: 6%|▌ | 684/12384 [1:27:16<24:46:05, 7.62s/it, loss=0.1170, acc=0.8091, iter_time=7.89s]
Epoch 0: 6%|▌ | 685/12384 [1:27:16<24:45:17, 7.62s/it, loss=0.1170, acc=0.8091, iter_time=7.89s]
Epoch 0: 6%|▌ | 685/12384 [1:27:23<24:45:17, 7.62s/it, loss=0.1126, acc=0.8357, iter_time=8.57s]
Epoch 0: 6%|▌ | 686/12384 [1:27:23<24:46:02, 7.62s/it, loss=0.1126, acc=0.8357, iter_time=8.57s]
Epoch 0: 6%|▌ | 686/12384 [1:27:31<24:46:02, 7.62s/it, loss=0.1068, acc=0.8461, iter_time=7.61s]
Epoch 0: 6%|▌ | 687/12384 [1:27:31<24:48:58, 7.64s/it, loss=0.1068, acc=0.8461, iter_time=7.61s]
Epoch 0: 6%|▌ | 687/12384 [1:27:39<24:48:58, 7.64s/it, loss=0.1303, acc=0.7917, iter_time=8.08s]
Epoch 0: 6%|▌ | 688/12384 [1:27:39<24:47:10, 7.63s/it, loss=0.1303, acc=0.7917, iter_time=8.08s]
Epoch 0: 6%|▌ | 688/12384 [1:27:46<24:47:10, 7.63s/it, loss=0.0904, acc=0.8535, iter_time=7.22s]
Epoch 0: 6%|▌ | 689/12384 [1:27:46<24:45:44, 7.62s/it, loss=0.0904, acc=0.8535, iter_time=7.22s]
Epoch 0: 6%|▌ | 689/12384 [1:27:54<24:45:44, 7.62s/it, loss=0.0984, acc=0.8331, iter_time=6.41s]
Epoch 0: 6%|▌ | 690/12384 [1:27:54<24:45:29, 7.62s/it, loss=0.0984, acc=0.8331, iter_time=6.41s]
Epoch 0: 6%|▌ | 690/12384 [1:28:01<24:45:29, 7.62s/it, loss=0.0922, acc=0.8241, iter_time=8.82s]
Epoch 0: 6%|▌ | 691/12384 [1:28:01<24:45:17, 7.62s/it, loss=0.0922, acc=0.8241, iter_time=8.82s]
Epoch 0: 6%|▌ | 691/12384 [1:28:09<24:45:17, 7.62s/it, loss=0.0948, acc=0.8603, iter_time=7.63s]
Epoch 0: 6%|▌ | 692/12384 [1:28:09<24:44:53, 7.62s/it, loss=0.0948, acc=0.8603, iter_time=7.63s]
Epoch 0: 6%|▌ | 692/12384 [1:28:17<24:44:53, 7.62s/it, loss=0.1180, acc=0.7963, iter_time=7.98s]
Epoch 0: 6%|▌ | 693/12384 [1:28:17<25:05:51, 7.73s/it, loss=0.1180, acc=0.7963, iter_time=7.98s]
Epoch 0: 6%|▌ | 693/12384 [1:28:25<25:05:51, 7.73s/it, loss=0.0900, acc=0.8600, iter_time=7.04s]
Epoch 0: 6%|▌ | 694/12384 [1:28:25<24:58:35, 7.69s/it, loss=0.0900, acc=0.8600, iter_time=7.04s]
Epoch 0: 6%|▌ | 694/12384 [1:28:32<24:58:35, 7.69s/it, loss=0.0790, acc=0.8869, iter_time=4.62s]
Epoch 0: 6%|▌ | 695/12384 [1:28:32<24:53:40, 7.67s/it, loss=0.0790, acc=0.8869, iter_time=4.62s]
Epoch 0: 6%|▌ | 695/12384 [1:28:40<24:53:40, 7.67s/it, loss=0.0894, acc=0.8583, iter_time=11.24s]
Epoch 0: 6%|▌ | 696/12384 [1:28:40<24:48:52, 7.64s/it, loss=0.0894, acc=0.8583, iter_time=11.24s]
Epoch 0: 6%|▌ | 696/12384 [1:28:47<24:48:52, 7.64s/it, loss=0.0741, acc=0.9231, iter_time=4.88s]
Epoch 0: 6%|▌ | 697/12384 [1:28:47<24:48:18, 7.64s/it, loss=0.0741, acc=0.9231, iter_time=4.88s]
Epoch 0: 6%|▌ | 697/12384 [1:28:55<24:48:18, 7.64s/it, loss=0.0698, acc=0.9087, iter_time=8.45s]
Epoch 0: 6%|▌ | 698/12384 [1:28:55<24:49:37, 7.65s/it, loss=0.0698, acc=0.9087, iter_time=8.45s]
Epoch 0: 6%|▌ | 698/12384 [1:29:03<24:49:37, 7.65s/it, loss=0.1081, acc=0.8482, iter_time=8.52s]
Epoch 0: 6%|▌ | 699/12384 [1:29:03<24:46:36, 7.63s/it, loss=0.1081, acc=0.8482, iter_time=8.52s]
Epoch 0: 6%|▌ | 699/12384 [1:29:10<24:46:36, 7.63s/it, loss=0.0867, acc=0.8817, iter_time=8.95s]
Epoch 0: 6%|▌ | 700/12384 [1:29:10<24:45:36, 7.63s/it, loss=0.0867, acc=0.8817, iter_time=8.95s]
Epoch 0: 6%|▌ | 700/12384 [1:29:18<24:45:36, 7.63s/it, loss=0.0964, acc=0.8674, iter_time=7.21s]
Epoch 0: 6%|▌ | 701/12384 [1:29:18<24:43:55, 7.62s/it, loss=0.0964, acc=0.8674, iter_time=7.21s]
Epoch 0: 6%|▌ | 701/12384 [1:29:26<24:43:55, 7.62s/it, loss=0.0901, acc=0.8500, iter_time=7.59s]
Epoch 0: 6%|▌ | 702/12384 [1:29:26<24:43:02, 7.62s/it, loss=0.0901, acc=0.8500, iter_time=7.59s]
Epoch 0: 6%|▌ | 702/12384 [1:29:33<24:43:02, 7.62s/it, loss=0.0658, acc=0.9008, iter_time=7.62s]
Epoch 0: 6%|▌ | 703/12384 [1:29:33<24:43:34, 7.62s/it, loss=0.0658, acc=0.9008, iter_time=7.62s]
Epoch 0: 6%|▌ | 703/12384 [1:29:41<24:43:34, 7.62s/it, loss=0.0634, acc=0.9081, iter_time=7.60s]
Epoch 0: 6%|▌ | 704/12384 [1:29:41<24:44:49, 7.63s/it, loss=0.0634, acc=0.9081, iter_time=7.60s]
Epoch 0: 6%|▌ | 704/12384 [1:29:48<24:44:49, 7.63s/it, loss=0.0883, acc=0.8853, iter_time=5.11s]
Epoch 0: 6%|▌ | 705/12384 [1:29:48<24:45:56, 7.63s/it, loss=0.0883, acc=0.8853, iter_time=5.11s]
Epoch 0: 6%|▌ | 705/12384 [1:29:56<24:45:56, 7.63s/it, loss=0.0550, acc=0.9202, iter_time=10.22s]
Epoch 0: 6%|▌ | 706/12384 [1:29:56<24:44:36, 7.63s/it, loss=0.0550, acc=0.9202, iter_time=10.22s]
Epoch 0: 6%|▌ | 706/12384 [1:30:04<24:44:36, 7.63s/it, loss=0.0729, acc=0.8906, iter_time=7.59s]
Epoch 0: 6%|▌ | 707/12384 [1:30:04<24:43:05, 7.62s/it, loss=0.0729, acc=0.8906, iter_time=7.59s]
Epoch 0: 6%|▌ | 707/12384 [1:30:11<24:43:05, 7.62s/it, loss=0.0740, acc=0.8916, iter_time=7.60s]
Epoch 0: 6%|▌ | 708/12384 [1:30:11<24:42:30, 7.62s/it, loss=0.0740, acc=0.8916, iter_time=7.60s]
Epoch 0: 6%|▌ | 708/12384 [1:30:19<24:42:30, 7.62s/it, loss=0.0685, acc=0.8963, iter_time=7.65s]
Epoch 0: 6%|▌ | 709/12384 [1:30:19<24:42:55, 7.62s/it, loss=0.0685, acc=0.8963, iter_time=7.65s]
Epoch 0: 6%|▌ | 709/12384 [1:30:27<24:42:55, 7.62s/it, loss=0.0775, acc=0.8660, iter_time=4.74s]
Epoch 0: 6%|▌ | 710/12384 [1:30:27<24:42:58, 7.62s/it, loss=0.0775, acc=0.8660, iter_time=4.74s]
Epoch 0: 6%|▌ | 710/12384 [1:30:34<24:42:58, 7.62s/it, loss=0.0849, acc=0.8621, iter_time=10.49s]
Epoch 0: 6%|▌ | 711/12384 [1:30:34<24:43:06, 7.62s/it, loss=0.0849, acc=0.8621, iter_time=10.49s]
Epoch 0: 6%|▌ | 711/12384 [1:30:42<24:43:06, 7.62s/it, loss=0.1700, acc=0.8447, iter_time=8.01s]
Epoch 0: 6%|▌ | 712/12384 [1:30:42<24:44:20, 7.63s/it, loss=0.1700, acc=0.8447, iter_time=8.01s]
Epoch 0: 6%|▌ | 712/12384 [1:30:49<24:44:20, 7.63s/it, loss=0.1077, acc=0.8246, iter_time=7.25s]
Epoch 0: 6%|▌ | 713/12384 [1:30:49<24:44:01, 7.63s/it, loss=0.1077, acc=0.8246, iter_time=7.25s]
Epoch 0: 6%|▌ | 713/12384 [1:30:57<24:44:01, 7.63s/it, loss=0.0854, acc=0.8363, iter_time=7.00s]
Epoch 0: 6%|▌ | 714/12384 [1:30:57<24:44:32, 7.63s/it, loss=0.0854, acc=0.8363, iter_time=7.00s]
Epoch 0: 6%|▌ | 714/12384 [1:31:05<24:44:32, 7.63s/it, loss=0.0722, acc=0.8962, iter_time=8.28s]
Epoch 0: 6%|▌ | 715/12384 [1:31:05<24:44:02, 7.63s/it, loss=0.0722, acc=0.8962, iter_time=8.28s]
Epoch 0: 6%|▌ | 715/12384 [1:31:12<24:44:02, 7.63s/it, loss=0.0606, acc=0.8994, iter_time=7.63s]
Epoch 0: 6%|▌ | 716/12384 [1:31:12<24:43:10, 7.63s/it, loss=0.0606, acc=0.8994, iter_time=7.63s]
Epoch 0: 6%|▌ | 716/12384 [1:31:20<24:43:10, 7.63s/it, loss=0.0475, acc=0.9392, iter_time=7.63s]
Epoch 0: 6%|▌ | 717/12384 [1:31:20<24:44:41, 7.64s/it, loss=0.0475, acc=0.9392, iter_time=7.63s]
Epoch 0: 6%|▌ | 717/12384 [1:31:28<24:44:41, 7.64s/it, loss=0.0816, acc=0.8632, iter_time=5.83s]
Epoch 0: 6%|▌ | 718/12384 [1:31:28<24:46:54, 7.65s/it, loss=0.0816, acc=0.8632, iter_time=5.83s]
Epoch 0: 6%|▌ | 718/12384 [1:31:36<24:46:54, 7.65s/it, loss=0.0579, acc=0.9244, iter_time=9.53s]
Epoch 0: 6%|▌ | 719/12384 [1:31:36<25:03:12, 7.73s/it, loss=0.0579, acc=0.9244, iter_time=9.53s]
Epoch 0: 6%|▌ | 719/12384 [1:31:43<25:03:12, 7.73s/it, loss=0.0795, acc=0.8675, iter_time=8.25s]
Epoch 0: 6%|▌ | 720/12384 [1:31:43<24:56:20, 7.70s/it, loss=0.0795, acc=0.8675, iter_time=8.25s]
Epoch 0: 6%|▌ | 720/12384 [1:31:51<24:56:20, 7.70s/it, loss=0.1032, acc=0.8775, iter_time=7.23s]
Epoch 0: 6%|▌ | 721/12384 [1:31:51<24:50:47, 7.67s/it, loss=0.1032, acc=0.8775, iter_time=7.23s]
Epoch 0: 6%|▌ | 721/12384 [1:31:58<24:50:47, 7.67s/it, loss=0.0504, acc=0.9207, iter_time=6.40s]
Epoch 0: 6%|▌ | 722/12384 [1:31:58<24:47:12, 7.65s/it, loss=0.0504, acc=0.9207, iter_time=6.40s]
Epoch 0: 6%|▌ | 722/12384 [1:32:06<24:47:12, 7.65s/it, loss=0.0539, acc=0.9084, iter_time=8.82s]
Epoch 0: 6%|▌ | 723/12384 [1:32:06<24:44:49, 7.64s/it, loss=0.0539, acc=0.9084, iter_time=8.82s]
Epoch 0: 6%|▌ | 723/12384 [1:32:14<24:44:49, 7.64s/it, loss=0.0381, acc=0.9335, iter_time=7.64s]
Epoch 0: 6%|▌ | 724/12384 [1:32:14<24:44:05, 7.64s/it, loss=0.0381, acc=0.9335, iter_time=7.64s]
Epoch 0: 6%|▌ | 724/12384 [1:32:21<24:44:05, 7.64s/it, loss=0.0722, acc=0.8600, iter_time=4.24s]
Epoch 0: 6%|▌ | 725/12384 [1:32:21<24:44:21, 7.64s/it, loss=0.0722, acc=0.8600, iter_time=4.24s]
Epoch 0: 6%|▌ | 725/12384 [1:32:29<24:44:21, 7.64s/it, loss=0.0608, acc=0.9031, iter_time=10.99s]
Epoch 0: 6%|▌ | 726/12384 [1:32:29<24:41:09, 7.62s/it, loss=0.0608, acc=0.9031, iter_time=10.99s]
Epoch 0: 6%|▌ | 726/12384 [1:32:36<24:41:09, 7.62s/it, loss=0.0619, acc=0.8999, iter_time=7.61s]
Epoch 0: 6%|▌ | 727/12384 [1:32:36<24:40:09, 7.62s/it, loss=0.0619, acc=0.8999, iter_time=7.61s]
Epoch 0: 6%|▌ | 727/12384 [1:32:44<24:40:09, 7.62s/it, loss=0.0478, acc=0.9378, iter_time=7.56s]
Epoch 0: 6%|▌ | 728/12384 [1:32:44<24:40:33, 7.62s/it, loss=0.0478, acc=0.9378, iter_time=7.56s]
Epoch 0: 6%|▌ | 728/12384 [1:32:52<24:40:33, 7.62s/it, loss=0.0641, acc=0.8799, iter_time=7.67s]
Epoch 0: 6%|▌ | 729/12384 [1:32:52<24:40:07, 7.62s/it, loss=0.0641, acc=0.8799, iter_time=7.67s]
Epoch 0: 6%|▌ | 729/12384 [1:32:59<24:40:07, 7.62s/it, loss=0.0731, acc=0.8553, iter_time=7.61s]
Epoch 0: 6%|▌ | 730/12384 [1:32:59<24:40:31, 7.62s/it, loss=0.0731, acc=0.8553, iter_time=7.61s]
Epoch 0: 6%|▌ | 730/12384 [1:33:07<24:40:31, 7.62s/it, loss=0.1067, acc=0.8781, iter_time=4.57s]
Epoch 0: 6%|▌ | 731/12384 [1:33:07<24:40:21, 7.62s/it, loss=0.1067, acc=0.8781, iter_time=4.57s]
Epoch 0: 6%|▌ | 731/12384 [1:33:15<24:40:21, 7.62s/it, loss=0.0433, acc=0.9237, iter_time=7.88s]
Epoch 0: 6%|▌ | 732/12384 [1:33:15<24:47:29, 7.66s/it, loss=0.0433, acc=0.9237, iter_time=7.88s]
Epoch 0: 6%|▌ | 732/12384 [1:33:22<24:47:29, 7.66s/it, loss=0.0792, acc=0.8588, iter_time=10.54s]
Epoch 0: 6%|▌ | 733/12384 [1:33:22<24:43:54, 7.64s/it, loss=0.0792, acc=0.8588, iter_time=10.54s]
Epoch 0: 6%|▌ | 733/12384 [1:33:30<24:43:54, 7.64s/it, loss=0.0611, acc=0.8962, iter_time=6.12s]
Epoch 0: 6%|▌ | 734/12384 [1:33:30<24:42:06, 7.63s/it, loss=0.0611, acc=0.8962, iter_time=6.12s]
Epoch 0: 6%|▌ | 734/12384 [1:33:38<24:42:06, 7.63s/it, loss=0.0508, acc=0.9140, iter_time=7.90s]
Epoch 0: 6%|▌ | 735/12384 [1:33:38<24:42:42, 7.64s/it, loss=0.0508, acc=0.9140, iter_time=7.90s]
Epoch 0: 6%|▌ | 735/12384 [1:33:45<24:42:42, 7.64s/it, loss=0.0514, acc=0.9079, iter_time=9.23s]
Epoch 0: 6%|▌ | 736/12384 [1:33:45<24:43:22, 7.64s/it, loss=0.0514, acc=0.9079, iter_time=9.23s]
Epoch 0: 6%|▌ | 736/12384 [1:33:53<24:43:22, 7.64s/it, loss=0.0416, acc=0.9099, iter_time=4.97s]
Epoch 0: 6%|▌ | 737/12384 [1:33:53<24:40:51, 7.63s/it, loss=0.0416, acc=0.9099, iter_time=4.97s]
Epoch 0: 6%|▌ | 737/12384 [1:34:00<24:40:51, 7.63s/it, loss=0.0669, acc=0.9022, iter_time=9.88s]
Epoch 0: 6%|▌ | 738/12384 [1:34:00<24:39:41, 7.62s/it, loss=0.0669, acc=0.9022, iter_time=9.88s]
Epoch 0: 6%|▌ | 738/12384 [1:34:08<24:39:41, 7.62s/it, loss=0.0615, acc=0.8823, iter_time=7.64s]
Epoch 0: 6%|▌ | 739/12384 [1:34:08<24:40:06, 7.63s/it, loss=0.0615, acc=0.8823, iter_time=7.64s]
Epoch 0: 6%|▌ | 739/12384 [1:34:16<24:40:06, 7.63s/it, loss=0.0527, acc=0.9117, iter_time=5.84s]
Epoch 0: 6%|▌ | 740/12384 [1:34:16<24:38:56, 7.62s/it, loss=0.0527, acc=0.9117, iter_time=5.84s]
Epoch 0: 6%|▌ | 740/12384 [1:34:23<24:38:56, 7.62s/it, loss=0.2882, acc=0.8259, iter_time=9.40s]
Epoch 0: 6%|▌ | 741/12384 [1:34:23<24:38:08, 7.62s/it, loss=0.2882, acc=0.8259, iter_time=9.40s]
Epoch 0: 6%|▌ | 741/12384 [1:34:31<24:38:08, 7.62s/it, loss=0.0423, acc=0.9260, iter_time=7.61s]
Epoch 0: 6%|▌ | 742/12384 [1:34:31<24:39:11, 7.62s/it, loss=0.0423, acc=0.9260, iter_time=7.61s]
Epoch 0: 6%|▌ | 742/12384 [1:34:39<24:39:11, 7.62s/it, loss=0.1944, acc=0.8498, iter_time=7.62s]
Epoch 0: 6%|▌ | 743/12384 [1:34:39<24:39:03, 7.62s/it, loss=0.1944, acc=0.8498, iter_time=7.62s]
Epoch 0: 6%|▌ | 743/12384 [1:34:46<24:39:03, 7.62s/it, loss=0.0475, acc=0.9173, iter_time=8.01s]
Epoch 0: 6%|▌ | 744/12384 [1:34:46<24:37:39, 7.62s/it, loss=0.0475, acc=0.9173, iter_time=8.01s]
Epoch 0: 6%|▌ | 744/12384 [1:34:54<24:37:39, 7.62s/it, loss=0.0418, acc=0.9344, iter_time=7.58s]
Epoch 0: 6%|▌ | 745/12384 [1:34:54<24:57:56, 7.72s/it, loss=0.0418, acc=0.9344, iter_time=7.58s]
Epoch 0: 6%|▌ | 745/12384 [1:35:02<24:57:56, 7.72s/it, loss=0.0362, acc=0.9393, iter_time=7.64s]
Epoch 0: 6%|▌ | 746/12384 [1:35:02<24:55:48, 7.71s/it, loss=0.0362, acc=0.9393, iter_time=7.64s]
Epoch 0: 6%|▌ | 746/12384 [1:35:09<24:55:48, 7.71s/it, loss=0.0492, acc=0.9118, iter_time=7.68s]
Epoch 0: 6%|▌ | 747/12384 [1:35:09<24:50:59, 7.69s/it, loss=0.0492, acc=0.9118, iter_time=7.68s]
Epoch 0: 6%|▌ | 747/12384 [1:35:17<24:50:59, 7.69s/it, loss=0.0421, acc=0.9215, iter_time=7.60s]
Epoch 0: 6%|▌ | 748/12384 [1:35:17<24:46:44, 7.67s/it, loss=0.0421, acc=0.9215, iter_time=7.60s]
Epoch 0: 6%|▌ | 748/12384 [1:35:25<24:46:44, 7.67s/it, loss=0.0498, acc=0.9077, iter_time=7.03s]
Epoch 0: 6%|▌ | 749/12384 [1:35:25<24:43:10, 7.65s/it, loss=0.0498, acc=0.9077, iter_time=7.03s]
Epoch 0: 6%|▌ | 749/12384 [1:35:32<24:43:10, 7.65s/it, loss=0.0403, acc=0.9203, iter_time=8.60s]
Epoch 0: 6%|▌ | 750/12384 [1:35:32<24:41:13, 7.64s/it, loss=0.0403, acc=0.9203, iter_time=8.60s]
Epoch 0: 6%|▌ | 750/12384 [1:35:40<24:41:13, 7.64s/it, loss=0.0426, acc=0.9344, iter_time=4.62s]
Epoch 0: 6%|▌ | 751/12384 [1:35:40<24:38:10, 7.62s/it, loss=0.0426, acc=0.9344, iter_time=4.62s]
Epoch 0: 6%|▌ | 751/12384 [1:35:47<24:38:10, 7.62s/it, loss=0.0385, acc=0.9451, iter_time=10.55s]
Epoch 0: 6%|▌ | 752/12384 [1:35:47<24:38:11, 7.62s/it, loss=0.0385, acc=0.9451, iter_time=10.55s]
Epoch 0: 6%|▌ | 752/12384 [1:35:55<24:38:11, 7.62s/it, loss=0.0454, acc=0.9209, iter_time=7.26s]
Epoch 0: 6%|▌ | 753/12384 [1:35:55<24:38:31, 7.63s/it, loss=0.0454, acc=0.9209, iter_time=7.26s]
Epoch 0: 6%|▌ | 753/12384 [1:36:03<24:38:31, 7.63s/it, loss=0.0460, acc=0.9189, iter_time=7.63s]
Epoch 0: 6%|▌ | 754/12384 [1:36:03<24:37:45, 7.62s/it, loss=0.0460, acc=0.9189, iter_time=7.63s]
Epoch 0: 6%|▌ | 754/12384 [1:36:10<24:37:45, 7.62s/it, loss=0.0374, acc=0.9321, iter_time=7.63s]
Epoch 0: 6%|▌ | 755/12384 [1:36:10<24:38:37, 7.63s/it, loss=0.0374, acc=0.9321, iter_time=7.63s]
Epoch 0: 6%|▌ | 755/12384 [1:36:18<24:38:37, 7.63s/it, loss=0.2389, acc=0.8068, iter_time=7.64s]
Epoch 0: 6%|▌ | 756/12384 [1:36:18<24:38:25, 7.63s/it, loss=0.2389, acc=0.8068, iter_time=7.64s]
Epoch 0: 6%|▌ | 756/12384 [1:36:26<24:38:25, 7.63s/it, loss=0.0358, acc=0.9233, iter_time=6.42s]
Epoch 0: 6%|▌ | 757/12384 [1:36:26<24:36:58, 7.62s/it, loss=0.0358, acc=0.9233, iter_time=6.42s]
Epoch 0: 6%|▌ | 757/12384 [1:36:33<24:36:58, 7.62s/it, loss=0.0413, acc=0.9177, iter_time=5.06s]
Epoch 0: 6%|▌ | 758/12384 [1:36:33<24:38:14, 7.63s/it, loss=0.0413, acc=0.9177, iter_time=5.06s]
Epoch 0: 6%|▌ | 758/12384 [1:36:41<24:38:14, 7.63s/it, loss=0.0433, acc=0.9107, iter_time=11.39s]
Epoch 0: 6%|▌ | 759/12384 [1:36:41<24:36:46, 7.62s/it, loss=0.0433, acc=0.9107, iter_time=11.39s]
Epoch 0: 6%|▌ | 759/12384 [1:36:48<24:36:46, 7.62s/it, loss=0.0476, acc=0.9100, iter_time=7.99s]
Epoch 0: 6%|▌ | 760/12384 [1:36:48<24:36:50, 7.62s/it, loss=0.0476, acc=0.9100, iter_time=7.99s]
Epoch 0: 6%|▌ | 760/12384 [1:36:56<24:36:50, 7.62s/it, loss=0.0376, acc=0.9324, iter_time=7.24s]
Epoch 0: 6%|▌ | 761/12384 [1:36:56<24:36:22, 7.62s/it, loss=0.0376, acc=0.9324, iter_time=7.24s]
Epoch 0: 6%|▌ | 761/12384 [1:37:04<24:36:22, 7.62s/it, loss=0.0320, acc=0.9410, iter_time=7.63s]
Epoch 0: 6%|▌ | 762/12384 [1:37:04<24:35:58, 7.62s/it, loss=0.0320, acc=0.9410, iter_time=7.63s]
Epoch 0: 6%|▌ | 762/12384 [1:37:11<24:35:58, 7.62s/it, loss=0.0305, acc=0.9541, iter_time=7.59s]
Epoch 0: 6%|▌ | 763/12384 [1:37:11<24:33:59, 7.61s/it, loss=0.0305, acc=0.9541, iter_time=7.59s]
Epoch 0: 6%|▌ | 763/12384 [1:37:19<24:33:59, 7.61s/it, loss=0.0218, acc=0.9674, iter_time=4.48s]
Epoch 0: 6%|▌ | 764/12384 [1:37:19<24:34:14, 7.61s/it, loss=0.0218, acc=0.9674, iter_time=4.48s]
Epoch 0: 6%|▌ | 764/12384 [1:37:27<24:34:14, 7.61s/it, loss=0.0439, acc=0.9072, iter_time=10.14s]
Epoch 0: 6%|▌ | 765/12384 [1:37:27<24:32:56, 7.61s/it, loss=0.0439, acc=0.9072, iter_time=10.14s]
Epoch 0: 6%|▌ | 765/12384 [1:37:34<24:32:56, 7.61s/it, loss=0.0369, acc=0.9161, iter_time=6.69s]
Epoch 0: 6%|▌ | 766/12384 [1:37:34<24:32:13, 7.60s/it, loss=0.0369, acc=0.9161, iter_time=6.69s]
Epoch 0: 6%|▌ | 766/12384 [1:37:42<24:32:13, 7.60s/it, loss=0.0224, acc=0.9585, iter_time=6.51s]
Epoch 0: 6%|▌ | 767/12384 [1:37:42<24:32:33, 7.61s/it, loss=0.0224, acc=0.9585, iter_time=6.51s]
Epoch 0: 6%|▌ | 767/12384 [1:37:49<24:32:33, 7.61s/it, loss=0.0324, acc=0.9430, iter_time=10.57s]
Epoch 0: 6%|▌ | 768/12384 [1:37:49<24:37:40, 7.63s/it, loss=0.0324, acc=0.9430, iter_time=10.57s]
Epoch 0: 6%|▌ | 768/12384 [1:37:57<24:37:40, 7.63s/it, loss=0.0343, acc=0.9382, iter_time=7.31s]
Epoch 0: 6%|▌ | 769/12384 [1:37:57<24:36:58, 7.63s/it, loss=0.0343, acc=0.9382, iter_time=7.31s]
Epoch 0: 6%|▌ | 769/12384 [1:38:05<24:36:58, 7.63s/it, loss=0.0252, acc=0.9551, iter_time=7.64s]
Epoch 0: 6%|▌ | 770/12384 [1:38:05<24:36:26, 7.63s/it, loss=0.0252, acc=0.9551, iter_time=7.64s]
Epoch 0: 6%|▌ | 770/12384 [1:38:13<24:36:26, 7.63s/it, loss=0.0245, acc=0.9624, iter_time=7.96s]
Epoch 0: 6%|▌ | 771/12384 [1:38:13<24:59:13, 7.75s/it, loss=0.0245, acc=0.9624, iter_time=7.96s]
Epoch 0: 6%|▌ | 771/12384 [1:38:20<24:59:13, 7.75s/it, loss=0.0603, acc=0.9035, iter_time=7.69s]
Epoch 0: 6%|▌ | 772/12384 [1:38:20<24:50:49, 7.70s/it, loss=0.0603, acc=0.9035, iter_time=7.69s]
Epoch 0: 6%|▌ | 772/12384 [1:38:28<24:50:49, 7.70s/it, loss=0.0358, acc=0.9470, iter_time=7.61s]
Epoch 0: 6%|▌ | 773/12384 [1:38:28<24:45:23, 7.68s/it, loss=0.0358, acc=0.9470, iter_time=7.61s]
Epoch 0: 6%|▌ | 773/12384 [1:38:35<24:45:23, 7.68s/it, loss=0.0329, acc=0.9433, iter_time=7.59s]
Epoch 0: 6%|▋ | 774/12384 [1:38:35<24:40:34, 7.65s/it, loss=0.0329, acc=0.9433, iter_time=7.59s]
Epoch 0: 6%|▋ | 774/12384 [1:38:43<24:40:34, 7.65s/it, loss=0.0414, acc=0.9172, iter_time=7.62s]
Epoch 0: 6%|▋ | 775/12384 [1:38:43<24:38:40, 7.64s/it, loss=0.0414, acc=0.9172, iter_time=7.62s]
Epoch 0: 6%|▋ | 775/12384 [1:38:51<24:38:40, 7.64s/it, loss=0.0435, acc=0.9129, iter_time=7.61s]
Epoch 0: 6%|▋ | 776/12384 [1:38:51<24:39:52, 7.65s/it, loss=0.0435, acc=0.9129, iter_time=7.61s]
Epoch 0: 6%|▋ | 776/12384 [1:38:58<24:39:52, 7.65s/it, loss=0.0413, acc=0.9174, iter_time=7.66s]
Epoch 0: 6%|▋ | 777/12384 [1:38:58<24:42:41, 7.66s/it, loss=0.0413, acc=0.9174, iter_time=7.66s]
Epoch 0: 6%|▋ | 777/12384 [1:39:06<24:42:41, 7.66s/it, loss=0.0217, acc=0.9563, iter_time=7.70s]
Epoch 0: 6%|▋ | 778/12384 [1:39:06<24:38:23, 7.64s/it, loss=0.0217, acc=0.9563, iter_time=7.70s]
Epoch 0: 6%|▋ | 778/12384 [1:39:14<24:38:23, 7.64s/it, loss=0.0147, acc=0.9767, iter_time=7.61s]
Epoch 0: 6%|▋ | 779/12384 [1:39:14<24:35:56, 7.63s/it, loss=0.0147, acc=0.9767, iter_time=7.61s]
Epoch 0: 6%|▋ | 779/12384 [1:39:21<24:35:56, 7.63s/it, loss=0.0325, acc=0.9460, iter_time=7.61s]
Epoch 0: 6%|▋ | 780/12384 [1:39:21<24:35:58, 7.63s/it, loss=0.0325, acc=0.9460, iter_time=7.61s]
Epoch 0: 6%|▋ | 780/12384 [1:39:29<24:35:58, 7.63s/it, loss=0.0236, acc=0.9511, iter_time=7.62s]
Epoch 0: 6%|▋ | 781/12384 [1:39:29<24:35:44, 7.63s/it, loss=0.0236, acc=0.9511, iter_time=7.62s]
Epoch 0: 6%|▋ | 781/12384 [1:39:37<24:35:44, 7.63s/it, loss=0.0372, acc=0.9306, iter_time=7.65s]
Epoch 0: 6%|▋ | 782/12384 [1:39:37<24:35:02, 7.63s/it, loss=0.0372, acc=0.9306, iter_time=7.65s]
Epoch 0: 6%|▋ | 782/12384 [1:39:44<24:35:02, 7.63s/it, loss=0.0322, acc=0.9463, iter_time=7.62s]
Epoch 0: 6%|▋ | 783/12384 [1:39:44<24:34:30, 7.63s/it, loss=0.0322, acc=0.9463, iter_time=7.62s]
Epoch 0: 6%|▋ | 783/12384 [1:39:52<24:34:30, 7.63s/it, loss=0.0329, acc=0.9219, iter_time=7.98s]
Epoch 0: 6%|▋ | 784/12384 [1:39:52<24:34:14, 7.63s/it, loss=0.0329, acc=0.9219, iter_time=7.98s]
Epoch 0: 6%|▋ | 784/12384 [1:39:59<24:34:14, 7.63s/it, loss=0.0226, acc=0.9606, iter_time=7.25s]
Epoch 0: 6%|▋ | 785/12384 [1:39:59<24:32:39, 7.62s/it, loss=0.0226, acc=0.9606, iter_time=7.25s]
Epoch 0: 6%|▋ | 785/12384 [1:40:07<24:32:39, 7.62s/it, loss=0.0223, acc=0.9485, iter_time=4.48s]
Epoch 0: 6%|▋ | 786/12384 [1:40:07<24:33:25, 7.62s/it, loss=0.0223, acc=0.9485, iter_time=4.48s]
Epoch 0: 6%|▋ | 786/12384 [1:40:15<24:33:25, 7.62s/it, loss=0.0278, acc=0.9428, iter_time=7.70s]
Epoch 0: 6%|▋ | 787/12384 [1:40:15<24:33:07, 7.62s/it, loss=0.0278, acc=0.9428, iter_time=7.70s]
Epoch 0: 6%|▋ | 787/12384 [1:40:22<24:33:07, 7.62s/it, loss=0.0504, acc=0.9505, iter_time=10.66s]
Epoch 0: 6%|▋ | 788/12384 [1:40:22<24:33:30, 7.62s/it, loss=0.0504, acc=0.9505, iter_time=10.66s]
Epoch 0: 6%|▋ | 788/12384 [1:40:30<24:33:30, 7.62s/it, loss=0.0368, acc=0.9307, iter_time=5.65s]
Epoch 0: 6%|▋ | 789/12384 [1:40:30<24:32:01, 7.62s/it, loss=0.0368, acc=0.9307, iter_time=5.65s]
Epoch 0: 6%|▋ | 789/12384 [1:40:37<24:32:01, 7.62s/it, loss=0.0212, acc=0.9632, iter_time=9.59s]
Epoch 0: 6%|▋ | 790/12384 [1:40:37<24:30:39, 7.61s/it, loss=0.0212, acc=0.9632, iter_time=9.59s]
Epoch 0: 6%|▋ | 790/12384 [1:40:45<24:30:39, 7.61s/it, loss=0.0132, acc=0.9784, iter_time=7.60s]
Epoch 0: 6%|▋ | 791/12384 [1:40:45<24:30:50, 7.61s/it, loss=0.0132, acc=0.9784, iter_time=7.60s]
Epoch 0: 6%|▋ | 791/12384 [1:40:53<24:30:50, 7.61s/it, loss=0.0365, acc=0.9404, iter_time=8.01s]
Epoch 0: 6%|▋ | 792/12384 [1:40:53<24:34:18, 7.63s/it, loss=0.0365, acc=0.9404, iter_time=8.01s]
Epoch 0: 6%|▋ | 792/12384 [1:41:00<24:34:18, 7.63s/it, loss=0.0260, acc=0.9553, iter_time=7.26s]
Epoch 0: 6%|▋ | 793/12384 [1:41:00<24:32:09, 7.62s/it, loss=0.0260, acc=0.9553, iter_time=7.26s]
Epoch 0: 6%|▋ | 793/12384 [1:41:08<24:32:09, 7.62s/it, loss=0.0291, acc=0.9496, iter_time=7.60s]
Epoch 0: 6%|▋ | 794/12384 [1:41:08<24:31:51, 7.62s/it, loss=0.0291, acc=0.9496, iter_time=7.60s]
Epoch 0: 6%|▋ | 794/12384 [1:41:16<24:31:51, 7.62s/it, loss=0.0271, acc=0.9485, iter_time=7.64s]
Epoch 0: 6%|▋ | 795/12384 [1:41:16<24:31:05, 7.62s/it, loss=0.0271, acc=0.9485, iter_time=7.64s]
Epoch 0: 6%|▋ | 795/12384 [1:41:23<24:31:05, 7.62s/it, loss=0.0204, acc=0.9546, iter_time=6.99s]
Epoch 0: 6%|▋ | 796/12384 [1:41:23<24:31:46, 7.62s/it, loss=0.0204, acc=0.9546, iter_time=6.99s]
Epoch 0: 6%|▋ | 796/12384 [1:41:31<24:31:46, 7.62s/it, loss=0.0223, acc=0.9566, iter_time=7.37s]
Epoch 0: 6%|▋ | 797/12384 [1:41:31<24:52:50, 7.73s/it, loss=0.0223, acc=0.9566, iter_time=7.37s]
Epoch 0: 6%|▋ | 797/12384 [1:41:39<24:52:50, 7.73s/it, loss=0.0206, acc=0.9566, iter_time=7.95s]
Epoch 0: 6%|▋ | 798/12384 [1:41:39<24:46:00, 7.70s/it, loss=0.0206, acc=0.9566, iter_time=7.95s]
Epoch 0: 6%|▋ | 798/12384 [1:41:46<24:46:00, 7.70s/it, loss=0.0391, acc=0.9299, iter_time=8.51s]
Epoch 0: 6%|▋ | 799/12384 [1:41:46<24:40:22, 7.67s/it, loss=0.0391, acc=0.9299, iter_time=8.51s]
Epoch 0: 6%|▋ | 799/12384 [1:41:54<24:40:22, 7.67s/it, loss=0.0206, acc=0.9578, iter_time=8.03s]
Epoch 0: 6%|▋ | 800/12384 [1:41:54<24:38:09, 7.66s/it, loss=0.0206, acc=0.9578, iter_time=8.03s]
Epoch 0: 6%|▋ | 800/12384 [1:42:02<24:38:09, 7.66s/it, loss=0.0146, acc=0.9847, iter_time=6.97s]
Epoch 0: 6%|▋ | 801/12384 [1:42:02<24:35:28, 7.64s/it, loss=0.0146, acc=0.9847, iter_time=6.97s]
Epoch 0: 6%|▋ | 801/12384 [1:42:09<24:35:28, 7.64s/it, loss=0.0232, acc=0.9486, iter_time=7.84s]
Epoch 0: 6%|▋ | 802/12384 [1:42:09<24:35:17, 7.64s/it, loss=0.0232, acc=0.9486, iter_time=7.84s]
Epoch 0: 6%|▋ | 802/12384 [1:42:17<24:35:17, 7.64s/it, loss=0.0218, acc=0.9438, iter_time=7.68s]
Epoch 0: 6%|▋ | 803/12384 [1:42:17<24:34:29, 7.64s/it, loss=0.0218, acc=0.9438, iter_time=7.68s]
Epoch 0: 6%|▋ | 803/12384 [1:42:25<24:34:29, 7.64s/it, loss=0.0136, acc=0.9779, iter_time=4.57s]
Epoch 0: 6%|▋ | 804/12384 [1:42:25<24:32:18, 7.63s/it, loss=0.0136, acc=0.9779, iter_time=4.57s]
Epoch 0: 6%|▋ | 804/12384 [1:42:32<24:32:18, 7.63s/it, loss=0.1280, acc=0.8572, iter_time=10.64s]
Epoch 0: 7%|▋ | 805/12384 [1:42:32<24:34:21, 7.64s/it, loss=0.1280, acc=0.8572, iter_time=10.64s]
Epoch 0: 7%|▋ | 805/12384 [1:42:40<24:34:21, 7.64s/it, loss=0.0136, acc=0.9759, iter_time=5.36s]
Epoch 0: 7%|▋ | 806/12384 [1:42:40<24:31:52, 7.63s/it, loss=0.0136, acc=0.9759, iter_time=5.36s]
Epoch 0: 7%|▋ | 806/12384 [1:42:47<24:31:52, 7.63s/it, loss=0.0248, acc=0.9487, iter_time=9.88s]
Epoch 0: 7%|▋ | 807/12384 [1:42:47<24:31:40, 7.63s/it, loss=0.0248, acc=0.9487, iter_time=9.88s]
Epoch 0: 7%|▋ | 807/12384 [1:42:55<24:31:40, 7.63s/it, loss=0.0342, acc=0.9406, iter_time=8.02s]
Epoch 0: 7%|▋ | 808/12384 [1:42:55<24:30:15, 7.62s/it, loss=0.0342, acc=0.9406, iter_time=8.02s]
Epoch 0: 7%|▋ | 808/12384 [1:43:03<24:30:15, 7.62s/it, loss=0.0202, acc=0.9641, iter_time=7.25s]
Epoch 0: 7%|▋ | 809/12384 [1:43:03<24:30:12, 7.62s/it, loss=0.0202, acc=0.9641, iter_time=7.25s]
Epoch 0: 7%|▋ | 809/12384 [1:43:10<24:30:12, 7.62s/it, loss=0.0208, acc=0.9636, iter_time=7.30s]
Epoch 0: 7%|▋ | 810/12384 [1:43:10<24:28:29, 7.61s/it, loss=0.0208, acc=0.9636, iter_time=7.30s]
Epoch 0: 7%|▋ | 810/12384 [1:43:18<24:28:29, 7.61s/it, loss=0.0102, acc=0.9779, iter_time=7.61s]
Epoch 0: 7%|▋ | 811/12384 [1:43:18<24:28:02, 7.61s/it, loss=0.0102, acc=0.9779, iter_time=7.61s]
Epoch 0: 7%|▋ | 811/12384 [1:43:25<24:28:02, 7.61s/it, loss=0.0138, acc=0.9719, iter_time=7.88s]
Epoch 0: 7%|▋ | 812/12384 [1:43:25<24:26:40, 7.60s/it, loss=0.0138, acc=0.9719, iter_time=7.88s]
Epoch 0: 7%|▋ | 812/12384 [1:43:33<24:26:40, 7.60s/it, loss=0.0200, acc=0.9673, iter_time=6.10s]
Epoch 0: 7%|▋ | 813/12384 [1:43:33<24:26:11, 7.60s/it, loss=0.0200, acc=0.9673, iter_time=6.10s]
Epoch 0: 7%|▋ | 813/12384 [1:43:41<24:26:11, 7.60s/it, loss=0.0177, acc=0.9668, iter_time=9.10s]
Epoch 0: 7%|▋ | 814/12384 [1:43:41<24:27:26, 7.61s/it, loss=0.0177, acc=0.9668, iter_time=9.10s]
Epoch 0: 7%|▋ | 814/12384 [1:43:48<24:27:26, 7.61s/it, loss=0.0260, acc=0.9547, iter_time=7.64s]
Epoch 0: 7%|▋ | 815/12384 [1:43:48<24:29:34, 7.62s/it, loss=0.0260, acc=0.9547, iter_time=7.64s]
Epoch 0: 7%|▋ | 815/12384 [1:43:56<24:29:34, 7.62s/it, loss=0.0171, acc=0.9675, iter_time=8.02s]
Epoch 0: 7%|▋ | 816/12384 [1:43:56<24:29:59, 7.62s/it, loss=0.0171, acc=0.9675, iter_time=8.02s]
Epoch 0: 7%|▋ | 816/12384 [1:44:04<24:29:59, 7.62s/it, loss=0.0211, acc=0.9575, iter_time=7.24s]
Epoch 0: 7%|▋ | 817/12384 [1:44:04<24:31:41, 7.63s/it, loss=0.0211, acc=0.9575, iter_time=7.24s]
Epoch 0: 7%|▋ | 817/12384 [1:44:11<24:31:41, 7.63s/it, loss=0.0166, acc=0.9642, iter_time=7.67s]
Epoch 0: 7%|▋ | 818/12384 [1:44:11<24:30:48, 7.63s/it, loss=0.0166, acc=0.9642, iter_time=7.67s]
Epoch 0: 7%|▋ | 818/12384 [1:44:19<24:30:48, 7.63s/it, loss=0.0184, acc=0.9657, iter_time=7.32s]
Epoch 0: 7%|▋ | 819/12384 [1:44:19<24:29:42, 7.62s/it, loss=0.0184, acc=0.9657, iter_time=7.32s]
Epoch 0: 7%|▋ | 819/12384 [1:44:26<24:29:42, 7.62s/it, loss=0.0115, acc=0.9805, iter_time=7.90s]
Epoch 0: 7%|▋ | 820/12384 [1:44:26<24:29:39, 7.63s/it, loss=0.0115, acc=0.9805, iter_time=7.90s]
Epoch 0: 7%|▋ | 820/12384 [1:44:34<24:29:39, 7.63s/it, loss=0.0213, acc=0.9653, iter_time=7.62s]
Epoch 0: 7%|▋ | 821/12384 [1:44:34<24:29:19, 7.62s/it, loss=0.0213, acc=0.9653, iter_time=7.62s]
Epoch 0: 7%|▋ | 821/12384 [1:44:42<24:29:19, 7.62s/it, loss=0.0547, acc=0.9348, iter_time=7.63s]
Epoch 0: 7%|▋ | 822/12384 [1:44:42<24:27:59, 7.62s/it, loss=0.0547, acc=0.9348, iter_time=7.63s]
Epoch 0: 7%|▋ | 822/12384 [1:44:49<24:27:59, 7.62s/it, loss=0.0178, acc=0.9724, iter_time=7.61s]
Epoch 0: 7%|▋ | 823/12384 [1:44:49<24:27:58, 7.62s/it, loss=0.0178, acc=0.9724, iter_time=7.61s]
Epoch 0: 7%|▋ | 823/12384 [1:44:57<24:27:58, 7.62s/it, loss=0.0149, acc=0.9660, iter_time=8.37s]
Epoch 0: 7%|▋ | 824/12384 [1:44:57<24:52:53, 7.75s/it, loss=0.0149, acc=0.9660, iter_time=8.37s]
Epoch 0: 7%|▋ | 824/12384 [1:45:05<24:52:53, 7.75s/it, loss=0.0109, acc=0.9790, iter_time=7.30s]
Epoch 0: 7%|▋ | 825/12384 [1:45:05<24:44:43, 7.71s/it, loss=0.0109, acc=0.9790, iter_time=7.30s]
Epoch 0: 7%|▋ | 825/12384 [1:45:13<24:44:43, 7.71s/it, loss=0.0300, acc=0.9550, iter_time=7.61s]
Epoch 0: 7%|▋ | 826/12384 [1:45:13<24:39:17, 7.68s/it, loss=0.0300, acc=0.9550, iter_time=7.61s]
Epoch 0: 7%|▋ | 826/12384 [1:45:20<24:39:17, 7.68s/it, loss=0.0191, acc=0.9618, iter_time=7.63s]
Epoch 0: 7%|▋ | 827/12384 [1:45:20<24:36:00, 7.66s/it, loss=0.0191, acc=0.9618, iter_time=7.63s]
Epoch 0: 7%|▋ | 827/12384 [1:45:28<24:36:00, 7.66s/it, loss=0.0233, acc=0.9660, iter_time=7.63s]
Epoch 0: 7%|▋ | 828/12384 [1:45:28<24:33:13, 7.65s/it, loss=0.0233, acc=0.9660, iter_time=7.63s]
Epoch 0: 7%|▋ | 828/12384 [1:45:35<24:33:13, 7.65s/it, loss=0.0082, acc=0.9861, iter_time=4.22s]
Epoch 0: 7%|▋ | 829/12384 [1:45:35<24:31:18, 7.64s/it, loss=0.0082, acc=0.9861, iter_time=4.22s]
Epoch 0: 7%|▋ | 829/12384 [1:45:43<24:31:18, 7.64s/it, loss=0.0175, acc=0.9750, iter_time=10.98s]
Epoch 0: 7%|▋ | 830/12384 [1:45:43<24:29:22, 7.63s/it, loss=0.0175, acc=0.9750, iter_time=10.98s]
Epoch 0: 7%|▋ | 830/12384 [1:45:51<24:29:22, 7.63s/it, loss=0.0136, acc=0.9682, iter_time=5.82s]
Epoch 0: 7%|▋ | 831/12384 [1:45:51<24:28:44, 7.63s/it, loss=0.0136, acc=0.9682, iter_time=5.82s]
Epoch 0: 7%|▋ | 831/12384 [1:45:58<24:28:44, 7.63s/it, loss=0.0292, acc=0.9414, iter_time=9.80s]
Epoch 0: 7%|▋ | 832/12384 [1:45:58<24:27:19, 7.62s/it, loss=0.0292, acc=0.9414, iter_time=9.80s]
Epoch 0: 7%|▋ | 832/12384 [1:46:06<24:27:19, 7.62s/it, loss=0.0427, acc=0.9348, iter_time=7.23s]
Epoch 0: 7%|▋ | 833/12384 [1:46:06<24:26:31, 7.62s/it, loss=0.0427, acc=0.9348, iter_time=7.23s]
Epoch 0: 7%|▋ | 833/12384 [1:46:14<24:26:31, 7.62s/it, loss=0.0132, acc=0.9743, iter_time=7.62s]
Epoch 0: 7%|▋ | 834/12384 [1:46:14<24:25:49, 7.61s/it, loss=0.0132, acc=0.9743, iter_time=7.62s]
Epoch 0: 7%|▋ | 834/12384 [1:46:21<24:25:49, 7.61s/it, loss=0.0149, acc=0.9716, iter_time=7.62s]
Epoch 0: 7%|▋ | 835/12384 [1:46:21<24:29:43, 7.64s/it, loss=0.0149, acc=0.9716, iter_time=7.62s]
Epoch 0: 7%|▋ | 835/12384 [1:46:29<24:29:43, 7.64s/it, loss=0.0830, acc=0.8892, iter_time=7.69s]
Epoch 0: 7%|▋ | 836/12384 [1:46:29<24:29:57, 7.64s/it, loss=0.0830, acc=0.8892, iter_time=7.69s]
Epoch 0: 7%|▋ | 836/12384 [1:46:36<24:29:57, 7.64s/it, loss=0.0171, acc=0.9771, iter_time=7.61s]
Epoch 0: 7%|▋ | 837/12384 [1:46:36<24:27:30, 7.63s/it, loss=0.0171, acc=0.9771, iter_time=7.61s]
Epoch 0: 7%|▋ | 837/12384 [1:46:44<24:27:30, 7.63s/it, loss=0.0181, acc=0.9716, iter_time=7.29s]
Epoch 0: 7%|▋ | 838/12384 [1:46:44<24:29:08, 7.63s/it, loss=0.0181, acc=0.9716, iter_time=7.29s]
Epoch 0: 7%|▋ | 838/12384 [1:46:52<24:29:08, 7.63s/it, loss=0.0183, acc=0.9586, iter_time=7.99s]
Epoch 0: 7%|▋ | 839/12384 [1:46:52<24:28:19, 7.63s/it, loss=0.0183, acc=0.9586, iter_time=7.99s]
Epoch 0: 7%|▋ | 839/12384 [1:46:59<24:28:19, 7.63s/it, loss=0.0255, acc=0.9595, iter_time=8.01s]
Epoch 0: 7%|▋ | 840/12384 [1:46:59<24:28:12, 7.63s/it, loss=0.0255, acc=0.9595, iter_time=8.01s]
Epoch 0: 7%|▋ | 840/12384 [1:47:07<24:28:12, 7.63s/it, loss=0.0117, acc=0.9781, iter_time=6.90s]
Epoch 0: 7%|▋ | 841/12384 [1:47:07<24:25:48, 7.62s/it, loss=0.0117, acc=0.9781, iter_time=6.90s]
Epoch 0: 7%|▋ | 841/12384 [1:47:15<24:25:48, 7.62s/it, loss=0.0146, acc=0.9687, iter_time=3.73s]
Epoch 0: 7%|▋ | 842/12384 [1:47:15<24:24:26, 7.61s/it, loss=0.0146, acc=0.9687, iter_time=3.73s]
Epoch 0: 7%|▋ | 842/12384 [1:47:22<24:24:26, 7.61s/it, loss=0.0187, acc=0.9623, iter_time=11.78s]
Epoch 0: 7%|▋ | 843/12384 [1:47:22<24:24:18, 7.61s/it, loss=0.0187, acc=0.9623, iter_time=11.78s]
Epoch 0: 7%|▋ | 843/12384 [1:47:30<24:24:18, 7.61s/it, loss=0.0185, acc=0.9599, iter_time=7.61s]
Epoch 0: 7%|▋ | 844/12384 [1:47:30<24:24:06, 7.61s/it, loss=0.0185, acc=0.9599, iter_time=7.61s]
Epoch 0: 7%|▋ | 844/12384 [1:47:37<24:24:06, 7.61s/it, loss=0.0190, acc=0.9611, iter_time=7.62s]
Epoch 0: 7%|▋ | 845/12384 [1:47:37<24:23:46, 7.61s/it, loss=0.0190, acc=0.9611, iter_time=7.62s]
Epoch 0: 7%|▋ | 845/12384 [1:47:45<24:23:46, 7.61s/it, loss=0.0199, acc=0.9600, iter_time=7.60s]
Epoch 0: 7%|▋ | 846/12384 [1:47:45<24:23:04, 7.61s/it, loss=0.0199, acc=0.9600, iter_time=7.60s]
Epoch 0: 7%|▋ | 846/12384 [1:47:53<24:23:04, 7.61s/it, loss=0.0184, acc=0.9687, iter_time=7.64s]
Epoch 0: 7%|▋ | 847/12384 [1:47:53<24:24:40, 7.62s/it, loss=0.0184, acc=0.9687, iter_time=7.64s]
Epoch 0: 7%|▋ | 847/12384 [1:48:00<24:24:40, 7.62s/it, loss=0.0247, acc=0.9549, iter_time=7.99s]
Epoch 0: 7%|▋ | 848/12384 [1:48:00<24:23:45, 7.61s/it, loss=0.0247, acc=0.9549, iter_time=7.99s]
Epoch 0: 7%|▋ | 848/12384 [1:48:08<24:23:45, 7.61s/it, loss=0.0103, acc=0.9804, iter_time=6.92s]
Epoch 0: 7%|▋ | 849/12384 [1:48:08<24:21:59, 7.60s/it, loss=0.0103, acc=0.9804, iter_time=6.92s]
Epoch 0: 7%|▋ | 849/12384 [1:48:16<24:21:59, 7.60s/it, loss=0.0157, acc=0.9599, iter_time=8.61s]
Epoch 0: 7%|▋ | 850/12384 [1:48:16<24:41:16, 7.71s/it, loss=0.0157, acc=0.9599, iter_time=8.61s]
Epoch 0: 7%|▋ | 850/12384 [1:48:23<24:41:16, 7.71s/it, loss=0.0110, acc=0.9740, iter_time=4.39s]
Epoch 0: 7%|▋ | 851/12384 [1:48:23<24:36:22, 7.68s/it, loss=0.0110, acc=0.9740, iter_time=4.39s]
Epoch 0: 7%|▋ | 851/12384 [1:48:31<24:36:22, 7.68s/it, loss=0.0098, acc=0.9892, iter_time=10.11s]
Epoch 0: 7%|▋ | 852/12384 [1:48:31<24:31:42, 7.66s/it, loss=0.0098, acc=0.9892, iter_time=10.11s]
Epoch 0: 7%|▋ | 852/12384 [1:48:39<24:31:42, 7.66s/it, loss=0.0091, acc=0.9914, iter_time=7.93s]
Epoch 0: 7%|▋ | 853/12384 [1:48:39<24:28:46, 7.64s/it, loss=0.0091, acc=0.9914, iter_time=7.93s]
Epoch 0: 7%|▋ | 853/12384 [1:48:46<24:28:46, 7.64s/it, loss=0.0138, acc=0.9651, iter_time=7.61s]
Epoch 0: 7%|▋ | 854/12384 [1:48:46<24:26:26, 7.63s/it, loss=0.0138, acc=0.9651, iter_time=7.61s]
Epoch 0: 7%|▋ | 854/12384 [1:48:54<24:26:26, 7.63s/it, loss=0.0156, acc=0.9751, iter_time=7.02s]
Epoch 0: 7%|▋ | 855/12384 [1:48:54<24:26:08, 7.63s/it, loss=0.0156, acc=0.9751, iter_time=7.02s]
Epoch 0: 7%|▋ | 855/12384 [1:49:01<24:26:08, 7.63s/it, loss=0.0105, acc=0.9799, iter_time=8.16s]
Epoch 0: 7%|▋ | 856/12384 [1:49:01<24:25:03, 7.63s/it, loss=0.0105, acc=0.9799, iter_time=8.16s]
Epoch 0: 7%|▋ | 856/12384 [1:49:09<24:25:03, 7.63s/it, loss=0.0139, acc=0.9761, iter_time=4.64s]
Epoch 0: 7%|▋ | 857/12384 [1:49:09<24:26:17, 7.63s/it, loss=0.0139, acc=0.9761, iter_time=4.64s]
Epoch 0: 7%|▋ | 857/12384 [1:49:17<24:26:17, 7.63s/it, loss=0.0122, acc=0.9790, iter_time=10.65s]
Epoch 0: 7%|▋ | 858/12384 [1:49:17<24:25:08, 7.63s/it, loss=0.0122, acc=0.9790, iter_time=10.65s]
Epoch 0: 7%|▋ | 858/12384 [1:49:24<24:25:08, 7.63s/it, loss=0.0114, acc=0.9785, iter_time=7.61s]
Epoch 0: 7%|▋ | 859/12384 [1:49:24<24:22:49, 7.62s/it, loss=0.0114, acc=0.9785, iter_time=7.61s]
Epoch 0: 7%|▋ | 859/12384 [1:49:32<24:22:49, 7.62s/it, loss=0.0241, acc=0.9603, iter_time=7.62s]
Epoch 0: 7%|▋ | 860/12384 [1:49:32<24:23:36, 7.62s/it, loss=0.0241, acc=0.9603, iter_time=7.62s]
Epoch 0: 7%|▋ | 860/12384 [1:49:40<24:23:36, 7.62s/it, loss=0.0264, acc=0.9568, iter_time=7.63s]
Epoch 0: 7%|▋ | 861/12384 [1:49:40<24:24:32, 7.63s/it, loss=0.0264, acc=0.9568, iter_time=7.63s]
Epoch 0: 7%|▋ | 861/12384 [1:49:47<24:24:32, 7.63s/it, loss=0.0171, acc=0.9744, iter_time=7.33s]
Epoch 0: 7%|▋ | 862/12384 [1:49:47<24:22:07, 7.61s/it, loss=0.0171, acc=0.9744, iter_time=7.33s]
Epoch 0: 7%|▋ | 862/12384 [1:49:55<24:22:07, 7.61s/it, loss=0.0183, acc=0.9586, iter_time=7.88s]
Epoch 0: 7%|▋ | 863/12384 [1:49:55<24:21:42, 7.61s/it, loss=0.0183, acc=0.9586, iter_time=7.88s]
Epoch 0: 7%|▋ | 863/12384 [1:50:02<24:21:42, 7.61s/it, loss=0.0103, acc=0.9789, iter_time=8.02s]
Epoch 0: 7%|▋ | 864/12384 [1:50:02<24:26:35, 7.64s/it, loss=0.0103, acc=0.9789, iter_time=8.02s]
Epoch 0: 7%|▋ | 864/12384 [1:50:10<24:26:35, 7.64s/it, loss=0.0187, acc=0.9501, iter_time=7.29s]
Epoch 0: 7%|▋ | 865/12384 [1:50:10<24:30:13, 7.66s/it, loss=0.0187, acc=0.9501, iter_time=7.29s]
Epoch 0: 7%|▋ | 865/12384 [1:50:18<24:30:13, 7.66s/it, loss=0.0153, acc=0.9754, iter_time=4.40s]
Epoch 0: 7%|▋ | 866/12384 [1:50:18<24:27:55, 7.65s/it, loss=0.0153, acc=0.9754, iter_time=4.40s]
Epoch 0: 7%|▋ | 866/12384 [1:50:25<24:27:55, 7.65s/it, loss=0.0112, acc=0.9740, iter_time=10.91s]
Epoch 0: 7%|▋ | 867/12384 [1:50:25<24:25:58, 7.64s/it, loss=0.0112, acc=0.9740, iter_time=10.91s]
Epoch 0: 7%|▋ | 867/12384 [1:50:33<24:25:58, 7.64s/it, loss=0.0184, acc=0.9793, iter_time=7.63s]
Epoch 0: 7%|▋ | 868/12384 [1:50:33<24:26:01, 7.64s/it, loss=0.0184, acc=0.9793, iter_time=7.63s]
Epoch 0: 7%|▋ | 868/12384 [1:50:41<24:26:01, 7.64s/it, loss=0.0242, acc=0.9358, iter_time=5.84s]
Epoch 0: 7%|▋ | 869/12384 [1:50:41<24:25:23, 7.64s/it, loss=0.0242, acc=0.9358, iter_time=5.84s]
Epoch 0: 7%|▋ | 869/12384 [1:50:48<24:25:23, 7.64s/it, loss=0.0123, acc=0.9805, iter_time=9.44s]
Epoch 0: 7%|▋ | 870/12384 [1:50:48<24:24:33, 7.63s/it, loss=0.0123, acc=0.9805, iter_time=9.44s]
Epoch 0: 7%|▋ | 870/12384 [1:50:56<24:24:33, 7.63s/it, loss=0.0182, acc=0.9721, iter_time=7.62s]
Epoch 0: 7%|▋ | 871/12384 [1:50:56<24:23:33, 7.63s/it, loss=0.0182, acc=0.9721, iter_time=7.62s]
Epoch 0: 7%|▋ | 871/12384 [1:51:04<24:23:33, 7.63s/it, loss=0.0118, acc=0.9708, iter_time=8.04s]
Epoch 0: 7%|▋ | 872/12384 [1:51:04<24:23:29, 7.63s/it, loss=0.0118, acc=0.9708, iter_time=8.04s]
Epoch 0: 7%|▋ | 872/12384 [1:51:11<24:23:29, 7.63s/it, loss=0.0070, acc=0.9855, iter_time=7.20s]
Epoch 0: 7%|▋ | 873/12384 [1:51:11<24:21:53, 7.62s/it, loss=0.0070, acc=0.9855, iter_time=7.20s]
Epoch 0: 7%|▋ | 873/12384 [1:51:19<24:21:53, 7.62s/it, loss=0.0155, acc=0.9646, iter_time=7.62s]
Epoch 0: 7%|▋ | 874/12384 [1:51:19<24:22:50, 7.63s/it, loss=0.0155, acc=0.9646, iter_time=7.62s]
Epoch 0: 7%|▋ | 874/12384 [1:51:26<24:22:50, 7.63s/it, loss=0.0104, acc=0.9835, iter_time=6.19s]
Epoch 0: 7%|▋ | 875/12384 [1:51:26<24:21:05, 7.62s/it, loss=0.0104, acc=0.9835, iter_time=6.19s]
Epoch 0: 7%|▋ | 875/12384 [1:51:34<24:21:05, 7.62s/it, loss=0.0385, acc=0.9483, iter_time=6.48s]
Epoch 0: 7%|▋ | 876/12384 [1:51:34<24:20:03, 7.61s/it, loss=0.0385, acc=0.9483, iter_time=6.48s]
Epoch 0: 7%|▋ | 876/12384 [1:51:42<24:20:03, 7.61s/it, loss=0.0079, acc=0.9851, iter_time=7.64s]
Epoch 0: 7%|▋ | 877/12384 [1:51:42<24:41:43, 7.73s/it, loss=0.0079, acc=0.9851, iter_time=7.64s]
Epoch 0: 7%|▋ | 877/12384 [1:51:50<24:41:43, 7.73s/it, loss=0.0183, acc=0.9665, iter_time=9.57s]
Epoch 0: 7%|▋ | 878/12384 [1:51:50<24:35:23, 7.69s/it, loss=0.0183, acc=0.9665, iter_time=9.57s]
Epoch 0: 7%|▋ | 878/12384 [1:51:57<24:35:23, 7.69s/it, loss=0.0435, acc=0.9518, iter_time=7.42s]
Epoch 0: 7%|▋ | 879/12384 [1:51:57<24:30:29, 7.67s/it, loss=0.0435, acc=0.9518, iter_time=7.42s]
Epoch 0: 7%|▋ | 879/12384 [1:52:05<24:30:29, 7.67s/it, loss=0.0347, acc=0.9581, iter_time=9.13s]
Epoch 0: 7%|▋ | 880/12384 [1:52:05<24:27:29, 7.65s/it, loss=0.0347, acc=0.9581, iter_time=9.13s]
Epoch 0: 7%|▋ | 880/12384 [1:52:12<24:27:29, 7.65s/it, loss=0.0079, acc=0.9885, iter_time=7.24s]
Epoch 0: 7%|▋ | 881/12384 [1:52:12<24:24:42, 7.64s/it, loss=0.0079, acc=0.9885, iter_time=7.24s]
Epoch 0: 7%|▋ | 881/12384 [1:52:20<24:24:42, 7.64s/it, loss=0.0067, acc=0.9911, iter_time=5.04s]
Epoch 0: 7%|▋ | 882/12384 [1:52:20<24:23:41, 7.64s/it, loss=0.0067, acc=0.9911, iter_time=5.04s]
Epoch 0: 7%|▋ | 882/12384 [1:52:28<24:23:41, 7.64s/it, loss=0.0186, acc=0.9672, iter_time=10.21s]
Epoch 0: 7%|▋ | 883/12384 [1:52:28<24:25:46, 7.65s/it, loss=0.0186, acc=0.9672, iter_time=10.21s]
Epoch 0: 7%|▋ | 883/12384 [1:52:35<24:25:46, 7.65s/it, loss=0.0914, acc=0.8901, iter_time=7.66s]
Epoch 0: 7%|▋ | 884/12384 [1:52:35<24:25:41, 7.65s/it, loss=0.0914, acc=0.8901, iter_time=7.66s]
Epoch 0: 7%|▋ | 884/12384 [1:52:43<24:25:41, 7.65s/it, loss=0.0095, acc=0.9872, iter_time=4.25s]
Epoch 0: 7%|▋ | 885/12384 [1:52:43<24:24:07, 7.64s/it, loss=0.0095, acc=0.9872, iter_time=4.25s]
Epoch 0: 7%|▋ | 885/12384 [1:52:51<24:24:07, 7.64s/it, loss=0.0097, acc=0.9795, iter_time=11.02s]
Epoch 0: 7%|▋ | 886/12384 [1:52:51<24:22:16, 7.63s/it, loss=0.0097, acc=0.9795, iter_time=11.02s]
Epoch 0: 7%|▋ | 886/12384 [1:52:58<24:22:16, 7.63s/it, loss=0.0124, acc=0.9840, iter_time=7.60s]
Epoch 0: 7%|▋ | 887/12384 [1:52:58<24:20:04, 7.62s/it, loss=0.0124, acc=0.9840, iter_time=7.60s]
Epoch 0: 7%|▋ | 887/12384 [1:53:06<24:20:04, 7.62s/it, loss=0.0123, acc=0.9846, iter_time=7.71s]
Epoch 0: 7%|▋ | 888/12384 [1:53:06<24:18:59, 7.61s/it, loss=0.0123, acc=0.9846, iter_time=7.71s]
Epoch 0: 7%|▋ | 888/12384 [1:53:13<24:18:59, 7.61s/it, loss=0.0082, acc=0.9848, iter_time=3.95s]
Epoch 0: 7%|▋ | 889/12384 [1:53:13<24:19:04, 7.62s/it, loss=0.0082, acc=0.9848, iter_time=3.95s]
Epoch 0: 7%|▋ | 889/12384 [1:53:21<24:19:04, 7.62s/it, loss=0.0099, acc=0.9743, iter_time=8.60s]
Epoch 0: 7%|▋ | 890/12384 [1:53:21<24:18:04, 7.61s/it, loss=0.0099, acc=0.9743, iter_time=8.60s]
Epoch 0: 7%|▋ | 890/12384 [1:53:29<24:18:04, 7.61s/it, loss=0.0048, acc=0.9975, iter_time=10.16s]
Epoch 0: 7%|▋ | 891/12384 [1:53:29<24:18:37, 7.61s/it, loss=0.0048, acc=0.9975, iter_time=10.16s]
Epoch 0: 7%|▋ | 891/12384 [1:53:36<24:18:37, 7.61s/it, loss=0.0111, acc=0.9736, iter_time=4.81s]
Epoch 0: 7%|▋ | 892/12384 [1:53:36<24:20:04, 7.62s/it, loss=0.0111, acc=0.9736, iter_time=4.81s]
Epoch 0: 7%|▋ | 892/12384 [1:53:44<24:20:04, 7.62s/it, loss=0.0163, acc=0.9813, iter_time=10.44s]
Epoch 0: 7%|▋ | 893/12384 [1:53:44<24:18:37, 7.62s/it, loss=0.0163, acc=0.9813, iter_time=10.44s]
Epoch 0: 7%|▋ | 893/12384 [1:53:51<24:18:37, 7.62s/it, loss=0.0307, acc=0.9701, iter_time=3.87s]
Epoch 0: 7%|▋ | 894/12384 [1:53:51<24:19:07, 7.62s/it, loss=0.0307, acc=0.9701, iter_time=3.87s]
Epoch 0: 7%|▋ | 894/12384 [1:53:59<24:19:07, 7.62s/it, loss=0.0089, acc=0.9872, iter_time=11.36s]
Epoch 0: 7%|▋ | 895/12384 [1:53:59<24:17:32, 7.61s/it, loss=0.0089, acc=0.9872, iter_time=11.36s]
Epoch 0: 7%|▋ | 895/12384 [1:54:07<24:17:32, 7.61s/it, loss=0.0164, acc=0.9581, iter_time=8.01s]
Epoch 0: 7%|▋ | 896/12384 [1:54:07<24:17:22, 7.61s/it, loss=0.0164, acc=0.9581, iter_time=8.01s]
Epoch 0: 7%|▋ | 896/12384 [1:54:14<24:17:22, 7.61s/it, loss=0.0134, acc=0.9746, iter_time=7.22s]
Epoch 0: 7%|▋ | 897/12384 [1:54:14<24:18:28, 7.62s/it, loss=0.0134, acc=0.9746, iter_time=7.22s]
Epoch 0: 7%|▋ | 897/12384 [1:54:22<24:18:28, 7.62s/it, loss=0.0070, acc=0.9907, iter_time=7.09s]
Epoch 0: 7%|▋ | 898/12384 [1:54:22<24:16:47, 7.61s/it, loss=0.0070, acc=0.9907, iter_time=7.09s]
Epoch 0: 7%|▋ | 898/12384 [1:54:30<24:16:47, 7.61s/it, loss=0.0068, acc=0.9903, iter_time=8.14s]
Epoch 0: 7%|▋ | 899/12384 [1:54:30<24:16:35, 7.61s/it, loss=0.0068, acc=0.9903, iter_time=8.14s]
Epoch 0: 7%|▋ | 899/12384 [1:54:37<24:16:35, 7.61s/it, loss=0.0055, acc=0.9915, iter_time=8.00s]
Epoch 0: 7%|▋ | 900/12384 [1:54:37<24:16:31, 7.61s/it, loss=0.0055, acc=0.9915, iter_time=8.00s]
Epoch 0: 7%|▋ | 900/12384 [1:54:45<24:16:31, 7.61s/it, loss=0.0071, acc=0.9881, iter_time=7.21s]
Epoch 0: 7%|▋ | 901/12384 [1:54:45<24:18:07, 7.62s/it, loss=0.0071, acc=0.9881, iter_time=7.21s]
Epoch 0: 7%|▋ | 901/12384 [1:54:52<24:18:07, 7.62s/it, loss=0.0111, acc=0.9778, iter_time=7.64s]
Epoch 0: 7%|▋ | 902/12384 [1:54:52<24:16:50, 7.61s/it, loss=0.0111, acc=0.9778, iter_time=7.64s]
Epoch 0: 7%|▋ | 902/12384 [1:55:00<24:16:50, 7.61s/it, loss=0.0091, acc=0.9803, iter_time=7.95s]
Epoch 0: 7%|▋ | 903/12384 [1:55:00<24:35:53, 7.71s/it, loss=0.0091, acc=0.9803, iter_time=7.95s]
Epoch 0: 7%|▋ | 903/12384 [1:55:08<24:35:53, 7.71s/it, loss=0.0026, acc=0.9954, iter_time=7.56s]
Epoch 0: 7%|▋ | 904/12384 [1:55:08<24:31:01, 7.69s/it, loss=0.0026, acc=0.9954, iter_time=7.56s]
Epoch 0: 7%|▋ | 904/12384 [1:55:16<24:31:01, 7.69s/it, loss=0.0045, acc=0.9914, iter_time=7.65s]
Epoch 0: 7%|▋ | 905/12384 [1:55:16<24:27:39, 7.67s/it, loss=0.0045, acc=0.9914, iter_time=7.65s]
Epoch 0: 7%|▋ | 905/12384 [1:55:23<24:27:39, 7.67s/it, loss=0.0098, acc=0.9801, iter_time=5.54s]
Epoch 0: 7%|▋ | 906/12384 [1:55:23<24:25:19, 7.66s/it, loss=0.0098, acc=0.9801, iter_time=5.54s]
Epoch 0: 7%|▋ | 906/12384 [1:55:31<24:25:19, 7.66s/it, loss=0.0061, acc=0.9900, iter_time=7.19s]
Epoch 0: 7%|▋ | 907/12384 [1:55:31<24:21:27, 7.64s/it, loss=0.0061, acc=0.9900, iter_time=7.19s]
Epoch 0: 7%|▋ | 907/12384 [1:55:38<24:21:27, 7.64s/it, loss=0.0144, acc=0.9691, iter_time=8.66s]
Epoch 0: 7%|▋ | 908/12384 [1:55:38<24:19:48, 7.63s/it, loss=0.0144, acc=0.9691, iter_time=8.66s]
Epoch 0: 7%|▋ | 908/12384 [1:55:46<24:19:48, 7.63s/it, loss=0.0047, acc=0.9894, iter_time=6.51s]
Epoch 0: 7%|▋ | 909/12384 [1:55:46<24:20:05, 7.63s/it, loss=0.0047, acc=0.9894, iter_time=6.51s]
Epoch 0: 7%|▋ | 909/12384 [1:55:54<24:20:05, 7.63s/it, loss=0.0068, acc=0.9882, iter_time=10.22s]
Epoch 0: 7%|▋ | 910/12384 [1:55:54<24:19:12, 7.63s/it, loss=0.0068, acc=0.9882, iter_time=10.22s]
Epoch 0: 7%|▋ | 910/12384 [1:56:01<24:19:12, 7.63s/it, loss=0.0253, acc=0.9611, iter_time=7.62s]
Epoch 0: 7%|▋ | 911/12384 [1:56:01<24:18:25, 7.63s/it, loss=0.0253, acc=0.9611, iter_time=7.62s]
Epoch 0: 7%|▋ | 911/12384 [1:56:09<24:18:25, 7.63s/it, loss=0.0072, acc=0.9845, iter_time=8.01s]
Epoch 0: 7%|▋ | 912/12384 [1:56:09<24:16:39, 7.62s/it, loss=0.0072, acc=0.9845, iter_time=8.01s]
Epoch 0: 7%|▋ | 912/12384 [1:56:17<24:16:39, 7.62s/it, loss=0.0061, acc=0.9947, iter_time=7.22s]
Epoch 0: 7%|▋ | 913/12384 [1:56:17<24:16:08, 7.62s/it, loss=0.0061, acc=0.9947, iter_time=7.22s]
Epoch 0: 7%|▋ | 913/12384 [1:56:24<24:16:08, 7.62s/it, loss=0.0149, acc=0.9700, iter_time=5.53s]
Epoch 0: 7%|▋ | 914/12384 [1:56:24<24:17:05, 7.62s/it, loss=0.0149, acc=0.9700, iter_time=5.53s]
Epoch 0: 7%|▋ | 914/12384 [1:56:32<24:17:05, 7.62s/it, loss=0.0047, acc=0.9863, iter_time=9.71s]
Epoch 0: 7%|▋ | 915/12384 [1:56:32<24:19:31, 7.64s/it, loss=0.0047, acc=0.9863, iter_time=9.71s]
Epoch 0: 7%|▋ | 915/12384 [1:56:39<24:19:31, 7.64s/it, loss=0.0041, acc=0.9897, iter_time=7.66s]
Epoch 0: 7%|▋ | 916/12384 [1:56:39<24:16:41, 7.62s/it, loss=0.0041, acc=0.9897, iter_time=7.66s]
Epoch 0: 7%|▋ | 916/12384 [1:56:47<24:16:41, 7.62s/it, loss=0.0326, acc=0.9392, iter_time=7.62s]
Epoch 0: 7%|▋ | 917/12384 [1:56:47<24:18:10, 7.63s/it, loss=0.0326, acc=0.9392, iter_time=7.62s]
Epoch 0: 7%|▋ | 917/12384 [1:56:55<24:18:10, 7.63s/it, loss=0.0061, acc=0.9862, iter_time=7.62s]
Epoch 0: 7%|▋ | 918/12384 [1:56:55<24:17:42, 7.63s/it, loss=0.0061, acc=0.9862, iter_time=7.62s]
Epoch 0: 7%|▋ | 918/12384 [1:57:02<24:17:42, 7.63s/it, loss=0.0315, acc=0.9741, iter_time=5.10s]
Epoch 0: 7%|▋ | 919/12384 [1:57:02<24:18:17, 7.63s/it, loss=0.0315, acc=0.9741, iter_time=5.10s]
Epoch 0: 7%|▋ | 919/12384 [1:57:10<24:18:17, 7.63s/it, loss=0.0098, acc=0.9772, iter_time=10.09s]
Epoch 0: 7%|▋ | 920/12384 [1:57:10<24:15:40, 7.62s/it, loss=0.0098, acc=0.9772, iter_time=10.09s]
Epoch 0: 7%|▋ | 920/12384 [1:57:18<24:15:40, 7.62s/it, loss=0.0050, acc=0.9933, iter_time=7.05s]
Epoch 0: 7%|▋ | 921/12384 [1:57:18<24:17:17, 7.63s/it, loss=0.0050, acc=0.9933, iter_time=7.05s]
Epoch 0: 7%|▋ | 921/12384 [1:57:25<24:17:17, 7.63s/it, loss=0.0143, acc=0.9628, iter_time=8.26s]
Epoch 0: 7%|▋ | 922/12384 [1:57:25<24:15:01, 7.62s/it, loss=0.0143, acc=0.9628, iter_time=8.26s]
Epoch 0: 7%|▋ | 922/12384 [1:57:33<24:15:01, 7.62s/it, loss=0.0085, acc=0.9817, iter_time=4.25s]
Epoch 0: 7%|▋ | 923/12384 [1:57:33<24:16:50, 7.63s/it, loss=0.0085, acc=0.9817, iter_time=4.25s]
Epoch 0: 7%|▋ | 923/12384 [1:57:40<24:16:50, 7.63s/it, loss=0.0057, acc=0.9900, iter_time=10.99s]
Epoch 0: 7%|▋ | 924/12384 [1:57:40<24:15:10, 7.62s/it, loss=0.0057, acc=0.9900, iter_time=10.99s]
Epoch 0: 7%|▋ | 924/12384 [1:57:48<24:15:10, 7.62s/it, loss=0.0348, acc=0.9755, iter_time=7.61s]
Epoch 0: 7%|▋ | 925/12384 [1:57:48<24:15:06, 7.62s/it, loss=0.0348, acc=0.9755, iter_time=7.61s]
Epoch 0: 7%|▋ | 925/12384 [1:57:56<24:15:06, 7.62s/it, loss=0.0068, acc=0.9897, iter_time=7.64s]
Epoch 0: 7%|▋ | 926/12384 [1:57:56<24:14:52, 7.62s/it, loss=0.0068, acc=0.9897, iter_time=7.64s]
Epoch 0: 7%|▋ | 926/12384 [1:58:03<24:14:52, 7.62s/it, loss=0.0072, acc=0.9885, iter_time=5.48s]
Epoch 0: 7%|▋ | 927/12384 [1:58:03<24:12:36, 7.61s/it, loss=0.0072, acc=0.9885, iter_time=5.48s]
Epoch 0: 7%|▋ | 927/12384 [1:58:11<24:12:36, 7.61s/it, loss=0.0072, acc=0.9860, iter_time=10.09s]
Epoch 0: 7%|▋ | 928/12384 [1:58:11<24:17:29, 7.63s/it, loss=0.0072, acc=0.9860, iter_time=10.09s]
Epoch 0: 7%|▋ | 928/12384 [1:58:19<24:17:29, 7.63s/it, loss=0.0101, acc=0.9736, iter_time=7.67s]
Epoch 0: 8%|▊ | 929/12384 [1:58:19<24:36:26, 7.73s/it, loss=0.0101, acc=0.9736, iter_time=7.67s]
Epoch 0: 8%|▊ | 929/12384 [1:58:26<24:36:26, 7.73s/it, loss=0.0029, acc=0.9981, iter_time=7.61s]
Epoch 0: 8%|▊ | 930/12384 [1:58:26<24:28:43, 7.69s/it, loss=0.0029, acc=0.9981, iter_time=7.61s]
Epoch 0: 8%|▊ | 930/12384 [1:58:34<24:28:43, 7.69s/it, loss=0.0290, acc=0.9722, iter_time=7.60s]
Epoch 0: 8%|▊ | 931/12384 [1:58:34<24:24:43, 7.67s/it, loss=0.0290, acc=0.9722, iter_time=7.60s]
Epoch 0: 8%|▊ | 931/12384 [1:58:42<24:24:43, 7.67s/it, loss=0.0083, acc=0.9780, iter_time=6.42s]
Epoch 0: 8%|▊ | 932/12384 [1:58:42<24:19:53, 7.65s/it, loss=0.0083, acc=0.9780, iter_time=6.42s]
Epoch 0: 8%|▊ | 932/12384 [1:58:49<24:19:53, 7.65s/it, loss=0.0092, acc=0.9878, iter_time=8.79s]
Epoch 0: 8%|▊ | 933/12384 [1:58:49<24:17:44, 7.64s/it, loss=0.0092, acc=0.9878, iter_time=8.79s]
Epoch 0: 8%|▊ | 933/12384 [1:58:57<24:17:44, 7.64s/it, loss=0.0110, acc=0.9763, iter_time=7.61s]
Epoch 0: 8%|▊ | 934/12384 [1:58:57<24:15:34, 7.63s/it, loss=0.0110, acc=0.9763, iter_time=7.61s]
Epoch 0: 8%|▊ | 934/12384 [1:59:05<24:15:34, 7.63s/it, loss=0.0128, acc=0.9751, iter_time=7.61s]
Epoch 0: 8%|▊ | 935/12384 [1:59:05<24:18:12, 7.64s/it, loss=0.0128, acc=0.9751, iter_time=7.61s]
Epoch 0: 8%|▊ | 935/12384 [1:59:12<24:18:12, 7.64s/it, loss=0.0038, acc=0.9964, iter_time=7.61s]
Epoch 0: 8%|▊ | 936/12384 [1:59:12<24:15:55, 7.63s/it, loss=0.0038, acc=0.9964, iter_time=7.61s]
Epoch 0: 8%|▊ | 936/12384 [1:59:20<24:15:55, 7.63s/it, loss=0.0040, acc=0.9937, iter_time=7.65s]
Epoch 0: 8%|▊ | 937/12384 [1:59:20<24:14:51, 7.63s/it, loss=0.0040, acc=0.9937, iter_time=7.65s]
Epoch 0: 8%|▊ | 937/12384 [1:59:27<24:14:51, 7.63s/it, loss=0.0168, acc=0.9595, iter_time=7.64s]
Epoch 0: 8%|▊ | 938/12384 [1:59:27<24:14:25, 7.62s/it, loss=0.0168, acc=0.9595, iter_time=7.64s]
Epoch 0: 8%|▊ | 938/12384 [1:59:35<24:14:25, 7.62s/it, loss=0.0281, acc=0.9559, iter_time=7.32s]
Epoch 0: 8%|▊ | 939/12384 [1:59:35<24:14:08, 7.62s/it, loss=0.0281, acc=0.9559, iter_time=7.32s]
Epoch 0: 8%|▊ | 939/12384 [1:59:43<24:14:08, 7.62s/it, loss=0.0076, acc=0.9813, iter_time=5.93s]
Epoch 0: 8%|▊ | 940/12384 [1:59:43<24:18:53, 7.65s/it, loss=0.0076, acc=0.9813, iter_time=5.93s]
Epoch 0: 8%|▊ | 940/12384 [1:59:50<24:18:53, 7.65s/it, loss=0.0069, acc=0.9818, iter_time=6.87s]
Epoch 0: 8%|▊ | 941/12384 [1:59:50<24:16:48, 7.64s/it, loss=0.0069, acc=0.9818, iter_time=6.87s]
Epoch 0: 8%|▊ | 941/12384 [1:59:58<24:16:48, 7.64s/it, loss=0.0056, acc=0.9913, iter_time=7.32s]
Epoch 0: 8%|▊ | 942/12384 [1:59:58<24:16:38, 7.64s/it, loss=0.0056, acc=0.9913, iter_time=7.32s]
Epoch 0: 8%|▊ | 942/12384 [2:00:06<24:16:38, 7.64s/it, loss=0.0029, acc=0.9945, iter_time=7.23s]
Epoch 0: 8%|▊ | 943/12384 [2:00:06<24:16:56, 7.64s/it, loss=0.0029, acc=0.9945, iter_time=7.23s]
Epoch 0: 8%|▊ | 943/12384 [2:00:13<24:16:56, 7.64s/it, loss=0.0161, acc=0.9687, iter_time=11.55s]
Epoch 0: 8%|▊ | 944/12384 [2:00:13<24:15:37, 7.63s/it, loss=0.0161, acc=0.9687, iter_time=11.55s]
Epoch 0: 8%|▊ | 944/12384 [2:00:21<24:15:37, 7.63s/it, loss=0.0048, acc=0.9973, iter_time=7.26s]
Epoch 0: 8%|▊ | 945/12384 [2:00:21<24:14:56, 7.63s/it, loss=0.0048, acc=0.9973, iter_time=7.26s]
Epoch 0: 8%|▊ | 945/12384 [2:00:29<24:14:56, 7.63s/it, loss=0.0056, acc=0.9894, iter_time=7.61s]
Epoch 0: 8%|▊ | 946/12384 [2:00:29<24:18:02, 7.65s/it, loss=0.0056, acc=0.9894, iter_time=7.61s]
Epoch 0: 8%|▊ | 946/12384 [2:00:36<24:18:02, 7.65s/it, loss=0.0072, acc=0.9825, iter_time=7.67s]
Epoch 0: 8%|▊ | 947/12384 [2:00:36<24:17:44, 7.65s/it, loss=0.0072, acc=0.9825, iter_time=7.67s]
Epoch 0: 8%|▊ | 947/12384 [2:00:44<24:17:44, 7.65s/it, loss=0.0051, acc=0.9963, iter_time=7.37s]
Epoch 0: 8%|▊ | 948/12384 [2:00:44<24:17:08, 7.65s/it, loss=0.0051, acc=0.9963, iter_time=7.37s]
Epoch 0: 8%|▊ | 948/12384 [2:00:52<24:17:08, 7.65s/it, loss=0.0054, acc=0.9898, iter_time=7.95s]
Epoch 0: 8%|▊ | 949/12384 [2:00:52<24:16:32, 7.64s/it, loss=0.0054, acc=0.9898, iter_time=7.95s]
Epoch 0: 8%|▊ | 949/12384 [2:00:59<24:16:32, 7.64s/it, loss=0.0045, acc=0.9906, iter_time=8.07s]
Epoch 0: 8%|▊ | 950/12384 [2:00:59<24:17:38, 7.65s/it, loss=0.0045, acc=0.9906, iter_time=8.07s]
Epoch 0: 8%|▊ | 950/12384 [2:01:07<24:17:38, 7.65s/it, loss=0.0064, acc=0.9899, iter_time=7.21s]
Epoch 0: 8%|▊ | 951/12384 [2:01:07<24:15:48, 7.64s/it, loss=0.0064, acc=0.9899, iter_time=7.21s]
Epoch 0: 8%|▊ | 951/12384 [2:01:14<24:15:48, 7.64s/it, loss=0.0127, acc=0.9806, iter_time=7.57s]
Epoch 0: 8%|▊ | 952/12384 [2:01:14<24:13:57, 7.63s/it, loss=0.0127, acc=0.9806, iter_time=7.57s]
Epoch 0: 8%|▊ | 952/12384 [2:01:22<24:13:57, 7.63s/it, loss=0.0081, acc=0.9812, iter_time=6.15s]
Epoch 0: 8%|▊ | 953/12384 [2:01:22<24:11:07, 7.62s/it, loss=0.0081, acc=0.9812, iter_time=6.15s]
Epoch 0: 8%|▊ | 953/12384 [2:01:30<24:11:07, 7.62s/it, loss=0.0069, acc=0.9834, iter_time=9.09s]
Epoch 0: 8%|▊ | 954/12384 [2:01:30<24:10:11, 7.61s/it, loss=0.0069, acc=0.9834, iter_time=9.09s]
Epoch 0: 8%|▊ | 954/12384 [2:01:38<24:10:11, 7.61s/it, loss=0.0085, acc=0.9863, iter_time=5.15s]
Epoch 0: 8%|▊ | 955/12384 [2:01:38<24:29:25, 7.71s/it, loss=0.0085, acc=0.9863, iter_time=5.15s]
Epoch 0: 8%|▊ | 955/12384 [2:01:45<24:29:25, 7.71s/it, loss=0.0138, acc=0.9684, iter_time=10.41s]
Epoch 0: 8%|▊ | 956/12384 [2:01:45<24:24:23, 7.69s/it, loss=0.0138, acc=0.9684, iter_time=10.41s]
Epoch 0: 8%|▊ | 956/12384 [2:01:53<24:24:23, 7.69s/it, loss=0.0068, acc=0.9853, iter_time=7.66s]
Epoch 0: 8%|▊ | 957/12384 [2:01:53<24:21:36, 7.67s/it, loss=0.0068, acc=0.9853, iter_time=7.66s]
Epoch 0: 8%|▊ | 957/12384 [2:02:00<24:21:36, 7.67s/it, loss=0.0045, acc=0.9881, iter_time=7.63s]
Epoch 0: 8%|▊ | 958/12384 [2:02:00<24:19:26, 7.66s/it, loss=0.0045, acc=0.9881, iter_time=7.63s]
Epoch 0: 8%|▊ | 958/12384 [2:02:08<24:19:26, 7.66s/it, loss=0.0051, acc=0.9858, iter_time=7.67s]
Epoch 0: 8%|▊ | 959/12384 [2:02:08<24:18:03, 7.66s/it, loss=0.0051, acc=0.9858, iter_time=7.67s]
Epoch 0: 8%|▊ | 959/12384 [2:02:16<24:18:03, 7.66s/it, loss=0.0079, acc=0.9780, iter_time=7.54s]
Epoch 0: 8%|▊ | 960/12384 [2:02:16<24:15:12, 7.64s/it, loss=0.0079, acc=0.9780, iter_time=7.54s]
Epoch 0: 8%|▊ | 960/12384 [2:02:23<24:15:12, 7.64s/it, loss=0.0174, acc=0.9649, iter_time=7.67s]
Epoch 0: 8%|▊ | 961/12384 [2:02:23<24:13:38, 7.64s/it, loss=0.0174, acc=0.9649, iter_time=7.67s]
Epoch 0: 8%|▊ | 961/12384 [2:02:31<24:13:38, 7.64s/it, loss=0.0061, acc=0.9880, iter_time=7.65s]
Epoch 0: 8%|▊ | 962/12384 [2:02:31<24:13:25, 7.63s/it, loss=0.0061, acc=0.9880, iter_time=7.65s]
Epoch 0: 8%|▊ | 962/12384 [2:02:39<24:13:25, 7.63s/it, loss=0.0074, acc=0.9793, iter_time=6.67s]
Epoch 0: 8%|▊ | 963/12384 [2:02:39<24:13:25, 7.64s/it, loss=0.0074, acc=0.9793, iter_time=6.67s]
Epoch 0: 8%|▊ | 963/12384 [2:02:46<24:13:25, 7.64s/it, loss=0.0127, acc=0.9735, iter_time=8.56s]
Epoch 0: 8%|▊ | 964/12384 [2:02:46<24:12:39, 7.63s/it, loss=0.0127, acc=0.9735, iter_time=8.56s]
Epoch 0: 8%|▊ | 964/12384 [2:02:54<24:12:39, 7.63s/it, loss=0.0049, acc=0.9939, iter_time=4.49s]
Epoch 0: 8%|▊ | 965/12384 [2:02:54<24:11:59, 7.63s/it, loss=0.0049, acc=0.9939, iter_time=4.49s]
Epoch 0: 8%|▊ | 965/12384 [2:03:01<24:11:59, 7.63s/it, loss=0.0042, acc=0.9962, iter_time=8.44s]
Epoch 0: 8%|▊ | 966/12384 [2:03:01<24:09:57, 7.62s/it, loss=0.0042, acc=0.9962, iter_time=8.44s]
Epoch 0: 8%|▊ | 966/12384 [2:03:09<24:09:57, 7.62s/it, loss=0.0045, acc=0.9878, iter_time=9.31s]
Epoch 0: 8%|▊ | 967/12384 [2:03:09<24:09:09, 7.62s/it, loss=0.0045, acc=0.9878, iter_time=9.31s]
Epoch 0: 8%|▊ | 967/12384 [2:03:17<24:09:09, 7.62s/it, loss=0.0041, acc=0.9892, iter_time=8.61s]
Epoch 0: 8%|▊ | 968/12384 [2:03:17<24:11:56, 7.63s/it, loss=0.0041, acc=0.9892, iter_time=8.61s]
Epoch 0: 8%|▊ | 968/12384 [2:03:24<24:11:56, 7.63s/it, loss=0.0119, acc=0.9771, iter_time=7.26s]
Epoch 0: 8%|▊ | 969/12384 [2:03:24<24:11:11, 7.63s/it, loss=0.0119, acc=0.9771, iter_time=7.26s]
Epoch 0: 8%|▊ | 969/12384 [2:03:32<24:11:11, 7.63s/it, loss=0.0022, acc=0.9920, iter_time=4.26s]
Epoch 0: 8%|▊ | 970/12384 [2:03:32<24:09:00, 7.62s/it, loss=0.0022, acc=0.9920, iter_time=4.26s]
Epoch 0: 8%|▊ | 970/12384 [2:03:40<24:09:00, 7.62s/it, loss=0.0054, acc=0.9921, iter_time=10.96s]
Epoch 0: 8%|▊ | 971/12384 [2:03:40<24:07:55, 7.61s/it, loss=0.0054, acc=0.9921, iter_time=10.96s]
Epoch 0: 8%|▊ | 971/12384 [2:03:47<24:07:55, 7.61s/it, loss=0.0066, acc=0.9866, iter_time=7.60s]
Epoch 0: 8%|▊ | 972/12384 [2:03:47<24:06:34, 7.61s/it, loss=0.0066, acc=0.9866, iter_time=7.60s]
Epoch 0: 8%|▊ | 972/12384 [2:03:55<24:06:34, 7.61s/it, loss=0.0050, acc=0.9938, iter_time=7.61s]
Epoch 0: 8%|▊ | 973/12384 [2:03:55<24:06:45, 7.61s/it, loss=0.0050, acc=0.9938, iter_time=7.61s]
Epoch 0: 8%|▊ | 973/12384 [2:04:02<24:06:45, 7.61s/it, loss=0.0054, acc=0.9927, iter_time=7.60s]
Epoch 0: 8%|▊ | 974/12384 [2:04:02<24:06:35, 7.61s/it, loss=0.0054, acc=0.9927, iter_time=7.60s]
Epoch 0: 8%|▊ | 974/12384 [2:04:10<24:06:35, 7.61s/it, loss=0.0125, acc=0.9880, iter_time=7.62s]
Epoch 0: 8%|▊ | 975/12384 [2:04:10<24:06:29, 7.61s/it, loss=0.0125, acc=0.9880, iter_time=7.62s]
Epoch 0: 8%|▊ | 975/12384 [2:04:18<24:06:29, 7.61s/it, loss=0.0120, acc=0.9766, iter_time=7.99s]
Epoch 0: 8%|▊ | 976/12384 [2:04:18<24:06:59, 7.61s/it, loss=0.0120, acc=0.9766, iter_time=7.99s]
Epoch 0: 8%|▊ | 976/12384 [2:04:25<24:06:59, 7.61s/it, loss=0.0060, acc=0.9853, iter_time=6.00s]
Epoch 0: 8%|▊ | 977/12384 [2:04:25<24:06:48, 7.61s/it, loss=0.0060, acc=0.9853, iter_time=6.00s]
Epoch 0: 8%|▊ | 977/12384 [2:04:33<24:06:48, 7.61s/it, loss=0.0064, acc=0.9838, iter_time=5.51s]
Epoch 0: 8%|▊ | 978/12384 [2:04:33<24:07:45, 7.62s/it, loss=0.0064, acc=0.9838, iter_time=5.51s]
Epoch 0: 8%|▊ | 978/12384 [2:04:40<24:07:45, 7.62s/it, loss=0.0104, acc=0.9818, iter_time=8.16s]
Epoch 0: 8%|▊ | 979/12384 [2:04:40<24:06:35, 7.61s/it, loss=0.0104, acc=0.9818, iter_time=8.16s]
Epoch 0: 8%|▊ | 979/12384 [2:04:48<24:06:35, 7.61s/it, loss=0.0154, acc=0.9745, iter_time=7.60s]
Epoch 0: 8%|▊ | 980/12384 [2:04:48<24:07:12, 7.61s/it, loss=0.0154, acc=0.9745, iter_time=7.60s]
Epoch 0: 8%|▊ | 980/12384 [2:04:56<24:07:12, 7.61s/it, loss=0.0097, acc=0.9804, iter_time=10.75s]
Epoch 0: 8%|▊ | 981/12384 [2:04:56<24:26:12, 7.71s/it, loss=0.0097, acc=0.9804, iter_time=10.75s]
Epoch 0: 8%|▊ | 981/12384 [2:05:04<24:26:12, 7.71s/it, loss=0.0065, acc=0.9835, iter_time=7.61s]
Epoch 0: 8%|▊ | 982/12384 [2:05:04<24:19:01, 7.68s/it, loss=0.0065, acc=0.9835, iter_time=7.61s]
Epoch 0: 8%|▊ | 982/12384 [2:05:11<24:19:01, 7.68s/it, loss=0.0123, acc=0.9675, iter_time=7.61s]
Epoch 0: 8%|▊ | 983/12384 [2:05:11<24:14:51, 7.66s/it, loss=0.0123, acc=0.9675, iter_time=7.61s]
Epoch 0: 8%|▊ | 983/12384 [2:05:19<24:14:51, 7.66s/it, loss=0.0034, acc=0.9942, iter_time=7.54s]
Epoch 0: 8%|▊ | 984/12384 [2:05:19<24:11:50, 7.64s/it, loss=0.0034, acc=0.9942, iter_time=7.54s]
Epoch 0: 8%|▊ | 984/12384 [2:05:26<24:11:50, 7.64s/it, loss=0.0046, acc=0.9860, iter_time=7.66s]
Epoch 0: 8%|▊ | 985/12384 [2:05:26<24:09:06, 7.63s/it, loss=0.0046, acc=0.9860, iter_time=7.66s]
Epoch 0: 8%|▊ | 985/12384 [2:05:34<24:09:06, 7.63s/it, loss=0.0083, acc=0.9807, iter_time=7.58s]
Epoch 0: 8%|▊ | 986/12384 [2:05:34<24:07:55, 7.62s/it, loss=0.0083, acc=0.9807, iter_time=7.58s]
Epoch 0: 8%|▊ | 986/12384 [2:05:42<24:07:55, 7.62s/it, loss=0.0048, acc=0.9887, iter_time=6.69s]
Epoch 0: 8%|▊ | 987/12384 [2:05:42<24:08:31, 7.63s/it, loss=0.0048, acc=0.9887, iter_time=6.69s]
Epoch 0: 8%|▊ | 987/12384 [2:05:49<24:08:31, 7.63s/it, loss=0.0028, acc=0.9948, iter_time=8.56s]
Epoch 0: 8%|▊ | 988/12384 [2:05:49<24:07:07, 7.62s/it, loss=0.0028, acc=0.9948, iter_time=8.56s]
Epoch 0: 8%|▊ | 988/12384 [2:05:57<24:07:07, 7.62s/it, loss=0.0074, acc=0.9777, iter_time=7.62s]
Epoch 0: 8%|▊ | 989/12384 [2:05:57<24:05:40, 7.61s/it, loss=0.0074, acc=0.9777, iter_time=7.62s]
Epoch 0: 8%|▊ | 989/12384 [2:06:04<24:05:40, 7.61s/it, loss=0.0043, acc=0.9838, iter_time=6.95s]
Epoch 0: 8%|▊ | 990/12384 [2:06:04<24:05:03, 7.61s/it, loss=0.0043, acc=0.9838, iter_time=6.95s]
Epoch 0: 8%|▊ | 990/12384 [2:06:12<24:05:03, 7.61s/it, loss=0.0053, acc=0.9880, iter_time=8.27s]
Epoch 0: 8%|▊ | 991/12384 [2:06:12<24:05:32, 7.61s/it, loss=0.0053, acc=0.9880, iter_time=8.27s]
Epoch 0: 8%|▊ | 991/12384 [2:06:20<24:05:32, 7.61s/it, loss=0.0059, acc=0.9923, iter_time=7.55s]
Epoch 0: 8%|▊ | 992/12384 [2:06:20<24:04:47, 7.61s/it, loss=0.0059, acc=0.9923, iter_time=7.55s]
Epoch 0: 8%|▊ | 992/12384 [2:06:27<24:04:47, 7.61s/it, loss=0.0017, acc=0.9995, iter_time=7.64s]
Epoch 0: 8%|▊ | 993/12384 [2:06:27<24:04:04, 7.61s/it, loss=0.0017, acc=0.9995, iter_time=7.64s]
Epoch 0: 8%|▊ | 993/12384 [2:06:35<24:04:04, 7.61s/it, loss=0.0125, acc=0.9854, iter_time=7.61s]
Epoch 0: 8%|▊ | 994/12384 [2:06:35<24:04:21, 7.61s/it, loss=0.0125, acc=0.9854, iter_time=7.61s]
Epoch 0: 8%|▊ | 994/12384 [2:06:42<24:04:21, 7.61s/it, loss=0.0209, acc=0.9659, iter_time=7.63s]
Epoch 0: 8%|▊ | 995/12384 [2:06:42<24:05:30, 7.62s/it, loss=0.0209, acc=0.9659, iter_time=7.63s]
Epoch 0: 8%|▊ | 995/12384 [2:06:50<24:05:30, 7.62s/it, loss=0.0029, acc=0.9942, iter_time=7.60s]
Epoch 0: 8%|▊ | 996/12384 [2:06:50<24:03:37, 7.61s/it, loss=0.0029, acc=0.9942, iter_time=7.60s]
Epoch 0: 8%|▊ | 996/12384 [2:06:58<24:03:37, 7.61s/it, loss=0.0052, acc=0.9909, iter_time=7.60s]
Epoch 0: 8%|▊ | 997/12384 [2:06:58<24:03:51, 7.61s/it, loss=0.0052, acc=0.9909, iter_time=7.60s]
Epoch 0: 8%|▊ | 997/12384 [2:07:05<24:03:51, 7.61s/it, loss=0.0037, acc=0.9914, iter_time=7.63s]
Epoch 0: 8%|▊ | 998/12384 [2:07:05<24:04:19, 7.61s/it, loss=0.0037, acc=0.9914, iter_time=7.63s]
Epoch 0: 8%|▊ | 998/12384 [2:07:13<24:04:19, 7.61s/it, loss=0.0072, acc=0.9852, iter_time=7.61s]
Epoch 0: 8%|▊ | 999/12384 [2:07:13<24:04:13, 7.61s/it, loss=0.0072, acc=0.9852, iter_time=7.61s]
Epoch 0: 8%|▊ | 999/12384 [2:07:21<24:04:13, 7.61s/it, loss=0.0031, acc=0.9893, iter_time=8.02s]
Epoch 0: 8%|▊ | 1000/12384 [2:07:21<24:15:20, 7.67s/it, loss=0.0031, acc=0.9893, iter_time=8.02s]
Epoch 0: 8%|▊ | 1000/12384 [2:07:28<24:15:20, 7.67s/it, loss=0.0036, acc=0.9925, iter_time=7.39s]
Epoch 0: 8%|▊ | 1001/12384 [2:07:28<24:13:21, 7.66s/it, loss=0.0036, acc=0.9925, iter_time=7.39s]
Epoch 0: 8%|▊ | 1001/12384 [2:07:36<24:13:21, 7.66s/it, loss=0.0036, acc=0.9900, iter_time=7.65s]
Epoch 0: 8%|▊ | 1002/12384 [2:07:36<24:11:12, 7.65s/it, loss=0.0036, acc=0.9900, iter_time=7.65s]
Epoch 0: 8%|▊ | 1002/12384 [2:07:44<24:11:12, 7.65s/it, loss=0.0147, acc=0.9796, iter_time=7.63s]
Epoch 0: 8%|▊ | 1003/12384 [2:07:44<24:09:10, 7.64s/it, loss=0.0147, acc=0.9796, iter_time=7.63s]
Epoch 0: 8%|▊ | 1003/12384 [2:07:51<24:09:10, 7.64s/it, loss=0.0058, acc=0.9831, iter_time=7.59s]
Epoch 0: 8%|▊ | 1004/12384 [2:07:51<24:05:39, 7.62s/it, loss=0.0058, acc=0.9831, iter_time=7.59s]
Epoch 0: 8%|▊ | 1004/12384 [2:07:59<24:05:39, 7.62s/it, loss=0.0033, acc=0.9912, iter_time=7.60s]
Epoch 0: 8%|▊ | 1005/12384 [2:07:59<24:06:19, 7.63s/it, loss=0.0033, acc=0.9912, iter_time=7.60s]
Epoch 0: 8%|▊ | 1005/12384 [2:08:07<24:06:19, 7.63s/it, loss=0.0047, acc=0.9879, iter_time=7.92s]
Epoch 0: 8%|▊ | 1006/12384 [2:08:07<24:20:26, 7.70s/it, loss=0.0047, acc=0.9879, iter_time=7.92s]
Epoch 0: 8%|▊ | 1006/12384 [2:08:14<24:20:26, 7.70s/it, loss=0.0050, acc=0.9908, iter_time=5.26s]
Epoch 0: 8%|▊ | 1007/12384 [2:08:14<24:14:35, 7.67s/it, loss=0.0050, acc=0.9908, iter_time=5.26s]
Epoch 0: 8%|▊ | 1007/12384 [2:08:22<24:14:35, 7.67s/it, loss=0.0139, acc=0.9727, iter_time=10.38s]
Epoch 0: 8%|▊ | 1008/12384 [2:08:22<24:28:09, 7.74s/it, loss=0.0139, acc=0.9727, iter_time=10.38s]
Epoch 0: 8%|▊ | 1008/12384 [2:08:30<24:28:09, 7.74s/it, loss=0.0037, acc=0.9910, iter_time=7.47s]
Epoch 0: 8%|▊ | 1009/12384 [2:08:30<24:20:55, 7.71s/it, loss=0.0037, acc=0.9910, iter_time=7.47s]
Epoch 0: 8%|▊ | 1009/12384 [2:08:37<24:20:55, 7.71s/it, loss=0.0131, acc=0.9770, iter_time=7.64s]
Epoch 0: 8%|▊ | 1010/12384 [2:08:37<24:15:48, 7.68s/it, loss=0.0131, acc=0.9770, iter_time=7.64s]
Epoch 0: 8%|▊ | 1010/12384 [2:08:45<24:15:48, 7.68s/it, loss=0.0032, acc=0.9924, iter_time=7.61s]
Epoch 0: 8%|▊ | 1011/12384 [2:08:45<24:11:43, 7.66s/it, loss=0.0032, acc=0.9924, iter_time=7.61s]
Epoch 0: 8%|▊ | 1011/12384 [2:08:53<24:11:43, 7.66s/it, loss=0.0113, acc=0.9840, iter_time=7.60s]
Epoch 0: 8%|▊ | 1012/12384 [2:08:53<24:10:10, 7.65s/it, loss=0.0113, acc=0.9840, iter_time=7.60s]
Epoch 0: 8%|▊ | 1012/12384 [2:09:00<24:10:10, 7.65s/it, loss=0.0065, acc=0.9886, iter_time=7.64s]
Epoch 0: 8%|▊ | 1013/12384 [2:09:00<24:06:58, 7.64s/it, loss=0.0065, acc=0.9886, iter_time=7.64s]
Epoch 0: 8%|▊ | 1013/12384 [2:09:08<24:06:58, 7.64s/it, loss=0.0024, acc=0.9921, iter_time=7.59s]
Epoch 0: 8%|▊ | 1014/12384 [2:09:08<24:05:19, 7.63s/it, loss=0.0024, acc=0.9921, iter_time=7.59s]
Epoch 0: 8%|▊ | 1014/12384 [2:09:16<24:05:19, 7.63s/it, loss=0.0066, acc=0.9930, iter_time=7.62s]
Epoch 0: 8%|▊ | 1015/12384 [2:09:16<24:06:09, 7.63s/it, loss=0.0066, acc=0.9930, iter_time=7.62s]
Epoch 0: 8%|▊ | 1015/12384 [2:09:23<24:06:09, 7.63s/it, loss=0.0040, acc=0.9915, iter_time=8.02s]
Epoch 0: 8%|▊ | 1016/12384 [2:09:23<24:05:24, 7.63s/it, loss=0.0040, acc=0.9915, iter_time=8.02s]
Epoch 0: 8%|▊ | 1016/12384 [2:09:31<24:05:24, 7.63s/it, loss=0.0077, acc=0.9856, iter_time=7.23s]
Epoch 0: 8%|▊ | 1017/12384 [2:09:31<24:03:19, 7.62s/it, loss=0.0077, acc=0.9856, iter_time=7.23s]
Epoch 0: 8%|▊ | 1017/12384 [2:09:38<24:03:19, 7.62s/it, loss=0.0107, acc=0.9814, iter_time=7.61s]
Epoch 0: 8%|▊ | 1018/12384 [2:09:38<24:02:47, 7.62s/it, loss=0.0107, acc=0.9814, iter_time=7.61s]
Epoch 0: 8%|▊ | 1018/12384 [2:09:46<24:02:47, 7.62s/it, loss=0.0055, acc=0.9881, iter_time=5.82s]
Epoch 0: 8%|▊ | 1019/12384 [2:09:46<24:01:55, 7.61s/it, loss=0.0055, acc=0.9881, iter_time=5.82s]
Epoch 0: 8%|▊ | 1019/12384 [2:09:54<24:01:55, 7.61s/it, loss=0.0039, acc=0.9879, iter_time=7.85s]
Epoch 0: 8%|▊ | 1020/12384 [2:09:54<24:00:55, 7.61s/it, loss=0.0039, acc=0.9879, iter_time=7.85s]
Epoch 0: 8%|▊ | 1020/12384 [2:10:01<24:00:55, 7.61s/it, loss=0.0121, acc=0.9763, iter_time=9.12s]
Epoch 0: 8%|▊ | 1021/12384 [2:10:01<23:59:12, 7.60s/it, loss=0.0121, acc=0.9763, iter_time=9.12s]
Epoch 0: 8%|▊ | 1021/12384 [2:10:09<23:59:12, 7.60s/it, loss=0.0046, acc=0.9898, iter_time=7.60s]
Epoch 0: 8%|▊ | 1022/12384 [2:10:09<24:00:21, 7.61s/it, loss=0.0046, acc=0.9898, iter_time=7.60s]
Epoch 0: 8%|▊ | 1022/12384 [2:10:16<24:00:21, 7.61s/it, loss=0.0020, acc=0.9966, iter_time=7.64s]
Epoch 0: 8%|▊ | 1023/12384 [2:10:16<24:03:25, 7.62s/it, loss=0.0020, acc=0.9966, iter_time=7.64s]
Epoch 0: 8%|▊ | 1023/12384 [2:10:24<24:03:25, 7.62s/it, loss=0.0020, acc=0.9976, iter_time=7.61s]
Epoch 0: 8%|▊ | 1024/12384 [2:10:24<24:03:10, 7.62s/it, loss=0.0020, acc=0.9976, iter_time=7.61s]
Epoch 0: 8%|▊ | 1024/12384 [2:10:32<24:03:10, 7.62s/it, loss=0.0026, acc=0.9925, iter_time=7.66s]
Epoch 0: 8%|▊ | 1025/12384 [2:10:32<24:02:06, 7.62s/it, loss=0.0026, acc=0.9925, iter_time=7.66s]
Epoch 0: 8%|▊ | 1025/12384 [2:10:39<24:02:06, 7.62s/it, loss=0.0030, acc=0.9919, iter_time=4.57s]
Epoch 0: 8%|▊ | 1026/12384 [2:10:39<24:03:17, 7.62s/it, loss=0.0030, acc=0.9919, iter_time=4.57s]
Epoch 0: 8%|▊ | 1026/12384 [2:10:47<24:03:17, 7.62s/it, loss=0.0126, acc=0.9717, iter_time=10.66s]
Epoch 0: 8%|▊ | 1027/12384 [2:10:47<24:02:14, 7.62s/it, loss=0.0126, acc=0.9717, iter_time=10.66s]
Epoch 0: 8%|▊ | 1027/12384 [2:10:55<24:02:14, 7.62s/it, loss=0.0014, acc=0.9990, iter_time=7.29s]
Epoch 0: 8%|▊ | 1028/12384 [2:10:55<24:02:34, 7.62s/it, loss=0.0014, acc=0.9990, iter_time=7.29s]
Epoch 0: 8%|▊ | 1028/12384 [2:11:02<24:02:34, 7.62s/it, loss=0.0025, acc=0.9945, iter_time=6.22s]
Epoch 0: 8%|▊ | 1029/12384 [2:11:02<24:01:59, 7.62s/it, loss=0.0025, acc=0.9945, iter_time=6.22s]
Epoch 0: 8%|▊ | 1029/12384 [2:11:10<24:01:59, 7.62s/it, loss=0.0063, acc=0.9901, iter_time=9.34s]
Epoch 0: 8%|▊ | 1030/12384 [2:11:10<24:01:25, 7.62s/it, loss=0.0063, acc=0.9901, iter_time=9.34s]
Epoch 0: 8%|▊ | 1030/12384 [2:11:17<24:01:25, 7.62s/it, loss=0.0038, acc=0.9942, iter_time=7.63s]
Epoch 0: 8%|▊ | 1031/12384 [2:11:17<24:01:07, 7.62s/it, loss=0.0038, acc=0.9942, iter_time=7.63s]
Epoch 0: 8%|▊ | 1031/12384 [2:11:25<24:01:07, 7.62s/it, loss=0.0345, acc=0.9582, iter_time=7.58s]
Epoch 0: 8%|▊ | 1032/12384 [2:11:25<24:01:11, 7.62s/it, loss=0.0345, acc=0.9582, iter_time=7.58s]
Epoch 0: 8%|▊ | 1032/12384 [2:11:33<24:01:11, 7.62s/it, loss=0.0038, acc=0.9899, iter_time=7.95s]
Epoch 0: 8%|▊ | 1033/12384 [2:11:33<24:16:46, 7.70s/it, loss=0.0038, acc=0.9899, iter_time=7.95s]
Epoch 0: 8%|▊ | 1033/12384 [2:11:41<24:16:46, 7.70s/it, loss=0.0090, acc=0.9815, iter_time=6.13s]
Epoch 0: 8%|▊ | 1034/12384 [2:11:41<24:30:12, 7.77s/it, loss=0.0090, acc=0.9815, iter_time=6.13s]
Epoch 0: 8%|▊ | 1034/12384 [2:11:48<24:30:12, 7.77s/it, loss=0.0084, acc=0.9800, iter_time=9.39s]
Epoch 0: 8%|▊ | 1035/12384 [2:11:48<24:18:44, 7.71s/it, loss=0.0084, acc=0.9800, iter_time=9.39s]
Epoch 0: 8%|▊ | 1035/12384 [2:11:56<24:18:44, 7.71s/it, loss=0.0045, acc=0.9904, iter_time=7.65s]
Epoch 0: 8%|▊ | 1036/12384 [2:11:56<24:15:32, 7.70s/it, loss=0.0045, acc=0.9904, iter_time=7.65s]
Epoch 0: 8%|▊ | 1036/12384 [2:12:04<24:15:32, 7.70s/it, loss=0.0036, acc=0.9908, iter_time=5.34s]
Epoch 0: 8%|▊ | 1037/12384 [2:12:04<24:09:50, 7.67s/it, loss=0.0036, acc=0.9908, iter_time=5.34s]
Epoch 0: 8%|▊ | 1037/12384 [2:12:11<24:09:50, 7.67s/it, loss=0.0056, acc=0.9880, iter_time=9.86s]
Epoch 0: 8%|▊ | 1038/12384 [2:12:11<24:05:28, 7.64s/it, loss=0.0056, acc=0.9880, iter_time=9.86s]
Epoch 0: 8%|▊ | 1038/12384 [2:12:19<24:05:28, 7.64s/it, loss=0.0052, acc=0.9884, iter_time=7.59s]
Epoch 0: 8%|▊ | 1039/12384 [2:12:19<24:02:58, 7.63s/it, loss=0.0052, acc=0.9884, iter_time=7.59s]
Epoch 0: 8%|▊ | 1039/12384 [2:12:26<24:02:58, 7.63s/it, loss=0.0073, acc=0.9914, iter_time=7.99s]
Epoch 0: 8%|▊ | 1040/12384 [2:12:26<24:00:57, 7.62s/it, loss=0.0073, acc=0.9914, iter_time=7.99s]
Epoch 0: 8%|▊ | 1040/12384 [2:12:34<24:00:57, 7.62s/it, loss=0.0017, acc=0.9949, iter_time=4.07s]
Epoch 0: 8%|▊ | 1041/12384 [2:12:34<24:02:27, 7.63s/it, loss=0.0017, acc=0.9949, iter_time=4.07s]
Epoch 0: 8%|▊ | 1041/12384 [2:12:42<24:02:27, 7.63s/it, loss=0.5558, acc=0.7405, iter_time=10.48s]
Epoch 0: 8%|▊ | 1042/12384 [2:12:42<24:00:41, 7.62s/it, loss=0.5558, acc=0.7405, iter_time=10.48s]
Epoch 0: 8%|▊ | 1042/12384 [2:12:49<24:00:41, 7.62s/it, loss=0.0055, acc=0.9913, iter_time=7.91s]
Epoch 0: 8%|▊ | 1043/12384 [2:12:49<23:59:45, 7.62s/it, loss=0.0055, acc=0.9913, iter_time=7.91s]
Epoch 0: 8%|▊ | 1043/12384 [2:12:57<23:59:45, 7.62s/it, loss=0.0042, acc=0.9910, iter_time=4.31s]
Epoch 0: 8%|▊ | 1044/12384 [2:12:57<23:57:44, 7.61s/it, loss=0.0042, acc=0.9910, iter_time=4.31s]
Epoch 0: 8%|▊ | 1044/12384 [2:13:04<23:57:44, 7.61s/it, loss=0.0046, acc=0.9945, iter_time=9.15s]
Epoch 0: 8%|▊ | 1045/12384 [2:13:04<23:56:51, 7.60s/it, loss=0.0046, acc=0.9945, iter_time=9.15s]
Epoch 0: 8%|▊ | 1045/12384 [2:13:12<23:56:51, 7.60s/it, loss=0.0008, acc=0.9980, iter_time=7.06s]
Epoch 0: 8%|▊ | 1046/12384 [2:13:12<24:00:56, 7.63s/it, loss=0.0008, acc=0.9980, iter_time=7.06s]
Epoch 0: 8%|▊ | 1046/12384 [2:13:20<24:00:56, 7.63s/it, loss=0.0018, acc=0.9968, iter_time=9.93s]
Epoch 0: 8%|▊ | 1047/12384 [2:13:20<24:00:56, 7.63s/it, loss=0.0018, acc=0.9968, iter_time=9.93s]
Epoch 0: 8%|▊ | 1047/12384 [2:13:27<24:00:56, 7.63s/it, loss=0.0030, acc=0.9894, iter_time=8.03s]
Epoch 0: 8%|▊ | 1048/12384 [2:13:27<23:59:05, 7.62s/it, loss=0.0030, acc=0.9894, iter_time=8.03s]
Epoch 0: 8%|▊ | 1048/12384 [2:13:35<23:59:05, 7.62s/it, loss=0.0028, acc=0.9957, iter_time=7.20s]
Epoch 0: 8%|▊ | 1049/12384 [2:13:35<23:58:50, 7.62s/it, loss=0.0028, acc=0.9957, iter_time=7.20s]
Epoch 0: 8%|▊ | 1049/12384 [2:13:43<23:58:50, 7.62s/it, loss=0.0150, acc=0.9758, iter_time=8.04s]
Epoch 0: 8%|▊ | 1050/12384 [2:13:43<23:58:56, 7.62s/it, loss=0.0150, acc=0.9758, iter_time=8.04s]
Epoch 0: 8%|▊ | 1050/12384 [2:13:50<23:58:56, 7.62s/it, loss=0.0118, acc=0.9759, iter_time=6.59s]
Epoch 0: 8%|▊ | 1051/12384 [2:13:50<23:57:12, 7.61s/it, loss=0.0118, acc=0.9759, iter_time=6.59s]
Epoch 0: 8%|▊ | 1051/12384 [2:13:58<23:57:12, 7.61s/it, loss=0.0067, acc=0.9829, iter_time=8.20s]
Epoch 0: 8%|▊ | 1052/12384 [2:13:58<23:57:40, 7.61s/it, loss=0.0067, acc=0.9829, iter_time=8.20s]
Epoch 0: 8%|▊ | 1052/12384 [2:14:05<23:57:40, 7.61s/it, loss=0.0014, acc=0.9975, iter_time=4.34s]
Epoch 0: 9%|▊ | 1053/12384 [2:14:05<23:58:06, 7.62s/it, loss=0.0014, acc=0.9975, iter_time=4.34s]
Epoch 0: 9%|▊ | 1053/12384 [2:14:13<23:58:06, 7.62s/it, loss=0.0043, acc=0.9887, iter_time=9.12s]
Epoch 0: 9%|▊ | 1054/12384 [2:14:13<23:56:28, 7.61s/it, loss=0.0043, acc=0.9887, iter_time=9.12s]
Epoch 0: 9%|▊ | 1054/12384 [2:14:21<23:56:28, 7.61s/it, loss=0.0031, acc=0.9946, iter_time=9.37s]
Epoch 0: 9%|▊ | 1055/12384 [2:14:21<23:55:13, 7.60s/it, loss=0.0031, acc=0.9946, iter_time=9.37s]
Epoch 0: 9%|▊ | 1055/12384 [2:14:28<23:55:13, 7.60s/it, loss=0.0053, acc=0.9938, iter_time=7.54s]
Epoch 0: 9%|▊ | 1056/12384 [2:14:28<23:55:32, 7.60s/it, loss=0.0053, acc=0.9938, iter_time=7.54s]
Epoch 0: 9%|▊ | 1056/12384 [2:14:36<23:55:32, 7.60s/it, loss=0.0065, acc=0.9869, iter_time=3.92s]
Epoch 0: 9%|▊ | 1057/12384 [2:14:36<23:54:21, 7.60s/it, loss=0.0065, acc=0.9869, iter_time=3.92s]
Epoch 0: 9%|▊ | 1057/12384 [2:14:43<23:54:21, 7.60s/it, loss=0.0073, acc=0.9860, iter_time=11.30s]
Epoch 0: 9%|▊ | 1058/12384 [2:14:43<23:54:47, 7.60s/it, loss=0.0073, acc=0.9860, iter_time=11.30s]
Epoch 0: 9%|▊ | 1058/12384 [2:14:51<23:54:47, 7.60s/it, loss=0.0016, acc=0.9973, iter_time=7.64s]
Epoch 0: 9%|▊ | 1059/12384 [2:14:51<23:55:20, 7.60s/it, loss=0.0016, acc=0.9973, iter_time=7.64s]
Epoch 0: 9%|▊ | 1059/12384 [2:14:59<23:55:20, 7.60s/it, loss=0.0039, acc=0.9930, iter_time=7.89s]
Epoch 0: 9%|▊ | 1060/12384 [2:14:59<24:11:10, 7.69s/it, loss=0.0039, acc=0.9930, iter_time=7.89s]
Epoch 0: 9%|▊ | 1060/12384 [2:15:07<24:11:10, 7.69s/it, loss=0.0095, acc=0.9816, iter_time=7.67s]
Epoch 0: 9%|▊ | 1061/12384 [2:15:07<24:24:44, 7.76s/it, loss=0.0095, acc=0.9816, iter_time=7.67s]
Epoch 0: 9%|▊ | 1061/12384 [2:15:14<24:24:44, 7.76s/it, loss=0.0258, acc=0.9664, iter_time=7.55s]
Epoch 0: 9%|▊ | 1062/12384 [2:15:14<24:16:07, 7.72s/it, loss=0.0258, acc=0.9664, iter_time=7.55s]
Epoch 0: 9%|▊ | 1062/12384 [2:15:22<24:16:07, 7.72s/it, loss=0.0054, acc=0.9909, iter_time=7.93s]
Epoch 0: 9%|▊ | 1063/12384 [2:15:22<24:10:38, 7.69s/it, loss=0.0054, acc=0.9909, iter_time=7.93s]
Epoch 0: 9%|▊ | 1063/12384 [2:15:30<24:10:38, 7.69s/it, loss=0.0048, acc=0.9945, iter_time=7.98s]
Epoch 0: 9%|▊ | 1064/12384 [2:15:30<24:05:30, 7.66s/it, loss=0.0048, acc=0.9945, iter_time=7.98s]
Epoch 0: 9%|▊ | 1064/12384 [2:15:37<24:05:30, 7.66s/it, loss=0.0020, acc=0.9982, iter_time=4.10s]
Epoch 0: 9%|▊ | 1065/12384 [2:15:37<24:01:35, 7.64s/it, loss=0.0020, acc=0.9982, iter_time=4.10s]
Epoch 0: 9%|▊ | 1065/12384 [2:15:45<24:01:35, 7.64s/it, loss=0.0087, acc=0.9754, iter_time=6.97s]
Epoch 0: 9%|▊ | 1066/12384 [2:15:45<23:59:10, 7.63s/it, loss=0.0087, acc=0.9754, iter_time=6.97s]
Epoch 0: 9%|▊ | 1066/12384 [2:15:52<23:59:10, 7.63s/it, loss=0.0054, acc=0.9916, iter_time=11.33s]
Epoch 0: 9%|▊ | 1067/12384 [2:15:52<23:58:39, 7.63s/it, loss=0.0054, acc=0.9916, iter_time=11.33s]
Epoch 0: 9%|▊ | 1067/12384 [2:16:00<23:58:39, 7.63s/it, loss=0.0053, acc=0.9876, iter_time=7.73s]
Epoch 0: 9%|▊ | 1068/12384 [2:16:00<24:02:21, 7.65s/it, loss=0.0053, acc=0.9876, iter_time=7.73s]
Epoch 0: 9%|▊ | 1068/12384 [2:16:08<24:02:21, 7.65s/it, loss=0.0033, acc=0.9910, iter_time=7.60s]
Epoch 0: 9%|▊ | 1069/12384 [2:16:08<23:59:10, 7.63s/it, loss=0.0033, acc=0.9910, iter_time=7.60s]
Epoch 0: 9%|▊ | 1069/12384 [2:16:15<23:59:10, 7.63s/it, loss=0.0090, acc=0.9896, iter_time=7.59s]
Epoch 0: 9%|▊ | 1070/12384 [2:16:15<23:57:21, 7.62s/it, loss=0.0090, acc=0.9896, iter_time=7.59s]
Epoch 0: 9%|▊ | 1070/12384 [2:16:23<23:57:21, 7.62s/it, loss=0.0053, acc=0.9898, iter_time=7.60s]
Epoch 0: 9%|▊ | 1071/12384 [2:16:23<23:55:03, 7.61s/it, loss=0.0053, acc=0.9898, iter_time=7.60s]
Epoch 0: 9%|▊ | 1071/12384 [2:16:31<23:55:03, 7.61s/it, loss=0.0063, acc=0.9812, iter_time=7.63s]
Epoch 0: 9%|▊ | 1072/12384 [2:16:31<24:00:08, 7.64s/it, loss=0.0063, acc=0.9812, iter_time=7.63s]
Epoch 0: 9%|▊ | 1072/12384 [2:16:38<24:00:08, 7.64s/it, loss=0.0065, acc=0.9817, iter_time=7.65s]
Epoch 0: 9%|▊ | 1073/12384 [2:16:38<23:59:05, 7.63s/it, loss=0.0065, acc=0.9817, iter_time=7.65s]
Epoch 0: 9%|▊ | 1073/12384 [2:16:46<23:59:05, 7.63s/it, loss=0.0020, acc=0.9961, iter_time=5.90s]
Epoch 0: 9%|▊ | 1074/12384 [2:16:46<23:55:56, 7.62s/it, loss=0.0020, acc=0.9961, iter_time=5.90s]
Epoch 0: 9%|▊ | 1074/12384 [2:16:54<23:55:56, 7.62s/it, loss=0.0043, acc=0.9916, iter_time=9.33s]
Epoch 0: 9%|▊ | 1075/12384 [2:16:54<23:59:17, 7.64s/it, loss=0.0043, acc=0.9916, iter_time=9.33s]
Epoch 0: 9%|▊ | 1075/12384 [2:17:01<23:59:17, 7.64s/it, loss=0.0026, acc=0.9923, iter_time=7.67s]
Epoch 0: 9%|▊ | 1076/12384 [2:17:01<24:02:03, 7.65s/it, loss=0.0026, acc=0.9923, iter_time=7.67s]
Epoch 0: 9%|▊ | 1076/12384 [2:17:09<24:02:03, 7.65s/it, loss=0.0029, acc=0.9968, iter_time=7.69s]
Epoch 0: 9%|▊ | 1077/12384 [2:17:09<24:00:00, 7.64s/it, loss=0.0029, acc=0.9968, iter_time=7.69s]
Epoch 0: 9%|▊ | 1077/12384 [2:17:16<24:00:00, 7.64s/it, loss=0.0076, acc=0.9804, iter_time=7.61s]
Epoch 0: 9%|▊ | 1078/12384 [2:17:16<23:57:07, 7.63s/it, loss=0.0076, acc=0.9804, iter_time=7.61s]
Epoch 0: 9%|▊ | 1078/12384 [2:17:24<23:57:07, 7.63s/it, loss=0.0087, acc=0.9875, iter_time=7.60s]
Epoch 0: 9%|▊ | 1079/12384 [2:17:24<23:55:36, 7.62s/it, loss=0.0087, acc=0.9875, iter_time=7.60s]
Epoch 0: 9%|▊ | 1079/12384 [2:17:32<23:55:36, 7.62s/it, loss=0.0032, acc=0.9944, iter_time=7.99s]
Epoch 0: 9%|▊ | 1080/12384 [2:17:32<23:54:28, 7.61s/it, loss=0.0032, acc=0.9944, iter_time=7.99s]
Epoch 0: 9%|▊ | 1080/12384 [2:17:39<23:54:28, 7.61s/it, loss=0.0122, acc=0.9817, iter_time=7.21s]
Epoch 0: 9%|▊ | 1081/12384 [2:17:39<23:56:59, 7.63s/it, loss=0.0122, acc=0.9817, iter_time=7.21s]
Epoch 0: 9%|▊ | 1081/12384 [2:17:47<23:56:59, 7.63s/it, loss=0.0037, acc=0.9943, iter_time=7.66s]
Epoch 0: 9%|▊ | 1082/12384 [2:17:47<23:55:05, 7.62s/it, loss=0.0037, acc=0.9943, iter_time=7.66s]
Epoch 0: 9%|▊ | 1082/12384 [2:17:55<23:55:05, 7.62s/it, loss=0.0018, acc=0.9940, iter_time=4.53s]
Epoch 0: 9%|▊ | 1083/12384 [2:17:55<23:56:26, 7.63s/it, loss=0.0018, acc=0.9940, iter_time=4.53s]
Epoch 0: 9%|▊ | 1083/12384 [2:18:02<23:56:26, 7.63s/it, loss=0.0023, acc=0.9947, iter_time=10.70s]
Epoch 0: 9%|▉ | 1084/12384 [2:18:02<23:54:21, 7.62s/it, loss=0.0023, acc=0.9947, iter_time=10.70s]
Epoch 0: 9%|▉ | 1084/12384 [2:18:10<23:54:21, 7.62s/it, loss=0.0038, acc=0.9896, iter_time=7.60s]
Epoch 0: 9%|▉ | 1085/12384 [2:18:10<23:54:14, 7.62s/it, loss=0.0038, acc=0.9896, iter_time=7.60s]
Epoch 0: 9%|▉ | 1085/12384 [2:18:17<23:54:14, 7.62s/it, loss=0.0028, acc=0.9967, iter_time=7.61s]
Epoch 0: 9%|▉ | 1086/12384 [2:18:17<23:52:59, 7.61s/it, loss=0.0028, acc=0.9967, iter_time=7.61s]
Epoch 0: 9%|▉ | 1086/12384 [2:18:25<23:52:59, 7.61s/it, loss=0.0043, acc=0.9921, iter_time=7.90s]
Epoch 0: 9%|▉ | 1087/12384 [2:18:25<24:11:32, 7.71s/it, loss=0.0043, acc=0.9921, iter_time=7.90s]
Epoch 0: 9%|▉ | 1087/12384 [2:18:33<24:11:32, 7.71s/it, loss=0.0035, acc=0.9913, iter_time=7.67s]
Epoch 0: 9%|▉ | 1088/12384 [2:18:33<24:10:18, 7.70s/it, loss=0.0035, acc=0.9913, iter_time=7.67s]
Epoch 0: 9%|▉ | 1088/12384 [2:18:41<24:10:18, 7.70s/it, loss=0.0070, acc=0.9895, iter_time=7.65s]
Epoch 0: 9%|▉ | 1089/12384 [2:18:41<24:09:20, 7.70s/it, loss=0.0070, acc=0.9895, iter_time=7.65s]
Epoch 0: 9%|▉ | 1089/12384 [2:18:48<24:09:20, 7.70s/it, loss=0.0073, acc=0.9904, iter_time=7.70s]
Epoch 0: 9%|▉ | 1090/12384 [2:18:48<24:03:46, 7.67s/it, loss=0.0073, acc=0.9904, iter_time=7.70s]
Epoch 0: 9%|▉ | 1090/12384 [2:18:56<24:03:46, 7.67s/it, loss=0.0016, acc=0.9979, iter_time=7.61s]
Epoch 0: 9%|▉ | 1091/12384 [2:18:56<24:00:24, 7.65s/it, loss=0.0016, acc=0.9979, iter_time=7.61s]
Epoch 0: 9%|▉ | 1091/12384 [2:19:04<24:00:24, 7.65s/it, loss=0.0028, acc=0.9936, iter_time=7.64s]
Epoch 0: 9%|▉ | 1092/12384 [2:19:04<23:58:30, 7.64s/it, loss=0.0028, acc=0.9936, iter_time=7.64s]
Epoch 0: 9%|▉ | 1092/12384 [2:19:11<23:58:30, 7.64s/it, loss=0.0009, acc=0.9965, iter_time=4.30s]
Epoch 0: 9%|▉ | 1093/12384 [2:19:11<23:55:16, 7.63s/it, loss=0.0009, acc=0.9965, iter_time=4.30s]
Epoch 0: 9%|▉ | 1093/12384 [2:19:19<23:55:16, 7.63s/it, loss=0.0038, acc=0.9918, iter_time=10.89s]
Epoch 0: 9%|▉ | 1094/12384 [2:19:19<23:53:57, 7.62s/it, loss=0.0038, acc=0.9918, iter_time=10.89s]
Epoch 0: 9%|▉ | 1094/12384 [2:19:26<23:53:57, 7.62s/it, loss=0.0014, acc=0.9980, iter_time=4.29s]
Epoch 0: 9%|▉ | 1095/12384 [2:19:26<23:59:23, 7.65s/it, loss=0.0014, acc=0.9980, iter_time=4.29s]
Epoch 0: 9%|▉ | 1095/12384 [2:19:34<23:59:23, 7.65s/it, loss=0.0019, acc=0.9985, iter_time=11.41s]
Epoch 0: 9%|▉ | 1096/12384 [2:19:34<24:03:22, 7.67s/it, loss=0.0019, acc=0.9985, iter_time=11.41s]
Epoch 0: 9%|▉ | 1096/12384 [2:19:42<24:03:22, 7.67s/it, loss=0.0029, acc=0.9892, iter_time=7.35s]
Epoch 0: 9%|▉ | 1097/12384 [2:19:42<24:00:26, 7.66s/it, loss=0.0029, acc=0.9892, iter_time=7.35s]
Epoch 0: 9%|▉ | 1097/12384 [2:19:49<24:00:26, 7.66s/it, loss=0.0052, acc=0.9867, iter_time=7.63s]
Epoch 0: 9%|▉ | 1098/12384 [2:19:49<23:58:19, 7.65s/it, loss=0.0052, acc=0.9867, iter_time=7.63s]
Epoch 0: 9%|▉ | 1098/12384 [2:19:57<23:58:19, 7.65s/it, loss=0.0035, acc=0.9950, iter_time=7.62s]
Epoch 0: 9%|▉ | 1099/12384 [2:19:57<23:56:43, 7.64s/it, loss=0.0035, acc=0.9950, iter_time=7.62s]
Epoch 0: 9%|▉ | 1099/12384 [2:20:05<23:56:43, 7.64s/it, loss=0.0020, acc=0.9967, iter_time=8.07s]
Epoch 0: 9%|▉ | 1100/12384 [2:20:05<23:57:46, 7.65s/it, loss=0.0020, acc=0.9967, iter_time=8.07s]
Epoch 0: 9%|▉ | 1100/12384 [2:20:12<23:57:46, 7.65s/it, loss=0.0110, acc=0.9828, iter_time=4.90s]
Epoch 0: 9%|▉ | 1101/12384 [2:20:12<23:55:30, 7.63s/it, loss=0.0110, acc=0.9828, iter_time=4.90s]
Epoch 0: 9%|▉ | 1101/12384 [2:20:20<23:55:30, 7.63s/it, loss=0.0032, acc=0.9938, iter_time=9.90s]
Epoch 0: 9%|▉ | 1102/12384 [2:20:20<23:53:58, 7.63s/it, loss=0.0032, acc=0.9938, iter_time=9.90s]
Epoch 0: 9%|▉ | 1102/12384 [2:20:27<23:53:58, 7.63s/it, loss=0.0046, acc=0.9931, iter_time=7.63s]
Epoch 0: 9%|▉ | 1103/12384 [2:20:27<23:53:02, 7.62s/it, loss=0.0046, acc=0.9931, iter_time=7.63s]
Epoch 0: 9%|▉ | 1103/12384 [2:20:35<23:53:02, 7.62s/it, loss=0.0012, acc=0.9977, iter_time=7.98s]
Epoch 0: 9%|▉ | 1104/12384 [2:20:35<23:51:12, 7.61s/it, loss=0.0012, acc=0.9977, iter_time=7.98s]
Epoch 0: 9%|▉ | 1104/12384 [2:20:43<23:51:12, 7.61s/it, loss=0.0027, acc=0.9968, iter_time=7.21s]
Epoch 0: 9%|▉ | 1105/12384 [2:20:43<23:55:01, 7.63s/it, loss=0.0027, acc=0.9968, iter_time=7.21s]
Epoch 0: 9%|▉ | 1105/12384 [2:20:50<23:55:01, 7.63s/it, loss=0.0031, acc=0.9918, iter_time=7.70s]
Epoch 0: 9%|▉ | 1106/12384 [2:20:50<23:59:51, 7.66s/it, loss=0.0031, acc=0.9918, iter_time=7.70s]
Epoch 0: 9%|▉ | 1106/12384 [2:20:58<23:59:51, 7.66s/it, loss=0.0142, acc=0.9920, iter_time=7.16s]
Epoch 0: 9%|▉ | 1107/12384 [2:20:58<23:57:03, 7.65s/it, loss=0.0142, acc=0.9920, iter_time=7.16s]
Epoch 0: 9%|▉ | 1107/12384 [2:21:06<23:57:03, 7.65s/it, loss=0.0018, acc=0.9976, iter_time=8.18s]
Epoch 0: 9%|▉ | 1108/12384 [2:21:06<23:55:30, 7.64s/it, loss=0.0018, acc=0.9976, iter_time=8.18s]
Epoch 0: 9%|▉ | 1108/12384 [2:21:13<23:55:30, 7.64s/it, loss=0.0029, acc=0.9922, iter_time=7.61s]
Epoch 0: 9%|▉ | 1109/12384 [2:21:13<23:53:09, 7.63s/it, loss=0.0029, acc=0.9922, iter_time=7.61s]
Epoch 0: 9%|▉ | 1109/12384 [2:21:21<23:53:09, 7.63s/it, loss=0.0024, acc=0.9972, iter_time=7.60s]
Epoch 0: 9%|▉ | 1110/12384 [2:21:21<23:52:44, 7.63s/it, loss=0.0024, acc=0.9972, iter_time=7.60s]
Epoch 0: 9%|▉ | 1110/12384 [2:21:29<23:52:44, 7.63s/it, loss=0.0018, acc=0.9967, iter_time=7.63s]
Epoch 0: 9%|▉ | 1111/12384 [2:21:29<23:52:19, 7.62s/it, loss=0.0018, acc=0.9967, iter_time=7.63s]
Epoch 0: 9%|▉ | 1111/12384 [2:21:36<23:52:19, 7.62s/it, loss=0.0011, acc=1.0000, iter_time=8.29s]
Epoch 0: 9%|▉ | 1112/12384 [2:21:36<24:07:12, 7.70s/it, loss=0.0011, acc=1.0000, iter_time=8.29s]
Epoch 0: 9%|▉ | 1112/12384 [2:21:44<24:07:12, 7.70s/it, loss=0.0023, acc=0.9968, iter_time=7.25s]
Epoch 0: 9%|▉ | 1113/12384 [2:21:44<24:21:22, 7.78s/it, loss=0.0023, acc=0.9968, iter_time=7.25s]
Epoch 0: 9%|▉ | 1113/12384 [2:21:52<24:21:22, 7.78s/it, loss=0.0053, acc=0.9885, iter_time=5.62s]
Epoch 0: 9%|▉ | 1114/12384 [2:21:52<24:12:02, 7.73s/it, loss=0.0053, acc=0.9885, iter_time=5.62s]
Epoch 0: 9%|▉ | 1114/12384 [2:22:00<24:12:02, 7.73s/it, loss=0.0067, acc=0.9906, iter_time=9.92s]
Epoch 0: 9%|▉ | 1115/12384 [2:22:00<24:05:30, 7.70s/it, loss=0.0067, acc=0.9906, iter_time=9.92s]
Epoch 0: 9%|▉ | 1115/12384 [2:22:07<24:05:30, 7.70s/it, loss=0.0035, acc=0.9925, iter_time=4.30s]
Epoch 0: 9%|▉ | 1116/12384 [2:22:07<24:00:23, 7.67s/it, loss=0.0035, acc=0.9925, iter_time=4.30s]
Epoch 0: 9%|▉ | 1116/12384 [2:22:15<24:00:23, 7.67s/it, loss=0.0171, acc=0.9726, iter_time=10.91s]
Epoch 0: 9%|▉ | 1117/12384 [2:22:15<23:56:36, 7.65s/it, loss=0.0171, acc=0.9726, iter_time=10.91s]
Epoch 0: 9%|▉ | 1117/12384 [2:22:22<23:56:36, 7.65s/it, loss=0.0035, acc=0.9873, iter_time=7.61s]
Epoch 0: 9%|▉ | 1118/12384 [2:22:22<23:54:38, 7.64s/it, loss=0.0035, acc=0.9873, iter_time=7.61s]
Epoch 0: 9%|▉ | 1118/12384 [2:22:30<23:54:38, 7.64s/it, loss=0.0045, acc=0.9943, iter_time=7.62s]
Epoch 0: 9%|▉ | 1119/12384 [2:22:30<23:52:01, 7.63s/it, loss=0.0045, acc=0.9943, iter_time=7.62s]
Epoch 0: 9%|▉ | 1119/12384 [2:22:38<23:52:01, 7.63s/it, loss=0.0035, acc=0.9865, iter_time=7.54s]
Epoch 0: 9%|▉ | 1120/12384 [2:22:38<23:49:58, 7.62s/it, loss=0.0035, acc=0.9865, iter_time=7.54s]
Epoch 0: 9%|▉ | 1120/12384 [2:22:45<23:49:58, 7.62s/it, loss=0.0033, acc=0.9965, iter_time=7.62s]
Epoch 0: 9%|▉ | 1121/12384 [2:22:45<23:48:32, 7.61s/it, loss=0.0033, acc=0.9965, iter_time=7.62s]
Epoch 0: 9%|▉ | 1121/12384 [2:22:53<23:48:32, 7.61s/it, loss=0.0045, acc=0.9883, iter_time=7.07s]
Epoch 0: 9%|▉ | 1122/12384 [2:22:53<23:48:03, 7.61s/it, loss=0.0045, acc=0.9883, iter_time=7.07s]
Epoch 0: 9%|▉ | 1122/12384 [2:23:00<23:48:03, 7.61s/it, loss=0.0034, acc=0.9950, iter_time=4.43s]
Epoch 0: 9%|▉ | 1123/12384 [2:23:00<23:47:31, 7.61s/it, loss=0.0034, acc=0.9950, iter_time=4.43s]
Epoch 0: 9%|▉ | 1123/12384 [2:23:08<23:47:31, 7.61s/it, loss=0.0018, acc=0.9946, iter_time=11.10s]
Epoch 0: 9%|▉ | 1124/12384 [2:23:08<23:47:41, 7.61s/it, loss=0.0018, acc=0.9946, iter_time=11.10s]
Epoch 0: 9%|▉ | 1124/12384 [2:23:16<23:47:41, 7.61s/it, loss=0.0025, acc=0.9956, iter_time=7.85s]
Epoch 0: 9%|▉ | 1125/12384 [2:23:16<23:47:09, 7.61s/it, loss=0.0025, acc=0.9956, iter_time=7.85s]
Epoch 0: 9%|▉ | 1125/12384 [2:23:23<23:47:09, 7.61s/it, loss=0.0030, acc=0.9933, iter_time=6.15s]
Epoch 0: 9%|▉ | 1126/12384 [2:23:23<23:46:38, 7.60s/it, loss=0.0030, acc=0.9933, iter_time=6.15s]
Epoch 0: 9%|▉ | 1126/12384 [2:23:31<23:46:38, 7.60s/it, loss=0.0015, acc=0.9988, iter_time=9.11s]
Epoch 0: 9%|▉ | 1127/12384 [2:23:31<23:49:41, 7.62s/it, loss=0.0015, acc=0.9988, iter_time=9.11s]
Epoch 0: 9%|▉ | 1127/12384 [2:23:39<23:49:41, 7.62s/it, loss=0.0020, acc=0.9968, iter_time=7.98s]
Epoch 0: 9%|▉ | 1128/12384 [2:23:39<23:47:53, 7.61s/it, loss=0.0020, acc=0.9968, iter_time=7.98s]
Epoch 0: 9%|▉ | 1128/12384 [2:23:46<23:47:53, 7.61s/it, loss=0.0019, acc=0.9998, iter_time=4.18s]
Epoch 0: 9%|▉ | 1129/12384 [2:23:46<23:46:53, 7.61s/it, loss=0.0019, acc=0.9998, iter_time=4.18s]
Epoch 0: 9%|▉ | 1129/12384 [2:23:54<23:46:53, 7.61s/it, loss=0.0020, acc=0.9953, iter_time=9.11s]
Epoch 0: 9%|▉ | 1130/12384 [2:23:54<23:45:37, 7.60s/it, loss=0.0020, acc=0.9953, iter_time=9.11s]
Epoch 0: 9%|▉ | 1130/12384 [2:24:01<23:45:37, 7.60s/it, loss=0.0049, acc=0.9911, iter_time=9.09s]
Epoch 0: 9%|▉ | 1131/12384 [2:24:01<23:45:21, 7.60s/it, loss=0.0049, acc=0.9911, iter_time=9.09s]
Epoch 0: 9%|▉ | 1131/12384 [2:24:09<23:45:21, 7.60s/it, loss=0.0023, acc=0.9956, iter_time=7.62s]
Epoch 0: 9%|▉ | 1132/12384 [2:24:09<23:46:23, 7.61s/it, loss=0.0023, acc=0.9956, iter_time=7.62s]
Epoch 0: 9%|▉ | 1132/12384 [2:24:17<23:46:23, 7.61s/it, loss=0.0060, acc=0.9853, iter_time=7.30s]
Epoch 0: 9%|▉ | 1133/12384 [2:24:17<23:45:03, 7.60s/it, loss=0.0060, acc=0.9853, iter_time=7.30s]
Epoch 0: 9%|▉ | 1133/12384 [2:24:24<23:45:03, 7.60s/it, loss=0.0063, acc=0.9848, iter_time=6.69s]
Epoch 0: 9%|▉ | 1134/12384 [2:24:24<23:46:41, 7.61s/it, loss=0.0063, acc=0.9848, iter_time=6.69s]
Epoch 0: 9%|▉ | 1134/12384 [2:24:32<23:46:41, 7.61s/it, loss=0.0059, acc=0.9877, iter_time=7.89s]
Epoch 0: 9%|▉ | 1135/12384 [2:24:32<23:47:35, 7.61s/it, loss=0.0059, acc=0.9877, iter_time=7.89s]
Epoch 0: 9%|▉ | 1135/12384 [2:24:39<23:47:35, 7.61s/it, loss=0.0018, acc=0.9956, iter_time=8.97s]
Epoch 0: 9%|▉ | 1136/12384 [2:24:39<23:47:48, 7.62s/it, loss=0.0018, acc=0.9956, iter_time=8.97s]
Epoch 0: 9%|▉ | 1136/12384 [2:24:47<23:47:48, 7.62s/it, loss=0.0029, acc=0.9927, iter_time=7.21s]
Epoch 0: 9%|▉ | 1137/12384 [2:24:47<23:46:19, 7.61s/it, loss=0.0029, acc=0.9927, iter_time=7.21s]
Epoch 0: 9%|▉ | 1137/12384 [2:24:55<23:46:19, 7.61s/it, loss=0.0017, acc=0.9974, iter_time=7.88s]
Epoch 0: 9%|▉ | 1138/12384 [2:24:55<23:59:56, 7.68s/it, loss=0.0017, acc=0.9974, iter_time=7.88s]
Epoch 0: 9%|▉ | 1138/12384 [2:25:03<23:59:56, 7.68s/it, loss=0.0089, acc=0.9795, iter_time=7.63s]
Epoch 0: 9%|▉ | 1139/12384 [2:25:03<24:14:23, 7.76s/it, loss=0.0089, acc=0.9795, iter_time=7.63s]
Epoch 0: 9%|▉ | 1139/12384 [2:25:10<24:14:23, 7.76s/it, loss=0.0016, acc=0.9982, iter_time=5.41s]
Epoch 0: 9%|▉ | 1140/12384 [2:25:10<24:11:47, 7.75s/it, loss=0.0016, acc=0.9982, iter_time=5.41s]
Epoch 0: 9%|▉ | 1140/12384 [2:25:18<24:11:47, 7.75s/it, loss=0.0015, acc=0.9978, iter_time=10.25s]
Epoch 0: 9%|▉ | 1141/12384 [2:25:18<24:05:00, 7.71s/it, loss=0.0015, acc=0.9978, iter_time=10.25s]
Epoch 0: 9%|▉ | 1141/12384 [2:25:26<24:05:00, 7.71s/it, loss=0.0026, acc=0.9950, iter_time=5.08s]
Epoch 0: 9%|▉ | 1142/12384 [2:25:26<24:03:33, 7.70s/it, loss=0.0026, acc=0.9950, iter_time=5.08s]
Epoch 0: 9%|▉ | 1142/12384 [2:25:34<24:03:33, 7.70s/it, loss=0.0012, acc=0.9982, iter_time=9.41s]
Epoch 0: 9%|▉ | 1143/12384 [2:25:34<24:42:47, 7.91s/it, loss=0.0012, acc=0.9982, iter_time=9.41s]
Epoch 0: 9%|▉ | 1143/12384 [2:25:43<24:42:47, 7.91s/it, loss=0.0024, acc=0.9922, iter_time=10.29s]
Epoch 0: 9%|▉ | 1144/12384 [2:25:43<25:04:27, 8.03s/it, loss=0.0024, acc=0.9922, iter_time=10.29s]
Epoch 0: 9%|▉ | 1144/12384 [2:25:51<25:04:27, 8.03s/it, loss=0.0043, acc=0.9876, iter_time=7.62s]
Epoch 0: 9%|▉ | 1145/12384 [2:25:51<25:08:47, 8.05s/it, loss=0.0043, acc=0.9876, iter_time=7.62s]
Epoch 0: 9%|▉ | 1145/12384 [2:25:58<25:08:47, 8.05s/it, loss=0.0020, acc=0.9979, iter_time=6.26s]
Epoch 0: 9%|▉ | 1146/12384 [2:25:58<24:48:01, 7.94s/it, loss=0.0020, acc=0.9979, iter_time=6.26s]
Epoch 0: 9%|▉ | 1146/12384 [2:26:06<24:48:01, 7.94s/it, loss=0.0052, acc=0.9948, iter_time=9.18s]
Epoch 0: 9%|▉ | 1147/12384 [2:26:06<24:35:18, 7.88s/it, loss=0.0052, acc=0.9948, iter_time=9.18s]
Epoch 0: 9%|▉ | 1147/12384 [2:26:14<24:35:18, 7.88s/it, loss=0.0019, acc=0.9983, iter_time=4.43s]
Epoch 0: 9%|▉ | 1148/12384 [2:26:14<24:25:18, 7.82s/it, loss=0.0019, acc=0.9983, iter_time=4.43s]
Epoch 0: 9%|▉ | 1148/12384 [2:26:21<24:25:18, 7.82s/it, loss=0.0029, acc=0.9921, iter_time=11.04s]
Epoch 0: 9%|▉ | 1149/12384 [2:26:21<24:18:21, 7.79s/it, loss=0.0029, acc=0.9921, iter_time=11.04s]
Epoch 0: 9%|▉ | 1149/12384 [2:26:29<24:18:21, 7.79s/it, loss=0.0054, acc=0.9856, iter_time=8.08s]
Epoch 0: 9%|▉ | 1150/12384 [2:26:29<24:11:45, 7.75s/it, loss=0.0054, acc=0.9856, iter_time=8.08s]
Epoch 0: 9%|▉ | 1150/12384 [2:26:37<24:11:45, 7.75s/it, loss=0.0021, acc=0.9958, iter_time=7.27s]
Epoch 0: 9%|▉ | 1151/12384 [2:26:37<24:09:17, 7.74s/it, loss=0.0021, acc=0.9958, iter_time=7.27s]
Epoch 0: 9%|▉ | 1151/12384 [2:26:45<24:09:17, 7.74s/it, loss=0.0022, acc=0.9931, iter_time=7.67s]
Epoch 0: 9%|▉ | 1152/12384 [2:26:45<24:05:29, 7.72s/it, loss=0.0022, acc=0.9931, iter_time=7.67s]
Epoch 0: 9%|▉ | 1152/12384 [2:26:52<24:05:29, 7.72s/it, loss=0.0060, acc=0.9890, iter_time=5.67s]
Epoch 0: 9%|▉ | 1153/12384 [2:26:52<23:59:12, 7.69s/it, loss=0.0060, acc=0.9890, iter_time=5.67s]
Epoch 0: 9%|▉ | 1153/12384 [2:27:00<23:59:12, 7.69s/it, loss=0.0011, acc=0.9975, iter_time=5.86s]
Epoch 0: 9%|▉ | 1154/12384 [2:27:00<23:55:58, 7.67s/it, loss=0.0011, acc=0.9975, iter_time=5.86s]
Epoch 0: 9%|▉ | 1154/12384 [2:27:07<23:55:58, 7.67s/it, loss=0.0010, acc=0.9977, iter_time=9.89s]
Epoch 0: 9%|▉ | 1155/12384 [2:27:07<23:51:55, 7.65s/it, loss=0.0010, acc=0.9977, iter_time=9.89s]
Epoch 0: 9%|▉ | 1155/12384 [2:27:15<23:51:55, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=9.09s]
Epoch 0: 9%|▉ | 1156/12384 [2:27:15<23:51:07, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=9.09s]
Epoch 0: 9%|▉ | 1156/12384 [2:27:23<23:51:07, 7.65s/it, loss=0.0032, acc=0.9940, iter_time=4.80s]
Epoch 0: 9%|▉ | 1157/12384 [2:27:23<23:48:36, 7.63s/it, loss=0.0032, acc=0.9940, iter_time=4.80s]
Epoch 0: 9%|▉ | 1157/12384 [2:27:30<23:48:36, 7.63s/it, loss=0.0026, acc=0.9946, iter_time=7.59s]
Epoch 0: 9%|▉ | 1158/12384 [2:27:30<23:55:09, 7.67s/it, loss=0.0026, acc=0.9946, iter_time=7.59s]
Epoch 0: 9%|▉ | 1158/12384 [2:27:38<23:55:09, 7.67s/it, loss=0.0033, acc=0.9901, iter_time=10.62s]
Epoch 0: 9%|▉ | 1159/12384 [2:27:38<23:51:37, 7.65s/it, loss=0.0033, acc=0.9901, iter_time=10.62s]
Epoch 0: 9%|▉ | 1159/12384 [2:27:46<23:51:37, 7.65s/it, loss=0.0084, acc=0.9832, iter_time=7.99s]
Epoch 0: 9%|▉ | 1160/12384 [2:27:46<23:51:29, 7.65s/it, loss=0.0084, acc=0.9832, iter_time=7.99s]
Epoch 0: 9%|▉ | 1160/12384 [2:27:53<23:51:29, 7.65s/it, loss=0.0026, acc=0.9970, iter_time=7.28s]
Epoch 0: 9%|▉ | 1161/12384 [2:27:53<23:49:38, 7.64s/it, loss=0.0026, acc=0.9970, iter_time=7.28s]
Epoch 0: 9%|▉ | 1161/12384 [2:28:01<23:49:38, 7.64s/it, loss=0.0020, acc=0.9977, iter_time=7.62s]
Epoch 0: 9%|▉ | 1162/12384 [2:28:01<23:47:17, 7.63s/it, loss=0.0020, acc=0.9977, iter_time=7.62s]
Epoch 0: 9%|▉ | 1162/12384 [2:28:08<23:47:17, 7.63s/it, loss=0.0059, acc=0.9853, iter_time=7.62s]
Epoch 0: 9%|▉ | 1163/12384 [2:28:08<23:48:21, 7.64s/it, loss=0.0059, acc=0.9853, iter_time=7.62s]
Epoch 0: 9%|▉ | 1163/12384 [2:28:16<23:48:21, 7.64s/it, loss=0.0029, acc=0.9930, iter_time=7.65s]
Epoch 0: 9%|▉ | 1164/12384 [2:28:16<23:48:48, 7.64s/it, loss=0.0029, acc=0.9930, iter_time=7.65s]
Epoch 0: 9%|▉ | 1164/12384 [2:28:24<23:48:48, 7.64s/it, loss=0.0025, acc=0.9942, iter_time=7.93s]
Epoch 0: 9%|▉ | 1165/12384 [2:28:24<24:07:52, 7.74s/it, loss=0.0025, acc=0.9942, iter_time=7.93s]
Epoch 0: 9%|▉ | 1165/12384 [2:28:32<24:07:52, 7.74s/it, loss=0.0023, acc=0.9957, iter_time=5.89s]
Epoch 0: 9%|▉ | 1166/12384 [2:28:32<23:59:59, 7.70s/it, loss=0.0023, acc=0.9957, iter_time=5.89s]
Epoch 0: 9%|▉ | 1166/12384 [2:28:39<23:59:59, 7.70s/it, loss=0.0065, acc=0.9911, iter_time=9.41s]
Epoch 0: 9%|▉ | 1167/12384 [2:28:39<23:56:38, 7.68s/it, loss=0.0065, acc=0.9911, iter_time=9.41s]
Epoch 0: 9%|▉ | 1167/12384 [2:28:47<23:56:38, 7.68s/it, loss=0.0015, acc=0.9978, iter_time=8.04s]
Epoch 0: 9%|▉ | 1168/12384 [2:28:47<23:54:15, 7.67s/it, loss=0.0015, acc=0.9978, iter_time=8.04s]
Epoch 0: 9%|▉ | 1168/12384 [2:28:55<23:54:15, 7.67s/it, loss=0.0034, acc=0.9889, iter_time=7.23s]
Epoch 0: 9%|▉ | 1169/12384 [2:28:55<23:50:43, 7.65s/it, loss=0.0034, acc=0.9889, iter_time=7.23s]
Epoch 0: 9%|▉ | 1169/12384 [2:29:02<23:50:43, 7.65s/it, loss=0.0009, acc=0.9990, iter_time=5.84s]
Epoch 0: 9%|▉ | 1170/12384 [2:29:02<23:50:37, 7.65s/it, loss=0.0009, acc=0.9990, iter_time=5.84s]
Epoch 0: 9%|▉ | 1170/12384 [2:29:10<23:50:37, 7.65s/it, loss=0.0048, acc=0.9914, iter_time=9.45s]
Epoch 0: 9%|▉ | 1171/12384 [2:29:10<23:49:47, 7.65s/it, loss=0.0048, acc=0.9914, iter_time=9.45s]
Epoch 0: 9%|▉ | 1171/12384 [2:29:18<23:49:47, 7.65s/it, loss=0.0080, acc=0.9851, iter_time=7.64s]
Epoch 0: 9%|▉ | 1172/12384 [2:29:18<23:49:34, 7.65s/it, loss=0.0080, acc=0.9851, iter_time=7.64s]
Epoch 0: 9%|▉ | 1172/12384 [2:29:25<23:49:34, 7.65s/it, loss=0.0085, acc=0.9865, iter_time=7.63s]
Epoch 0: 9%|▉ | 1173/12384 [2:29:25<23:47:14, 7.64s/it, loss=0.0085, acc=0.9865, iter_time=7.63s]
Epoch 0: 9%|▉ | 1173/12384 [2:29:33<23:47:14, 7.64s/it, loss=0.0014, acc=0.9965, iter_time=7.63s]
Epoch 0: 9%|▉ | 1174/12384 [2:29:33<23:49:27, 7.65s/it, loss=0.0014, acc=0.9965, iter_time=7.63s]
Epoch 0: 9%|▉ | 1174/12384 [2:29:40<23:49:27, 7.65s/it, loss=0.0007, acc=0.9980, iter_time=5.05s]
Epoch 0: 9%|▉ | 1175/12384 [2:29:40<23:46:19, 7.63s/it, loss=0.0007, acc=0.9980, iter_time=5.05s]
Epoch 0: 9%|▉ | 1175/12384 [2:29:48<23:46:19, 7.63s/it, loss=0.0024, acc=0.9959, iter_time=10.58s]
Epoch 0: 9%|▉ | 1176/12384 [2:29:48<23:44:17, 7.62s/it, loss=0.0024, acc=0.9959, iter_time=10.58s]
Epoch 0: 9%|▉ | 1176/12384 [2:29:56<23:44:17, 7.62s/it, loss=0.0027, acc=0.9958, iter_time=7.21s]
Epoch 0: 10%|▉ | 1177/12384 [2:29:56<23:41:59, 7.61s/it, loss=0.0027, acc=0.9958, iter_time=7.21s]
Epoch 0: 10%|▉ | 1177/12384 [2:30:03<23:41:59, 7.61s/it, loss=0.0034, acc=0.9944, iter_time=7.60s]
Epoch 0: 10%|▉ | 1178/12384 [2:30:03<23:40:52, 7.61s/it, loss=0.0034, acc=0.9944, iter_time=7.60s]
Epoch 0: 10%|▉ | 1178/12384 [2:30:11<23:40:52, 7.61s/it, loss=0.0028, acc=0.9944, iter_time=7.59s]
Epoch 0: 10%|▉ | 1179/12384 [2:30:11<23:43:21, 7.62s/it, loss=0.0028, acc=0.9944, iter_time=7.59s]
Epoch 0: 10%|▉ | 1179/12384 [2:30:18<23:43:21, 7.62s/it, loss=0.0004, acc=1.0000, iter_time=7.65s]
Epoch 0: 10%|▉ | 1180/12384 [2:30:18<23:41:36, 7.61s/it, loss=0.0004, acc=1.0000, iter_time=7.65s]
Epoch 0: 10%|▉ | 1180/12384 [2:30:26<23:41:36, 7.61s/it, loss=0.0013, acc=0.9968, iter_time=6.38s]
Epoch 0: 10%|▉ | 1181/12384 [2:30:26<23:37:06, 7.59s/it, loss=0.0013, acc=0.9968, iter_time=6.38s]
Epoch 0: 10%|▉ | 1181/12384 [2:30:34<23:37:06, 7.59s/it, loss=0.0040, acc=0.9926, iter_time=8.76s]
Epoch 0: 10%|▉ | 1182/12384 [2:30:34<23:37:24, 7.59s/it, loss=0.0040, acc=0.9926, iter_time=8.76s]
Epoch 0: 10%|▉ | 1182/12384 [2:30:41<23:37:24, 7.59s/it, loss=0.0040, acc=0.9918, iter_time=5.51s]
Epoch 0: 10%|▉ | 1183/12384 [2:30:41<23:37:25, 7.59s/it, loss=0.0040, acc=0.9918, iter_time=5.51s]
Epoch 0: 10%|▉ | 1183/12384 [2:30:49<23:37:25, 7.59s/it, loss=0.0034, acc=0.9964, iter_time=9.62s]
Epoch 0: 10%|▉ | 1184/12384 [2:30:49<23:37:21, 7.59s/it, loss=0.0034, acc=0.9964, iter_time=9.62s]
Epoch 0: 10%|▉ | 1184/12384 [2:30:56<23:37:21, 7.59s/it, loss=0.0060, acc=0.9922, iter_time=7.65s]
Epoch 0: 10%|▉ | 1185/12384 [2:30:56<23:38:10, 7.60s/it, loss=0.0060, acc=0.9922, iter_time=7.65s]
Epoch 0: 10%|▉ | 1185/12384 [2:31:04<23:38:10, 7.60s/it, loss=0.0023, acc=0.9958, iter_time=7.61s]
Epoch 0: 10%|▉ | 1186/12384 [2:31:04<23:38:02, 7.60s/it, loss=0.0023, acc=0.9958, iter_time=7.61s]
Epoch 0: 10%|▉ | 1186/12384 [2:31:12<23:38:02, 7.60s/it, loss=0.0068, acc=0.9873, iter_time=7.71s]
Epoch 0: 10%|▉ | 1187/12384 [2:31:12<23:44:00, 7.63s/it, loss=0.0068, acc=0.9873, iter_time=7.71s]
Epoch 0: 10%|▉ | 1187/12384 [2:31:19<23:44:00, 7.63s/it, loss=0.0028, acc=0.9921, iter_time=7.61s]
Epoch 0: 10%|▉ | 1188/12384 [2:31:19<23:43:35, 7.63s/it, loss=0.0028, acc=0.9921, iter_time=7.61s]
Epoch 0: 10%|▉ | 1188/12384 [2:31:27<23:43:35, 7.63s/it, loss=0.0047, acc=0.9948, iter_time=7.62s]
Epoch 0: 10%|▉ | 1189/12384 [2:31:27<23:43:00, 7.63s/it, loss=0.0047, acc=0.9948, iter_time=7.62s]
Epoch 0: 10%|▉ | 1189/12384 [2:31:35<23:43:00, 7.63s/it, loss=0.0006, acc=0.9994, iter_time=5.28s]
Epoch 0: 10%|▉ | 1190/12384 [2:31:35<23:40:29, 7.61s/it, loss=0.0006, acc=0.9994, iter_time=5.28s]
Epoch 0: 10%|▉ | 1190/12384 [2:31:42<23:40:29, 7.61s/it, loss=0.0020, acc=0.9951, iter_time=9.92s]
Epoch 0: 10%|▉ | 1191/12384 [2:31:42<23:39:26, 7.61s/it, loss=0.0020, acc=0.9951, iter_time=9.92s]
Epoch 0: 10%|▉ | 1191/12384 [2:31:50<23:39:26, 7.61s/it, loss=0.0023, acc=0.9951, iter_time=8.06s]
Epoch 0: 10%|▉ | 1192/12384 [2:31:50<24:00:01, 7.72s/it, loss=0.0023, acc=0.9951, iter_time=8.06s]
Epoch 0: 10%|▉ | 1192/12384 [2:31:58<24:00:01, 7.72s/it, loss=0.0045, acc=0.9959, iter_time=6.07s]
Epoch 0: 10%|▉ | 1193/12384 [2:31:58<23:58:48, 7.71s/it, loss=0.0045, acc=0.9959, iter_time=6.07s]
Epoch 0: 10%|▉ | 1193/12384 [2:32:05<23:58:48, 7.71s/it, loss=0.0011, acc=0.9997, iter_time=7.63s]
Epoch 0: 10%|▉ | 1194/12384 [2:32:05<23:52:38, 7.68s/it, loss=0.0011, acc=0.9997, iter_time=7.63s]
Epoch 0: 10%|▉ | 1194/12384 [2:32:13<23:52:38, 7.68s/it, loss=0.0057, acc=0.9909, iter_time=9.11s]
Epoch 0: 10%|▉ | 1195/12384 [2:32:13<23:48:06, 7.66s/it, loss=0.0057, acc=0.9909, iter_time=9.11s]
Epoch 0: 10%|▉ | 1195/12384 [2:32:21<23:48:06, 7.66s/it, loss=0.0006, acc=0.9986, iter_time=4.74s]
Epoch 0: 10%|▉ | 1196/12384 [2:32:21<23:44:32, 7.64s/it, loss=0.0006, acc=0.9986, iter_time=4.74s]
Epoch 0: 10%|▉ | 1196/12384 [2:32:28<23:44:32, 7.64s/it, loss=0.0021, acc=0.9961, iter_time=7.94s]
Epoch 0: 10%|▉ | 1197/12384 [2:32:28<23:41:37, 7.62s/it, loss=0.0021, acc=0.9961, iter_time=7.94s]
Epoch 0: 10%|▉ | 1197/12384 [2:32:36<23:41:37, 7.62s/it, loss=0.0096, acc=0.9871, iter_time=8.38s]
Epoch 0: 10%|▉ | 1198/12384 [2:32:36<23:41:37, 7.63s/it, loss=0.0096, acc=0.9871, iter_time=8.38s]
Epoch 0: 10%|▉ | 1198/12384 [2:32:43<23:41:37, 7.63s/it, loss=0.0017, acc=0.9974, iter_time=9.35s]
Epoch 0: 10%|▉ | 1199/12384 [2:32:43<23:41:02, 7.62s/it, loss=0.0017, acc=0.9974, iter_time=9.35s]
Epoch 0: 10%|▉ | 1199/12384 [2:32:51<23:41:02, 7.62s/it, loss=0.0046, acc=0.9872, iter_time=8.01s]
Epoch 0: 10%|▉ | 1200/12384 [2:32:51<23:38:52, 7.61s/it, loss=0.0046, acc=0.9872, iter_time=8.01s]
Epoch 0: 10%|▉ | 1200/12384 [2:32:59<23:38:52, 7.61s/it, loss=0.0009, acc=0.9962, iter_time=3.02s]
Epoch 0: 10%|▉ | 1201/12384 [2:32:59<23:35:57, 7.60s/it, loss=0.0009, acc=0.9962, iter_time=3.02s]
Epoch 0: 10%|▉ | 1201/12384 [2:33:06<23:35:57, 7.60s/it, loss=0.0046, acc=0.9904, iter_time=8.15s]
Epoch 0: 10%|▉ | 1202/12384 [2:33:06<23:41:37, 7.63s/it, loss=0.0046, acc=0.9904, iter_time=8.15s]
Epoch 0: 10%|▉ | 1202/12384 [2:33:14<23:41:37, 7.63s/it, loss=0.0036, acc=0.9887, iter_time=11.29s]
Epoch 0: 10%|▉ | 1203/12384 [2:33:14<23:41:38, 7.63s/it, loss=0.0036, acc=0.9887, iter_time=11.29s]
Epoch 0: 10%|▉ | 1203/12384 [2:33:22<23:41:38, 7.63s/it, loss=0.0030, acc=0.9949, iter_time=5.34s]
Epoch 0: 10%|▉ | 1204/12384 [2:33:22<23:40:38, 7.62s/it, loss=0.0030, acc=0.9949, iter_time=5.34s]
Epoch 0: 10%|▉ | 1204/12384 [2:33:29<23:40:38, 7.62s/it, loss=0.0010, acc=0.9977, iter_time=7.05s]
Epoch 0: 10%|▉ | 1205/12384 [2:33:29<23:38:40, 7.61s/it, loss=0.0010, acc=0.9977, iter_time=7.05s]
Epoch 0: 10%|▉ | 1205/12384 [2:33:37<23:38:40, 7.61s/it, loss=0.0027, acc=0.9942, iter_time=10.44s]
Epoch 0: 10%|▉ | 1206/12384 [2:33:37<23:37:57, 7.61s/it, loss=0.0027, acc=0.9942, iter_time=10.44s]
Epoch 0: 10%|▉ | 1206/12384 [2:33:44<23:37:57, 7.61s/it, loss=0.0029, acc=0.9955, iter_time=7.63s]
Epoch 0: 10%|▉ | 1207/12384 [2:33:44<23:37:48, 7.61s/it, loss=0.0029, acc=0.9955, iter_time=7.63s]
Epoch 0: 10%|▉ | 1207/12384 [2:33:52<23:37:48, 7.61s/it, loss=0.0036, acc=0.9897, iter_time=8.00s]
Epoch 0: 10%|▉ | 1208/12384 [2:33:52<23:37:05, 7.61s/it, loss=0.0036, acc=0.9897, iter_time=8.00s]
Epoch 0: 10%|▉ | 1208/12384 [2:34:00<23:37:05, 7.61s/it, loss=0.0008, acc=0.9981, iter_time=7.20s]
Epoch 0: 10%|▉ | 1209/12384 [2:34:00<23:37:46, 7.61s/it, loss=0.0008, acc=0.9981, iter_time=7.20s]
Epoch 0: 10%|▉ | 1209/12384 [2:34:07<23:37:46, 7.61s/it, loss=0.0037, acc=0.9939, iter_time=7.63s]
Epoch 0: 10%|▉ | 1210/12384 [2:34:07<23:37:23, 7.61s/it, loss=0.0037, acc=0.9939, iter_time=7.63s]
Epoch 0: 10%|▉ | 1210/12384 [2:34:15<23:37:23, 7.61s/it, loss=0.0050, acc=0.9901, iter_time=7.62s]
Epoch 0: 10%|▉ | 1211/12384 [2:34:15<23:36:57, 7.61s/it, loss=0.0050, acc=0.9901, iter_time=7.62s]
Epoch 0: 10%|▉ | 1211/12384 [2:34:22<23:36:57, 7.61s/it, loss=0.0014, acc=0.9969, iter_time=7.60s]
Epoch 0: 10%|▉ | 1212/12384 [2:34:22<23:36:38, 7.61s/it, loss=0.0014, acc=0.9969, iter_time=7.60s]
Epoch 0: 10%|▉ | 1212/12384 [2:34:30<23:36:38, 7.61s/it, loss=0.0008, acc=0.9986, iter_time=7.60s]
Epoch 0: 10%|▉ | 1213/12384 [2:34:30<23:36:11, 7.61s/it, loss=0.0008, acc=0.9986, iter_time=7.60s]
Epoch 0: 10%|▉ | 1213/12384 [2:34:38<23:36:11, 7.61s/it, loss=0.0086, acc=0.9859, iter_time=4.03s]
Epoch 0: 10%|▉ | 1214/12384 [2:34:38<23:55:57, 7.71s/it, loss=0.0086, acc=0.9859, iter_time=4.03s]
Epoch 0: 10%|▉ | 1214/12384 [2:34:46<23:55:57, 7.71s/it, loss=0.0025, acc=0.9962, iter_time=9.43s]
Epoch 0: 10%|▉ | 1215/12384 [2:34:46<23:49:47, 7.68s/it, loss=0.0025, acc=0.9962, iter_time=9.43s]
Epoch 0: 10%|▉ | 1215/12384 [2:34:53<23:49:47, 7.68s/it, loss=0.0025, acc=0.9972, iter_time=9.85s]
Epoch 0: 10%|▉ | 1216/12384 [2:34:53<23:46:58, 7.67s/it, loss=0.0025, acc=0.9972, iter_time=9.85s]
Epoch 0: 10%|▉ | 1216/12384 [2:35:01<23:46:58, 7.67s/it, loss=0.0047, acc=0.9911, iter_time=5.14s]
Epoch 0: 10%|▉ | 1217/12384 [2:35:01<23:44:23, 7.65s/it, loss=0.0047, acc=0.9911, iter_time=5.14s]
Epoch 0: 10%|▉ | 1217/12384 [2:35:09<23:44:23, 7.65s/it, loss=0.0006, acc=1.0000, iter_time=10.01s]
Epoch 0: 10%|▉ | 1218/12384 [2:35:09<24:01:14, 7.74s/it, loss=0.0006, acc=1.0000, iter_time=10.01s]
Epoch 0: 10%|▉ | 1218/12384 [2:35:16<24:01:14, 7.74s/it, loss=0.0005, acc=0.9992, iter_time=7.91s]
Epoch 0: 10%|▉ | 1219/12384 [2:35:16<23:53:07, 7.70s/it, loss=0.0005, acc=0.9992, iter_time=7.91s]
Epoch 0: 10%|▉ | 1219/12384 [2:35:24<23:53:07, 7.70s/it, loss=0.0035, acc=0.9884, iter_time=5.50s]
Epoch 0: 10%|▉ | 1220/12384 [2:35:24<23:52:00, 7.70s/it, loss=0.0035, acc=0.9884, iter_time=5.50s]
Epoch 0: 10%|▉ | 1220/12384 [2:35:32<23:52:00, 7.70s/it, loss=0.0015, acc=0.9915, iter_time=9.77s]
Epoch 0: 10%|▉ | 1221/12384 [2:35:32<23:46:25, 7.67s/it, loss=0.0015, acc=0.9915, iter_time=9.77s]
Epoch 0: 10%|▉ | 1221/12384 [2:35:39<23:46:25, 7.67s/it, loss=0.0010, acc=0.9999, iter_time=7.61s]
Epoch 0: 10%|▉ | 1222/12384 [2:35:39<23:42:45, 7.65s/it, loss=0.0010, acc=0.9999, iter_time=7.61s]
Epoch 0: 10%|▉ | 1222/12384 [2:35:47<23:42:45, 7.65s/it, loss=0.0045, acc=0.9887, iter_time=5.62s]
Epoch 0: 10%|▉ | 1223/12384 [2:35:47<23:40:22, 7.64s/it, loss=0.0045, acc=0.9887, iter_time=5.62s]
Epoch 0: 10%|▉ | 1223/12384 [2:35:55<23:40:22, 7.64s/it, loss=0.0046, acc=0.9916, iter_time=9.98s]
Epoch 0: 10%|▉ | 1224/12384 [2:35:55<23:38:53, 7.63s/it, loss=0.0046, acc=0.9916, iter_time=9.98s]
Epoch 0: 10%|▉ | 1224/12384 [2:36:02<23:38:53, 7.63s/it, loss=0.0026, acc=0.9983, iter_time=7.24s]
Epoch 0: 10%|▉ | 1225/12384 [2:36:02<23:37:23, 7.62s/it, loss=0.0026, acc=0.9983, iter_time=7.24s]
Epoch 0: 10%|▉ | 1225/12384 [2:36:10<23:37:23, 7.62s/it, loss=0.0012, acc=0.9985, iter_time=7.65s]
Epoch 0: 10%|▉ | 1226/12384 [2:36:10<23:38:59, 7.63s/it, loss=0.0012, acc=0.9985, iter_time=7.65s]
Epoch 0: 10%|▉ | 1226/12384 [2:36:17<23:38:59, 7.63s/it, loss=0.0017, acc=0.9919, iter_time=7.59s]
Epoch 0: 10%|▉ | 1227/12384 [2:36:17<23:36:34, 7.62s/it, loss=0.0017, acc=0.9919, iter_time=7.59s]
Epoch 0: 10%|▉ | 1227/12384 [2:36:25<23:36:34, 7.62s/it, loss=0.0050, acc=0.9953, iter_time=5.51s]
Epoch 0: 10%|▉ | 1228/12384 [2:36:25<23:37:00, 7.62s/it, loss=0.0050, acc=0.9953, iter_time=5.51s]
Epoch 0: 10%|▉ | 1228/12384 [2:36:33<23:37:00, 7.62s/it, loss=0.0035, acc=0.9960, iter_time=8.19s]
Epoch 0: 10%|▉ | 1229/12384 [2:36:33<23:37:34, 7.62s/it, loss=0.0035, acc=0.9960, iter_time=8.19s]
Epoch 0: 10%|▉ | 1229/12384 [2:36:40<23:37:34, 7.62s/it, loss=0.0022, acc=0.9935, iter_time=9.15s]
Epoch 0: 10%|▉ | 1230/12384 [2:36:40<23:35:27, 7.61s/it, loss=0.0022, acc=0.9935, iter_time=9.15s]
Epoch 0: 10%|▉ | 1230/12384 [2:36:48<23:35:27, 7.61s/it, loss=0.0004, acc=1.0000, iter_time=7.59s]
Epoch 0: 10%|▉ | 1231/12384 [2:36:48<23:34:47, 7.61s/it, loss=0.0004, acc=1.0000, iter_time=7.59s]
Epoch 0: 10%|▉ | 1231/12384 [2:36:55<23:34:47, 7.61s/it, loss=0.0009, acc=0.9971, iter_time=8.02s]
Epoch 0: 10%|▉ | 1232/12384 [2:36:55<23:34:33, 7.61s/it, loss=0.0009, acc=0.9971, iter_time=8.02s]
Epoch 0: 10%|▉ | 1232/12384 [2:37:03<23:34:33, 7.61s/it, loss=0.0058, acc=0.9894, iter_time=6.55s]
Epoch 0: 10%|▉ | 1233/12384 [2:37:03<23:34:02, 7.61s/it, loss=0.0058, acc=0.9894, iter_time=6.55s]
Epoch 0: 10%|▉ | 1233/12384 [2:37:11<23:34:02, 7.61s/it, loss=0.0028, acc=0.9957, iter_time=8.27s]
Epoch 0: 10%|▉ | 1234/12384 [2:37:11<23:34:37, 7.61s/it, loss=0.0028, acc=0.9957, iter_time=8.27s]
Epoch 0: 10%|▉ | 1234/12384 [2:37:18<23:34:37, 7.61s/it, loss=0.0018, acc=0.9926, iter_time=7.62s]
Epoch 0: 10%|▉ | 1235/12384 [2:37:18<23:34:42, 7.61s/it, loss=0.0018, acc=0.9926, iter_time=7.62s]
Epoch 0: 10%|▉ | 1235/12384 [2:37:26<23:34:42, 7.61s/it, loss=0.0026, acc=0.9932, iter_time=7.62s]
Epoch 0: 10%|▉ | 1236/12384 [2:37:26<23:33:53, 7.61s/it, loss=0.0026, acc=0.9932, iter_time=7.62s]
Epoch 0: 10%|▉ | 1236/12384 [2:37:33<23:33:53, 7.61s/it, loss=0.0009, acc=0.9973, iter_time=7.60s]
Epoch 0: 10%|▉ | 1237/12384 [2:37:33<23:34:30, 7.61s/it, loss=0.0009, acc=0.9973, iter_time=7.60s]
Epoch 0: 10%|▉ | 1237/12384 [2:37:41<23:34:30, 7.61s/it, loss=0.0013, acc=0.9989, iter_time=7.61s]
Epoch 0: 10%|▉ | 1238/12384 [2:37:41<23:33:50, 7.61s/it, loss=0.0013, acc=0.9989, iter_time=7.61s]
Epoch 0: 10%|▉ | 1238/12384 [2:37:49<23:33:50, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=4.31s]
Epoch 0: 10%|█ | 1239/12384 [2:37:49<23:33:02, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=4.31s]
Epoch 0: 10%|█ | 1239/12384 [2:37:56<23:33:02, 7.61s/it, loss=0.0028, acc=0.9905, iter_time=10.84s]
Epoch 0: 10%|█ | 1240/12384 [2:37:56<23:32:53, 7.61s/it, loss=0.0028, acc=0.9905, iter_time=10.84s]
Epoch 0: 10%|█ | 1240/12384 [2:38:04<23:32:53, 7.61s/it, loss=0.0017, acc=0.9968, iter_time=5.39s]
Epoch 0: 10%|█ | 1241/12384 [2:38:04<23:34:06, 7.61s/it, loss=0.0017, acc=0.9968, iter_time=5.39s]
Epoch 0: 10%|█ | 1241/12384 [2:38:12<23:34:06, 7.61s/it, loss=0.0018, acc=0.9977, iter_time=9.89s]
Epoch 0: 10%|█ | 1242/12384 [2:38:12<23:33:44, 7.61s/it, loss=0.0018, acc=0.9977, iter_time=9.89s]
Epoch 0: 10%|█ | 1242/12384 [2:38:19<23:33:44, 7.61s/it, loss=0.0013, acc=0.9955, iter_time=7.63s]
Epoch 0: 10%|█ | 1243/12384 [2:38:19<23:34:18, 7.62s/it, loss=0.0013, acc=0.9955, iter_time=7.63s]
Epoch 0: 10%|█ | 1243/12384 [2:38:27<23:34:18, 7.62s/it, loss=0.0013, acc=0.9978, iter_time=7.93s]
Epoch 0: 10%|█ | 1244/12384 [2:38:27<23:50:15, 7.70s/it, loss=0.0013, acc=0.9978, iter_time=7.93s]
Epoch 0: 10%|█ | 1244/12384 [2:38:35<23:50:15, 7.70s/it, loss=0.0019, acc=0.9973, iter_time=7.40s]
Epoch 0: 10%|█ | 1245/12384 [2:38:35<24:05:37, 7.79s/it, loss=0.0019, acc=0.9973, iter_time=7.40s]
Epoch 0: 10%|█ | 1245/12384 [2:38:43<24:05:37, 7.79s/it, loss=0.0016, acc=0.9977, iter_time=8.18s]
Epoch 0: 10%|█ | 1246/12384 [2:38:43<23:55:52, 7.73s/it, loss=0.0016, acc=0.9977, iter_time=8.18s]
Epoch 0: 10%|█ | 1246/12384 [2:38:50<23:55:52, 7.73s/it, loss=0.0052, acc=0.9893, iter_time=4.76s]
Epoch 0: 10%|█ | 1247/12384 [2:38:50<23:49:18, 7.70s/it, loss=0.0052, acc=0.9893, iter_time=4.76s]
Epoch 0: 10%|█ | 1247/12384 [2:38:58<23:49:18, 7.70s/it, loss=0.0005, acc=0.9991, iter_time=10.41s]
Epoch 0: 10%|█ | 1248/12384 [2:38:58<23:43:07, 7.67s/it, loss=0.0005, acc=0.9991, iter_time=10.41s]
Epoch 0: 10%|█ | 1248/12384 [2:39:05<23:43:07, 7.67s/it, loss=0.0011, acc=0.9984, iter_time=7.64s]
Epoch 0: 10%|█ | 1249/12384 [2:39:05<23:39:06, 7.65s/it, loss=0.0011, acc=0.9984, iter_time=7.64s]
Epoch 0: 10%|█ | 1249/12384 [2:39:13<23:39:06, 7.65s/it, loss=0.0049, acc=0.9874, iter_time=8.02s]
Epoch 0: 10%|█ | 1250/12384 [2:39:13<23:36:52, 7.64s/it, loss=0.0049, acc=0.9874, iter_time=8.02s]
Epoch 0: 10%|█ | 1250/12384 [2:39:21<23:36:52, 7.64s/it, loss=0.0012, acc=0.9988, iter_time=7.19s]
Epoch 0: 10%|█ | 1251/12384 [2:39:21<23:33:57, 7.62s/it, loss=0.0012, acc=0.9988, iter_time=7.19s]
Epoch 0: 10%|█ | 1251/12384 [2:39:28<23:33:57, 7.62s/it, loss=0.0021, acc=0.9985, iter_time=7.60s]
Epoch 0: 10%|█ | 1252/12384 [2:39:28<23:32:03, 7.61s/it, loss=0.0021, acc=0.9985, iter_time=7.60s]
Epoch 0: 10%|█ | 1252/12384 [2:39:36<23:32:03, 7.61s/it, loss=0.0024, acc=0.9948, iter_time=7.03s]
Epoch 0: 10%|█ | 1253/12384 [2:39:36<23:32:35, 7.61s/it, loss=0.0024, acc=0.9948, iter_time=7.03s]
Epoch 0: 10%|█ | 1253/12384 [2:39:43<23:32:35, 7.61s/it, loss=0.0023, acc=0.9969, iter_time=8.20s]
Epoch 0: 10%|█ | 1254/12384 [2:39:43<23:32:01, 7.61s/it, loss=0.0023, acc=0.9969, iter_time=8.20s]
Epoch 0: 10%|█ | 1254/12384 [2:39:51<23:32:01, 7.61s/it, loss=0.0039, acc=0.9939, iter_time=7.59s]
Epoch 0: 10%|█ | 1255/12384 [2:39:51<23:30:54, 7.61s/it, loss=0.0039, acc=0.9939, iter_time=7.59s]
Epoch 0: 10%|█ | 1255/12384 [2:39:59<23:30:54, 7.61s/it, loss=0.0047, acc=0.9950, iter_time=7.76s]
Epoch 0: 10%|█ | 1256/12384 [2:39:59<23:32:06, 7.61s/it, loss=0.0047, acc=0.9950, iter_time=7.76s]
Epoch 0: 10%|█ | 1256/12384 [2:40:06<23:32:06, 7.61s/it, loss=0.0023, acc=0.9920, iter_time=7.45s]
Epoch 0: 10%|█ | 1257/12384 [2:40:06<23:32:03, 7.61s/it, loss=0.0023, acc=0.9920, iter_time=7.45s]
Epoch 0: 10%|█ | 1257/12384 [2:40:14<23:32:03, 7.61s/it, loss=0.0018, acc=0.9976, iter_time=6.52s]
Epoch 0: 10%|█ | 1258/12384 [2:40:14<23:32:26, 7.62s/it, loss=0.0018, acc=0.9976, iter_time=6.52s]
Epoch 0: 10%|█ | 1258/12384 [2:40:22<23:32:26, 7.62s/it, loss=0.0065, acc=0.9937, iter_time=8.73s]
Epoch 0: 10%|█ | 1259/12384 [2:40:22<23:30:55, 7.61s/it, loss=0.0065, acc=0.9937, iter_time=8.73s]
Epoch 0: 10%|█ | 1259/12384 [2:40:29<23:30:55, 7.61s/it, loss=0.0008, acc=0.9995, iter_time=6.99s]
Epoch 0: 10%|█ | 1260/12384 [2:40:29<23:31:47, 7.61s/it, loss=0.0008, acc=0.9995, iter_time=6.99s]
Epoch 0: 10%|█ | 1260/12384 [2:40:37<23:31:47, 7.61s/it, loss=0.0020, acc=0.9966, iter_time=8.23s]
Epoch 0: 10%|█ | 1261/12384 [2:40:37<23:29:59, 7.61s/it, loss=0.0020, acc=0.9966, iter_time=8.23s]
Epoch 0: 10%|█ | 1261/12384 [2:40:44<23:29:59, 7.61s/it, loss=0.0031, acc=0.9925, iter_time=7.62s]
Epoch 0: 10%|█ | 1262/12384 [2:40:44<23:31:01, 7.61s/it, loss=0.0031, acc=0.9925, iter_time=7.62s]
Epoch 0: 10%|█ | 1262/12384 [2:40:52<23:31:01, 7.61s/it, loss=0.0014, acc=0.9984, iter_time=7.62s]
Epoch 0: 10%|█ | 1263/12384 [2:40:52<23:31:46, 7.62s/it, loss=0.0014, acc=0.9984, iter_time=7.62s]
Epoch 0: 10%|█ | 1263/12384 [2:41:00<23:31:46, 7.62s/it, loss=0.0015, acc=0.9957, iter_time=7.71s]
Epoch 0: 10%|█ | 1264/12384 [2:41:00<23:31:04, 7.61s/it, loss=0.0015, acc=0.9957, iter_time=7.71s]
Epoch 0: 10%|█ | 1264/12384 [2:41:07<23:31:04, 7.61s/it, loss=0.0033, acc=0.9949, iter_time=7.50s]
Epoch 0: 10%|█ | 1265/12384 [2:41:07<23:30:20, 7.61s/it, loss=0.0033, acc=0.9949, iter_time=7.50s]
Epoch 0: 10%|█ | 1265/12384 [2:41:15<23:30:20, 7.61s/it, loss=0.0019, acc=0.9945, iter_time=7.63s]
Epoch 0: 10%|█ | 1266/12384 [2:41:15<23:30:19, 7.61s/it, loss=0.0019, acc=0.9945, iter_time=7.63s]
Epoch 0: 10%|█ | 1266/12384 [2:41:22<23:30:19, 7.61s/it, loss=0.0023, acc=0.9921, iter_time=4.99s]
Epoch 0: 10%|█ | 1267/12384 [2:41:22<23:30:33, 7.61s/it, loss=0.0023, acc=0.9921, iter_time=4.99s]
Epoch 0: 10%|█ | 1267/12384 [2:41:30<23:30:33, 7.61s/it, loss=0.0022, acc=0.9947, iter_time=10.22s]
Epoch 0: 10%|█ | 1268/12384 [2:41:30<23:30:43, 7.61s/it, loss=0.0022, acc=0.9947, iter_time=10.22s]
Epoch 0: 10%|█ | 1268/12384 [2:41:38<23:30:43, 7.61s/it, loss=0.0020, acc=0.9968, iter_time=7.62s]
Epoch 0: 10%|█ | 1269/12384 [2:41:38<23:30:20, 7.61s/it, loss=0.0020, acc=0.9968, iter_time=7.62s]
Epoch 0: 10%|█ | 1269/12384 [2:41:45<23:30:20, 7.61s/it, loss=0.0016, acc=0.9966, iter_time=7.64s]
Epoch 0: 10%|█ | 1270/12384 [2:41:45<23:30:32, 7.61s/it, loss=0.0016, acc=0.9966, iter_time=7.64s]
Epoch 0: 10%|█ | 1270/12384 [2:41:53<23:30:32, 7.61s/it, loss=0.0022, acc=0.9949, iter_time=7.99s]
Epoch 0: 10%|█ | 1271/12384 [2:41:53<23:51:56, 7.73s/it, loss=0.0022, acc=0.9949, iter_time=7.99s]
Epoch 0: 10%|█ | 1271/12384 [2:42:01<23:51:56, 7.73s/it, loss=0.0111, acc=0.9800, iter_time=7.99s]
Epoch 0: 10%|█ | 1272/12384 [2:42:01<23:45:09, 7.70s/it, loss=0.0111, acc=0.9800, iter_time=7.99s]
Epoch 0: 10%|█ | 1272/12384 [2:42:09<23:45:09, 7.70s/it, loss=0.0036, acc=0.9902, iter_time=7.22s]
Epoch 0: 10%|█ | 1273/12384 [2:42:09<23:40:47, 7.67s/it, loss=0.0036, acc=0.9902, iter_time=7.22s]
Epoch 0: 10%|█ | 1273/12384 [2:42:16<23:40:47, 7.67s/it, loss=0.0007, acc=0.9990, iter_time=7.63s]
Epoch 0: 10%|█ | 1274/12384 [2:42:16<23:36:34, 7.65s/it, loss=0.0007, acc=0.9990, iter_time=7.63s]
Epoch 0: 10%|█ | 1274/12384 [2:42:24<23:36:34, 7.65s/it, loss=0.0225, acc=0.9629, iter_time=7.59s]
Epoch 0: 10%|█ | 1275/12384 [2:42:24<23:34:47, 7.64s/it, loss=0.0225, acc=0.9629, iter_time=7.59s]
Epoch 0: 10%|█ | 1275/12384 [2:42:31<23:34:47, 7.64s/it, loss=0.0045, acc=0.9963, iter_time=7.61s]
Epoch 0: 10%|█ | 1276/12384 [2:42:31<23:33:23, 7.63s/it, loss=0.0045, acc=0.9963, iter_time=7.61s]
Epoch 0: 10%|█ | 1276/12384 [2:42:39<23:33:23, 7.63s/it, loss=0.0020, acc=0.9943, iter_time=7.64s]
Epoch 0: 10%|█ | 1277/12384 [2:42:39<23:32:33, 7.63s/it, loss=0.0020, acc=0.9943, iter_time=7.64s]
Epoch 0: 10%|█ | 1277/12384 [2:42:47<23:32:33, 7.63s/it, loss=0.0007, acc=0.9991, iter_time=5.61s]
Epoch 0: 10%|█ | 1278/12384 [2:42:47<23:28:53, 7.61s/it, loss=0.0007, acc=0.9991, iter_time=5.61s]
Epoch 0: 10%|█ | 1278/12384 [2:42:54<23:28:53, 7.61s/it, loss=0.0024, acc=0.9970, iter_time=9.58s]
Epoch 0: 10%|█ | 1279/12384 [2:42:54<23:28:12, 7.61s/it, loss=0.0024, acc=0.9970, iter_time=9.58s]
Epoch 0: 10%|█ | 1279/12384 [2:43:02<23:28:12, 7.61s/it, loss=0.0004, acc=0.9998, iter_time=7.55s]
Epoch 0: 10%|█ | 1280/12384 [2:43:02<23:28:28, 7.61s/it, loss=0.0004, acc=0.9998, iter_time=7.55s]
Epoch 0: 10%|█ | 1280/12384 [2:43:09<23:28:28, 7.61s/it, loss=0.0019, acc=0.9980, iter_time=6.42s]
Epoch 0: 10%|█ | 1281/12384 [2:43:09<23:28:53, 7.61s/it, loss=0.0019, acc=0.9980, iter_time=6.42s]
Epoch 0: 10%|█ | 1281/12384 [2:43:17<23:28:53, 7.61s/it, loss=0.0369, acc=0.9466, iter_time=8.87s]
Epoch 0: 10%|█ | 1282/12384 [2:43:17<23:28:42, 7.61s/it, loss=0.0369, acc=0.9466, iter_time=8.87s]
Epoch 0: 10%|█ | 1282/12384 [2:43:25<23:28:42, 7.61s/it, loss=0.0005, acc=0.9993, iter_time=5.52s]
Epoch 0: 10%|█ | 1283/12384 [2:43:25<23:29:16, 7.62s/it, loss=0.0005, acc=0.9993, iter_time=5.52s]
Epoch 0: 10%|█ | 1283/12384 [2:43:32<23:29:16, 7.62s/it, loss=0.0015, acc=0.9951, iter_time=9.70s]
Epoch 0: 10%|█ | 1284/12384 [2:43:32<23:29:57, 7.62s/it, loss=0.0015, acc=0.9951, iter_time=9.70s]
Epoch 0: 10%|█ | 1284/12384 [2:43:40<23:29:57, 7.62s/it, loss=0.0039, acc=0.9940, iter_time=4.32s]
Epoch 0: 10%|█ | 1285/12384 [2:43:40<23:29:38, 7.62s/it, loss=0.0039, acc=0.9940, iter_time=4.32s]
Epoch 0: 10%|█ | 1285/12384 [2:43:47<23:29:38, 7.62s/it, loss=0.0009, acc=1.0000, iter_time=10.90s]
Epoch 0: 10%|█ | 1286/12384 [2:43:47<23:29:06, 7.62s/it, loss=0.0009, acc=1.0000, iter_time=10.90s]
Epoch 0: 10%|█ | 1286/12384 [2:43:55<23:29:06, 7.62s/it, loss=0.0007, acc=0.9979, iter_time=7.33s]
Epoch 0: 10%|█ | 1287/12384 [2:43:55<23:29:09, 7.62s/it, loss=0.0007, acc=0.9979, iter_time=7.33s]
Epoch 0: 10%|█ | 1287/12384 [2:44:03<23:29:09, 7.62s/it, loss=0.0016, acc=0.9954, iter_time=7.90s]
Epoch 0: 10%|█ | 1288/12384 [2:44:03<23:29:08, 7.62s/it, loss=0.0016, acc=0.9954, iter_time=7.90s]
Epoch 0: 10%|█ | 1288/12384 [2:44:10<23:29:08, 7.62s/it, loss=0.0016, acc=0.9969, iter_time=7.65s]
Epoch 0: 10%|█ | 1289/12384 [2:44:10<23:27:59, 7.61s/it, loss=0.0016, acc=0.9969, iter_time=7.65s]
Epoch 0: 10%|█ | 1289/12384 [2:44:18<23:27:59, 7.61s/it, loss=0.0032, acc=0.9954, iter_time=7.62s]
Epoch 0: 10%|█ | 1290/12384 [2:44:18<23:27:41, 7.61s/it, loss=0.0032, acc=0.9954, iter_time=7.62s]
Epoch 0: 10%|█ | 1290/12384 [2:44:26<23:27:41, 7.61s/it, loss=0.0005, acc=0.9983, iter_time=5.26s]
Epoch 0: 10%|█ | 1291/12384 [2:44:26<23:27:58, 7.62s/it, loss=0.0005, acc=0.9983, iter_time=5.26s]
Epoch 0: 10%|█ | 1291/12384 [2:44:33<23:27:58, 7.62s/it, loss=0.0016, acc=0.9966, iter_time=9.95s]
Epoch 0: 10%|█ | 1292/12384 [2:44:33<23:27:27, 7.61s/it, loss=0.0016, acc=0.9966, iter_time=9.95s]
Epoch 0: 10%|█ | 1292/12384 [2:44:41<23:27:27, 7.61s/it, loss=0.0007, acc=0.9974, iter_time=7.62s]
Epoch 0: 10%|█ | 1293/12384 [2:44:41<23:26:17, 7.61s/it, loss=0.0007, acc=0.9974, iter_time=7.62s]
Epoch 0: 10%|█ | 1293/12384 [2:44:48<23:26:17, 7.61s/it, loss=0.0015, acc=0.9986, iter_time=6.39s]
Epoch 0: 10%|█ | 1294/12384 [2:44:48<23:26:23, 7.61s/it, loss=0.0015, acc=0.9986, iter_time=6.39s]
Epoch 0: 10%|█ | 1294/12384 [2:44:56<23:26:23, 7.61s/it, loss=0.0008, acc=0.9998, iter_time=8.83s]
Epoch 0: 10%|█ | 1295/12384 [2:44:56<23:26:15, 7.61s/it, loss=0.0008, acc=0.9998, iter_time=8.83s]
Epoch 0: 10%|█ | 1295/12384 [2:45:04<23:26:15, 7.61s/it, loss=0.0012, acc=0.9996, iter_time=7.56s]
Epoch 0: 10%|█ | 1296/12384 [2:45:04<23:26:53, 7.61s/it, loss=0.0012, acc=0.9996, iter_time=7.56s]
Epoch 0: 10%|█ | 1296/12384 [2:45:12<23:26:53, 7.61s/it, loss=0.0015, acc=0.9974, iter_time=7.68s]
Epoch 0: 10%|█ | 1297/12384 [2:45:12<23:43:27, 7.70s/it, loss=0.0015, acc=0.9974, iter_time=7.68s]
Epoch 0: 10%|█ | 1297/12384 [2:45:19<23:43:27, 7.70s/it, loss=0.0013, acc=0.9978, iter_time=7.89s]
Epoch 0: 10%|█ | 1298/12384 [2:45:19<23:39:02, 7.68s/it, loss=0.0013, acc=0.9978, iter_time=7.89s]
Epoch 0: 10%|█ | 1298/12384 [2:45:27<23:39:02, 7.68s/it, loss=0.0009, acc=0.9982, iter_time=7.60s]
Epoch 0: 10%|█ | 1299/12384 [2:45:27<23:33:20, 7.65s/it, loss=0.0009, acc=0.9982, iter_time=7.60s]
Epoch 0: 10%|█ | 1299/12384 [2:45:34<23:33:20, 7.65s/it, loss=0.0009, acc=0.9992, iter_time=7.99s]
Epoch 0: 10%|█ | 1300/12384 [2:45:34<23:30:21, 7.63s/it, loss=0.0009, acc=0.9992, iter_time=7.99s]
Epoch 0: 10%|█ | 1300/12384 [2:45:42<23:30:21, 7.63s/it, loss=0.0020, acc=0.9980, iter_time=5.11s]
Epoch 0: 11%|█ | 1301/12384 [2:45:42<23:30:25, 7.64s/it, loss=0.0020, acc=0.9980, iter_time=5.11s]
Epoch 0: 11%|█ | 1301/12384 [2:45:50<23:30:25, 7.64s/it, loss=0.0049, acc=0.9890, iter_time=9.72s]
Epoch 0: 11%|█ | 1302/12384 [2:45:50<23:28:05, 7.62s/it, loss=0.0049, acc=0.9890, iter_time=9.72s]
Epoch 0: 11%|█ | 1302/12384 [2:45:57<23:28:05, 7.62s/it, loss=0.0027, acc=0.9934, iter_time=7.59s]
Epoch 0: 11%|█ | 1303/12384 [2:45:57<23:27:08, 7.62s/it, loss=0.0027, acc=0.9934, iter_time=7.59s]
Epoch 0: 11%|█ | 1303/12384 [2:46:05<23:27:08, 7.62s/it, loss=0.0018, acc=0.9936, iter_time=8.00s]
Epoch 0: 11%|█ | 1304/12384 [2:46:05<23:25:54, 7.61s/it, loss=0.0018, acc=0.9936, iter_time=8.00s]
Epoch 0: 11%|█ | 1304/12384 [2:46:12<23:25:54, 7.61s/it, loss=0.0009, acc=0.9979, iter_time=7.21s]
Epoch 0: 11%|█ | 1305/12384 [2:46:12<23:25:49, 7.61s/it, loss=0.0009, acc=0.9979, iter_time=7.21s]
Epoch 0: 11%|█ | 1305/12384 [2:46:20<23:25:49, 7.61s/it, loss=0.0008, acc=1.0000, iter_time=2.76s]
Epoch 0: 11%|█ | 1306/12384 [2:46:20<23:24:48, 7.61s/it, loss=0.0008, acc=1.0000, iter_time=2.76s]
Epoch 0: 11%|█ | 1306/12384 [2:46:28<23:24:48, 7.61s/it, loss=0.0011, acc=0.9978, iter_time=12.46s]
Epoch 0: 11%|█ | 1307/12384 [2:46:28<23:25:41, 7.61s/it, loss=0.0011, acc=0.9978, iter_time=12.46s]
Epoch 0: 11%|█ | 1307/12384 [2:46:35<23:25:41, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=7.63s]
Epoch 0: 11%|█ | 1308/12384 [2:46:35<23:24:58, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=7.63s]
Epoch 0: 11%|█ | 1308/12384 [2:46:43<23:24:58, 7.61s/it, loss=0.0027, acc=0.9928, iter_time=7.63s]
Epoch 0: 11%|█ | 1309/12384 [2:46:43<23:28:46, 7.63s/it, loss=0.0027, acc=0.9928, iter_time=7.63s]
Epoch 0: 11%|█ | 1309/12384 [2:46:51<23:28:46, 7.63s/it, loss=0.0017, acc=0.9961, iter_time=7.66s]
Epoch 0: 11%|█ | 1310/12384 [2:46:51<23:28:29, 7.63s/it, loss=0.0017, acc=0.9961, iter_time=7.66s]
Epoch 0: 11%|█ | 1310/12384 [2:46:58<23:28:29, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.64s]
Epoch 0: 11%|█ | 1311/12384 [2:46:58<23:27:19, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.64s]
Epoch 0: 11%|█ | 1311/12384 [2:47:06<23:27:19, 7.63s/it, loss=0.0025, acc=0.9940, iter_time=7.60s]
Epoch 0: 11%|█ | 1312/12384 [2:47:06<23:29:07, 7.64s/it, loss=0.0025, acc=0.9940, iter_time=7.60s]
Epoch 0: 11%|█ | 1312/12384 [2:47:13<23:29:07, 7.64s/it, loss=0.0020, acc=0.9995, iter_time=7.68s]
Epoch 0: 11%|█ | 1313/12384 [2:47:13<23:28:24, 7.63s/it, loss=0.0020, acc=0.9995, iter_time=7.68s]
Epoch 0: 11%|█ | 1313/12384 [2:47:21<23:28:24, 7.63s/it, loss=0.0014, acc=0.9957, iter_time=7.62s]
Epoch 0: 11%|█ | 1314/12384 [2:47:21<23:27:56, 7.63s/it, loss=0.0014, acc=0.9957, iter_time=7.62s]
Epoch 0: 11%|█ | 1314/12384 [2:47:29<23:27:56, 7.63s/it, loss=0.0013, acc=0.9971, iter_time=7.62s]
Epoch 0: 11%|█ | 1315/12384 [2:47:29<23:27:02, 7.63s/it, loss=0.0013, acc=0.9971, iter_time=7.62s]
Epoch 0: 11%|█ | 1315/12384 [2:47:36<23:27:02, 7.63s/it, loss=0.0030, acc=0.9905, iter_time=7.63s]
Epoch 0: 11%|█ | 1316/12384 [2:47:36<23:26:27, 7.62s/it, loss=0.0030, acc=0.9905, iter_time=7.63s]
Epoch 0: 11%|█ | 1316/12384 [2:47:44<23:26:27, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=6.65s]
Epoch 0: 11%|█ | 1317/12384 [2:47:44<23:25:15, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=6.65s]
Epoch 0: 11%|█ | 1317/12384 [2:47:51<23:25:15, 7.62s/it, loss=0.0026, acc=0.9941, iter_time=8.54s]
Epoch 0: 11%|█ | 1318/12384 [2:47:51<23:25:04, 7.62s/it, loss=0.0026, acc=0.9941, iter_time=8.54s]
Epoch 0: 11%|█ | 1318/12384 [2:47:59<23:25:04, 7.62s/it, loss=0.0006, acc=0.9979, iter_time=6.10s]
Epoch 0: 11%|█ | 1319/12384 [2:47:59<23:24:55, 7.62s/it, loss=0.0006, acc=0.9979, iter_time=6.10s]
Epoch 0: 11%|█ | 1319/12384 [2:48:07<23:24:55, 7.62s/it, loss=0.0041, acc=0.9955, iter_time=9.54s]
Epoch 0: 11%|█ | 1320/12384 [2:48:07<23:29:08, 7.64s/it, loss=0.0041, acc=0.9955, iter_time=9.54s]
Epoch 0: 11%|█ | 1320/12384 [2:48:14<23:29:08, 7.64s/it, loss=0.0032, acc=0.9970, iter_time=3.02s]
Epoch 0: 11%|█ | 1321/12384 [2:48:14<23:26:38, 7.63s/it, loss=0.0032, acc=0.9970, iter_time=3.02s]
Epoch 0: 11%|█ | 1321/12384 [2:48:22<23:26:38, 7.63s/it, loss=0.0053, acc=0.9919, iter_time=8.61s]
Epoch 0: 11%|█ | 1322/12384 [2:48:22<23:27:35, 7.63s/it, loss=0.0053, acc=0.9919, iter_time=8.61s]
Epoch 0: 11%|█ | 1322/12384 [2:48:30<23:27:35, 7.63s/it, loss=0.0019, acc=0.9962, iter_time=10.96s]
Epoch 0: 11%|█ | 1323/12384 [2:48:30<23:45:54, 7.73s/it, loss=0.0019, acc=0.9962, iter_time=10.96s]
Epoch 0: 11%|█ | 1323/12384 [2:48:38<23:45:54, 7.73s/it, loss=0.0037, acc=0.9948, iter_time=7.93s]
Epoch 0: 11%|█ | 1324/12384 [2:48:38<23:37:19, 7.69s/it, loss=0.0037, acc=0.9948, iter_time=7.93s]
Epoch 0: 11%|█ | 1324/12384 [2:48:45<23:37:19, 7.69s/it, loss=0.0020, acc=0.9962, iter_time=7.05s]
Epoch 0: 11%|█ | 1325/12384 [2:48:45<23:32:51, 7.67s/it, loss=0.0020, acc=0.9962, iter_time=7.05s]
Epoch 0: 11%|█ | 1325/12384 [2:48:53<23:32:51, 7.67s/it, loss=0.0021, acc=0.9964, iter_time=8.15s]
Epoch 0: 11%|█ | 1326/12384 [2:48:53<23:31:45, 7.66s/it, loss=0.0021, acc=0.9964, iter_time=8.15s]
Epoch 0: 11%|█ | 1326/12384 [2:49:01<23:31:45, 7.66s/it, loss=0.0052, acc=0.9894, iter_time=7.67s]
Epoch 0: 11%|█ | 1327/12384 [2:49:01<23:30:26, 7.65s/it, loss=0.0052, acc=0.9894, iter_time=7.67s]
Epoch 0: 11%|█ | 1327/12384 [2:49:08<23:30:26, 7.65s/it, loss=0.0020, acc=0.9931, iter_time=8.02s]
Epoch 0: 11%|█ | 1328/12384 [2:49:08<23:27:51, 7.64s/it, loss=0.0020, acc=0.9931, iter_time=8.02s]
Epoch 0: 11%|█ | 1328/12384 [2:49:16<23:27:51, 7.64s/it, loss=0.0016, acc=0.9981, iter_time=7.22s]
Epoch 0: 11%|█ | 1329/12384 [2:49:16<23:26:06, 7.63s/it, loss=0.0016, acc=0.9981, iter_time=7.22s]
Epoch 0: 11%|█ | 1329/12384 [2:49:23<23:26:06, 7.63s/it, loss=0.0021, acc=0.9969, iter_time=6.38s]
Epoch 0: 11%|█ | 1330/12384 [2:49:23<23:23:49, 7.62s/it, loss=0.0021, acc=0.9969, iter_time=6.38s]
Epoch 0: 11%|█ | 1330/12384 [2:49:31<23:23:49, 7.62s/it, loss=0.0037, acc=0.9956, iter_time=8.80s]
Epoch 0: 11%|█ | 1331/12384 [2:49:31<23:22:12, 7.61s/it, loss=0.0037, acc=0.9956, iter_time=8.80s]
Epoch 0: 11%|█ | 1331/12384 [2:49:39<23:22:12, 7.61s/it, loss=0.0016, acc=0.9969, iter_time=7.06s]
Epoch 0: 11%|█ | 1332/12384 [2:49:39<23:26:23, 7.64s/it, loss=0.0016, acc=0.9969, iter_time=7.06s]
Epoch 0: 11%|█ | 1332/12384 [2:49:46<23:26:23, 7.64s/it, loss=0.0007, acc=0.9974, iter_time=5.39s]
Epoch 0: 11%|█ | 1333/12384 [2:49:46<23:30:56, 7.66s/it, loss=0.0007, acc=0.9974, iter_time=5.39s]
Epoch 0: 11%|█ | 1333/12384 [2:49:54<23:30:56, 7.66s/it, loss=0.0004, acc=1.0000, iter_time=7.71s]
Epoch 0: 11%|█ | 1334/12384 [2:49:54<23:29:50, 7.66s/it, loss=0.0004, acc=1.0000, iter_time=7.71s]
Epoch 0: 11%|█ | 1334/12384 [2:50:02<23:29:50, 7.66s/it, loss=0.0008, acc=0.9973, iter_time=10.49s]
Epoch 0: 11%|█ | 1335/12384 [2:50:02<23:28:11, 7.65s/it, loss=0.0008, acc=0.9973, iter_time=10.49s]
Epoch 0: 11%|█ | 1335/12384 [2:50:09<23:28:11, 7.65s/it, loss=0.0017, acc=0.9960, iter_time=8.01s]
Epoch 0: 11%|█ | 1336/12384 [2:50:09<23:26:03, 7.64s/it, loss=0.0017, acc=0.9960, iter_time=8.01s]
Epoch 0: 11%|█ | 1336/12384 [2:50:17<23:26:03, 7.64s/it, loss=0.0070, acc=0.9884, iter_time=7.24s]
Epoch 0: 11%|█ | 1337/12384 [2:50:17<23:25:41, 7.63s/it, loss=0.0070, acc=0.9884, iter_time=7.24s]
Epoch 0: 11%|█ | 1337/12384 [2:50:24<23:25:41, 7.63s/it, loss=0.0004, acc=1.0000, iter_time=7.63s]
Epoch 0: 11%|█ | 1338/12384 [2:50:24<23:24:56, 7.63s/it, loss=0.0004, acc=1.0000, iter_time=7.63s]
Epoch 0: 11%|█ | 1338/12384 [2:50:32<23:24:56, 7.63s/it, loss=0.0011, acc=0.9981, iter_time=7.62s]
Epoch 0: 11%|█ | 1339/12384 [2:50:32<23:24:09, 7.63s/it, loss=0.0011, acc=0.9981, iter_time=7.62s]
Epoch 0: 11%|█ | 1339/12384 [2:50:40<23:24:09, 7.63s/it, loss=0.0010, acc=0.9997, iter_time=7.61s]
Epoch 0: 11%|█ | 1340/12384 [2:50:40<23:23:59, 7.63s/it, loss=0.0010, acc=0.9997, iter_time=7.61s]
Epoch 0: 11%|█ | 1340/12384 [2:50:47<23:23:59, 7.63s/it, loss=0.0023, acc=0.9934, iter_time=7.65s]
Epoch 0: 11%|█ | 1341/12384 [2:50:47<23:22:40, 7.62s/it, loss=0.0023, acc=0.9934, iter_time=7.65s]
Epoch 0: 11%|█ | 1341/12384 [2:50:55<23:22:40, 7.62s/it, loss=0.0029, acc=0.9939, iter_time=7.60s]
Epoch 0: 11%|█ | 1342/12384 [2:50:55<23:21:25, 7.62s/it, loss=0.0029, acc=0.9939, iter_time=7.60s]
Epoch 0: 11%|█ | 1342/12384 [2:51:03<23:21:25, 7.62s/it, loss=0.0016, acc=0.9969, iter_time=7.60s]
Epoch 0: 11%|█ | 1343/12384 [2:51:03<23:21:53, 7.62s/it, loss=0.0016, acc=0.9969, iter_time=7.60s]
Epoch 0: 11%|█ | 1343/12384 [2:51:10<23:21:53, 7.62s/it, loss=0.0019, acc=0.9928, iter_time=7.59s]
Epoch 0: 11%|█ | 1344/12384 [2:51:10<23:21:55, 7.62s/it, loss=0.0019, acc=0.9928, iter_time=7.59s]
Epoch 0: 11%|█ | 1344/12384 [2:51:18<23:21:55, 7.62s/it, loss=0.0014, acc=0.9959, iter_time=6.44s]
Epoch 0: 11%|█ | 1345/12384 [2:51:18<23:21:10, 7.62s/it, loss=0.0014, acc=0.9959, iter_time=6.44s]
Epoch 0: 11%|█ | 1345/12384 [2:51:25<23:21:10, 7.62s/it, loss=0.0055, acc=0.9839, iter_time=8.83s]
Epoch 0: 11%|█ | 1346/12384 [2:51:25<23:25:42, 7.64s/it, loss=0.0055, acc=0.9839, iter_time=8.83s]
Epoch 0: 11%|█ | 1346/12384 [2:51:33<23:25:42, 7.64s/it, loss=0.0010, acc=0.9984, iter_time=7.10s]
Epoch 0: 11%|█ | 1347/12384 [2:51:33<23:26:36, 7.65s/it, loss=0.0010, acc=0.9984, iter_time=7.10s]
Epoch 0: 11%|█ | 1347/12384 [2:51:41<23:26:36, 7.65s/it, loss=0.0010, acc=0.9986, iter_time=7.02s]
Epoch 0: 11%|█ | 1348/12384 [2:51:41<23:23:57, 7.63s/it, loss=0.0010, acc=0.9986, iter_time=7.02s]
Epoch 0: 11%|█ | 1348/12384 [2:51:49<23:23:57, 7.63s/it, loss=0.0025, acc=0.9925, iter_time=9.13s]
Epoch 0: 11%|█ | 1349/12384 [2:51:49<23:40:32, 7.72s/it, loss=0.0025, acc=0.9925, iter_time=9.13s]
Epoch 0: 11%|█ | 1349/12384 [2:51:56<23:40:32, 7.72s/it, loss=0.0016, acc=0.9970, iter_time=8.03s]
Epoch 0: 11%|█ | 1350/12384 [2:51:56<23:34:08, 7.69s/it, loss=0.0016, acc=0.9970, iter_time=8.03s]
Epoch 0: 11%|█ | 1350/12384 [2:52:04<23:34:08, 7.69s/it, loss=0.0139, acc=0.9784, iter_time=7.21s]
Epoch 0: 11%|█ | 1351/12384 [2:52:04<23:29:05, 7.66s/it, loss=0.0139, acc=0.9784, iter_time=7.21s]
Epoch 0: 11%|█ | 1351/12384 [2:52:11<23:29:05, 7.66s/it, loss=0.0064, acc=0.9920, iter_time=7.56s]
Epoch 0: 11%|█ | 1352/12384 [2:52:12<23:26:52, 7.65s/it, loss=0.0064, acc=0.9920, iter_time=7.56s]
Epoch 0: 11%|█ | 1352/12384 [2:52:19<23:26:52, 7.65s/it, loss=0.0010, acc=0.9994, iter_time=4.52s]
Epoch 0: 11%|█ | 1353/12384 [2:52:19<23:24:48, 7.64s/it, loss=0.0010, acc=0.9994, iter_time=4.52s]
Epoch 0: 11%|█ | 1353/12384 [2:52:27<23:24:48, 7.64s/it, loss=0.0004, acc=1.0000, iter_time=7.72s]
Epoch 0: 11%|█ | 1354/12384 [2:52:27<23:23:34, 7.64s/it, loss=0.0004, acc=1.0000, iter_time=7.72s]
Epoch 0: 11%|█ | 1354/12384 [2:52:34<23:23:34, 7.64s/it, loss=0.0012, acc=0.9980, iter_time=10.64s]
Epoch 0: 11%|█ | 1355/12384 [2:52:34<23:21:45, 7.63s/it, loss=0.0012, acc=0.9980, iter_time=10.64s]
Epoch 0: 11%|█ | 1355/12384 [2:52:42<23:21:45, 7.63s/it, loss=0.0018, acc=0.9979, iter_time=5.53s]
Epoch 0: 11%|█ | 1356/12384 [2:52:42<23:21:11, 7.62s/it, loss=0.0018, acc=0.9979, iter_time=5.53s]
Epoch 0: 11%|█ | 1356/12384 [2:52:50<23:21:11, 7.62s/it, loss=0.0031, acc=0.9924, iter_time=9.69s]
Epoch 0: 11%|█ | 1357/12384 [2:52:50<23:19:25, 7.61s/it, loss=0.0031, acc=0.9924, iter_time=9.69s]
Epoch 0: 11%|█ | 1357/12384 [2:52:57<23:19:25, 7.61s/it, loss=0.0009, acc=0.9971, iter_time=7.60s]
Epoch 0: 11%|█ | 1358/12384 [2:52:57<23:19:47, 7.62s/it, loss=0.0009, acc=0.9971, iter_time=7.60s]
Epoch 0: 11%|█ | 1358/12384 [2:53:05<23:19:47, 7.62s/it, loss=0.0016, acc=0.9977, iter_time=7.63s]
Epoch 0: 11%|█ | 1359/12384 [2:53:05<23:18:07, 7.61s/it, loss=0.0016, acc=0.9977, iter_time=7.63s]
Epoch 0: 11%|█ | 1359/12384 [2:53:12<23:18:07, 7.61s/it, loss=0.0009, acc=0.9981, iter_time=7.98s]
Epoch 0: 11%|█ | 1360/12384 [2:53:12<23:17:48, 7.61s/it, loss=0.0009, acc=0.9981, iter_time=7.98s]
Epoch 0: 11%|█ | 1360/12384 [2:53:20<23:17:48, 7.61s/it, loss=0.0042, acc=0.9899, iter_time=7.22s]
Epoch 0: 11%|█ | 1361/12384 [2:53:20<23:18:43, 7.61s/it, loss=0.0042, acc=0.9899, iter_time=7.22s]
Epoch 0: 11%|█ | 1361/12384 [2:53:28<23:18:43, 7.61s/it, loss=0.0013, acc=0.9979, iter_time=7.62s]
Epoch 0: 11%|█ | 1362/12384 [2:53:28<23:18:28, 7.61s/it, loss=0.0013, acc=0.9979, iter_time=7.62s]
Epoch 0: 11%|█ | 1362/12384 [2:53:35<23:18:28, 7.61s/it, loss=0.0033, acc=0.9928, iter_time=7.37s]
Epoch 0: 11%|█ | 1363/12384 [2:53:35<23:18:33, 7.61s/it, loss=0.0033, acc=0.9928, iter_time=7.37s]
Epoch 0: 11%|█ | 1363/12384 [2:53:43<23:18:33, 7.61s/it, loss=0.0120, acc=0.9796, iter_time=7.88s]
Epoch 0: 11%|█ | 1364/12384 [2:53:43<23:17:58, 7.61s/it, loss=0.0120, acc=0.9796, iter_time=7.88s]
Epoch 0: 11%|█ | 1364/12384 [2:53:50<23:17:58, 7.61s/it, loss=0.0007, acc=0.9981, iter_time=7.59s]
Epoch 0: 11%|█ | 1365/12384 [2:53:50<23:16:52, 7.61s/it, loss=0.0007, acc=0.9981, iter_time=7.59s]
Epoch 0: 11%|█ | 1365/12384 [2:53:58<23:16:52, 7.61s/it, loss=0.0041, acc=0.9889, iter_time=7.65s]
Epoch 0: 11%|█ | 1366/12384 [2:53:58<23:19:13, 7.62s/it, loss=0.0041, acc=0.9889, iter_time=7.65s]
Epoch 0: 11%|█ | 1366/12384 [2:54:06<23:19:13, 7.62s/it, loss=0.0021, acc=0.9929, iter_time=5.80s]
Epoch 0: 11%|█ | 1367/12384 [2:54:06<23:22:44, 7.64s/it, loss=0.0021, acc=0.9929, iter_time=5.80s]
Epoch 0: 11%|█ | 1367/12384 [2:54:13<23:22:44, 7.64s/it, loss=0.0011, acc=0.9969, iter_time=9.87s]
Epoch 0: 11%|█ | 1368/12384 [2:54:13<23:21:35, 7.63s/it, loss=0.0011, acc=0.9969, iter_time=9.87s]
Epoch 0: 11%|█ | 1368/12384 [2:54:21<23:21:35, 7.63s/it, loss=0.0060, acc=0.9849, iter_time=7.25s]
Epoch 0: 11%|█ | 1369/12384 [2:54:21<23:20:26, 7.63s/it, loss=0.0060, acc=0.9849, iter_time=7.25s]
Epoch 0: 11%|█ | 1369/12384 [2:54:29<23:20:26, 7.63s/it, loss=0.0058, acc=0.9873, iter_time=7.60s]
Epoch 0: 11%|█ | 1370/12384 [2:54:29<23:18:20, 7.62s/it, loss=0.0058, acc=0.9873, iter_time=7.60s]
Epoch 0: 11%|█ | 1370/12384 [2:54:36<23:18:20, 7.62s/it, loss=0.0010, acc=0.9996, iter_time=7.61s]
Epoch 0: 11%|█ | 1371/12384 [2:54:36<23:18:49, 7.62s/it, loss=0.0010, acc=0.9996, iter_time=7.61s]
Epoch 0: 11%|█ | 1371/12384 [2:54:44<23:18:49, 7.62s/it, loss=0.0004, acc=0.9988, iter_time=7.61s]
Epoch 0: 11%|█ | 1372/12384 [2:54:44<23:18:27, 7.62s/it, loss=0.0004, acc=0.9988, iter_time=7.61s]
Epoch 0: 11%|█ | 1372/12384 [2:54:51<23:18:27, 7.62s/it, loss=0.0032, acc=0.9937, iter_time=5.54s]
Epoch 0: 11%|█ | 1373/12384 [2:54:51<23:16:31, 7.61s/it, loss=0.0032, acc=0.9937, iter_time=5.54s]
Epoch 0: 11%|█ | 1373/12384 [2:54:59<23:16:31, 7.61s/it, loss=0.0026, acc=0.9947, iter_time=9.92s]
Epoch 0: 11%|█ | 1374/12384 [2:54:59<23:29:33, 7.68s/it, loss=0.0026, acc=0.9947, iter_time=9.92s]
Epoch 0: 11%|█ | 1374/12384 [2:55:07<23:29:33, 7.68s/it, loss=0.0007, acc=0.9998, iter_time=7.57s]
Epoch 0: 11%|█ | 1375/12384 [2:55:07<23:25:18, 7.66s/it, loss=0.0007, acc=0.9998, iter_time=7.57s]
Epoch 0: 11%|█ | 1375/12384 [2:55:15<23:25:18, 7.66s/it, loss=0.0005, acc=0.9981, iter_time=8.08s]
Epoch 0: 11%|█ | 1376/12384 [2:55:15<23:40:24, 7.74s/it, loss=0.0005, acc=0.9981, iter_time=8.08s]
Epoch 0: 11%|█ | 1376/12384 [2:55:22<23:40:24, 7.74s/it, loss=0.0006, acc=0.9998, iter_time=4.86s]
Epoch 0: 11%|█ | 1377/12384 [2:55:22<23:33:40, 7.71s/it, loss=0.0006, acc=0.9998, iter_time=4.86s]
Epoch 0: 11%|█ | 1377/12384 [2:55:30<23:33:40, 7.71s/it, loss=0.0031, acc=0.9939, iter_time=10.25s]
Epoch 0: 11%|█ | 1378/12384 [2:55:30<23:28:59, 7.68s/it, loss=0.0031, acc=0.9939, iter_time=10.25s]
Epoch 0: 11%|█ | 1378/12384 [2:55:38<23:28:59, 7.68s/it, loss=0.0040, acc=0.9865, iter_time=7.61s]
Epoch 0: 11%|█ | 1379/12384 [2:55:38<23:24:33, 7.66s/it, loss=0.0040, acc=0.9865, iter_time=7.61s]
Epoch 0: 11%|█ | 1379/12384 [2:55:45<23:24:33, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=6.67s]
Epoch 0: 11%|█ | 1380/12384 [2:55:45<23:22:11, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=6.67s]
Epoch 0: 11%|█ | 1380/12384 [2:55:53<23:22:11, 7.65s/it, loss=0.0022, acc=0.9973, iter_time=8.55s]
Epoch 0: 11%|█ | 1381/12384 [2:55:53<23:20:26, 7.64s/it, loss=0.0022, acc=0.9973, iter_time=8.55s]
Epoch 0: 11%|█ | 1381/12384 [2:56:01<23:20:26, 7.64s/it, loss=0.0020, acc=0.9953, iter_time=5.32s]
Epoch 0: 11%|█ | 1382/12384 [2:56:01<23:19:44, 7.63s/it, loss=0.0020, acc=0.9953, iter_time=5.32s]
Epoch 0: 11%|█ | 1382/12384 [2:56:08<23:19:44, 7.63s/it, loss=0.0062, acc=0.9972, iter_time=9.69s]
Epoch 0: 11%|█ | 1383/12384 [2:56:08<23:18:45, 7.63s/it, loss=0.0062, acc=0.9972, iter_time=9.69s]
Epoch 0: 11%|█ | 1383/12384 [2:56:16<23:18:45, 7.63s/it, loss=0.0015, acc=0.9940, iter_time=8.22s]
Epoch 0: 11%|█ | 1384/12384 [2:56:16<23:18:10, 7.63s/it, loss=0.0015, acc=0.9940, iter_time=8.22s]
Epoch 0: 11%|█ | 1384/12384 [2:56:23<23:18:10, 7.63s/it, loss=0.0016, acc=0.9972, iter_time=7.23s]
Epoch 0: 11%|█ | 1385/12384 [2:56:23<23:17:31, 7.62s/it, loss=0.0016, acc=0.9972, iter_time=7.23s]
Epoch 0: 11%|█ | 1385/12384 [2:56:31<23:17:31, 7.62s/it, loss=0.0006, acc=1.0000, iter_time=7.64s]
Epoch 0: 11%|█ | 1386/12384 [2:56:31<23:17:12, 7.62s/it, loss=0.0006, acc=1.0000, iter_time=7.64s]
Epoch 0: 11%|█ | 1386/12384 [2:56:39<23:17:12, 7.62s/it, loss=0.0016, acc=0.9959, iter_time=7.61s]
Epoch 0: 11%|█ | 1387/12384 [2:56:39<23:16:31, 7.62s/it, loss=0.0016, acc=0.9959, iter_time=7.61s]
Epoch 0: 11%|█ | 1387/12384 [2:56:46<23:16:31, 7.62s/it, loss=0.0025, acc=0.9940, iter_time=6.68s]
Epoch 0: 11%|█ | 1388/12384 [2:56:46<23:15:23, 7.61s/it, loss=0.0025, acc=0.9940, iter_time=6.68s]
Epoch 0: 11%|█ | 1388/12384 [2:56:54<23:15:23, 7.61s/it, loss=0.0030, acc=0.9934, iter_time=8.54s]
Epoch 0: 11%|█ | 1389/12384 [2:56:54<23:14:10, 7.61s/it, loss=0.0030, acc=0.9934, iter_time=8.54s]
Epoch 0: 11%|█ | 1389/12384 [2:57:01<23:14:10, 7.61s/it, loss=0.0059, acc=0.9835, iter_time=5.25s]
Epoch 0: 11%|█ | 1390/12384 [2:57:01<23:12:52, 7.60s/it, loss=0.0059, acc=0.9835, iter_time=5.25s]
Epoch 0: 11%|█ | 1390/12384 [2:57:09<23:12:52, 7.60s/it, loss=0.0015, acc=0.9946, iter_time=9.93s]
Epoch 0: 11%|█ | 1391/12384 [2:57:09<23:13:30, 7.61s/it, loss=0.0015, acc=0.9946, iter_time=9.93s]
Epoch 0: 11%|█ | 1391/12384 [2:57:17<23:13:30, 7.61s/it, loss=0.0062, acc=0.9859, iter_time=7.57s]
Epoch 0: 11%|█ | 1392/12384 [2:57:17<23:13:14, 7.61s/it, loss=0.0062, acc=0.9859, iter_time=7.57s]
Epoch 0: 11%|█ | 1392/12384 [2:57:24<23:13:14, 7.61s/it, loss=0.0007, acc=0.9968, iter_time=7.64s]
Epoch 0: 11%|█ | 1393/12384 [2:57:24<23:14:22, 7.61s/it, loss=0.0007, acc=0.9968, iter_time=7.64s]
Epoch 0: 11%|█ | 1393/12384 [2:57:32<23:14:22, 7.61s/it, loss=0.0012, acc=0.9957, iter_time=5.84s]
Epoch 0: 11%|█▏ | 1394/12384 [2:57:32<23:13:10, 7.61s/it, loss=0.0012, acc=0.9957, iter_time=5.84s]
Epoch 0: 11%|█▏ | 1394/12384 [2:57:39<23:13:10, 7.61s/it, loss=0.0013, acc=0.9985, iter_time=9.39s]
Epoch 0: 11%|█▏ | 1395/12384 [2:57:39<23:13:10, 7.61s/it, loss=0.0013, acc=0.9985, iter_time=9.39s]
Epoch 0: 11%|█▏ | 1395/12384 [2:57:47<23:13:10, 7.61s/it, loss=0.0034, acc=0.9940, iter_time=7.61s]
Epoch 0: 11%|█▏ | 1396/12384 [2:57:47<23:12:59, 7.61s/it, loss=0.0034, acc=0.9940, iter_time=7.61s]
Epoch 0: 11%|█▏ | 1396/12384 [2:57:55<23:12:59, 7.61s/it, loss=0.0015, acc=0.9980, iter_time=7.61s]
Epoch 0: 11%|█▏ | 1397/12384 [2:57:55<23:12:18, 7.60s/it, loss=0.0015, acc=0.9980, iter_time=7.61s]
Epoch 0: 11%|█▏ | 1397/12384 [2:58:02<23:12:18, 7.60s/it, loss=0.0027, acc=0.9903, iter_time=6.08s]
Epoch 0: 11%|█▏ | 1398/12384 [2:58:02<23:11:38, 7.60s/it, loss=0.0027, acc=0.9903, iter_time=6.08s]
Epoch 0: 11%|█▏ | 1398/12384 [2:58:10<23:11:38, 7.60s/it, loss=0.0011, acc=0.9960, iter_time=9.12s]
Epoch 0: 11%|█▏ | 1399/12384 [2:58:10<23:13:14, 7.61s/it, loss=0.0011, acc=0.9960, iter_time=9.12s]
Epoch 0: 11%|█▏ | 1399/12384 [2:58:17<23:13:14, 7.61s/it, loss=0.0052, acc=0.9938, iter_time=8.03s]
Epoch 0: 11%|█▏ | 1400/12384 [2:58:17<23:12:50, 7.61s/it, loss=0.0052, acc=0.9938, iter_time=8.03s]
Epoch 0: 11%|█▏ | 1400/12384 [2:58:25<23:12:50, 7.61s/it, loss=0.0023, acc=0.9899, iter_time=7.50s]
Epoch 0: 11%|█▏ | 1401/12384 [2:58:25<23:28:25, 7.69s/it, loss=0.0023, acc=0.9899, iter_time=7.50s]
Epoch 0: 11%|█▏ | 1401/12384 [2:58:33<23:28:25, 7.69s/it, loss=0.0024, acc=0.9952, iter_time=7.65s]
Epoch 0: 11%|█▏ | 1402/12384 [2:58:33<23:42:19, 7.77s/it, loss=0.0024, acc=0.9952, iter_time=7.65s]
Epoch 0: 11%|█▏ | 1402/12384 [2:58:41<23:42:19, 7.77s/it, loss=0.0015, acc=0.9975, iter_time=4.62s]
Epoch 0: 11%|█▏ | 1403/12384 [2:58:41<23:32:17, 7.72s/it, loss=0.0015, acc=0.9975, iter_time=4.62s]
Epoch 0: 11%|█▏ | 1403/12384 [2:58:49<23:32:17, 7.72s/it, loss=0.0007, acc=0.9989, iter_time=8.26s]
Epoch 0: 11%|█▏ | 1404/12384 [2:58:49<23:26:02, 7.68s/it, loss=0.0007, acc=0.9989, iter_time=8.26s]
Epoch 0: 11%|█▏ | 1404/12384 [2:58:56<23:26:02, 7.68s/it, loss=0.0010, acc=0.9986, iter_time=9.62s]
Epoch 0: 11%|█▏ | 1405/12384 [2:58:56<23:22:51, 7.67s/it, loss=0.0010, acc=0.9986, iter_time=9.62s]
Epoch 0: 11%|█▏ | 1405/12384 [2:59:04<23:22:51, 7.67s/it, loss=0.0004, acc=0.9995, iter_time=8.23s]
Epoch 0: 11%|█▏ | 1406/12384 [2:59:04<23:20:11, 7.65s/it, loss=0.0004, acc=0.9995, iter_time=8.23s]
Epoch 0: 11%|█▏ | 1406/12384 [2:59:11<23:20:11, 7.65s/it, loss=0.0011, acc=0.9982, iter_time=7.62s]
Epoch 0: 11%|█▏ | 1407/12384 [2:59:11<23:18:15, 7.64s/it, loss=0.0011, acc=0.9982, iter_time=7.62s]
Epoch 0: 11%|█▏ | 1407/12384 [2:59:19<23:18:15, 7.64s/it, loss=0.0006, acc=1.0000, iter_time=8.02s]
Epoch 0: 11%|█▏ | 1408/12384 [2:59:19<23:21:40, 7.66s/it, loss=0.0006, acc=1.0000, iter_time=8.02s]
Epoch 0: 11%|█▏ | 1408/12384 [2:59:27<23:21:40, 7.66s/it, loss=0.0033, acc=0.9934, iter_time=7.32s]
Epoch 0: 11%|█▏ | 1409/12384 [2:59:27<23:18:46, 7.65s/it, loss=0.0033, acc=0.9934, iter_time=7.32s]
Epoch 0: 11%|█▏ | 1409/12384 [2:59:34<23:18:46, 7.65s/it, loss=0.0015, acc=0.9966, iter_time=7.30s]
Epoch 0: 11%|█▏ | 1410/12384 [2:59:34<23:17:07, 7.64s/it, loss=0.0015, acc=0.9966, iter_time=7.30s]
Epoch 0: 11%|█▏ | 1410/12384 [2:59:42<23:17:07, 7.64s/it, loss=0.0011, acc=0.9982, iter_time=7.93s]
Epoch 0: 11%|█▏ | 1411/12384 [2:59:42<23:15:56, 7.63s/it, loss=0.0011, acc=0.9982, iter_time=7.93s]
Epoch 0: 11%|█▏ | 1411/12384 [2:59:50<23:15:56, 7.63s/it, loss=0.0020, acc=0.9981, iter_time=7.62s]
Epoch 0: 11%|█▏ | 1412/12384 [2:59:50<23:15:04, 7.63s/it, loss=0.0020, acc=0.9981, iter_time=7.62s]
Epoch 0: 11%|█▏ | 1412/12384 [2:59:57<23:15:04, 7.63s/it, loss=0.0020, acc=0.9950, iter_time=7.62s]
Epoch 0: 11%|█▏ | 1413/12384 [2:59:57<23:13:09, 7.62s/it, loss=0.0020, acc=0.9950, iter_time=7.62s]
Epoch 0: 11%|█▏ | 1413/12384 [3:00:05<23:13:09, 7.62s/it, loss=0.0021, acc=0.9964, iter_time=4.74s]
Epoch 0: 11%|█▏ | 1414/12384 [3:00:05<23:12:15, 7.61s/it, loss=0.0021, acc=0.9964, iter_time=4.74s]
Epoch 0: 11%|█▏ | 1414/12384 [3:00:12<23:12:15, 7.61s/it, loss=0.0007, acc=0.9998, iter_time=10.45s]
Epoch 0: 11%|█▏ | 1415/12384 [3:00:12<23:13:02, 7.62s/it, loss=0.0007, acc=0.9998, iter_time=10.45s]
Epoch 0: 11%|█▏ | 1415/12384 [3:00:20<23:13:02, 7.62s/it, loss=0.0006, acc=0.9977, iter_time=8.02s]
Epoch 0: 11%|█▏ | 1416/12384 [3:00:20<23:12:14, 7.62s/it, loss=0.0006, acc=0.9977, iter_time=8.02s]
Epoch 0: 11%|█▏ | 1416/12384 [3:00:28<23:12:14, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.21s]
Epoch 0: 11%|█▏ | 1417/12384 [3:00:28<23:12:27, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.21s]
Epoch 0: 11%|█▏ | 1417/12384 [3:00:35<23:12:27, 7.62s/it, loss=0.0050, acc=0.9926, iter_time=5.56s]
Epoch 0: 11%|█▏ | 1418/12384 [3:00:35<23:10:56, 7.61s/it, loss=0.0050, acc=0.9926, iter_time=5.56s]
Epoch 0: 11%|█▏ | 1418/12384 [3:00:43<23:10:56, 7.61s/it, loss=0.0021, acc=0.9930, iter_time=8.48s]
Epoch 0: 11%|█▏ | 1419/12384 [3:00:43<23:12:50, 7.62s/it, loss=0.0021, acc=0.9930, iter_time=8.48s]
Epoch 0: 11%|█▏ | 1419/12384 [3:00:50<23:12:50, 7.62s/it, loss=0.0011, acc=0.9988, iter_time=8.84s]
Epoch 0: 11%|█▏ | 1420/12384 [3:00:50<23:11:01, 7.61s/it, loss=0.0011, acc=0.9988, iter_time=8.84s]
Epoch 0: 11%|█▏ | 1420/12384 [3:00:58<23:11:01, 7.61s/it, loss=0.0003, acc=0.9995, iter_time=7.60s]
Epoch 0: 11%|█▏ | 1421/12384 [3:00:58<23:11:24, 7.62s/it, loss=0.0003, acc=0.9995, iter_time=7.60s]
Epoch 0: 11%|█▏ | 1421/12384 [3:01:06<23:11:24, 7.62s/it, loss=0.0062, acc=0.9903, iter_time=7.61s]
Epoch 0: 11%|█▏ | 1422/12384 [3:01:06<23:12:30, 7.62s/it, loss=0.0062, acc=0.9903, iter_time=7.61s]
Epoch 0: 11%|█▏ | 1422/12384 [3:01:13<23:12:30, 7.62s/it, loss=0.0008, acc=0.9978, iter_time=7.65s]
Epoch 0: 11%|█▏ | 1423/12384 [3:01:13<23:11:00, 7.61s/it, loss=0.0008, acc=0.9978, iter_time=7.65s]
Epoch 0: 11%|█▏ | 1423/12384 [3:01:21<23:11:00, 7.61s/it, loss=0.0031, acc=0.9919, iter_time=7.97s]
Epoch 0: 11%|█▏ | 1424/12384 [3:01:21<23:10:59, 7.61s/it, loss=0.0031, acc=0.9919, iter_time=7.97s]
Epoch 0: 11%|█▏ | 1424/12384 [3:01:29<23:10:59, 7.61s/it, loss=0.0028, acc=0.9949, iter_time=7.26s]
Epoch 0: 12%|█▏ | 1425/12384 [3:01:29<23:11:07, 7.62s/it, loss=0.0028, acc=0.9949, iter_time=7.26s]
Epoch 0: 12%|█▏ | 1425/12384 [3:01:36<23:11:07, 7.62s/it, loss=0.0007, acc=0.9964, iter_time=7.61s]
Epoch 0: 12%|█▏ | 1426/12384 [3:01:36<23:10:13, 7.61s/it, loss=0.0007, acc=0.9964, iter_time=7.61s]
Epoch 0: 12%|█▏ | 1426/12384 [3:01:44<23:10:13, 7.61s/it, loss=0.0003, acc=0.9996, iter_time=6.37s]
Epoch 0: 12%|█▏ | 1427/12384 [3:01:44<23:10:10, 7.61s/it, loss=0.0003, acc=0.9996, iter_time=6.37s]
Epoch 0: 12%|█▏ | 1427/12384 [3:01:51<23:10:10, 7.61s/it, loss=0.0009, acc=0.9981, iter_time=6.82s]
Epoch 0: 12%|█▏ | 1428/12384 [3:01:51<23:08:04, 7.60s/it, loss=0.0009, acc=0.9981, iter_time=6.82s]
Epoch 0: 12%|█▏ | 1428/12384 [3:01:59<23:08:04, 7.60s/it, loss=0.0012, acc=0.9981, iter_time=9.65s]
Epoch 0: 12%|█▏ | 1429/12384 [3:01:59<23:28:34, 7.71s/it, loss=0.0012, acc=0.9981, iter_time=9.65s]
Epoch 0: 12%|█▏ | 1429/12384 [3:02:07<23:28:34, 7.71s/it, loss=0.0014, acc=0.9982, iter_time=7.93s]
Epoch 0: 12%|█▏ | 1430/12384 [3:02:07<23:22:38, 7.68s/it, loss=0.0014, acc=0.9982, iter_time=7.93s]
Epoch 0: 12%|█▏ | 1430/12384 [3:02:15<23:22:38, 7.68s/it, loss=0.0027, acc=0.9930, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1431/12384 [3:02:15<23:19:13, 7.66s/it, loss=0.0027, acc=0.9930, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1431/12384 [3:02:22<23:19:13, 7.66s/it, loss=0.0011, acc=0.9973, iter_time=7.55s]
Epoch 0: 12%|█▏ | 1432/12384 [3:02:22<23:15:48, 7.65s/it, loss=0.0011, acc=0.9973, iter_time=7.55s]
Epoch 0: 12%|█▏ | 1432/12384 [3:02:30<23:15:48, 7.65s/it, loss=0.0040, acc=0.9932, iter_time=7.64s]
Epoch 0: 12%|█▏ | 1433/12384 [3:02:30<23:12:13, 7.63s/it, loss=0.0040, acc=0.9932, iter_time=7.64s]
Epoch 0: 12%|█▏ | 1433/12384 [3:02:37<23:12:13, 7.63s/it, loss=0.0021, acc=0.9966, iter_time=7.61s]
Epoch 0: 12%|█▏ | 1434/12384 [3:02:37<23:11:58, 7.63s/it, loss=0.0021, acc=0.9966, iter_time=7.61s]
Epoch 0: 12%|█▏ | 1434/12384 [3:02:45<23:11:58, 7.63s/it, loss=0.0005, acc=0.9998, iter_time=4.48s]
Epoch 0: 12%|█▏ | 1435/12384 [3:02:45<23:09:58, 7.62s/it, loss=0.0005, acc=0.9998, iter_time=4.48s]
Epoch 0: 12%|█▏ | 1435/12384 [3:02:53<23:09:58, 7.62s/it, loss=0.0005, acc=1.0000, iter_time=10.73s]
Epoch 0: 12%|█▏ | 1436/12384 [3:02:53<23:09:26, 7.61s/it, loss=0.0005, acc=1.0000, iter_time=10.73s]
Epoch 0: 12%|█▏ | 1436/12384 [3:03:00<23:09:26, 7.61s/it, loss=0.0036, acc=0.9931, iter_time=7.59s]
Epoch 0: 12%|█▏ | 1437/12384 [3:03:00<23:08:34, 7.61s/it, loss=0.0036, acc=0.9931, iter_time=7.59s]
Epoch 0: 12%|█▏ | 1437/12384 [3:03:08<23:08:34, 7.61s/it, loss=0.0005, acc=0.9977, iter_time=7.63s]
Epoch 0: 12%|█▏ | 1438/12384 [3:03:08<23:07:42, 7.61s/it, loss=0.0005, acc=0.9977, iter_time=7.63s]
Epoch 0: 12%|█▏ | 1438/12384 [3:03:15<23:07:42, 7.61s/it, loss=0.0027, acc=0.9941, iter_time=7.58s]
Epoch 0: 12%|█▏ | 1439/12384 [3:03:15<23:07:14, 7.60s/it, loss=0.0027, acc=0.9941, iter_time=7.58s]
Epoch 0: 12%|█▏ | 1439/12384 [3:03:23<23:07:14, 7.60s/it, loss=0.0031, acc=0.9954, iter_time=7.98s]
Epoch 0: 12%|█▏ | 1440/12384 [3:03:23<23:06:43, 7.60s/it, loss=0.0031, acc=0.9954, iter_time=7.98s]
Epoch 0: 12%|█▏ | 1440/12384 [3:03:31<23:06:43, 7.60s/it, loss=0.0094, acc=0.9867, iter_time=7.21s]
Epoch 0: 12%|█▏ | 1441/12384 [3:03:31<23:05:50, 7.60s/it, loss=0.0094, acc=0.9867, iter_time=7.21s]
Epoch 0: 12%|█▏ | 1441/12384 [3:03:38<23:05:50, 7.60s/it, loss=0.0019, acc=0.9966, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1442/12384 [3:03:38<23:06:54, 7.61s/it, loss=0.0019, acc=0.9966, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1442/12384 [3:03:46<23:06:54, 7.61s/it, loss=0.0022, acc=0.9978, iter_time=7.63s]
Epoch 0: 12%|█▏ | 1443/12384 [3:03:46<23:06:53, 7.61s/it, loss=0.0022, acc=0.9978, iter_time=7.63s]
Epoch 0: 12%|█▏ | 1443/12384 [3:03:53<23:06:53, 7.61s/it, loss=0.0011, acc=0.9958, iter_time=7.60s]
Epoch 0: 12%|█▏ | 1444/12384 [3:03:53<23:08:34, 7.62s/it, loss=0.0011, acc=0.9958, iter_time=7.60s]
Epoch 0: 12%|█▏ | 1444/12384 [3:04:01<23:08:34, 7.62s/it, loss=0.0011, acc=0.9987, iter_time=6.78s]
Epoch 0: 12%|█▏ | 1445/12384 [3:04:01<23:06:41, 7.61s/it, loss=0.0011, acc=0.9987, iter_time=6.78s]
Epoch 0: 12%|█▏ | 1445/12384 [3:04:09<23:06:41, 7.61s/it, loss=0.0042, acc=0.9973, iter_time=8.43s]
Epoch 0: 12%|█▏ | 1446/12384 [3:04:09<23:09:43, 7.62s/it, loss=0.0042, acc=0.9973, iter_time=8.43s]
Epoch 0: 12%|█▏ | 1446/12384 [3:04:16<23:09:43, 7.62s/it, loss=0.0004, acc=0.9998, iter_time=7.68s]
Epoch 0: 12%|█▏ | 1447/12384 [3:04:16<23:08:23, 7.62s/it, loss=0.0004, acc=0.9998, iter_time=7.68s]
Epoch 0: 12%|█▏ | 1447/12384 [3:04:24<23:08:23, 7.62s/it, loss=0.0019, acc=0.9938, iter_time=7.76s]
Epoch 0: 12%|█▏ | 1448/12384 [3:04:24<23:07:55, 7.61s/it, loss=0.0019, acc=0.9938, iter_time=7.76s]
Epoch 0: 12%|█▏ | 1448/12384 [3:04:31<23:07:55, 7.61s/it, loss=0.0006, acc=0.9987, iter_time=5.44s]
Epoch 0: 12%|█▏ | 1449/12384 [3:04:31<23:07:35, 7.61s/it, loss=0.0006, acc=0.9987, iter_time=5.44s]
Epoch 0: 12%|█▏ | 1449/12384 [3:04:39<23:07:35, 7.61s/it, loss=0.0007, acc=0.9996, iter_time=10.03s]
Epoch 0: 12%|█▏ | 1450/12384 [3:04:39<23:07:40, 7.61s/it, loss=0.0007, acc=0.9996, iter_time=10.03s]
Epoch 0: 12%|█▏ | 1450/12384 [3:04:47<23:07:40, 7.61s/it, loss=0.0008, acc=0.9987, iter_time=7.22s]
Epoch 0: 12%|█▏ | 1451/12384 [3:04:47<23:07:43, 7.62s/it, loss=0.0008, acc=0.9987, iter_time=7.22s]
Epoch 0: 12%|█▏ | 1451/12384 [3:04:54<23:07:43, 7.62s/it, loss=0.0007, acc=0.9985, iter_time=7.60s]
Epoch 0: 12%|█▏ | 1452/12384 [3:04:54<23:07:55, 7.62s/it, loss=0.0007, acc=0.9985, iter_time=7.60s]
Epoch 0: 12%|█▏ | 1452/12384 [3:05:02<23:07:55, 7.62s/it, loss=0.0014, acc=0.9968, iter_time=7.61s]
Epoch 0: 12%|█▏ | 1453/12384 [3:05:02<23:07:51, 7.62s/it, loss=0.0014, acc=0.9968, iter_time=7.61s]
Epoch 0: 12%|█▏ | 1453/12384 [3:05:10<23:07:51, 7.62s/it, loss=0.0009, acc=0.9983, iter_time=6.71s]
Epoch 0: 12%|█▏ | 1454/12384 [3:05:10<23:06:32, 7.61s/it, loss=0.0009, acc=0.9983, iter_time=6.71s]
Epoch 0: 12%|█▏ | 1454/12384 [3:05:18<23:06:32, 7.61s/it, loss=0.0004, acc=0.9981, iter_time=7.71s]
Epoch 0: 12%|█▏ | 1455/12384 [3:05:18<23:28:14, 7.73s/it, loss=0.0004, acc=0.9981, iter_time=7.71s]
Epoch 0: 12%|█▏ | 1455/12384 [3:05:25<23:28:14, 7.73s/it, loss=0.0004, acc=0.9999, iter_time=9.22s]
Epoch 0: 12%|█▏ | 1456/12384 [3:05:25<23:21:01, 7.69s/it, loss=0.0004, acc=0.9999, iter_time=9.22s]
Epoch 0: 12%|█▏ | 1456/12384 [3:05:33<23:21:01, 7.69s/it, loss=0.0004, acc=0.9986, iter_time=6.27s]
Epoch 0: 12%|█▏ | 1457/12384 [3:05:33<23:16:29, 7.67s/it, loss=0.0004, acc=0.9986, iter_time=6.27s]
Epoch 0: 12%|█▏ | 1457/12384 [3:05:40<23:16:29, 7.67s/it, loss=0.0036, acc=0.9884, iter_time=8.55s]
Epoch 0: 12%|█▏ | 1458/12384 [3:05:40<23:13:22, 7.65s/it, loss=0.0036, acc=0.9884, iter_time=8.55s]
Epoch 0: 12%|█▏ | 1458/12384 [3:05:48<23:13:22, 7.65s/it, loss=0.0031, acc=0.9933, iter_time=5.28s]
Epoch 0: 12%|█▏ | 1459/12384 [3:05:48<23:10:07, 7.63s/it, loss=0.0031, acc=0.9933, iter_time=5.28s]
Epoch 0: 12%|█▏ | 1459/12384 [3:05:56<23:10:07, 7.63s/it, loss=0.0028, acc=0.9898, iter_time=9.94s]
Epoch 0: 12%|█▏ | 1460/12384 [3:05:56<23:08:04, 7.62s/it, loss=0.0028, acc=0.9898, iter_time=9.94s]
Epoch 0: 12%|█▏ | 1460/12384 [3:06:03<23:08:04, 7.62s/it, loss=0.0007, acc=0.9972, iter_time=6.09s]
Epoch 0: 12%|█▏ | 1461/12384 [3:06:03<23:06:28, 7.62s/it, loss=0.0007, acc=0.9972, iter_time=6.09s]
Epoch 0: 12%|█▏ | 1461/12384 [3:06:11<23:06:28, 7.62s/it, loss=0.0018, acc=0.9976, iter_time=9.10s]
Epoch 0: 12%|█▏ | 1462/12384 [3:06:11<23:05:38, 7.61s/it, loss=0.0018, acc=0.9976, iter_time=9.10s]
Epoch 0: 12%|█▏ | 1462/12384 [3:06:18<23:05:38, 7.61s/it, loss=0.0008, acc=0.9980, iter_time=7.61s]
Epoch 0: 12%|█▏ | 1463/12384 [3:06:18<23:05:08, 7.61s/it, loss=0.0008, acc=0.9980, iter_time=7.61s]
Epoch 0: 12%|█▏ | 1463/12384 [3:06:26<23:05:08, 7.61s/it, loss=0.0009, acc=0.9994, iter_time=7.52s]
Epoch 0: 12%|█▏ | 1464/12384 [3:06:26<23:03:34, 7.60s/it, loss=0.0009, acc=0.9994, iter_time=7.52s]
Epoch 0: 12%|█▏ | 1464/12384 [3:06:34<23:03:34, 7.60s/it, loss=0.0005, acc=0.9993, iter_time=7.64s]
Epoch 0: 12%|█▏ | 1465/12384 [3:06:34<23:02:29, 7.60s/it, loss=0.0005, acc=0.9993, iter_time=7.64s]
Epoch 0: 12%|█▏ | 1465/12384 [3:06:41<23:02:29, 7.60s/it, loss=0.0024, acc=0.9963, iter_time=7.36s]
Epoch 0: 12%|█▏ | 1466/12384 [3:06:41<23:02:27, 7.60s/it, loss=0.0024, acc=0.9963, iter_time=7.36s]
Epoch 0: 12%|█▏ | 1466/12384 [3:06:49<23:02:27, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=6.11s]
Epoch 0: 12%|█▏ | 1467/12384 [3:06:49<23:02:48, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=6.11s]
Epoch 0: 12%|█▏ | 1467/12384 [3:06:56<23:02:48, 7.60s/it, loss=0.0012, acc=0.9984, iter_time=9.34s]
Epoch 0: 12%|█▏ | 1468/12384 [3:06:56<23:02:17, 7.60s/it, loss=0.0012, acc=0.9984, iter_time=9.34s]
Epoch 0: 12%|█▏ | 1468/12384 [3:07:04<23:02:17, 7.60s/it, loss=0.0016, acc=0.9978, iter_time=7.58s]
Epoch 0: 12%|█▏ | 1469/12384 [3:07:04<23:02:14, 7.60s/it, loss=0.0016, acc=0.9978, iter_time=7.58s]
Epoch 0: 12%|█▏ | 1469/12384 [3:07:12<23:02:14, 7.60s/it, loss=0.0013, acc=0.9975, iter_time=5.29s]
Epoch 0: 12%|█▏ | 1470/12384 [3:07:12<23:06:05, 7.62s/it, loss=0.0013, acc=0.9975, iter_time=5.29s]
Epoch 0: 12%|█▏ | 1470/12384 [3:07:19<23:06:05, 7.62s/it, loss=0.0006, acc=0.9992, iter_time=10.00s]
Epoch 0: 12%|█▏ | 1471/12384 [3:07:19<23:05:07, 7.62s/it, loss=0.0006, acc=0.9992, iter_time=10.00s]
Epoch 0: 12%|█▏ | 1471/12384 [3:07:27<23:05:07, 7.62s/it, loss=0.0015, acc=0.9968, iter_time=7.97s]
Epoch 0: 12%|█▏ | 1472/12384 [3:07:27<23:03:50, 7.61s/it, loss=0.0015, acc=0.9968, iter_time=7.97s]
Epoch 0: 12%|█▏ | 1472/12384 [3:07:34<23:03:50, 7.61s/it, loss=0.0009, acc=0.9966, iter_time=7.23s]
Epoch 0: 12%|█▏ | 1473/12384 [3:07:34<23:04:14, 7.61s/it, loss=0.0009, acc=0.9966, iter_time=7.23s]
Epoch 0: 12%|█▏ | 1473/12384 [3:07:42<23:04:14, 7.61s/it, loss=0.0014, acc=0.9960, iter_time=7.61s]
Epoch 0: 12%|█▏ | 1474/12384 [3:07:42<23:03:43, 7.61s/it, loss=0.0014, acc=0.9960, iter_time=7.61s]
Epoch 0: 12%|█▏ | 1474/12384 [3:07:50<23:03:43, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=5.79s]
Epoch 0: 12%|█▏ | 1475/12384 [3:07:50<23:05:44, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=5.79s]
Epoch 0: 12%|█▏ | 1475/12384 [3:07:57<23:05:44, 7.62s/it, loss=0.0020, acc=0.9938, iter_time=9.16s]
Epoch 0: 12%|█▏ | 1476/12384 [3:07:57<23:05:31, 7.62s/it, loss=0.0020, acc=0.9938, iter_time=9.16s]
Epoch 0: 12%|█▏ | 1476/12384 [3:08:05<23:05:31, 7.62s/it, loss=0.0012, acc=0.9961, iter_time=4.61s]
Epoch 0: 12%|█▏ | 1477/12384 [3:08:05<23:04:24, 7.62s/it, loss=0.0012, acc=0.9961, iter_time=4.61s]
Epoch 0: 12%|█▏ | 1477/12384 [3:08:13<23:04:24, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=10.90s]
Epoch 0: 12%|█▏ | 1478/12384 [3:08:13<23:04:30, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=10.90s]
Epoch 0: 12%|█▏ | 1478/12384 [3:08:20<23:04:30, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.63s]
Epoch 0: 12%|█▏ | 1479/12384 [3:08:20<23:03:32, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.63s]
Epoch 0: 12%|█▏ | 1479/12384 [3:08:28<23:03:32, 7.61s/it, loss=0.0020, acc=0.9936, iter_time=8.30s]
Epoch 0: 12%|█▏ | 1480/12384 [3:08:28<23:19:52, 7.70s/it, loss=0.0020, acc=0.9936, iter_time=8.30s]
Epoch 0: 12%|█▏ | 1480/12384 [3:08:36<23:19:52, 7.70s/it, loss=0.0027, acc=0.9929, iter_time=5.76s]
Epoch 0: 12%|█▏ | 1481/12384 [3:08:36<23:30:50, 7.76s/it, loss=0.0027, acc=0.9929, iter_time=5.76s]
Epoch 0: 12%|█▏ | 1481/12384 [3:08:44<23:30:50, 7.76s/it, loss=0.0006, acc=0.9999, iter_time=8.82s]
Epoch 0: 12%|█▏ | 1482/12384 [3:08:44<23:22:36, 7.72s/it, loss=0.0006, acc=0.9999, iter_time=8.82s]
Epoch 0: 12%|█▏ | 1482/12384 [3:08:51<23:22:36, 7.72s/it, loss=0.0024, acc=0.9970, iter_time=6.12s]
Epoch 0: 12%|█▏ | 1483/12384 [3:08:51<23:17:10, 7.69s/it, loss=0.0024, acc=0.9970, iter_time=6.12s]
Epoch 0: 12%|█▏ | 1483/12384 [3:08:59<23:17:10, 7.69s/it, loss=0.0134, acc=0.9805, iter_time=9.65s]
Epoch 0: 12%|█▏ | 1484/12384 [3:08:59<23:13:50, 7.67s/it, loss=0.0134, acc=0.9805, iter_time=9.65s]
Epoch 0: 12%|█▏ | 1484/12384 [3:09:07<23:13:50, 7.67s/it, loss=0.0017, acc=0.9970, iter_time=7.66s]
Epoch 0: 12%|█▏ | 1485/12384 [3:09:07<23:17:07, 7.69s/it, loss=0.0017, acc=0.9970, iter_time=7.66s]
Epoch 0: 12%|█▏ | 1485/12384 [3:09:14<23:17:07, 7.69s/it, loss=0.0021, acc=0.9939, iter_time=4.70s]
Epoch 0: 12%|█▏ | 1486/12384 [3:09:14<23:12:42, 7.67s/it, loss=0.0021, acc=0.9939, iter_time=4.70s]
Epoch 0: 12%|█▏ | 1486/12384 [3:09:22<23:12:42, 7.67s/it, loss=0.0009, acc=0.9964, iter_time=10.62s]
Epoch 0: 12%|█▏ | 1487/12384 [3:09:22<23:08:29, 7.65s/it, loss=0.0009, acc=0.9964, iter_time=10.62s]
Epoch 0: 12%|█▏ | 1487/12384 [3:09:29<23:08:29, 7.65s/it, loss=0.0022, acc=0.9957, iter_time=8.00s]
Epoch 0: 12%|█▏ | 1488/12384 [3:09:29<23:06:29, 7.63s/it, loss=0.0022, acc=0.9957, iter_time=8.00s]
Epoch 0: 12%|█▏ | 1488/12384 [3:09:37<23:06:29, 7.63s/it, loss=0.0034, acc=0.9904, iter_time=7.24s]
Epoch 0: 12%|█▏ | 1489/12384 [3:09:37<23:08:07, 7.64s/it, loss=0.0034, acc=0.9904, iter_time=7.24s]
Epoch 0: 12%|█▏ | 1489/12384 [3:09:45<23:08:07, 7.64s/it, loss=0.0029, acc=0.9943, iter_time=7.66s]
Epoch 0: 12%|█▏ | 1490/12384 [3:09:45<23:06:06, 7.63s/it, loss=0.0029, acc=0.9943, iter_time=7.66s]
Epoch 0: 12%|█▏ | 1490/12384 [3:09:52<23:06:06, 7.63s/it, loss=0.0006, acc=0.9988, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1491/12384 [3:09:52<23:04:29, 7.63s/it, loss=0.0006, acc=0.9988, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1491/12384 [3:10:00<23:04:29, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.59s]
Epoch 0: 12%|█▏ | 1492/12384 [3:10:00<23:03:05, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=7.59s]
Epoch 0: 12%|█▏ | 1492/12384 [3:10:08<23:03:05, 7.62s/it, loss=0.0123, acc=0.9808, iter_time=7.32s]
Epoch 0: 12%|█▏ | 1493/12384 [3:10:08<23:03:33, 7.62s/it, loss=0.0123, acc=0.9808, iter_time=7.32s]
Epoch 0: 12%|█▏ | 1493/12384 [3:10:15<23:03:33, 7.62s/it, loss=0.0022, acc=0.9956, iter_time=6.74s]
Epoch 0: 12%|█▏ | 1494/12384 [3:10:15<23:02:41, 7.62s/it, loss=0.0022, acc=0.9956, iter_time=6.74s]
Epoch 0: 12%|█▏ | 1494/12384 [3:10:23<23:02:41, 7.62s/it, loss=0.0007, acc=0.9998, iter_time=5.73s]
Epoch 0: 12%|█▏ | 1495/12384 [3:10:23<23:01:29, 7.61s/it, loss=0.0007, acc=0.9998, iter_time=5.73s]
Epoch 0: 12%|█▏ | 1495/12384 [3:10:30<23:01:29, 7.61s/it, loss=0.0028, acc=0.9960, iter_time=11.04s]
Epoch 0: 12%|█▏ | 1496/12384 [3:10:30<23:01:15, 7.61s/it, loss=0.0028, acc=0.9960, iter_time=11.04s]
Epoch 0: 12%|█▏ | 1496/12384 [3:10:38<23:01:15, 7.61s/it, loss=0.0013, acc=0.9962, iter_time=7.22s]
Epoch 0: 12%|█▏ | 1497/12384 [3:10:38<23:01:49, 7.62s/it, loss=0.0013, acc=0.9962, iter_time=7.22s]
Epoch 0: 12%|█▏ | 1497/12384 [3:10:46<23:01:49, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=6.71s]
Epoch 0: 12%|█▏ | 1498/12384 [3:10:46<22:59:47, 7.60s/it, loss=0.0003, acc=1.0000, iter_time=6.71s]
Epoch 0: 12%|█▏ | 1498/12384 [3:10:53<22:59:47, 7.60s/it, loss=0.0014, acc=0.9961, iter_time=7.29s]
Epoch 0: 12%|█▏ | 1499/12384 [3:10:53<23:00:29, 7.61s/it, loss=0.0014, acc=0.9961, iter_time=7.29s]
Epoch 0: 12%|█▏ | 1499/12384 [3:11:01<23:00:29, 7.61s/it, loss=0.0004, acc=1.0000, iter_time=9.26s]
Epoch 0: 12%|█▏ | 1500/12384 [3:11:01<23:11:25, 7.67s/it, loss=0.0004, acc=1.0000, iter_time=9.26s]
Epoch 0: 12%|█▏ | 1500/12384 [3:11:09<23:11:25, 7.67s/it, loss=0.0018, acc=0.9970, iter_time=5.88s]
Epoch 0: 12%|█▏ | 1501/12384 [3:11:09<23:07:23, 7.65s/it, loss=0.0018, acc=0.9970, iter_time=5.88s]
Epoch 0: 12%|█▏ | 1501/12384 [3:11:16<23:07:23, 7.65s/it, loss=0.0025, acc=0.9960, iter_time=9.13s]
Epoch 0: 12%|█▏ | 1502/12384 [3:11:16<23:09:53, 7.66s/it, loss=0.0025, acc=0.9960, iter_time=9.13s]
Epoch 0: 12%|█▏ | 1502/12384 [3:11:24<23:09:53, 7.66s/it, loss=0.0012, acc=0.9977, iter_time=7.69s]
Epoch 0: 12%|█▏ | 1503/12384 [3:11:24<23:05:58, 7.64s/it, loss=0.0012, acc=0.9977, iter_time=7.69s]
Epoch 0: 12%|█▏ | 1503/12384 [3:11:31<23:05:58, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=7.53s]
Epoch 0: 12%|█▏ | 1504/12384 [3:11:31<23:03:05, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.53s]
Epoch 0: 12%|█▏ | 1504/12384 [3:11:39<23:03:05, 7.63s/it, loss=0.0004, acc=1.0000, iter_time=7.65s]
Epoch 0: 12%|█▏ | 1505/12384 [3:11:39<23:02:23, 7.62s/it, loss=0.0004, acc=1.0000, iter_time=7.65s]
Epoch 0: 12%|█▏ | 1505/12384 [3:11:47<23:02:23, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.63s]
Epoch 0: 12%|█▏ | 1506/12384 [3:11:47<23:03:20, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.63s]
Epoch 0: 12%|█▏ | 1506/12384 [3:11:55<23:03:20, 7.63s/it, loss=0.0022, acc=0.9969, iter_time=4.81s]
Epoch 0: 12%|█▏ | 1507/12384 [3:11:55<23:19:20, 7.72s/it, loss=0.0022, acc=0.9969, iter_time=4.81s]
Epoch 0: 12%|█▏ | 1507/12384 [3:12:02<23:19:20, 7.72s/it, loss=0.0007, acc=0.9990, iter_time=9.26s]
Epoch 0: 12%|█▏ | 1508/12384 [3:12:02<23:12:42, 7.68s/it, loss=0.0007, acc=0.9990, iter_time=9.26s]
Epoch 0: 12%|█▏ | 1508/12384 [3:12:10<23:12:42, 7.68s/it, loss=0.0008, acc=0.9986, iter_time=9.10s]
Epoch 0: 12%|█▏ | 1509/12384 [3:12:10<23:09:01, 7.66s/it, loss=0.0008, acc=0.9986, iter_time=9.10s]
Epoch 0: 12%|█▏ | 1509/12384 [3:12:17<23:09:01, 7.66s/it, loss=0.0013, acc=0.9969, iter_time=4.74s]
Epoch 0: 12%|█▏ | 1510/12384 [3:12:17<23:05:54, 7.65s/it, loss=0.0013, acc=0.9969, iter_time=4.74s]
Epoch 0: 12%|█▏ | 1510/12384 [3:12:25<23:05:54, 7.65s/it, loss=0.0007, acc=0.9972, iter_time=10.47s]
Epoch 0: 12%|█▏ | 1511/12384 [3:12:25<23:04:15, 7.64s/it, loss=0.0007, acc=0.9972, iter_time=10.47s]
Epoch 0: 12%|█▏ | 1511/12384 [3:12:33<23:04:15, 7.64s/it, loss=0.0009, acc=0.9984, iter_time=8.03s]
Epoch 0: 12%|█▏ | 1512/12384 [3:12:33<23:03:54, 7.64s/it, loss=0.0009, acc=0.9984, iter_time=8.03s]
Epoch 0: 12%|█▏ | 1512/12384 [3:12:40<23:03:54, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=6.12s]
Epoch 0: 12%|█▏ | 1513/12384 [3:12:40<23:02:10, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=6.12s]
Epoch 0: 12%|█▏ | 1513/12384 [3:12:48<23:02:10, 7.63s/it, loss=0.0005, acc=0.9994, iter_time=8.74s]
Epoch 0: 12%|█▏ | 1514/12384 [3:12:48<23:00:59, 7.62s/it, loss=0.0005, acc=0.9994, iter_time=8.74s]
Epoch 0: 12%|█▏ | 1514/12384 [3:12:56<23:00:59, 7.62s/it, loss=0.0021, acc=0.9975, iter_time=7.61s]
Epoch 0: 12%|█▏ | 1515/12384 [3:12:56<23:00:19, 7.62s/it, loss=0.0021, acc=0.9975, iter_time=7.61s]
Epoch 0: 12%|█▏ | 1515/12384 [3:13:03<23:00:19, 7.62s/it, loss=0.0019, acc=0.9969, iter_time=7.60s]
Epoch 0: 12%|█▏ | 1516/12384 [3:13:03<22:59:55, 7.62s/it, loss=0.0019, acc=0.9969, iter_time=7.60s]
Epoch 0: 12%|█▏ | 1516/12384 [3:13:11<22:59:55, 7.62s/it, loss=0.0150, acc=0.9878, iter_time=7.61s]
Epoch 0: 12%|█▏ | 1517/12384 [3:13:11<22:58:36, 7.61s/it, loss=0.0150, acc=0.9878, iter_time=7.61s]
Epoch 0: 12%|█▏ | 1517/12384 [3:13:18<22:58:36, 7.61s/it, loss=0.0010, acc=0.9995, iter_time=4.01s]
Epoch 0: 12%|█▏ | 1518/12384 [3:13:18<22:58:37, 7.61s/it, loss=0.0010, acc=0.9995, iter_time=4.01s]
Epoch 0: 12%|█▏ | 1518/12384 [3:13:26<22:58:37, 7.61s/it, loss=0.0019, acc=0.9972, iter_time=11.19s]
Epoch 0: 12%|█▏ | 1519/12384 [3:13:26<22:58:32, 7.61s/it, loss=0.0019, acc=0.9972, iter_time=11.19s]
Epoch 0: 12%|█▏ | 1519/12384 [3:13:34<22:58:32, 7.61s/it, loss=0.0075, acc=0.9868, iter_time=7.58s]
Epoch 0: 12%|█▏ | 1520/12384 [3:13:34<22:58:23, 7.61s/it, loss=0.0075, acc=0.9868, iter_time=7.58s]
Epoch 0: 12%|█▏ | 1520/12384 [3:13:41<22:58:23, 7.61s/it, loss=0.0009, acc=0.9977, iter_time=7.65s]
Epoch 0: 12%|█▏ | 1521/12384 [3:13:41<23:00:18, 7.62s/it, loss=0.0009, acc=0.9977, iter_time=7.65s]
Epoch 0: 12%|█▏ | 1521/12384 [3:13:49<23:00:18, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.65s]
Epoch 0: 12%|█▏ | 1522/12384 [3:13:49<22:59:47, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.65s]
Epoch 0: 12%|█▏ | 1522/12384 [3:13:56<22:59:47, 7.62s/it, loss=0.0009, acc=0.9973, iter_time=7.67s]
Epoch 0: 12%|█▏ | 1523/12384 [3:13:56<23:01:03, 7.63s/it, loss=0.0009, acc=0.9973, iter_time=7.67s]
Epoch 0: 12%|█▏ | 1523/12384 [3:14:04<23:01:03, 7.63s/it, loss=0.0015, acc=0.9973, iter_time=5.05s]
Epoch 0: 12%|█▏ | 1524/12384 [3:14:04<23:00:36, 7.63s/it, loss=0.0015, acc=0.9973, iter_time=5.05s]
Epoch 0: 12%|█▏ | 1524/12384 [3:14:12<23:00:36, 7.63s/it, loss=0.0008, acc=0.9992, iter_time=10.15s]
Epoch 0: 12%|█▏ | 1525/12384 [3:14:12<22:59:25, 7.62s/it, loss=0.0008, acc=0.9992, iter_time=10.15s]
Epoch 0: 12%|█▏ | 1525/12384 [3:14:19<22:59:25, 7.62s/it, loss=0.0009, acc=0.9974, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1526/12384 [3:14:19<22:58:42, 7.62s/it, loss=0.0009, acc=0.9974, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1526/12384 [3:14:27<22:58:42, 7.62s/it, loss=0.0005, acc=1.0000, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1527/12384 [3:14:27<22:57:38, 7.61s/it, loss=0.0005, acc=1.0000, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1527/12384 [3:14:35<22:57:38, 7.61s/it, loss=0.0004, acc=1.0000, iter_time=8.00s]
Epoch 0: 12%|█▏ | 1528/12384 [3:14:35<22:57:37, 7.61s/it, loss=0.0004, acc=1.0000, iter_time=8.00s]
Epoch 0: 12%|█▏ | 1528/12384 [3:14:42<22:57:37, 7.61s/it, loss=0.0005, acc=0.9997, iter_time=5.68s]
Epoch 0: 12%|█▏ | 1529/12384 [3:14:42<22:57:22, 7.61s/it, loss=0.0005, acc=0.9997, iter_time=5.68s]
Epoch 0: 12%|█▏ | 1529/12384 [3:14:50<22:57:22, 7.61s/it, loss=0.0014, acc=0.9963, iter_time=7.34s]
Epoch 0: 12%|█▏ | 1530/12384 [3:14:50<22:56:33, 7.61s/it, loss=0.0014, acc=0.9963, iter_time=7.34s]
Epoch 0: 12%|█▏ | 1530/12384 [3:14:57<22:56:33, 7.61s/it, loss=0.0008, acc=0.9983, iter_time=9.41s]
Epoch 0: 12%|█▏ | 1531/12384 [3:14:57<22:57:56, 7.62s/it, loss=0.0008, acc=0.9983, iter_time=9.41s]
Epoch 0: 12%|█▏ | 1531/12384 [3:15:05<22:57:56, 7.62s/it, loss=0.0009, acc=0.9979, iter_time=5.84s]
Epoch 0: 12%|█▏ | 1532/12384 [3:15:05<22:56:35, 7.61s/it, loss=0.0009, acc=0.9979, iter_time=5.84s]
Epoch 0: 12%|█▏ | 1532/12384 [3:15:13<22:56:35, 7.61s/it, loss=0.0004, acc=0.9985, iter_time=9.66s]
Epoch 0: 12%|█▏ | 1533/12384 [3:15:13<23:14:55, 7.71s/it, loss=0.0004, acc=0.9985, iter_time=9.66s]
Epoch 0: 12%|█▏ | 1533/12384 [3:15:21<23:14:55, 7.71s/it, loss=0.0029, acc=0.9919, iter_time=7.68s]
Epoch 0: 12%|█▏ | 1534/12384 [3:15:21<23:08:57, 7.68s/it, loss=0.0029, acc=0.9919, iter_time=7.68s]
Epoch 0: 12%|█▏ | 1534/12384 [3:15:28<23:08:57, 7.68s/it, loss=0.0009, acc=0.9962, iter_time=6.68s]
Epoch 0: 12%|█▏ | 1535/12384 [3:15:28<23:03:51, 7.65s/it, loss=0.0009, acc=0.9962, iter_time=6.68s]
Epoch 0: 12%|█▏ | 1535/12384 [3:15:36<23:03:51, 7.65s/it, loss=0.0022, acc=0.9937, iter_time=8.92s]
Epoch 0: 12%|█▏ | 1536/12384 [3:15:36<23:01:42, 7.64s/it, loss=0.0022, acc=0.9937, iter_time=8.92s]
Epoch 0: 12%|█▏ | 1536/12384 [3:15:43<23:01:42, 7.64s/it, loss=0.0012, acc=1.0000, iter_time=7.24s]
Epoch 0: 12%|█▏ | 1537/12384 [3:15:43<23:01:12, 7.64s/it, loss=0.0012, acc=1.0000, iter_time=7.24s]
Epoch 0: 12%|█▏ | 1537/12384 [3:15:51<23:01:12, 7.64s/it, loss=0.0012, acc=0.9967, iter_time=7.31s]
Epoch 0: 12%|█▏ | 1538/12384 [3:15:51<22:58:07, 7.62s/it, loss=0.0012, acc=0.9967, iter_time=7.31s]
Epoch 0: 12%|█▏ | 1538/12384 [3:15:59<22:58:07, 7.62s/it, loss=0.0006, acc=0.9982, iter_time=7.91s]
Epoch 0: 12%|█▏ | 1539/12384 [3:15:59<22:57:02, 7.62s/it, loss=0.0006, acc=0.9982, iter_time=7.91s]
Epoch 0: 12%|█▏ | 1539/12384 [3:16:06<22:57:02, 7.62s/it, loss=0.0005, acc=1.0000, iter_time=7.59s]
Epoch 0: 12%|█▏ | 1540/12384 [3:16:06<22:55:26, 7.61s/it, loss=0.0005, acc=1.0000, iter_time=7.59s]
Epoch 0: 12%|█▏ | 1540/12384 [3:16:14<22:55:26, 7.61s/it, loss=0.0025, acc=0.9947, iter_time=7.60s]
Epoch 0: 12%|█▏ | 1541/12384 [3:16:14<22:54:37, 7.61s/it, loss=0.0025, acc=0.9947, iter_time=7.60s]
Epoch 0: 12%|█▏ | 1541/12384 [3:16:21<22:54:37, 7.61s/it, loss=0.0050, acc=0.9866, iter_time=7.61s]
Epoch 0: 12%|█▏ | 1542/12384 [3:16:21<22:55:09, 7.61s/it, loss=0.0050, acc=0.9866, iter_time=7.61s]
Epoch 0: 12%|█▏ | 1542/12384 [3:16:29<22:55:09, 7.61s/it, loss=0.0007, acc=0.9980, iter_time=7.61s]
Epoch 0: 12%|█▏ | 1543/12384 [3:16:29<22:54:43, 7.61s/it, loss=0.0007, acc=0.9980, iter_time=7.61s]
Epoch 0: 12%|█▏ | 1543/12384 [3:16:37<22:54:43, 7.61s/it, loss=0.0010, acc=0.9980, iter_time=8.01s]
Epoch 0: 12%|█▏ | 1544/12384 [3:16:37<22:55:29, 7.61s/it, loss=0.0010, acc=0.9980, iter_time=8.01s]
Epoch 0: 12%|█▏ | 1544/12384 [3:16:44<22:55:29, 7.61s/it, loss=0.0013, acc=0.9992, iter_time=7.20s]
Epoch 0: 12%|█▏ | 1545/12384 [3:16:44<22:55:20, 7.61s/it, loss=0.0013, acc=0.9992, iter_time=7.20s]
Epoch 0: 12%|█▏ | 1545/12384 [3:16:52<22:55:20, 7.61s/it, loss=0.0049, acc=0.9919, iter_time=7.63s]
Epoch 0: 12%|█▏ | 1546/12384 [3:16:52<22:55:29, 7.61s/it, loss=0.0049, acc=0.9919, iter_time=7.63s]
Epoch 0: 12%|█▏ | 1546/12384 [3:16:59<22:55:29, 7.61s/it, loss=0.0003, acc=0.9997, iter_time=6.68s]
Epoch 0: 12%|█▏ | 1547/12384 [3:16:59<22:55:45, 7.62s/it, loss=0.0003, acc=0.9997, iter_time=6.68s]
Epoch 0: 12%|█▏ | 1547/12384 [3:17:07<22:55:45, 7.62s/it, loss=0.0013, acc=0.9988, iter_time=8.58s]
Epoch 0: 12%|█▎ | 1548/12384 [3:17:07<22:55:43, 7.62s/it, loss=0.0013, acc=0.9988, iter_time=8.58s]
Epoch 0: 12%|█▎ | 1548/12384 [3:17:15<22:55:43, 7.62s/it, loss=0.0007, acc=0.9980, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1549/12384 [3:17:15<22:55:19, 7.62s/it, loss=0.0007, acc=0.9980, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1549/12384 [3:17:22<22:55:19, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=8.00s]
Epoch 0: 13%|█▎ | 1550/12384 [3:17:22<22:54:57, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=8.00s]
Epoch 0: 13%|█▎ | 1550/12384 [3:17:30<22:54:57, 7.61s/it, loss=0.0006, acc=0.9977, iter_time=4.14s]
Epoch 0: 13%|█▎ | 1551/12384 [3:17:30<22:55:04, 7.62s/it, loss=0.0006, acc=0.9977, iter_time=4.14s]
Epoch 0: 13%|█▎ | 1551/12384 [3:17:38<22:55:04, 7.62s/it, loss=0.0007, acc=0.9989, iter_time=11.06s]
Epoch 0: 13%|█▎ | 1552/12384 [3:17:38<22:53:47, 7.61s/it, loss=0.0007, acc=0.9989, iter_time=11.06s]
Epoch 0: 13%|█▎ | 1552/12384 [3:17:45<22:53:47, 7.61s/it, loss=0.0006, acc=0.9980, iter_time=4.61s]
Epoch 0: 13%|█▎ | 1553/12384 [3:17:45<22:54:33, 7.61s/it, loss=0.0006, acc=0.9980, iter_time=4.61s]
Epoch 0: 13%|█▎ | 1553/12384 [3:17:53<22:54:33, 7.61s/it, loss=0.0007, acc=0.9998, iter_time=7.65s]
Epoch 0: 13%|█▎ | 1554/12384 [3:17:53<22:55:41, 7.62s/it, loss=0.0007, acc=0.9998, iter_time=7.65s]
Epoch 0: 13%|█▎ | 1554/12384 [3:18:00<22:55:41, 7.62s/it, loss=0.0215, acc=0.9757, iter_time=8.78s]
Epoch 0: 13%|█▎ | 1555/12384 [3:18:00<22:53:49, 7.61s/it, loss=0.0215, acc=0.9757, iter_time=8.78s]
Epoch 0: 13%|█▎ | 1555/12384 [3:18:08<22:53:49, 7.61s/it, loss=0.0010, acc=0.9978, iter_time=9.04s]
Epoch 0: 13%|█▎ | 1556/12384 [3:18:08<22:53:01, 7.61s/it, loss=0.0010, acc=0.9978, iter_time=9.04s]
Epoch 0: 13%|█▎ | 1556/12384 [3:18:16<22:53:01, 7.61s/it, loss=0.0010, acc=0.9950, iter_time=4.82s]
Epoch 0: 13%|█▎ | 1557/12384 [3:18:16<22:52:27, 7.61s/it, loss=0.0010, acc=0.9950, iter_time=4.82s]
Epoch 0: 13%|█▎ | 1557/12384 [3:18:23<22:52:27, 7.61s/it, loss=0.0013, acc=0.9998, iter_time=7.07s]
Epoch 0: 13%|█▎ | 1558/12384 [3:18:23<22:52:59, 7.61s/it, loss=0.0013, acc=0.9998, iter_time=7.07s]
Epoch 0: 13%|█▎ | 1558/12384 [3:18:31<22:52:59, 7.61s/it, loss=0.0006, acc=0.9967, iter_time=7.53s]
Epoch 0: 13%|█▎ | 1559/12384 [3:18:31<22:52:59, 7.61s/it, loss=0.0006, acc=0.9967, iter_time=7.53s]
Epoch 0: 13%|█▎ | 1559/12384 [3:18:39<22:52:59, 7.61s/it, loss=0.0006, acc=0.9983, iter_time=11.70s]
Epoch 0: 13%|█▎ | 1560/12384 [3:18:39<23:08:10, 7.69s/it, loss=0.0006, acc=0.9983, iter_time=11.70s]
Epoch 0: 13%|█▎ | 1560/12384 [3:18:46<23:08:10, 7.69s/it, loss=0.0010, acc=0.9979, iter_time=7.20s]
Epoch 0: 13%|█▎ | 1561/12384 [3:18:46<23:03:24, 7.67s/it, loss=0.0010, acc=0.9979, iter_time=7.20s]
Epoch 0: 13%|█▎ | 1561/12384 [3:18:54<23:03:24, 7.67s/it, loss=0.0014, acc=0.9957, iter_time=5.07s]
Epoch 0: 13%|█▎ | 1562/12384 [3:18:54<22:58:05, 7.64s/it, loss=0.0014, acc=0.9957, iter_time=5.07s]
Epoch 0: 13%|█▎ | 1562/12384 [3:19:02<22:58:05, 7.64s/it, loss=0.0007, acc=0.9981, iter_time=10.12s]
Epoch 0: 13%|█▎ | 1563/12384 [3:19:02<22:57:11, 7.64s/it, loss=0.0007, acc=0.9981, iter_time=10.12s]
Epoch 0: 13%|█▎ | 1563/12384 [3:19:09<22:57:11, 7.64s/it, loss=0.0032, acc=0.9926, iter_time=4.61s]
Epoch 0: 13%|█▎ | 1564/12384 [3:19:09<22:55:43, 7.63s/it, loss=0.0032, acc=0.9926, iter_time=4.61s]
Epoch 0: 13%|█▎ | 1564/12384 [3:19:17<22:55:43, 7.63s/it, loss=0.0077, acc=0.9810, iter_time=10.63s]
Epoch 0: 13%|█▎ | 1565/12384 [3:19:17<22:54:01, 7.62s/it, loss=0.0077, acc=0.9810, iter_time=10.63s]
Epoch 0: 13%|█▎ | 1565/12384 [3:19:24<22:54:01, 7.62s/it, loss=0.0042, acc=0.9969, iter_time=7.60s]
Epoch 0: 13%|█▎ | 1566/12384 [3:19:24<22:53:06, 7.62s/it, loss=0.0042, acc=0.9969, iter_time=7.60s]
Epoch 0: 13%|█▎ | 1566/12384 [3:19:32<22:53:06, 7.62s/it, loss=0.0015, acc=0.9952, iter_time=5.81s]
Epoch 0: 13%|█▎ | 1567/12384 [3:19:32<22:51:44, 7.61s/it, loss=0.0015, acc=0.9952, iter_time=5.81s]
Epoch 0: 13%|█▎ | 1567/12384 [3:19:40<22:51:44, 7.61s/it, loss=0.0007, acc=0.9999, iter_time=9.78s]
Epoch 0: 13%|█▎ | 1568/12384 [3:19:40<22:50:55, 7.61s/it, loss=0.0007, acc=0.9999, iter_time=9.78s]
Epoch 0: 13%|█▎ | 1568/12384 [3:19:47<22:50:55, 7.61s/it, loss=0.0008, acc=0.9978, iter_time=3.85s]
Epoch 0: 13%|█▎ | 1569/12384 [3:19:47<22:51:06, 7.61s/it, loss=0.0008, acc=0.9978, iter_time=3.85s]
Epoch 0: 13%|█▎ | 1569/12384 [3:19:55<22:51:06, 7.61s/it, loss=0.0008, acc=0.9975, iter_time=9.54s]
Epoch 0: 13%|█▎ | 1570/12384 [3:19:55<22:51:47, 7.61s/it, loss=0.0008, acc=0.9975, iter_time=9.54s]
Epoch 0: 13%|█▎ | 1570/12384 [3:20:02<22:51:47, 7.61s/it, loss=0.0052, acc=0.9882, iter_time=7.53s]
Epoch 0: 13%|█▎ | 1571/12384 [3:20:02<22:52:14, 7.61s/it, loss=0.0052, acc=0.9882, iter_time=7.53s]
Epoch 0: 13%|█▎ | 1571/12384 [3:20:10<22:52:14, 7.61s/it, loss=0.0013, acc=0.9959, iter_time=9.13s]
Epoch 0: 13%|█▎ | 1572/12384 [3:20:10<22:51:10, 7.61s/it, loss=0.0013, acc=0.9959, iter_time=9.13s]
Epoch 0: 13%|█▎ | 1572/12384 [3:20:18<22:51:10, 7.61s/it, loss=0.0010, acc=0.9984, iter_time=7.62s]
Epoch 0: 13%|█▎ | 1573/12384 [3:20:18<22:50:48, 7.61s/it, loss=0.0010, acc=0.9984, iter_time=7.62s]
Epoch 0: 13%|█▎ | 1573/12384 [3:20:25<22:50:48, 7.61s/it, loss=0.0006, acc=0.9993, iter_time=4.76s]
Epoch 0: 13%|█▎ | 1574/12384 [3:20:25<22:51:17, 7.61s/it, loss=0.0006, acc=0.9993, iter_time=4.76s]
Epoch 0: 13%|█▎ | 1574/12384 [3:20:33<22:51:17, 7.61s/it, loss=0.0004, acc=0.9997, iter_time=10.46s]
Epoch 0: 13%|█▎ | 1575/12384 [3:20:33<22:53:17, 7.62s/it, loss=0.0004, acc=0.9997, iter_time=10.46s]
Epoch 0: 13%|█▎ | 1575/12384 [3:20:40<22:53:17, 7.62s/it, loss=0.0028, acc=0.9960, iter_time=8.05s]
Epoch 0: 13%|█▎ | 1576/12384 [3:20:40<22:53:01, 7.62s/it, loss=0.0028, acc=0.9960, iter_time=8.05s]
Epoch 0: 13%|█▎ | 1576/12384 [3:20:48<22:53:01, 7.62s/it, loss=0.0036, acc=0.9941, iter_time=7.21s]
Epoch 0: 13%|█▎ | 1577/12384 [3:20:48<22:53:00, 7.62s/it, loss=0.0036, acc=0.9941, iter_time=7.21s]
Epoch 0: 13%|█▎ | 1577/12384 [3:20:56<22:53:00, 7.62s/it, loss=0.0005, acc=0.9979, iter_time=7.62s]
Epoch 0: 13%|█▎ | 1578/12384 [3:20:56<22:51:08, 7.61s/it, loss=0.0005, acc=0.9979, iter_time=7.62s]
Epoch 0: 13%|█▎ | 1578/12384 [3:21:03<22:51:08, 7.61s/it, loss=0.0009, acc=0.9978, iter_time=6.66s]
Epoch 0: 13%|█▎ | 1579/12384 [3:21:03<22:50:12, 7.61s/it, loss=0.0009, acc=0.9978, iter_time=6.66s]
Epoch 0: 13%|█▎ | 1579/12384 [3:21:11<22:50:12, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=8.25s]
Epoch 0: 13%|█▎ | 1580/12384 [3:21:11<22:48:51, 7.60s/it, loss=0.0003, acc=1.0000, iter_time=8.25s]
Epoch 0: 13%|█▎ | 1580/12384 [3:21:18<22:48:51, 7.60s/it, loss=0.0041, acc=0.9935, iter_time=6.17s]
Epoch 0: 13%|█▎ | 1581/12384 [3:21:18<22:48:12, 7.60s/it, loss=0.0041, acc=0.9935, iter_time=6.17s]
Epoch 0: 13%|█▎ | 1581/12384 [3:21:26<22:48:12, 7.60s/it, loss=0.0014, acc=0.9954, iter_time=9.32s]
Epoch 0: 13%|█▎ | 1582/12384 [3:21:26<22:48:55, 7.60s/it, loss=0.0014, acc=0.9954, iter_time=9.32s]
Epoch 0: 13%|█▎ | 1582/12384 [3:21:34<22:48:55, 7.60s/it, loss=0.0007, acc=0.9990, iter_time=7.67s]
Epoch 0: 13%|█▎ | 1583/12384 [3:21:34<22:52:32, 7.62s/it, loss=0.0007, acc=0.9990, iter_time=7.67s]
Epoch 0: 13%|█▎ | 1583/12384 [3:21:41<22:52:32, 7.62s/it, loss=0.0013, acc=0.9966, iter_time=8.00s]
Epoch 0: 13%|█▎ | 1584/12384 [3:21:41<22:52:46, 7.63s/it, loss=0.0013, acc=0.9966, iter_time=8.00s]
Epoch 0: 13%|█▎ | 1584/12384 [3:21:49<22:52:46, 7.63s/it, loss=0.0004, acc=1.0000, iter_time=7.28s]
Epoch 0: 13%|█▎ | 1585/12384 [3:21:49<22:54:06, 7.63s/it, loss=0.0004, acc=1.0000, iter_time=7.28s]
Epoch 0: 13%|█▎ | 1585/12384 [3:21:57<22:54:06, 7.63s/it, loss=0.0015, acc=0.9975, iter_time=5.58s]
Epoch 0: 13%|█▎ | 1586/12384 [3:21:57<23:10:13, 7.72s/it, loss=0.0015, acc=0.9975, iter_time=5.58s]
Epoch 0: 13%|█▎ | 1586/12384 [3:22:05<23:10:13, 7.72s/it, loss=0.0004, acc=0.9998, iter_time=9.95s]
Epoch 0: 13%|█▎ | 1587/12384 [3:22:05<23:03:13, 7.69s/it, loss=0.0004, acc=0.9998, iter_time=9.95s]
Epoch 0: 13%|█▎ | 1587/12384 [3:22:12<23:03:13, 7.69s/it, loss=0.0006, acc=0.9980, iter_time=7.69s]
Epoch 0: 13%|█▎ | 1588/12384 [3:22:12<23:02:48, 7.69s/it, loss=0.0006, acc=0.9980, iter_time=7.69s]
Epoch 0: 13%|█▎ | 1588/12384 [3:22:20<23:02:48, 7.69s/it, loss=0.0006, acc=0.9972, iter_time=6.10s]
Epoch 0: 13%|█▎ | 1589/12384 [3:22:20<22:59:39, 7.67s/it, loss=0.0006, acc=0.9972, iter_time=6.10s]
Epoch 0: 13%|█▎ | 1589/12384 [3:22:27<22:59:39, 7.67s/it, loss=0.0050, acc=0.9887, iter_time=9.12s]
Epoch 0: 13%|█▎ | 1590/12384 [3:22:27<22:54:53, 7.64s/it, loss=0.0050, acc=0.9887, iter_time=9.12s]
Epoch 0: 13%|█▎ | 1590/12384 [3:22:35<22:54:53, 7.64s/it, loss=0.0006, acc=0.9992, iter_time=7.62s]
Epoch 0: 13%|█▎ | 1591/12384 [3:22:35<22:56:59, 7.65s/it, loss=0.0006, acc=0.9992, iter_time=7.62s]
Epoch 0: 13%|█▎ | 1591/12384 [3:22:43<22:56:59, 7.65s/it, loss=0.0018, acc=0.9985, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1592/12384 [3:22:43<22:54:17, 7.64s/it, loss=0.0018, acc=0.9985, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1592/12384 [3:22:50<22:54:17, 7.64s/it, loss=0.0057, acc=0.9908, iter_time=7.64s]
Epoch 0: 13%|█▎ | 1593/12384 [3:22:50<22:51:45, 7.63s/it, loss=0.0057, acc=0.9908, iter_time=7.64s]
Epoch 0: 13%|█▎ | 1593/12384 [3:22:58<22:51:45, 7.63s/it, loss=0.0022, acc=0.9970, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1594/12384 [3:22:58<22:50:05, 7.62s/it, loss=0.0022, acc=0.9970, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1594/12384 [3:23:06<22:50:05, 7.62s/it, loss=0.0006, acc=0.9996, iter_time=5.48s]
Epoch 0: 13%|█▎ | 1595/12384 [3:23:06<22:51:13, 7.63s/it, loss=0.0006, acc=0.9996, iter_time=5.48s]
Epoch 0: 13%|█▎ | 1595/12384 [3:23:13<22:51:13, 7.63s/it, loss=0.0004, acc=1.0000, iter_time=9.75s]
Epoch 0: 13%|█▎ | 1596/12384 [3:23:13<22:49:41, 7.62s/it, loss=0.0004, acc=1.0000, iter_time=9.75s]
Epoch 0: 13%|█▎ | 1596/12384 [3:23:21<22:49:41, 7.62s/it, loss=0.0012, acc=0.9976, iter_time=7.60s]
Epoch 0: 13%|█▎ | 1597/12384 [3:23:21<22:49:11, 7.62s/it, loss=0.0012, acc=0.9976, iter_time=7.60s]
Epoch 0: 13%|█▎ | 1597/12384 [3:23:28<22:49:11, 7.62s/it, loss=0.0026, acc=0.9962, iter_time=5.00s]
Epoch 0: 13%|█▎ | 1598/12384 [3:23:28<22:49:18, 7.62s/it, loss=0.0026, acc=0.9962, iter_time=5.00s]
Epoch 0: 13%|█▎ | 1598/12384 [3:23:36<22:49:18, 7.62s/it, loss=0.0005, acc=0.9994, iter_time=7.67s]
Epoch 0: 13%|█▎ | 1599/12384 [3:23:36<22:49:19, 7.62s/it, loss=0.0005, acc=0.9994, iter_time=7.67s]
Epoch 0: 13%|█▎ | 1599/12384 [3:23:44<22:49:19, 7.62s/it, loss=0.0029, acc=0.9943, iter_time=10.59s]
Epoch 0: 13%|█▎ | 1600/12384 [3:23:44<22:49:31, 7.62s/it, loss=0.0029, acc=0.9943, iter_time=10.59s]
Epoch 0: 13%|█▎ | 1600/12384 [3:23:51<22:49:31, 7.62s/it, loss=0.0007, acc=0.9980, iter_time=7.19s]
Epoch 0: 13%|█▎ | 1601/12384 [3:23:51<22:47:39, 7.61s/it, loss=0.0007, acc=0.9980, iter_time=7.19s]
Epoch 0: 13%|█▎ | 1601/12384 [3:23:59<22:47:39, 7.61s/it, loss=0.0022, acc=0.9979, iter_time=7.60s]
Epoch 0: 13%|█▎ | 1602/12384 [3:23:59<22:47:36, 7.61s/it, loss=0.0022, acc=0.9979, iter_time=7.60s]
Epoch 0: 13%|█▎ | 1602/12384 [3:24:06<22:47:36, 7.61s/it, loss=0.0006, acc=0.9977, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1603/12384 [3:24:06<22:47:10, 7.61s/it, loss=0.0006, acc=0.9977, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1603/12384 [3:24:14<22:47:10, 7.61s/it, loss=0.0017, acc=0.9905, iter_time=4.58s]
Epoch 0: 13%|█▎ | 1604/12384 [3:24:14<22:52:20, 7.64s/it, loss=0.0017, acc=0.9905, iter_time=4.58s]
Epoch 0: 13%|█▎ | 1604/12384 [3:24:22<22:52:20, 7.64s/it, loss=0.0010, acc=0.9991, iter_time=10.73s]
Epoch 0: 13%|█▎ | 1605/12384 [3:24:22<22:52:12, 7.64s/it, loss=0.0010, acc=0.9991, iter_time=10.73s]
Epoch 0: 13%|█▎ | 1605/12384 [3:24:29<22:52:12, 7.64s/it, loss=0.0038, acc=0.9920, iter_time=7.63s]
Epoch 0: 13%|█▎ | 1606/12384 [3:24:29<22:50:20, 7.63s/it, loss=0.0038, acc=0.9920, iter_time=7.63s]
Epoch 0: 13%|█▎ | 1606/12384 [3:24:37<22:50:20, 7.63s/it, loss=0.0023, acc=0.9961, iter_time=7.62s]
Epoch 0: 13%|█▎ | 1607/12384 [3:24:37<22:49:47, 7.63s/it, loss=0.0023, acc=0.9961, iter_time=7.62s]
Epoch 0: 13%|█▎ | 1607/12384 [3:24:45<22:49:47, 7.63s/it, loss=0.0010, acc=0.9969, iter_time=8.01s]
Epoch 0: 13%|█▎ | 1608/12384 [3:24:45<22:49:30, 7.63s/it, loss=0.0010, acc=0.9969, iter_time=8.01s]
Epoch 0: 13%|█▎ | 1608/12384 [3:24:52<22:49:30, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.22s]
Epoch 0: 13%|█▎ | 1609/12384 [3:24:52<22:48:41, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.22s]
Epoch 0: 13%|█▎ | 1609/12384 [3:25:00<22:48:41, 7.62s/it, loss=0.0033, acc=0.9928, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1610/12384 [3:25:00<22:48:37, 7.62s/it, loss=0.0033, acc=0.9928, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1610/12384 [3:25:08<22:48:37, 7.62s/it, loss=0.0008, acc=0.9998, iter_time=4.10s]
Epoch 0: 13%|█▎ | 1611/12384 [3:25:08<22:48:34, 7.62s/it, loss=0.0008, acc=0.9998, iter_time=4.10s]
Epoch 0: 13%|█▎ | 1611/12384 [3:25:15<22:48:34, 7.62s/it, loss=0.0006, acc=0.9997, iter_time=11.15s]
Epoch 0: 13%|█▎ | 1612/12384 [3:25:15<22:46:55, 7.61s/it, loss=0.0006, acc=0.9997, iter_time=11.15s]
Epoch 0: 13%|█▎ | 1612/12384 [3:25:23<22:46:55, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=7.90s]
Epoch 0: 13%|█▎ | 1613/12384 [3:25:23<23:04:43, 7.71s/it, loss=0.0003, acc=1.0000, iter_time=7.90s]
Epoch 0: 13%|█▎ | 1613/12384 [3:25:31<23:04:43, 7.71s/it, loss=0.0050, acc=0.9924, iter_time=7.63s]
Epoch 0: 13%|█▎ | 1614/12384 [3:25:31<22:58:11, 7.68s/it, loss=0.0050, acc=0.9924, iter_time=7.63s]
Epoch 0: 13%|█▎ | 1614/12384 [3:25:38<22:58:11, 7.68s/it, loss=0.0006, acc=0.9986, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1615/12384 [3:25:38<22:54:35, 7.66s/it, loss=0.0006, acc=0.9986, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1615/12384 [3:25:46<22:54:35, 7.66s/it, loss=0.0011, acc=0.9966, iter_time=7.99s]
Epoch 0: 13%|█▎ | 1616/12384 [3:25:46<22:52:38, 7.65s/it, loss=0.0011, acc=0.9966, iter_time=7.99s]
Epoch 0: 13%|█▎ | 1616/12384 [3:25:54<22:52:38, 7.65s/it, loss=0.0032, acc=0.9960, iter_time=7.22s]
Epoch 0: 13%|█▎ | 1617/12384 [3:25:54<22:50:05, 7.63s/it, loss=0.0032, acc=0.9960, iter_time=7.22s]
Epoch 0: 13%|█▎ | 1617/12384 [3:26:01<22:50:05, 7.63s/it, loss=0.0006, acc=0.9975, iter_time=7.64s]
Epoch 0: 13%|█▎ | 1618/12384 [3:26:01<22:50:42, 7.64s/it, loss=0.0006, acc=0.9975, iter_time=7.64s]
Epoch 0: 13%|█▎ | 1618/12384 [3:26:09<22:50:42, 7.64s/it, loss=0.0004, acc=1.0000, iter_time=4.78s]
Epoch 0: 13%|█▎ | 1619/12384 [3:26:09<22:48:20, 7.63s/it, loss=0.0004, acc=1.0000, iter_time=4.78s]
Epoch 0: 13%|█▎ | 1619/12384 [3:26:16<22:48:20, 7.63s/it, loss=0.0040, acc=0.9900, iter_time=10.15s]
Epoch 0: 13%|█▎ | 1620/12384 [3:26:16<22:47:06, 7.62s/it, loss=0.0040, acc=0.9900, iter_time=10.15s]
Epoch 0: 13%|█▎ | 1620/12384 [3:26:24<22:47:06, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.39s]
Epoch 0: 13%|█▎ | 1621/12384 [3:26:24<22:47:27, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.39s]
Epoch 0: 13%|█▎ | 1621/12384 [3:26:32<22:47:27, 7.62s/it, loss=0.0013, acc=0.9965, iter_time=7.12s]
Epoch 0: 13%|█▎ | 1622/12384 [3:26:32<22:47:04, 7.62s/it, loss=0.0013, acc=0.9965, iter_time=7.12s]
Epoch 0: 13%|█▎ | 1622/12384 [3:26:39<22:47:04, 7.62s/it, loss=0.0040, acc=0.9894, iter_time=8.58s]
Epoch 0: 13%|█▎ | 1623/12384 [3:26:39<22:46:19, 7.62s/it, loss=0.0040, acc=0.9894, iter_time=8.58s]
Epoch 0: 13%|█▎ | 1623/12384 [3:26:47<22:46:19, 7.62s/it, loss=0.0009, acc=0.9986, iter_time=10.63s]
Epoch 0: 13%|█▎ | 1624/12384 [3:26:47<22:46:01, 7.62s/it, loss=0.0009, acc=0.9986, iter_time=10.63s]
Epoch 0: 13%|█▎ | 1624/12384 [3:26:54<22:46:01, 7.62s/it, loss=0.0005, acc=0.9989, iter_time=5.29s]
Epoch 0: 13%|█▎ | 1625/12384 [3:26:54<22:44:09, 7.61s/it, loss=0.0005, acc=0.9989, iter_time=5.29s]
Epoch 0: 13%|█▎ | 1625/12384 [3:27:02<22:44:09, 7.61s/it, loss=0.0005, acc=0.9993, iter_time=9.94s]
Epoch 0: 13%|█▎ | 1626/12384 [3:27:02<22:43:59, 7.61s/it, loss=0.0005, acc=0.9993, iter_time=9.94s]
Epoch 0: 13%|█▎ | 1626/12384 [3:27:10<22:43:59, 7.61s/it, loss=0.0032, acc=0.9947, iter_time=6.50s]
Epoch 0: 13%|█▎ | 1627/12384 [3:27:10<22:43:41, 7.61s/it, loss=0.0032, acc=0.9947, iter_time=6.50s]
Epoch 0: 13%|█▎ | 1627/12384 [3:27:17<22:43:41, 7.61s/it, loss=0.0012, acc=0.9979, iter_time=8.74s]
Epoch 0: 13%|█▎ | 1628/12384 [3:27:17<22:43:10, 7.60s/it, loss=0.0012, acc=0.9979, iter_time=8.74s]
Epoch 0: 13%|█▎ | 1628/12384 [3:27:25<22:43:10, 7.60s/it, loss=0.0011, acc=0.9976, iter_time=7.59s]
Epoch 0: 13%|█▎ | 1629/12384 [3:27:25<22:42:12, 7.60s/it, loss=0.0011, acc=0.9976, iter_time=7.59s]
Epoch 0: 13%|█▎ | 1629/12384 [3:27:32<22:42:12, 7.60s/it, loss=0.0002, acc=0.9999, iter_time=7.60s]
Epoch 0: 13%|█▎ | 1630/12384 [3:27:32<22:42:11, 7.60s/it, loss=0.0002, acc=0.9999, iter_time=7.60s]
Epoch 0: 13%|█▎ | 1630/12384 [3:27:40<22:42:11, 7.60s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 13%|█▎ | 1631/12384 [3:27:40<22:42:39, 7.60s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 13%|█▎ | 1631/12384 [3:27:48<22:42:39, 7.60s/it, loss=0.0059, acc=0.9873, iter_time=7.58s]
Epoch 0: 13%|█▎ | 1632/12384 [3:27:48<22:43:33, 7.61s/it, loss=0.0059, acc=0.9873, iter_time=7.58s]
Epoch 0: 13%|█▎ | 1632/12384 [3:27:55<22:43:33, 7.61s/it, loss=0.0006, acc=0.9977, iter_time=5.04s]
Epoch 0: 13%|█▎ | 1633/12384 [3:27:55<22:43:54, 7.61s/it, loss=0.0006, acc=0.9977, iter_time=5.04s]
Epoch 0: 13%|█▎ | 1633/12384 [3:28:03<22:43:54, 7.61s/it, loss=0.0003, acc=0.9996, iter_time=10.21s]
Epoch 0: 13%|█▎ | 1634/12384 [3:28:03<22:43:34, 7.61s/it, loss=0.0003, acc=0.9996, iter_time=10.21s]
Epoch 0: 13%|█▎ | 1634/12384 [3:28:10<22:43:34, 7.61s/it, loss=0.0006, acc=0.9991, iter_time=7.62s]
Epoch 0: 13%|█▎ | 1635/12384 [3:28:10<22:43:29, 7.61s/it, loss=0.0006, acc=0.9991, iter_time=7.62s]
Epoch 0: 13%|█▎ | 1635/12384 [3:28:18<22:43:29, 7.61s/it, loss=0.0010, acc=0.9962, iter_time=5.53s]
Epoch 0: 13%|█▎ | 1636/12384 [3:28:18<22:43:19, 7.61s/it, loss=0.0010, acc=0.9962, iter_time=5.53s]
Epoch 0: 13%|█▎ | 1636/12384 [3:28:26<22:43:19, 7.61s/it, loss=0.0029, acc=0.9880, iter_time=9.69s]
Epoch 0: 13%|█▎ | 1637/12384 [3:28:26<22:42:30, 7.61s/it, loss=0.0029, acc=0.9880, iter_time=9.69s]
Epoch 0: 13%|█▎ | 1637/12384 [3:28:33<22:42:30, 7.61s/it, loss=0.0014, acc=0.9971, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1638/12384 [3:28:33<22:42:41, 7.61s/it, loss=0.0014, acc=0.9971, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1638/12384 [3:28:41<22:42:41, 7.61s/it, loss=0.0009, acc=0.9967, iter_time=7.92s]
Epoch 0: 13%|█▎ | 1639/12384 [3:28:41<23:00:27, 7.71s/it, loss=0.0009, acc=0.9967, iter_time=7.92s]
Epoch 0: 13%|█▎ | 1639/12384 [3:28:49<23:00:27, 7.71s/it, loss=0.0004, acc=0.9998, iter_time=8.02s]
Epoch 0: 13%|█▎ | 1640/12384 [3:28:49<22:55:51, 7.68s/it, loss=0.0004, acc=0.9998, iter_time=8.02s]
Epoch 0: 13%|█▎ | 1640/12384 [3:28:56<22:55:51, 7.68s/it, loss=0.0013, acc=0.9970, iter_time=6.27s]
Epoch 0: 13%|█▎ | 1641/12384 [3:28:56<22:49:45, 7.65s/it, loss=0.0013, acc=0.9970, iter_time=6.27s]
Epoch 0: 13%|█▎ | 1641/12384 [3:29:04<22:49:45, 7.65s/it, loss=0.0004, acc=0.9979, iter_time=6.72s]
Epoch 0: 13%|█▎ | 1642/12384 [3:29:04<22:46:46, 7.63s/it, loss=0.0004, acc=0.9979, iter_time=6.72s]
Epoch 0: 13%|█▎ | 1642/12384 [3:29:12<22:46:46, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.33s]
Epoch 0: 13%|█▎ | 1643/12384 [3:29:12<22:45:36, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.33s]
Epoch 0: 13%|█▎ | 1643/12384 [3:29:19<22:45:36, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=5.86s]
Epoch 0: 13%|█▎ | 1644/12384 [3:29:19<22:45:40, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=5.86s]
Epoch 0: 13%|█▎ | 1644/12384 [3:29:27<22:45:40, 7.63s/it, loss=0.0009, acc=0.9970, iter_time=9.21s]
Epoch 0: 13%|█▎ | 1645/12384 [3:29:27<22:45:00, 7.63s/it, loss=0.0009, acc=0.9970, iter_time=9.21s]
Epoch 0: 13%|█▎ | 1645/12384 [3:29:35<22:45:00, 7.63s/it, loss=0.0016, acc=0.9929, iter_time=6.82s]
Epoch 0: 13%|█▎ | 1646/12384 [3:29:35<22:44:33, 7.62s/it, loss=0.0016, acc=0.9929, iter_time=6.82s]
Epoch 0: 13%|█▎ | 1646/12384 [3:29:42<22:44:33, 7.62s/it, loss=0.0028, acc=0.9922, iter_time=9.75s]
Epoch 0: 13%|█▎ | 1647/12384 [3:29:42<22:43:03, 7.62s/it, loss=0.0028, acc=0.9922, iter_time=9.75s]
Epoch 0: 13%|█▎ | 1647/12384 [3:29:50<22:43:03, 7.62s/it, loss=0.0044, acc=0.9931, iter_time=8.49s]
Epoch 0: 13%|█▎ | 1648/12384 [3:29:50<22:42:02, 7.61s/it, loss=0.0044, acc=0.9931, iter_time=8.49s]
Epoch 0: 13%|█▎ | 1648/12384 [3:29:57<22:42:02, 7.61s/it, loss=0.0086, acc=0.9780, iter_time=4.62s]
Epoch 0: 13%|█▎ | 1649/12384 [3:29:57<22:43:45, 7.62s/it, loss=0.0086, acc=0.9780, iter_time=4.62s]
Epoch 0: 13%|█▎ | 1649/12384 [3:30:05<22:43:45, 7.62s/it, loss=0.0005, acc=0.9961, iter_time=11.10s]
Epoch 0: 13%|█▎ | 1650/12384 [3:30:05<22:43:38, 7.62s/it, loss=0.0005, acc=0.9961, iter_time=11.10s]
Epoch 0: 13%|█▎ | 1650/12384 [3:30:13<22:43:38, 7.62s/it, loss=0.0027, acc=0.9919, iter_time=7.20s]
Epoch 0: 13%|█▎ | 1651/12384 [3:30:13<22:42:53, 7.62s/it, loss=0.0027, acc=0.9919, iter_time=7.20s]
Epoch 0: 13%|█▎ | 1651/12384 [3:30:20<22:42:53, 7.62s/it, loss=0.0034, acc=0.9895, iter_time=7.62s]
Epoch 0: 13%|█▎ | 1652/12384 [3:30:20<22:46:27, 7.64s/it, loss=0.0034, acc=0.9895, iter_time=7.62s]
Epoch 0: 13%|█▎ | 1652/12384 [3:30:28<22:46:27, 7.64s/it, loss=0.0012, acc=0.9998, iter_time=5.11s]
Epoch 0: 13%|█▎ | 1653/12384 [3:30:28<22:43:09, 7.62s/it, loss=0.0012, acc=0.9998, iter_time=5.11s]
Epoch 0: 13%|█▎ | 1653/12384 [3:30:35<22:43:09, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=8.11s]
Epoch 0: 13%|█▎ | 1654/12384 [3:30:35<22:41:57, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=8.11s]
Epoch 0: 13%|█▎ | 1654/12384 [3:30:43<22:41:57, 7.62s/it, loss=0.0006, acc=0.9980, iter_time=8.71s]
Epoch 0: 13%|█▎ | 1655/12384 [3:30:43<22:43:04, 7.62s/it, loss=0.0006, acc=0.9980, iter_time=8.71s]
Epoch 0: 13%|█▎ | 1655/12384 [3:30:51<22:43:04, 7.62s/it, loss=0.0014, acc=0.9987, iter_time=8.96s]
Epoch 0: 13%|█▎ | 1656/12384 [3:30:51<22:41:56, 7.62s/it, loss=0.0014, acc=0.9987, iter_time=8.96s]
Epoch 0: 13%|█▎ | 1656/12384 [3:30:58<22:41:56, 7.62s/it, loss=0.0010, acc=0.9989, iter_time=7.22s]
Epoch 0: 13%|█▎ | 1657/12384 [3:30:58<22:41:12, 7.61s/it, loss=0.0010, acc=0.9989, iter_time=7.22s]
Epoch 0: 13%|█▎ | 1657/12384 [3:31:06<22:41:12, 7.61s/it, loss=0.0027, acc=0.9958, iter_time=4.31s]
Epoch 0: 13%|█▎ | 1658/12384 [3:31:06<22:41:23, 7.62s/it, loss=0.0027, acc=0.9958, iter_time=4.31s]
Epoch 0: 13%|█▎ | 1658/12384 [3:31:14<22:41:23, 7.62s/it, loss=0.0015, acc=0.9970, iter_time=9.68s]
Epoch 0: 13%|█▎ | 1659/12384 [3:31:14<22:41:30, 7.62s/it, loss=0.0015, acc=0.9970, iter_time=9.68s]
Epoch 0: 13%|█▎ | 1659/12384 [3:31:21<22:41:30, 7.62s/it, loss=0.0011, acc=0.9990, iter_time=8.90s]
Epoch 0: 13%|█▎ | 1660/12384 [3:31:21<22:43:10, 7.63s/it, loss=0.0011, acc=0.9990, iter_time=8.90s]
Epoch 0: 13%|█▎ | 1660/12384 [3:31:29<22:43:10, 7.63s/it, loss=0.0003, acc=0.9995, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1661/12384 [3:31:29<22:43:36, 7.63s/it, loss=0.0003, acc=0.9995, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1661/12384 [3:31:36<22:43:36, 7.63s/it, loss=0.0022, acc=0.9972, iter_time=7.62s]
Epoch 0: 13%|█▎ | 1662/12384 [3:31:36<22:42:37, 7.63s/it, loss=0.0022, acc=0.9972, iter_time=7.62s]
Epoch 0: 13%|█▎ | 1662/12384 [3:31:44<22:42:37, 7.63s/it, loss=0.0004, acc=0.9986, iter_time=7.63s]
Epoch 0: 13%|█▎ | 1663/12384 [3:31:44<22:41:08, 7.62s/it, loss=0.0004, acc=0.9986, iter_time=7.63s]
Epoch 0: 13%|█▎ | 1663/12384 [3:31:52<22:41:08, 7.62s/it, loss=0.0031, acc=0.9895, iter_time=7.99s]
Epoch 0: 13%|█▎ | 1664/12384 [3:31:52<22:41:13, 7.62s/it, loss=0.0031, acc=0.9895, iter_time=7.99s]
Epoch 0: 13%|█▎ | 1664/12384 [3:32:00<22:41:13, 7.62s/it, loss=0.0007, acc=0.9980, iter_time=6.31s]
Epoch 0: 13%|█▎ | 1665/12384 [3:32:00<22:59:03, 7.72s/it, loss=0.0007, acc=0.9980, iter_time=6.31s]
Epoch 0: 13%|█▎ | 1665/12384 [3:32:07<22:59:03, 7.72s/it, loss=0.0079, acc=0.9933, iter_time=8.87s]
Epoch 0: 13%|█▎ | 1666/12384 [3:32:07<22:53:51, 7.69s/it, loss=0.0079, acc=0.9933, iter_time=8.87s]
Epoch 0: 13%|█▎ | 1666/12384 [3:32:15<22:53:51, 7.69s/it, loss=0.0013, acc=0.9973, iter_time=7.64s]
Epoch 0: 13%|█▎ | 1667/12384 [3:32:15<22:49:52, 7.67s/it, loss=0.0013, acc=0.9973, iter_time=7.64s]
Epoch 0: 13%|█▎ | 1667/12384 [3:32:22<22:49:52, 7.67s/it, loss=0.0013, acc=0.9971, iter_time=7.62s]
Epoch 0: 13%|█▎ | 1668/12384 [3:32:22<22:45:52, 7.65s/it, loss=0.0013, acc=0.9971, iter_time=7.62s]
Epoch 0: 13%|█▎ | 1668/12384 [3:32:30<22:45:52, 7.65s/it, loss=0.0026, acc=0.9915, iter_time=7.60s]
Epoch 0: 13%|█▎ | 1669/12384 [3:32:30<22:44:22, 7.64s/it, loss=0.0026, acc=0.9915, iter_time=7.60s]
Epoch 0: 13%|█▎ | 1669/12384 [3:32:38<22:44:22, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=7.63s]
Epoch 0: 13%|█▎ | 1670/12384 [3:32:38<22:42:28, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.63s]
Epoch 0: 13%|█▎ | 1670/12384 [3:32:45<22:42:28, 7.63s/it, loss=0.0015, acc=0.9982, iter_time=5.26s]
Epoch 0: 13%|█▎ | 1671/12384 [3:32:45<22:42:47, 7.63s/it, loss=0.0015, acc=0.9982, iter_time=5.26s]
Epoch 0: 13%|█▎ | 1671/12384 [3:32:53<22:42:47, 7.63s/it, loss=0.0023, acc=0.9957, iter_time=10.36s]
Epoch 0: 14%|█▎ | 1672/12384 [3:32:53<22:41:58, 7.63s/it, loss=0.0023, acc=0.9957, iter_time=10.36s]
Epoch 0: 14%|█▎ | 1672/12384 [3:33:01<22:41:58, 7.63s/it, loss=0.0003, acc=0.9998, iter_time=7.23s]
Epoch 0: 14%|█▎ | 1673/12384 [3:33:01<22:40:36, 7.62s/it, loss=0.0003, acc=0.9998, iter_time=7.23s]
Epoch 0: 14%|█▎ | 1673/12384 [3:33:08<22:40:36, 7.62s/it, loss=0.0027, acc=0.9923, iter_time=7.59s]
Epoch 0: 14%|█▎ | 1674/12384 [3:33:08<22:38:46, 7.61s/it, loss=0.0027, acc=0.9923, iter_time=7.59s]
Epoch 0: 14%|█▎ | 1674/12384 [3:33:16<22:38:46, 7.61s/it, loss=0.0017, acc=0.9952, iter_time=3.86s]
Epoch 0: 14%|█▎ | 1675/12384 [3:33:16<22:39:17, 7.62s/it, loss=0.0017, acc=0.9952, iter_time=3.86s]
Epoch 0: 14%|█▎ | 1675/12384 [3:33:23<22:39:17, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=8.06s]
Epoch 0: 14%|█▎ | 1676/12384 [3:33:23<22:39:08, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=8.06s]
Epoch 0: 14%|█▎ | 1676/12384 [3:33:31<22:39:08, 7.62s/it, loss=0.0006, acc=0.9981, iter_time=9.70s]
Epoch 0: 14%|█▎ | 1677/12384 [3:33:31<22:38:45, 7.61s/it, loss=0.0006, acc=0.9981, iter_time=9.70s]
Epoch 0: 14%|█▎ | 1677/12384 [3:33:39<22:38:45, 7.61s/it, loss=0.0134, acc=0.9840, iter_time=8.84s]
Epoch 0: 14%|█▎ | 1678/12384 [3:33:39<22:38:07, 7.61s/it, loss=0.0134, acc=0.9840, iter_time=8.84s]
Epoch 0: 14%|█▎ | 1678/12384 [3:33:46<22:38:07, 7.61s/it, loss=0.0004, acc=0.9999, iter_time=7.62s]
Epoch 0: 14%|█▎ | 1679/12384 [3:33:46<22:38:55, 7.62s/it, loss=0.0004, acc=0.9999, iter_time=7.62s]
Epoch 0: 14%|█▎ | 1679/12384 [3:33:54<22:38:55, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=8.01s]
Epoch 0: 14%|█▎ | 1680/12384 [3:33:54<22:39:09, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=8.01s]
Epoch 0: 14%|█▎ | 1680/12384 [3:34:01<22:39:09, 7.62s/it, loss=0.0015, acc=0.9980, iter_time=6.09s]
Epoch 0: 14%|█▎ | 1681/12384 [3:34:01<22:38:13, 7.61s/it, loss=0.0015, acc=0.9980, iter_time=6.09s]
Epoch 0: 14%|█▎ | 1681/12384 [3:34:09<22:38:13, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=8.75s]
Epoch 0: 14%|█▎ | 1682/12384 [3:34:09<22:39:44, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=8.75s]
Epoch 0: 14%|█▎ | 1682/12384 [3:34:17<22:39:44, 7.62s/it, loss=0.0004, acc=0.9987, iter_time=7.64s]
Epoch 0: 14%|█▎ | 1683/12384 [3:34:17<22:38:42, 7.62s/it, loss=0.0004, acc=0.9987, iter_time=7.64s]
Epoch 0: 14%|█▎ | 1683/12384 [3:34:24<22:38:42, 7.62s/it, loss=0.0031, acc=0.9975, iter_time=7.60s]
Epoch 0: 14%|█▎ | 1684/12384 [3:34:24<22:38:49, 7.62s/it, loss=0.0031, acc=0.9975, iter_time=7.60s]
Epoch 0: 14%|█▎ | 1684/12384 [3:34:32<22:38:49, 7.62s/it, loss=0.0009, acc=0.9973, iter_time=6.44s]
Epoch 0: 14%|█▎ | 1685/12384 [3:34:32<22:38:07, 7.62s/it, loss=0.0009, acc=0.9973, iter_time=6.44s]
Epoch 0: 14%|█▎ | 1685/12384 [3:34:40<22:38:07, 7.62s/it, loss=0.0004, acc=1.0000, iter_time=8.79s]
Epoch 0: 14%|█▎ | 1686/12384 [3:34:40<22:38:33, 7.62s/it, loss=0.0004, acc=1.0000, iter_time=8.79s]
Epoch 0: 14%|█▎ | 1686/12384 [3:34:47<22:38:33, 7.62s/it, loss=0.0015, acc=0.9972, iter_time=7.09s]
Epoch 0: 14%|█▎ | 1687/12384 [3:34:47<22:38:37, 7.62s/it, loss=0.0015, acc=0.9972, iter_time=7.09s]
Epoch 0: 14%|█▎ | 1687/12384 [3:34:55<22:38:37, 7.62s/it, loss=0.0020, acc=0.9973, iter_time=8.55s]
Epoch 0: 14%|█▎ | 1688/12384 [3:34:55<22:36:36, 7.61s/it, loss=0.0020, acc=0.9973, iter_time=8.55s]
Epoch 0: 14%|█▎ | 1688/12384 [3:35:02<22:36:36, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.20s]
Epoch 0: 14%|█▎ | 1689/12384 [3:35:02<22:36:32, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.20s]
Epoch 0: 14%|█▎ | 1689/12384 [3:35:10<22:36:32, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.63s]
Epoch 0: 14%|█▎ | 1690/12384 [3:35:10<22:38:03, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.63s]
Epoch 0: 14%|█▎ | 1690/12384 [3:35:18<22:38:03, 7.62s/it, loss=0.0016, acc=0.9976, iter_time=7.94s]
Epoch 0: 14%|█▎ | 1691/12384 [3:35:18<22:56:01, 7.72s/it, loss=0.0016, acc=0.9976, iter_time=7.94s]
Epoch 0: 14%|█▎ | 1691/12384 [3:35:26<22:56:01, 7.72s/it, loss=0.0008, acc=0.9981, iter_time=7.68s]
Epoch 0: 14%|█▎ | 1692/12384 [3:35:26<22:50:23, 7.69s/it, loss=0.0008, acc=0.9981, iter_time=7.68s]
Epoch 0: 14%|█▎ | 1692/12384 [3:35:33<22:50:23, 7.69s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 14%|█▎ | 1693/12384 [3:35:33<22:46:54, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 14%|█▎ | 1693/12384 [3:35:41<22:46:54, 7.67s/it, loss=0.0006, acc=0.9978, iter_time=7.62s]
Epoch 0: 14%|█▎ | 1694/12384 [3:35:41<22:43:56, 7.66s/it, loss=0.0006, acc=0.9978, iter_time=7.62s]
Epoch 0: 14%|█▎ | 1694/12384 [3:35:48<22:43:56, 7.66s/it, loss=0.0032, acc=0.9913, iter_time=6.12s]
Epoch 0: 14%|█▎ | 1695/12384 [3:35:48<22:42:03, 7.65s/it, loss=0.0032, acc=0.9913, iter_time=6.12s]
Epoch 0: 14%|█▎ | 1695/12384 [3:35:56<22:42:03, 7.65s/it, loss=0.0004, acc=1.0000, iter_time=9.50s]
Epoch 0: 14%|█▎ | 1696/12384 [3:35:56<22:40:26, 7.64s/it, loss=0.0004, acc=1.0000, iter_time=9.50s]
Epoch 0: 14%|█▎ | 1696/12384 [3:36:04<22:40:26, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.32s]
Epoch 0: 14%|█▎ | 1697/12384 [3:36:04<22:44:10, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=6.32s]
Epoch 0: 14%|█▎ | 1697/12384 [3:36:11<22:44:10, 7.66s/it, loss=0.0023, acc=0.9965, iter_time=8.32s]
Epoch 0: 14%|█▎ | 1698/12384 [3:36:11<22:40:21, 7.64s/it, loss=0.0023, acc=0.9965, iter_time=8.32s]
Epoch 0: 14%|█▎ | 1698/12384 [3:36:19<22:40:21, 7.64s/it, loss=0.0006, acc=0.9975, iter_time=7.90s]
Epoch 0: 14%|█▎ | 1699/12384 [3:36:19<22:37:49, 7.62s/it, loss=0.0006, acc=0.9975, iter_time=7.90s]
Epoch 0: 14%|█▎ | 1699/12384 [3:36:27<22:37:49, 7.62s/it, loss=0.0003, acc=0.9982, iter_time=8.02s]
Epoch 0: 14%|█▎ | 1700/12384 [3:36:27<22:37:51, 7.63s/it, loss=0.0003, acc=0.9982, iter_time=8.02s]
Epoch 0: 14%|█▎ | 1700/12384 [3:36:34<22:37:51, 7.63s/it, loss=0.0024, acc=0.9945, iter_time=7.20s]
Epoch 0: 14%|█▎ | 1701/12384 [3:36:34<22:37:41, 7.63s/it, loss=0.0024, acc=0.9945, iter_time=7.20s]
Epoch 0: 14%|█▎ | 1701/12384 [3:36:42<22:37:41, 7.63s/it, loss=0.0011, acc=0.9968, iter_time=7.64s]
Epoch 0: 14%|█▎ | 1702/12384 [3:36:42<22:37:10, 7.62s/it, loss=0.0011, acc=0.9968, iter_time=7.64s]
Epoch 0: 14%|█▎ | 1702/12384 [3:36:49<22:37:10, 7.62s/it, loss=0.0011, acc=0.9969, iter_time=7.61s]
Epoch 0: 14%|█▍ | 1703/12384 [3:36:49<22:35:33, 7.61s/it, loss=0.0011, acc=0.9969, iter_time=7.61s]
Epoch 0: 14%|█▍ | 1703/12384 [3:36:57<22:35:33, 7.61s/it, loss=0.0017, acc=0.9983, iter_time=7.54s]
Epoch 0: 14%|█▍ | 1704/12384 [3:36:57<22:34:49, 7.61s/it, loss=0.0017, acc=0.9983, iter_time=7.54s]
Epoch 0: 14%|█▍ | 1704/12384 [3:37:05<22:34:49, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=7.10s]
Epoch 0: 14%|█▍ | 1705/12384 [3:37:05<22:34:33, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=7.10s]
Epoch 0: 14%|█▍ | 1705/12384 [3:37:12<22:34:33, 7.61s/it, loss=0.0007, acc=0.9985, iter_time=8.16s]
Epoch 0: 14%|█▍ | 1706/12384 [3:37:12<22:33:30, 7.61s/it, loss=0.0007, acc=0.9985, iter_time=8.16s]
Epoch 0: 14%|█▍ | 1706/12384 [3:37:20<22:33:30, 7.61s/it, loss=0.0012, acc=0.9963, iter_time=7.60s]
Epoch 0: 14%|█▍ | 1707/12384 [3:37:20<22:33:34, 7.61s/it, loss=0.0012, acc=0.9963, iter_time=7.60s]
Epoch 0: 14%|█▍ | 1707/12384 [3:37:27<22:33:34, 7.61s/it, loss=0.0027, acc=0.9970, iter_time=6.10s]
Epoch 0: 14%|█▍ | 1708/12384 [3:37:27<22:32:51, 7.60s/it, loss=0.0027, acc=0.9970, iter_time=6.10s]
Epoch 0: 14%|█▍ | 1708/12384 [3:37:35<22:32:51, 7.60s/it, loss=0.0005, acc=0.9982, iter_time=7.55s]
Epoch 0: 14%|█▍ | 1709/12384 [3:37:35<22:32:33, 7.60s/it, loss=0.0005, acc=0.9982, iter_time=7.55s]
Epoch 0: 14%|█▍ | 1709/12384 [3:37:43<22:32:33, 7.60s/it, loss=0.0014, acc=0.9979, iter_time=7.69s]
Epoch 0: 14%|█▍ | 1710/12384 [3:37:43<22:35:51, 7.62s/it, loss=0.0014, acc=0.9979, iter_time=7.69s]
Epoch 0: 14%|█▍ | 1710/12384 [3:37:50<22:35:51, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=7.33s]
Epoch 0: 14%|█▍ | 1711/12384 [3:37:50<22:33:47, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=7.33s]
Epoch 0: 14%|█▍ | 1711/12384 [3:37:58<22:33:47, 7.61s/it, loss=0.0042, acc=0.9931, iter_time=9.77s]
Epoch 0: 14%|█▍ | 1712/12384 [3:37:58<22:37:16, 7.63s/it, loss=0.0042, acc=0.9931, iter_time=9.77s]
Epoch 0: 14%|█▍ | 1712/12384 [3:38:06<22:37:16, 7.63s/it, loss=0.0008, acc=0.9988, iter_time=7.29s]
Epoch 0: 14%|█▍ | 1713/12384 [3:38:06<22:35:45, 7.62s/it, loss=0.0008, acc=0.9988, iter_time=7.29s]
Epoch 0: 14%|█▍ | 1713/12384 [3:38:13<22:35:45, 7.62s/it, loss=0.0005, acc=0.9997, iter_time=5.27s]
Epoch 0: 14%|█▍ | 1714/12384 [3:38:13<22:35:23, 7.62s/it, loss=0.0005, acc=0.9997, iter_time=5.27s]
Epoch 0: 14%|█▍ | 1714/12384 [3:38:21<22:35:23, 7.62s/it, loss=0.0006, acc=0.9984, iter_time=9.96s]
Epoch 0: 14%|█▍ | 1715/12384 [3:38:21<22:35:08, 7.62s/it, loss=0.0006, acc=0.9984, iter_time=9.96s]
Epoch 0: 14%|█▍ | 1715/12384 [3:38:28<22:35:08, 7.62s/it, loss=0.0005, acc=0.9988, iter_time=6.18s]
Epoch 0: 14%|█▍ | 1716/12384 [3:38:28<22:35:04, 7.62s/it, loss=0.0005, acc=0.9988, iter_time=6.18s]
Epoch 0: 14%|█▍ | 1716/12384 [3:38:36<22:35:04, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=9.34s]
Epoch 0: 14%|█▍ | 1717/12384 [3:38:36<22:52:06, 7.72s/it, loss=0.0003, acc=1.0000, iter_time=9.34s]
Epoch 0: 14%|█▍ | 1717/12384 [3:38:44<22:52:06, 7.72s/it, loss=0.0010, acc=0.9999, iter_time=7.66s]
Epoch 0: 14%|█▍ | 1718/12384 [3:38:44<22:45:28, 7.68s/it, loss=0.0010, acc=0.9999, iter_time=7.66s]
Epoch 0: 14%|█▍ | 1718/12384 [3:38:52<22:45:28, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=4.29s]
Epoch 0: 14%|█▍ | 1719/12384 [3:38:52<22:39:50, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=4.29s]
Epoch 0: 14%|█▍ | 1719/12384 [3:38:59<22:39:50, 7.65s/it, loss=0.0012, acc=0.9983, iter_time=11.28s]
Epoch 0: 14%|█▍ | 1720/12384 [3:38:59<22:38:16, 7.64s/it, loss=0.0012, acc=0.9983, iter_time=11.28s]
Epoch 0: 14%|█▍ | 1720/12384 [3:39:07<22:38:16, 7.64s/it, loss=0.0039, acc=0.9931, iter_time=3.72s]
Epoch 0: 14%|█▍ | 1721/12384 [3:39:07<22:36:17, 7.63s/it, loss=0.0039, acc=0.9931, iter_time=3.72s]
Epoch 0: 14%|█▍ | 1721/12384 [3:39:14<22:36:17, 7.63s/it, loss=0.0003, acc=0.9998, iter_time=9.93s]
Epoch 0: 14%|█▍ | 1722/12384 [3:39:14<22:35:02, 7.63s/it, loss=0.0003, acc=0.9998, iter_time=9.93s]
Epoch 0: 14%|█▍ | 1722/12384 [3:39:22<22:35:02, 7.63s/it, loss=0.0129, acc=0.9713, iter_time=8.80s]
Epoch 0: 14%|█▍ | 1723/12384 [3:39:22<22:34:34, 7.62s/it, loss=0.0129, acc=0.9713, iter_time=8.80s]
Epoch 0: 14%|█▍ | 1723/12384 [3:39:30<22:34:34, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=7.07s]
Epoch 0: 14%|█▍ | 1724/12384 [3:39:30<22:34:18, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=7.07s]
Epoch 0: 14%|█▍ | 1724/12384 [3:39:37<22:34:18, 7.62s/it, loss=0.0009, acc=1.0000, iter_time=8.18s]
Epoch 0: 14%|█▍ | 1725/12384 [3:39:37<22:32:55, 7.62s/it, loss=0.0009, acc=1.0000, iter_time=8.18s]
Epoch 0: 14%|█▍ | 1725/12384 [3:39:45<22:32:55, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=5.29s]
Epoch 0: 14%|█▍ | 1726/12384 [3:39:45<22:33:01, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=5.29s]
Epoch 0: 14%|█▍ | 1726/12384 [3:39:53<22:33:01, 7.62s/it, loss=0.0013, acc=0.9972, iter_time=9.92s]
Epoch 0: 14%|█▍ | 1727/12384 [3:39:53<22:32:53, 7.62s/it, loss=0.0013, acc=0.9972, iter_time=9.92s]
Epoch 0: 14%|█▍ | 1727/12384 [3:40:00<22:32:53, 7.62s/it, loss=0.0023, acc=0.9962, iter_time=7.60s]
Epoch 0: 14%|█▍ | 1728/12384 [3:40:00<22:33:36, 7.62s/it, loss=0.0023, acc=0.9962, iter_time=7.60s]
Epoch 0: 14%|█▍ | 1728/12384 [3:40:08<22:33:36, 7.62s/it, loss=0.0009, acc=0.9978, iter_time=5.57s]
Epoch 0: 14%|█▍ | 1729/12384 [3:40:08<22:34:28, 7.63s/it, loss=0.0009, acc=0.9978, iter_time=5.57s]
Epoch 0: 14%|█▍ | 1729/12384 [3:40:15<22:34:28, 7.63s/it, loss=0.0006, acc=0.9984, iter_time=9.71s]
Epoch 0: 14%|█▍ | 1730/12384 [3:40:15<22:31:30, 7.61s/it, loss=0.0006, acc=0.9984, iter_time=9.71s]
Epoch 0: 14%|█▍ | 1730/12384 [3:40:23<22:31:30, 7.61s/it, loss=0.0007, acc=0.9983, iter_time=7.58s]
Epoch 0: 14%|█▍ | 1731/12384 [3:40:23<22:29:51, 7.60s/it, loss=0.0007, acc=0.9983, iter_time=7.58s]
Epoch 0: 14%|█▍ | 1731/12384 [3:40:31<22:29:51, 7.60s/it, loss=0.0012, acc=0.9969, iter_time=7.59s]
Epoch 0: 14%|█▍ | 1732/12384 [3:40:31<22:29:21, 7.60s/it, loss=0.0012, acc=0.9969, iter_time=7.59s]
Epoch 0: 14%|█▍ | 1732/12384 [3:40:38<22:29:21, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=6.98s]
Epoch 0: 14%|█▍ | 1733/12384 [3:40:38<22:29:00, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=6.98s]
Epoch 0: 14%|█▍ | 1733/12384 [3:40:46<22:29:00, 7.60s/it, loss=0.0001, acc=0.9998, iter_time=5.19s]
Epoch 0: 14%|█▍ | 1734/12384 [3:40:46<22:30:15, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=5.19s]
Epoch 0: 14%|█▍ | 1734/12384 [3:40:53<22:30:15, 7.61s/it, loss=0.0016, acc=0.9975, iter_time=7.87s]
Epoch 0: 14%|█▍ | 1735/12384 [3:40:53<22:29:34, 7.60s/it, loss=0.0016, acc=0.9975, iter_time=7.87s]
Epoch 0: 14%|█▍ | 1735/12384 [3:41:01<22:29:34, 7.60s/it, loss=0.0016, acc=0.9965, iter_time=10.76s]
Epoch 0: 14%|█▍ | 1736/12384 [3:41:01<22:30:32, 7.61s/it, loss=0.0016, acc=0.9965, iter_time=10.76s]
Epoch 0: 14%|█▍ | 1736/12384 [3:41:09<22:30:32, 7.61s/it, loss=0.0003, acc=0.9999, iter_time=7.23s]
Epoch 0: 14%|█▍ | 1737/12384 [3:41:09<22:30:06, 7.61s/it, loss=0.0003, acc=0.9999, iter_time=7.23s]
Epoch 0: 14%|█▍ | 1737/12384 [3:41:16<22:30:06, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 14%|█▍ | 1738/12384 [3:41:16<22:30:12, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 14%|█▍ | 1738/12384 [3:41:24<22:30:12, 7.61s/it, loss=0.0006, acc=0.9982, iter_time=7.30s]
Epoch 0: 14%|█▍ | 1739/12384 [3:41:24<22:28:34, 7.60s/it, loss=0.0006, acc=0.9982, iter_time=7.30s]
Epoch 0: 14%|█▍ | 1739/12384 [3:41:31<22:28:34, 7.60s/it, loss=0.0007, acc=0.9994, iter_time=7.90s]
Epoch 0: 14%|█▍ | 1740/12384 [3:41:31<22:29:22, 7.61s/it, loss=0.0007, acc=0.9994, iter_time=7.90s]
Epoch 0: 14%|█▍ | 1740/12384 [3:41:39<22:29:22, 7.61s/it, loss=0.0002, acc=0.9998, iter_time=7.62s]
Epoch 0: 14%|█▍ | 1741/12384 [3:41:39<22:29:29, 7.61s/it, loss=0.0002, acc=0.9998, iter_time=7.62s]
Epoch 0: 14%|█▍ | 1741/12384 [3:41:47<22:29:29, 7.61s/it, loss=0.0040, acc=0.9914, iter_time=4.30s]
Epoch 0: 14%|█▍ | 1742/12384 [3:41:47<22:28:14, 7.60s/it, loss=0.0040, acc=0.9914, iter_time=4.30s]
Epoch 0: 14%|█▍ | 1742/12384 [3:41:54<22:28:14, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=9.70s]
Epoch 0: 14%|█▍ | 1743/12384 [3:41:54<22:29:21, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.70s]
Epoch 0: 14%|█▍ | 1743/12384 [3:42:02<22:29:21, 7.61s/it, loss=0.0023, acc=0.9954, iter_time=9.10s]
Epoch 0: 14%|█▍ | 1744/12384 [3:42:02<22:47:00, 7.71s/it, loss=0.0023, acc=0.9954, iter_time=9.10s]
Epoch 0: 14%|█▍ | 1744/12384 [3:42:10<22:47:00, 7.71s/it, loss=0.0021, acc=0.9948, iter_time=7.63s]
Epoch 0: 14%|█▍ | 1745/12384 [3:42:10<22:39:44, 7.67s/it, loss=0.0021, acc=0.9948, iter_time=7.63s]
Epoch 0: 14%|█▍ | 1745/12384 [3:42:17<22:39:44, 7.67s/it, loss=0.0005, acc=0.9994, iter_time=7.61s]
Epoch 0: 14%|█▍ | 1746/12384 [3:42:17<22:37:06, 7.65s/it, loss=0.0005, acc=0.9994, iter_time=7.61s]
Epoch 0: 14%|█▍ | 1746/12384 [3:42:25<22:37:06, 7.65s/it, loss=0.0018, acc=0.9937, iter_time=7.62s]
Epoch 0: 14%|█▍ | 1747/12384 [3:42:25<22:35:13, 7.64s/it, loss=0.0018, acc=0.9937, iter_time=7.62s]
Epoch 0: 14%|█▍ | 1747/12384 [3:42:33<22:35:13, 7.64s/it, loss=0.0007, acc=0.9973, iter_time=7.61s]
Epoch 0: 14%|█▍ | 1748/12384 [3:42:33<22:33:48, 7.64s/it, loss=0.0007, acc=0.9973, iter_time=7.61s]
Epoch 0: 14%|█▍ | 1748/12384 [3:42:40<22:33:48, 7.64s/it, loss=0.0025, acc=0.9947, iter_time=7.62s]
Epoch 0: 14%|█▍ | 1749/12384 [3:42:40<22:32:46, 7.63s/it, loss=0.0025, acc=0.9947, iter_time=7.62s]
Epoch 0: 14%|█▍ | 1749/12384 [3:42:48<22:32:46, 7.63s/it, loss=0.0003, acc=0.9999, iter_time=8.02s]
Epoch 0: 14%|█▍ | 1750/12384 [3:42:48<22:30:55, 7.62s/it, loss=0.0003, acc=0.9999, iter_time=8.02s]
Epoch 0: 14%|█▍ | 1750/12384 [3:42:55<22:30:55, 7.62s/it, loss=0.0005, acc=0.9997, iter_time=7.19s]
Epoch 0: 14%|█▍ | 1751/12384 [3:42:55<22:29:11, 7.61s/it, loss=0.0005, acc=0.9997, iter_time=7.19s]
Epoch 0: 14%|█▍ | 1751/12384 [3:43:03<22:29:11, 7.61s/it, loss=0.0003, acc=0.9993, iter_time=7.56s]
Epoch 0: 14%|█▍ | 1752/12384 [3:43:03<22:28:56, 7.61s/it, loss=0.0003, acc=0.9993, iter_time=7.56s]
Epoch 0: 14%|█▍ | 1752/12384 [3:43:11<22:28:56, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 14%|█▍ | 1753/12384 [3:43:11<22:28:57, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 14%|█▍ | 1753/12384 [3:43:18<22:28:57, 7.61s/it, loss=0.0023, acc=0.9939, iter_time=6.68s]
Epoch 0: 14%|█▍ | 1754/12384 [3:43:18<22:29:19, 7.62s/it, loss=0.0023, acc=0.9939, iter_time=6.68s]
Epoch 0: 14%|█▍ | 1754/12384 [3:43:26<22:29:19, 7.62s/it, loss=0.0014, acc=0.9977, iter_time=7.93s]
Epoch 0: 14%|█▍ | 1755/12384 [3:43:26<22:28:39, 7.61s/it, loss=0.0014, acc=0.9977, iter_time=7.93s]
Epoch 0: 14%|█▍ | 1755/12384 [3:43:33<22:28:39, 7.61s/it, loss=0.0007, acc=0.9977, iter_time=7.63s]
Epoch 0: 14%|█▍ | 1756/12384 [3:43:33<22:27:44, 7.61s/it, loss=0.0007, acc=0.9977, iter_time=7.63s]
Epoch 0: 14%|█▍ | 1756/12384 [3:43:41<22:27:44, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.20s]
Epoch 0: 14%|█▍ | 1757/12384 [3:43:41<22:27:16, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.20s]
Epoch 0: 14%|█▍ | 1757/12384 [3:43:49<22:27:16, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.07s]
Epoch 0: 14%|█▍ | 1758/12384 [3:43:49<22:28:26, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.07s]
Epoch 0: 14%|█▍ | 1758/12384 [3:43:56<22:28:26, 7.61s/it, loss=0.0007, acc=0.9959, iter_time=7.88s]
Epoch 0: 14%|█▍ | 1759/12384 [3:43:56<22:28:39, 7.62s/it, loss=0.0007, acc=0.9959, iter_time=7.88s]
Epoch 0: 14%|█▍ | 1759/12384 [3:44:04<22:28:39, 7.62s/it, loss=0.0017, acc=0.9956, iter_time=7.86s]
Epoch 0: 14%|█▍ | 1760/12384 [3:44:04<22:28:25, 7.62s/it, loss=0.0017, acc=0.9956, iter_time=7.86s]
Epoch 0: 14%|█▍ | 1760/12384 [3:44:12<22:28:25, 7.62s/it, loss=0.0004, acc=0.9991, iter_time=5.56s]
Epoch 0: 14%|█▍ | 1761/12384 [3:44:12<22:27:17, 7.61s/it, loss=0.0004, acc=0.9991, iter_time=5.56s]
Epoch 0: 14%|█▍ | 1761/12384 [3:44:19<22:27:17, 7.61s/it, loss=0.0005, acc=0.9976, iter_time=7.90s]
Epoch 0: 14%|█▍ | 1762/12384 [3:44:19<22:26:55, 7.61s/it, loss=0.0005, acc=0.9976, iter_time=7.90s]
Epoch 0: 14%|█▍ | 1762/12384 [3:44:27<22:26:55, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=9.41s]
Epoch 0: 14%|█▍ | 1763/12384 [3:44:27<22:27:11, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=9.41s]
Epoch 0: 14%|█▍ | 1763/12384 [3:44:34<22:27:11, 7.61s/it, loss=0.0008, acc=0.9982, iter_time=4.80s]
Epoch 0: 14%|█▍ | 1764/12384 [3:44:34<22:26:58, 7.61s/it, loss=0.0008, acc=0.9982, iter_time=4.80s]
Epoch 0: 14%|█▍ | 1764/12384 [3:44:42<22:26:58, 7.61s/it, loss=0.0006, acc=0.9982, iter_time=10.41s]
Epoch 0: 14%|█▍ | 1765/12384 [3:44:42<22:26:46, 7.61s/it, loss=0.0006, acc=0.9982, iter_time=10.41s]
Epoch 0: 14%|█▍ | 1765/12384 [3:44:50<22:26:46, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.52s]
Epoch 0: 14%|█▍ | 1766/12384 [3:44:50<22:26:06, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.52s]
Epoch 0: 14%|█▍ | 1766/12384 [3:44:57<22:26:06, 7.61s/it, loss=0.0002, acc=0.9998, iter_time=8.82s]
Epoch 0: 14%|█▍ | 1767/12384 [3:44:57<22:25:41, 7.60s/it, loss=0.0002, acc=0.9998, iter_time=8.82s]
Epoch 0: 14%|█▍ | 1767/12384 [3:45:05<22:25:41, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=8.84s]
Epoch 0: 14%|█▍ | 1768/12384 [3:45:05<22:29:13, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.84s]
Epoch 0: 14%|█▍ | 1768/12384 [3:45:12<22:29:13, 7.63s/it, loss=0.0003, acc=0.9998, iter_time=6.70s]
Epoch 0: 14%|█▍ | 1769/12384 [3:45:12<22:27:27, 7.62s/it, loss=0.0003, acc=0.9998, iter_time=6.70s]
Epoch 0: 14%|█▍ | 1769/12384 [3:45:20<22:27:27, 7.62s/it, loss=0.0004, acc=0.9997, iter_time=8.52s]
Epoch 0: 14%|█▍ | 1770/12384 [3:45:20<22:44:54, 7.72s/it, loss=0.0004, acc=0.9997, iter_time=8.52s]
Epoch 0: 14%|█▍ | 1770/12384 [3:45:28<22:44:54, 7.72s/it, loss=0.0004, acc=0.9998, iter_time=7.62s]
Epoch 0: 14%|█▍ | 1771/12384 [3:45:28<22:37:59, 7.68s/it, loss=0.0004, acc=0.9998, iter_time=7.62s]
Epoch 0: 14%|█▍ | 1771/12384 [3:45:36<22:37:59, 7.68s/it, loss=0.0008, acc=0.9953, iter_time=7.65s]
Epoch 0: 14%|█▍ | 1772/12384 [3:45:36<22:37:53, 7.68s/it, loss=0.0008, acc=0.9953, iter_time=7.65s]
Epoch 0: 14%|█▍ | 1772/12384 [3:45:43<22:37:53, 7.68s/it, loss=0.0024, acc=0.9956, iter_time=7.62s]
Epoch 0: 14%|█▍ | 1773/12384 [3:45:43<22:35:03, 7.66s/it, loss=0.0024, acc=0.9956, iter_time=7.62s]
Epoch 0: 14%|█▍ | 1773/12384 [3:45:51<22:35:03, 7.66s/it, loss=0.0004, acc=1.0000, iter_time=7.64s]
Epoch 0: 14%|█▍ | 1774/12384 [3:45:51<22:32:55, 7.65s/it, loss=0.0004, acc=1.0000, iter_time=7.64s]
Epoch 0: 14%|█▍ | 1774/12384 [3:45:59<22:32:55, 7.65s/it, loss=0.0030, acc=0.9984, iter_time=5.87s]
Epoch 0: 14%|█▍ | 1775/12384 [3:45:59<22:30:31, 7.64s/it, loss=0.0030, acc=0.9984, iter_time=5.87s]
Epoch 0: 14%|█▍ | 1775/12384 [3:46:06<22:30:31, 7.64s/it, loss=0.0012, acc=0.9989, iter_time=9.32s]
Epoch 0: 14%|█▍ | 1776/12384 [3:46:06<22:30:15, 7.64s/it, loss=0.0012, acc=0.9989, iter_time=9.32s]
Epoch 0: 14%|█▍ | 1776/12384 [3:46:14<22:30:15, 7.64s/it, loss=0.0016, acc=0.9957, iter_time=7.64s]
Epoch 0: 14%|█▍ | 1777/12384 [3:46:14<22:27:42, 7.62s/it, loss=0.0016, acc=0.9957, iter_time=7.64s]
Epoch 0: 14%|█▍ | 1777/12384 [3:46:21<22:27:42, 7.62s/it, loss=0.0004, acc=1.0000, iter_time=7.62s]
Epoch 0: 14%|█▍ | 1778/12384 [3:46:21<22:30:32, 7.64s/it, loss=0.0004, acc=1.0000, iter_time=7.62s]
Epoch 0: 14%|█▍ | 1778/12384 [3:46:29<22:30:32, 7.64s/it, loss=0.0004, acc=0.9999, iter_time=7.68s]
Epoch 0: 14%|█▍ | 1779/12384 [3:46:29<22:29:29, 7.63s/it, loss=0.0004, acc=0.9999, iter_time=7.68s]
Epoch 0: 14%|█▍ | 1779/12384 [3:46:37<22:29:29, 7.63s/it, loss=0.0003, acc=0.9998, iter_time=7.06s]
Epoch 0: 14%|█▍ | 1780/12384 [3:46:37<22:28:37, 7.63s/it, loss=0.0003, acc=0.9998, iter_time=7.06s]
Epoch 0: 14%|█▍ | 1780/12384 [3:46:44<22:28:37, 7.63s/it, loss=0.0029, acc=0.9959, iter_time=8.17s]
Epoch 0: 14%|█▍ | 1781/12384 [3:46:44<22:28:02, 7.63s/it, loss=0.0029, acc=0.9959, iter_time=8.17s]
Epoch 0: 14%|█▍ | 1781/12384 [3:46:52<22:28:02, 7.63s/it, loss=0.0003, acc=0.9996, iter_time=6.98s]
Epoch 0: 14%|█▍ | 1782/12384 [3:46:52<22:25:01, 7.61s/it, loss=0.0003, acc=0.9996, iter_time=6.98s]
Epoch 0: 14%|█▍ | 1782/12384 [3:46:59<22:25:01, 7.61s/it, loss=0.0002, acc=0.9990, iter_time=8.22s]
Epoch 0: 14%|█▍ | 1783/12384 [3:46:59<22:23:55, 7.61s/it, loss=0.0002, acc=0.9990, iter_time=8.22s]
Epoch 0: 14%|█▍ | 1783/12384 [3:47:07<22:23:55, 7.61s/it, loss=0.0015, acc=0.9984, iter_time=7.57s]
Epoch 0: 14%|█▍ | 1784/12384 [3:47:07<22:25:14, 7.61s/it, loss=0.0015, acc=0.9984, iter_time=7.57s]
Epoch 0: 14%|█▍ | 1784/12384 [3:47:15<22:25:14, 7.61s/it, loss=0.0075, acc=0.9807, iter_time=7.64s]
Epoch 0: 14%|█▍ | 1785/12384 [3:47:15<22:25:22, 7.62s/it, loss=0.0075, acc=0.9807, iter_time=7.64s]
Epoch 0: 14%|█▍ | 1785/12384 [3:47:22<22:25:22, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.45s]
Epoch 0: 14%|█▍ | 1786/12384 [3:47:22<22:24:52, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.45s]
Epoch 0: 14%|█▍ | 1786/12384 [3:47:30<22:24:52, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.19s]
Epoch 0: 14%|█▍ | 1787/12384 [3:47:30<22:25:23, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.19s]
Epoch 0: 14%|█▍ | 1787/12384 [3:47:38<22:25:23, 7.62s/it, loss=0.0005, acc=0.9996, iter_time=10.03s]
Epoch 0: 14%|█▍ | 1788/12384 [3:47:38<22:24:13, 7.61s/it, loss=0.0005, acc=0.9996, iter_time=10.03s]
Epoch 0: 14%|█▍ | 1788/12384 [3:47:45<22:24:13, 7.61s/it, loss=0.0014, acc=0.9947, iter_time=8.79s]
Epoch 0: 14%|█▍ | 1789/12384 [3:47:45<22:22:44, 7.60s/it, loss=0.0014, acc=0.9947, iter_time=8.79s]
Epoch 0: 14%|█▍ | 1789/12384 [3:47:53<22:22:44, 7.60s/it, loss=0.0004, acc=1.0000, iter_time=7.58s]
Epoch 0: 14%|█▍ | 1790/12384 [3:47:53<22:22:20, 7.60s/it, loss=0.0004, acc=1.0000, iter_time=7.58s]
Epoch 0: 14%|█▍ | 1790/12384 [3:48:00<22:22:20, 7.60s/it, loss=0.0006, acc=0.9992, iter_time=7.61s]
Epoch 0: 14%|█▍ | 1791/12384 [3:48:00<22:22:26, 7.60s/it, loss=0.0006, acc=0.9992, iter_time=7.61s]
Epoch 0: 14%|█▍ | 1791/12384 [3:48:08<22:22:26, 7.60s/it, loss=0.0028, acc=0.9943, iter_time=7.98s]
Epoch 0: 14%|█▍ | 1792/12384 [3:48:08<22:26:04, 7.63s/it, loss=0.0028, acc=0.9943, iter_time=7.98s]
Epoch 0: 14%|█▍ | 1792/12384 [3:48:16<22:26:04, 7.63s/it, loss=0.0006, acc=0.9993, iter_time=7.30s]
Epoch 0: 14%|█▍ | 1793/12384 [3:48:16<22:24:59, 7.62s/it, loss=0.0006, acc=0.9993, iter_time=7.30s]
Epoch 0: 14%|█▍ | 1793/12384 [3:48:23<22:24:59, 7.62s/it, loss=0.0009, acc=0.9980, iter_time=5.52s]
Epoch 0: 14%|█▍ | 1794/12384 [3:48:23<22:25:01, 7.62s/it, loss=0.0009, acc=0.9980, iter_time=5.52s]
Epoch 0: 14%|█▍ | 1794/12384 [3:48:31<22:25:01, 7.62s/it, loss=0.0004, acc=0.9986, iter_time=9.70s]
Epoch 0: 14%|█▍ | 1795/12384 [3:48:31<22:23:08, 7.61s/it, loss=0.0004, acc=0.9986, iter_time=9.70s]
Epoch 0: 14%|█▍ | 1795/12384 [3:48:38<22:23:08, 7.61s/it, loss=0.0035, acc=0.9935, iter_time=7.60s]
Epoch 0: 15%|█▍ | 1796/12384 [3:48:38<22:22:04, 7.61s/it, loss=0.0035, acc=0.9935, iter_time=7.60s]
Epoch 0: 15%|█▍ | 1796/12384 [3:48:46<22:22:04, 7.61s/it, loss=0.0021, acc=0.9972, iter_time=6.13s]
Epoch 0: 15%|█▍ | 1797/12384 [3:48:46<22:40:08, 7.71s/it, loss=0.0021, acc=0.9972, iter_time=6.13s]
Epoch 0: 15%|█▍ | 1797/12384 [3:48:54<22:40:08, 7.71s/it, loss=0.0026, acc=0.9931, iter_time=7.09s]
Epoch 0: 15%|█▍ | 1798/12384 [3:48:54<22:35:19, 7.68s/it, loss=0.0026, acc=0.9931, iter_time=7.09s]
Epoch 0: 15%|█▍ | 1798/12384 [3:49:02<22:35:19, 7.68s/it, loss=0.0003, acc=1.0000, iter_time=8.43s]
Epoch 0: 15%|█▍ | 1799/12384 [3:49:02<22:30:24, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=8.43s]
Epoch 0: 15%|█▍ | 1799/12384 [3:49:09<22:30:24, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=9.49s]
Epoch 0: 15%|█▍ | 1800/12384 [3:49:09<22:27:21, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=9.49s]
Epoch 0: 15%|█▍ | 1800/12384 [3:49:17<22:27:21, 7.64s/it, loss=0.0003, acc=0.9998, iter_time=7.21s]
Epoch 0: 15%|█▍ | 1801/12384 [3:49:17<22:30:58, 7.66s/it, loss=0.0003, acc=0.9998, iter_time=7.21s]
Epoch 0: 15%|█▍ | 1801/12384 [3:49:24<22:30:58, 7.66s/it, loss=0.0002, acc=0.9978, iter_time=6.75s]
Epoch 0: 15%|█▍ | 1802/12384 [3:49:24<22:28:10, 7.64s/it, loss=0.0002, acc=0.9978, iter_time=6.75s]
Epoch 0: 15%|█▍ | 1802/12384 [3:49:32<22:28:10, 7.64s/it, loss=0.0006, acc=0.9969, iter_time=7.03s]
Epoch 0: 15%|█▍ | 1803/12384 [3:49:32<22:25:09, 7.63s/it, loss=0.0006, acc=0.9969, iter_time=7.03s]
Epoch 0: 15%|█▍ | 1803/12384 [3:49:40<22:25:09, 7.63s/it, loss=0.0008, acc=0.9975, iter_time=9.11s]
Epoch 0: 15%|█▍ | 1804/12384 [3:49:40<22:24:49, 7.63s/it, loss=0.0008, acc=0.9975, iter_time=9.11s]
Epoch 0: 15%|█▍ | 1804/12384 [3:49:47<22:24:49, 7.63s/it, loss=0.0005, acc=0.9983, iter_time=7.33s]
Epoch 0: 15%|█▍ | 1805/12384 [3:49:47<22:23:39, 7.62s/it, loss=0.0005, acc=0.9983, iter_time=7.33s]
Epoch 0: 15%|█▍ | 1805/12384 [3:49:55<22:23:39, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 15%|█▍ | 1806/12384 [3:49:55<22:22:56, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 15%|█▍ | 1806/12384 [3:50:03<22:22:56, 7.62s/it, loss=0.0006, acc=0.9973, iter_time=7.91s]
Epoch 0: 15%|█▍ | 1807/12384 [3:50:03<22:21:31, 7.61s/it, loss=0.0006, acc=0.9973, iter_time=7.91s]
Epoch 0: 15%|█▍ | 1807/12384 [3:50:10<22:21:31, 7.61s/it, loss=0.0022, acc=0.9913, iter_time=7.98s]
Epoch 0: 15%|█▍ | 1808/12384 [3:50:10<22:22:01, 7.61s/it, loss=0.0022, acc=0.9913, iter_time=7.98s]
Epoch 0: 15%|█▍ | 1808/12384 [3:50:18<22:22:01, 7.61s/it, loss=0.0011, acc=0.9975, iter_time=7.37s]
Epoch 0: 15%|█▍ | 1809/12384 [3:50:18<22:28:29, 7.65s/it, loss=0.0011, acc=0.9975, iter_time=7.37s]
Epoch 0: 15%|█▍ | 1809/12384 [3:50:25<22:28:29, 7.65s/it, loss=0.0002, acc=0.9998, iter_time=7.61s]
Epoch 0: 15%|█▍ | 1810/12384 [3:50:25<22:25:31, 7.63s/it, loss=0.0002, acc=0.9998, iter_time=7.61s]
Epoch 0: 15%|█▍ | 1810/12384 [3:50:33<22:25:31, 7.63s/it, loss=0.0033, acc=0.9906, iter_time=7.62s]
Epoch 0: 15%|█▍ | 1811/12384 [3:50:33<22:24:10, 7.63s/it, loss=0.0033, acc=0.9906, iter_time=7.62s]
Epoch 0: 15%|█▍ | 1811/12384 [3:50:41<22:24:10, 7.63s/it, loss=0.0008, acc=0.9976, iter_time=7.60s]
Epoch 0: 15%|█▍ | 1812/12384 [3:50:41<22:22:39, 7.62s/it, loss=0.0008, acc=0.9976, iter_time=7.60s]
Epoch 0: 15%|█▍ | 1812/12384 [3:50:48<22:22:39, 7.62s/it, loss=0.0002, acc=0.9999, iter_time=7.60s]
Epoch 0: 15%|█▍ | 1813/12384 [3:50:48<22:22:21, 7.62s/it, loss=0.0002, acc=0.9999, iter_time=7.60s]
Epoch 0: 15%|█▍ | 1813/12384 [3:50:56<22:22:21, 7.62s/it, loss=0.0015, acc=1.0000, iter_time=7.61s]
Epoch 0: 15%|█▍ | 1814/12384 [3:50:56<22:21:01, 7.61s/it, loss=0.0015, acc=1.0000, iter_time=7.61s]
Epoch 0: 15%|█▍ | 1814/12384 [3:51:04<22:21:01, 7.61s/it, loss=0.0005, acc=0.9999, iter_time=7.60s]
Epoch 0: 15%|█▍ | 1815/12384 [3:51:04<22:21:00, 7.61s/it, loss=0.0005, acc=0.9999, iter_time=7.60s]
Epoch 0: 15%|█▍ | 1815/12384 [3:51:11<22:21:00, 7.61s/it, loss=0.0014, acc=0.9975, iter_time=8.01s]
Epoch 0: 15%|█▍ | 1816/12384 [3:51:11<22:20:27, 7.61s/it, loss=0.0014, acc=0.9975, iter_time=8.01s]
Epoch 0: 15%|█▍ | 1816/12384 [3:51:19<22:20:27, 7.61s/it, loss=0.0019, acc=0.9936, iter_time=7.21s]
Epoch 0: 15%|█▍ | 1817/12384 [3:51:19<22:19:59, 7.61s/it, loss=0.0019, acc=0.9936, iter_time=7.21s]
Epoch 0: 15%|█▍ | 1817/12384 [3:51:26<22:19:59, 7.61s/it, loss=0.0002, acc=0.9998, iter_time=7.61s]
Epoch 0: 15%|█▍ | 1818/12384 [3:51:26<22:19:27, 7.61s/it, loss=0.0002, acc=0.9998, iter_time=7.61s]
Epoch 0: 15%|█▍ | 1818/12384 [3:51:34<22:19:27, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.36s]
Epoch 0: 15%|█▍ | 1819/12384 [3:51:34<22:19:11, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.36s]
Epoch 0: 15%|█▍ | 1819/12384 [3:51:42<22:19:11, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=7.84s]
Epoch 0: 15%|█▍ | 1820/12384 [3:51:42<22:18:41, 7.60s/it, loss=0.0003, acc=1.0000, iter_time=7.84s]
Epoch 0: 15%|█▍ | 1820/12384 [3:51:49<22:18:41, 7.60s/it, loss=0.0008, acc=0.9997, iter_time=7.60s]
Epoch 0: 15%|█▍ | 1821/12384 [3:51:49<22:20:05, 7.61s/it, loss=0.0008, acc=0.9997, iter_time=7.60s]
Epoch 0: 15%|█▍ | 1821/12384 [3:51:57<22:20:05, 7.61s/it, loss=0.0005, acc=0.9979, iter_time=7.64s]
Epoch 0: 15%|█▍ | 1822/12384 [3:51:57<22:19:38, 7.61s/it, loss=0.0005, acc=0.9979, iter_time=7.64s]
Epoch 0: 15%|█▍ | 1822/12384 [3:52:05<22:19:38, 7.61s/it, loss=0.0034, acc=0.9905, iter_time=7.28s]
Epoch 0: 15%|█▍ | 1823/12384 [3:52:05<22:37:00, 7.71s/it, loss=0.0034, acc=0.9905, iter_time=7.28s]
Epoch 0: 15%|█▍ | 1823/12384 [3:52:12<22:37:00, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=8.64s]
Epoch 0: 15%|█▍ | 1824/12384 [3:52:12<22:36:29, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=8.64s]
Epoch 0: 15%|█▍ | 1824/12384 [3:52:20<22:36:29, 7.71s/it, loss=0.0005, acc=0.9989, iter_time=7.31s]
Epoch 0: 15%|█▍ | 1825/12384 [3:52:20<22:30:34, 7.67s/it, loss=0.0005, acc=0.9989, iter_time=7.31s]
Epoch 0: 15%|█▍ | 1825/12384 [3:52:28<22:30:34, 7.67s/it, loss=0.0021, acc=0.9927, iter_time=7.60s]
Epoch 0: 15%|█▍ | 1826/12384 [3:52:28<22:26:24, 7.65s/it, loss=0.0021, acc=0.9927, iter_time=7.60s]
Epoch 0: 15%|█▍ | 1826/12384 [3:52:35<22:26:24, 7.65s/it, loss=0.0028, acc=0.9947, iter_time=7.59s]
Epoch 0: 15%|█▍ | 1827/12384 [3:52:35<22:24:39, 7.64s/it, loss=0.0028, acc=0.9947, iter_time=7.59s]
Epoch 0: 15%|█▍ | 1827/12384 [3:52:43<22:24:39, 7.64s/it, loss=0.0008, acc=0.9974, iter_time=5.63s]
Epoch 0: 15%|█▍ | 1828/12384 [3:52:43<22:27:31, 7.66s/it, loss=0.0008, acc=0.9974, iter_time=5.63s]
Epoch 0: 15%|█▍ | 1828/12384 [3:52:51<22:27:31, 7.66s/it, loss=0.0004, acc=0.9997, iter_time=9.69s]
Epoch 0: 15%|█▍ | 1829/12384 [3:52:51<22:24:17, 7.64s/it, loss=0.0004, acc=0.9997, iter_time=9.69s]
Epoch 0: 15%|█▍ | 1829/12384 [3:52:58<22:24:17, 7.64s/it, loss=0.0006, acc=1.0000, iter_time=6.41s]
Epoch 0: 15%|█▍ | 1830/12384 [3:52:58<22:22:41, 7.63s/it, loss=0.0006, acc=1.0000, iter_time=6.41s]
Epoch 0: 15%|█▍ | 1830/12384 [3:53:06<22:22:41, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=8.90s]
Epoch 0: 15%|█▍ | 1831/12384 [3:53:06<22:25:50, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=8.90s]
Epoch 0: 15%|█▍ | 1831/12384 [3:53:13<22:25:50, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.55s]
Epoch 0: 15%|█▍ | 1832/12384 [3:53:13<22:23:14, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.55s]
Epoch 0: 15%|█▍ | 1832/12384 [3:53:21<22:23:14, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.44s]
Epoch 0: 15%|█▍ | 1833/12384 [3:53:21<22:21:29, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.44s]
Epoch 0: 15%|█▍ | 1833/12384 [3:53:29<22:21:29, 7.63s/it, loss=0.0003, acc=0.9999, iter_time=8.84s]
Epoch 0: 15%|█▍ | 1834/12384 [3:53:29<22:20:27, 7.62s/it, loss=0.0003, acc=0.9999, iter_time=8.84s]
Epoch 0: 15%|█▍ | 1834/12384 [3:53:36<22:20:27, 7.62s/it, loss=0.0005, acc=0.9994, iter_time=6.38s]
Epoch 0: 15%|█▍ | 1835/12384 [3:53:36<22:19:01, 7.62s/it, loss=0.0005, acc=0.9994, iter_time=6.38s]
Epoch 0: 15%|█▍ | 1835/12384 [3:53:44<22:19:01, 7.62s/it, loss=0.0016, acc=0.9992, iter_time=8.53s]
Epoch 0: 15%|█▍ | 1836/12384 [3:53:44<22:15:36, 7.60s/it, loss=0.0016, acc=0.9992, iter_time=8.53s]
Epoch 0: 15%|█▍ | 1836/12384 [3:53:51<22:15:36, 7.60s/it, loss=0.0004, acc=1.0000, iter_time=7.92s]
Epoch 0: 15%|█▍ | 1837/12384 [3:53:51<22:20:35, 7.63s/it, loss=0.0004, acc=1.0000, iter_time=7.92s]
Epoch 0: 15%|█▍ | 1837/12384 [3:53:59<22:20:35, 7.63s/it, loss=0.0012, acc=0.9972, iter_time=7.60s]
Epoch 0: 15%|█▍ | 1838/12384 [3:53:59<22:18:37, 7.62s/it, loss=0.0012, acc=0.9972, iter_time=7.60s]
Epoch 0: 15%|█▍ | 1838/12384 [3:54:07<22:18:37, 7.62s/it, loss=0.0014, acc=0.9968, iter_time=5.33s]
Epoch 0: 15%|█▍ | 1839/12384 [3:54:07<22:17:06, 7.61s/it, loss=0.0014, acc=0.9968, iter_time=5.33s]
Epoch 0: 15%|█▍ | 1839/12384 [3:54:14<22:17:06, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=9.82s]
Epoch 0: 15%|█▍ | 1840/12384 [3:54:14<22:17:52, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=9.82s]
Epoch 0: 15%|█▍ | 1840/12384 [3:54:22<22:17:52, 7.61s/it, loss=0.0005, acc=0.9995, iter_time=6.70s]
Epoch 0: 15%|█▍ | 1841/12384 [3:54:22<22:17:53, 7.61s/it, loss=0.0005, acc=0.9995, iter_time=6.70s]
Epoch 0: 15%|█▍ | 1841/12384 [3:54:30<22:17:53, 7.61s/it, loss=0.0005, acc=0.9996, iter_time=8.58s]
Epoch 0: 15%|█▍ | 1842/12384 [3:54:30<22:17:44, 7.61s/it, loss=0.0005, acc=0.9996, iter_time=8.58s]
Epoch 0: 15%|█▍ | 1842/12384 [3:54:37<22:17:44, 7.61s/it, loss=0.0021, acc=0.9944, iter_time=5.27s]
Epoch 0: 15%|█▍ | 1843/12384 [3:54:37<22:18:52, 7.62s/it, loss=0.0021, acc=0.9944, iter_time=5.27s]
Epoch 0: 15%|█▍ | 1843/12384 [3:54:45<22:18:52, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.11s]
Epoch 0: 15%|█▍ | 1844/12384 [3:54:45<22:18:09, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.11s]
Epoch 0: 15%|█▍ | 1844/12384 [3:54:52<22:18:09, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=8.35s]
Epoch 0: 15%|█▍ | 1845/12384 [3:54:52<22:16:40, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=8.35s]
Epoch 0: 15%|█▍ | 1845/12384 [3:55:00<22:16:40, 7.61s/it, loss=0.0005, acc=0.9985, iter_time=7.41s]
Epoch 0: 15%|█▍ | 1846/12384 [3:55:00<22:16:34, 7.61s/it, loss=0.0005, acc=0.9985, iter_time=7.41s]
Epoch 0: 15%|█▍ | 1846/12384 [3:55:08<22:16:34, 7.61s/it, loss=0.0020, acc=0.9927, iter_time=9.92s]
Epoch 0: 15%|█▍ | 1847/12384 [3:55:08<22:16:46, 7.61s/it, loss=0.0020, acc=0.9927, iter_time=9.92s]
Epoch 0: 15%|█▍ | 1847/12384 [3:55:15<22:16:46, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.00s]
Epoch 0: 15%|█▍ | 1848/12384 [3:55:15<22:16:23, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.00s]
Epoch 0: 15%|█▍ | 1848/12384 [3:55:23<22:16:23, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.47s]
Epoch 0: 15%|█▍ | 1849/12384 [3:55:23<22:38:44, 7.74s/it, loss=0.0002, acc=1.0000, iter_time=7.47s]
Epoch 0: 15%|█▍ | 1849/12384 [3:55:31<22:38:44, 7.74s/it, loss=0.0013, acc=0.9980, iter_time=8.17s]
Epoch 0: 15%|█▍ | 1850/12384 [3:55:31<22:31:03, 7.70s/it, loss=0.0013, acc=0.9980, iter_time=8.17s]
Epoch 0: 15%|█▍ | 1850/12384 [3:55:38<22:31:03, 7.70s/it, loss=0.0005, acc=0.9987, iter_time=7.20s]
Epoch 0: 15%|█▍ | 1851/12384 [3:55:38<22:25:44, 7.67s/it, loss=0.0005, acc=0.9987, iter_time=7.20s]
Epoch 0: 15%|█▍ | 1851/12384 [3:55:46<22:25:44, 7.67s/it, loss=0.0088, acc=0.9897, iter_time=7.61s]
Epoch 0: 15%|█▍ | 1852/12384 [3:55:46<22:23:42, 7.65s/it, loss=0.0088, acc=0.9897, iter_time=7.61s]
Epoch 0: 15%|█▍ | 1852/12384 [3:55:54<22:23:42, 7.65s/it, loss=0.0015, acc=0.9961, iter_time=7.63s]
Epoch 0: 15%|█▍ | 1853/12384 [3:55:54<22:22:22, 7.65s/it, loss=0.0015, acc=0.9961, iter_time=7.63s]
Epoch 0: 15%|█▍ | 1853/12384 [3:56:01<22:22:22, 7.65s/it, loss=0.0007, acc=0.9979, iter_time=7.63s]
Epoch 0: 15%|█▍ | 1854/12384 [3:56:01<22:21:24, 7.64s/it, loss=0.0007, acc=0.9979, iter_time=7.63s]
Epoch 0: 15%|█▍ | 1854/12384 [3:56:09<22:21:24, 7.64s/it, loss=0.0010, acc=0.9983, iter_time=5.62s]
Epoch 0: 15%|█▍ | 1855/12384 [3:56:09<22:19:01, 7.63s/it, loss=0.0010, acc=0.9983, iter_time=5.62s]
Epoch 0: 15%|█▍ | 1855/12384 [3:56:17<22:19:01, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.54s]
Epoch 0: 15%|█▍ | 1856/12384 [3:56:17<22:16:29, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.54s]
Epoch 0: 15%|█▍ | 1856/12384 [3:56:24<22:16:29, 7.62s/it, loss=0.0005, acc=0.9979, iter_time=7.65s]
Epoch 0: 15%|█▍ | 1857/12384 [3:56:24<22:15:48, 7.61s/it, loss=0.0005, acc=0.9979, iter_time=7.65s]
Epoch 0: 15%|█▍ | 1857/12384 [3:56:32<22:15:48, 7.61s/it, loss=0.0003, acc=0.9993, iter_time=5.28s]
Epoch 0: 15%|█▌ | 1858/12384 [3:56:32<22:14:49, 7.61s/it, loss=0.0003, acc=0.9993, iter_time=5.28s]
Epoch 0: 15%|█▌ | 1858/12384 [3:56:39<22:14:49, 7.61s/it, loss=0.0005, acc=0.9974, iter_time=9.62s]
Epoch 0: 15%|█▌ | 1859/12384 [3:56:39<22:14:53, 7.61s/it, loss=0.0005, acc=0.9974, iter_time=9.62s]
Epoch 0: 15%|█▌ | 1859/12384 [3:56:47<22:14:53, 7.61s/it, loss=0.0010, acc=0.9960, iter_time=7.61s]
Epoch 0: 15%|█▌ | 1860/12384 [3:56:47<22:14:10, 7.61s/it, loss=0.0010, acc=0.9960, iter_time=7.61s]
Epoch 0: 15%|█▌ | 1860/12384 [3:56:55<22:14:10, 7.61s/it, loss=0.0005, acc=0.9997, iter_time=6.70s]
Epoch 0: 15%|█▌ | 1861/12384 [3:56:55<22:13:48, 7.61s/it, loss=0.0005, acc=0.9997, iter_time=6.70s]
Epoch 0: 15%|█▌ | 1861/12384 [3:57:02<22:13:48, 7.61s/it, loss=0.0065, acc=0.9889, iter_time=8.81s]
Epoch 0: 15%|█▌ | 1862/12384 [3:57:02<22:13:50, 7.61s/it, loss=0.0065, acc=0.9889, iter_time=8.81s]
Epoch 0: 15%|█▌ | 1862/12384 [3:57:10<22:13:50, 7.61s/it, loss=0.0027, acc=0.9897, iter_time=7.02s]
Epoch 0: 15%|█▌ | 1863/12384 [3:57:10<22:13:56, 7.61s/it, loss=0.0027, acc=0.9897, iter_time=7.02s]
Epoch 0: 15%|█▌ | 1863/12384 [3:57:17<22:13:56, 7.61s/it, loss=0.0004, acc=0.9998, iter_time=8.15s]
Epoch 0: 15%|█▌ | 1864/12384 [3:57:17<22:13:07, 7.60s/it, loss=0.0004, acc=0.9998, iter_time=8.15s]
Epoch 0: 15%|█▌ | 1864/12384 [3:57:25<22:13:07, 7.60s/it, loss=0.0004, acc=1.0000, iter_time=7.64s]
Epoch 0: 15%|█▌ | 1865/12384 [3:57:25<22:13:49, 7.61s/it, loss=0.0004, acc=1.0000, iter_time=7.64s]
Epoch 0: 15%|█▌ | 1865/12384 [3:57:33<22:13:49, 7.61s/it, loss=0.0011, acc=0.9965, iter_time=7.62s]
Epoch 0: 15%|█▌ | 1866/12384 [3:57:33<22:13:15, 7.61s/it, loss=0.0011, acc=0.9965, iter_time=7.62s]
Epoch 0: 15%|█▌ | 1866/12384 [3:57:40<22:13:15, 7.61s/it, loss=0.0007, acc=0.9974, iter_time=7.61s]
Epoch 0: 15%|█▌ | 1867/12384 [3:57:40<22:12:18, 7.60s/it, loss=0.0007, acc=0.9974, iter_time=7.61s]
Epoch 0: 15%|█▌ | 1867/12384 [3:57:48<22:12:18, 7.60s/it, loss=0.0056, acc=0.9869, iter_time=4.56s]
Epoch 0: 15%|█▌ | 1868/12384 [3:57:48<22:14:06, 7.61s/it, loss=0.0056, acc=0.9869, iter_time=4.56s]
Epoch 0: 15%|█▌ | 1868/12384 [3:57:55<22:14:06, 7.61s/it, loss=0.0012, acc=0.9977, iter_time=10.69s]
Epoch 0: 15%|█▌ | 1869/12384 [3:57:55<22:13:49, 7.61s/it, loss=0.0012, acc=0.9977, iter_time=10.69s]
Epoch 0: 15%|█▌ | 1869/12384 [3:58:03<22:13:49, 7.61s/it, loss=0.0009, acc=0.9983, iter_time=7.59s]
Epoch 0: 15%|█▌ | 1870/12384 [3:58:03<22:14:20, 7.61s/it, loss=0.0009, acc=0.9983, iter_time=7.59s]
Epoch 0: 15%|█▌ | 1870/12384 [3:58:11<22:14:20, 7.61s/it, loss=0.0006, acc=0.9995, iter_time=6.12s]
Epoch 0: 15%|█▌ | 1871/12384 [3:58:11<22:13:03, 7.61s/it, loss=0.0006, acc=0.9995, iter_time=6.12s]
Epoch 0: 15%|█▌ | 1871/12384 [3:58:18<22:13:03, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.50s]
Epoch 0: 15%|█▌ | 1872/12384 [3:58:18<22:14:09, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.50s]
Epoch 0: 15%|█▌ | 1872/12384 [3:58:26<22:14:09, 7.62s/it, loss=0.0003, acc=0.9987, iter_time=4.38s]
Epoch 0: 15%|█▌ | 1873/12384 [3:58:26<22:14:11, 7.62s/it, loss=0.0003, acc=0.9987, iter_time=4.38s]
Epoch 0: 15%|█▌ | 1873/12384 [3:58:33<22:14:11, 7.62s/it, loss=0.0008, acc=0.9980, iter_time=10.46s]
Epoch 0: 15%|█▌ | 1874/12384 [3:58:33<22:13:32, 7.61s/it, loss=0.0008, acc=0.9980, iter_time=10.46s]
Epoch 0: 15%|█▌ | 1874/12384 [3:58:41<22:13:32, 7.61s/it, loss=0.0005, acc=0.9998, iter_time=7.61s]
Epoch 0: 15%|█▌ | 1875/12384 [3:58:41<22:31:09, 7.71s/it, loss=0.0005, acc=0.9998, iter_time=7.61s]
Epoch 0: 15%|█▌ | 1875/12384 [3:58:49<22:31:09, 7.71s/it, loss=0.0012, acc=0.9948, iter_time=7.96s]
Epoch 0: 15%|█▌ | 1876/12384 [3:58:49<22:25:23, 7.68s/it, loss=0.0012, acc=0.9948, iter_time=7.96s]
Epoch 0: 15%|█▌ | 1876/12384 [3:58:57<22:25:23, 7.68s/it, loss=0.0008, acc=0.9979, iter_time=7.63s]
Epoch 0: 15%|█▌ | 1877/12384 [3:58:57<22:22:08, 7.66s/it, loss=0.0008, acc=0.9979, iter_time=7.63s]
Epoch 0: 15%|█▌ | 1877/12384 [3:59:04<22:22:08, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=6.40s]
Epoch 0: 15%|█▌ | 1878/12384 [3:59:04<22:23:03, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=6.40s]
Epoch 0: 15%|█▌ | 1878/12384 [3:59:12<22:23:03, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=8.87s]
Epoch 0: 15%|█▌ | 1879/12384 [3:59:12<22:20:49, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=8.87s]
Epoch 0: 15%|█▌ | 1879/12384 [3:59:20<22:20:49, 7.66s/it, loss=0.0003, acc=1.0000, iter_time=8.02s]
Epoch 0: 15%|█▌ | 1880/12384 [3:59:20<22:17:35, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=8.02s]
Epoch 0: 15%|█▌ | 1880/12384 [3:59:27<22:17:35, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.19s]
Epoch 0: 15%|█▌ | 1881/12384 [3:59:27<22:15:12, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.19s]
Epoch 0: 15%|█▌ | 1881/12384 [3:59:35<22:15:12, 7.63s/it, loss=0.0009, acc=0.9985, iter_time=6.39s]
Epoch 0: 15%|█▌ | 1882/12384 [3:59:35<22:13:08, 7.62s/it, loss=0.0009, acc=0.9985, iter_time=6.39s]
Epoch 0: 15%|█▌ | 1882/12384 [3:59:42<22:13:08, 7.62s/it, loss=0.0019, acc=0.9958, iter_time=8.82s]
Epoch 0: 15%|█▌ | 1883/12384 [3:59:42<22:13:43, 7.62s/it, loss=0.0019, acc=0.9958, iter_time=8.82s]
Epoch 0: 15%|█▌ | 1883/12384 [3:59:50<22:13:43, 7.62s/it, loss=0.0006, acc=0.9999, iter_time=7.62s]
Epoch 0: 15%|█▌ | 1884/12384 [3:59:50<22:12:28, 7.61s/it, loss=0.0006, acc=0.9999, iter_time=7.62s]
Epoch 0: 15%|█▌ | 1884/12384 [3:59:58<22:12:28, 7.61s/it, loss=0.0011, acc=0.9964, iter_time=7.60s]
Epoch 0: 15%|█▌ | 1885/12384 [3:59:58<22:12:09, 7.61s/it, loss=0.0011, acc=0.9964, iter_time=7.60s]
Epoch 0: 15%|█▌ | 1885/12384 [4:00:05<22:12:09, 7.61s/it, loss=0.0011, acc=0.9984, iter_time=7.63s]
Epoch 0: 15%|█▌ | 1886/12384 [4:00:05<22:16:03, 7.64s/it, loss=0.0011, acc=0.9984, iter_time=7.63s]
Epoch 0: 15%|█▌ | 1886/12384 [4:00:13<22:16:03, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.68s]
Epoch 0: 15%|█▌ | 1887/12384 [4:00:13<22:19:50, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.68s]
Epoch 0: 15%|█▌ | 1887/12384 [4:00:21<22:19:50, 7.66s/it, loss=0.0003, acc=1.0000, iter_time=8.09s]
Epoch 0: 15%|█▌ | 1888/12384 [4:00:21<22:16:46, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=8.09s]
Epoch 0: 15%|█▌ | 1888/12384 [4:00:28<22:16:46, 7.64s/it, loss=0.0004, acc=0.9999, iter_time=6.89s]
Epoch 0: 15%|█▌ | 1889/12384 [4:00:28<22:15:50, 7.64s/it, loss=0.0004, acc=0.9999, iter_time=6.89s]
Epoch 0: 15%|█▌ | 1889/12384 [4:00:36<22:15:50, 7.64s/it, loss=0.0008, acc=0.9991, iter_time=7.94s]
Epoch 0: 15%|█▌ | 1890/12384 [4:00:36<22:13:55, 7.63s/it, loss=0.0008, acc=0.9991, iter_time=7.94s]
Epoch 0: 15%|█▌ | 1890/12384 [4:00:43<22:13:55, 7.63s/it, loss=0.0002, acc=0.9993, iter_time=6.48s]
Epoch 0: 15%|█▌ | 1891/12384 [4:00:43<22:13:48, 7.63s/it, loss=0.0002, acc=0.9993, iter_time=6.48s]
Epoch 0: 15%|█▌ | 1891/12384 [4:00:51<22:13:48, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.68s]
Epoch 0: 15%|█▌ | 1892/12384 [4:00:51<22:11:53, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.68s]
Epoch 0: 15%|█▌ | 1892/12384 [4:00:59<22:11:53, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=6.63s]
Epoch 0: 15%|█▌ | 1893/12384 [4:00:59<22:11:50, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=6.63s]
Epoch 0: 15%|█▌ | 1893/12384 [4:01:06<22:11:50, 7.62s/it, loss=0.0003, acc=0.9998, iter_time=10.63s]
Epoch 0: 15%|█▌ | 1894/12384 [4:01:06<22:10:23, 7.61s/it, loss=0.0003, acc=0.9998, iter_time=10.63s]
Epoch 0: 15%|█▌ | 1894/12384 [4:01:14<22:10:23, 7.61s/it, loss=0.0006, acc=0.9984, iter_time=7.61s]
Epoch 0: 15%|█▌ | 1895/12384 [4:01:14<22:10:13, 7.61s/it, loss=0.0006, acc=0.9984, iter_time=7.61s]
Epoch 0: 15%|█▌ | 1895/12384 [4:01:21<22:10:13, 7.61s/it, loss=0.0008, acc=0.9979, iter_time=8.00s]
Epoch 0: 15%|█▌ | 1896/12384 [4:01:21<22:10:28, 7.61s/it, loss=0.0008, acc=0.9979, iter_time=8.00s]
Epoch 0: 15%|█▌ | 1896/12384 [4:01:29<22:10:28, 7.61s/it, loss=0.0006, acc=0.9978, iter_time=7.22s]
Epoch 0: 15%|█▌ | 1897/12384 [4:01:29<22:10:56, 7.61s/it, loss=0.0006, acc=0.9978, iter_time=7.22s]
Epoch 0: 15%|█▌ | 1897/12384 [4:01:37<22:10:56, 7.61s/it, loss=0.0058, acc=0.9911, iter_time=4.76s]
Epoch 0: 15%|█▌ | 1898/12384 [4:01:37<22:09:24, 7.61s/it, loss=0.0058, acc=0.9911, iter_time=4.76s]
Epoch 0: 15%|█▌ | 1898/12384 [4:01:44<22:09:24, 7.61s/it, loss=0.0007, acc=0.9962, iter_time=8.95s]
Epoch 0: 15%|█▌ | 1899/12384 [4:01:44<22:09:50, 7.61s/it, loss=0.0007, acc=0.9962, iter_time=8.95s]
Epoch 0: 15%|█▌ | 1899/12384 [4:01:52<22:09:50, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=9.54s]
Epoch 0: 15%|█▌ | 1900/12384 [4:01:52<22:10:16, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=9.54s]
Epoch 0: 15%|█▌ | 1900/12384 [4:02:00<22:10:16, 7.61s/it, loss=0.0002, acc=0.9998, iter_time=7.49s]
Epoch 0: 15%|█▌ | 1901/12384 [4:02:00<22:26:28, 7.71s/it, loss=0.0002, acc=0.9998, iter_time=7.49s]
Epoch 0: 15%|█▌ | 1901/12384 [4:02:07<22:26:28, 7.71s/it, loss=0.0008, acc=0.9982, iter_time=4.86s]
Epoch 0: 15%|█▌ | 1902/12384 [4:02:07<22:21:25, 7.68s/it, loss=0.0008, acc=0.9982, iter_time=4.86s]
Epoch 0: 15%|█▌ | 1902/12384 [4:02:15<22:21:25, 7.68s/it, loss=0.0058, acc=0.9907, iter_time=10.40s]
Epoch 0: 15%|█▌ | 1903/12384 [4:02:15<22:20:11, 7.67s/it, loss=0.0058, acc=0.9907, iter_time=10.40s]
Epoch 0: 15%|█▌ | 1903/12384 [4:02:23<22:20:11, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=8.04s]
Epoch 0: 15%|█▌ | 1904/12384 [4:02:23<22:16:37, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.04s]
Epoch 0: 15%|█▌ | 1904/12384 [4:02:30<22:16:37, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=7.19s]
Epoch 0: 15%|█▌ | 1905/12384 [4:02:30<22:12:14, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.19s]
Epoch 0: 15%|█▌ | 1905/12384 [4:02:38<22:12:14, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 15%|█▌ | 1906/12384 [4:02:38<22:11:28, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 15%|█▌ | 1906/12384 [4:02:46<22:11:28, 7.62s/it, loss=0.0033, acc=0.9930, iter_time=4.73s]
Epoch 0: 15%|█▌ | 1907/12384 [4:02:46<22:11:31, 7.63s/it, loss=0.0033, acc=0.9930, iter_time=4.73s]
Epoch 0: 15%|█▌ | 1907/12384 [4:02:53<22:11:31, 7.63s/it, loss=0.0008, acc=0.9985, iter_time=10.50s]
Epoch 0: 15%|█▌ | 1908/12384 [4:02:53<22:10:40, 7.62s/it, loss=0.0008, acc=0.9985, iter_time=10.50s]
Epoch 0: 15%|█▌ | 1908/12384 [4:03:01<22:10:40, 7.62s/it, loss=0.0089, acc=0.9913, iter_time=7.60s]
Epoch 0: 15%|█▌ | 1909/12384 [4:03:01<22:09:29, 7.62s/it, loss=0.0089, acc=0.9913, iter_time=7.60s]
Epoch 0: 15%|█▌ | 1909/12384 [4:03:08<22:09:29, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=4.74s]
Epoch 0: 15%|█▌ | 1910/12384 [4:03:08<22:10:03, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=4.74s]
Epoch 0: 15%|█▌ | 1910/12384 [4:03:16<22:10:03, 7.62s/it, loss=0.0008, acc=0.9994, iter_time=10.55s]
Epoch 0: 15%|█▌ | 1911/12384 [4:03:16<22:11:48, 7.63s/it, loss=0.0008, acc=0.9994, iter_time=10.55s]
Epoch 0: 15%|█▌ | 1911/12384 [4:03:24<22:11:48, 7.63s/it, loss=0.0006, acc=0.9993, iter_time=7.57s]
Epoch 0: 15%|█▌ | 1912/12384 [4:03:24<22:11:33, 7.63s/it, loss=0.0006, acc=0.9993, iter_time=7.57s]
Epoch 0: 15%|█▌ | 1912/12384 [4:03:31<22:11:33, 7.63s/it, loss=0.0007, acc=0.9965, iter_time=4.13s]
Epoch 0: 15%|█▌ | 1913/12384 [4:03:31<22:13:19, 7.64s/it, loss=0.0007, acc=0.9965, iter_time=4.13s]
Epoch 0: 15%|█▌ | 1913/12384 [4:03:39<22:13:19, 7.64s/it, loss=0.0010, acc=0.9995, iter_time=9.98s]
Epoch 0: 15%|█▌ | 1914/12384 [4:03:39<22:11:38, 7.63s/it, loss=0.0010, acc=0.9995, iter_time=9.98s]
Epoch 0: 15%|█▌ | 1914/12384 [4:03:47<22:11:38, 7.63s/it, loss=0.0032, acc=0.9896, iter_time=8.82s]
Epoch 0: 15%|█▌ | 1915/12384 [4:03:47<22:09:50, 7.62s/it, loss=0.0032, acc=0.9896, iter_time=8.82s]
Epoch 0: 15%|█▌ | 1915/12384 [4:03:54<22:09:50, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 15%|█▌ | 1916/12384 [4:03:54<22:12:04, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 15%|█▌ | 1916/12384 [4:04:02<22:12:04, 7.64s/it, loss=0.0006, acc=0.9999, iter_time=7.68s]
Epoch 0: 15%|█▌ | 1917/12384 [4:04:02<22:10:42, 7.63s/it, loss=0.0006, acc=0.9999, iter_time=7.68s]
Epoch 0: 15%|█▌ | 1917/12384 [4:04:09<22:10:42, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.09s]
Epoch 0: 15%|█▌ | 1918/12384 [4:04:09<22:09:07, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.09s]
Epoch 0: 15%|█▌ | 1918/12384 [4:04:17<22:09:07, 7.62s/it, loss=0.0013, acc=0.9978, iter_time=9.11s]
Epoch 0: 15%|█▌ | 1919/12384 [4:04:17<22:10:05, 7.63s/it, loss=0.0013, acc=0.9978, iter_time=9.11s]
Epoch 0: 15%|█▌ | 1919/12384 [4:04:25<22:10:05, 7.63s/it, loss=0.0009, acc=0.9955, iter_time=8.03s]
Epoch 0: 16%|█▌ | 1920/12384 [4:04:25<22:09:58, 7.63s/it, loss=0.0009, acc=0.9955, iter_time=8.03s]
Epoch 0: 16%|█▌ | 1920/12384 [4:04:32<22:09:58, 7.63s/it, loss=0.0006, acc=0.9974, iter_time=7.32s]
Epoch 0: 16%|█▌ | 1921/12384 [4:04:32<22:13:00, 7.64s/it, loss=0.0006, acc=0.9974, iter_time=7.32s]
Epoch 0: 16%|█▌ | 1921/12384 [4:04:40<22:13:00, 7.64s/it, loss=0.0003, acc=0.9984, iter_time=7.62s]
Epoch 0: 16%|█▌ | 1922/12384 [4:04:40<22:11:12, 7.63s/it, loss=0.0003, acc=0.9984, iter_time=7.62s]
Epoch 0: 16%|█▌ | 1922/12384 [4:04:48<22:11:12, 7.63s/it, loss=0.0009, acc=0.9977, iter_time=7.59s]
Epoch 0: 16%|█▌ | 1923/12384 [4:04:48<22:09:47, 7.63s/it, loss=0.0009, acc=0.9977, iter_time=7.59s]
Epoch 0: 16%|█▌ | 1923/12384 [4:04:55<22:09:47, 7.63s/it, loss=0.0015, acc=0.9953, iter_time=3.81s]
Epoch 0: 16%|█▌ | 1924/12384 [4:04:55<22:09:55, 7.63s/it, loss=0.0015, acc=0.9953, iter_time=3.81s]
Epoch 0: 16%|█▌ | 1924/12384 [4:05:03<22:09:55, 7.63s/it, loss=0.0014, acc=0.9976, iter_time=11.43s]
Epoch 0: 16%|█▌ | 1925/12384 [4:05:03<22:14:51, 7.66s/it, loss=0.0014, acc=0.9976, iter_time=11.43s]
Epoch 0: 16%|█▌ | 1925/12384 [4:05:11<22:14:51, 7.66s/it, loss=0.0018, acc=0.9983, iter_time=7.73s]
Epoch 0: 16%|█▌ | 1926/12384 [4:05:11<22:12:11, 7.64s/it, loss=0.0018, acc=0.9983, iter_time=7.73s]
Epoch 0: 16%|█▌ | 1926/12384 [4:05:18<22:12:11, 7.64s/it, loss=0.0007, acc=0.9996, iter_time=4.59s]
Epoch 0: 16%|█▌ | 1927/12384 [4:05:18<22:11:18, 7.64s/it, loss=0.0007, acc=0.9996, iter_time=4.59s]
Epoch 0: 16%|█▌ | 1927/12384 [4:05:26<22:11:18, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=11.42s]
Epoch 0: 16%|█▌ | 1928/12384 [4:05:26<22:29:13, 7.74s/it, loss=0.0002, acc=1.0000, iter_time=11.42s]
Epoch 0: 16%|█▌ | 1928/12384 [4:05:34<22:29:13, 7.74s/it, loss=0.0019, acc=0.9942, iter_time=7.21s]
Epoch 0: 16%|█▌ | 1929/12384 [4:05:34<22:22:05, 7.70s/it, loss=0.0019, acc=0.9942, iter_time=7.21s]
Epoch 0: 16%|█▌ | 1929/12384 [4:05:41<22:22:05, 7.70s/it, loss=0.0021, acc=0.9954, iter_time=7.62s]
Epoch 0: 16%|█▌ | 1930/12384 [4:05:41<22:18:14, 7.68s/it, loss=0.0021, acc=0.9954, iter_time=7.62s]
Epoch 0: 16%|█▌ | 1930/12384 [4:05:49<22:18:14, 7.68s/it, loss=0.0006, acc=0.9994, iter_time=7.63s]
Epoch 0: 16%|█▌ | 1931/12384 [4:05:49<22:14:27, 7.66s/it, loss=0.0006, acc=0.9994, iter_time=7.63s]
Epoch 0: 16%|█▌ | 1931/12384 [4:05:57<22:14:27, 7.66s/it, loss=0.0006, acc=0.9998, iter_time=7.30s]
Epoch 0: 16%|█▌ | 1932/12384 [4:05:57<22:12:10, 7.65s/it, loss=0.0006, acc=0.9998, iter_time=7.30s]
Epoch 0: 16%|█▌ | 1932/12384 [4:06:04<22:12:10, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.92s]
Epoch 0: 16%|█▌ | 1933/12384 [4:06:04<22:10:41, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.92s]
Epoch 0: 16%|█▌ | 1933/12384 [4:06:12<22:10:41, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 16%|█▌ | 1934/12384 [4:06:12<22:11:38, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 16%|█▌ | 1934/12384 [4:06:20<22:11:38, 7.65s/it, loss=0.0009, acc=0.9995, iter_time=7.05s]
Epoch 0: 16%|█▌ | 1935/12384 [4:06:20<22:10:14, 7.64s/it, loss=0.0009, acc=0.9995, iter_time=7.05s]
Epoch 0: 16%|█▌ | 1935/12384 [4:06:27<22:10:14, 7.64s/it, loss=0.0005, acc=1.0000, iter_time=8.60s]
Epoch 0: 16%|█▌ | 1936/12384 [4:06:27<22:12:35, 7.65s/it, loss=0.0005, acc=1.0000, iter_time=8.60s]
Epoch 0: 16%|█▌ | 1936/12384 [4:06:35<22:12:35, 7.65s/it, loss=0.0005, acc=0.9981, iter_time=6.11s]
Epoch 0: 16%|█▌ | 1937/12384 [4:06:35<22:08:36, 7.63s/it, loss=0.0005, acc=0.9981, iter_time=6.11s]
Epoch 0: 16%|█▌ | 1937/12384 [4:06:42<22:08:36, 7.63s/it, loss=0.0002, acc=0.9998, iter_time=7.58s]
Epoch 0: 16%|█▌ | 1938/12384 [4:06:42<22:05:59, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=7.58s]
Epoch 0: 16%|█▌ | 1938/12384 [4:06:50<22:05:59, 7.62s/it, loss=0.0016, acc=0.9985, iter_time=8.80s]
Epoch 0: 16%|█▌ | 1939/12384 [4:06:50<22:05:50, 7.62s/it, loss=0.0016, acc=0.9985, iter_time=8.80s]
Epoch 0: 16%|█▌ | 1939/12384 [4:06:58<22:05:50, 7.62s/it, loss=0.0006, acc=0.9991, iter_time=7.63s]
Epoch 0: 16%|█▌ | 1940/12384 [4:06:58<22:06:55, 7.62s/it, loss=0.0006, acc=0.9991, iter_time=7.63s]
Epoch 0: 16%|█▌ | 1940/12384 [4:07:05<22:06:55, 7.62s/it, loss=0.0003, acc=0.9998, iter_time=6.39s]
Epoch 0: 16%|█▌ | 1941/12384 [4:07:05<22:05:47, 7.62s/it, loss=0.0003, acc=0.9998, iter_time=6.39s]
Epoch 0: 16%|█▌ | 1941/12384 [4:07:13<22:05:47, 7.62s/it, loss=0.0019, acc=0.9960, iter_time=8.80s]
Epoch 0: 16%|█▌ | 1942/12384 [4:07:13<22:04:45, 7.61s/it, loss=0.0019, acc=0.9960, iter_time=8.80s]
Epoch 0: 16%|█▌ | 1942/12384 [4:07:20<22:04:45, 7.61s/it, loss=0.0012, acc=0.9983, iter_time=7.63s]
Epoch 0: 16%|█▌ | 1943/12384 [4:07:20<22:04:37, 7.61s/it, loss=0.0012, acc=0.9983, iter_time=7.63s]
Epoch 0: 16%|█▌ | 1943/12384 [4:07:28<22:04:37, 7.61s/it, loss=0.0018, acc=0.9950, iter_time=7.56s]
Epoch 0: 16%|█▌ | 1944/12384 [4:07:28<22:05:15, 7.62s/it, loss=0.0018, acc=0.9950, iter_time=7.56s]
Epoch 0: 16%|█▌ | 1944/12384 [4:07:36<22:05:15, 7.62s/it, loss=0.0006, acc=0.9975, iter_time=4.80s]
Epoch 0: 16%|█▌ | 1945/12384 [4:07:36<22:06:10, 7.62s/it, loss=0.0006, acc=0.9975, iter_time=4.80s]
Epoch 0: 16%|█▌ | 1945/12384 [4:07:43<22:06:10, 7.62s/it, loss=0.0017, acc=0.9941, iter_time=8.17s]
Epoch 0: 16%|█▌ | 1946/12384 [4:07:43<22:05:54, 7.62s/it, loss=0.0017, acc=0.9941, iter_time=8.17s]
Epoch 0: 16%|█▌ | 1946/12384 [4:07:51<22:05:54, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.93s]
Epoch 0: 16%|█▌ | 1947/12384 [4:07:51<22:04:25, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.93s]
Epoch 0: 16%|█▌ | 1947/12384 [4:07:59<22:04:25, 7.61s/it, loss=0.0027, acc=0.9932, iter_time=7.60s]
Epoch 0: 16%|█▌ | 1948/12384 [4:07:59<22:05:21, 7.62s/it, loss=0.0027, acc=0.9932, iter_time=7.60s]
Epoch 0: 16%|█▌ | 1948/12384 [4:08:06<22:05:21, 7.62s/it, loss=0.0011, acc=0.9975, iter_time=6.44s]
Epoch 0: 16%|█▌ | 1949/12384 [4:08:06<22:05:41, 7.62s/it, loss=0.0011, acc=0.9975, iter_time=6.44s]
Epoch 0: 16%|█▌ | 1949/12384 [4:08:14<22:05:41, 7.62s/it, loss=0.0010, acc=0.9976, iter_time=9.23s]
Epoch 0: 16%|█▌ | 1950/12384 [4:08:14<22:05:04, 7.62s/it, loss=0.0010, acc=0.9976, iter_time=9.23s]
Epoch 0: 16%|█▌ | 1950/12384 [4:08:21<22:05:04, 7.62s/it, loss=0.0012, acc=0.9975, iter_time=7.21s]
Epoch 0: 16%|█▌ | 1951/12384 [4:08:21<22:04:14, 7.62s/it, loss=0.0012, acc=0.9975, iter_time=7.21s]
Epoch 0: 16%|█▌ | 1951/12384 [4:08:29<22:04:14, 7.62s/it, loss=0.0020, acc=0.9984, iter_time=7.98s]
Epoch 0: 16%|█▌ | 1952/12384 [4:08:29<22:02:51, 7.61s/it, loss=0.0020, acc=0.9984, iter_time=7.98s]
Epoch 0: 16%|█▌ | 1952/12384 [4:08:37<22:02:51, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.21s]
Epoch 0: 16%|█▌ | 1953/12384 [4:08:37<22:03:39, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.21s]
Epoch 0: 16%|█▌ | 1953/12384 [4:08:45<22:03:39, 7.61s/it, loss=0.0006, acc=0.9966, iter_time=6.74s]
Epoch 0: 16%|█▌ | 1954/12384 [4:08:45<22:20:40, 7.71s/it, loss=0.0006, acc=0.9966, iter_time=6.74s]
Epoch 0: 16%|█▌ | 1954/12384 [4:08:52<22:20:40, 7.71s/it, loss=0.0015, acc=0.9979, iter_time=7.71s]
Epoch 0: 16%|█▌ | 1955/12384 [4:08:52<22:15:47, 7.69s/it, loss=0.0015, acc=0.9979, iter_time=7.71s]
Epoch 0: 16%|█▌ | 1955/12384 [4:09:00<22:15:47, 7.69s/it, loss=0.0001, acc=0.9998, iter_time=5.23s]
Epoch 0: 16%|█▌ | 1956/12384 [4:09:00<22:17:14, 7.69s/it, loss=0.0001, acc=0.9998, iter_time=5.23s]
Epoch 0: 16%|█▌ | 1956/12384 [4:09:08<22:17:14, 7.69s/it, loss=0.0005, acc=0.9980, iter_time=8.93s]
Epoch 0: 16%|█▌ | 1957/12384 [4:09:08<22:18:11, 7.70s/it, loss=0.0005, acc=0.9980, iter_time=8.93s]
Epoch 0: 16%|█▌ | 1957/12384 [4:09:15<22:18:11, 7.70s/it, loss=0.0009, acc=0.9999, iter_time=9.43s]
Epoch 0: 16%|█▌ | 1958/12384 [4:09:15<22:12:38, 7.67s/it, loss=0.0009, acc=0.9999, iter_time=9.43s]
Epoch 0: 16%|█▌ | 1958/12384 [4:09:23<22:12:38, 7.67s/it, loss=0.0110, acc=0.9863, iter_time=6.99s]
Epoch 0: 16%|█▌ | 1959/12384 [4:09:23<22:08:01, 7.64s/it, loss=0.0110, acc=0.9863, iter_time=6.99s]
Epoch 0: 16%|█▌ | 1959/12384 [4:09:30<22:08:01, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=8.75s]
Epoch 0: 16%|█▌ | 1960/12384 [4:09:30<22:06:55, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=8.75s]
Epoch 0: 16%|█▌ | 1960/12384 [4:09:38<22:06:55, 7.64s/it, loss=0.0005, acc=0.9988, iter_time=7.65s]
Epoch 0: 16%|█▌ | 1961/12384 [4:09:38<22:07:47, 7.64s/it, loss=0.0005, acc=0.9988, iter_time=7.65s]
Epoch 0: 16%|█▌ | 1961/12384 [4:09:46<22:07:47, 7.64s/it, loss=0.0009, acc=0.9980, iter_time=6.72s]
Epoch 0: 16%|█▌ | 1962/12384 [4:09:46<22:07:30, 7.64s/it, loss=0.0009, acc=0.9980, iter_time=6.72s]
Epoch 0: 16%|█▌ | 1962/12384 [4:09:53<22:07:30, 7.64s/it, loss=0.0234, acc=0.9554, iter_time=8.57s]
Epoch 0: 16%|█▌ | 1963/12384 [4:09:53<22:05:24, 7.63s/it, loss=0.0234, acc=0.9554, iter_time=8.57s]
Epoch 0: 16%|█▌ | 1963/12384 [4:10:01<22:05:24, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=4.81s]
Epoch 0: 16%|█▌ | 1964/12384 [4:10:01<22:04:22, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=4.81s]
Epoch 0: 16%|█▌ | 1964/12384 [4:10:09<22:04:22, 7.63s/it, loss=0.0012, acc=0.9981, iter_time=10.43s]
Epoch 0: 16%|█▌ | 1965/12384 [4:10:09<22:04:19, 7.63s/it, loss=0.0012, acc=0.9981, iter_time=10.43s]
Epoch 0: 16%|█▌ | 1965/12384 [4:10:16<22:04:19, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 16%|█▌ | 1966/12384 [4:10:16<22:04:32, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 16%|█▌ | 1966/12384 [4:10:24<22:04:32, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 16%|█▌ | 1967/12384 [4:10:24<22:08:13, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 16%|█▌ | 1967/12384 [4:10:32<22:08:13, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.68s]
Epoch 0: 16%|█▌ | 1968/12384 [4:10:32<22:07:08, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.68s]
Epoch 0: 16%|█▌ | 1968/12384 [4:10:39<22:07:08, 7.64s/it, loss=0.0006, acc=0.9980, iter_time=7.64s]
Epoch 0: 16%|█▌ | 1969/12384 [4:10:39<22:04:45, 7.63s/it, loss=0.0006, acc=0.9980, iter_time=7.64s]
Epoch 0: 16%|█▌ | 1969/12384 [4:10:47<22:04:45, 7.63s/it, loss=0.0019, acc=0.9948, iter_time=7.62s]
Epoch 0: 16%|█▌ | 1970/12384 [4:10:47<22:03:26, 7.62s/it, loss=0.0019, acc=0.9948, iter_time=7.62s]
Epoch 0: 16%|█▌ | 1970/12384 [4:10:54<22:03:26, 7.62s/it, loss=0.0023, acc=0.9961, iter_time=4.32s]
Epoch 0: 16%|█▌ | 1971/12384 [4:10:54<22:02:28, 7.62s/it, loss=0.0023, acc=0.9961, iter_time=4.32s]
Epoch 0: 16%|█▌ | 1971/12384 [4:11:02<22:02:28, 7.62s/it, loss=0.0010, acc=0.9983, iter_time=10.89s]
Epoch 0: 16%|█▌ | 1972/12384 [4:11:02<22:01:25, 7.61s/it, loss=0.0010, acc=0.9983, iter_time=10.89s]
Epoch 0: 16%|█▌ | 1972/12384 [4:11:10<22:01:25, 7.61s/it, loss=0.0008, acc=0.9980, iter_time=7.32s]
Epoch 0: 16%|█▌ | 1973/12384 [4:11:10<22:00:05, 7.61s/it, loss=0.0008, acc=0.9980, iter_time=7.32s]
Epoch 0: 16%|█▌ | 1973/12384 [4:11:17<22:00:05, 7.61s/it, loss=0.0005, acc=0.9998, iter_time=7.89s]
Epoch 0: 16%|█▌ | 1974/12384 [4:11:17<22:00:07, 7.61s/it, loss=0.0005, acc=0.9998, iter_time=7.89s]
Epoch 0: 16%|█▌ | 1974/12384 [4:11:25<22:00:07, 7.61s/it, loss=0.0035, acc=0.9948, iter_time=6.67s]
Epoch 0: 16%|█▌ | 1975/12384 [4:11:25<22:00:29, 7.61s/it, loss=0.0035, acc=0.9948, iter_time=6.67s]
Epoch 0: 16%|█▌ | 1975/12384 [4:11:32<22:00:29, 7.61s/it, loss=0.0004, acc=0.9984, iter_time=8.96s]
Epoch 0: 16%|█▌ | 1976/12384 [4:11:32<22:00:37, 7.61s/it, loss=0.0004, acc=0.9984, iter_time=8.96s]
Epoch 0: 16%|█▌ | 1976/12384 [4:11:40<22:00:37, 7.61s/it, loss=0.0003, acc=0.9994, iter_time=6.90s]
Epoch 0: 16%|█▌ | 1977/12384 [4:11:40<22:00:34, 7.61s/it, loss=0.0003, acc=0.9994, iter_time=6.90s]
Epoch 0: 16%|█▌ | 1977/12384 [4:11:48<22:00:34, 7.61s/it, loss=0.0004, acc=0.9996, iter_time=7.93s]
Epoch 0: 16%|█▌ | 1978/12384 [4:11:48<22:00:23, 7.61s/it, loss=0.0004, acc=0.9996, iter_time=7.93s]
Epoch 0: 16%|█▌ | 1978/12384 [4:11:55<22:00:23, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 16%|█▌ | 1979/12384 [4:11:55<21:59:03, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 16%|█▌ | 1979/12384 [4:12:03<21:59:03, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=7.60s]
Epoch 0: 16%|█▌ | 1980/12384 [4:12:03<21:59:40, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=7.60s]
Epoch 0: 16%|█▌ | 1980/12384 [4:12:11<21:59:40, 7.61s/it, loss=0.0006, acc=0.9991, iter_time=7.93s]
Epoch 0: 16%|█▌ | 1981/12384 [4:12:11<22:22:17, 7.74s/it, loss=0.0006, acc=0.9991, iter_time=7.93s]
Epoch 0: 16%|█▌ | 1981/12384 [4:12:19<22:22:17, 7.74s/it, loss=0.0004, acc=0.9991, iter_time=7.81s]
Epoch 0: 16%|█▌ | 1982/12384 [4:12:19<22:19:05, 7.72s/it, loss=0.0004, acc=0.9991, iter_time=7.81s]
Epoch 0: 16%|█▌ | 1982/12384 [4:12:26<22:19:05, 7.72s/it, loss=0.0002, acc=1.0000, iter_time=7.61s]
Epoch 0: 16%|█▌ | 1983/12384 [4:12:26<22:12:33, 7.69s/it, loss=0.0002, acc=1.0000, iter_time=7.61s]
Epoch 0: 16%|█▌ | 1983/12384 [4:12:34<22:12:33, 7.69s/it, loss=0.0002, acc=0.9998, iter_time=8.10s]
Epoch 0: 16%|█▌ | 1984/12384 [4:12:34<22:13:41, 7.69s/it, loss=0.0002, acc=0.9998, iter_time=8.10s]
Epoch 0: 16%|█▌ | 1984/12384 [4:12:41<22:13:41, 7.69s/it, loss=0.0007, acc=0.9972, iter_time=6.29s]
Epoch 0: 16%|█▌ | 1985/12384 [4:12:41<22:08:51, 7.67s/it, loss=0.0007, acc=0.9972, iter_time=6.29s]
Epoch 0: 16%|█▌ | 1985/12384 [4:12:49<22:08:51, 7.67s/it, loss=0.0004, acc=0.9997, iter_time=8.53s]
Epoch 0: 16%|█▌ | 1986/12384 [4:12:49<22:05:04, 7.65s/it, loss=0.0004, acc=0.9997, iter_time=8.53s]
Epoch 0: 16%|█▌ | 1986/12384 [4:12:57<22:05:04, 7.65s/it, loss=0.0003, acc=0.9997, iter_time=7.30s]
Epoch 0: 16%|█▌ | 1987/12384 [4:12:57<22:04:30, 7.64s/it, loss=0.0003, acc=0.9997, iter_time=7.30s]
Epoch 0: 16%|█▌ | 1987/12384 [4:13:04<22:04:30, 7.64s/it, loss=0.0005, acc=1.0000, iter_time=7.92s]
Epoch 0: 16%|█▌ | 1988/12384 [4:13:04<22:03:06, 7.64s/it, loss=0.0005, acc=1.0000, iter_time=7.92s]
Epoch 0: 16%|█▌ | 1988/12384 [4:13:12<22:03:06, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=3.65s]
Epoch 0: 16%|█▌ | 1989/12384 [4:13:12<22:01:57, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=3.65s]
Epoch 0: 16%|█▌ | 1989/12384 [4:13:20<22:01:57, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=11.58s]
Epoch 0: 16%|█▌ | 1990/12384 [4:13:20<22:00:45, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=11.58s]
Epoch 0: 16%|█▌ | 1990/12384 [4:13:27<22:00:45, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=6.17s]
Epoch 0: 16%|█▌ | 1991/12384 [4:13:27<21:59:56, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=6.17s]
Epoch 0: 16%|█▌ | 1991/12384 [4:13:35<21:59:56, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=9.43s]
Epoch 0: 16%|█▌ | 1992/12384 [4:13:35<21:59:55, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=9.43s]
Epoch 0: 16%|█▌ | 1992/12384 [4:13:42<21:59:55, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.10s]
Epoch 0: 16%|█▌ | 1993/12384 [4:13:42<21:59:38, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.10s]
Epoch 0: 16%|█▌ | 1993/12384 [4:13:50<21:59:38, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=8.46s]
Epoch 0: 16%|█▌ | 1994/12384 [4:13:50<21:59:39, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=8.46s]
Epoch 0: 16%|█▌ | 1994/12384 [4:13:58<21:59:39, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=9.93s]
Epoch 0: 16%|█▌ | 1995/12384 [4:13:58<21:59:25, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=9.93s]
Epoch 0: 16%|█▌ | 1995/12384 [4:14:05<21:59:25, 7.62s/it, loss=0.0005, acc=1.0000, iter_time=7.60s]
Epoch 0: 16%|█▌ | 1996/12384 [4:14:05<21:57:18, 7.61s/it, loss=0.0005, acc=1.0000, iter_time=7.60s]
Epoch 0: 16%|█▌ | 1996/12384 [4:14:13<21:57:18, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 16%|█▌ | 1997/12384 [4:14:13<21:57:03, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 16%|█▌ | 1997/12384 [4:14:20<21:57:03, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.54s]
Epoch 0: 16%|█▌ | 1998/12384 [4:14:20<21:58:13, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.54s]
Epoch 0: 16%|█▌ | 1998/12384 [4:14:28<21:58:13, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=10.69s]
Epoch 0: 16%|█▌ | 1999/12384 [4:14:28<21:56:41, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=10.69s]
Epoch 0: 16%|█▌ | 1999/12384 [4:14:36<21:56:41, 7.61s/it, loss=0.0004, acc=0.9998, iter_time=8.01s]
Epoch 0: 16%|█▌ | 2000/12384 [4:14:36<22:06:59, 7.67s/it, loss=0.0004, acc=0.9998, iter_time=8.01s]
Epoch 0: 16%|█▌ | 2000/12384 [4:14:43<22:06:59, 7.67s/it, loss=0.0011, acc=0.9961, iter_time=7.10s]
Epoch 0: 16%|█▌ | 2001/12384 [4:14:43<22:04:31, 7.65s/it, loss=0.0011, acc=0.9961, iter_time=7.10s]
Epoch 0: 16%|█▌ | 2001/12384 [4:14:51<22:04:31, 7.65s/it, loss=0.0001, acc=0.9998, iter_time=7.37s]
Epoch 0: 16%|█▌ | 2002/12384 [4:14:51<22:03:15, 7.65s/it, loss=0.0001, acc=0.9998, iter_time=7.37s]
Epoch 0: 16%|█▌ | 2002/12384 [4:14:59<22:03:15, 7.65s/it, loss=0.0007, acc=0.9977, iter_time=8.19s]
Epoch 0: 16%|█▌ | 2003/12384 [4:14:59<22:01:33, 7.64s/it, loss=0.0007, acc=0.9977, iter_time=8.19s]
Epoch 0: 16%|█▌ | 2003/12384 [4:15:06<22:01:33, 7.64s/it, loss=0.0027, acc=0.9974, iter_time=7.63s]
Epoch 0: 16%|█▌ | 2004/12384 [4:15:06<22:00:28, 7.63s/it, loss=0.0027, acc=0.9974, iter_time=7.63s]
Epoch 0: 16%|█▌ | 2004/12384 [4:15:14<22:00:28, 7.63s/it, loss=0.0013, acc=0.9964, iter_time=7.60s]
Epoch 0: 16%|█▌ | 2005/12384 [4:15:14<21:58:38, 7.62s/it, loss=0.0013, acc=0.9964, iter_time=7.60s]
Epoch 0: 16%|█▌ | 2005/12384 [4:15:22<21:58:38, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.90s]
Epoch 0: 16%|█▌ | 2006/12384 [4:15:22<22:12:09, 7.70s/it, loss=0.0002, acc=1.0000, iter_time=7.90s]
Epoch 0: 16%|█▌ | 2006/12384 [4:15:30<22:12:09, 7.70s/it, loss=0.0004, acc=0.9995, iter_time=7.64s]
Epoch 0: 16%|█▌ | 2007/12384 [4:15:30<22:23:41, 7.77s/it, loss=0.0004, acc=0.9995, iter_time=7.64s]
Epoch 0: 16%|█▌ | 2007/12384 [4:15:37<22:23:41, 7.77s/it, loss=0.0003, acc=1.0000, iter_time=8.25s]
Epoch 0: 16%|█▌ | 2008/12384 [4:15:37<22:15:26, 7.72s/it, loss=0.0003, acc=1.0000, iter_time=8.25s]
Epoch 0: 16%|█▌ | 2008/12384 [4:15:45<22:15:26, 7.72s/it, loss=0.0007, acc=0.9988, iter_time=7.26s]
Epoch 0: 16%|█▌ | 2009/12384 [4:15:45<22:10:14, 7.69s/it, loss=0.0007, acc=0.9988, iter_time=7.26s]
Epoch 0: 16%|█▌ | 2009/12384 [4:15:53<22:10:14, 7.69s/it, loss=0.0108, acc=0.9933, iter_time=4.31s]
Epoch 0: 16%|█▌ | 2010/12384 [4:15:53<22:06:29, 7.67s/it, loss=0.0108, acc=0.9933, iter_time=4.31s]
Epoch 0: 16%|█▌ | 2010/12384 [4:16:00<22:06:29, 7.67s/it, loss=0.0006, acc=0.9983, iter_time=10.90s]
Epoch 0: 16%|█▌ | 2011/12384 [4:16:00<22:02:11, 7.65s/it, loss=0.0006, acc=0.9983, iter_time=10.90s]
Epoch 0: 16%|█▌ | 2011/12384 [4:16:08<22:02:11, 7.65s/it, loss=0.0018, acc=0.9972, iter_time=7.60s]
Epoch 0: 16%|█▌ | 2012/12384 [4:16:08<21:59:17, 7.63s/it, loss=0.0018, acc=0.9972, iter_time=7.60s]
Epoch 0: 16%|█▌ | 2012/12384 [4:16:15<21:59:17, 7.63s/it, loss=0.0006, acc=0.9987, iter_time=6.39s]
Epoch 0: 16%|█▋ | 2013/12384 [4:16:15<21:58:14, 7.63s/it, loss=0.0006, acc=0.9987, iter_time=6.39s]
Epoch 0: 16%|█▋ | 2013/12384 [4:16:23<21:58:14, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.21s]
Epoch 0: 16%|█▋ | 2014/12384 [4:16:23<21:56:43, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.21s]
Epoch 0: 16%|█▋ | 2014/12384 [4:16:31<21:56:43, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.20s]
Epoch 0: 16%|█▋ | 2015/12384 [4:16:31<21:55:58, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.20s]
Epoch 0: 16%|█▋ | 2015/12384 [4:16:38<21:55:58, 7.61s/it, loss=0.0017, acc=0.9963, iter_time=7.56s]
Epoch 0: 16%|█▋ | 2016/12384 [4:16:38<21:54:56, 7.61s/it, loss=0.0017, acc=0.9963, iter_time=7.56s]
Epoch 0: 16%|█▋ | 2016/12384 [4:16:46<21:54:56, 7.61s/it, loss=0.0007, acc=0.9967, iter_time=7.32s]
Epoch 0: 16%|█▋ | 2017/12384 [4:16:46<21:54:06, 7.61s/it, loss=0.0007, acc=0.9967, iter_time=7.32s]
Epoch 0: 16%|█▋ | 2017/12384 [4:16:53<21:54:06, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=6.99s]
Epoch 0: 16%|█▋ | 2018/12384 [4:16:53<21:54:48, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=6.99s]
Epoch 0: 16%|█▋ | 2018/12384 [4:17:01<21:54:48, 7.61s/it, loss=0.0019, acc=0.9958, iter_time=8.56s]
Epoch 0: 16%|█▋ | 2019/12384 [4:17:01<21:55:53, 7.62s/it, loss=0.0019, acc=0.9958, iter_time=8.56s]
Epoch 0: 16%|█▋ | 2019/12384 [4:17:09<21:55:53, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.64s]
Epoch 0: 16%|█▋ | 2020/12384 [4:17:09<21:57:46, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.64s]
Epoch 0: 16%|█▋ | 2020/12384 [4:17:16<21:57:46, 7.63s/it, loss=0.0005, acc=0.9977, iter_time=7.65s]
Epoch 0: 16%|█▋ | 2021/12384 [4:17:16<21:55:22, 7.62s/it, loss=0.0005, acc=0.9977, iter_time=7.65s]
Epoch 0: 16%|█▋ | 2021/12384 [4:17:24<21:55:22, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=4.73s]
Epoch 0: 16%|█▋ | 2022/12384 [4:17:24<21:55:11, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=4.73s]
Epoch 0: 16%|█▋ | 2022/12384 [4:17:32<21:55:11, 7.62s/it, loss=0.0002, acc=0.9991, iter_time=10.49s]
Epoch 0: 16%|█▋ | 2023/12384 [4:17:32<21:55:49, 7.62s/it, loss=0.0002, acc=0.9991, iter_time=10.49s]
Epoch 0: 16%|█▋ | 2023/12384 [4:17:39<21:55:49, 7.62s/it, loss=0.0016, acc=0.9940, iter_time=8.01s]
Epoch 0: 16%|█▋ | 2024/12384 [4:17:39<21:55:09, 7.62s/it, loss=0.0016, acc=0.9940, iter_time=8.01s]
Epoch 0: 16%|█▋ | 2024/12384 [4:17:47<21:55:09, 7.62s/it, loss=0.0006, acc=0.9985, iter_time=7.23s]
Epoch 0: 16%|█▋ | 2025/12384 [4:17:47<21:57:27, 7.63s/it, loss=0.0006, acc=0.9985, iter_time=7.23s]
Epoch 0: 16%|█▋ | 2025/12384 [4:17:54<21:57:27, 7.63s/it, loss=0.0017, acc=0.9965, iter_time=7.65s]
Epoch 0: 16%|█▋ | 2026/12384 [4:17:54<21:56:58, 7.63s/it, loss=0.0017, acc=0.9965, iter_time=7.65s]
Epoch 0: 16%|█▋ | 2026/12384 [4:18:02<21:56:58, 7.63s/it, loss=0.0033, acc=0.9953, iter_time=7.62s]
Epoch 0: 16%|█▋ | 2027/12384 [4:18:02<21:55:47, 7.62s/it, loss=0.0033, acc=0.9953, iter_time=7.62s]
Epoch 0: 16%|█▋ | 2027/12384 [4:18:10<21:55:47, 7.62s/it, loss=0.0007, acc=0.9979, iter_time=7.62s]
Epoch 0: 16%|█▋ | 2028/12384 [4:18:10<21:55:07, 7.62s/it, loss=0.0007, acc=0.9979, iter_time=7.62s]
Epoch 0: 16%|█▋ | 2028/12384 [4:18:17<21:55:07, 7.62s/it, loss=0.0008, acc=0.9980, iter_time=7.63s]
Epoch 0: 16%|█▋ | 2029/12384 [4:18:17<21:55:04, 7.62s/it, loss=0.0008, acc=0.9980, iter_time=7.63s]
Epoch 0: 16%|█▋ | 2029/12384 [4:18:25<21:55:04, 7.62s/it, loss=0.0022, acc=0.9895, iter_time=7.60s]
Epoch 0: 16%|█▋ | 2030/12384 [4:18:25<21:53:24, 7.61s/it, loss=0.0022, acc=0.9895, iter_time=7.60s]
Epoch 0: 16%|█▋ | 2030/12384 [4:18:33<21:53:24, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.58s]
Epoch 0: 16%|█▋ | 2031/12384 [4:18:33<21:52:12, 7.60s/it, loss=0.0002, acc=1.0000, iter_time=7.58s]
Epoch 0: 16%|█▋ | 2031/12384 [4:18:40<21:52:12, 7.60s/it, loss=0.0012, acc=0.9958, iter_time=8.30s]
Epoch 0: 16%|█▋ | 2032/12384 [4:18:40<22:07:54, 7.70s/it, loss=0.0012, acc=0.9958, iter_time=8.30s]
Epoch 0: 16%|█▋ | 2032/12384 [4:18:48<22:07:54, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=3.66s]
Epoch 0: 16%|█▋ | 2033/12384 [4:18:48<22:20:33, 7.77s/it, loss=0.0001, acc=1.0000, iter_time=3.66s]
Epoch 0: 16%|█▋ | 2033/12384 [4:18:56<22:20:33, 7.77s/it, loss=0.0003, acc=0.9998, iter_time=9.76s]
Epoch 0: 16%|█▋ | 2034/12384 [4:18:56<22:12:54, 7.73s/it, loss=0.0003, acc=0.9998, iter_time=9.76s]
Epoch 0: 16%|█▋ | 2034/12384 [4:19:04<22:12:54, 7.73s/it, loss=0.0078, acc=0.9892, iter_time=9.36s]
Epoch 0: 16%|█▋ | 2035/12384 [4:19:04<22:05:37, 7.69s/it, loss=0.0078, acc=0.9892, iter_time=9.36s]
Epoch 0: 16%|█▋ | 2035/12384 [4:19:11<22:05:37, 7.69s/it, loss=0.0014, acc=0.9959, iter_time=7.30s]
Epoch 0: 16%|█▋ | 2036/12384 [4:19:11<22:01:41, 7.66s/it, loss=0.0014, acc=0.9959, iter_time=7.30s]
Epoch 0: 16%|█▋ | 2036/12384 [4:19:19<22:01:41, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=6.42s]
Epoch 0: 16%|█▋ | 2037/12384 [4:19:19<21:58:39, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=6.42s]
Epoch 0: 16%|█▋ | 2037/12384 [4:19:26<21:58:39, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=6.07s]
Epoch 0: 16%|█▋ | 2038/12384 [4:19:26<21:56:43, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.07s]
Epoch 0: 16%|█▋ | 2038/12384 [4:19:34<21:56:43, 7.64s/it, loss=0.0006, acc=0.9986, iter_time=10.65s]
Epoch 0: 16%|█▋ | 2039/12384 [4:19:34<21:54:54, 7.63s/it, loss=0.0006, acc=0.9986, iter_time=10.65s]
Epoch 0: 16%|█▋ | 2039/12384 [4:19:42<21:54:54, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=8.00s]
Epoch 0: 16%|█▋ | 2040/12384 [4:19:42<21:53:50, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=8.00s]
Epoch 0: 16%|█▋ | 2040/12384 [4:19:49<21:53:50, 7.62s/it, loss=0.0013, acc=0.9969, iter_time=7.19s]
Epoch 0: 16%|█▋ | 2041/12384 [4:19:49<21:52:55, 7.62s/it, loss=0.0013, acc=0.9969, iter_time=7.19s]
Epoch 0: 16%|█▋ | 2041/12384 [4:19:57<21:52:55, 7.62s/it, loss=0.0009, acc=0.9990, iter_time=6.77s]
Epoch 0: 16%|█▋ | 2042/12384 [4:19:57<21:52:55, 7.62s/it, loss=0.0009, acc=0.9990, iter_time=6.77s]
Epoch 0: 16%|█▋ | 2042/12384 [4:20:04<21:52:55, 7.62s/it, loss=0.0008, acc=0.9980, iter_time=8.46s]
Epoch 0: 16%|█▋ | 2043/12384 [4:20:04<21:51:30, 7.61s/it, loss=0.0008, acc=0.9980, iter_time=8.46s]
Epoch 0: 16%|█▋ | 2043/12384 [4:20:12<21:51:30, 7.61s/it, loss=0.0013, acc=0.9952, iter_time=7.59s]
Epoch 0: 17%|█▋ | 2044/12384 [4:20:12<21:51:02, 7.61s/it, loss=0.0013, acc=0.9952, iter_time=7.59s]
Epoch 0: 17%|█▋ | 2044/12384 [4:20:20<21:51:02, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=7.34s]
Epoch 0: 17%|█▋ | 2045/12384 [4:20:20<21:52:02, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=7.34s]
Epoch 0: 17%|█▋ | 2045/12384 [4:20:27<21:52:02, 7.61s/it, loss=0.0004, acc=0.9998, iter_time=5.90s]
Epoch 0: 17%|█▋ | 2046/12384 [4:20:27<21:50:54, 7.61s/it, loss=0.0004, acc=0.9998, iter_time=5.90s]
Epoch 0: 17%|█▋ | 2046/12384 [4:20:35<21:50:54, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=9.60s]
Epoch 0: 17%|█▋ | 2047/12384 [4:20:35<21:51:12, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=9.60s]
Epoch 0: 17%|█▋ | 2047/12384 [4:20:42<21:51:12, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=8.00s]
Epoch 0: 17%|█▋ | 2048/12384 [4:20:42<21:50:49, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=8.00s]
Epoch 0: 17%|█▋ | 2048/12384 [4:20:50<21:50:49, 7.61s/it, loss=0.0019, acc=0.9946, iter_time=7.23s]
Epoch 0: 17%|█▋ | 2049/12384 [4:20:50<21:51:28, 7.61s/it, loss=0.0019, acc=0.9946, iter_time=7.23s]
Epoch 0: 17%|█▋ | 2049/12384 [4:20:58<21:51:28, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.06s]
Epoch 0: 17%|█▋ | 2050/12384 [4:20:58<21:53:03, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.06s]
Epoch 0: 17%|█▋ | 2050/12384 [4:21:05<21:53:03, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.22s]
Epoch 0: 17%|█▋ | 2051/12384 [4:21:05<21:53:13, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.22s]
Epoch 0: 17%|█▋ | 2051/12384 [4:21:13<21:53:13, 7.63s/it, loss=0.0006, acc=0.9985, iter_time=7.62s]
Epoch 0: 17%|█▋ | 2052/12384 [4:21:13<21:57:26, 7.65s/it, loss=0.0006, acc=0.9985, iter_time=7.62s]
Epoch 0: 17%|█▋ | 2052/12384 [4:21:21<21:57:26, 7.65s/it, loss=0.0001, acc=0.9995, iter_time=7.72s]
Epoch 0: 17%|█▋ | 2053/12384 [4:21:21<21:58:46, 7.66s/it, loss=0.0001, acc=0.9995, iter_time=7.72s]
Epoch 0: 17%|█▋ | 2053/12384 [4:21:28<21:58:46, 7.66s/it, loss=0.0018, acc=0.9981, iter_time=7.67s]
Epoch 0: 17%|█▋ | 2054/12384 [4:21:28<21:56:14, 7.65s/it, loss=0.0018, acc=0.9981, iter_time=7.67s]
Epoch 0: 17%|█▋ | 2054/12384 [4:21:36<21:56:14, 7.65s/it, loss=0.0010, acc=0.9964, iter_time=4.80s]
Epoch 0: 17%|█▋ | 2055/12384 [4:21:36<21:54:46, 7.64s/it, loss=0.0010, acc=0.9964, iter_time=4.80s]
Epoch 0: 17%|█▋ | 2055/12384 [4:21:44<21:54:46, 7.64s/it, loss=0.0008, acc=0.9981, iter_time=10.81s]
Epoch 0: 17%|█▋ | 2056/12384 [4:21:44<21:52:07, 7.62s/it, loss=0.0008, acc=0.9981, iter_time=10.81s]
Epoch 0: 17%|█▋ | 2056/12384 [4:21:51<21:52:07, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.20s]
Epoch 0: 17%|█▋ | 2057/12384 [4:21:51<21:50:23, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.20s]
Epoch 0: 17%|█▋ | 2057/12384 [4:21:59<21:50:23, 7.61s/it, loss=0.0003, acc=0.9988, iter_time=7.60s]
Epoch 0: 17%|█▋ | 2058/12384 [4:21:59<21:50:43, 7.62s/it, loss=0.0003, acc=0.9988, iter_time=7.60s]
Epoch 0: 17%|█▋ | 2058/12384 [4:22:07<21:50:43, 7.62s/it, loss=0.0127, acc=0.9778, iter_time=7.94s]
Epoch 0: 17%|█▋ | 2059/12384 [4:22:07<22:08:19, 7.72s/it, loss=0.0127, acc=0.9778, iter_time=7.94s]
Epoch 0: 17%|█▋ | 2059/12384 [4:22:14<22:08:19, 7.72s/it, loss=0.0002, acc=1.0000, iter_time=6.13s]
Epoch 0: 17%|█▋ | 2060/12384 [4:22:14<22:01:30, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=6.13s]
Epoch 0: 17%|█▋ | 2060/12384 [4:22:22<22:01:30, 7.68s/it, loss=0.0168, acc=0.9786, iter_time=9.10s]
Epoch 0: 17%|█▋ | 2061/12384 [4:22:22<21:57:46, 7.66s/it, loss=0.0168, acc=0.9786, iter_time=9.10s]
Epoch 0: 17%|█▋ | 2061/12384 [4:22:30<21:57:46, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.63s]
Epoch 0: 17%|█▋ | 2062/12384 [4:22:30<21:55:45, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.63s]
Epoch 0: 17%|█▋ | 2062/12384 [4:22:37<21:55:45, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 17%|█▋ | 2063/12384 [4:22:37<21:53:07, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 17%|█▋ | 2063/12384 [4:22:45<21:53:07, 7.63s/it, loss=0.0004, acc=0.9998, iter_time=7.99s]
Epoch 0: 17%|█▋ | 2064/12384 [4:22:45<21:53:42, 7.64s/it, loss=0.0004, acc=0.9998, iter_time=7.99s]
Epoch 0: 17%|█▋ | 2064/12384 [4:22:52<21:53:42, 7.64s/it, loss=0.0016, acc=0.9990, iter_time=7.24s]
Epoch 0: 17%|█▋ | 2065/12384 [4:22:52<21:51:10, 7.62s/it, loss=0.0016, acc=0.9990, iter_time=7.24s]
Epoch 0: 17%|█▋ | 2065/12384 [4:23:00<21:51:10, 7.62s/it, loss=0.0010, acc=0.9958, iter_time=7.61s]
Epoch 0: 17%|█▋ | 2066/12384 [4:23:00<21:50:46, 7.62s/it, loss=0.0010, acc=0.9958, iter_time=7.61s]
Epoch 0: 17%|█▋ | 2066/12384 [4:23:08<21:50:46, 7.62s/it, loss=0.0006, acc=0.9994, iter_time=7.60s]
Epoch 0: 17%|█▋ | 2067/12384 [4:23:08<21:49:56, 7.62s/it, loss=0.0006, acc=0.9994, iter_time=7.60s]
Epoch 0: 17%|█▋ | 2067/12384 [4:23:15<21:49:56, 7.62s/it, loss=0.0020, acc=0.9943, iter_time=7.63s]
Epoch 0: 17%|█▋ | 2068/12384 [4:23:15<21:49:15, 7.61s/it, loss=0.0020, acc=0.9943, iter_time=7.63s]
Epoch 0: 17%|█▋ | 2068/12384 [4:23:23<21:49:15, 7.61s/it, loss=0.0009, acc=0.9972, iter_time=7.59s]
Epoch 0: 17%|█▋ | 2069/12384 [4:23:23<21:49:45, 7.62s/it, loss=0.0009, acc=0.9972, iter_time=7.59s]
Epoch 0: 17%|█▋ | 2069/12384 [4:23:31<21:49:45, 7.62s/it, loss=0.0008, acc=0.9986, iter_time=7.63s]
Epoch 0: 17%|█▋ | 2070/12384 [4:23:31<21:49:43, 7.62s/it, loss=0.0008, acc=0.9986, iter_time=7.63s]
Epoch 0: 17%|█▋ | 2070/12384 [4:23:38<21:49:43, 7.62s/it, loss=0.0004, acc=0.9963, iter_time=6.70s]
Epoch 0: 17%|█▋ | 2071/12384 [4:23:38<21:48:58, 7.62s/it, loss=0.0004, acc=0.9963, iter_time=6.70s]
Epoch 0: 17%|█▋ | 2071/12384 [4:23:46<21:48:58, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.92s]
Epoch 0: 17%|█▋ | 2072/12384 [4:23:46<21:47:47, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.92s]
Epoch 0: 17%|█▋ | 2072/12384 [4:23:53<21:47:47, 7.61s/it, loss=0.0008, acc=0.9979, iter_time=7.21s]
Epoch 0: 17%|█▋ | 2073/12384 [4:23:53<21:47:34, 7.61s/it, loss=0.0008, acc=0.9979, iter_time=7.21s]
Epoch 0: 17%|█▋ | 2073/12384 [4:24:01<21:47:34, 7.61s/it, loss=0.0004, acc=1.0000, iter_time=7.60s]
Epoch 0: 17%|█▋ | 2074/12384 [4:24:01<21:48:19, 7.61s/it, loss=0.0004, acc=1.0000, iter_time=7.60s]
Epoch 0: 17%|█▋ | 2074/12384 [4:24:09<21:48:19, 7.61s/it, loss=0.0010, acc=0.9987, iter_time=7.62s]
Epoch 0: 17%|█▋ | 2075/12384 [4:24:09<21:47:11, 7.61s/it, loss=0.0010, acc=0.9987, iter_time=7.62s]
Epoch 0: 17%|█▋ | 2075/12384 [4:24:16<21:47:11, 7.61s/it, loss=0.0004, acc=1.0000, iter_time=7.60s]
Epoch 0: 17%|█▋ | 2076/12384 [4:24:16<21:46:33, 7.61s/it, loss=0.0004, acc=1.0000, iter_time=7.60s]
Epoch 0: 17%|█▋ | 2076/12384 [4:24:24<21:46:33, 7.61s/it, loss=0.0005, acc=0.9984, iter_time=7.59s]
Epoch 0: 17%|█▋ | 2077/12384 [4:24:24<21:46:40, 7.61s/it, loss=0.0005, acc=0.9984, iter_time=7.59s]
Epoch 0: 17%|█▋ | 2077/12384 [4:24:31<21:46:40, 7.61s/it, loss=0.0011, acc=0.9990, iter_time=7.61s]
Epoch 0: 17%|█▋ | 2078/12384 [4:24:31<21:46:50, 7.61s/it, loss=0.0011, acc=0.9990, iter_time=7.61s]
Epoch 0: 17%|█▋ | 2078/12384 [4:24:39<21:46:50, 7.61s/it, loss=0.0017, acc=0.9956, iter_time=7.61s]
Epoch 0: 17%|█▋ | 2079/12384 [4:24:39<21:46:44, 7.61s/it, loss=0.0017, acc=0.9956, iter_time=7.61s]
Epoch 0: 17%|█▋ | 2079/12384 [4:24:47<21:46:44, 7.61s/it, loss=0.0004, acc=1.0000, iter_time=8.02s]
Epoch 0: 17%|█▋ | 2080/12384 [4:24:47<21:46:56, 7.61s/it, loss=0.0004, acc=1.0000, iter_time=8.02s]
Epoch 0: 17%|█▋ | 2080/12384 [4:24:54<21:46:56, 7.61s/it, loss=0.0006, acc=0.9966, iter_time=7.19s]
Epoch 0: 17%|█▋ | 2081/12384 [4:24:54<21:52:01, 7.64s/it, loss=0.0006, acc=0.9966, iter_time=7.19s]
Epoch 0: 17%|█▋ | 2081/12384 [4:25:02<21:52:01, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.19s]
Epoch 0: 17%|█▋ | 2082/12384 [4:25:02<21:49:54, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.19s]
Epoch 0: 17%|█▋ | 2082/12384 [4:25:10<21:49:54, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.13s]
Epoch 0: 17%|█▋ | 2083/12384 [4:25:10<21:49:00, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.13s]
Epoch 0: 17%|█▋ | 2083/12384 [4:25:17<21:49:00, 7.62s/it, loss=0.0006, acc=0.9991, iter_time=7.64s]
Epoch 0: 17%|█▋ | 2084/12384 [4:25:17<21:49:30, 7.63s/it, loss=0.0006, acc=0.9991, iter_time=7.64s]
Epoch 0: 17%|█▋ | 2084/12384 [4:25:25<21:49:30, 7.63s/it, loss=0.0055, acc=0.9762, iter_time=6.45s]
Epoch 0: 17%|█▋ | 2085/12384 [4:25:25<22:05:22, 7.72s/it, loss=0.0055, acc=0.9762, iter_time=6.45s]
Epoch 0: 17%|█▋ | 2085/12384 [4:25:33<22:05:22, 7.72s/it, loss=0.0002, acc=0.9998, iter_time=8.53s]
Epoch 0: 17%|█▋ | 2086/12384 [4:25:33<21:58:24, 7.68s/it, loss=0.0002, acc=0.9998, iter_time=8.53s]
Epoch 0: 17%|█▋ | 2086/12384 [4:25:40<21:58:24, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=8.18s]
Epoch 0: 17%|█▋ | 2087/12384 [4:25:40<21:54:53, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=8.18s]
Epoch 0: 17%|█▋ | 2087/12384 [4:25:48<21:54:53, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.58s]
Epoch 0: 17%|█▋ | 2088/12384 [4:25:48<21:52:43, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.58s]
Epoch 0: 17%|█▋ | 2088/12384 [4:25:56<21:52:43, 7.65s/it, loss=0.0004, acc=0.9984, iter_time=7.06s]
Epoch 0: 17%|█▋ | 2089/12384 [4:25:56<21:50:15, 7.64s/it, loss=0.0004, acc=0.9984, iter_time=7.06s]
Epoch 0: 17%|█▋ | 2089/12384 [4:26:03<21:50:15, 7.64s/it, loss=0.0004, acc=0.9984, iter_time=8.20s]
Epoch 0: 17%|█▋ | 2090/12384 [4:26:03<21:49:44, 7.63s/it, loss=0.0004, acc=0.9984, iter_time=8.20s]
Epoch 0: 17%|█▋ | 2090/12384 [4:26:11<21:49:44, 7.63s/it, loss=0.0007, acc=0.9988, iter_time=4.57s]
Epoch 0: 17%|█▋ | 2091/12384 [4:26:11<21:49:01, 7.63s/it, loss=0.0007, acc=0.9988, iter_time=4.57s]
Epoch 0: 17%|█▋ | 2091/12384 [4:26:18<21:49:01, 7.63s/it, loss=0.0009, acc=0.9957, iter_time=7.63s]
Epoch 0: 17%|█▋ | 2092/12384 [4:26:18<21:48:28, 7.63s/it, loss=0.0009, acc=0.9957, iter_time=7.63s]
Epoch 0: 17%|█▋ | 2092/12384 [4:26:26<21:48:28, 7.63s/it, loss=0.0010, acc=0.9992, iter_time=10.43s]
Epoch 0: 17%|█▋ | 2093/12384 [4:26:26<21:47:48, 7.62s/it, loss=0.0010, acc=0.9992, iter_time=10.43s]
Epoch 0: 17%|█▋ | 2093/12384 [4:26:34<21:47:48, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.88s]
Epoch 0: 17%|█▋ | 2094/12384 [4:26:34<21:46:39, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.88s]
Epoch 0: 17%|█▋ | 2094/12384 [4:26:41<21:46:39, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=5.79s]
Epoch 0: 17%|█▋ | 2095/12384 [4:26:41<21:46:15, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=5.79s]
Epoch 0: 17%|█▋ | 2095/12384 [4:26:49<21:46:15, 7.62s/it, loss=0.0012, acc=0.9955, iter_time=9.40s]
Epoch 0: 17%|█▋ | 2096/12384 [4:26:49<21:46:39, 7.62s/it, loss=0.0012, acc=0.9955, iter_time=9.40s]
Epoch 0: 17%|█▋ | 2096/12384 [4:26:56<21:46:39, 7.62s/it, loss=0.0055, acc=0.9894, iter_time=7.64s]
Epoch 0: 17%|█▋ | 2097/12384 [4:26:56<21:44:41, 7.61s/it, loss=0.0055, acc=0.9894, iter_time=7.64s]
Epoch 0: 17%|█▋ | 2097/12384 [4:27:04<21:44:41, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.98s]
Epoch 0: 17%|█▋ | 2098/12384 [4:27:04<21:44:28, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.98s]
Epoch 0: 17%|█▋ | 2098/12384 [4:27:12<21:44:28, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.21s]
Epoch 0: 17%|█▋ | 2099/12384 [4:27:12<21:43:37, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.21s]
Epoch 0: 17%|█▋ | 2099/12384 [4:27:19<21:43:37, 7.61s/it, loss=0.0025, acc=0.9942, iter_time=7.99s]
Epoch 0: 17%|█▋ | 2100/12384 [4:27:19<21:42:26, 7.60s/it, loss=0.0025, acc=0.9942, iter_time=7.99s]
Epoch 0: 17%|█▋ | 2100/12384 [4:27:27<21:42:26, 7.60s/it, loss=0.0016, acc=0.9949, iter_time=7.22s]
Epoch 0: 17%|█▋ | 2101/12384 [4:27:27<21:42:49, 7.60s/it, loss=0.0016, acc=0.9949, iter_time=7.22s]
Epoch 0: 17%|█▋ | 2101/12384 [4:27:34<21:42:49, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 17%|█▋ | 2102/12384 [4:27:34<21:42:50, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 17%|█▋ | 2102/12384 [4:27:42<21:42:50, 7.60s/it, loss=0.0005, acc=0.9988, iter_time=7.61s]
Epoch 0: 17%|█▋ | 2103/12384 [4:27:42<21:44:07, 7.61s/it, loss=0.0005, acc=0.9988, iter_time=7.61s]
Epoch 0: 17%|█▋ | 2103/12384 [4:27:50<21:44:07, 7.61s/it, loss=0.0020, acc=0.9977, iter_time=7.58s]
Epoch 0: 17%|█▋ | 2104/12384 [4:27:50<21:44:01, 7.61s/it, loss=0.0020, acc=0.9977, iter_time=7.58s]
Epoch 0: 17%|█▋ | 2104/12384 [4:27:57<21:44:01, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.02s]
Epoch 0: 17%|█▋ | 2105/12384 [4:27:57<21:42:38, 7.60s/it, loss=0.0002, acc=1.0000, iter_time=7.02s]
Epoch 0: 17%|█▋ | 2105/12384 [4:28:05<21:42:38, 7.60s/it, loss=0.0004, acc=0.9992, iter_time=8.24s]
Epoch 0: 17%|█▋ | 2106/12384 [4:28:05<21:43:18, 7.61s/it, loss=0.0004, acc=0.9992, iter_time=8.24s]
Epoch 0: 17%|█▋ | 2106/12384 [4:28:13<21:43:18, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 17%|█▋ | 2107/12384 [4:28:13<21:43:54, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 17%|█▋ | 2107/12384 [4:28:20<21:43:54, 7.61s/it, loss=0.0007, acc=0.9978, iter_time=7.63s]
Epoch 0: 17%|█▋ | 2108/12384 [4:28:20<21:43:55, 7.61s/it, loss=0.0007, acc=0.9978, iter_time=7.63s]
Epoch 0: 17%|█▋ | 2108/12384 [4:28:28<21:43:55, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.37s]
Epoch 0: 17%|█▋ | 2109/12384 [4:28:28<21:44:18, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.37s]
Epoch 0: 17%|█▋ | 2109/12384 [4:28:35<21:44:18, 7.62s/it, loss=0.0010, acc=0.9992, iter_time=6.67s]
Epoch 0: 17%|█▋ | 2110/12384 [4:28:35<21:43:15, 7.61s/it, loss=0.0010, acc=0.9992, iter_time=6.67s]
Epoch 0: 17%|█▋ | 2110/12384 [4:28:43<21:43:15, 7.61s/it, loss=0.0007, acc=0.9998, iter_time=6.98s]
Epoch 0: 17%|█▋ | 2111/12384 [4:28:43<21:42:32, 7.61s/it, loss=0.0007, acc=0.9998, iter_time=6.98s]
Epoch 0: 17%|█▋ | 2111/12384 [4:28:51<21:42:32, 7.61s/it, loss=0.0004, acc=0.9983, iter_time=9.86s]
Epoch 0: 17%|█▋ | 2112/12384 [4:28:51<21:59:52, 7.71s/it, loss=0.0004, acc=0.9983, iter_time=9.86s]
Epoch 0: 17%|█▋ | 2112/12384 [4:28:58<21:59:52, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.51s]
Epoch 0: 17%|█▋ | 2113/12384 [4:28:58<21:54:02, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.51s]
Epoch 0: 17%|█▋ | 2113/12384 [4:29:06<21:54:02, 7.68s/it, loss=0.0002, acc=0.9999, iter_time=7.61s]
Epoch 0: 17%|█▋ | 2114/12384 [4:29:06<21:52:20, 7.67s/it, loss=0.0002, acc=0.9999, iter_time=7.61s]
Epoch 0: 17%|█▋ | 2114/12384 [4:29:14<21:52:20, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=7.33s]
Epoch 0: 17%|█▋ | 2115/12384 [4:29:14<21:49:04, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.33s]
Epoch 0: 17%|█▋ | 2115/12384 [4:29:21<21:49:04, 7.65s/it, loss=0.0002, acc=0.9999, iter_time=7.91s]
Epoch 0: 17%|█▋ | 2116/12384 [4:29:21<21:46:09, 7.63s/it, loss=0.0002, acc=0.9999, iter_time=7.91s]
Epoch 0: 17%|█▋ | 2116/12384 [4:29:29<21:46:09, 7.63s/it, loss=0.0005, acc=0.9994, iter_time=5.55s]
Epoch 0: 17%|█▋ | 2117/12384 [4:29:29<21:44:23, 7.62s/it, loss=0.0005, acc=0.9994, iter_time=5.55s]
Epoch 0: 17%|█▋ | 2117/12384 [4:29:37<21:44:23, 7.62s/it, loss=0.0022, acc=0.9939, iter_time=9.65s]
Epoch 0: 17%|█▋ | 2118/12384 [4:29:37<21:43:02, 7.62s/it, loss=0.0022, acc=0.9939, iter_time=9.65s]
Epoch 0: 17%|█▋ | 2118/12384 [4:29:44<21:43:02, 7.62s/it, loss=0.0004, acc=0.9987, iter_time=5.54s]
Epoch 0: 17%|█▋ | 2119/12384 [4:29:44<21:41:15, 7.61s/it, loss=0.0004, acc=0.9987, iter_time=5.54s]
Epoch 0: 17%|█▋ | 2119/12384 [4:29:52<21:41:15, 7.61s/it, loss=0.0004, acc=0.9986, iter_time=9.58s]
Epoch 0: 17%|█▋ | 2120/12384 [4:29:52<21:40:47, 7.60s/it, loss=0.0004, acc=0.9986, iter_time=9.58s]
Epoch 0: 17%|█▋ | 2120/12384 [4:29:59<21:40:47, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 17%|█▋ | 2121/12384 [4:29:59<21:40:24, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 17%|█▋ | 2121/12384 [4:30:07<21:40:24, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 17%|█▋ | 2122/12384 [4:30:07<21:39:36, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 17%|█▋ | 2122/12384 [4:30:15<21:39:36, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 17%|█▋ | 2123/12384 [4:30:15<21:40:07, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 17%|█▋ | 2123/12384 [4:30:22<21:40:07, 7.60s/it, loss=0.0004, acc=0.9995, iter_time=5.61s]
Epoch 0: 17%|█▋ | 2124/12384 [4:30:22<21:40:18, 7.60s/it, loss=0.0004, acc=0.9995, iter_time=5.61s]
Epoch 0: 17%|█▋ | 2124/12384 [4:30:30<21:40:18, 7.60s/it, loss=0.0007, acc=0.9982, iter_time=9.60s]
Epoch 0: 17%|█▋ | 2125/12384 [4:30:30<21:40:58, 7.61s/it, loss=0.0007, acc=0.9982, iter_time=9.60s]
Epoch 0: 17%|█▋ | 2125/12384 [4:30:37<21:40:58, 7.61s/it, loss=0.0004, acc=0.9972, iter_time=7.64s]
Epoch 0: 17%|█▋ | 2126/12384 [4:30:37<21:41:07, 7.61s/it, loss=0.0004, acc=0.9972, iter_time=7.64s]
Epoch 0: 17%|█▋ | 2126/12384 [4:30:45<21:41:07, 7.61s/it, loss=0.0022, acc=0.9934, iter_time=7.59s]
Epoch 0: 17%|█▋ | 2127/12384 [4:30:45<21:41:07, 7.61s/it, loss=0.0022, acc=0.9934, iter_time=7.59s]
Epoch 0: 17%|█▋ | 2127/12384 [4:30:53<21:41:07, 7.61s/it, loss=0.0006, acc=0.9980, iter_time=8.14s]
Epoch 0: 17%|█▋ | 2128/12384 [4:30:53<21:46:26, 7.64s/it, loss=0.0006, acc=0.9980, iter_time=8.14s]
Epoch 0: 17%|█▋ | 2128/12384 [4:31:00<21:46:26, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 0: 17%|█▋ | 2129/12384 [4:31:00<21:44:58, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 0: 17%|█▋ | 2129/12384 [4:31:08<21:44:58, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 17%|█▋ | 2130/12384 [4:31:08<21:42:59, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 17%|█▋ | 2130/12384 [4:31:16<21:42:59, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 17%|█▋ | 2131/12384 [4:31:16<21:42:51, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 17%|█▋ | 2131/12384 [4:31:23<21:42:51, 7.62s/it, loss=0.0020, acc=0.9962, iter_time=7.60s]
Epoch 0: 17%|█▋ | 2132/12384 [4:31:23<21:42:21, 7.62s/it, loss=0.0020, acc=0.9962, iter_time=7.60s]
Epoch 0: 17%|█▋ | 2132/12384 [4:31:31<21:42:21, 7.62s/it, loss=0.0003, acc=0.9997, iter_time=7.61s]
Epoch 0: 17%|█▋ | 2133/12384 [4:31:31<21:41:17, 7.62s/it, loss=0.0003, acc=0.9997, iter_time=7.61s]
Epoch 0: 17%|█▋ | 2133/12384 [4:31:38<21:41:17, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.39s]
Epoch 0: 17%|█▋ | 2134/12384 [4:31:38<21:41:11, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.39s]
Epoch 0: 17%|█▋ | 2134/12384 [4:31:46<21:41:11, 7.62s/it, loss=0.0013, acc=0.9968, iter_time=8.83s]
Epoch 0: 17%|█▋ | 2135/12384 [4:31:46<21:40:36, 7.61s/it, loss=0.0013, acc=0.9968, iter_time=8.83s]
Epoch 0: 17%|█▋ | 2135/12384 [4:31:54<21:40:36, 7.61s/it, loss=0.0007, acc=0.9997, iter_time=7.56s]
Epoch 0: 17%|█▋ | 2136/12384 [4:31:54<21:40:13, 7.61s/it, loss=0.0007, acc=0.9997, iter_time=7.56s]
Epoch 0: 17%|█▋ | 2136/12384 [4:32:01<21:40:13, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.85s]
Epoch 0: 17%|█▋ | 2137/12384 [4:32:01<21:39:57, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.85s]
Epoch 0: 17%|█▋ | 2137/12384 [4:32:09<21:39:57, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=9.75s]
Epoch 0: 17%|█▋ | 2138/12384 [4:32:09<21:58:21, 7.72s/it, loss=0.0002, acc=1.0000, iter_time=9.75s]
Epoch 0: 17%|█▋ | 2138/12384 [4:32:17<21:58:21, 7.72s/it, loss=0.0002, acc=0.9996, iter_time=4.03s]
Epoch 0: 17%|█▋ | 2139/12384 [4:32:17<21:53:08, 7.69s/it, loss=0.0002, acc=0.9996, iter_time=4.03s]
Epoch 0: 17%|█▋ | 2139/12384 [4:32:24<21:53:08, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=11.23s]
Epoch 0: 17%|█▋ | 2140/12384 [4:32:24<21:48:36, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=11.23s]
Epoch 0: 17%|█▋ | 2140/12384 [4:32:32<21:48:36, 7.66s/it, loss=0.0003, acc=0.9999, iter_time=7.60s]
Epoch 0: 17%|█▋ | 2141/12384 [4:32:32<21:45:15, 7.65s/it, loss=0.0003, acc=0.9999, iter_time=7.60s]
Epoch 0: 17%|█▋ | 2141/12384 [4:32:40<21:45:15, 7.65s/it, loss=0.0022, acc=0.9967, iter_time=7.62s]
Epoch 0: 17%|█▋ | 2142/12384 [4:32:40<21:43:22, 7.64s/it, loss=0.0022, acc=0.9967, iter_time=7.62s]
Epoch 0: 17%|█▋ | 2142/12384 [4:32:47<21:43:22, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=4.79s]
Epoch 0: 17%|█▋ | 2143/12384 [4:32:47<21:41:32, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=4.79s]
Epoch 0: 17%|█▋ | 2143/12384 [4:32:55<21:41:32, 7.63s/it, loss=0.0003, acc=0.9989, iter_time=10.81s]
Epoch 0: 17%|█▋ | 2144/12384 [4:32:55<21:41:13, 7.62s/it, loss=0.0003, acc=0.9989, iter_time=10.81s]
Epoch 0: 17%|█▋ | 2144/12384 [4:33:02<21:41:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.18s]
Epoch 0: 17%|█▋ | 2145/12384 [4:33:02<21:39:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.18s]
Epoch 0: 17%|█▋ | 2145/12384 [4:33:10<21:39:45, 7.62s/it, loss=0.0029, acc=0.9913, iter_time=10.64s]
Epoch 0: 17%|█▋ | 2146/12384 [4:33:10<21:39:41, 7.62s/it, loss=0.0029, acc=0.9913, iter_time=10.64s]
Epoch 0: 17%|█▋ | 2146/12384 [4:33:18<21:39:41, 7.62s/it, loss=0.0003, acc=0.9996, iter_time=7.63s]
Epoch 0: 17%|█▋ | 2147/12384 [4:33:18<21:39:32, 7.62s/it, loss=0.0003, acc=0.9996, iter_time=7.63s]
Epoch 0: 17%|█▋ | 2147/12384 [4:33:25<21:39:32, 7.62s/it, loss=0.0005, acc=0.9993, iter_time=7.61s]
Epoch 0: 17%|█▋ | 2148/12384 [4:33:25<21:38:44, 7.61s/it, loss=0.0005, acc=0.9993, iter_time=7.61s]
Epoch 0: 17%|█▋ | 2148/12384 [4:33:33<21:38:44, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 17%|█▋ | 2149/12384 [4:33:33<21:39:05, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 17%|█▋ | 2149/12384 [4:33:41<21:39:05, 7.62s/it, loss=0.0005, acc=0.9998, iter_time=8.04s]
Epoch 0: 17%|█▋ | 2150/12384 [4:33:41<21:39:15, 7.62s/it, loss=0.0005, acc=0.9998, iter_time=8.04s]
Epoch 0: 17%|█▋ | 2150/12384 [4:33:48<21:39:15, 7.62s/it, loss=0.0004, acc=0.9994, iter_time=7.22s]
Epoch 0: 17%|█▋ | 2151/12384 [4:33:48<21:39:30, 7.62s/it, loss=0.0004, acc=0.9994, iter_time=7.22s]
Epoch 0: 17%|█▋ | 2151/12384 [4:33:56<21:39:30, 7.62s/it, loss=0.0004, acc=0.9979, iter_time=7.57s]
Epoch 0: 17%|█▋ | 2152/12384 [4:33:56<21:38:57, 7.62s/it, loss=0.0004, acc=0.9979, iter_time=7.57s]
Epoch 0: 17%|█▋ | 2152/12384 [4:34:03<21:38:57, 7.62s/it, loss=0.0012, acc=0.9983, iter_time=7.65s]
Epoch 0: 17%|█▋ | 2153/12384 [4:34:03<21:39:01, 7.62s/it, loss=0.0012, acc=0.9983, iter_time=7.65s]
Epoch 0: 17%|█▋ | 2153/12384 [4:34:11<21:39:01, 7.62s/it, loss=0.0007, acc=0.9977, iter_time=6.46s]
Epoch 0: 17%|█▋ | 2154/12384 [4:34:11<21:37:01, 7.61s/it, loss=0.0007, acc=0.9977, iter_time=6.46s]
Epoch 0: 17%|█▋ | 2154/12384 [4:34:19<21:37:01, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=6.75s]
Epoch 0: 17%|█▋ | 2155/12384 [4:34:19<21:36:03, 7.60s/it, loss=0.0003, acc=1.0000, iter_time=6.75s]
Epoch 0: 17%|█▋ | 2155/12384 [4:34:26<21:36:03, 7.60s/it, loss=0.0007, acc=0.9982, iter_time=9.67s]
Epoch 0: 17%|█▋ | 2156/12384 [4:34:26<21:39:56, 7.63s/it, loss=0.0007, acc=0.9982, iter_time=9.67s]
Epoch 0: 17%|█▋ | 2156/12384 [4:34:34<21:39:56, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 17%|█▋ | 2157/12384 [4:34:34<21:40:46, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 17%|█▋ | 2157/12384 [4:34:41<21:40:46, 7.63s/it, loss=0.0007, acc=0.9983, iter_time=7.64s]
Epoch 0: 17%|█▋ | 2158/12384 [4:34:41<21:40:12, 7.63s/it, loss=0.0007, acc=0.9983, iter_time=7.64s]
Epoch 0: 17%|█▋ | 2158/12384 [4:34:49<21:40:12, 7.63s/it, loss=0.0030, acc=0.9930, iter_time=7.64s]
Epoch 0: 17%|█▋ | 2159/12384 [4:34:49<21:39:36, 7.63s/it, loss=0.0030, acc=0.9930, iter_time=7.64s]
Epoch 0: 17%|█▋ | 2159/12384 [4:34:57<21:39:36, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=8.00s]
Epoch 0: 17%|█▋ | 2160/12384 [4:34:57<21:43:52, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=8.00s]
Epoch 0: 17%|█▋ | 2160/12384 [4:35:04<21:43:52, 7.65s/it, loss=0.0006, acc=0.9963, iter_time=7.32s]
Epoch 0: 17%|█▋ | 2161/12384 [4:35:04<21:41:40, 7.64s/it, loss=0.0006, acc=0.9963, iter_time=7.32s]
Epoch 0: 17%|█▋ | 2161/12384 [4:35:12<21:41:40, 7.64s/it, loss=0.0006, acc=0.9978, iter_time=7.63s]
Epoch 0: 17%|█▋ | 2162/12384 [4:35:12<21:40:24, 7.63s/it, loss=0.0006, acc=0.9978, iter_time=7.63s]
Epoch 0: 17%|█▋ | 2162/12384 [4:35:20<21:40:24, 7.63s/it, loss=0.0021, acc=0.9954, iter_time=6.94s]
Epoch 0: 17%|█▋ | 2163/12384 [4:35:20<21:42:02, 7.64s/it, loss=0.0021, acc=0.9954, iter_time=6.94s]
Epoch 0: 17%|█▋ | 2163/12384 [4:35:27<21:42:02, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.32s]
Epoch 0: 17%|█▋ | 2164/12384 [4:35:27<21:40:19, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.32s]
Epoch 0: 17%|█▋ | 2164/12384 [4:35:35<21:40:19, 7.63s/it, loss=0.0004, acc=1.0000, iter_time=7.67s]
Epoch 0: 17%|█▋ | 2165/12384 [4:35:35<21:57:36, 7.74s/it, loss=0.0004, acc=1.0000, iter_time=7.67s]
Epoch 0: 17%|█▋ | 2165/12384 [4:35:43<21:57:36, 7.74s/it, loss=0.0001, acc=1.0000, iter_time=7.94s]
Epoch 0: 17%|█▋ | 2166/12384 [4:35:43<21:57:06, 7.73s/it, loss=0.0001, acc=1.0000, iter_time=7.94s]
Epoch 0: 17%|█▋ | 2166/12384 [4:35:51<21:57:06, 7.73s/it, loss=0.0001, acc=1.0000, iter_time=7.70s]
Epoch 0: 17%|█▋ | 2167/12384 [4:35:51<21:50:14, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.70s]
Epoch 0: 17%|█▋ | 2167/12384 [4:35:58<21:50:14, 7.69s/it, loss=0.0005, acc=0.9996, iter_time=7.54s]
Epoch 0: 18%|█▊ | 2168/12384 [4:35:58<21:44:54, 7.66s/it, loss=0.0005, acc=0.9996, iter_time=7.54s]
Epoch 0: 18%|█▊ | 2168/12384 [4:36:06<21:44:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 0: 18%|█▊ | 2169/12384 [4:36:06<21:42:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 0: 18%|█▊ | 2169/12384 [4:36:13<21:42:18, 7.65s/it, loss=0.0004, acc=0.9979, iter_time=8.25s]
Epoch 0: 18%|█▊ | 2170/12384 [4:36:13<21:41:08, 7.64s/it, loss=0.0004, acc=0.9979, iter_time=8.25s]
Epoch 0: 18%|█▊ | 2170/12384 [4:36:21<21:41:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 18%|█▊ | 2171/12384 [4:36:21<21:38:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 18%|█▊ | 2171/12384 [4:36:29<21:38:40, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.85s]
Epoch 0: 18%|█▊ | 2172/12384 [4:36:29<21:37:37, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.85s]
Epoch 0: 18%|█▊ | 2172/12384 [4:36:36<21:37:37, 7.62s/it, loss=0.0013, acc=0.9960, iter_time=9.03s]
Epoch 0: 18%|█▊ | 2173/12384 [4:36:36<21:38:17, 7.63s/it, loss=0.0013, acc=0.9960, iter_time=9.03s]
Epoch 0: 18%|█▊ | 2173/12384 [4:36:44<21:38:17, 7.63s/it, loss=0.0015, acc=0.9965, iter_time=7.96s]
Epoch 0: 18%|█▊ | 2174/12384 [4:36:44<21:36:49, 7.62s/it, loss=0.0015, acc=0.9965, iter_time=7.96s]
Epoch 0: 18%|█▊ | 2174/12384 [4:36:51<21:36:49, 7.62s/it, loss=0.0004, acc=0.9998, iter_time=4.83s]
Epoch 0: 18%|█▊ | 2175/12384 [4:36:51<21:34:38, 7.61s/it, loss=0.0004, acc=0.9998, iter_time=4.83s]
Epoch 0: 18%|█▊ | 2175/12384 [4:36:59<21:34:38, 7.61s/it, loss=0.0006, acc=0.9989, iter_time=10.75s]
Epoch 0: 18%|█▊ | 2176/12384 [4:36:59<21:39:38, 7.64s/it, loss=0.0006, acc=0.9989, iter_time=10.75s]
Epoch 0: 18%|█▊ | 2176/12384 [4:37:07<21:39:38, 7.64s/it, loss=0.0002, acc=0.9999, iter_time=7.32s]
Epoch 0: 18%|█▊ | 2177/12384 [4:37:07<21:43:15, 7.66s/it, loss=0.0002, acc=0.9999, iter_time=7.32s]
Epoch 0: 18%|█▊ | 2177/12384 [4:37:15<21:43:15, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.70s]
Epoch 0: 18%|█▊ | 2178/12384 [4:37:15<21:46:55, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=7.70s]
Epoch 0: 18%|█▊ | 2178/12384 [4:37:22<21:46:55, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=6.54s]
Epoch 0: 18%|█▊ | 2179/12384 [4:37:22<21:44:14, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=6.54s]
Epoch 0: 18%|█▊ | 2179/12384 [4:37:30<21:44:14, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=8.54s]
Epoch 0: 18%|█▊ | 2180/12384 [4:37:30<21:40:55, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.54s]
Epoch 0: 18%|█▊ | 2180/12384 [4:37:38<21:40:55, 7.65s/it, loss=0.0001, acc=0.9993, iter_time=6.45s]
Epoch 0: 18%|█▊ | 2181/12384 [4:37:38<21:39:03, 7.64s/it, loss=0.0001, acc=0.9993, iter_time=6.45s]
Epoch 0: 18%|█▊ | 2181/12384 [4:37:45<21:39:03, 7.64s/it, loss=0.0004, acc=1.0000, iter_time=9.06s]
Epoch 0: 18%|█▊ | 2182/12384 [4:37:45<21:36:32, 7.63s/it, loss=0.0004, acc=1.0000, iter_time=9.06s]
Epoch 0: 18%|█▊ | 2182/12384 [4:37:53<21:36:32, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 18%|█▊ | 2183/12384 [4:37:53<21:36:22, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 18%|█▊ | 2183/12384 [4:38:00<21:36:22, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.56s]
Epoch 0: 18%|█▊ | 2184/12384 [4:38:00<21:34:41, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.56s]
Epoch 0: 18%|█▊ | 2184/12384 [4:38:08<21:34:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.29s]
Epoch 0: 18%|█▊ | 2185/12384 [4:38:08<21:37:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.29s]
Epoch 0: 18%|█▊ | 2185/12384 [4:38:16<21:37:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.03s]
Epoch 0: 18%|█▊ | 2186/12384 [4:38:16<21:36:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.03s]
Epoch 0: 18%|█▊ | 2186/12384 [4:38:23<21:36:40, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 18%|█▊ | 2187/12384 [4:38:23<21:35:39, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 18%|█▊ | 2187/12384 [4:38:31<21:35:39, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=7.30s]
Epoch 0: 18%|█▊ | 2188/12384 [4:38:31<21:34:16, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=7.30s]
Epoch 0: 18%|█▊ | 2188/12384 [4:38:38<21:34:16, 7.62s/it, loss=0.0003, acc=0.9984, iter_time=7.91s]
Epoch 0: 18%|█▊ | 2189/12384 [4:38:38<21:34:12, 7.62s/it, loss=0.0003, acc=0.9984, iter_time=7.91s]
Epoch 0: 18%|█▊ | 2189/12384 [4:38:46<21:34:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 0: 18%|█▊ | 2190/12384 [4:38:46<21:51:11, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 0: 18%|█▊ | 2190/12384 [4:38:54<21:51:11, 7.72s/it, loss=0.0004, acc=0.9997, iter_time=7.67s]
Epoch 0: 18%|█▊ | 2191/12384 [4:38:54<22:02:58, 7.79s/it, loss=0.0004, acc=0.9997, iter_time=7.67s]
Epoch 0: 18%|█▊ | 2191/12384 [4:39:02<22:02:58, 7.79s/it, loss=0.0001, acc=1.0000, iter_time=8.27s]
Epoch 0: 18%|█▊ | 2192/12384 [4:39:02<21:53:20, 7.73s/it, loss=0.0001, acc=1.0000, iter_time=8.27s]
Epoch 0: 18%|█▊ | 2192/12384 [4:39:10<21:53:20, 7.73s/it, loss=0.0007, acc=0.9980, iter_time=7.20s]
Epoch 0: 18%|█▊ | 2193/12384 [4:39:10<21:46:19, 7.69s/it, loss=0.0007, acc=0.9980, iter_time=7.20s]
Epoch 0: 18%|█▊ | 2193/12384 [4:39:17<21:46:19, 7.69s/it, loss=0.0011, acc=0.9981, iter_time=7.62s]
Epoch 0: 18%|█▊ | 2194/12384 [4:39:17<21:41:56, 7.67s/it, loss=0.0011, acc=0.9981, iter_time=7.62s]
Epoch 0: 18%|█▊ | 2194/12384 [4:39:25<21:41:56, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.28s]
Epoch 0: 18%|█▊ | 2195/12384 [4:39:25<21:38:27, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.28s]
Epoch 0: 18%|█▊ | 2195/12384 [4:39:32<21:38:27, 7.65s/it, loss=0.0003, acc=0.9998, iter_time=7.96s]
Epoch 0: 18%|█▊ | 2196/12384 [4:39:32<21:38:22, 7.65s/it, loss=0.0003, acc=0.9998, iter_time=7.96s]
Epoch 0: 18%|█▊ | 2196/12384 [4:39:40<21:38:22, 7.65s/it, loss=0.0006, acc=0.9979, iter_time=7.37s]
Epoch 0: 18%|█▊ | 2197/12384 [4:39:40<21:38:30, 7.65s/it, loss=0.0006, acc=0.9979, iter_time=7.37s]
Epoch 0: 18%|█▊ | 2197/12384 [4:39:48<21:38:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 0: 18%|█▊ | 2198/12384 [4:39:48<21:36:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 0: 18%|█▊ | 2198/12384 [4:39:55<21:36:09, 7.63s/it, loss=0.0016, acc=0.9944, iter_time=9.42s]
Epoch 0: 18%|█▊ | 2199/12384 [4:39:55<21:38:48, 7.65s/it, loss=0.0016, acc=0.9944, iter_time=9.42s]
Epoch 0: 18%|█▊ | 2199/12384 [4:40:03<21:38:48, 7.65s/it, loss=0.0013, acc=0.9976, iter_time=8.09s]
Epoch 0: 18%|█▊ | 2200/12384 [4:40:03<21:40:57, 7.66s/it, loss=0.0013, acc=0.9976, iter_time=8.09s]
Epoch 0: 18%|█▊ | 2200/12384 [4:40:11<21:40:57, 7.66s/it, loss=0.0014, acc=0.9973, iter_time=7.20s]
Epoch 0: 18%|█▊ | 2201/12384 [4:40:11<21:39:02, 7.65s/it, loss=0.0014, acc=0.9973, iter_time=7.20s]
Epoch 0: 18%|█▊ | 2201/12384 [4:40:18<21:39:02, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=6.52s]
Epoch 0: 18%|█▊ | 2202/12384 [4:40:18<21:35:24, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=6.52s]
Epoch 0: 18%|█▊ | 2202/12384 [4:40:26<21:35:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 0: 18%|█▊ | 2203/12384 [4:40:26<21:33:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 0: 18%|█▊ | 2203/12384 [4:40:33<21:33:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.82s]
Epoch 0: 18%|█▊ | 2204/12384 [4:40:33<21:32:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.82s]
Epoch 0: 18%|█▊ | 2204/12384 [4:40:41<21:32:53, 7.62s/it, loss=0.0005, acc=0.9973, iter_time=9.93s]
Epoch 0: 18%|█▊ | 2205/12384 [4:40:41<21:31:21, 7.61s/it, loss=0.0005, acc=0.9973, iter_time=9.93s]
Epoch 0: 18%|█▊ | 2205/12384 [4:40:49<21:31:21, 7.61s/it, loss=0.0029, acc=0.9917, iter_time=7.65s]
Epoch 0: 18%|█▊ | 2206/12384 [4:40:49<21:33:16, 7.62s/it, loss=0.0029, acc=0.9917, iter_time=7.65s]
Epoch 0: 18%|█▊ | 2206/12384 [4:40:56<21:33:16, 7.62s/it, loss=0.0005, acc=0.9997, iter_time=7.61s]
Epoch 0: 18%|█▊ | 2207/12384 [4:40:56<21:38:00, 7.65s/it, loss=0.0005, acc=0.9997, iter_time=7.61s]
Epoch 0: 18%|█▊ | 2207/12384 [4:41:04<21:38:00, 7.65s/it, loss=0.0013, acc=0.9955, iter_time=8.10s]
Epoch 0: 18%|█▊ | 2208/12384 [4:41:04<21:36:16, 7.64s/it, loss=0.0013, acc=0.9955, iter_time=8.10s]
Epoch 0: 18%|█▊ | 2208/12384 [4:41:12<21:36:16, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=5.42s]
Epoch 0: 18%|█▊ | 2209/12384 [4:41:12<21:33:34, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.42s]
Epoch 0: 18%|█▊ | 2209/12384 [4:41:19<21:33:34, 7.63s/it, loss=0.0006, acc=0.9974, iter_time=6.37s]
Epoch 0: 18%|█▊ | 2210/12384 [4:41:19<21:33:08, 7.63s/it, loss=0.0006, acc=0.9974, iter_time=6.37s]
Epoch 0: 18%|█▊ | 2210/12384 [4:41:27<21:33:08, 7.63s/it, loss=0.0008, acc=0.9986, iter_time=10.65s]
Epoch 0: 18%|█▊ | 2211/12384 [4:41:27<21:32:49, 7.63s/it, loss=0.0008, acc=0.9986, iter_time=10.65s]
Epoch 0: 18%|█▊ | 2211/12384 [4:41:35<21:32:49, 7.63s/it, loss=0.0003, acc=0.9997, iter_time=7.62s]
Epoch 0: 18%|█▊ | 2212/12384 [4:41:35<21:32:35, 7.62s/it, loss=0.0003, acc=0.9997, iter_time=7.62s]
Epoch 0: 18%|█▊ | 2212/12384 [4:41:42<21:32:35, 7.62s/it, loss=0.0005, acc=0.9996, iter_time=7.61s]
Epoch 0: 18%|█▊ | 2213/12384 [4:41:42<21:31:14, 7.62s/it, loss=0.0005, acc=0.9996, iter_time=7.61s]
Epoch 0: 18%|█▊ | 2213/12384 [4:41:50<21:31:14, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=6.68s]
Epoch 0: 18%|█▊ | 2214/12384 [4:41:50<21:30:33, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=6.68s]
Epoch 0: 18%|█▊ | 2214/12384 [4:41:58<21:30:33, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.84s]
Epoch 0: 18%|█▊ | 2215/12384 [4:41:58<21:44:56, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=8.84s]
Epoch 0: 18%|█▊ | 2215/12384 [4:42:05<21:44:56, 7.70s/it, loss=0.0009, acc=0.9983, iter_time=8.01s]
Epoch 0: 18%|█▊ | 2216/12384 [4:42:05<21:40:45, 7.68s/it, loss=0.0009, acc=0.9983, iter_time=8.01s]
Epoch 0: 18%|█▊ | 2216/12384 [4:42:13<21:40:45, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=6.29s]
Epoch 0: 18%|█▊ | 2217/12384 [4:42:13<21:51:10, 7.74s/it, loss=0.0001, acc=1.0000, iter_time=6.29s]
Epoch 0: 18%|█▊ | 2217/12384 [4:42:21<21:51:10, 7.74s/it, loss=0.0010, acc=0.9967, iter_time=6.72s]
Epoch 0: 18%|█▊ | 2218/12384 [4:42:21<21:45:31, 7.71s/it, loss=0.0010, acc=0.9967, iter_time=6.72s]
Epoch 0: 18%|█▊ | 2218/12384 [4:42:28<21:45:31, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=8.77s]
Epoch 0: 18%|█▊ | 2219/12384 [4:42:28<21:40:01, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=8.77s]
Epoch 0: 18%|█▊ | 2219/12384 [4:42:36<21:40:01, 7.67s/it, loss=0.0004, acc=1.0000, iter_time=5.78s]
Epoch 0: 18%|█▊ | 2220/12384 [4:42:36<21:36:15, 7.65s/it, loss=0.0004, acc=1.0000, iter_time=5.78s]
Epoch 0: 18%|█▊ | 2220/12384 [4:42:44<21:36:15, 7.65s/it, loss=0.0004, acc=1.0000, iter_time=7.35s]
Epoch 0: 18%|█▊ | 2221/12384 [4:42:44<21:33:44, 7.64s/it, loss=0.0004, acc=1.0000, iter_time=7.35s]
Epoch 0: 18%|█▊ | 2221/12384 [4:42:51<21:33:44, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=8.27s]
Epoch 0: 18%|█▊ | 2222/12384 [4:42:51<21:31:10, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=8.27s]
Epoch 0: 18%|█▊ | 2222/12384 [4:42:59<21:31:10, 7.62s/it, loss=0.0008, acc=0.9979, iter_time=9.01s]
Epoch 0: 18%|█▊ | 2223/12384 [4:42:59<21:29:50, 7.62s/it, loss=0.0008, acc=0.9979, iter_time=9.01s]
Epoch 0: 18%|█▊ | 2223/12384 [4:43:06<21:29:50, 7.62s/it, loss=0.0005, acc=1.0000, iter_time=8.89s]
Epoch 0: 18%|█▊ | 2224/12384 [4:43:06<21:28:40, 7.61s/it, loss=0.0005, acc=1.0000, iter_time=8.89s]
Epoch 0: 18%|█▊ | 2224/12384 [4:43:14<21:28:40, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=7.25s]
Epoch 0: 18%|█▊ | 2225/12384 [4:43:14<21:28:51, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=7.25s]
Epoch 0: 18%|█▊ | 2225/12384 [4:43:22<21:28:51, 7.61s/it, loss=0.0005, acc=0.9984, iter_time=6.76s]
Epoch 0: 18%|█▊ | 2226/12384 [4:43:22<21:28:03, 7.61s/it, loss=0.0005, acc=0.9984, iter_time=6.76s]
Epoch 0: 18%|█▊ | 2226/12384 [4:43:29<21:28:03, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.45s]
Epoch 0: 18%|█▊ | 2227/12384 [4:43:29<21:27:14, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=8.45s]
Epoch 0: 18%|█▊ | 2227/12384 [4:43:37<21:27:14, 7.60s/it, loss=0.0003, acc=0.9998, iter_time=6.37s]
Epoch 0: 18%|█▊ | 2228/12384 [4:43:37<21:25:34, 7.60s/it, loss=0.0003, acc=0.9998, iter_time=6.37s]
Epoch 0: 18%|█▊ | 2228/12384 [4:43:44<21:25:34, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=5.43s]
Epoch 0: 18%|█▊ | 2229/12384 [4:43:44<21:28:21, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.43s]
Epoch 0: 18%|█▊ | 2229/12384 [4:43:52<21:28:21, 7.61s/it, loss=0.0005, acc=0.9975, iter_time=7.28s]
Epoch 0: 18%|█▊ | 2230/12384 [4:43:52<21:27:35, 7.61s/it, loss=0.0005, acc=0.9975, iter_time=7.28s]
Epoch 0: 18%|█▊ | 2230/12384 [4:44:00<21:27:35, 7.61s/it, loss=0.0007, acc=0.9988, iter_time=11.33s]
Epoch 0: 18%|█▊ | 2231/12384 [4:44:00<21:26:37, 7.60s/it, loss=0.0007, acc=0.9988, iter_time=11.33s]
Epoch 0: 18%|█▊ | 2231/12384 [4:44:07<21:26:37, 7.60s/it, loss=0.0002, acc=1.0000, iter_time=7.54s]
Epoch 0: 18%|█▊ | 2232/12384 [4:44:07<21:26:15, 7.60s/it, loss=0.0002, acc=1.0000, iter_time=7.54s]
Epoch 0: 18%|█▊ | 2232/12384 [4:44:15<21:26:15, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 18%|█▊ | 2233/12384 [4:44:15<21:28:03, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 18%|█▊ | 2233/12384 [4:44:22<21:28:03, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.21s]
Epoch 0: 18%|█▊ | 2234/12384 [4:44:22<21:28:18, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.21s]
Epoch 0: 18%|█▊ | 2234/12384 [4:44:30<21:28:18, 7.62s/it, loss=0.0007, acc=0.9986, iter_time=9.08s]
Epoch 0: 18%|█▊ | 2235/12384 [4:44:30<21:27:40, 7.61s/it, loss=0.0007, acc=0.9986, iter_time=9.08s]
Epoch 0: 18%|█▊ | 2235/12384 [4:44:38<21:27:40, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.11s]
Epoch 0: 18%|█▊ | 2236/12384 [4:44:38<21:27:35, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.11s]
Epoch 0: 18%|█▊ | 2236/12384 [4:44:45<21:27:35, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=9.09s]
Epoch 0: 18%|█▊ | 2237/12384 [4:44:45<21:26:46, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=9.09s]
Epoch 0: 18%|█▊ | 2237/12384 [4:44:53<21:26:46, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 18%|█▊ | 2238/12384 [4:44:53<21:26:32, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 18%|█▊ | 2238/12384 [4:45:00<21:26:32, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 18%|█▊ | 2239/12384 [4:45:00<21:26:42, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 18%|█▊ | 2239/12384 [4:45:08<21:26:42, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.01s]
Epoch 0: 18%|█▊ | 2240/12384 [4:45:08<21:30:14, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.01s]
Epoch 0: 18%|█▊ | 2240/12384 [4:45:16<21:30:14, 7.63s/it, loss=0.0004, acc=0.9963, iter_time=7.55s]
Epoch 0: 18%|█▊ | 2241/12384 [4:45:16<21:41:56, 7.70s/it, loss=0.0004, acc=0.9963, iter_time=7.55s]
Epoch 0: 18%|█▊ | 2241/12384 [4:45:24<21:41:56, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 18%|█▊ | 2242/12384 [4:45:24<21:36:58, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 18%|█▊ | 2242/12384 [4:45:32<21:36:58, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=4.26s]
Epoch 0: 18%|█▊ | 2243/12384 [4:45:32<21:49:16, 7.75s/it, loss=0.0002, acc=1.0000, iter_time=4.26s]
Epoch 0: 18%|█▊ | 2243/12384 [4:45:39<21:49:16, 7.75s/it, loss=0.0006, acc=0.9990, iter_time=8.70s]
Epoch 0: 18%|█▊ | 2244/12384 [4:45:39<21:42:06, 7.70s/it, loss=0.0006, acc=0.9990, iter_time=8.70s]
Epoch 0: 18%|█▊ | 2244/12384 [4:45:47<21:42:06, 7.70s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 18%|█▊ | 2245/12384 [4:45:47<21:36:40, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 18%|█▊ | 2245/12384 [4:45:54<21:36:40, 7.67s/it, loss=0.0001, acc=0.9998, iter_time=10.14s]
Epoch 0: 18%|█▊ | 2246/12384 [4:45:54<21:32:23, 7.65s/it, loss=0.0001, acc=0.9998, iter_time=10.14s]
Epoch 0: 18%|█▊ | 2246/12384 [4:46:02<21:32:23, 7.65s/it, loss=0.0066, acc=0.9912, iter_time=5.33s]
Epoch 0: 18%|█▊ | 2247/12384 [4:46:02<21:29:19, 7.63s/it, loss=0.0066, acc=0.9912, iter_time=5.33s]
Epoch 0: 18%|█▊ | 2247/12384 [4:46:10<21:29:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.80s]
Epoch 0: 18%|█▊ | 2248/12384 [4:46:10<21:27:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.80s]
Epoch 0: 18%|█▊ | 2248/12384 [4:46:17<21:27:26, 7.62s/it, loss=0.0009, acc=0.9975, iter_time=5.88s]
Epoch 0: 18%|█▊ | 2249/12384 [4:46:17<21:25:19, 7.61s/it, loss=0.0009, acc=0.9975, iter_time=5.88s]
Epoch 0: 18%|█▊ | 2249/12384 [4:46:25<21:25:19, 7.61s/it, loss=0.0020, acc=0.9934, iter_time=9.76s]
Epoch 0: 18%|█▊ | 2250/12384 [4:46:25<21:24:52, 7.61s/it, loss=0.0020, acc=0.9934, iter_time=9.76s]
Epoch 0: 18%|█▊ | 2250/12384 [4:46:32<21:24:52, 7.61s/it, loss=0.0006, acc=0.9995, iter_time=7.20s]
Epoch 0: 18%|█▊ | 2251/12384 [4:46:32<21:24:18, 7.60s/it, loss=0.0006, acc=0.9995, iter_time=7.20s]
Epoch 0: 18%|█▊ | 2251/12384 [4:46:40<21:24:18, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=5.50s]
Epoch 0: 18%|█▊ | 2252/12384 [4:46:40<21:24:55, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.50s]
Epoch 0: 18%|█▊ | 2252/12384 [4:46:48<21:24:55, 7.61s/it, loss=0.0002, acc=0.9983, iter_time=7.17s]
Epoch 0: 18%|█▊ | 2253/12384 [4:46:48<21:25:31, 7.61s/it, loss=0.0002, acc=0.9983, iter_time=7.17s]
Epoch 0: 18%|█▊ | 2253/12384 [4:46:55<21:25:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 0: 18%|█▊ | 2254/12384 [4:46:55<21:25:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 0: 18%|█▊ | 2254/12384 [4:47:03<21:25:39, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 18%|█▊ | 2255/12384 [4:47:03<21:25:45, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 18%|█▊ | 2255/12384 [4:47:10<21:25:45, 7.62s/it, loss=0.0003, acc=0.9988, iter_time=7.58s]
Epoch 0: 18%|█▊ | 2256/12384 [4:47:10<21:26:04, 7.62s/it, loss=0.0003, acc=0.9988, iter_time=7.58s]
Epoch 0: 18%|█▊ | 2256/12384 [4:47:18<21:26:04, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.66s]
Epoch 0: 18%|█▊ | 2257/12384 [4:47:18<21:25:42, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.66s]
Epoch 0: 18%|█▊ | 2257/12384 [4:47:26<21:25:42, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=5.56s]
Epoch 0: 18%|█▊ | 2258/12384 [4:47:26<21:25:41, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=5.56s]
Epoch 0: 18%|█▊ | 2258/12384 [4:47:33<21:25:41, 7.62s/it, loss=0.0007, acc=0.9986, iter_time=8.47s]
Epoch 0: 18%|█▊ | 2259/12384 [4:47:33<21:24:42, 7.61s/it, loss=0.0007, acc=0.9986, iter_time=8.47s]
Epoch 0: 18%|█▊ | 2259/12384 [4:47:41<21:24:42, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.82s]
Epoch 0: 18%|█▊ | 2260/12384 [4:47:41<21:26:58, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.82s]
Epoch 0: 18%|█▊ | 2260/12384 [4:47:48<21:26:58, 7.63s/it, loss=0.0004, acc=0.9980, iter_time=7.06s]
Epoch 0: 18%|█▊ | 2261/12384 [4:47:48<21:24:28, 7.61s/it, loss=0.0004, acc=0.9980, iter_time=7.06s]
Epoch 0: 18%|█▊ | 2261/12384 [4:47:56<21:24:28, 7.61s/it, loss=0.0016, acc=0.9958, iter_time=8.18s]
Epoch 0: 18%|█▊ | 2262/12384 [4:47:56<21:24:46, 7.62s/it, loss=0.0016, acc=0.9958, iter_time=8.18s]
Epoch 0: 18%|█▊ | 2262/12384 [4:48:04<21:24:46, 7.62s/it, loss=0.0007, acc=0.9979, iter_time=7.63s]
Epoch 0: 18%|█▊ | 2263/12384 [4:48:04<21:23:56, 7.61s/it, loss=0.0007, acc=0.9979, iter_time=7.63s]
Epoch 0: 18%|█▊ | 2263/12384 [4:48:11<21:23:56, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.56s]
Epoch 0: 18%|█▊ | 2264/12384 [4:48:11<21:24:08, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.56s]
Epoch 0: 18%|█▊ | 2264/12384 [4:48:19<21:24:08, 7.61s/it, loss=0.0011, acc=0.9992, iter_time=7.65s]
Epoch 0: 18%|█▊ | 2265/12384 [4:48:19<21:24:08, 7.61s/it, loss=0.0011, acc=0.9992, iter_time=7.65s]
Epoch 0: 18%|█▊ | 2265/12384 [4:48:27<21:24:08, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.63s]
Epoch 0: 18%|█▊ | 2266/12384 [4:48:27<21:23:49, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.63s]
Epoch 0: 18%|█▊ | 2266/12384 [4:48:34<21:23:49, 7.61s/it, loss=0.0004, acc=1.0000, iter_time=7.90s]
Epoch 0: 18%|█▊ | 2267/12384 [4:48:34<21:37:39, 7.70s/it, loss=0.0004, acc=1.0000, iter_time=7.90s]
Epoch 0: 18%|█▊ | 2267/12384 [4:48:42<21:37:39, 7.70s/it, loss=0.0003, acc=0.9999, iter_time=7.61s]
Epoch 0: 18%|█▊ | 2268/12384 [4:48:42<21:33:45, 7.67s/it, loss=0.0003, acc=0.9999, iter_time=7.61s]
Epoch 0: 18%|█▊ | 2268/12384 [4:48:50<21:33:45, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 18%|█▊ | 2269/12384 [4:48:50<21:43:06, 7.73s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 18%|█▊ | 2269/12384 [4:48:58<21:43:06, 7.73s/it, loss=0.0002, acc=1.0000, iter_time=7.83s]
Epoch 0: 18%|█▊ | 2270/12384 [4:48:58<21:37:24, 7.70s/it, loss=0.0002, acc=1.0000, iter_time=7.83s]
Epoch 0: 18%|█▊ | 2270/12384 [4:49:05<21:37:24, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 18%|█▊ | 2271/12384 [4:49:05<21:32:50, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 18%|█▊ | 2271/12384 [4:49:13<21:32:50, 7.67s/it, loss=0.0003, acc=0.9994, iter_time=7.99s]
Epoch 0: 18%|█▊ | 2272/12384 [4:49:13<21:30:21, 7.66s/it, loss=0.0003, acc=0.9994, iter_time=7.99s]
Epoch 0: 18%|█▊ | 2272/12384 [4:49:20<21:30:21, 7.66s/it, loss=0.0004, acc=0.9979, iter_time=5.46s]
Epoch 0: 18%|█▊ | 2273/12384 [4:49:20<21:28:19, 7.65s/it, loss=0.0004, acc=0.9979, iter_time=5.46s]
Epoch 0: 18%|█▊ | 2273/12384 [4:49:28<21:28:19, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=9.39s]
Epoch 0: 18%|█▊ | 2274/12384 [4:49:28<21:26:18, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.39s]
Epoch 0: 18%|█▊ | 2274/12384 [4:49:36<21:26:18, 7.63s/it, loss=0.0009, acc=0.9974, iter_time=7.62s]
Epoch 0: 18%|█▊ | 2275/12384 [4:49:36<21:25:37, 7.63s/it, loss=0.0009, acc=0.9974, iter_time=7.62s]
Epoch 0: 18%|█▊ | 2275/12384 [4:49:43<21:25:37, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 18%|█▊ | 2276/12384 [4:49:43<21:24:06, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 18%|█▊ | 2276/12384 [4:49:51<21:24:06, 7.62s/it, loss=0.0016, acc=0.9981, iter_time=7.59s]
Epoch 0: 18%|█▊ | 2277/12384 [4:49:51<21:23:38, 7.62s/it, loss=0.0016, acc=0.9981, iter_time=7.59s]
Epoch 0: 18%|█▊ | 2277/12384 [4:49:59<21:23:38, 7.62s/it, loss=0.0016, acc=0.9956, iter_time=7.63s]
Epoch 0: 18%|█▊ | 2278/12384 [4:49:59<21:28:39, 7.65s/it, loss=0.0016, acc=0.9956, iter_time=7.63s]
Epoch 0: 18%|█▊ | 2278/12384 [4:50:06<21:28:39, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=4.64s]
Epoch 0: 18%|█▊ | 2279/12384 [4:50:06<21:25:31, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=4.64s]
Epoch 0: 18%|█▊ | 2279/12384 [4:50:14<21:25:31, 7.63s/it, loss=0.0036, acc=0.9906, iter_time=11.03s]
Epoch 0: 18%|█▊ | 2280/12384 [4:50:14<21:25:12, 7.63s/it, loss=0.0036, acc=0.9906, iter_time=11.03s]
Epoch 0: 18%|█▊ | 2280/12384 [4:50:21<21:25:12, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=5.80s]
Epoch 0: 18%|█▊ | 2281/12384 [4:50:21<21:23:02, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=5.80s]
Epoch 0: 18%|█▊ | 2281/12384 [4:50:29<21:23:02, 7.62s/it, loss=0.0004, acc=0.9998, iter_time=9.03s]
Epoch 0: 18%|█▊ | 2282/12384 [4:50:29<21:21:30, 7.61s/it, loss=0.0004, acc=0.9998, iter_time=9.03s]
Epoch 0: 18%|█▊ | 2282/12384 [4:50:37<21:21:30, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.68s]
Epoch 0: 18%|█▊ | 2283/12384 [4:50:37<21:20:58, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.68s]
Epoch 0: 18%|█▊ | 2283/12384 [4:50:44<21:20:58, 7.61s/it, loss=0.0005, acc=0.9997, iter_time=8.55s]
Epoch 0: 18%|█▊ | 2284/12384 [4:50:44<21:21:00, 7.61s/it, loss=0.0005, acc=0.9997, iter_time=8.55s]
Epoch 0: 18%|█▊ | 2284/12384 [4:50:52<21:21:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 18%|█▊ | 2285/12384 [4:50:52<21:20:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 18%|█▊ | 2285/12384 [4:50:59<21:20:15, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 18%|█▊ | 2286/12384 [4:50:59<21:19:31, 7.60s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 18%|█▊ | 2286/12384 [4:51:07<21:19:31, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 18%|█▊ | 2287/12384 [4:51:07<21:20:30, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 18%|█▊ | 2287/12384 [4:51:15<21:20:30, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=8.00s]
Epoch 0: 18%|█▊ | 2288/12384 [4:51:15<21:22:04, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=8.00s]
Epoch 0: 18%|█▊ | 2288/12384 [4:51:22<21:22:04, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.25s]
Epoch 0: 18%|█▊ | 2289/12384 [4:51:22<21:20:16, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.25s]
Epoch 0: 18%|█▊ | 2289/12384 [4:51:30<21:20:16, 7.61s/it, loss=0.0002, acc=0.9998, iter_time=7.60s]
Epoch 0: 18%|█▊ | 2290/12384 [4:51:30<21:20:20, 7.61s/it, loss=0.0002, acc=0.9998, iter_time=7.60s]
Epoch 0: 18%|█▊ | 2290/12384 [4:51:37<21:20:20, 7.61s/it, loss=0.0002, acc=0.9984, iter_time=7.62s]
Epoch 0: 18%|█▊ | 2291/12384 [4:51:37<21:19:22, 7.61s/it, loss=0.0002, acc=0.9984, iter_time=7.62s]
Epoch 0: 18%|█▊ | 2291/12384 [4:51:45<21:19:22, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.59s]
Epoch 0: 19%|█▊ | 2292/12384 [4:51:45<21:20:20, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.59s]
Epoch 0: 19%|█▊ | 2292/12384 [4:51:53<21:20:20, 7.61s/it, loss=0.0006, acc=0.9990, iter_time=7.90s]
Epoch 0: 19%|█▊ | 2293/12384 [4:51:53<21:32:53, 7.69s/it, loss=0.0006, acc=0.9990, iter_time=7.90s]
Epoch 0: 19%|█▊ | 2293/12384 [4:52:01<21:32:53, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=5.28s]
Epoch 0: 19%|█▊ | 2294/12384 [4:52:01<21:28:30, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=5.28s]
Epoch 0: 19%|█▊ | 2294/12384 [4:52:08<21:28:30, 7.66s/it, loss=0.0012, acc=0.9977, iter_time=7.83s]
Epoch 0: 19%|█▊ | 2295/12384 [4:52:08<21:25:55, 7.65s/it, loss=0.0012, acc=0.9977, iter_time=7.83s]
Epoch 0: 19%|█▊ | 2295/12384 [4:52:16<21:25:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 0: 19%|█▊ | 2296/12384 [4:52:16<21:40:13, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 0: 19%|█▊ | 2296/12384 [4:52:24<21:40:13, 7.73s/it, loss=0.0014, acc=0.9943, iter_time=5.37s]
Epoch 0: 19%|█▊ | 2297/12384 [4:52:24<21:32:53, 7.69s/it, loss=0.0014, acc=0.9943, iter_time=5.37s]
Epoch 0: 19%|█▊ | 2297/12384 [4:52:31<21:32:53, 7.69s/it, loss=0.0018, acc=0.9982, iter_time=9.88s]
Epoch 0: 19%|█▊ | 2298/12384 [4:52:31<21:28:46, 7.67s/it, loss=0.0018, acc=0.9982, iter_time=9.88s]
Epoch 0: 19%|█▊ | 2298/12384 [4:52:39<21:28:46, 7.67s/it, loss=0.0024, acc=0.9967, iter_time=7.61s]
Epoch 0: 19%|█▊ | 2299/12384 [4:52:39<21:25:07, 7.65s/it, loss=0.0024, acc=0.9967, iter_time=7.61s]
Epoch 0: 19%|█▊ | 2299/12384 [4:52:47<21:25:07, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.03s]
Epoch 0: 19%|█▊ | 2300/12384 [4:52:47<21:25:03, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.03s]
Epoch 0: 19%|█▊ | 2300/12384 [4:52:54<21:25:03, 7.65s/it, loss=0.0001, acc=0.9999, iter_time=7.21s]
Epoch 0: 19%|█▊ | 2301/12384 [4:52:54<21:22:30, 7.63s/it, loss=0.0001, acc=0.9999, iter_time=7.21s]
Epoch 0: 19%|█▊ | 2301/12384 [4:53:02<21:22:30, 7.63s/it, loss=0.0015, acc=0.9954, iter_time=7.59s]
Epoch 0: 19%|█▊ | 2302/12384 [4:53:02<21:21:50, 7.63s/it, loss=0.0015, acc=0.9954, iter_time=7.59s]
Epoch 0: 19%|█▊ | 2302/12384 [4:53:09<21:21:50, 7.63s/it, loss=0.0019, acc=0.9975, iter_time=5.89s]
Epoch 0: 19%|█▊ | 2303/12384 [4:53:09<21:21:32, 7.63s/it, loss=0.0019, acc=0.9975, iter_time=5.89s]
Epoch 0: 19%|█▊ | 2303/12384 [4:53:17<21:21:32, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.32s]
Epoch 0: 19%|█▊ | 2304/12384 [4:53:17<21:21:07, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.32s]
Epoch 0: 19%|█▊ | 2304/12384 [4:53:25<21:21:07, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.58s]
Epoch 0: 19%|█▊ | 2305/12384 [4:53:25<21:20:20, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.58s]
Epoch 0: 19%|█▊ | 2305/12384 [4:53:32<21:20:20, 7.62s/it, loss=0.0004, acc=0.9980, iter_time=9.07s]
Epoch 0: 19%|█▊ | 2306/12384 [4:53:32<21:20:25, 7.62s/it, loss=0.0004, acc=0.9980, iter_time=9.07s]
Epoch 0: 19%|█▊ | 2306/12384 [4:53:40<21:20:25, 7.62s/it, loss=0.0007, acc=0.9979, iter_time=5.22s]
Epoch 0: 19%|█▊ | 2307/12384 [4:53:40<21:19:25, 7.62s/it, loss=0.0007, acc=0.9979, iter_time=5.22s]
Epoch 0: 19%|█▊ | 2307/12384 [4:53:47<21:19:25, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.34s]
Epoch 0: 19%|█▊ | 2308/12384 [4:53:47<21:20:02, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.34s]
Epoch 0: 19%|█▊ | 2308/12384 [4:53:55<21:20:02, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.93s]
Epoch 0: 19%|█▊ | 2309/12384 [4:53:55<21:22:46, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=10.93s]
Epoch 0: 19%|█▊ | 2309/12384 [4:54:03<21:22:46, 7.64s/it, loss=0.0015, acc=0.9974, iter_time=6.72s]
Epoch 0: 19%|█▊ | 2310/12384 [4:54:03<21:21:37, 7.63s/it, loss=0.0015, acc=0.9974, iter_time=6.72s]
Epoch 0: 19%|█▊ | 2310/12384 [4:54:10<21:21:37, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=8.59s]
Epoch 0: 19%|█▊ | 2311/12384 [4:54:10<21:20:24, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=8.59s]
Epoch 0: 19%|█▊ | 2311/12384 [4:54:18<21:20:24, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.98s]
Epoch 0: 19%|█▊ | 2312/12384 [4:54:18<21:19:56, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=7.98s]
Epoch 0: 19%|█▊ | 2312/12384 [4:54:26<21:19:56, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.23s]
Epoch 0: 19%|█▊ | 2313/12384 [4:54:26<21:18:32, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.23s]
Epoch 0: 19%|█▊ | 2313/12384 [4:54:33<21:18:32, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.67s]
Epoch 0: 19%|█▊ | 2314/12384 [4:54:33<21:17:26, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.67s]
Epoch 0: 19%|█▊ | 2314/12384 [4:54:41<21:17:26, 7.61s/it, loss=0.0020, acc=0.9911, iter_time=7.59s]
Epoch 0: 19%|█▊ | 2315/12384 [4:54:41<21:16:37, 7.61s/it, loss=0.0020, acc=0.9911, iter_time=7.59s]
Epoch 0: 19%|█▊ | 2315/12384 [4:54:48<21:16:37, 7.61s/it, loss=0.0007, acc=0.9979, iter_time=6.45s]
Epoch 0: 19%|█▊ | 2316/12384 [4:54:48<21:17:07, 7.61s/it, loss=0.0007, acc=0.9979, iter_time=6.45s]
Epoch 0: 19%|█▊ | 2316/12384 [4:54:56<21:17:07, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 19%|█▊ | 2317/12384 [4:54:56<21:17:46, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 19%|█▊ | 2317/12384 [4:55:04<21:17:46, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.39s]
Epoch 0: 19%|█▊ | 2318/12384 [4:55:04<21:18:16, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.39s]
Epoch 0: 19%|█▊ | 2318/12384 [4:55:11<21:18:16, 7.62s/it, loss=0.0004, acc=0.9988, iter_time=7.89s]
Epoch 0: 19%|█▊ | 2319/12384 [4:55:11<21:18:10, 7.62s/it, loss=0.0004, acc=0.9988, iter_time=7.89s]
Epoch 0: 19%|█▊ | 2319/12384 [4:55:19<21:18:10, 7.62s/it, loss=0.0008, acc=0.9978, iter_time=10.59s]
Epoch 0: 19%|█▊ | 2320/12384 [4:55:19<21:16:33, 7.61s/it, loss=0.0008, acc=0.9978, iter_time=10.59s]
Epoch 0: 19%|█▊ | 2320/12384 [4:55:26<21:16:33, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 19%|█▊ | 2321/12384 [4:55:26<21:15:48, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 19%|█▊ | 2321/12384 [4:55:34<21:15:48, 7.61s/it, loss=0.0013, acc=0.9958, iter_time=7.67s]
Epoch 0: 19%|█▉ | 2322/12384 [4:55:34<21:32:54, 7.71s/it, loss=0.0013, acc=0.9958, iter_time=7.67s]
Epoch 0: 19%|█▉ | 2322/12384 [4:55:42<21:32:54, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 0: 19%|█▉ | 2323/12384 [4:55:42<21:27:44, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 0: 19%|█▉ | 2323/12384 [4:55:50<21:27:44, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=9.67s]
Epoch 0: 19%|█▉ | 2324/12384 [4:55:50<21:24:09, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=9.67s]
Epoch 0: 19%|█▉ | 2324/12384 [4:55:57<21:24:09, 7.66s/it, loss=0.0005, acc=0.9998, iter_time=7.63s]
Epoch 0: 19%|█▉ | 2325/12384 [4:55:57<21:22:10, 7.65s/it, loss=0.0005, acc=0.9998, iter_time=7.63s]
Epoch 0: 19%|█▉ | 2325/12384 [4:56:05<21:22:10, 7.65s/it, loss=0.0008, acc=0.9973, iter_time=7.60s]
Epoch 0: 19%|█▉ | 2326/12384 [4:56:05<21:20:33, 7.64s/it, loss=0.0008, acc=0.9973, iter_time=7.60s]
Epoch 0: 19%|█▉ | 2326/12384 [4:56:13<21:20:33, 7.64s/it, loss=0.0002, acc=0.9998, iter_time=7.63s]
Epoch 0: 19%|█▉ | 2327/12384 [4:56:13<21:19:39, 7.63s/it, loss=0.0002, acc=0.9998, iter_time=7.63s]
Epoch 0: 19%|█▉ | 2327/12384 [4:56:20<21:19:39, 7.63s/it, loss=0.0011, acc=0.9985, iter_time=8.01s]
Epoch 0: 19%|█▉ | 2328/12384 [4:56:20<21:18:14, 7.63s/it, loss=0.0011, acc=0.9985, iter_time=8.01s]
Epoch 0: 19%|█▉ | 2328/12384 [4:56:28<21:18:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.72s]
Epoch 0: 19%|█▉ | 2329/12384 [4:56:28<21:16:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.72s]
Epoch 0: 19%|█▉ | 2329/12384 [4:56:35<21:16:24, 7.62s/it, loss=0.0002, acc=0.9999, iter_time=9.09s]
Epoch 0: 19%|█▉ | 2330/12384 [4:56:35<21:15:33, 7.61s/it, loss=0.0002, acc=0.9999, iter_time=9.09s]
Epoch 0: 19%|█▉ | 2330/12384 [4:56:43<21:15:33, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 19%|█▉ | 2331/12384 [4:56:43<21:16:29, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 19%|█▉ | 2331/12384 [4:56:51<21:16:29, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 19%|█▉ | 2332/12384 [4:56:51<21:15:52, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 19%|█▉ | 2332/12384 [4:56:58<21:15:52, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.68s]
Epoch 0: 19%|█▉ | 2333/12384 [4:56:58<21:14:31, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.68s]
Epoch 0: 19%|█▉ | 2333/12384 [4:57:06<21:14:31, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=6.42s]
Epoch 0: 19%|█▉ | 2334/12384 [4:57:06<21:14:24, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=6.42s]
Epoch 0: 19%|█▉ | 2334/12384 [4:57:13<21:14:24, 7.61s/it, loss=0.0017, acc=0.9957, iter_time=9.70s]
Epoch 0: 19%|█▉ | 2335/12384 [4:57:13<21:14:05, 7.61s/it, loss=0.0017, acc=0.9957, iter_time=9.70s]
Epoch 0: 19%|█▉ | 2335/12384 [4:57:21<21:14:05, 7.61s/it, loss=0.0009, acc=0.9963, iter_time=8.01s]
Epoch 0: 19%|█▉ | 2336/12384 [4:57:21<21:13:55, 7.61s/it, loss=0.0009, acc=0.9963, iter_time=8.01s]
Epoch 0: 19%|█▉ | 2336/12384 [4:57:29<21:13:55, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=4.89s]
Epoch 0: 19%|█▉ | 2337/12384 [4:57:29<21:13:56, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=4.89s]
Epoch 0: 19%|█▉ | 2337/12384 [4:57:36<21:13:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 0: 19%|█▉ | 2338/12384 [4:57:36<21:12:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 0: 19%|█▉ | 2338/12384 [4:57:44<21:12:30, 7.60s/it, loss=0.0001, acc=0.9998, iter_time=7.61s]
Epoch 0: 19%|█▉ | 2339/12384 [4:57:44<21:12:39, 7.60s/it, loss=0.0001, acc=0.9998, iter_time=7.61s]
Epoch 0: 19%|█▉ | 2339/12384 [4:57:51<21:12:39, 7.60s/it, loss=0.0002, acc=0.9998, iter_time=7.62s]
Epoch 0: 19%|█▉ | 2340/12384 [4:57:51<21:16:04, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=7.62s]
Epoch 0: 19%|█▉ | 2340/12384 [4:57:59<21:16:04, 7.62s/it, loss=0.0006, acc=0.9978, iter_time=5.56s]
Epoch 0: 19%|█▉ | 2341/12384 [4:57:59<21:14:36, 7.61s/it, loss=0.0006, acc=0.9978, iter_time=5.56s]
Epoch 0: 19%|█▉ | 2341/12384 [4:58:07<21:14:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 0: 19%|█▉ | 2342/12384 [4:58:07<21:13:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 0: 19%|█▉ | 2342/12384 [4:58:14<21:13:09, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=11.11s]
Epoch 0: 19%|█▉ | 2343/12384 [4:58:14<21:12:43, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=11.11s]
Epoch 0: 19%|█▉ | 2343/12384 [4:58:22<21:12:43, 7.61s/it, loss=0.0003, acc=0.9991, iter_time=7.70s]
Epoch 0: 19%|█▉ | 2344/12384 [4:58:22<21:11:51, 7.60s/it, loss=0.0003, acc=0.9991, iter_time=7.70s]
Epoch 0: 19%|█▉ | 2344/12384 [4:58:29<21:11:51, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.49s]
Epoch 0: 19%|█▉ | 2345/12384 [4:58:29<21:12:30, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.49s]
Epoch 0: 19%|█▉ | 2345/12384 [4:58:37<21:12:30, 7.61s/it, loss=0.0012, acc=0.9975, iter_time=5.08s]
Epoch 0: 19%|█▉ | 2346/12384 [4:58:37<21:14:58, 7.62s/it, loss=0.0012, acc=0.9975, iter_time=5.08s]
Epoch 0: 19%|█▉ | 2346/12384 [4:58:45<21:14:58, 7.62s/it, loss=0.0004, acc=0.9974, iter_time=9.64s]
Epoch 0: 19%|█▉ | 2347/12384 [4:58:45<21:15:00, 7.62s/it, loss=0.0004, acc=0.9974, iter_time=9.64s]
Epoch 0: 19%|█▉ | 2347/12384 [4:58:52<21:15:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 0: 19%|█▉ | 2348/12384 [4:58:52<21:18:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 0: 19%|█▉ | 2348/12384 [4:59:00<21:18:42, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 19%|█▉ | 2349/12384 [4:59:00<21:33:16, 7.73s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 19%|█▉ | 2349/12384 [4:59:08<21:33:16, 7.73s/it, loss=0.0005, acc=0.9976, iter_time=8.29s]
Epoch 0: 19%|█▉ | 2350/12384 [4:59:08<21:26:40, 7.69s/it, loss=0.0005, acc=0.9976, iter_time=8.29s]
Epoch 0: 19%|█▉ | 2350/12384 [4:59:16<21:26:40, 7.69s/it, loss=0.0011, acc=0.9984, iter_time=7.21s]
Epoch 0: 19%|█▉ | 2351/12384 [4:59:16<21:23:05, 7.67s/it, loss=0.0011, acc=0.9984, iter_time=7.21s]
Epoch 0: 19%|█▉ | 2351/12384 [4:59:23<21:23:05, 7.67s/it, loss=0.0006, acc=0.9995, iter_time=8.01s]
Epoch 0: 19%|█▉ | 2352/12384 [4:59:23<21:20:07, 7.66s/it, loss=0.0006, acc=0.9995, iter_time=8.01s]
Epoch 0: 19%|█▉ | 2352/12384 [4:59:31<21:20:07, 7.66s/it, loss=0.0004, acc=0.9984, iter_time=3.05s]
Epoch 0: 19%|█▉ | 2353/12384 [4:59:31<21:17:47, 7.64s/it, loss=0.0004, acc=0.9984, iter_time=3.05s]
Epoch 0: 19%|█▉ | 2353/12384 [4:59:38<21:17:47, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=11.80s]
Epoch 0: 19%|█▉ | 2354/12384 [4:59:38<21:16:38, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=11.80s]
Epoch 0: 19%|█▉ | 2354/12384 [4:59:46<21:16:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 19%|█▉ | 2355/12384 [4:59:46<21:15:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 19%|█▉ | 2355/12384 [4:59:54<21:15:10, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 19%|█▉ | 2356/12384 [4:59:54<21:14:10, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 19%|█▉ | 2356/12384 [5:00:01<21:14:10, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 19%|█▉ | 2357/12384 [5:00:01<21:13:18, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 19%|█▉ | 2357/12384 [5:00:09<21:13:18, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.56s]
Epoch 0: 19%|█▉ | 2358/12384 [5:00:09<21:11:57, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.56s]
Epoch 0: 19%|█▉ | 2358/12384 [5:00:16<21:11:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 0: 19%|█▉ | 2359/12384 [5:00:16<21:11:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 0: 19%|█▉ | 2359/12384 [5:00:24<21:11:25, 7.61s/it, loss=0.0003, acc=0.9979, iter_time=7.56s]
Epoch 0: 19%|█▉ | 2360/12384 [5:00:24<21:11:04, 7.61s/it, loss=0.0003, acc=0.9979, iter_time=7.56s]
Epoch 0: 19%|█▉ | 2360/12384 [5:00:32<21:11:04, 7.61s/it, loss=0.0010, acc=0.9974, iter_time=7.64s]
Epoch 0: 19%|█▉ | 2361/12384 [5:00:32<21:12:09, 7.62s/it, loss=0.0010, acc=0.9974, iter_time=7.64s]
Epoch 0: 19%|█▉ | 2361/12384 [5:00:39<21:12:09, 7.62s/it, loss=0.0004, acc=1.0000, iter_time=7.64s]
Epoch 0: 19%|█▉ | 2362/12384 [5:00:39<21:12:05, 7.62s/it, loss=0.0004, acc=1.0000, iter_time=7.64s]
Epoch 0: 19%|█▉ | 2362/12384 [5:00:47<21:12:05, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 19%|█▉ | 2363/12384 [5:00:47<21:12:05, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 19%|█▉ | 2363/12384 [5:00:55<21:12:05, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.03s]
Epoch 0: 19%|█▉ | 2364/12384 [5:00:55<21:10:40, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.03s]
Epoch 0: 19%|█▉ | 2364/12384 [5:01:02<21:10:40, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.18s]
Epoch 0: 19%|█▉ | 2365/12384 [5:01:02<21:09:44, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=8.18s]
Epoch 0: 19%|█▉ | 2365/12384 [5:01:10<21:09:44, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 19%|█▉ | 2366/12384 [5:01:10<21:09:49, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 19%|█▉ | 2366/12384 [5:01:17<21:09:49, 7.61s/it, loss=0.0003, acc=0.9982, iter_time=4.49s]
Epoch 0: 19%|█▉ | 2367/12384 [5:01:17<21:08:59, 7.60s/it, loss=0.0003, acc=0.9982, iter_time=4.49s]
Epoch 0: 19%|█▉ | 2367/12384 [5:01:25<21:08:59, 7.60s/it, loss=0.0005, acc=0.9990, iter_time=11.09s]
Epoch 0: 19%|█▉ | 2368/12384 [5:01:25<21:08:28, 7.60s/it, loss=0.0005, acc=0.9990, iter_time=11.09s]
Epoch 0: 19%|█▉ | 2368/12384 [5:01:33<21:08:28, 7.60s/it, loss=0.0019, acc=0.9976, iter_time=7.21s]
Epoch 0: 19%|█▉ | 2369/12384 [5:01:33<21:08:39, 7.60s/it, loss=0.0019, acc=0.9976, iter_time=7.21s]
Epoch 0: 19%|█▉ | 2369/12384 [5:01:40<21:08:39, 7.60s/it, loss=0.0001, acc=0.9997, iter_time=7.62s]
Epoch 0: 19%|█▉ | 2370/12384 [5:01:40<21:09:26, 7.61s/it, loss=0.0001, acc=0.9997, iter_time=7.62s]
Epoch 0: 19%|█▉ | 2370/12384 [5:01:48<21:09:26, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 19%|█▉ | 2371/12384 [5:01:48<21:10:02, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 19%|█▉ | 2371/12384 [5:01:55<21:10:02, 7.61s/it, loss=0.0008, acc=0.9982, iter_time=5.63s]
Epoch 0: 19%|█▉ | 2372/12384 [5:01:55<21:09:29, 7.61s/it, loss=0.0008, acc=0.9982, iter_time=5.63s]
Epoch 0: 19%|█▉ | 2372/12384 [5:02:03<21:09:29, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.89s]
Epoch 0: 19%|█▉ | 2373/12384 [5:02:03<21:23:12, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=9.89s]
Epoch 0: 19%|█▉ | 2373/12384 [5:02:11<21:23:12, 7.69s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 19%|█▉ | 2374/12384 [5:02:11<21:21:33, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 19%|█▉ | 2374/12384 [5:02:19<21:21:33, 7.68s/it, loss=0.0001, acc=0.9999, iter_time=6.51s]
Epoch 0: 19%|█▉ | 2375/12384 [5:02:19<21:37:40, 7.78s/it, loss=0.0001, acc=0.9999, iter_time=6.51s]
Epoch 0: 19%|█▉ | 2375/12384 [5:02:27<21:37:40, 7.78s/it, loss=0.0003, acc=1.0000, iter_time=9.10s]
Epoch 0: 19%|█▉ | 2376/12384 [5:02:27<21:28:55, 7.73s/it, loss=0.0003, acc=1.0000, iter_time=9.10s]
Epoch 0: 19%|█▉ | 2376/12384 [5:02:34<21:28:55, 7.73s/it, loss=0.0012, acc=0.9973, iter_time=5.65s]
Epoch 0: 19%|█▉ | 2377/12384 [5:02:34<21:23:55, 7.70s/it, loss=0.0012, acc=0.9973, iter_time=5.65s]
Epoch 0: 19%|█▉ | 2377/12384 [5:02:42<21:23:55, 7.70s/it, loss=0.0004, acc=0.9995, iter_time=9.63s]
Epoch 0: 19%|█▉ | 2378/12384 [5:02:42<21:19:28, 7.67s/it, loss=0.0004, acc=0.9995, iter_time=9.63s]
Epoch 0: 19%|█▉ | 2378/12384 [5:02:49<21:19:28, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 19%|█▉ | 2379/12384 [5:02:49<21:20:33, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 19%|█▉ | 2379/12384 [5:02:57<21:20:33, 7.68s/it, loss=0.0003, acc=0.9986, iter_time=6.77s]
Epoch 0: 19%|█▉ | 2380/12384 [5:02:57<21:17:08, 7.66s/it, loss=0.0003, acc=0.9986, iter_time=6.77s]
Epoch 0: 19%|█▉ | 2380/12384 [5:03:05<21:17:08, 7.66s/it, loss=0.0003, acc=0.9997, iter_time=8.54s]
Epoch 0: 19%|█▉ | 2381/12384 [5:03:05<21:15:24, 7.65s/it, loss=0.0003, acc=0.9997, iter_time=8.54s]
Epoch 0: 19%|█▉ | 2381/12384 [5:03:12<21:15:24, 7.65s/it, loss=0.0001, acc=0.9998, iter_time=6.41s]
Epoch 0: 19%|█▉ | 2382/12384 [5:03:12<21:13:49, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=6.41s]
Epoch 0: 19%|█▉ | 2382/12384 [5:03:20<21:13:49, 7.64s/it, loss=0.0005, acc=0.9998, iter_time=8.84s]
Epoch 0: 19%|█▉ | 2383/12384 [5:03:20<21:15:32, 7.65s/it, loss=0.0005, acc=0.9998, iter_time=8.84s]
Epoch 0: 19%|█▉ | 2383/12384 [5:03:28<21:15:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 0: 19%|█▉ | 2384/12384 [5:03:28<21:14:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 0: 19%|█▉ | 2384/12384 [5:03:35<21:14:07, 7.64s/it, loss=0.0006, acc=0.9991, iter_time=5.69s]
Epoch 0: 19%|█▉ | 2385/12384 [5:03:35<21:12:38, 7.64s/it, loss=0.0006, acc=0.9991, iter_time=5.69s]
Epoch 0: 19%|█▉ | 2385/12384 [5:03:43<21:12:38, 7.64s/it, loss=0.0002, acc=0.9998, iter_time=9.14s]
Epoch 0: 19%|█▉ | 2386/12384 [5:03:43<21:13:38, 7.64s/it, loss=0.0002, acc=0.9998, iter_time=9.14s]
Epoch 0: 19%|█▉ | 2386/12384 [5:03:50<21:13:38, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 0: 19%|█▉ | 2387/12384 [5:03:50<21:11:22, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 0: 19%|█▉ | 2387/12384 [5:03:58<21:11:22, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 19%|█▉ | 2388/12384 [5:03:58<21:12:01, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 19%|█▉ | 2388/12384 [5:04:06<21:12:01, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=4.86s]
Epoch 0: 19%|█▉ | 2389/12384 [5:04:06<21:10:51, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=4.86s]
Epoch 0: 19%|█▉ | 2389/12384 [5:04:13<21:10:51, 7.63s/it, loss=0.0002, acc=0.9992, iter_time=10.39s]
Epoch 0: 19%|█▉ | 2390/12384 [5:04:13<21:09:41, 7.62s/it, loss=0.0002, acc=0.9992, iter_time=10.39s]
Epoch 0: 19%|█▉ | 2390/12384 [5:04:21<21:09:41, 7.62s/it, loss=0.0031, acc=0.9921, iter_time=7.62s]
Epoch 0: 19%|█▉ | 2391/12384 [5:04:21<21:08:22, 7.62s/it, loss=0.0031, acc=0.9921, iter_time=7.62s]
Epoch 0: 19%|█▉ | 2391/12384 [5:04:29<21:08:22, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=7.98s]
Epoch 0: 19%|█▉ | 2392/12384 [5:04:29<21:10:05, 7.63s/it, loss=0.0002, acc=0.9998, iter_time=7.98s]
Epoch 0: 19%|█▉ | 2392/12384 [5:04:36<21:10:05, 7.63s/it, loss=0.0006, acc=0.9998, iter_time=7.26s]
Epoch 0: 19%|█▉ | 2393/12384 [5:04:36<21:08:59, 7.62s/it, loss=0.0006, acc=0.9998, iter_time=7.26s]
Epoch 0: 19%|█▉ | 2393/12384 [5:04:44<21:08:59, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 19%|█▉ | 2394/12384 [5:04:44<21:08:04, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 19%|█▉ | 2394/12384 [5:04:51<21:08:04, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 19%|█▉ | 2395/12384 [5:04:51<21:07:54, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 19%|█▉ | 2395/12384 [5:04:59<21:07:54, 7.62s/it, loss=0.0001, acc=0.9995, iter_time=7.61s]
Epoch 0: 19%|█▉ | 2396/12384 [5:04:59<21:07:00, 7.61s/it, loss=0.0001, acc=0.9995, iter_time=7.61s]
Epoch 0: 19%|█▉ | 2396/12384 [5:05:07<21:07:00, 7.61s/it, loss=0.0004, acc=0.9988, iter_time=7.58s]
Epoch 0: 19%|█▉ | 2397/12384 [5:05:07<21:11:11, 7.64s/it, loss=0.0004, acc=0.9988, iter_time=7.58s]
Epoch 0: 19%|█▉ | 2397/12384 [5:05:14<21:11:11, 7.64s/it, loss=0.0006, acc=0.9976, iter_time=7.70s]
Epoch 0: 19%|█▉ | 2398/12384 [5:05:14<21:09:18, 7.63s/it, loss=0.0006, acc=0.9976, iter_time=7.70s]
Epoch 0: 19%|█▉ | 2398/12384 [5:05:22<21:09:18, 7.63s/it, loss=0.0002, acc=0.9995, iter_time=7.90s]
Epoch 0: 19%|█▉ | 2399/12384 [5:05:22<21:21:52, 7.70s/it, loss=0.0002, acc=0.9995, iter_time=7.90s]
Epoch 0: 19%|█▉ | 2399/12384 [5:05:30<21:21:52, 7.70s/it, loss=0.0008, acc=0.9974, iter_time=7.99s]
Epoch 0: 19%|█▉ | 2400/12384 [5:05:30<21:16:50, 7.67s/it, loss=0.0008, acc=0.9974, iter_time=7.99s]
Epoch 0: 19%|█▉ | 2400/12384 [5:05:38<21:16:50, 7.67s/it, loss=0.0004, acc=0.9981, iter_time=7.25s]
Epoch 0: 19%|█▉ | 2401/12384 [5:05:38<21:28:01, 7.74s/it, loss=0.0004, acc=0.9981, iter_time=7.25s]
Epoch 0: 19%|█▉ | 2401/12384 [5:05:45<21:28:01, 7.74s/it, loss=0.0008, acc=0.9978, iter_time=7.86s]
Epoch 0: 19%|█▉ | 2402/12384 [5:05:45<21:22:13, 7.71s/it, loss=0.0008, acc=0.9978, iter_time=7.86s]
Epoch 0: 19%|█▉ | 2402/12384 [5:05:53<21:22:13, 7.71s/it, loss=0.0007, acc=0.9995, iter_time=7.68s]
Epoch 0: 19%|█▉ | 2403/12384 [5:05:53<21:19:38, 7.69s/it, loss=0.0007, acc=0.9995, iter_time=7.68s]
Epoch 0: 19%|█▉ | 2403/12384 [5:06:01<21:19:38, 7.69s/it, loss=0.0003, acc=0.9994, iter_time=7.61s]
Epoch 0: 19%|█▉ | 2404/12384 [5:06:01<21:15:52, 7.67s/it, loss=0.0003, acc=0.9994, iter_time=7.61s]
Epoch 0: 19%|█▉ | 2404/12384 [5:06:08<21:15:52, 7.67s/it, loss=0.0005, acc=0.9985, iter_time=7.61s]
Epoch 0: 19%|█▉ | 2405/12384 [5:06:08<21:13:54, 7.66s/it, loss=0.0005, acc=0.9985, iter_time=7.61s]
Epoch 0: 19%|█▉ | 2405/12384 [5:06:16<21:13:54, 7.66s/it, loss=0.0001, acc=0.9999, iter_time=7.72s]
Epoch 0: 19%|█▉ | 2406/12384 [5:06:16<21:15:26, 7.67s/it, loss=0.0001, acc=0.9999, iter_time=7.72s]
Epoch 0: 19%|█▉ | 2406/12384 [5:06:24<21:15:26, 7.67s/it, loss=0.0004, acc=0.9978, iter_time=7.59s]
Epoch 0: 19%|█▉ | 2407/12384 [5:06:24<21:12:42, 7.65s/it, loss=0.0004, acc=0.9978, iter_time=7.59s]
Epoch 0: 19%|█▉ | 2407/12384 [5:06:31<21:12:42, 7.65s/it, loss=0.0013, acc=0.9973, iter_time=7.60s]
Epoch 0: 19%|█▉ | 2408/12384 [5:06:31<21:10:58, 7.64s/it, loss=0.0013, acc=0.9973, iter_time=7.60s]
Epoch 0: 19%|█▉ | 2408/12384 [5:06:39<21:10:58, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 19%|█▉ | 2409/12384 [5:06:39<21:07:53, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 19%|█▉ | 2409/12384 [5:06:46<21:07:53, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=4.01s]
Epoch 0: 19%|█▉ | 2410/12384 [5:06:46<21:06:17, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.01s]
Epoch 0: 19%|█▉ | 2410/12384 [5:06:54<21:06:17, 7.62s/it, loss=0.0008, acc=0.9971, iter_time=9.09s]
Epoch 0: 19%|█▉ | 2411/12384 [5:06:54<21:05:25, 7.61s/it, loss=0.0008, acc=0.9971, iter_time=9.09s]
Epoch 0: 19%|█▉ | 2411/12384 [5:07:02<21:05:25, 7.61s/it, loss=0.0008, acc=0.9982, iter_time=9.68s]
Epoch 0: 19%|█▉ | 2412/12384 [5:07:02<21:05:08, 7.61s/it, loss=0.0008, acc=0.9982, iter_time=9.68s]
Epoch 0: 19%|█▉ | 2412/12384 [5:07:09<21:05:08, 7.61s/it, loss=0.0010, acc=0.9971, iter_time=7.62s]
Epoch 0: 19%|█▉ | 2413/12384 [5:07:09<21:06:13, 7.62s/it, loss=0.0010, acc=0.9971, iter_time=7.62s]
Epoch 0: 19%|█▉ | 2413/12384 [5:07:17<21:06:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 0: 19%|█▉ | 2414/12384 [5:07:17<21:05:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 0: 19%|█▉ | 2414/12384 [5:07:24<21:05:37, 7.62s/it, loss=0.0004, acc=0.9998, iter_time=8.23s]
Epoch 0: 20%|█▉ | 2415/12384 [5:07:24<21:04:47, 7.61s/it, loss=0.0004, acc=0.9998, iter_time=8.23s]
Epoch 0: 20%|█▉ | 2415/12384 [5:07:32<21:04:47, 7.61s/it, loss=0.0007, acc=0.9951, iter_time=8.01s]
Epoch 0: 20%|█▉ | 2416/12384 [5:07:32<21:04:50, 7.61s/it, loss=0.0007, acc=0.9951, iter_time=8.01s]
Epoch 0: 20%|█▉ | 2416/12384 [5:07:40<21:04:50, 7.61s/it, loss=0.0003, acc=0.9987, iter_time=7.21s]
Epoch 0: 20%|█▉ | 2417/12384 [5:07:40<21:04:19, 7.61s/it, loss=0.0003, acc=0.9987, iter_time=7.21s]
Epoch 0: 20%|█▉ | 2417/12384 [5:07:47<21:04:19, 7.61s/it, loss=0.0008, acc=0.9966, iter_time=7.60s]
Epoch 0: 20%|█▉ | 2418/12384 [5:07:47<21:03:20, 7.61s/it, loss=0.0008, acc=0.9966, iter_time=7.60s]
Epoch 0: 20%|█▉ | 2418/12384 [5:07:55<21:03:20, 7.61s/it, loss=0.0003, acc=0.9995, iter_time=7.61s]
Epoch 0: 20%|█▉ | 2419/12384 [5:07:55<21:03:20, 7.61s/it, loss=0.0003, acc=0.9995, iter_time=7.61s]
Epoch 0: 20%|█▉ | 2419/12384 [5:08:02<21:03:20, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 20%|█▉ | 2420/12384 [5:08:02<21:03:30, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 20%|█▉ | 2420/12384 [5:08:10<21:03:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 0: 20%|█▉ | 2421/12384 [5:08:10<21:03:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 0: 20%|█▉ | 2421/12384 [5:08:18<21:03:13, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=8.24s]
Epoch 0: 20%|█▉ | 2422/12384 [5:08:18<21:02:46, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=8.24s]
Epoch 0: 20%|█▉ | 2422/12384 [5:08:25<21:02:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 0: 20%|█▉ | 2423/12384 [5:08:25<21:02:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 0: 20%|█▉ | 2423/12384 [5:08:33<21:02:19, 7.60s/it, loss=0.0009, acc=0.9979, iter_time=10.58s]
Epoch 0: 20%|█▉ | 2424/12384 [5:08:33<21:02:26, 7.61s/it, loss=0.0009, acc=0.9979, iter_time=10.58s]
Epoch 0: 20%|█▉ | 2424/12384 [5:08:41<21:02:26, 7.61s/it, loss=0.0017, acc=0.9978, iter_time=7.92s]
Epoch 0: 20%|█▉ | 2425/12384 [5:08:41<21:15:16, 7.68s/it, loss=0.0017, acc=0.9978, iter_time=7.92s]
Epoch 0: 20%|█▉ | 2425/12384 [5:08:48<21:15:16, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 20%|█▉ | 2426/12384 [5:08:48<21:11:51, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 20%|█▉ | 2426/12384 [5:08:56<21:11:51, 7.66s/it, loss=0.0006, acc=0.9998, iter_time=7.66s]
Epoch 0: 20%|█▉ | 2427/12384 [5:08:56<21:23:07, 7.73s/it, loss=0.0006, acc=0.9998, iter_time=7.66s]
Epoch 0: 20%|█▉ | 2427/12384 [5:09:04<21:23:07, 7.73s/it, loss=0.0023, acc=0.9939, iter_time=4.83s]
Epoch 0: 20%|█▉ | 2428/12384 [5:09:04<21:16:47, 7.69s/it, loss=0.0023, acc=0.9939, iter_time=4.83s]
Epoch 0: 20%|█▉ | 2428/12384 [5:09:11<21:16:47, 7.69s/it, loss=0.0001, acc=0.9999, iter_time=10.63s]
Epoch 0: 20%|█▉ | 2429/12384 [5:09:11<21:11:28, 7.66s/it, loss=0.0001, acc=0.9999, iter_time=10.63s]
Epoch 0: 20%|█▉ | 2429/12384 [5:09:19<21:11:28, 7.66s/it, loss=0.0004, acc=0.9980, iter_time=7.60s]
Epoch 0: 20%|█▉ | 2430/12384 [5:09:19<21:08:38, 7.65s/it, loss=0.0004, acc=0.9980, iter_time=7.60s]
Epoch 0: 20%|█▉ | 2430/12384 [5:09:27<21:08:38, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 20%|█▉ | 2431/12384 [5:09:27<21:07:12, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 20%|█▉ | 2431/12384 [5:09:34<21:07:12, 7.64s/it, loss=0.0079, acc=0.9976, iter_time=7.59s]
Epoch 0: 20%|█▉ | 2432/12384 [5:09:34<21:06:22, 7.63s/it, loss=0.0079, acc=0.9976, iter_time=7.59s]
Epoch 0: 20%|█▉ | 2432/12384 [5:09:42<21:06:22, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 20%|█▉ | 2433/12384 [5:09:42<21:05:21, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 20%|█▉ | 2433/12384 [5:09:50<21:05:21, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.64s]
Epoch 0: 20%|█▉ | 2434/12384 [5:09:50<21:04:00, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.64s]
Epoch 0: 20%|█▉ | 2434/12384 [5:09:57<21:04:00, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 20%|█▉ | 2435/12384 [5:09:57<21:03:05, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 20%|█▉ | 2435/12384 [5:10:05<21:03:05, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=7.60s]
Epoch 0: 20%|█▉ | 2436/12384 [5:10:05<21:02:23, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=7.60s]
Epoch 0: 20%|█▉ | 2436/12384 [5:10:12<21:02:23, 7.61s/it, loss=0.0007, acc=0.9977, iter_time=7.62s]
Epoch 0: 20%|█▉ | 2437/12384 [5:10:12<21:03:03, 7.62s/it, loss=0.0007, acc=0.9977, iter_time=7.62s]
Epoch 0: 20%|█▉ | 2437/12384 [5:10:20<21:03:03, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 20%|█▉ | 2438/12384 [5:10:20<21:02:02, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 20%|█▉ | 2438/12384 [5:10:28<21:02:02, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 20%|█▉ | 2439/12384 [5:10:28<21:06:44, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 20%|█▉ | 2439/12384 [5:10:35<21:06:44, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.65s]
Epoch 0: 20%|█▉ | 2440/12384 [5:10:35<21:05:10, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.65s]
Epoch 0: 20%|█▉ | 2440/12384 [5:10:43<21:05:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 20%|█▉ | 2441/12384 [5:10:43<21:05:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 20%|█▉ | 2441/12384 [5:10:51<21:05:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 0: 20%|█▉ | 2442/12384 [5:10:51<21:03:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 0: 20%|█▉ | 2442/12384 [5:10:58<21:03:26, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.43s]
Epoch 0: 20%|█▉ | 2443/12384 [5:10:58<21:02:24, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.43s]
Epoch 0: 20%|█▉ | 2443/12384 [5:11:06<21:02:24, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=9.38s]
Epoch 0: 20%|█▉ | 2444/12384 [5:11:06<21:00:50, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=9.38s]
Epoch 0: 20%|█▉ | 2444/12384 [5:11:13<21:00:50, 7.61s/it, loss=0.0002, acc=0.9998, iter_time=7.58s]
Epoch 0: 20%|█▉ | 2445/12384 [5:11:13<20:59:56, 7.61s/it, loss=0.0002, acc=0.9998, iter_time=7.58s]
Epoch 0: 20%|█▉ | 2445/12384 [5:11:21<20:59:56, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 20%|█▉ | 2446/12384 [5:11:21<20:59:44, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 20%|█▉ | 2446/12384 [5:11:29<20:59:44, 7.61s/it, loss=0.0006, acc=0.9975, iter_time=6.76s]
Epoch 0: 20%|█▉ | 2447/12384 [5:11:29<20:59:51, 7.61s/it, loss=0.0006, acc=0.9975, iter_time=6.76s]
Epoch 0: 20%|█▉ | 2447/12384 [5:11:36<20:59:51, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=8.84s]
Epoch 0: 20%|█▉ | 2448/12384 [5:11:36<20:59:33, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=8.84s]
Epoch 0: 20%|█▉ | 2448/12384 [5:11:44<20:59:33, 7.61s/it, loss=0.0003, acc=0.9990, iter_time=7.22s]
Epoch 0: 20%|█▉ | 2449/12384 [5:11:44<20:58:56, 7.60s/it, loss=0.0003, acc=0.9990, iter_time=7.22s]
Epoch 0: 20%|█▉ | 2449/12384 [5:11:51<20:58:56, 7.60s/it, loss=0.0042, acc=0.9888, iter_time=8.00s]
Epoch 0: 20%|█▉ | 2450/12384 [5:11:51<20:58:56, 7.60s/it, loss=0.0042, acc=0.9888, iter_time=8.00s]
Epoch 0: 20%|█▉ | 2450/12384 [5:11:59<20:58:56, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.52s]
Epoch 0: 20%|█▉ | 2451/12384 [5:11:59<21:13:48, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.52s]
Epoch 0: 20%|█▉ | 2451/12384 [5:12:07<21:13:48, 7.69s/it, loss=0.0007, acc=0.9985, iter_time=5.49s]
Epoch 0: 20%|█▉ | 2452/12384 [5:12:07<21:09:36, 7.67s/it, loss=0.0007, acc=0.9985, iter_time=5.49s]
Epoch 0: 20%|█▉ | 2452/12384 [5:12:15<21:09:36, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=9.13s]
Epoch 0: 20%|█▉ | 2453/12384 [5:12:15<21:24:18, 7.76s/it, loss=0.0002, acc=1.0000, iter_time=9.13s]
Epoch 0: 20%|█▉ | 2453/12384 [5:12:22<21:24:18, 7.76s/it, loss=0.0001, acc=1.0000, iter_time=8.56s]
Epoch 0: 20%|█▉ | 2454/12384 [5:12:22<21:16:42, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=8.56s]
Epoch 0: 20%|█▉ | 2454/12384 [5:12:30<21:16:42, 7.71s/it, loss=0.0007, acc=0.9981, iter_time=5.55s]
Epoch 0: 20%|█▉ | 2455/12384 [5:12:30<21:12:10, 7.69s/it, loss=0.0007, acc=0.9981, iter_time=5.55s]
Epoch 0: 20%|█▉ | 2455/12384 [5:12:38<21:12:10, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 0: 20%|█▉ | 2456/12384 [5:12:38<21:08:46, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 0: 20%|█▉ | 2456/12384 [5:12:45<21:08:46, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=7.66s]
Epoch 0: 20%|█▉ | 2457/12384 [5:12:45<21:06:52, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.66s]
Epoch 0: 20%|█▉ | 2457/12384 [5:12:53<21:06:52, 7.66s/it, loss=0.0008, acc=0.9953, iter_time=5.83s]
Epoch 0: 20%|█▉ | 2458/12384 [5:12:53<21:05:04, 7.65s/it, loss=0.0008, acc=0.9953, iter_time=5.83s]
Epoch 0: 20%|█▉ | 2458/12384 [5:13:01<21:05:04, 7.65s/it, loss=0.0002, acc=0.9987, iter_time=9.42s]
Epoch 0: 20%|█▉ | 2459/12384 [5:13:01<21:03:06, 7.64s/it, loss=0.0002, acc=0.9987, iter_time=9.42s]
Epoch 0: 20%|█▉ | 2459/12384 [5:13:08<21:03:06, 7.64s/it, loss=0.0002, acc=0.9998, iter_time=7.66s]
Epoch 0: 20%|█▉ | 2460/12384 [5:13:08<21:03:44, 7.64s/it, loss=0.0002, acc=0.9998, iter_time=7.66s]
Epoch 0: 20%|█▉ | 2460/12384 [5:13:16<21:03:44, 7.64s/it, loss=0.0001, acc=0.9996, iter_time=7.62s]
Epoch 0: 20%|█▉ | 2461/12384 [5:13:16<21:01:56, 7.63s/it, loss=0.0001, acc=0.9996, iter_time=7.62s]
Epoch 0: 20%|█▉ | 2461/12384 [5:13:24<21:01:56, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 20%|█▉ | 2462/12384 [5:13:24<21:04:55, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 20%|█▉ | 2462/12384 [5:13:31<21:04:55, 7.65s/it, loss=0.0013, acc=0.9985, iter_time=7.37s]
Epoch 0: 20%|█▉ | 2463/12384 [5:13:31<21:02:46, 7.64s/it, loss=0.0013, acc=0.9985, iter_time=7.37s]
Epoch 0: 20%|█▉ | 2463/12384 [5:13:39<21:02:46, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.89s]
Epoch 0: 20%|█▉ | 2464/12384 [5:13:39<21:02:23, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.89s]
Epoch 0: 20%|█▉ | 2464/12384 [5:13:46<21:02:23, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=5.84s]
Epoch 0: 20%|█▉ | 2465/12384 [5:13:46<21:01:02, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=5.84s]
Epoch 0: 20%|█▉ | 2465/12384 [5:13:54<21:01:02, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=9.43s]
Epoch 0: 20%|█▉ | 2466/12384 [5:13:54<21:00:46, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=9.43s]
Epoch 0: 20%|█▉ | 2466/12384 [5:14:02<21:00:46, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=4.56s]
Epoch 0: 20%|█▉ | 2467/12384 [5:14:02<21:00:15, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.56s]
Epoch 0: 20%|█▉ | 2467/12384 [5:14:09<21:00:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.91s]
Epoch 0: 20%|█▉ | 2468/12384 [5:14:09<21:00:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.91s]
Epoch 0: 20%|█▉ | 2468/12384 [5:14:17<21:00:39, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=9.41s]
Epoch 0: 20%|█▉ | 2469/12384 [5:14:17<20:59:06, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=9.41s]
Epoch 0: 20%|█▉ | 2469/12384 [5:14:25<20:59:06, 7.62s/it, loss=0.0004, acc=0.9992, iter_time=7.68s]
Epoch 0: 20%|█▉ | 2470/12384 [5:14:25<21:02:27, 7.64s/it, loss=0.0004, acc=0.9992, iter_time=7.68s]
Epoch 0: 20%|█▉ | 2470/12384 [5:14:32<21:02:27, 7.64s/it, loss=0.0004, acc=0.9999, iter_time=7.60s]
Epoch 0: 20%|█▉ | 2471/12384 [5:14:32<21:00:34, 7.63s/it, loss=0.0004, acc=0.9999, iter_time=7.60s]
Epoch 0: 20%|█▉ | 2471/12384 [5:14:40<21:00:34, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.98s]
Epoch 0: 20%|█▉ | 2472/12384 [5:14:40<20:58:46, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.98s]
Epoch 0: 20%|█▉ | 2472/12384 [5:14:47<20:58:46, 7.62s/it, loss=0.0004, acc=1.0000, iter_time=7.19s]
Epoch 0: 20%|█▉ | 2473/12384 [5:14:47<20:57:27, 7.61s/it, loss=0.0004, acc=1.0000, iter_time=7.19s]
Epoch 0: 20%|█▉ | 2473/12384 [5:14:55<20:57:27, 7.61s/it, loss=0.0009, acc=0.9980, iter_time=7.62s]
Epoch 0: 20%|█▉ | 2474/12384 [5:14:55<20:56:44, 7.61s/it, loss=0.0009, acc=0.9980, iter_time=7.62s]
Epoch 0: 20%|█▉ | 2474/12384 [5:15:03<20:56:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.06s]
Epoch 0: 20%|█▉ | 2475/12384 [5:15:03<20:56:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.06s]
Epoch 0: 20%|█▉ | 2475/12384 [5:15:10<20:56:17, 7.61s/it, loss=0.0001, acc=0.9995, iter_time=9.13s]
Epoch 0: 20%|█▉ | 2476/12384 [5:15:10<20:58:48, 7.62s/it, loss=0.0001, acc=0.9995, iter_time=9.13s]
Epoch 0: 20%|█▉ | 2476/12384 [5:15:18<20:58:48, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.59s]
Epoch 0: 20%|██ | 2477/12384 [5:15:18<20:58:16, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.59s]
Epoch 0: 20%|██ | 2477/12384 [5:15:25<20:58:16, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=4.67s]
Epoch 0: 20%|██ | 2478/12384 [5:15:25<20:57:22, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=4.67s]
Epoch 0: 20%|██ | 2478/12384 [5:15:33<20:57:22, 7.62s/it, loss=0.0011, acc=0.9960, iter_time=10.62s]
Epoch 0: 20%|██ | 2479/12384 [5:15:33<20:56:54, 7.61s/it, loss=0.0011, acc=0.9960, iter_time=10.62s]
Epoch 0: 20%|██ | 2479/12384 [5:15:41<20:56:54, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=8.10s]
Epoch 0: 20%|██ | 2480/12384 [5:15:41<21:16:14, 7.73s/it, loss=0.0002, acc=1.0000, iter_time=8.10s]
Epoch 0: 20%|██ | 2480/12384 [5:15:49<21:16:14, 7.73s/it, loss=0.0006, acc=0.9970, iter_time=7.54s]
Epoch 0: 20%|██ | 2481/12384 [5:15:49<21:13:57, 7.72s/it, loss=0.0006, acc=0.9970, iter_time=7.54s]
Epoch 0: 20%|██ | 2481/12384 [5:15:56<21:13:57, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 20%|██ | 2482/12384 [5:15:56<21:09:10, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 20%|██ | 2482/12384 [5:16:04<21:09:10, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=4.28s]
Epoch 0: 20%|██ | 2483/12384 [5:16:04<21:06:11, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=4.28s]
Epoch 0: 20%|██ | 2483/12384 [5:16:12<21:06:11, 7.67s/it, loss=0.0050, acc=0.9972, iter_time=10.37s]
Epoch 0: 20%|██ | 2484/12384 [5:16:12<21:07:29, 7.68s/it, loss=0.0050, acc=0.9972, iter_time=10.37s]
Epoch 0: 20%|██ | 2484/12384 [5:16:19<21:07:29, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=5.53s]
Epoch 0: 20%|██ | 2485/12384 [5:16:19<21:03:00, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=5.53s]
Epoch 0: 20%|██ | 2485/12384 [5:16:27<21:03:00, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=10.36s]
Epoch 0: 20%|██ | 2486/12384 [5:16:27<20:59:43, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=10.36s]
Epoch 0: 20%|██ | 2486/12384 [5:16:34<20:59:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 20%|██ | 2487/12384 [5:16:34<20:57:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 20%|██ | 2487/12384 [5:16:42<20:57:43, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.54s]
Epoch 0: 20%|██ | 2488/12384 [5:16:42<20:56:10, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.54s]
Epoch 0: 20%|██ | 2488/12384 [5:16:50<20:56:10, 7.62s/it, loss=0.0003, acc=0.9991, iter_time=7.64s]
Epoch 0: 20%|██ | 2489/12384 [5:16:50<20:57:04, 7.62s/it, loss=0.0003, acc=0.9991, iter_time=7.64s]
Epoch 0: 20%|██ | 2489/12384 [5:16:57<20:57:04, 7.62s/it, loss=0.0012, acc=0.9982, iter_time=6.45s]
Epoch 0: 20%|██ | 2490/12384 [5:16:57<20:55:42, 7.62s/it, loss=0.0012, acc=0.9982, iter_time=6.45s]
Epoch 0: 20%|██ | 2490/12384 [5:17:05<20:55:42, 7.62s/it, loss=0.0002, acc=0.9992, iter_time=8.80s]
Epoch 0: 20%|██ | 2491/12384 [5:17:05<20:58:38, 7.63s/it, loss=0.0002, acc=0.9992, iter_time=8.80s]
Epoch 0: 20%|██ | 2491/12384 [5:17:13<20:58:38, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=7.68s]
Epoch 0: 20%|██ | 2492/12384 [5:17:13<20:57:07, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=7.68s]
Epoch 0: 20%|██ | 2492/12384 [5:17:20<20:57:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 20%|██ | 2493/12384 [5:17:20<20:56:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 20%|██ | 2493/12384 [5:17:28<20:56:07, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.80s]
Epoch 0: 20%|██ | 2494/12384 [5:17:28<20:55:40, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.80s]
Epoch 0: 20%|██ | 2494/12384 [5:17:35<20:55:40, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.41s]
Epoch 0: 20%|██ | 2495/12384 [5:17:35<20:55:29, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.41s]
Epoch 0: 20%|██ | 2495/12384 [5:17:43<20:55:29, 7.62s/it, loss=0.0003, acc=0.9982, iter_time=8.00s]
Epoch 0: 20%|██ | 2496/12384 [5:17:43<20:55:35, 7.62s/it, loss=0.0003, acc=0.9982, iter_time=8.00s]
Epoch 0: 20%|██ | 2496/12384 [5:17:51<20:55:35, 7.62s/it, loss=0.0006, acc=0.9987, iter_time=7.24s]
Epoch 0: 20%|██ | 2497/12384 [5:17:51<20:55:22, 7.62s/it, loss=0.0006, acc=0.9987, iter_time=7.24s]
Epoch 0: 20%|██ | 2497/12384 [5:17:58<20:55:22, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=4.32s]
Epoch 0: 20%|██ | 2498/12384 [5:17:58<20:54:51, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=4.32s]
Epoch 0: 20%|██ | 2498/12384 [5:18:06<20:54:51, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=9.10s]
Epoch 0: 20%|██ | 2499/12384 [5:18:06<20:54:22, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=9.10s]
Epoch 0: 20%|██ | 2499/12384 [5:18:13<20:54:22, 7.61s/it, loss=0.0012, acc=0.9991, iter_time=9.82s]
Epoch 0: 20%|██ | 2500/12384 [5:18:14<21:03:17, 7.67s/it, loss=0.0012, acc=0.9991, iter_time=9.82s]
Epoch 0: 20%|██ | 2500/12384 [5:18:21<21:03:17, 7.67s/it, loss=0.0012, acc=0.9951, iter_time=5.12s]
Epoch 0: 20%|██ | 2501/12384 [5:18:21<21:01:02, 7.66s/it, loss=0.0012, acc=0.9951, iter_time=5.12s]
Epoch 0: 20%|██ | 2501/12384 [5:18:29<21:01:02, 7.66s/it, loss=0.0009, acc=1.0000, iter_time=9.88s]
Epoch 0: 20%|██ | 2502/12384 [5:18:29<20:57:38, 7.64s/it, loss=0.0009, acc=1.0000, iter_time=9.88s]
Epoch 0: 20%|██ | 2502/12384 [5:18:37<20:57:38, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 20%|██ | 2503/12384 [5:18:37<20:58:17, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 20%|██ | 2503/12384 [5:18:44<20:58:17, 7.64s/it, loss=0.0005, acc=0.9997, iter_time=8.00s]
Epoch 0: 20%|██ | 2504/12384 [5:18:44<20:56:46, 7.63s/it, loss=0.0005, acc=0.9997, iter_time=8.00s]
Epoch 0: 20%|██ | 2504/12384 [5:18:52<20:56:46, 7.63s/it, loss=0.0008, acc=0.9976, iter_time=7.23s]
Epoch 0: 20%|██ | 2505/12384 [5:18:52<20:54:45, 7.62s/it, loss=0.0008, acc=0.9976, iter_time=7.23s]
Epoch 0: 20%|██ | 2505/12384 [5:19:00<20:54:45, 7.62s/it, loss=0.0004, acc=0.9990, iter_time=7.02s]
Epoch 0: 20%|██ | 2506/12384 [5:19:00<21:10:06, 7.71s/it, loss=0.0004, acc=0.9990, iter_time=7.02s]
Epoch 0: 20%|██ | 2506/12384 [5:19:07<21:10:06, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 0: 20%|██ | 2507/12384 [5:19:07<21:05:08, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 0: 20%|██ | 2507/12384 [5:19:15<21:05:08, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=6.99s]
Epoch 0: 20%|██ | 2508/12384 [5:19:15<21:06:35, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=6.99s]
Epoch 0: 20%|██ | 2508/12384 [5:19:23<21:06:35, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=8.36s]
Epoch 0: 20%|██ | 2509/12384 [5:19:23<21:02:58, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=8.36s]
Epoch 0: 20%|██ | 2509/12384 [5:19:30<21:02:58, 7.67s/it, loss=0.0048, acc=0.9965, iter_time=7.60s]
Epoch 0: 20%|██ | 2510/12384 [5:19:30<20:59:08, 7.65s/it, loss=0.0048, acc=0.9965, iter_time=7.60s]
Epoch 0: 20%|██ | 2510/12384 [5:19:38<20:59:08, 7.65s/it, loss=0.0004, acc=0.9995, iter_time=4.75s]
Epoch 0: 20%|██ | 2511/12384 [5:19:38<20:57:32, 7.64s/it, loss=0.0004, acc=0.9995, iter_time=4.75s]
Epoch 0: 20%|██ | 2511/12384 [5:19:46<20:57:32, 7.64s/it, loss=0.0002, acc=0.9997, iter_time=10.53s]
Epoch 0: 20%|██ | 2512/12384 [5:19:46<21:00:53, 7.66s/it, loss=0.0002, acc=0.9997, iter_time=10.53s]
Epoch 0: 20%|██ | 2512/12384 [5:19:53<21:00:53, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.67s]
Epoch 0: 20%|██ | 2513/12384 [5:19:53<20:57:24, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.67s]
Epoch 0: 20%|██ | 2513/12384 [5:20:01<20:57:24, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=4.54s]
Epoch 0: 20%|██ | 2514/12384 [5:20:01<20:52:30, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.54s]
Epoch 0: 20%|██ | 2514/12384 [5:20:08<20:52:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.60s]
Epoch 0: 20%|██ | 2515/12384 [5:20:08<20:51:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.60s]
Epoch 0: 20%|██ | 2515/12384 [5:20:16<20:51:56, 7.61s/it, loss=0.0003, acc=0.9997, iter_time=6.68s]
Epoch 0: 20%|██ | 2516/12384 [5:20:16<20:51:10, 7.61s/it, loss=0.0003, acc=0.9997, iter_time=6.68s]
Epoch 0: 20%|██ | 2516/12384 [5:20:24<20:51:10, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.52s]
Epoch 0: 20%|██ | 2517/12384 [5:20:24<20:50:01, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=8.52s]
Epoch 0: 20%|██ | 2517/12384 [5:20:31<20:50:01, 7.60s/it, loss=0.0010, acc=0.9984, iter_time=7.60s]
Epoch 0: 20%|██ | 2518/12384 [5:20:31<20:50:01, 7.60s/it, loss=0.0010, acc=0.9984, iter_time=7.60s]
Epoch 0: 20%|██ | 2518/12384 [5:20:39<20:50:01, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 20%|██ | 2519/12384 [5:20:39<20:50:19, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 20%|██ | 2519/12384 [5:20:46<20:50:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 20%|██ | 2520/12384 [5:20:46<20:51:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 20%|██ | 2520/12384 [5:20:54<20:51:39, 7.61s/it, loss=0.0003, acc=0.9986, iter_time=7.21s]
Epoch 0: 20%|██ | 2521/12384 [5:20:54<20:51:12, 7.61s/it, loss=0.0003, acc=0.9986, iter_time=7.21s]
Epoch 0: 20%|██ | 2521/12384 [5:21:02<20:51:12, 7.61s/it, loss=0.0005, acc=0.9991, iter_time=7.59s]
Epoch 0: 20%|██ | 2522/12384 [5:21:02<20:50:48, 7.61s/it, loss=0.0005, acc=0.9991, iter_time=7.59s]
Epoch 0: 20%|██ | 2522/12384 [5:21:09<20:50:48, 7.61s/it, loss=0.0043, acc=0.9953, iter_time=7.61s]
Epoch 0: 20%|██ | 2523/12384 [5:21:09<20:49:42, 7.60s/it, loss=0.0043, acc=0.9953, iter_time=7.61s]
Epoch 0: 20%|██ | 2523/12384 [5:21:17<20:49:42, 7.60s/it, loss=0.0003, acc=0.9990, iter_time=7.58s]
Epoch 0: 20%|██ | 2524/12384 [5:21:17<20:49:04, 7.60s/it, loss=0.0003, acc=0.9990, iter_time=7.58s]
Epoch 0: 20%|██ | 2524/12384 [5:21:24<20:49:04, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 20%|██ | 2525/12384 [5:21:24<20:48:47, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 20%|██ | 2525/12384 [5:21:32<20:48:47, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=4.21s]
Epoch 0: 20%|██ | 2526/12384 [5:21:32<20:49:03, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=4.21s]
Epoch 0: 20%|██ | 2526/12384 [5:21:40<20:49:03, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=10.99s]
Epoch 0: 20%|██ | 2527/12384 [5:21:40<20:49:02, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=10.99s]
Epoch 0: 20%|██ | 2527/12384 [5:21:47<20:49:02, 7.60s/it, loss=0.0002, acc=0.9998, iter_time=7.99s]
Epoch 0: 20%|██ | 2528/12384 [5:21:47<20:49:52, 7.61s/it, loss=0.0002, acc=0.9998, iter_time=7.99s]
Epoch 0: 20%|██ | 2528/12384 [5:21:55<20:49:52, 7.61s/it, loss=0.0056, acc=0.9915, iter_time=3.23s]
Epoch 0: 20%|██ | 2529/12384 [5:21:55<20:50:18, 7.61s/it, loss=0.0056, acc=0.9915, iter_time=3.23s]
Epoch 0: 20%|██ | 2529/12384 [5:22:02<20:50:18, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=8.37s]
Epoch 0: 20%|██ | 2530/12384 [5:22:02<20:49:36, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=8.37s]
Epoch 0: 20%|██ | 2530/12384 [5:22:10<20:49:36, 7.61s/it, loss=0.0011, acc=0.9967, iter_time=10.87s]
Epoch 0: 20%|██ | 2531/12384 [5:22:10<20:50:10, 7.61s/it, loss=0.0011, acc=0.9967, iter_time=10.87s]
Epoch 0: 20%|██ | 2531/12384 [5:22:18<20:50:10, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 20%|██ | 2532/12384 [5:22:18<20:49:27, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 20%|██ | 2532/12384 [5:22:26<20:49:27, 7.61s/it, loss=0.0019, acc=0.9966, iter_time=4.54s]
Epoch 0: 20%|██ | 2533/12384 [5:22:26<21:06:19, 7.71s/it, loss=0.0019, acc=0.9966, iter_time=4.54s]
Epoch 0: 20%|██ | 2533/12384 [5:22:33<21:06:19, 7.71s/it, loss=0.0002, acc=1.0000, iter_time=11.04s]
Epoch 0: 20%|██ | 2534/12384 [5:22:33<21:00:21, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=11.04s]
Epoch 0: 20%|██ | 2534/12384 [5:22:41<21:00:21, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=5.29s]
Epoch 0: 20%|██ | 2535/12384 [5:22:41<20:56:09, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=5.29s]
Epoch 0: 20%|██ | 2535/12384 [5:22:48<20:56:09, 7.65s/it, loss=0.0024, acc=0.9937, iter_time=10.29s]
Epoch 0: 20%|██ | 2536/12384 [5:22:48<20:54:03, 7.64s/it, loss=0.0024, acc=0.9937, iter_time=10.29s]
Epoch 0: 20%|██ | 2536/12384 [5:22:56<20:54:03, 7.64s/it, loss=0.0006, acc=0.9998, iter_time=6.65s]
Epoch 0: 20%|██ | 2537/12384 [5:22:56<20:52:18, 7.63s/it, loss=0.0006, acc=0.9998, iter_time=6.65s]
Epoch 0: 20%|██ | 2537/12384 [5:23:04<20:52:18, 7.63s/it, loss=0.0003, acc=0.9999, iter_time=8.19s]
Epoch 0: 20%|██ | 2538/12384 [5:23:04<20:50:33, 7.62s/it, loss=0.0003, acc=0.9999, iter_time=8.19s]
Epoch 0: 20%|██ | 2538/12384 [5:23:11<20:50:33, 7.62s/it, loss=0.0008, acc=0.9980, iter_time=5.34s]
Epoch 0: 21%|██ | 2539/12384 [5:23:11<20:49:22, 7.61s/it, loss=0.0008, acc=0.9980, iter_time=5.34s]
Epoch 0: 21%|██ | 2539/12384 [5:23:19<20:49:22, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.57s]
Epoch 0: 21%|██ | 2540/12384 [5:23:19<20:50:27, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.57s]
Epoch 0: 21%|██ | 2540/12384 [5:23:26<20:50:27, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.95s]
Epoch 0: 21%|██ | 2541/12384 [5:23:26<20:50:12, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.95s]
Epoch 0: 21%|██ | 2541/12384 [5:23:34<20:50:12, 7.62s/it, loss=0.0005, acc=0.9985, iter_time=7.60s]
Epoch 0: 21%|██ | 2542/12384 [5:23:34<20:49:52, 7.62s/it, loss=0.0005, acc=0.9985, iter_time=7.60s]
Epoch 0: 21%|██ | 2542/12384 [5:23:42<20:49:52, 7.62s/it, loss=0.0006, acc=0.9998, iter_time=7.66s]
Epoch 0: 21%|██ | 2543/12384 [5:23:42<20:51:39, 7.63s/it, loss=0.0006, acc=0.9998, iter_time=7.66s]
Epoch 0: 21%|██ | 2543/12384 [5:23:49<20:51:39, 7.63s/it, loss=0.0022, acc=0.9942, iter_time=7.55s]
Epoch 0: 21%|██ | 2544/12384 [5:23:49<20:50:13, 7.62s/it, loss=0.0022, acc=0.9942, iter_time=7.55s]
Epoch 0: 21%|██ | 2544/12384 [5:23:57<20:50:13, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 21%|██ | 2545/12384 [5:23:57<20:49:09, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 21%|██ | 2545/12384 [5:24:05<20:49:09, 7.62s/it, loss=0.0066, acc=0.9922, iter_time=6.08s]
Epoch 0: 21%|██ | 2546/12384 [5:24:05<20:47:43, 7.61s/it, loss=0.0066, acc=0.9922, iter_time=6.08s]
Epoch 0: 21%|██ | 2546/12384 [5:24:12<20:47:43, 7.61s/it, loss=0.0003, acc=0.9986, iter_time=9.13s]
Epoch 0: 21%|██ | 2547/12384 [5:24:12<20:47:22, 7.61s/it, loss=0.0003, acc=0.9986, iter_time=9.13s]
Epoch 0: 21%|██ | 2547/12384 [5:24:20<20:47:22, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=7.58s]
Epoch 0: 21%|██ | 2548/12384 [5:24:20<20:47:26, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=7.58s]
Epoch 0: 21%|██ | 2548/12384 [5:24:27<20:47:26, 7.61s/it, loss=0.0015, acc=0.9976, iter_time=7.63s]
Epoch 0: 21%|██ | 2549/12384 [5:24:27<20:50:00, 7.63s/it, loss=0.0015, acc=0.9976, iter_time=7.63s]
Epoch 0: 21%|██ | 2549/12384 [5:24:35<20:50:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 0: 21%|██ | 2550/12384 [5:24:35<20:49:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 0: 21%|██ | 2550/12384 [5:24:43<20:49:32, 7.62s/it, loss=0.0002, acc=0.9997, iter_time=7.22s]
Epoch 0: 21%|██ | 2551/12384 [5:24:43<20:49:07, 7.62s/it, loss=0.0002, acc=0.9997, iter_time=7.22s]
Epoch 0: 21%|██ | 2551/12384 [5:24:50<20:49:07, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.98s]
Epoch 0: 21%|██ | 2552/12384 [5:24:50<20:47:15, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.98s]
Epoch 0: 21%|██ | 2552/12384 [5:24:58<20:47:15, 7.61s/it, loss=0.0004, acc=0.9994, iter_time=6.04s]
Epoch 0: 21%|██ | 2553/12384 [5:24:58<20:52:53, 7.65s/it, loss=0.0004, acc=0.9994, iter_time=6.04s]
Epoch 0: 21%|██ | 2553/12384 [5:25:06<20:52:53, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.97s]
Epoch 0: 21%|██ | 2554/12384 [5:25:06<20:49:34, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.97s]
Epoch 0: 21%|██ | 2554/12384 [5:25:13<20:49:34, 7.63s/it, loss=0.0009, acc=0.9971, iter_time=8.53s]
Epoch 0: 21%|██ | 2555/12384 [5:25:13<20:51:44, 7.64s/it, loss=0.0009, acc=0.9971, iter_time=8.53s]
Epoch 0: 21%|██ | 2555/12384 [5:25:21<20:51:44, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=7.37s]
Epoch 0: 21%|██ | 2556/12384 [5:25:21<20:48:34, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=7.37s]
Epoch 0: 21%|██ | 2556/12384 [5:25:28<20:48:34, 7.62s/it, loss=0.0004, acc=0.9986, iter_time=7.87s]
Epoch 0: 21%|██ | 2557/12384 [5:25:28<20:47:08, 7.61s/it, loss=0.0004, acc=0.9986, iter_time=7.87s]
Epoch 0: 21%|██ | 2557/12384 [5:25:36<20:47:08, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.64s]
Epoch 0: 21%|██ | 2558/12384 [5:25:36<20:48:37, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.64s]
Epoch 0: 21%|██ | 2558/12384 [5:25:44<20:48:37, 7.62s/it, loss=0.0003, acc=0.9987, iter_time=7.66s]
Epoch 0: 21%|██ | 2559/12384 [5:25:44<21:07:17, 7.74s/it, loss=0.0003, acc=0.9987, iter_time=7.66s]
Epoch 0: 21%|██ | 2559/12384 [5:25:52<21:07:17, 7.74s/it, loss=0.0001, acc=1.0000, iter_time=7.89s]
Epoch 0: 21%|██ | 2560/12384 [5:25:52<21:00:02, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.89s]
Epoch 0: 21%|██ | 2560/12384 [5:25:59<21:00:02, 7.70s/it, loss=0.0013, acc=0.9972, iter_time=7.66s]
Epoch 0: 21%|██ | 2561/12384 [5:25:59<20:55:55, 7.67s/it, loss=0.0013, acc=0.9972, iter_time=7.66s]
Epoch 0: 21%|██ | 2561/12384 [5:26:07<20:55:55, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 21%|██ | 2562/12384 [5:26:07<20:51:53, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 21%|██ | 2562/12384 [5:26:14<20:51:53, 7.65s/it, loss=0.0007, acc=0.9979, iter_time=7.01s]
Epoch 0: 21%|██ | 2563/12384 [5:26:14<20:50:28, 7.64s/it, loss=0.0007, acc=0.9979, iter_time=7.01s]
Epoch 0: 21%|██ | 2563/12384 [5:26:22<20:50:28, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=8.20s]
Epoch 0: 21%|██ | 2564/12384 [5:26:22<20:49:21, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=8.20s]
Epoch 0: 21%|██ | 2564/12384 [5:26:30<20:49:21, 7.63s/it, loss=0.0009, acc=0.9979, iter_time=7.31s]
Epoch 0: 21%|██ | 2565/12384 [5:26:30<20:48:39, 7.63s/it, loss=0.0009, acc=0.9979, iter_time=7.31s]
Epoch 0: 21%|██ | 2565/12384 [5:26:37<20:48:39, 7.63s/it, loss=0.0020, acc=0.9964, iter_time=7.93s]
Epoch 0: 21%|██ | 2566/12384 [5:26:37<20:46:11, 7.62s/it, loss=0.0020, acc=0.9964, iter_time=7.93s]
Epoch 0: 21%|██ | 2566/12384 [5:26:45<20:46:11, 7.62s/it, loss=0.0002, acc=0.9999, iter_time=7.61s]
Epoch 0: 21%|██ | 2567/12384 [5:26:45<20:46:03, 7.62s/it, loss=0.0002, acc=0.9999, iter_time=7.61s]
Epoch 0: 21%|██ | 2567/12384 [5:26:53<20:46:03, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.00s]
Epoch 0: 21%|██ | 2568/12384 [5:26:53<20:48:34, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.00s]
Epoch 0: 21%|██ | 2568/12384 [5:27:00<20:48:34, 7.63s/it, loss=0.0002, acc=0.9998, iter_time=7.26s]
Epoch 0: 21%|██ | 2569/12384 [5:27:00<20:47:23, 7.63s/it, loss=0.0002, acc=0.9998, iter_time=7.26s]
Epoch 0: 21%|██ | 2569/12384 [5:27:08<20:47:23, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=6.13s]
Epoch 0: 21%|██ | 2570/12384 [5:27:08<20:50:36, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=6.13s]
Epoch 0: 21%|██ | 2570/12384 [5:27:15<20:50:36, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.24s]
Epoch 0: 21%|██ | 2571/12384 [5:27:15<20:47:45, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.24s]
Epoch 0: 21%|██ | 2571/12384 [5:27:23<20:47:45, 7.63s/it, loss=0.0003, acc=0.9998, iter_time=7.33s]
Epoch 0: 21%|██ | 2572/12384 [5:27:23<20:47:03, 7.63s/it, loss=0.0003, acc=0.9998, iter_time=7.33s]
Epoch 0: 21%|██ | 2572/12384 [5:27:31<20:47:03, 7.63s/it, loss=0.0004, acc=0.9994, iter_time=8.82s]
Epoch 0: 21%|██ | 2573/12384 [5:27:31<20:45:05, 7.61s/it, loss=0.0004, acc=0.9994, iter_time=8.82s]
Epoch 0: 21%|██ | 2573/12384 [5:27:38<20:45:05, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 21%|██ | 2574/12384 [5:27:38<20:44:53, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 21%|██ | 2574/12384 [5:27:46<20:44:53, 7.61s/it, loss=0.0309, acc=0.9508, iter_time=7.60s]
Epoch 0: 21%|██ | 2575/12384 [5:27:46<20:44:06, 7.61s/it, loss=0.0309, acc=0.9508, iter_time=7.60s]
Epoch 0: 21%|██ | 2575/12384 [5:27:53<20:44:06, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.00s]
Epoch 0: 21%|██ | 2576/12384 [5:27:53<20:44:13, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.00s]
Epoch 0: 21%|██ | 2576/12384 [5:28:01<20:44:13, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.95s]
Epoch 0: 21%|██ | 2577/12384 [5:28:01<20:47:43, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.95s]
Epoch 0: 21%|██ | 2577/12384 [5:28:09<20:47:43, 7.63s/it, loss=0.0002, acc=0.9990, iter_time=7.95s]
Epoch 0: 21%|██ | 2578/12384 [5:28:09<20:46:06, 7.62s/it, loss=0.0002, acc=0.9990, iter_time=7.95s]
Epoch 0: 21%|██ | 2578/12384 [5:28:16<20:46:06, 7.62s/it, loss=0.0003, acc=0.9986, iter_time=7.60s]
Epoch 0: 21%|██ | 2579/12384 [5:28:16<20:44:26, 7.62s/it, loss=0.0003, acc=0.9986, iter_time=7.60s]
Epoch 0: 21%|██ | 2579/12384 [5:28:24<20:44:26, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 21%|██ | 2580/12384 [5:28:24<20:44:35, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 21%|██ | 2580/12384 [5:28:32<20:44:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 0: 21%|██ | 2581/12384 [5:28:32<20:44:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 0: 21%|██ | 2581/12384 [5:28:39<20:44:44, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=9.42s]
Epoch 0: 21%|██ | 2582/12384 [5:28:39<20:44:31, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=9.42s]
Epoch 0: 21%|██ | 2582/12384 [5:28:47<20:44:31, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.02s]
Epoch 0: 21%|██ | 2583/12384 [5:28:47<20:44:32, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.02s]
Epoch 0: 21%|██ | 2583/12384 [5:28:54<20:44:32, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.60s]
Epoch 0: 21%|██ | 2584/12384 [5:28:54<20:44:37, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.60s]
Epoch 0: 21%|██ | 2584/12384 [5:29:02<20:44:37, 7.62s/it, loss=0.0053, acc=0.9963, iter_time=7.30s]
Epoch 0: 21%|██ | 2585/12384 [5:29:02<21:00:58, 7.72s/it, loss=0.0053, acc=0.9963, iter_time=7.30s]
Epoch 0: 21%|██ | 2585/12384 [5:29:10<21:00:58, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 0: 21%|██ | 2586/12384 [5:29:10<20:54:25, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 0: 21%|██ | 2586/12384 [5:29:18<20:54:25, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 0: 21%|██ | 2587/12384 [5:29:18<20:50:15, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 0: 21%|██ | 2587/12384 [5:29:25<20:50:15, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 21%|██ | 2588/12384 [5:29:25<20:48:04, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 21%|██ | 2588/12384 [5:29:33<20:48:04, 7.64s/it, loss=0.0017, acc=0.9940, iter_time=7.63s]
Epoch 0: 21%|██ | 2589/12384 [5:29:33<20:46:54, 7.64s/it, loss=0.0017, acc=0.9940, iter_time=7.63s]
Epoch 0: 21%|██ | 2589/12384 [5:29:40<20:46:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 0: 21%|██ | 2590/12384 [5:29:40<20:43:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 0: 21%|██ | 2590/12384 [5:29:48<20:43:51, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.86s]
Epoch 0: 21%|██ | 2591/12384 [5:29:48<20:44:23, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.86s]
Epoch 0: 21%|██ | 2591/12384 [5:29:56<20:44:23, 7.62s/it, loss=0.0003, acc=0.9997, iter_time=7.99s]
Epoch 0: 21%|██ | 2592/12384 [5:29:56<20:43:02, 7.62s/it, loss=0.0003, acc=0.9997, iter_time=7.99s]
Epoch 0: 21%|██ | 2592/12384 [5:30:03<20:43:02, 7.62s/it, loss=0.0004, acc=0.9989, iter_time=7.21s]
Epoch 0: 21%|██ | 2593/12384 [5:30:03<20:43:08, 7.62s/it, loss=0.0004, acc=0.9989, iter_time=7.21s]
Epoch 0: 21%|██ | 2593/12384 [5:30:11<20:43:08, 7.62s/it, loss=0.0004, acc=0.9995, iter_time=7.64s]
Epoch 0: 21%|██ | 2594/12384 [5:30:11<20:45:41, 7.63s/it, loss=0.0004, acc=0.9995, iter_time=7.64s]
Epoch 0: 21%|██ | 2594/12384 [5:30:19<20:45:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.81s]
Epoch 0: 21%|██ | 2595/12384 [5:30:19<20:43:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.81s]
Epoch 0: 21%|██ | 2595/12384 [5:30:26<20:43:47, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.93s]
Epoch 0: 21%|██ | 2596/12384 [5:30:26<20:42:30, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.93s]
Epoch 0: 21%|██ | 2596/12384 [5:30:34<20:42:30, 7.62s/it, loss=0.0004, acc=0.9974, iter_time=7.34s]
Epoch 0: 21%|██ | 2597/12384 [5:30:34<20:43:08, 7.62s/it, loss=0.0004, acc=0.9974, iter_time=7.34s]
Epoch 0: 21%|██ | 2597/12384 [5:30:42<20:43:08, 7.62s/it, loss=0.0004, acc=1.0000, iter_time=9.40s]
Epoch 0: 21%|██ | 2598/12384 [5:30:42<20:46:56, 7.65s/it, loss=0.0004, acc=1.0000, iter_time=9.40s]
Epoch 0: 21%|██ | 2598/12384 [5:30:49<20:46:56, 7.65s/it, loss=0.0007, acc=0.9956, iter_time=7.73s]
Epoch 0: 21%|██ | 2599/12384 [5:30:49<20:46:36, 7.64s/it, loss=0.0007, acc=0.9956, iter_time=7.73s]
Epoch 0: 21%|██ | 2599/12384 [5:30:57<20:46:36, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=8.02s]
Epoch 0: 21%|██ | 2600/12384 [5:30:57<20:44:22, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=8.02s]
Epoch 0: 21%|██ | 2600/12384 [5:31:04<20:44:22, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.35s]
Epoch 0: 21%|██ | 2601/12384 [5:31:04<20:42:55, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.35s]
Epoch 0: 21%|██ | 2601/12384 [5:31:12<20:42:55, 7.62s/it, loss=0.0006, acc=0.9975, iter_time=8.46s]
Epoch 0: 21%|██ | 2602/12384 [5:31:12<20:45:34, 7.64s/it, loss=0.0006, acc=0.9975, iter_time=8.46s]
Epoch 0: 21%|██ | 2602/12384 [5:31:20<20:45:34, 7.64s/it, loss=0.0022, acc=0.9964, iter_time=7.68s]
Epoch 0: 21%|██ | 2603/12384 [5:31:20<20:43:11, 7.63s/it, loss=0.0022, acc=0.9964, iter_time=7.68s]
Epoch 0: 21%|██ | 2603/12384 [5:31:27<20:43:11, 7.63s/it, loss=0.0009, acc=0.9979, iter_time=7.60s]
Epoch 0: 21%|██ | 2604/12384 [5:31:27<20:43:28, 7.63s/it, loss=0.0009, acc=0.9979, iter_time=7.60s]
Epoch 0: 21%|██ | 2604/12384 [5:31:35<20:43:28, 7.63s/it, loss=0.0002, acc=0.9991, iter_time=7.62s]
Epoch 0: 21%|██ | 2605/12384 [5:31:35<20:41:47, 7.62s/it, loss=0.0002, acc=0.9991, iter_time=7.62s]
Epoch 0: 21%|██ | 2605/12384 [5:31:42<20:41:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 21%|██ | 2606/12384 [5:31:42<20:40:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 21%|██ | 2606/12384 [5:31:50<20:40:11, 7.61s/it, loss=0.0003, acc=0.9998, iter_time=7.59s]
Epoch 0: 21%|██ | 2607/12384 [5:31:50<20:40:20, 7.61s/it, loss=0.0003, acc=0.9998, iter_time=7.59s]
Epoch 0: 21%|██ | 2607/12384 [5:31:58<20:40:20, 7.61s/it, loss=0.0005, acc=0.9983, iter_time=8.01s]
Epoch 0: 21%|██ | 2608/12384 [5:31:58<20:39:55, 7.61s/it, loss=0.0005, acc=0.9983, iter_time=8.01s]
Epoch 0: 21%|██ | 2608/12384 [5:32:05<20:39:55, 7.61s/it, loss=0.0017, acc=0.9954, iter_time=5.96s]
Epoch 0: 21%|██ | 2609/12384 [5:32:05<20:38:58, 7.60s/it, loss=0.0017, acc=0.9954, iter_time=5.96s]
Epoch 0: 21%|██ | 2609/12384 [5:32:13<20:38:58, 7.60s/it, loss=0.0006, acc=0.9992, iter_time=8.84s]
Epoch 0: 21%|██ | 2610/12384 [5:32:13<20:38:16, 7.60s/it, loss=0.0006, acc=0.9992, iter_time=8.84s]
Epoch 0: 21%|██ | 2610/12384 [5:32:21<20:38:16, 7.60s/it, loss=0.0001, acc=0.9998, iter_time=5.53s]
Epoch 0: 21%|██ | 2611/12384 [5:32:21<20:52:49, 7.69s/it, loss=0.0001, acc=0.9998, iter_time=5.53s]
Epoch 0: 21%|██ | 2611/12384 [5:32:28<20:52:49, 7.69s/it, loss=0.0001, acc=0.9992, iter_time=9.97s]
Epoch 0: 21%|██ | 2612/12384 [5:32:28<20:48:10, 7.66s/it, loss=0.0001, acc=0.9992, iter_time=9.97s]
Epoch 0: 21%|██ | 2612/12384 [5:32:36<20:48:10, 7.66s/it, loss=0.0006, acc=0.9986, iter_time=7.60s]
Epoch 0: 21%|██ | 2613/12384 [5:32:36<20:44:31, 7.64s/it, loss=0.0006, acc=0.9986, iter_time=7.60s]
Epoch 0: 21%|██ | 2613/12384 [5:32:44<20:44:31, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=7.28s]
Epoch 0: 21%|██ | 2614/12384 [5:32:44<20:42:35, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=7.28s]
Epoch 0: 21%|██ | 2614/12384 [5:32:51<20:42:35, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=7.92s]
Epoch 0: 21%|██ | 2615/12384 [5:32:51<20:41:38, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=7.92s]
Epoch 0: 21%|██ | 2615/12384 [5:32:59<20:41:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 21%|██ | 2616/12384 [5:32:59<20:42:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 21%|██ | 2616/12384 [5:33:06<20:42:00, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.23s]
Epoch 0: 21%|██ | 2617/12384 [5:33:06<20:41:51, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.23s]
Epoch 0: 21%|██ | 2617/12384 [5:33:14<20:41:51, 7.63s/it, loss=0.0006, acc=0.9983, iter_time=5.54s]
Epoch 0: 21%|██ | 2618/12384 [5:33:14<20:41:02, 7.62s/it, loss=0.0006, acc=0.9983, iter_time=5.54s]
Epoch 0: 21%|██ | 2618/12384 [5:33:22<20:41:02, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.70s]
Epoch 0: 21%|██ | 2619/12384 [5:33:22<20:40:32, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.70s]
Epoch 0: 21%|██ | 2619/12384 [5:33:29<20:40:32, 7.62s/it, loss=0.0024, acc=0.9961, iter_time=7.62s]
Epoch 0: 21%|██ | 2620/12384 [5:33:29<20:39:21, 7.62s/it, loss=0.0024, acc=0.9961, iter_time=7.62s]
Epoch 0: 21%|██ | 2620/12384 [5:33:37<20:39:21, 7.62s/it, loss=0.0013, acc=0.9957, iter_time=7.60s]
Epoch 0: 21%|██ | 2621/12384 [5:33:37<20:39:29, 7.62s/it, loss=0.0013, acc=0.9957, iter_time=7.60s]
Epoch 0: 21%|██ | 2621/12384 [5:33:44<20:39:29, 7.62s/it, loss=0.0006, acc=0.9996, iter_time=7.61s]
Epoch 0: 21%|██ | 2622/12384 [5:33:44<20:37:52, 7.61s/it, loss=0.0006, acc=0.9996, iter_time=7.61s]
Epoch 0: 21%|██ | 2622/12384 [5:33:52<20:37:52, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 21%|██ | 2623/12384 [5:33:52<20:37:32, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 21%|██ | 2623/12384 [5:34:00<20:37:32, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.98s]
Epoch 0: 21%|██ | 2624/12384 [5:34:00<20:37:14, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.98s]
Epoch 0: 21%|██ | 2624/12384 [5:34:07<20:37:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 0: 21%|██ | 2625/12384 [5:34:07<20:36:35, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 0: 21%|██ | 2625/12384 [5:34:15<20:36:35, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 0: 21%|██ | 2626/12384 [5:34:15<20:37:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 0: 21%|██ | 2626/12384 [5:34:23<20:37:14, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.50s]
Epoch 0: 21%|██ | 2627/12384 [5:34:23<20:38:19, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.50s]
Epoch 0: 21%|██ | 2627/12384 [5:34:30<20:38:19, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=7.34s]
Epoch 0: 21%|██ | 2628/12384 [5:34:30<20:38:53, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=7.34s]
Epoch 0: 21%|██ | 2628/12384 [5:34:38<20:38:53, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=5.71s]
Epoch 0: 21%|██ | 2629/12384 [5:34:38<20:39:39, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=5.71s]
Epoch 0: 21%|██ | 2629/12384 [5:34:45<20:39:39, 7.62s/it, loss=0.0006, acc=0.9990, iter_time=10.48s]
Epoch 0: 21%|██ | 2630/12384 [5:34:45<20:37:43, 7.61s/it, loss=0.0006, acc=0.9990, iter_time=10.48s]
Epoch 0: 21%|██ | 2630/12384 [5:34:53<20:37:43, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 21%|██ | 2631/12384 [5:34:53<20:38:04, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 21%|██ | 2631/12384 [5:35:01<20:38:04, 7.62s/it, loss=0.0009, acc=0.9981, iter_time=7.57s]
Epoch 0: 21%|██▏ | 2632/12384 [5:35:01<20:37:24, 7.61s/it, loss=0.0009, acc=0.9981, iter_time=7.57s]
Epoch 0: 21%|██▏ | 2632/12384 [5:35:08<20:37:24, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.33s]
Epoch 0: 21%|██▏ | 2633/12384 [5:35:08<20:35:58, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.33s]
Epoch 0: 21%|██▏ | 2633/12384 [5:35:16<20:35:58, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.27s]
Epoch 0: 21%|██▏ | 2634/12384 [5:35:16<20:38:23, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.27s]
Epoch 0: 21%|██▏ | 2634/12384 [5:35:23<20:38:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 0: 21%|██▏ | 2635/12384 [5:35:23<20:37:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 0: 21%|██▏ | 2635/12384 [5:35:31<20:37:48, 7.62s/it, loss=0.0038, acc=0.9901, iter_time=7.93s]
Epoch 0: 21%|██▏ | 2636/12384 [5:35:31<20:52:04, 7.71s/it, loss=0.0038, acc=0.9901, iter_time=7.93s]
Epoch 0: 21%|██▏ | 2636/12384 [5:35:39<20:52:04, 7.71s/it, loss=0.0008, acc=0.9986, iter_time=7.64s]
Epoch 0: 21%|██▏ | 2637/12384 [5:35:39<21:02:18, 7.77s/it, loss=0.0008, acc=0.9986, iter_time=7.64s]
Epoch 0: 21%|██▏ | 2637/12384 [5:35:47<21:02:18, 7.77s/it, loss=0.0010, acc=0.9998, iter_time=6.07s]
Epoch 0: 21%|██▏ | 2638/12384 [5:35:47<20:52:56, 7.71s/it, loss=0.0010, acc=0.9998, iter_time=6.07s]
Epoch 0: 21%|██▏ | 2638/12384 [5:35:55<20:52:56, 7.71s/it, loss=0.0082, acc=0.9861, iter_time=9.39s]
Epoch 0: 21%|██▏ | 2639/12384 [5:35:55<20:48:32, 7.69s/it, loss=0.0082, acc=0.9861, iter_time=9.39s]
Epoch 0: 21%|██▏ | 2639/12384 [5:36:02<20:48:32, 7.69s/it, loss=0.0011, acc=0.9975, iter_time=8.02s]
Epoch 0: 21%|██▏ | 2640/12384 [5:36:02<20:45:17, 7.67s/it, loss=0.0011, acc=0.9975, iter_time=8.02s]
Epoch 0: 21%|██▏ | 2640/12384 [5:36:08<20:45:17, 7.67s/it, loss=0.0028, acc=0.9933, iter_time=4.01s]
Epoch 0: 21%|██▏ | 2641/12384 [5:36:08<19:36:03, 7.24s/it, loss=0.0028, acc=0.9933, iter_time=4.01s]
Epoch 0: 21%|██▏ | 2641/12384 [5:36:16<19:36:03, 7.24s/it, loss=0.0003, acc=0.9999, iter_time=9.47s]
Epoch 0: 21%|██▏ | 2642/12384 [5:36:16<19:54:51, 7.36s/it, loss=0.0003, acc=0.9999, iter_time=9.47s]
Epoch 0: 21%|██▏ | 2642/12384 [5:36:24<19:54:51, 7.36s/it, loss=0.0053, acc=0.9927, iter_time=7.63s]
Epoch 0: 21%|██▏ | 2643/12384 [5:36:24<20:06:31, 7.43s/it, loss=0.0053, acc=0.9927, iter_time=7.63s]
Epoch 0: 21%|██▏ | 2643/12384 [5:36:31<20:06:31, 7.43s/it, loss=0.0003, acc=0.9998, iter_time=4.98s]
Epoch 0: 21%|██▏ | 2644/12384 [5:36:31<20:18:18, 7.51s/it, loss=0.0003, acc=0.9998, iter_time=4.98s]
Epoch 0: 21%|██▏ | 2644/12384 [5:36:39<20:18:18, 7.51s/it, loss=0.0003, acc=1.0000, iter_time=10.27s]
Epoch 0: 21%|██▏ | 2645/12384 [5:36:39<20:28:44, 7.57s/it, loss=0.0003, acc=1.0000, iter_time=10.27s]
Epoch 0: 21%|██▏ | 2645/12384 [5:36:47<20:28:44, 7.57s/it, loss=0.0003, acc=1.0000, iter_time=7.75s]
Epoch 0: 21%|██▏ | 2646/12384 [5:36:47<20:30:59, 7.58s/it, loss=0.0003, acc=1.0000, iter_time=7.75s]
Epoch 0: 21%|██▏ | 2646/12384 [5:36:54<20:30:59, 7.58s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 21%|██▏ | 2647/12384 [5:36:54<20:32:08, 7.59s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 21%|██▏ | 2647/12384 [5:37:02<20:32:08, 7.59s/it, loss=0.0001, acc=1.0000, iter_time=7.98s]
Epoch 0: 21%|██▏ | 2648/12384 [5:37:02<20:32:24, 7.59s/it, loss=0.0001, acc=1.0000, iter_time=7.98s]
Epoch 0: 21%|██▏ | 2648/12384 [5:37:09<20:32:24, 7.59s/it, loss=0.0002, acc=0.9998, iter_time=5.45s]
Epoch 0: 21%|██▏ | 2649/12384 [5:37:09<20:32:49, 7.60s/it, loss=0.0002, acc=0.9998, iter_time=5.45s]
Epoch 0: 21%|██▏ | 2649/12384 [5:37:17<20:32:49, 7.60s/it, loss=0.0002, acc=1.0000, iter_time=9.79s]
Epoch 0: 21%|██▏ | 2650/12384 [5:37:17<20:34:01, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=9.79s]
Epoch 0: 21%|██▏ | 2650/12384 [5:37:25<20:34:01, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.20s]
Epoch 0: 21%|██▏ | 2651/12384 [5:37:25<20:34:27, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.20s]
Epoch 0: 21%|██▏ | 2651/12384 [5:37:32<20:34:27, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 21%|██▏ | 2652/12384 [5:37:32<20:34:41, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 21%|██▏ | 2652/12384 [5:37:40<20:34:41, 7.61s/it, loss=0.0005, acc=0.9992, iter_time=4.48s]
Epoch 0: 21%|██▏ | 2653/12384 [5:37:40<20:35:04, 7.62s/it, loss=0.0005, acc=0.9992, iter_time=4.48s]
Epoch 0: 21%|██▏ | 2653/12384 [5:37:48<20:35:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.83s]
Epoch 0: 21%|██▏ | 2654/12384 [5:37:48<20:35:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.83s]
Epoch 0: 21%|██▏ | 2654/12384 [5:37:55<20:35:16, 7.62s/it, loss=0.0010, acc=0.9981, iter_time=8.54s]
Epoch 0: 21%|██▏ | 2655/12384 [5:37:55<20:38:27, 7.64s/it, loss=0.0010, acc=0.9981, iter_time=8.54s]
Epoch 0: 21%|██▏ | 2655/12384 [5:38:03<20:38:27, 7.64s/it, loss=0.0005, acc=0.9998, iter_time=8.09s]
Epoch 0: 21%|██▏ | 2656/12384 [5:38:03<20:38:29, 7.64s/it, loss=0.0005, acc=0.9998, iter_time=8.09s]
Epoch 0: 21%|██▏ | 2656/12384 [5:38:11<20:38:29, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.27s]
Epoch 0: 21%|██▏ | 2657/12384 [5:38:11<20:37:58, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.27s]
Epoch 0: 21%|██▏ | 2657/12384 [5:38:18<20:37:58, 7.64s/it, loss=0.0006, acc=0.9978, iter_time=7.62s]
Epoch 0: 21%|██▏ | 2658/12384 [5:38:18<20:36:05, 7.63s/it, loss=0.0006, acc=0.9978, iter_time=7.62s]
Epoch 0: 21%|██▏ | 2658/12384 [5:38:26<20:36:05, 7.63s/it, loss=0.0001, acc=0.9997, iter_time=7.60s]
Epoch 0: 21%|██▏ | 2659/12384 [5:38:26<20:34:48, 7.62s/it, loss=0.0001, acc=0.9997, iter_time=7.60s]
Epoch 0: 21%|██▏ | 2659/12384 [5:38:33<20:34:48, 7.62s/it, loss=0.0024, acc=0.9961, iter_time=7.60s]
Epoch 0: 21%|██▏ | 2660/12384 [5:38:33<20:34:06, 7.61s/it, loss=0.0024, acc=0.9961, iter_time=7.60s]
Epoch 0: 21%|██▏ | 2660/12384 [5:38:41<20:34:06, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 21%|██▏ | 2661/12384 [5:38:41<20:33:50, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 21%|██▏ | 2661/12384 [5:38:49<20:33:50, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.64s]
Epoch 0: 21%|██▏ | 2662/12384 [5:38:49<20:33:53, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.64s]
Epoch 0: 21%|██▏ | 2662/12384 [5:38:56<20:33:53, 7.62s/it, loss=0.0002, acc=0.9993, iter_time=5.25s]
Epoch 0: 22%|██▏ | 2663/12384 [5:38:56<20:33:40, 7.61s/it, loss=0.0002, acc=0.9993, iter_time=5.25s]
Epoch 0: 22%|██▏ | 2663/12384 [5:39:04<20:33:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.25s]
Epoch 0: 22%|██▏ | 2664/12384 [5:39:04<20:49:51, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.25s]
Epoch 0: 22%|██▏ | 2664/12384 [5:39:12<20:49:51, 7.72s/it, loss=0.0003, acc=0.9996, iter_time=7.65s]
Epoch 0: 22%|██▏ | 2665/12384 [5:39:12<20:44:06, 7.68s/it, loss=0.0003, acc=0.9996, iter_time=7.65s]
Epoch 0: 22%|██▏ | 2665/12384 [5:39:19<20:44:06, 7.68s/it, loss=0.0001, acc=0.9993, iter_time=7.62s]
Epoch 0: 22%|██▏ | 2666/12384 [5:39:19<20:40:35, 7.66s/it, loss=0.0001, acc=0.9993, iter_time=7.62s]
Epoch 0: 22%|██▏ | 2666/12384 [5:39:27<20:40:35, 7.66s/it, loss=0.0012, acc=0.9973, iter_time=7.58s]
Epoch 0: 22%|██▏ | 2667/12384 [5:39:27<20:37:07, 7.64s/it, loss=0.0012, acc=0.9973, iter_time=7.58s]
Epoch 0: 22%|██▏ | 2667/12384 [5:39:35<20:37:07, 7.64s/it, loss=0.0001, acc=0.9999, iter_time=7.61s]
Epoch 0: 22%|██▏ | 2668/12384 [5:39:35<20:35:31, 7.63s/it, loss=0.0001, acc=0.9999, iter_time=7.61s]
Epoch 0: 22%|██▏ | 2668/12384 [5:39:42<20:35:31, 7.63s/it, loss=0.0020, acc=0.9934, iter_time=7.60s]
Epoch 0: 22%|██▏ | 2669/12384 [5:39:42<20:34:17, 7.62s/it, loss=0.0020, acc=0.9934, iter_time=7.60s]
Epoch 0: 22%|██▏ | 2669/12384 [5:39:50<20:34:17, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=7.61s]
Epoch 0: 22%|██▏ | 2670/12384 [5:39:50<20:33:02, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=7.61s]
Epoch 0: 22%|██▏ | 2670/12384 [5:39:57<20:33:02, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.86s]
Epoch 0: 22%|██▏ | 2671/12384 [5:39:57<20:32:42, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.86s]
Epoch 0: 22%|██▏ | 2671/12384 [5:40:05<20:32:42, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=9.74s]
Epoch 0: 22%|██▏ | 2672/12384 [5:40:05<20:33:33, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=9.74s]
Epoch 0: 22%|██▏ | 2672/12384 [5:40:13<20:33:33, 7.62s/it, loss=0.0005, acc=1.0000, iter_time=5.45s]
Epoch 0: 22%|██▏ | 2673/12384 [5:40:13<20:31:45, 7.61s/it, loss=0.0005, acc=1.0000, iter_time=5.45s]
Epoch 0: 22%|██▏ | 2673/12384 [5:40:20<20:31:45, 7.61s/it, loss=0.0002, acc=0.9995, iter_time=8.46s]
Epoch 0: 22%|██▏ | 2674/12384 [5:40:20<20:31:36, 7.61s/it, loss=0.0002, acc=0.9995, iter_time=8.46s]
Epoch 0: 22%|██▏ | 2674/12384 [5:40:28<20:31:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 0: 22%|██▏ | 2675/12384 [5:40:28<20:30:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 0: 22%|██▏ | 2675/12384 [5:40:35<20:30:58, 7.61s/it, loss=0.0004, acc=0.9971, iter_time=4.78s]
Epoch 0: 22%|██▏ | 2676/12384 [5:40:35<20:34:40, 7.63s/it, loss=0.0004, acc=0.9971, iter_time=4.78s]
Epoch 0: 22%|██▏ | 2676/12384 [5:40:43<20:34:40, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.56s]
Epoch 0: 22%|██▏ | 2677/12384 [5:40:43<20:33:39, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.56s]
Epoch 0: 22%|██▏ | 2677/12384 [5:40:51<20:33:39, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.77s]
Epoch 0: 22%|██▏ | 2678/12384 [5:40:51<20:32:10, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.77s]
Epoch 0: 22%|██▏ | 2678/12384 [5:40:58<20:32:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 22%|██▏ | 2679/12384 [5:40:58<20:32:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 22%|██▏ | 2679/12384 [5:41:06<20:32:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.36s]
Epoch 0: 22%|██▏ | 2680/12384 [5:41:06<20:32:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.36s]
Epoch 0: 22%|██▏ | 2680/12384 [5:41:14<20:32:27, 7.62s/it, loss=0.0021, acc=0.9950, iter_time=7.26s]
Epoch 0: 22%|██▏ | 2681/12384 [5:41:14<20:32:08, 7.62s/it, loss=0.0021, acc=0.9950, iter_time=7.26s]
Epoch 0: 22%|██▏ | 2681/12384 [5:41:21<20:32:08, 7.62s/it, loss=0.0006, acc=0.9991, iter_time=6.67s]
Epoch 0: 22%|██▏ | 2682/12384 [5:41:21<20:32:00, 7.62s/it, loss=0.0006, acc=0.9991, iter_time=6.67s]
Epoch 0: 22%|██▏ | 2682/12384 [5:41:29<20:32:00, 7.62s/it, loss=0.0002, acc=0.9996, iter_time=8.54s]
Epoch 0: 22%|██▏ | 2683/12384 [5:41:29<20:30:55, 7.61s/it, loss=0.0002, acc=0.9996, iter_time=8.54s]
Epoch 0: 22%|██▏ | 2683/12384 [5:41:36<20:30:55, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.69s]
Epoch 0: 22%|██▏ | 2684/12384 [5:41:36<20:34:00, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.69s]
Epoch 0: 22%|██▏ | 2684/12384 [5:41:44<20:34:00, 7.63s/it, loss=0.0001, acc=0.9999, iter_time=7.02s]
Epoch 0: 22%|██▏ | 2685/12384 [5:41:44<20:34:55, 7.64s/it, loss=0.0001, acc=0.9999, iter_time=7.02s]
Epoch 0: 22%|██▏ | 2685/12384 [5:41:52<20:34:55, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.24s]
Epoch 0: 22%|██▏ | 2686/12384 [5:41:52<20:34:12, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.24s]
Epoch 0: 22%|██▏ | 2686/12384 [5:41:59<20:34:12, 7.64s/it, loss=0.0005, acc=0.9985, iter_time=7.65s]
Epoch 0: 22%|██▏ | 2687/12384 [5:41:59<20:33:25, 7.63s/it, loss=0.0005, acc=0.9985, iter_time=7.65s]
Epoch 0: 22%|██▏ | 2687/12384 [5:42:07<20:33:25, 7.63s/it, loss=0.0007, acc=0.9991, iter_time=7.56s]
Epoch 0: 22%|██▏ | 2688/12384 [5:42:07<20:32:52, 7.63s/it, loss=0.0007, acc=0.9991, iter_time=7.56s]
Epoch 0: 22%|██▏ | 2688/12384 [5:42:15<20:32:52, 7.63s/it, loss=0.0002, acc=0.9998, iter_time=7.63s]
Epoch 0: 22%|██▏ | 2689/12384 [5:42:15<20:30:13, 7.61s/it, loss=0.0002, acc=0.9998, iter_time=7.63s]
Epoch 0: 22%|██▏ | 2689/12384 [5:42:22<20:30:13, 7.61s/it, loss=0.0004, acc=0.9998, iter_time=5.10s]
Epoch 0: 22%|██▏ | 2690/12384 [5:42:22<20:46:55, 7.72s/it, loss=0.0004, acc=0.9998, iter_time=5.10s]
Epoch 0: 22%|██▏ | 2690/12384 [5:42:30<20:46:55, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=6.49s]
Epoch 0: 22%|██▏ | 2691/12384 [5:42:30<20:42:02, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=6.49s]
Epoch 0: 22%|██▏ | 2691/12384 [5:42:38<20:42:02, 7.69s/it, loss=0.0021, acc=0.9954, iter_time=11.59s]
Epoch 0: 22%|██▏ | 2692/12384 [5:42:38<20:37:04, 7.66s/it, loss=0.0021, acc=0.9954, iter_time=11.59s]
Epoch 0: 22%|██▏ | 2692/12384 [5:42:45<20:37:04, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 22%|██▏ | 2693/12384 [5:42:45<20:35:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 22%|██▏ | 2693/12384 [5:42:53<20:35:43, 7.65s/it, loss=0.0003, acc=0.9998, iter_time=6.78s]
Epoch 0: 22%|██▏ | 2694/12384 [5:42:53<20:32:26, 7.63s/it, loss=0.0003, acc=0.9998, iter_time=6.78s]
Epoch 0: 22%|██▏ | 2694/12384 [5:43:01<20:32:26, 7.63s/it, loss=0.0003, acc=0.9998, iter_time=7.87s]
Epoch 0: 22%|██▏ | 2695/12384 [5:43:01<20:30:43, 7.62s/it, loss=0.0003, acc=0.9998, iter_time=7.87s]
Epoch 0: 22%|██▏ | 2695/12384 [5:43:08<20:30:43, 7.62s/it, loss=0.0004, acc=0.9991, iter_time=8.56s]
Epoch 0: 22%|██▏ | 2696/12384 [5:43:08<20:30:22, 7.62s/it, loss=0.0004, acc=0.9991, iter_time=8.56s]
Epoch 0: 22%|██▏ | 2696/12384 [5:43:16<20:30:22, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=3.94s]
Epoch 0: 22%|██▏ | 2697/12384 [5:43:16<20:28:45, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=3.94s]
Epoch 0: 22%|██▏ | 2697/12384 [5:43:23<20:28:45, 7.61s/it, loss=0.0003, acc=0.9998, iter_time=8.11s]
Epoch 0: 22%|██▏ | 2698/12384 [5:43:23<20:30:07, 7.62s/it, loss=0.0003, acc=0.9998, iter_time=8.11s]
Epoch 0: 22%|██▏ | 2698/12384 [5:43:31<20:30:07, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.89s]
Epoch 0: 22%|██▏ | 2699/12384 [5:43:31<20:29:02, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.89s]
Epoch 0: 22%|██▏ | 2699/12384 [5:43:39<20:29:02, 7.61s/it, loss=0.0048, acc=0.9951, iter_time=10.54s]
Epoch 0: 22%|██▏ | 2700/12384 [5:43:39<20:28:50, 7.61s/it, loss=0.0048, acc=0.9951, iter_time=10.54s]
Epoch 0: 22%|██▏ | 2700/12384 [5:43:46<20:28:50, 7.61s/it, loss=0.0002, acc=0.9996, iter_time=7.21s]
Epoch 0: 22%|██▏ | 2701/12384 [5:43:46<20:28:09, 7.61s/it, loss=0.0002, acc=0.9996, iter_time=7.21s]
Epoch 0: 22%|██▏ | 2701/12384 [5:43:54<20:28:09, 7.61s/it, loss=0.0002, acc=0.9999, iter_time=7.60s]
Epoch 0: 22%|██▏ | 2702/12384 [5:43:54<20:28:22, 7.61s/it, loss=0.0002, acc=0.9999, iter_time=7.60s]
Epoch 0: 22%|██▏ | 2702/12384 [5:44:01<20:28:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 0: 22%|██▏ | 2703/12384 [5:44:01<20:27:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 0: 22%|██▏ | 2703/12384 [5:44:09<20:27:55, 7.61s/it, loss=0.0015, acc=0.9963, iter_time=7.84s]
Epoch 0: 22%|██▏ | 2704/12384 [5:44:09<20:29:44, 7.62s/it, loss=0.0015, acc=0.9963, iter_time=7.84s]
Epoch 0: 22%|██▏ | 2704/12384 [5:44:17<20:29:44, 7.62s/it, loss=0.0001, acc=0.9988, iter_time=4.80s]
Epoch 0: 22%|██▏ | 2705/12384 [5:44:17<20:29:13, 7.62s/it, loss=0.0001, acc=0.9988, iter_time=4.80s]
Epoch 0: 22%|██▏ | 2705/12384 [5:44:24<20:29:13, 7.62s/it, loss=0.0007, acc=1.0000, iter_time=10.46s]
Epoch 0: 22%|██▏ | 2706/12384 [5:44:24<20:27:51, 7.61s/it, loss=0.0007, acc=1.0000, iter_time=10.46s]
Epoch 0: 22%|██▏ | 2706/12384 [5:44:32<20:27:51, 7.61s/it, loss=0.0003, acc=0.9990, iter_time=7.62s]
Epoch 0: 22%|██▏ | 2707/12384 [5:44:32<20:28:25, 7.62s/it, loss=0.0003, acc=0.9990, iter_time=7.62s]
Epoch 0: 22%|██▏ | 2707/12384 [5:44:39<20:28:25, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.63s]
Epoch 0: 22%|██▏ | 2708/12384 [5:44:40<20:28:22, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.63s]
Epoch 0: 22%|██▏ | 2708/12384 [5:44:47<20:28:22, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 22%|██▏ | 2709/12384 [5:44:47<20:28:03, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 22%|██▏ | 2709/12384 [5:44:55<20:28:03, 7.62s/it, loss=0.0002, acc=0.9992, iter_time=7.05s]
Epoch 0: 22%|██▏ | 2710/12384 [5:44:55<20:27:40, 7.61s/it, loss=0.0002, acc=0.9992, iter_time=7.05s]
Epoch 0: 22%|██▏ | 2710/12384 [5:45:02<20:27:40, 7.61s/it, loss=0.0063, acc=0.9969, iter_time=5.10s]
Epoch 0: 22%|██▏ | 2711/12384 [5:45:02<20:27:57, 7.62s/it, loss=0.0063, acc=0.9969, iter_time=5.10s]
Epoch 0: 22%|██▏ | 2711/12384 [5:45:10<20:27:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.78s]
Epoch 0: 22%|██▏ | 2712/12384 [5:45:10<20:27:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.78s]
Epoch 0: 22%|██▏ | 2712/12384 [5:45:18<20:27:02, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=5.19s]
Epoch 0: 22%|██▏ | 2713/12384 [5:45:18<20:27:12, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=5.19s]
Epoch 0: 22%|██▏ | 2713/12384 [5:45:25<20:27:12, 7.61s/it, loss=0.0005, acc=0.9962, iter_time=6.67s]
Epoch 0: 22%|██▏ | 2714/12384 [5:45:25<20:27:16, 7.61s/it, loss=0.0005, acc=0.9962, iter_time=6.67s]
Epoch 0: 22%|██▏ | 2714/12384 [5:45:33<20:27:16, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.86s]
Epoch 0: 22%|██▏ | 2715/12384 [5:45:33<20:26:58, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.86s]
Epoch 0: 22%|██▏ | 2715/12384 [5:45:40<20:26:58, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.08s]
Epoch 0: 22%|██▏ | 2716/12384 [5:45:40<20:25:38, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.08s]
Epoch 0: 22%|██▏ | 2716/12384 [5:45:48<20:25:38, 7.61s/it, loss=0.0003, acc=0.9999, iter_time=7.34s]
Epoch 0: 22%|██▏ | 2717/12384 [5:45:48<20:41:23, 7.70s/it, loss=0.0003, acc=0.9999, iter_time=7.34s]
Epoch 0: 22%|██▏ | 2717/12384 [5:45:56<20:41:23, 7.70s/it, loss=0.0003, acc=0.9991, iter_time=8.74s]
Epoch 0: 22%|██▏ | 2718/12384 [5:45:56<20:37:03, 7.68s/it, loss=0.0003, acc=0.9991, iter_time=8.74s]
Epoch 0: 22%|██▏ | 2718/12384 [5:46:04<20:37:03, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 22%|██▏ | 2719/12384 [5:46:04<20:33:29, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 22%|██▏ | 2719/12384 [5:46:11<20:33:29, 7.66s/it, loss=0.0004, acc=0.9978, iter_time=7.98s]
Epoch 0: 22%|██▏ | 2720/12384 [5:46:11<20:31:10, 7.64s/it, loss=0.0004, acc=0.9978, iter_time=7.98s]
Epoch 0: 22%|██▏ | 2720/12384 [5:46:19<20:31:10, 7.64s/it, loss=0.0003, acc=0.9981, iter_time=7.22s]
Epoch 0: 22%|██▏ | 2721/12384 [5:46:19<20:30:15, 7.64s/it, loss=0.0003, acc=0.9981, iter_time=7.22s]
Epoch 0: 22%|██▏ | 2721/12384 [5:46:26<20:30:15, 7.64s/it, loss=0.0004, acc=0.9982, iter_time=7.65s]
Epoch 0: 22%|██▏ | 2722/12384 [5:46:26<20:29:14, 7.63s/it, loss=0.0004, acc=0.9982, iter_time=7.65s]
Epoch 0: 22%|██▏ | 2722/12384 [5:46:34<20:29:14, 7.63s/it, loss=0.0004, acc=0.9992, iter_time=7.31s]
Epoch 0: 22%|██▏ | 2723/12384 [5:46:34<20:26:55, 7.62s/it, loss=0.0004, acc=0.9992, iter_time=7.31s]
Epoch 0: 22%|██▏ | 2723/12384 [5:46:42<20:26:55, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.27s]
Epoch 0: 22%|██▏ | 2724/12384 [5:46:42<20:26:30, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.27s]
Epoch 0: 22%|██▏ | 2724/12384 [5:46:49<20:26:30, 7.62s/it, loss=0.0006, acc=0.9999, iter_time=8.25s]
Epoch 0: 22%|██▏ | 2725/12384 [5:46:49<20:26:16, 7.62s/it, loss=0.0006, acc=0.9999, iter_time=8.25s]
Epoch 0: 22%|██▏ | 2725/12384 [5:46:57<20:26:16, 7.62s/it, loss=0.0013, acc=0.9973, iter_time=7.59s]
Epoch 0: 22%|██▏ | 2726/12384 [5:46:57<20:26:19, 7.62s/it, loss=0.0013, acc=0.9973, iter_time=7.59s]
Epoch 0: 22%|██▏ | 2726/12384 [5:47:04<20:26:19, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.24s]
Epoch 0: 22%|██▏ | 2727/12384 [5:47:04<20:26:25, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.24s]
Epoch 0: 22%|██▏ | 2727/12384 [5:47:12<20:26:25, 7.62s/it, loss=0.0002, acc=0.9989, iter_time=11.39s]
Epoch 0: 22%|██▏ | 2728/12384 [5:47:12<20:25:19, 7.61s/it, loss=0.0002, acc=0.9989, iter_time=11.39s]
Epoch 0: 22%|██▏ | 2728/12384 [5:47:20<20:25:19, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.22s]
Epoch 0: 22%|██▏ | 2729/12384 [5:47:20<20:25:21, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.22s]
Epoch 0: 22%|██▏ | 2729/12384 [5:47:27<20:25:21, 7.61s/it, loss=0.0031, acc=0.9949, iter_time=7.62s]
Epoch 0: 22%|██▏ | 2730/12384 [5:47:27<20:25:33, 7.62s/it, loss=0.0031, acc=0.9949, iter_time=7.62s]
Epoch 0: 22%|██▏ | 2730/12384 [5:47:35<20:25:33, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=4.80s]
Epoch 0: 22%|██▏ | 2731/12384 [5:47:35<20:24:26, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=4.80s]
Epoch 0: 22%|██▏ | 2731/12384 [5:47:43<20:24:26, 7.61s/it, loss=0.0011, acc=0.9967, iter_time=10.42s]
Epoch 0: 22%|██▏ | 2732/12384 [5:47:43<20:24:19, 7.61s/it, loss=0.0011, acc=0.9967, iter_time=10.42s]
Epoch 0: 22%|██▏ | 2732/12384 [5:47:50<20:24:19, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.06s]
Epoch 0: 22%|██▏ | 2733/12384 [5:47:50<20:24:20, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.06s]
Epoch 0: 22%|██▏ | 2733/12384 [5:47:58<20:24:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 0: 22%|██▏ | 2734/12384 [5:47:58<20:27:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 0: 22%|██▏ | 2734/12384 [5:48:05<20:27:08, 7.63s/it, loss=0.0009, acc=0.9977, iter_time=8.53s]
Epoch 0: 22%|██▏ | 2735/12384 [5:48:05<20:27:05, 7.63s/it, loss=0.0009, acc=0.9977, iter_time=8.53s]
Epoch 0: 22%|██▏ | 2735/12384 [5:48:13<20:27:05, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=10.27s]
Epoch 0: 22%|██▏ | 2736/12384 [5:48:13<20:24:46, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=10.27s]
Epoch 0: 22%|██▏ | 2736/12384 [5:48:21<20:24:46, 7.62s/it, loss=0.0015, acc=1.0000, iter_time=3.92s]
Epoch 0: 22%|██▏ | 2737/12384 [5:48:21<20:25:25, 7.62s/it, loss=0.0015, acc=1.0000, iter_time=3.92s]
Epoch 0: 22%|██▏ | 2737/12384 [5:48:28<20:25:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 0: 22%|██▏ | 2738/12384 [5:48:28<20:25:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 0: 22%|██▏ | 2738/12384 [5:48:36<20:25:08, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.97s]
Epoch 0: 22%|██▏ | 2739/12384 [5:48:36<20:24:23, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.97s]
Epoch 0: 22%|██▏ | 2739/12384 [5:48:44<20:24:23, 7.62s/it, loss=0.0035, acc=0.9946, iter_time=7.93s]
Epoch 0: 22%|██▏ | 2740/12384 [5:48:44<20:38:06, 7.70s/it, loss=0.0035, acc=0.9946, iter_time=7.93s]
Epoch 0: 22%|██▏ | 2740/12384 [5:48:51<20:38:06, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 22%|██▏ | 2741/12384 [5:48:51<20:33:57, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 22%|██▏ | 2741/12384 [5:48:59<20:33:57, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 22%|██▏ | 2742/12384 [5:48:59<20:32:35, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 22%|██▏ | 2742/12384 [5:49:07<20:32:35, 7.67s/it, loss=0.0004, acc=1.0000, iter_time=5.13s]
Epoch 0: 22%|██▏ | 2743/12384 [5:49:07<20:46:48, 7.76s/it, loss=0.0004, acc=1.0000, iter_time=5.13s]
Epoch 0: 22%|██▏ | 2743/12384 [5:49:15<20:46:48, 7.76s/it, loss=0.0016, acc=0.9981, iter_time=10.43s]
Epoch 0: 22%|██▏ | 2744/12384 [5:49:15<20:39:05, 7.71s/it, loss=0.0016, acc=0.9981, iter_time=10.43s]
Epoch 0: 22%|██▏ | 2744/12384 [5:49:22<20:39:05, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 22%|██▏ | 2745/12384 [5:49:22<20:33:30, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 22%|██▏ | 2745/12384 [5:49:30<20:33:30, 7.68s/it, loss=0.0005, acc=0.9985, iter_time=7.61s]
Epoch 0: 22%|██▏ | 2746/12384 [5:49:30<20:29:59, 7.66s/it, loss=0.0005, acc=0.9985, iter_time=7.61s]
Epoch 0: 22%|██▏ | 2746/12384 [5:49:37<20:29:59, 7.66s/it, loss=0.0004, acc=0.9988, iter_time=7.62s]
Epoch 0: 22%|██▏ | 2747/12384 [5:49:37<20:27:40, 7.64s/it, loss=0.0004, acc=0.9988, iter_time=7.62s]
Epoch 0: 22%|██▏ | 2747/12384 [5:49:45<20:27:40, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 22%|██▏ | 2748/12384 [5:49:45<20:24:15, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 22%|██▏ | 2748/12384 [5:49:53<20:24:15, 7.62s/it, loss=0.0008, acc=0.9964, iter_time=7.60s]
Epoch 0: 22%|██▏ | 2749/12384 [5:49:53<20:23:13, 7.62s/it, loss=0.0008, acc=0.9964, iter_time=7.60s]
Epoch 0: 22%|██▏ | 2749/12384 [5:50:00<20:23:13, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=8.06s]
Epoch 0: 22%|██▏ | 2750/12384 [5:50:00<20:25:29, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=8.06s]
Epoch 0: 22%|██▏ | 2750/12384 [5:50:08<20:25:29, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.26s]
Epoch 0: 22%|██▏ | 2751/12384 [5:50:08<20:26:25, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.26s]
Epoch 0: 22%|██▏ | 2751/12384 [5:50:16<20:26:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 22%|██▏ | 2752/12384 [5:50:16<20:25:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 22%|██▏ | 2752/12384 [5:50:23<20:25:55, 7.64s/it, loss=0.0006, acc=0.9998, iter_time=7.24s]
Epoch 0: 22%|██▏ | 2753/12384 [5:50:23<20:24:46, 7.63s/it, loss=0.0006, acc=0.9998, iter_time=7.24s]
Epoch 0: 22%|██▏ | 2753/12384 [5:50:31<20:24:46, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=4.34s]
Epoch 0: 22%|██▏ | 2754/12384 [5:50:31<20:23:41, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=4.34s]
Epoch 0: 22%|██▏ | 2754/12384 [5:50:38<20:23:41, 7.62s/it, loss=0.0026, acc=0.9958, iter_time=10.89s]
Epoch 0: 22%|██▏ | 2755/12384 [5:50:38<20:23:11, 7.62s/it, loss=0.0026, acc=0.9958, iter_time=10.89s]
Epoch 0: 22%|██▏ | 2755/12384 [5:50:46<20:23:11, 7.62s/it, loss=0.0007, acc=0.9998, iter_time=7.62s]
Epoch 0: 22%|██▏ | 2756/12384 [5:50:46<20:22:41, 7.62s/it, loss=0.0007, acc=0.9998, iter_time=7.62s]
Epoch 0: 22%|██▏ | 2756/12384 [5:50:54<20:22:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 22%|██▏ | 2757/12384 [5:50:54<20:27:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 22%|██▏ | 2757/12384 [5:51:01<20:27:28, 7.65s/it, loss=0.0006, acc=0.9976, iter_time=7.71s]
Epoch 0: 22%|██▏ | 2758/12384 [5:51:01<20:25:44, 7.64s/it, loss=0.0006, acc=0.9976, iter_time=7.71s]
Epoch 0: 22%|██▏ | 2758/12384 [5:51:09<20:25:44, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.42s]
Epoch 0: 22%|██▏ | 2759/12384 [5:51:09<20:24:47, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.42s]
Epoch 0: 22%|██▏ | 2759/12384 [5:51:17<20:24:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 0: 22%|██▏ | 2760/12384 [5:51:17<20:24:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 0: 22%|██▏ | 2760/12384 [5:51:24<20:24:00, 7.63s/it, loss=0.0006, acc=0.9981, iter_time=7.65s]
Epoch 0: 22%|██▏ | 2761/12384 [5:51:24<20:22:03, 7.62s/it, loss=0.0006, acc=0.9981, iter_time=7.65s]
Epoch 0: 22%|██▏ | 2761/12384 [5:51:32<20:22:03, 7.62s/it, loss=0.0003, acc=0.9981, iter_time=5.50s]
Epoch 0: 22%|██▏ | 2762/12384 [5:51:32<20:22:01, 7.62s/it, loss=0.0003, acc=0.9981, iter_time=5.50s]
Epoch 0: 22%|██▏ | 2762/12384 [5:51:39<20:22:01, 7.62s/it, loss=0.0008, acc=0.9990, iter_time=9.71s]
Epoch 0: 22%|██▏ | 2763/12384 [5:51:39<20:20:45, 7.61s/it, loss=0.0008, acc=0.9990, iter_time=9.71s]
Epoch 0: 22%|██▏ | 2763/12384 [5:51:47<20:20:45, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 22%|██▏ | 2764/12384 [5:51:47<20:21:54, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 22%|██▏ | 2764/12384 [5:51:55<20:21:54, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.13s]
Epoch 0: 22%|██▏ | 2765/12384 [5:51:55<20:21:04, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.13s]
Epoch 0: 22%|██▏ | 2765/12384 [5:52:02<20:21:04, 7.62s/it, loss=0.0006, acc=0.9983, iter_time=5.97s]
Epoch 0: 22%|██▏ | 2766/12384 [5:52:02<20:19:44, 7.61s/it, loss=0.0006, acc=0.9983, iter_time=5.97s]
Epoch 0: 22%|██▏ | 2766/12384 [5:52:10<20:19:44, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=11.02s]
Epoch 0: 22%|██▏ | 2767/12384 [5:52:10<20:33:18, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=11.02s]
Epoch 0: 22%|██▏ | 2767/12384 [5:52:18<20:33:18, 7.69s/it, loss=0.0003, acc=0.9993, iter_time=7.98s]
Epoch 0: 22%|██▏ | 2768/12384 [5:52:18<20:29:35, 7.67s/it, loss=0.0003, acc=0.9993, iter_time=7.98s]
Epoch 0: 22%|██▏ | 2768/12384 [5:52:26<20:29:35, 7.67s/it, loss=0.0002, acc=0.9992, iter_time=7.27s]
Epoch 0: 22%|██▏ | 2769/12384 [5:52:26<20:40:04, 7.74s/it, loss=0.0002, acc=0.9992, iter_time=7.27s]
Epoch 0: 22%|██▏ | 2769/12384 [5:52:33<20:40:04, 7.74s/it, loss=0.0001, acc=1.0000, iter_time=6.63s]
Epoch 0: 22%|██▏ | 2770/12384 [5:52:33<20:33:52, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=6.63s]
Epoch 0: 22%|██▏ | 2770/12384 [5:52:41<20:33:52, 7.70s/it, loss=0.0004, acc=1.0000, iter_time=8.83s]
Epoch 0: 22%|██▏ | 2771/12384 [5:52:41<20:30:18, 7.68s/it, loss=0.0004, acc=1.0000, iter_time=8.83s]
Epoch 0: 22%|██▏ | 2771/12384 [5:52:49<20:30:18, 7.68s/it, loss=0.0009, acc=0.9968, iter_time=3.61s]
Epoch 0: 22%|██▏ | 2772/12384 [5:52:49<20:26:39, 7.66s/it, loss=0.0009, acc=0.9968, iter_time=3.61s]
Epoch 0: 22%|██▏ | 2772/12384 [5:52:56<20:26:39, 7.66s/it, loss=0.0003, acc=0.9985, iter_time=11.62s]
Epoch 0: 22%|██▏ | 2773/12384 [5:52:56<20:23:22, 7.64s/it, loss=0.0003, acc=0.9985, iter_time=11.62s]
Epoch 0: 22%|██▏ | 2773/12384 [5:53:04<20:23:22, 7.64s/it, loss=0.0013, acc=0.9986, iter_time=6.67s]
Epoch 0: 22%|██▏ | 2774/12384 [5:53:04<20:21:57, 7.63s/it, loss=0.0013, acc=0.9986, iter_time=6.67s]
Epoch 0: 22%|██▏ | 2774/12384 [5:53:11<20:21:57, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.28s]
Epoch 0: 22%|██▏ | 2775/12384 [5:53:11<20:21:00, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.28s]
Epoch 0: 22%|██▏ | 2775/12384 [5:53:19<20:21:00, 7.62s/it, loss=0.0009, acc=1.0000, iter_time=10.23s]
Epoch 0: 22%|██▏ | 2776/12384 [5:53:19<20:20:04, 7.62s/it, loss=0.0009, acc=1.0000, iter_time=10.23s]
Epoch 0: 22%|██▏ | 2776/12384 [5:53:27<20:20:04, 7.62s/it, loss=0.0003, acc=0.9981, iter_time=7.24s]
Epoch 0: 22%|██▏ | 2777/12384 [5:53:27<20:18:37, 7.61s/it, loss=0.0003, acc=0.9981, iter_time=7.24s]
Epoch 0: 22%|██▏ | 2777/12384 [5:53:34<20:18:37, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=7.01s]
Epoch 0: 22%|██▏ | 2778/12384 [5:53:34<20:21:36, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=7.01s]
Epoch 0: 22%|██▏ | 2778/12384 [5:53:42<20:21:36, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.26s]
Epoch 0: 22%|██▏ | 2779/12384 [5:53:42<20:21:18, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.26s]
Epoch 0: 22%|██▏ | 2779/12384 [5:53:49<20:21:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 22%|██▏ | 2780/12384 [5:53:49<20:22:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 22%|██▏ | 2780/12384 [5:53:57<20:22:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 0: 22%|██▏ | 2781/12384 [5:53:57<20:21:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 0: 22%|██▏ | 2781/12384 [5:54:05<20:21:55, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=9.41s]
Epoch 0: 22%|██▏ | 2782/12384 [5:54:05<20:20:16, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=9.41s]
Epoch 0: 22%|██▏ | 2782/12384 [5:54:12<20:20:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 22%|██▏ | 2783/12384 [5:54:12<20:19:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 22%|██▏ | 2783/12384 [5:54:20<20:19:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 22%|██▏ | 2784/12384 [5:54:20<20:20:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 22%|██▏ | 2784/12384 [5:54:28<20:20:26, 7.63s/it, loss=0.0003, acc=0.9998, iter_time=5.84s]
Epoch 0: 22%|██▏ | 2785/12384 [5:54:28<20:19:37, 7.62s/it, loss=0.0003, acc=0.9998, iter_time=5.84s]
Epoch 0: 22%|██▏ | 2785/12384 [5:54:35<20:19:37, 7.62s/it, loss=0.0002, acc=0.9995, iter_time=7.93s]
Epoch 0: 22%|██▏ | 2786/12384 [5:54:35<20:19:28, 7.62s/it, loss=0.0002, acc=0.9995, iter_time=7.93s]
Epoch 0: 22%|██▏ | 2786/12384 [5:54:43<20:19:28, 7.62s/it, loss=0.0007, acc=0.9980, iter_time=8.26s]
Epoch 0: 23%|██▎ | 2787/12384 [5:54:43<20:19:11, 7.62s/it, loss=0.0007, acc=0.9980, iter_time=8.26s]
Epoch 0: 23%|██▎ | 2787/12384 [5:54:50<20:19:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.48s]
Epoch 0: 23%|██▎ | 2788/12384 [5:54:50<20:18:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.48s]
Epoch 0: 23%|██▎ | 2788/12384 [5:54:58<20:18:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 0: 23%|██▎ | 2789/12384 [5:54:58<20:17:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 0: 23%|██▎ | 2789/12384 [5:55:06<20:17:52, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=9.67s]
Epoch 0: 23%|██▎ | 2790/12384 [5:55:06<20:18:01, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=9.67s]
Epoch 0: 23%|██▎ | 2790/12384 [5:55:13<20:18:01, 7.62s/it, loss=0.0009, acc=0.9963, iter_time=7.61s]
Epoch 0: 23%|██▎ | 2791/12384 [5:55:13<20:17:29, 7.61s/it, loss=0.0009, acc=0.9963, iter_time=7.61s]
Epoch 0: 23%|██▎ | 2791/12384 [5:55:21<20:17:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 23%|██▎ | 2792/12384 [5:55:21<20:17:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 23%|██▎ | 2792/12384 [5:55:29<20:17:19, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.15s]
Epoch 0: 23%|██▎ | 2793/12384 [5:55:29<20:17:16, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.15s]
Epoch 0: 23%|██▎ | 2793/12384 [5:55:36<20:17:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 0: 23%|██▎ | 2794/12384 [5:55:36<20:16:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 0: 23%|██▎ | 2794/12384 [5:55:44<20:16:20, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.31s]
Epoch 0: 23%|██▎ | 2795/12384 [5:55:44<20:34:17, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=8.31s]
Epoch 0: 23%|██▎ | 2795/12384 [5:55:52<20:34:17, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 23%|██▎ | 2796/12384 [5:55:52<20:27:45, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 23%|██▎ | 2796/12384 [5:55:59<20:27:45, 7.68s/it, loss=0.0004, acc=0.9986, iter_time=6.42s]
Epoch 0: 23%|██▎ | 2797/12384 [5:55:59<20:24:25, 7.66s/it, loss=0.0004, acc=0.9986, iter_time=6.42s]
Epoch 0: 23%|██▎ | 2797/12384 [5:56:07<20:24:25, 7.66s/it, loss=0.0006, acc=0.9966, iter_time=8.48s]
Epoch 0: 23%|██▎ | 2798/12384 [5:56:07<20:21:42, 7.65s/it, loss=0.0006, acc=0.9966, iter_time=8.48s]
Epoch 0: 23%|██▎ | 2798/12384 [5:56:15<20:21:42, 7.65s/it, loss=0.0010, acc=0.9980, iter_time=7.93s]
Epoch 0: 23%|██▎ | 2799/12384 [5:56:15<20:19:20, 7.63s/it, loss=0.0010, acc=0.9980, iter_time=7.93s]
Epoch 0: 23%|██▎ | 2799/12384 [5:56:22<20:19:20, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.01s]
Epoch 0: 23%|██▎ | 2800/12384 [5:56:22<20:18:48, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.01s]
Epoch 0: 23%|██▎ | 2800/12384 [5:56:30<20:18:48, 7.63s/it, loss=0.0005, acc=0.9986, iter_time=4.87s]
Epoch 0: 23%|██▎ | 2801/12384 [5:56:30<20:16:53, 7.62s/it, loss=0.0005, acc=0.9986, iter_time=4.87s]
Epoch 0: 23%|██▎ | 2801/12384 [5:56:37<20:16:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 0: 23%|██▎ | 2802/12384 [5:56:37<20:15:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 0: 23%|██▎ | 2802/12384 [5:56:45<20:15:31, 7.61s/it, loss=0.0004, acc=0.9995, iter_time=7.03s]
Epoch 0: 23%|██▎ | 2803/12384 [5:56:45<20:15:17, 7.61s/it, loss=0.0004, acc=0.9995, iter_time=7.03s]
Epoch 0: 23%|██▎ | 2803/12384 [5:56:53<20:15:17, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=8.19s]
Epoch 0: 23%|██▎ | 2804/12384 [5:56:53<20:16:51, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=8.19s]
Epoch 0: 23%|██▎ | 2804/12384 [5:57:00<20:16:51, 7.62s/it, loss=0.0010, acc=0.9979, iter_time=7.64s]
Epoch 0: 23%|██▎ | 2805/12384 [5:57:00<20:16:33, 7.62s/it, loss=0.0010, acc=0.9979, iter_time=7.64s]
Epoch 0: 23%|██▎ | 2805/12384 [5:57:08<20:16:33, 7.62s/it, loss=0.0002, acc=0.9997, iter_time=7.62s]
Epoch 0: 23%|██▎ | 2806/12384 [5:57:08<20:19:59, 7.64s/it, loss=0.0002, acc=0.9997, iter_time=7.62s]
Epoch 0: 23%|██▎ | 2806/12384 [5:57:16<20:19:59, 7.64s/it, loss=0.0012, acc=0.9977, iter_time=4.08s]
Epoch 0: 23%|██▎ | 2807/12384 [5:57:16<20:18:58, 7.64s/it, loss=0.0012, acc=0.9977, iter_time=4.08s]
Epoch 0: 23%|██▎ | 2807/12384 [5:57:23<20:18:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.17s]
Epoch 0: 23%|██▎ | 2808/12384 [5:57:23<20:17:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.17s]
Epoch 0: 23%|██▎ | 2808/12384 [5:57:31<20:17:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 0: 23%|██▎ | 2809/12384 [5:57:31<20:16:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 0: 23%|██▎ | 2809/12384 [5:57:38<20:16:38, 7.62s/it, loss=0.0007, acc=0.9986, iter_time=7.27s]
Epoch 0: 23%|██▎ | 2810/12384 [5:57:38<20:20:01, 7.65s/it, loss=0.0007, acc=0.9986, iter_time=7.27s]
Epoch 0: 23%|██▎ | 2810/12384 [5:57:46<20:20:01, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.78s]
Epoch 0: 23%|██▎ | 2811/12384 [5:57:46<20:18:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.78s]
Epoch 0: 23%|██▎ | 2811/12384 [5:57:54<20:18:41, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=5.55s]
Epoch 0: 23%|██▎ | 2812/12384 [5:57:54<20:17:17, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=5.55s]
Epoch 0: 23%|██▎ | 2812/12384 [5:58:01<20:17:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 0: 23%|██▎ | 2813/12384 [5:58:01<20:15:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 0: 23%|██▎ | 2813/12384 [5:58:09<20:15:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 0: 23%|██▎ | 2814/12384 [5:58:09<20:14:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 0: 23%|██▎ | 2814/12384 [5:58:16<20:14:49, 7.62s/it, loss=0.0007, acc=0.9980, iter_time=7.35s]
Epoch 0: 23%|██▎ | 2815/12384 [5:58:16<20:14:28, 7.62s/it, loss=0.0007, acc=0.9980, iter_time=7.35s]
Epoch 0: 23%|██▎ | 2815/12384 [5:58:24<20:14:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 0: 23%|██▎ | 2816/12384 [5:58:24<20:14:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 0: 23%|██▎ | 2816/12384 [5:58:32<20:14:00, 7.61s/it, loss=0.0010, acc=0.9988, iter_time=6.04s]
Epoch 0: 23%|██▎ | 2817/12384 [5:58:32<20:13:08, 7.61s/it, loss=0.0010, acc=0.9988, iter_time=6.04s]
Epoch 0: 23%|██▎ | 2817/12384 [5:58:39<20:13:08, 7.61s/it, loss=0.0001, acc=0.9993, iter_time=8.48s]
Epoch 0: 23%|██▎ | 2818/12384 [5:58:39<20:12:19, 7.60s/it, loss=0.0001, acc=0.9993, iter_time=8.48s]
Epoch 0: 23%|██▎ | 2818/12384 [5:58:47<20:12:19, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.93s]
Epoch 0: 23%|██▎ | 2819/12384 [5:58:47<20:13:09, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.93s]
Epoch 0: 23%|██▎ | 2819/12384 [5:58:54<20:13:09, 7.61s/it, loss=0.0009, acc=0.9971, iter_time=6.15s]
Epoch 0: 23%|██▎ | 2820/12384 [5:58:54<20:12:35, 7.61s/it, loss=0.0009, acc=0.9971, iter_time=6.15s]
Epoch 0: 23%|██▎ | 2820/12384 [5:59:02<20:12:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 0: 23%|██▎ | 2821/12384 [5:59:02<20:27:23, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 0: 23%|██▎ | 2821/12384 [5:59:10<20:27:23, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 0: 23%|██▎ | 2822/12384 [5:59:10<20:26:41, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 0: 23%|██▎ | 2822/12384 [5:59:18<20:26:41, 7.70s/it, loss=0.0006, acc=0.9978, iter_time=5.89s]
Epoch 0: 23%|██▎ | 2823/12384 [5:59:18<20:22:31, 7.67s/it, loss=0.0006, acc=0.9978, iter_time=5.89s]
Epoch 0: 23%|██▎ | 2823/12384 [5:59:25<20:22:31, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=9.36s]
Epoch 0: 23%|██▎ | 2824/12384 [5:59:25<20:19:17, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=9.36s]
Epoch 0: 23%|██▎ | 2824/12384 [5:59:33<20:19:17, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.73s]
Epoch 0: 23%|██▎ | 2825/12384 [5:59:33<20:20:32, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.73s]
Epoch 0: 23%|██▎ | 2825/12384 [5:59:41<20:20:32, 7.66s/it, loss=0.0001, acc=0.9998, iter_time=7.62s]
Epoch 0: 23%|██▎ | 2826/12384 [5:59:41<20:18:35, 7.65s/it, loss=0.0001, acc=0.9998, iter_time=7.62s]
Epoch 0: 23%|██▎ | 2826/12384 [5:59:48<20:18:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 23%|██▎ | 2827/12384 [5:59:48<20:20:38, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 23%|██▎ | 2827/12384 [5:59:56<20:20:38, 7.66s/it, loss=0.0009, acc=0.9978, iter_time=7.37s]
Epoch 0: 23%|██▎ | 2828/12384 [5:59:56<20:17:38, 7.65s/it, loss=0.0009, acc=0.9978, iter_time=7.37s]
Epoch 0: 23%|██▎ | 2828/12384 [6:00:04<20:17:38, 7.65s/it, loss=0.0003, acc=0.9997, iter_time=6.79s]
Epoch 0: 23%|██▎ | 2829/12384 [6:00:04<20:16:20, 7.64s/it, loss=0.0003, acc=0.9997, iter_time=6.79s]
Epoch 0: 23%|██▎ | 2829/12384 [6:00:11<20:16:20, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.41s]
Epoch 0: 23%|██▎ | 2830/12384 [6:00:11<20:18:49, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=6.41s]
Epoch 0: 23%|██▎ | 2830/12384 [6:00:19<20:18:49, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=10.03s]
Epoch 0: 23%|██▎ | 2831/12384 [6:00:19<20:16:39, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=10.03s]
Epoch 0: 23%|██▎ | 2831/12384 [6:00:26<20:16:39, 7.64s/it, loss=0.0016, acc=0.9949, iter_time=7.98s]
Epoch 0: 23%|██▎ | 2832/12384 [6:00:26<20:14:57, 7.63s/it, loss=0.0016, acc=0.9949, iter_time=7.98s]
Epoch 0: 23%|██▎ | 2832/12384 [6:00:34<20:14:57, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.24s]
Epoch 0: 23%|██▎ | 2833/12384 [6:00:34<20:13:27, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.24s]
Epoch 0: 23%|██▎ | 2833/12384 [6:00:42<20:13:27, 7.62s/it, loss=0.0003, acc=0.9993, iter_time=7.61s]
Epoch 0: 23%|██▎ | 2834/12384 [6:00:42<20:13:19, 7.62s/it, loss=0.0003, acc=0.9993, iter_time=7.61s]
Epoch 0: 23%|██▎ | 2834/12384 [6:00:49<20:13:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 0: 23%|██▎ | 2835/12384 [6:00:49<20:11:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 0: 23%|██▎ | 2835/12384 [6:00:57<20:11:49, 7.61s/it, loss=0.0004, acc=0.9999, iter_time=10.89s]
Epoch 0: 23%|██▎ | 2836/12384 [6:00:57<20:11:25, 7.61s/it, loss=0.0004, acc=0.9999, iter_time=10.89s]
Epoch 0: 23%|██▎ | 2836/12384 [6:01:05<20:11:25, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.85s]
Epoch 0: 23%|██▎ | 2837/12384 [6:01:05<20:11:47, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.85s]
Epoch 0: 23%|██▎ | 2837/12384 [6:01:12<20:11:47, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.83s]
Epoch 0: 23%|██▎ | 2838/12384 [6:01:12<20:11:42, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.83s]
Epoch 0: 23%|██▎ | 2838/12384 [6:01:20<20:11:42, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=10.39s]
Epoch 0: 23%|██▎ | 2839/12384 [6:01:20<20:11:48, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=10.39s]
Epoch 0: 23%|██▎ | 2839/12384 [6:01:27<20:11:48, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.03s]
Epoch 0: 23%|██▎ | 2840/12384 [6:01:27<20:11:13, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.03s]
Epoch 0: 23%|██▎ | 2840/12384 [6:01:35<20:11:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.17s]
Epoch 0: 23%|██▎ | 2841/12384 [6:01:35<20:10:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.17s]
Epoch 0: 23%|██▎ | 2841/12384 [6:01:43<20:10:56, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=10.63s]
Epoch 0: 23%|██▎ | 2842/12384 [6:01:43<20:15:45, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=10.63s]
Epoch 0: 23%|██▎ | 2842/12384 [6:01:50<20:15:45, 7.64s/it, loss=0.0014, acc=0.9968, iter_time=5.40s]
Epoch 0: 23%|██▎ | 2843/12384 [6:01:50<20:14:31, 7.64s/it, loss=0.0014, acc=0.9968, iter_time=5.40s]
Epoch 0: 23%|██▎ | 2843/12384 [6:01:58<20:14:31, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=9.96s]
Epoch 0: 23%|██▎ | 2844/12384 [6:01:58<20:14:17, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=9.96s]
Epoch 0: 23%|██▎ | 2844/12384 [6:02:06<20:14:17, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 23%|██▎ | 2845/12384 [6:02:06<20:12:03, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 23%|██▎ | 2845/12384 [6:02:13<20:12:03, 7.62s/it, loss=0.0004, acc=0.9999, iter_time=7.90s]
Epoch 0: 23%|██▎ | 2846/12384 [6:02:13<20:24:39, 7.70s/it, loss=0.0004, acc=0.9999, iter_time=7.90s]
Epoch 0: 23%|██▎ | 2846/12384 [6:02:21<20:24:39, 7.70s/it, loss=0.0007, acc=0.9982, iter_time=6.47s]
Epoch 0: 23%|██▎ | 2847/12384 [6:02:21<20:20:45, 7.68s/it, loss=0.0007, acc=0.9982, iter_time=6.47s]
Epoch 0: 23%|██▎ | 2847/12384 [6:02:29<20:20:45, 7.68s/it, loss=0.0001, acc=0.9997, iter_time=9.20s]
Epoch 0: 23%|██▎ | 2848/12384 [6:02:29<20:34:02, 7.76s/it, loss=0.0001, acc=0.9997, iter_time=9.20s]
Epoch 0: 23%|██▎ | 2848/12384 [6:02:37<20:34:02, 7.76s/it, loss=0.0001, acc=1.0000, iter_time=7.50s]
Epoch 0: 23%|██▎ | 2849/12384 [6:02:37<20:27:00, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=7.50s]
Epoch 0: 23%|██▎ | 2849/12384 [6:02:44<20:27:00, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 0: 23%|██▎ | 2850/12384 [6:02:44<20:21:54, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 0: 23%|██▎ | 2850/12384 [6:02:52<20:21:54, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=5.11s]
Epoch 0: 23%|██▎ | 2851/12384 [6:02:52<20:18:20, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=5.11s]
Epoch 0: 23%|██▎ | 2851/12384 [6:03:00<20:18:20, 7.67s/it, loss=0.0045, acc=0.9978, iter_time=9.79s]
Epoch 0: 23%|██▎ | 2852/12384 [6:03:00<20:19:14, 7.67s/it, loss=0.0045, acc=0.9978, iter_time=9.79s]
Epoch 0: 23%|██▎ | 2852/12384 [6:03:07<20:19:14, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 0: 23%|██▎ | 2853/12384 [6:03:07<20:14:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 0: 23%|██▎ | 2853/12384 [6:03:15<20:14:40, 7.65s/it, loss=0.0013, acc=0.9952, iter_time=9.05s]
Epoch 0: 23%|██▎ | 2854/12384 [6:03:15<20:12:51, 7.64s/it, loss=0.0013, acc=0.9952, iter_time=9.05s]
Epoch 0: 23%|██▎ | 2854/12384 [6:03:22<20:12:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 0: 23%|██▎ | 2855/12384 [6:03:22<20:11:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 0: 23%|██▎ | 2855/12384 [6:03:30<20:11:56, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=9.82s]
Epoch 0: 23%|██▎ | 2856/12384 [6:03:30<20:10:01, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=9.82s]
Epoch 0: 23%|██▎ | 2856/12384 [6:03:38<20:10:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 23%|██▎ | 2857/12384 [6:03:38<20:08:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 23%|██▎ | 2857/12384 [6:03:45<20:08:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 23%|██▎ | 2858/12384 [6:03:45<20:07:24, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 23%|██▎ | 2858/12384 [6:03:53<20:07:24, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 23%|██▎ | 2859/12384 [6:03:53<20:08:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 23%|██▎ | 2859/12384 [6:04:00<20:08:16, 7.61s/it, loss=0.0002, acc=0.9983, iter_time=3.90s]
Epoch 0: 23%|██▎ | 2860/12384 [6:04:00<20:07:05, 7.60s/it, loss=0.0002, acc=0.9983, iter_time=3.90s]
Epoch 0: 23%|██▎ | 2860/12384 [6:04:08<20:07:05, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=9.24s]
Epoch 0: 23%|██▎ | 2861/12384 [6:04:08<20:07:50, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.24s]
Epoch 0: 23%|██▎ | 2861/12384 [6:04:16<20:07:50, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.70s]
Epoch 0: 23%|██▎ | 2862/12384 [6:04:16<20:12:12, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=9.70s]
Epoch 0: 23%|██▎ | 2862/12384 [6:04:23<20:12:12, 7.64s/it, loss=0.0006, acc=0.9985, iter_time=7.72s]
Epoch 0: 23%|██▎ | 2863/12384 [6:04:23<20:10:54, 7.63s/it, loss=0.0006, acc=0.9985, iter_time=7.72s]
Epoch 0: 23%|██▎ | 2863/12384 [6:04:31<20:10:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 23%|██▎ | 2864/12384 [6:04:31<20:09:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 23%|██▎ | 2864/12384 [6:04:39<20:09:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 23%|██▎ | 2865/12384 [6:04:39<20:09:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 23%|██▎ | 2865/12384 [6:04:46<20:09:25, 7.62s/it, loss=0.0002, acc=0.9989, iter_time=7.64s]
Epoch 0: 23%|██▎ | 2866/12384 [6:04:46<20:09:07, 7.62s/it, loss=0.0002, acc=0.9989, iter_time=7.64s]
Epoch 0: 23%|██▎ | 2866/12384 [6:04:54<20:09:07, 7.62s/it, loss=0.0004, acc=0.9979, iter_time=7.62s]
Epoch 0: 23%|██▎ | 2867/12384 [6:04:54<20:11:01, 7.63s/it, loss=0.0004, acc=0.9979, iter_time=7.62s]
Epoch 0: 23%|██▎ | 2867/12384 [6:05:01<20:11:01, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 23%|██▎ | 2868/12384 [6:05:01<20:09:33, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 23%|██▎ | 2868/12384 [6:05:09<20:09:33, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 23%|██▎ | 2869/12384 [6:05:09<20:09:52, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 23%|██▎ | 2869/12384 [6:05:17<20:09:52, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 23%|██▎ | 2870/12384 [6:05:17<20:08:57, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 23%|██▎ | 2870/12384 [6:05:24<20:08:57, 7.62s/it, loss=0.0001, acc=0.9995, iter_time=5.62s]
Epoch 0: 23%|██▎ | 2871/12384 [6:05:24<20:08:09, 7.62s/it, loss=0.0001, acc=0.9995, iter_time=5.62s]
Epoch 0: 23%|██▎ | 2871/12384 [6:05:32<20:08:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.56s]
Epoch 0: 23%|██▎ | 2872/12384 [6:05:32<20:07:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.56s]
Epoch 0: 23%|██▎ | 2872/12384 [6:05:40<20:07:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 0: 23%|██▎ | 2873/12384 [6:05:40<20:10:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 0: 23%|██▎ | 2873/12384 [6:05:48<20:10:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.83s]
Epoch 0: 23%|██▎ | 2874/12384 [6:05:48<20:24:22, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.83s]
Epoch 0: 23%|██▎ | 2874/12384 [6:05:55<20:24:22, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 23%|██▎ | 2875/12384 [6:05:55<20:19:38, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 23%|██▎ | 2875/12384 [6:06:03<20:19:38, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=5.04s]
Epoch 0: 23%|██▎ | 2876/12384 [6:06:03<20:15:56, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=5.04s]
Epoch 0: 23%|██▎ | 2876/12384 [6:06:10<20:15:56, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=9.61s]
Epoch 0: 23%|██▎ | 2877/12384 [6:06:10<20:13:14, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=9.61s]
Epoch 0: 23%|██▎ | 2877/12384 [6:06:18<20:13:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 0: 23%|██▎ | 2878/12384 [6:06:18<20:10:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 0: 23%|██▎ | 2878/12384 [6:06:26<20:10:17, 7.64s/it, loss=0.0009, acc=0.9983, iter_time=5.81s]
Epoch 0: 23%|██▎ | 2879/12384 [6:06:26<20:08:15, 7.63s/it, loss=0.0009, acc=0.9983, iter_time=5.81s]
Epoch 0: 23%|██▎ | 2879/12384 [6:06:33<20:08:15, 7.63s/it, loss=0.0005, acc=0.9980, iter_time=9.77s]
Epoch 0: 23%|██▎ | 2880/12384 [6:06:33<20:06:51, 7.62s/it, loss=0.0005, acc=0.9980, iter_time=9.77s]
Epoch 0: 23%|██▎ | 2880/12384 [6:06:41<20:06:51, 7.62s/it, loss=0.0004, acc=1.0000, iter_time=3.23s]
Epoch 0: 23%|██▎ | 2881/12384 [6:06:41<20:07:04, 7.62s/it, loss=0.0004, acc=1.0000, iter_time=3.23s]
Epoch 0: 23%|██▎ | 2881/12384 [6:06:48<20:07:04, 7.62s/it, loss=0.0006, acc=0.9989, iter_time=11.61s]
Epoch 0: 23%|██▎ | 2882/12384 [6:06:48<20:06:18, 7.62s/it, loss=0.0006, acc=0.9989, iter_time=11.61s]
Epoch 0: 23%|██▎ | 2882/12384 [6:06:56<20:06:18, 7.62s/it, loss=0.0005, acc=0.9982, iter_time=7.62s]
Epoch 0: 23%|██▎ | 2883/12384 [6:06:56<20:05:35, 7.61s/it, loss=0.0005, acc=0.9982, iter_time=7.62s]
Epoch 0: 23%|██▎ | 2883/12384 [6:07:04<20:05:35, 7.61s/it, loss=0.0004, acc=0.9985, iter_time=7.61s]
Epoch 0: 23%|██▎ | 2884/12384 [6:07:04<20:06:02, 7.62s/it, loss=0.0004, acc=0.9985, iter_time=7.61s]
Epoch 0: 23%|██▎ | 2884/12384 [6:07:11<20:06:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 0: 23%|██▎ | 2885/12384 [6:07:11<20:05:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 0: 23%|██▎ | 2885/12384 [6:07:19<20:05:31, 7.61s/it, loss=0.0005, acc=0.9983, iter_time=5.05s]
Epoch 0: 23%|██▎ | 2886/12384 [6:07:19<20:04:30, 7.61s/it, loss=0.0005, acc=0.9983, iter_time=5.05s]
Epoch 0: 23%|██▎ | 2886/12384 [6:07:26<20:04:30, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.88s]
Epoch 0: 23%|██▎ | 2887/12384 [6:07:26<20:03:35, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.88s]
Epoch 0: 23%|██▎ | 2887/12384 [6:07:34<20:03:35, 7.60s/it, loss=0.0016, acc=0.9949, iter_time=10.13s]
Epoch 0: 23%|██▎ | 2888/12384 [6:07:34<20:04:31, 7.61s/it, loss=0.0016, acc=0.9949, iter_time=10.13s]
Epoch 0: 23%|██▎ | 2888/12384 [6:07:42<20:04:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 23%|██▎ | 2889/12384 [6:07:42<20:07:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 23%|██▎ | 2889/12384 [6:07:49<20:07:38, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.70s]
Epoch 0: 23%|██▎ | 2890/12384 [6:07:49<20:06:00, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.70s]
Epoch 0: 23%|██▎ | 2890/12384 [6:07:57<20:06:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 23%|██▎ | 2891/12384 [6:07:57<20:05:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 23%|██▎ | 2891/12384 [6:08:05<20:05:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 23%|██▎ | 2892/12384 [6:08:05<20:03:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 23%|██▎ | 2892/12384 [6:08:12<20:03:58, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 23%|██▎ | 2893/12384 [6:08:12<20:03:27, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 23%|██▎ | 2893/12384 [6:08:20<20:03:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 0: 23%|██▎ | 2894/12384 [6:08:20<20:03:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 0: 23%|██▎ | 2894/12384 [6:08:27<20:03:33, 7.61s/it, loss=0.0012, acc=0.9976, iter_time=9.60s]
Epoch 0: 23%|██▎ | 2895/12384 [6:08:27<20:03:31, 7.61s/it, loss=0.0012, acc=0.9976, iter_time=9.60s]
Epoch 0: 23%|██▎ | 2895/12384 [6:08:35<20:03:31, 7.61s/it, loss=0.0008, acc=0.9971, iter_time=7.58s]
Epoch 0: 23%|██▎ | 2896/12384 [6:08:35<20:03:37, 7.61s/it, loss=0.0008, acc=0.9971, iter_time=7.58s]
Epoch 0: 23%|██▎ | 2896/12384 [6:08:43<20:03:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 23%|██▎ | 2897/12384 [6:08:43<20:04:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 23%|██▎ | 2897/12384 [6:08:50<20:04:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.63s]
Epoch 0: 23%|██▎ | 2898/12384 [6:08:50<20:03:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.63s]
Epoch 0: 23%|██▎ | 2898/12384 [6:08:58<20:03:16, 7.61s/it, loss=0.0001, acc=0.9996, iter_time=9.62s]
Epoch 0: 23%|██▎ | 2899/12384 [6:08:58<20:02:44, 7.61s/it, loss=0.0001, acc=0.9996, iter_time=9.62s]
Epoch 0: 23%|██▎ | 2899/12384 [6:09:05<20:02:44, 7.61s/it, loss=0.0009, acc=0.9984, iter_time=8.00s]
Epoch 0: 23%|██▎ | 2900/12384 [6:09:05<20:02:45, 7.61s/it, loss=0.0009, acc=0.9984, iter_time=8.00s]
Epoch 0: 23%|██▎ | 2900/12384 [6:09:13<20:02:45, 7.61s/it, loss=0.0012, acc=0.9950, iter_time=7.26s]
Epoch 0: 23%|██▎ | 2901/12384 [6:09:13<20:19:10, 7.71s/it, loss=0.0012, acc=0.9950, iter_time=7.26s]
Epoch 0: 23%|██▎ | 2901/12384 [6:09:21<20:19:10, 7.71s/it, loss=0.0014, acc=0.9958, iter_time=4.55s]
Epoch 0: 23%|██▎ | 2902/12384 [6:09:21<20:14:02, 7.68s/it, loss=0.0014, acc=0.9958, iter_time=4.55s]
Epoch 0: 23%|██▎ | 2902/12384 [6:09:29<20:14:02, 7.68s/it, loss=0.0001, acc=0.9998, iter_time=9.16s]
Epoch 0: 23%|██▎ | 2903/12384 [6:09:29<20:11:37, 7.67s/it, loss=0.0001, acc=0.9998, iter_time=9.16s]
Epoch 0: 23%|██▎ | 2903/12384 [6:09:36<20:11:37, 7.67s/it, loss=0.0002, acc=0.9999, iter_time=9.83s]
Epoch 0: 23%|██▎ | 2904/12384 [6:09:36<20:09:15, 7.65s/it, loss=0.0002, acc=0.9999, iter_time=9.83s]
Epoch 0: 23%|██▎ | 2904/12384 [6:09:44<20:09:15, 7.65s/it, loss=0.0001, acc=0.9999, iter_time=7.23s]
Epoch 0: 23%|██▎ | 2905/12384 [6:09:44<20:08:10, 7.65s/it, loss=0.0001, acc=0.9999, iter_time=7.23s]
Epoch 0: 23%|██▎ | 2905/12384 [6:09:51<20:08:10, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 23%|██▎ | 2906/12384 [6:09:51<20:05:29, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 23%|██▎ | 2906/12384 [6:09:59<20:05:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 23%|██▎ | 2907/12384 [6:09:59<20:06:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 23%|██▎ | 2907/12384 [6:10:07<20:06:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 23%|██▎ | 2908/12384 [6:10:07<20:05:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 23%|██▎ | 2908/12384 [6:10:14<20:05:17, 7.63s/it, loss=0.0002, acc=0.9998, iter_time=5.28s]
Epoch 0: 23%|██▎ | 2909/12384 [6:10:14<20:03:05, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=5.28s]
Epoch 0: 23%|██▎ | 2909/12384 [6:10:22<20:03:05, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.92s]
Epoch 0: 23%|██▎ | 2910/12384 [6:10:22<20:01:36, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.92s]
Epoch 0: 23%|██▎ | 2910/12384 [6:10:30<20:01:36, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 24%|██▎ | 2911/12384 [6:10:30<20:02:08, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 24%|██▎ | 2911/12384 [6:10:37<20:02:08, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=8.00s]
Epoch 0: 24%|██▎ | 2912/12384 [6:10:37<20:02:18, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=8.00s]
Epoch 0: 24%|██▎ | 2912/12384 [6:10:45<20:02:18, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.65s]
Epoch 0: 24%|██▎ | 2913/12384 [6:10:45<20:01:45, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.65s]
Epoch 0: 24%|██▎ | 2913/12384 [6:10:52<20:01:45, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.18s]
Epoch 0: 24%|██▎ | 2914/12384 [6:10:52<20:00:57, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.18s]
Epoch 0: 24%|██▎ | 2914/12384 [6:11:00<20:00:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 24%|██▎ | 2915/12384 [6:11:00<20:00:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 24%|██▎ | 2915/12384 [6:11:08<20:00:54, 7.61s/it, loss=0.0008, acc=0.9974, iter_time=4.84s]
Epoch 0: 24%|██▎ | 2916/12384 [6:11:08<20:01:21, 7.61s/it, loss=0.0008, acc=0.9974, iter_time=4.84s]
Epoch 0: 24%|██▎ | 2916/12384 [6:11:15<20:01:21, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.08s]
Epoch 0: 24%|██▎ | 2917/12384 [6:11:15<20:00:26, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.08s]
Epoch 0: 24%|██▎ | 2917/12384 [6:11:23<20:00:26, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.39s]
Epoch 0: 24%|██▎ | 2918/12384 [6:11:23<19:59:43, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.39s]
Epoch 0: 24%|██▎ | 2918/12384 [6:11:30<19:59:43, 7.60s/it, loss=0.0002, acc=1.0000, iter_time=9.57s]
Epoch 0: 24%|██▎ | 2919/12384 [6:11:30<19:58:38, 7.60s/it, loss=0.0002, acc=1.0000, iter_time=9.57s]
Epoch 0: 24%|██▎ | 2919/12384 [6:11:38<19:58:38, 7.60s/it, loss=0.0003, acc=1.0000, iter_time=9.48s]
Epoch 0: 24%|██▎ | 2920/12384 [6:11:38<19:58:06, 7.60s/it, loss=0.0003, acc=1.0000, iter_time=9.48s]
Epoch 0: 24%|██▎ | 2920/12384 [6:11:46<19:58:06, 7.60s/it, loss=0.0013, acc=0.9940, iter_time=4.19s]
Epoch 0: 24%|██▎ | 2921/12384 [6:11:46<19:58:54, 7.60s/it, loss=0.0013, acc=0.9940, iter_time=4.19s]
Epoch 0: 24%|██▎ | 2921/12384 [6:11:53<19:58:54, 7.60s/it, loss=0.0005, acc=0.9996, iter_time=10.65s]
Epoch 0: 24%|██▎ | 2922/12384 [6:11:53<19:58:20, 7.60s/it, loss=0.0005, acc=0.9996, iter_time=10.65s]
Epoch 0: 24%|██▎ | 2922/12384 [6:12:01<19:58:20, 7.60s/it, loss=0.0007, acc=0.9990, iter_time=6.96s]
Epoch 0: 24%|██▎ | 2923/12384 [6:12:01<19:57:56, 7.60s/it, loss=0.0007, acc=0.9990, iter_time=6.96s]
Epoch 0: 24%|██▎ | 2923/12384 [6:12:08<19:57:56, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=6.18s]
Epoch 0: 24%|██▎ | 2924/12384 [6:12:08<19:58:01, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=6.18s]
Epoch 0: 24%|██▎ | 2924/12384 [6:12:16<19:58:01, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=9.64s]
Epoch 0: 24%|██▎ | 2925/12384 [6:12:16<19:58:28, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=9.64s]
Epoch 0: 24%|██▎ | 2925/12384 [6:12:24<19:58:28, 7.60s/it, loss=0.0002, acc=0.9992, iter_time=7.62s]
Epoch 0: 24%|██▎ | 2926/12384 [6:12:24<19:58:40, 7.60s/it, loss=0.0002, acc=0.9992, iter_time=7.62s]
Epoch 0: 24%|██▎ | 2926/12384 [6:12:32<19:58:40, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 24%|██▎ | 2927/12384 [6:12:32<20:16:05, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 24%|██▎ | 2927/12384 [6:12:39<20:16:05, 7.72s/it, loss=0.0002, acc=0.9988, iter_time=8.33s]
Epoch 0: 24%|██▎ | 2928/12384 [6:12:39<20:10:28, 7.68s/it, loss=0.0002, acc=0.9988, iter_time=8.33s]
Epoch 0: 24%|██▎ | 2928/12384 [6:12:47<20:10:28, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=3.17s]
Epoch 0: 24%|██▎ | 2929/12384 [6:12:47<20:07:07, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=3.17s]
Epoch 0: 24%|██▎ | 2929/12384 [6:12:54<20:07:07, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=11.66s]
Epoch 0: 24%|██▎ | 2930/12384 [6:12:54<20:05:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.66s]
Epoch 0: 24%|██▎ | 2930/12384 [6:13:02<20:05:15, 7.65s/it, loss=0.0016, acc=0.9959, iter_time=7.63s]
Epoch 0: 24%|██▎ | 2931/12384 [6:13:02<20:02:50, 7.63s/it, loss=0.0016, acc=0.9959, iter_time=7.63s]
Epoch 0: 24%|██▎ | 2931/12384 [6:13:10<20:02:50, 7.63s/it, loss=0.0004, acc=0.9979, iter_time=7.60s]
Epoch 0: 24%|██▎ | 2932/12384 [6:13:10<20:00:40, 7.62s/it, loss=0.0004, acc=0.9979, iter_time=7.60s]
Epoch 0: 24%|██▎ | 2932/12384 [6:13:17<20:00:40, 7.62s/it, loss=0.0005, acc=0.9995, iter_time=7.58s]
Epoch 0: 24%|██▎ | 2933/12384 [6:13:17<19:59:16, 7.61s/it, loss=0.0005, acc=0.9995, iter_time=7.58s]
Epoch 0: 24%|██▎ | 2933/12384 [6:13:25<19:59:16, 7.61s/it, loss=0.0003, acc=0.9998, iter_time=7.61s]
Epoch 0: 24%|██▎ | 2934/12384 [6:13:25<19:59:27, 7.62s/it, loss=0.0003, acc=0.9998, iter_time=7.61s]
Epoch 0: 24%|██▎ | 2934/12384 [6:13:32<19:59:27, 7.62s/it, loss=0.0003, acc=0.9998, iter_time=6.43s]
Epoch 0: 24%|██▎ | 2935/12384 [6:13:32<19:58:43, 7.61s/it, loss=0.0003, acc=0.9998, iter_time=6.43s]
Epoch 0: 24%|██▎ | 2935/12384 [6:13:40<19:58:43, 7.61s/it, loss=0.0012, acc=0.9980, iter_time=9.17s]
Epoch 0: 24%|██▎ | 2936/12384 [6:13:40<20:02:31, 7.64s/it, loss=0.0012, acc=0.9980, iter_time=9.17s]
Epoch 0: 24%|██▎ | 2936/12384 [6:13:48<20:02:31, 7.64s/it, loss=0.0043, acc=0.9953, iter_time=4.72s]
Epoch 0: 24%|██▎ | 2937/12384 [6:13:48<20:00:58, 7.63s/it, loss=0.0043, acc=0.9953, iter_time=4.72s]
Epoch 0: 24%|██▎ | 2937/12384 [6:13:55<20:00:58, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.27s]
Epoch 0: 24%|██▎ | 2938/12384 [6:13:55<19:59:33, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.27s]
Epoch 0: 24%|██▎ | 2938/12384 [6:14:03<19:59:33, 7.62s/it, loss=0.0002, acc=0.9999, iter_time=8.56s]
Epoch 0: 24%|██▎ | 2939/12384 [6:14:03<19:59:56, 7.62s/it, loss=0.0002, acc=0.9999, iter_time=8.56s]
Epoch 0: 24%|██▎ | 2939/12384 [6:14:11<19:59:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 0: 24%|██▎ | 2940/12384 [6:14:11<19:59:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 0: 24%|██▎ | 2940/12384 [6:14:18<19:59:37, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.84s]
Epoch 0: 24%|██▎ | 2941/12384 [6:14:18<19:58:55, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.84s]
Epoch 0: 24%|██▎ | 2941/12384 [6:14:26<19:58:55, 7.62s/it, loss=0.0018, acc=0.9962, iter_time=7.60s]
Epoch 0: 24%|██▍ | 2942/12384 [6:14:26<19:57:07, 7.61s/it, loss=0.0018, acc=0.9962, iter_time=7.60s]
Epoch 0: 24%|██▍ | 2942/12384 [6:14:33<19:57:07, 7.61s/it, loss=0.0006, acc=0.9980, iter_time=4.45s]
Epoch 0: 24%|██▍ | 2943/12384 [6:14:33<19:56:19, 7.60s/it, loss=0.0006, acc=0.9980, iter_time=4.45s]
Epoch 0: 24%|██▍ | 2943/12384 [6:14:41<19:56:19, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=11.10s]
Epoch 0: 24%|██▍ | 2944/12384 [6:14:41<19:56:39, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=11.10s]
Epoch 0: 24%|██▍ | 2944/12384 [6:14:49<19:56:39, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=3.20s]
Epoch 0: 24%|██▍ | 2945/12384 [6:14:49<19:56:23, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=3.20s]
Epoch 0: 24%|██▍ | 2945/12384 [6:14:56<19:56:23, 7.61s/it, loss=0.0013, acc=0.9959, iter_time=8.78s]
Epoch 0: 24%|██▍ | 2946/12384 [6:14:56<19:55:25, 7.60s/it, loss=0.0013, acc=0.9959, iter_time=8.78s]
Epoch 0: 24%|██▍ | 2946/12384 [6:15:04<19:55:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 0: 24%|██▍ | 2947/12384 [6:15:04<19:57:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 0: 24%|██▍ | 2947/12384 [6:15:11<19:57:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 0: 24%|██▍ | 2948/12384 [6:15:11<19:57:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 0: 24%|██▍ | 2948/12384 [6:15:19<19:57:29, 7.61s/it, loss=0.0006, acc=0.9987, iter_time=7.63s]
Epoch 0: 24%|██▍ | 2949/12384 [6:15:19<19:56:38, 7.61s/it, loss=0.0006, acc=0.9987, iter_time=7.63s]
Epoch 0: 24%|██▍ | 2949/12384 [6:15:27<19:56:38, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=8.01s]
Epoch 0: 24%|██▍ | 2950/12384 [6:15:27<19:56:48, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=8.01s]
Epoch 0: 24%|██▍ | 2950/12384 [6:15:34<19:56:48, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.17s]
Epoch 0: 24%|██▍ | 2951/12384 [6:15:34<19:56:23, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.17s]
Epoch 0: 24%|██▍ | 2951/12384 [6:15:42<19:56:23, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.05s]
Epoch 0: 24%|██▍ | 2952/12384 [6:15:42<19:56:22, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.05s]
Epoch 0: 24%|██▍ | 2952/12384 [6:15:50<19:56:22, 7.61s/it, loss=0.0002, acc=0.9998, iter_time=7.25s]
Epoch 0: 24%|██▍ | 2953/12384 [6:15:50<20:11:51, 7.71s/it, loss=0.0002, acc=0.9998, iter_time=7.25s]
Epoch 0: 24%|██▍ | 2953/12384 [6:15:57<20:11:51, 7.71s/it, loss=0.0007, acc=0.9975, iter_time=7.89s]
Epoch 0: 24%|██▍ | 2954/12384 [6:15:57<20:05:59, 7.67s/it, loss=0.0007, acc=0.9975, iter_time=7.89s]
Epoch 0: 24%|██▍ | 2954/12384 [6:16:05<20:05:59, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 24%|██▍ | 2955/12384 [6:16:05<20:04:00, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 24%|██▍ | 2955/12384 [6:16:13<20:04:00, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 24%|██▍ | 2956/12384 [6:16:13<20:01:42, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 24%|██▍ | 2956/12384 [6:16:20<20:01:42, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=7.61s]
Epoch 0: 24%|██▍ | 2957/12384 [6:16:20<19:59:14, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.61s]
Epoch 0: 24%|██▍ | 2957/12384 [6:16:28<19:59:14, 7.63s/it, loss=0.0010, acc=0.9984, iter_time=7.71s]
Epoch 0: 24%|██▍ | 2958/12384 [6:16:28<20:02:34, 7.65s/it, loss=0.0010, acc=0.9984, iter_time=7.71s]
Epoch 0: 24%|██▍ | 2958/12384 [6:16:36<20:02:34, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=6.99s]
Epoch 0: 24%|██▍ | 2959/12384 [6:16:36<20:00:47, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=6.99s]
Epoch 0: 24%|██▍ | 2959/12384 [6:16:43<20:00:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.62s]
Epoch 0: 24%|██▍ | 2960/12384 [6:16:43<19:59:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.62s]
Epoch 0: 24%|██▍ | 2960/12384 [6:16:51<19:59:35, 7.64s/it, loss=0.0002, acc=0.9996, iter_time=5.14s]
Epoch 0: 24%|██▍ | 2961/12384 [6:16:51<19:56:26, 7.62s/it, loss=0.0002, acc=0.9996, iter_time=5.14s]
Epoch 0: 24%|██▍ | 2961/12384 [6:16:58<19:56:26, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.15s]
Epoch 0: 24%|██▍ | 2962/12384 [6:16:58<19:54:54, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.15s]
Epoch 0: 24%|██▍ | 2962/12384 [6:17:06<19:54:54, 7.61s/it, loss=0.0002, acc=0.9986, iter_time=10.11s]
Epoch 0: 24%|██▍ | 2963/12384 [6:17:06<20:00:13, 7.64s/it, loss=0.0002, acc=0.9986, iter_time=10.11s]
Epoch 0: 24%|██▍ | 2963/12384 [6:17:14<20:00:13, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.74s]
Epoch 0: 24%|██▍ | 2964/12384 [6:17:14<19:59:20, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.74s]
Epoch 0: 24%|██▍ | 2964/12384 [6:17:21<19:59:20, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=7.62s]
Epoch 0: 24%|██▍ | 2965/12384 [6:17:21<19:58:25, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=7.62s]
Epoch 0: 24%|██▍ | 2965/12384 [6:17:29<19:58:25, 7.63s/it, loss=0.0006, acc=0.9976, iter_time=7.62s]
Epoch 0: 24%|██▍ | 2966/12384 [6:17:29<19:56:33, 7.62s/it, loss=0.0006, acc=0.9976, iter_time=7.62s]
Epoch 0: 24%|██▍ | 2966/12384 [6:17:36<19:56:33, 7.62s/it, loss=0.0016, acc=0.9968, iter_time=7.60s]
Epoch 0: 24%|██▍ | 2967/12384 [6:17:36<19:55:05, 7.61s/it, loss=0.0016, acc=0.9968, iter_time=7.60s]
Epoch 0: 24%|██▍ | 2967/12384 [6:17:44<19:55:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 24%|██▍ | 2968/12384 [6:17:44<19:54:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 24%|██▍ | 2968/12384 [6:17:52<19:54:50, 7.61s/it, loss=0.0009, acc=0.9984, iter_time=7.23s]
Epoch 0: 24%|██▍ | 2969/12384 [6:17:52<19:54:48, 7.61s/it, loss=0.0009, acc=0.9984, iter_time=7.23s]
Epoch 0: 24%|██▍ | 2969/12384 [6:17:59<19:54:48, 7.61s/it, loss=0.0006, acc=0.9985, iter_time=7.61s]
Epoch 0: 24%|██▍ | 2970/12384 [6:17:59<19:53:52, 7.61s/it, loss=0.0006, acc=0.9985, iter_time=7.61s]
Epoch 0: 24%|██▍ | 2970/12384 [6:18:07<19:53:52, 7.61s/it, loss=0.0003, acc=0.9974, iter_time=4.54s]
Epoch 0: 24%|██▍ | 2971/12384 [6:18:07<19:52:49, 7.60s/it, loss=0.0003, acc=0.9974, iter_time=4.54s]
Epoch 0: 24%|██▍ | 2971/12384 [6:18:14<19:52:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 0: 24%|██▍ | 2972/12384 [6:18:14<19:52:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 0: 24%|██▍ | 2972/12384 [6:18:22<19:52:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.19s]
Epoch 0: 24%|██▍ | 2973/12384 [6:18:22<19:57:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.19s]
Epoch 0: 24%|██▍ | 2973/12384 [6:18:30<19:57:32, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.73s]
Epoch 0: 24%|██▍ | 2974/12384 [6:18:30<19:59:40, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.73s]
Epoch 0: 24%|██▍ | 2974/12384 [6:18:37<19:59:40, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=4.81s]
Epoch 0: 24%|██▍ | 2975/12384 [6:18:37<19:56:41, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=4.81s]
Epoch 0: 24%|██▍ | 2975/12384 [6:18:45<19:56:41, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=10.45s]
Epoch 0: 24%|██▍ | 2976/12384 [6:18:45<19:57:37, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=10.45s]
Epoch 0: 24%|██▍ | 2976/12384 [6:18:53<19:57:37, 7.64s/it, loss=0.0005, acc=0.9992, iter_time=7.96s]
Epoch 0: 24%|██▍ | 2977/12384 [6:18:53<20:09:23, 7.71s/it, loss=0.0005, acc=0.9992, iter_time=7.96s]
Epoch 0: 24%|██▍ | 2977/12384 [6:19:01<20:09:23, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=4.23s]
Epoch 0: 24%|██▍ | 2978/12384 [6:19:01<20:04:40, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=4.23s]
Epoch 0: 24%|██▍ | 2978/12384 [6:19:09<20:04:40, 7.68s/it, loss=0.0001, acc=0.9999, iter_time=11.03s]
Epoch 0: 24%|██▍ | 2979/12384 [6:19:09<20:16:22, 7.76s/it, loss=0.0001, acc=0.9999, iter_time=11.03s]
Epoch 0: 24%|██▍ | 2979/12384 [6:19:16<20:16:22, 7.76s/it, loss=0.0001, acc=0.9999, iter_time=7.88s]
Epoch 0: 24%|██▍ | 2980/12384 [6:19:16<20:08:14, 7.71s/it, loss=0.0001, acc=0.9999, iter_time=7.88s]
Epoch 0: 24%|██▍ | 2980/12384 [6:19:24<20:08:14, 7.71s/it, loss=0.0002, acc=1.0000, iter_time=5.86s]
Epoch 0: 24%|██▍ | 2981/12384 [6:19:24<20:04:07, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=5.86s]
Epoch 0: 24%|██▍ | 2981/12384 [6:19:31<20:04:07, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 0: 24%|██▍ | 2982/12384 [6:19:31<20:00:59, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 0: 24%|██▍ | 2982/12384 [6:19:39<20:00:59, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=9.10s]
Epoch 0: 24%|██▍ | 2983/12384 [6:19:39<19:58:42, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=9.10s]
Epoch 0: 24%|██▍ | 2983/12384 [6:19:47<19:58:42, 7.65s/it, loss=0.0002, acc=0.9992, iter_time=8.01s]
Epoch 0: 24%|██▍ | 2984/12384 [6:19:47<19:56:18, 7.64s/it, loss=0.0002, acc=0.9992, iter_time=8.01s]
Epoch 0: 24%|██▍ | 2984/12384 [6:19:54<19:56:18, 7.64s/it, loss=0.0005, acc=0.9985, iter_time=7.21s]
Epoch 0: 24%|██▍ | 2985/12384 [6:19:54<19:55:22, 7.63s/it, loss=0.0005, acc=0.9985, iter_time=7.21s]
Epoch 0: 24%|██▍ | 2985/12384 [6:20:02<19:55:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 24%|██▍ | 2986/12384 [6:20:02<19:54:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 24%|██▍ | 2986/12384 [6:20:09<19:54:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 24%|██▍ | 2987/12384 [6:20:09<19:53:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 24%|██▍ | 2987/12384 [6:20:17<19:53:26, 7.62s/it, loss=0.0003, acc=0.9993, iter_time=7.61s]
Epoch 0: 24%|██▍ | 2988/12384 [6:20:17<19:56:35, 7.64s/it, loss=0.0003, acc=0.9993, iter_time=7.61s]
Epoch 0: 24%|██▍ | 2988/12384 [6:20:25<19:56:35, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.69s]
Epoch 0: 24%|██▍ | 2989/12384 [6:20:25<19:54:35, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.69s]
Epoch 0: 24%|██▍ | 2989/12384 [6:20:32<19:54:35, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 24%|██▍ | 2990/12384 [6:20:32<19:53:28, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 24%|██▍ | 2990/12384 [6:20:40<19:53:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 24%|██▍ | 2991/12384 [6:20:40<19:52:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 24%|██▍ | 2991/12384 [6:20:48<19:52:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 24%|██▍ | 2992/12384 [6:20:48<19:52:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 24%|██▍ | 2992/12384 [6:20:55<19:52:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 24%|██▍ | 2993/12384 [6:20:55<19:51:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 24%|██▍ | 2993/12384 [6:21:03<19:51:39, 7.61s/it, loss=0.0002, acc=0.9996, iter_time=5.10s]
Epoch 0: 24%|██▍ | 2994/12384 [6:21:03<19:55:07, 7.64s/it, loss=0.0002, acc=0.9996, iter_time=5.10s]
Epoch 0: 24%|██▍ | 2994/12384 [6:21:11<19:55:07, 7.64s/it, loss=0.0007, acc=0.9980, iter_time=10.21s]
Epoch 0: 24%|██▍ | 2995/12384 [6:21:11<19:54:17, 7.63s/it, loss=0.0007, acc=0.9980, iter_time=10.21s]
Epoch 0: 24%|██▍ | 2995/12384 [6:21:18<19:54:17, 7.63s/it, loss=0.0018, acc=0.9980, iter_time=7.32s]
Epoch 0: 24%|██▍ | 2996/12384 [6:21:18<19:53:50, 7.63s/it, loss=0.0018, acc=0.9980, iter_time=7.32s]
Epoch 0: 24%|██▍ | 2996/12384 [6:21:26<19:53:50, 7.63s/it, loss=0.0003, acc=0.9980, iter_time=7.93s]
Epoch 0: 24%|██▍ | 2997/12384 [6:21:26<19:56:10, 7.65s/it, loss=0.0003, acc=0.9980, iter_time=7.93s]
Epoch 0: 24%|██▍ | 2997/12384 [6:21:33<19:56:10, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.68s]
Epoch 0: 24%|██▍ | 2998/12384 [6:21:33<19:53:55, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.68s]
Epoch 0: 24%|██▍ | 2998/12384 [6:21:41<19:53:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 0: 24%|██▍ | 2999/12384 [6:21:41<19:52:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 0: 24%|██▍ | 2999/12384 [6:21:49<19:52:19, 7.62s/it, loss=0.0006, acc=0.9993, iter_time=8.66s]
Epoch 0: 24%|██▍ | 3000/12384 [6:21:49<20:00:53, 7.68s/it, loss=0.0006, acc=0.9993, iter_time=8.66s]
Epoch 0: 24%|██▍ | 3000/12384 [6:21:56<20:00:53, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 0: 24%|██▍ | 3001/12384 [6:21:56<19:58:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 0: 24%|██▍ | 3001/12384 [6:22:04<19:58:03, 7.66s/it, loss=0.0009, acc=0.9974, iter_time=7.59s]
Epoch 0: 24%|██▍ | 3002/12384 [6:22:04<19:55:31, 7.65s/it, loss=0.0009, acc=0.9974, iter_time=7.59s]
Epoch 0: 24%|██▍ | 3002/12384 [6:22:12<19:55:31, 7.65s/it, loss=0.0006, acc=0.9978, iter_time=9.03s]
Epoch 0: 24%|██▍ | 3003/12384 [6:22:12<19:52:59, 7.63s/it, loss=0.0006, acc=0.9978, iter_time=9.03s]
Epoch 0: 24%|██▍ | 3003/12384 [6:22:19<19:52:59, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=6.46s]
Epoch 0: 24%|██▍ | 3004/12384 [6:22:19<19:52:23, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=6.46s]
Epoch 0: 24%|██▍ | 3004/12384 [6:22:27<19:52:23, 7.63s/it, loss=0.0005, acc=0.9990, iter_time=9.74s]
Epoch 0: 24%|██▍ | 3005/12384 [6:22:27<20:07:09, 7.72s/it, loss=0.0005, acc=0.9990, iter_time=9.74s]
Epoch 0: 24%|██▍ | 3005/12384 [6:22:35<20:07:09, 7.72s/it, loss=0.0013, acc=0.9976, iter_time=7.90s]
Epoch 0: 24%|██▍ | 3006/12384 [6:22:35<20:01:22, 7.69s/it, loss=0.0013, acc=0.9976, iter_time=7.90s]
Epoch 0: 24%|██▍ | 3006/12384 [6:22:42<20:01:22, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=6.97s]
Epoch 0: 24%|██▍ | 3007/12384 [6:22:42<20:00:35, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=6.97s]
Epoch 0: 24%|██▍ | 3007/12384 [6:22:50<20:00:35, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=8.70s]
Epoch 0: 24%|██▍ | 3008/12384 [6:22:50<19:57:51, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=8.70s]
Epoch 0: 24%|██▍ | 3008/12384 [6:22:58<19:57:51, 7.67s/it, loss=0.0004, acc=0.9998, iter_time=5.78s]
Epoch 0: 24%|██▍ | 3009/12384 [6:22:58<19:53:38, 7.64s/it, loss=0.0004, acc=0.9998, iter_time=5.78s]
Epoch 0: 24%|██▍ | 3009/12384 [6:23:05<19:53:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.01s]
Epoch 0: 24%|██▍ | 3010/12384 [6:23:05<19:51:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.01s]
Epoch 0: 24%|██▍ | 3010/12384 [6:23:13<19:51:15, 7.62s/it, loss=0.0007, acc=0.9998, iter_time=6.98s]
Epoch 0: 24%|██▍ | 3011/12384 [6:23:13<19:49:27, 7.61s/it, loss=0.0007, acc=0.9998, iter_time=6.98s]
Epoch 0: 24%|██▍ | 3011/12384 [6:23:20<19:49:27, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.21s]
Epoch 0: 24%|██▍ | 3012/12384 [6:23:20<19:48:25, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.21s]
Epoch 0: 24%|██▍ | 3012/12384 [6:23:28<19:48:25, 7.61s/it, loss=0.0098, acc=0.9923, iter_time=4.21s]
Epoch 0: 24%|██▍ | 3013/12384 [6:23:28<19:48:48, 7.61s/it, loss=0.0098, acc=0.9923, iter_time=4.21s]
Epoch 0: 24%|██▍ | 3013/12384 [6:23:36<19:48:48, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=7.65s]
Epoch 0: 24%|██▍ | 3014/12384 [6:23:36<19:50:36, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=7.65s]
Epoch 0: 24%|██▍ | 3014/12384 [6:23:43<19:50:36, 7.62s/it, loss=0.0005, acc=0.9998, iter_time=11.00s]
Epoch 0: 24%|██▍ | 3015/12384 [6:23:43<19:49:34, 7.62s/it, loss=0.0005, acc=0.9998, iter_time=11.00s]
Epoch 0: 24%|██▍ | 3015/12384 [6:23:51<19:49:34, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=8.09s]
Epoch 0: 24%|██▍ | 3016/12384 [6:23:51<19:52:33, 7.64s/it, loss=0.0002, acc=0.9998, iter_time=8.09s]
Epoch 0: 24%|██▍ | 3016/12384 [6:23:59<19:52:33, 7.64s/it, loss=0.0006, acc=0.9968, iter_time=7.21s]
Epoch 0: 24%|██▍ | 3017/12384 [6:23:59<19:51:30, 7.63s/it, loss=0.0006, acc=0.9968, iter_time=7.21s]
Epoch 0: 24%|██▍ | 3017/12384 [6:24:06<19:51:30, 7.63s/it, loss=0.0008, acc=0.9971, iter_time=6.41s]
Epoch 0: 24%|██▍ | 3018/12384 [6:24:06<19:50:58, 7.63s/it, loss=0.0008, acc=0.9971, iter_time=6.41s]
Epoch 0: 24%|██▍ | 3018/12384 [6:24:14<19:50:58, 7.63s/it, loss=0.0014, acc=0.9955, iter_time=8.83s]
Epoch 0: 24%|██▍ | 3019/12384 [6:24:14<19:50:52, 7.63s/it, loss=0.0014, acc=0.9955, iter_time=8.83s]
Epoch 0: 24%|██▍ | 3019/12384 [6:24:22<19:50:52, 7.63s/it, loss=0.0002, acc=0.9985, iter_time=6.68s]
Epoch 0: 24%|██▍ | 3020/12384 [6:24:22<19:50:31, 7.63s/it, loss=0.0002, acc=0.9985, iter_time=6.68s]
Epoch 0: 24%|██▍ | 3020/12384 [6:24:29<19:50:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 0: 24%|██▍ | 3021/12384 [6:24:29<19:50:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 0: 24%|██▍ | 3021/12384 [6:24:37<19:50:07, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.90s]
Epoch 0: 24%|██▍ | 3022/12384 [6:24:37<19:48:03, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.90s]
Epoch 0: 24%|██▍ | 3022/12384 [6:24:44<19:48:03, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.73s]
Epoch 0: 24%|██▍ | 3023/12384 [6:24:44<19:49:01, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.73s]
Epoch 0: 24%|██▍ | 3023/12384 [6:24:52<19:49:01, 7.62s/it, loss=0.0022, acc=0.9970, iter_time=10.14s]
Epoch 0: 24%|██▍ | 3024/12384 [6:24:52<19:46:49, 7.61s/it, loss=0.0022, acc=0.9970, iter_time=10.14s]
Epoch 0: 24%|██▍ | 3024/12384 [6:25:00<19:46:49, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=3.84s]
Epoch 0: 24%|██▍ | 3025/12384 [6:25:00<19:47:22, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=3.84s]
Epoch 0: 24%|██▍ | 3025/12384 [6:25:07<19:47:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.42s]
Epoch 0: 24%|██▍ | 3026/12384 [6:25:07<19:48:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.42s]
Epoch 0: 24%|██▍ | 3026/12384 [6:25:15<19:48:32, 7.62s/it, loss=0.0024, acc=0.9971, iter_time=7.64s]
Epoch 0: 24%|██▍ | 3027/12384 [6:25:15<19:48:15, 7.62s/it, loss=0.0024, acc=0.9971, iter_time=7.64s]
Epoch 0: 24%|██▍ | 3027/12384 [6:25:23<19:48:15, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.71s]
Epoch 0: 24%|██▍ | 3028/12384 [6:25:23<19:51:10, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.71s]
Epoch 0: 24%|██▍ | 3028/12384 [6:25:30<19:51:10, 7.64s/it, loss=0.0004, acc=0.9992, iter_time=7.29s]
Epoch 0: 24%|██▍ | 3029/12384 [6:25:30<19:49:01, 7.63s/it, loss=0.0004, acc=0.9992, iter_time=7.29s]
Epoch 0: 24%|██▍ | 3029/12384 [6:25:38<19:49:01, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.04s]
Epoch 0: 24%|██▍ | 3030/12384 [6:25:38<19:49:53, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.04s]
Epoch 0: 24%|██▍ | 3030/12384 [6:25:45<19:49:53, 7.63s/it, loss=0.0005, acc=0.9977, iter_time=10.49s]
Epoch 0: 24%|██▍ | 3031/12384 [6:25:45<19:48:14, 7.62s/it, loss=0.0005, acc=0.9977, iter_time=10.49s]
Epoch 0: 24%|██▍ | 3031/12384 [6:25:53<19:48:14, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=7.91s]
Epoch 0: 24%|██▍ | 3032/12384 [6:25:53<20:02:59, 7.72s/it, loss=0.0002, acc=0.9998, iter_time=7.91s]
Epoch 0: 24%|██▍ | 3032/12384 [6:26:01<20:02:59, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 24%|██▍ | 3033/12384 [6:26:01<19:57:29, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 24%|██▍ | 3033/12384 [6:26:09<19:57:29, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 0: 24%|██▍ | 3034/12384 [6:26:09<19:55:00, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 0: 24%|██▍ | 3034/12384 [6:26:16<19:55:00, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=7.92s]
Epoch 0: 25%|██▍ | 3035/12384 [6:26:16<19:51:25, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.92s]
Epoch 0: 25%|██▍ | 3035/12384 [6:26:24<19:51:25, 7.65s/it, loss=0.0011, acc=0.9949, iter_time=9.07s]
Epoch 0: 25%|██▍ | 3036/12384 [6:26:24<19:48:10, 7.63s/it, loss=0.0011, acc=0.9949, iter_time=9.07s]
Epoch 0: 25%|██▍ | 3036/12384 [6:26:31<19:48:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 25%|██▍ | 3037/12384 [6:26:31<19:47:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 25%|██▍ | 3037/12384 [6:26:39<19:47:50, 7.62s/it, loss=0.0011, acc=0.9992, iter_time=7.61s]
Epoch 0: 25%|██▍ | 3038/12384 [6:26:39<19:47:28, 7.62s/it, loss=0.0011, acc=0.9992, iter_time=7.61s]
Epoch 0: 25%|██▍ | 3038/12384 [6:26:47<19:47:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 0: 25%|██▍ | 3039/12384 [6:26:47<19:45:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 0: 25%|██▍ | 3039/12384 [6:26:54<19:45:04, 7.61s/it, loss=0.0006, acc=0.9976, iter_time=8.26s]
Epoch 0: 25%|██▍ | 3040/12384 [6:26:54<19:44:52, 7.61s/it, loss=0.0006, acc=0.9976, iter_time=8.26s]
Epoch 0: 25%|██▍ | 3040/12384 [6:27:02<19:44:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 25%|██▍ | 3041/12384 [6:27:02<19:44:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 25%|██▍ | 3041/12384 [6:27:09<19:44:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 0: 25%|██▍ | 3042/12384 [6:27:09<19:44:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 0: 25%|██▍ | 3042/12384 [6:27:17<19:44:18, 7.61s/it, loss=0.0015, acc=0.9969, iter_time=8.54s]
Epoch 0: 25%|██▍ | 3043/12384 [6:27:17<19:43:46, 7.60s/it, loss=0.0015, acc=0.9969, iter_time=8.54s]
Epoch 0: 25%|██▍ | 3043/12384 [6:27:25<19:43:46, 7.60s/it, loss=0.0004, acc=0.9984, iter_time=7.61s]
Epoch 0: 25%|██▍ | 3044/12384 [6:27:25<19:43:42, 7.60s/it, loss=0.0004, acc=0.9984, iter_time=7.61s]
Epoch 0: 25%|██▍ | 3044/12384 [6:27:32<19:43:42, 7.60s/it, loss=0.0003, acc=0.9984, iter_time=6.08s]
Epoch 0: 25%|██▍ | 3045/12384 [6:27:32<19:43:54, 7.61s/it, loss=0.0003, acc=0.9984, iter_time=6.08s]
Epoch 0: 25%|██▍ | 3045/12384 [6:27:40<19:43:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 0: 25%|██▍ | 3046/12384 [6:27:40<19:43:16, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 0: 25%|██▍ | 3046/12384 [6:27:47<19:43:16, 7.60s/it, loss=0.0004, acc=0.9990, iter_time=7.60s]
Epoch 0: 25%|██▍ | 3047/12384 [6:27:47<19:44:06, 7.61s/it, loss=0.0004, acc=0.9990, iter_time=7.60s]
Epoch 0: 25%|██▍ | 3047/12384 [6:27:55<19:44:06, 7.61s/it, loss=0.0009, acc=0.9978, iter_time=8.00s]
Epoch 0: 25%|██▍ | 3048/12384 [6:27:55<19:44:05, 7.61s/it, loss=0.0009, acc=0.9978, iter_time=8.00s]
Epoch 0: 25%|██▍ | 3048/12384 [6:28:03<19:44:05, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.22s]
Epoch 0: 25%|██▍ | 3049/12384 [6:28:03<19:44:48, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.22s]
Epoch 0: 25%|██▍ | 3049/12384 [6:28:10<19:44:48, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=8.03s]
Epoch 0: 25%|██▍ | 3050/12384 [6:28:10<19:44:24, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=8.03s]
Epoch 0: 25%|██▍ | 3050/12384 [6:28:18<19:44:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 0: 25%|██▍ | 3051/12384 [6:28:18<19:47:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 0: 25%|██▍ | 3051/12384 [6:28:25<19:47:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 25%|██▍ | 3052/12384 [6:28:25<19:45:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 25%|██▍ | 3052/12384 [6:28:33<19:45:04, 7.62s/it, loss=0.0018, acc=0.9982, iter_time=7.70s]
Epoch 0: 25%|██▍ | 3053/12384 [6:28:33<19:49:03, 7.65s/it, loss=0.0018, acc=0.9982, iter_time=7.70s]
Epoch 0: 25%|██▍ | 3053/12384 [6:28:41<19:49:03, 7.65s/it, loss=0.0001, acc=0.9999, iter_time=7.61s]
Epoch 0: 25%|██▍ | 3054/12384 [6:28:41<19:46:48, 7.63s/it, loss=0.0001, acc=0.9999, iter_time=7.61s]
Epoch 0: 25%|██▍ | 3054/12384 [6:28:49<19:46:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 25%|██▍ | 3055/12384 [6:28:49<19:50:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 25%|██▍ | 3055/12384 [6:28:56<19:50:35, 7.66s/it, loss=0.0001, acc=0.9998, iter_time=7.76s]
Epoch 0: 25%|██▍ | 3056/12384 [6:28:56<19:52:13, 7.67s/it, loss=0.0001, acc=0.9998, iter_time=7.76s]
Epoch 0: 25%|██▍ | 3056/12384 [6:29:04<19:52:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 0: 25%|██▍ | 3057/12384 [6:29:04<20:01:25, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 0: 25%|██▍ | 3057/12384 [6:29:12<20:01:25, 7.73s/it, loss=0.0006, acc=0.9972, iter_time=7.71s]
Epoch 0: 25%|██▍ | 3058/12384 [6:29:12<20:10:35, 7.79s/it, loss=0.0006, acc=0.9972, iter_time=7.71s]
Epoch 0: 25%|██▍ | 3058/12384 [6:29:20<20:10:35, 7.79s/it, loss=0.0010, acc=0.9963, iter_time=7.83s]
Epoch 0: 25%|██▍ | 3059/12384 [6:29:20<20:01:49, 7.73s/it, loss=0.0010, acc=0.9963, iter_time=7.83s]
Epoch 0: 25%|██▍ | 3059/12384 [6:29:27<20:01:49, 7.73s/it, loss=0.0006, acc=0.9981, iter_time=6.96s]
Epoch 0: 25%|██▍ | 3060/12384 [6:29:27<19:55:01, 7.69s/it, loss=0.0006, acc=0.9981, iter_time=6.96s]
Epoch 0: 25%|██▍ | 3060/12384 [6:29:35<19:55:01, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 0: 25%|██▍ | 3061/12384 [6:29:35<19:51:34, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 0: 25%|██▍ | 3061/12384 [6:29:42<19:51:34, 7.67s/it, loss=0.0004, acc=0.9994, iter_time=7.62s]
Epoch 0: 25%|██▍ | 3062/12384 [6:29:42<19:48:31, 7.65s/it, loss=0.0004, acc=0.9994, iter_time=7.62s]
Epoch 0: 25%|██▍ | 3062/12384 [6:29:50<19:48:31, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=5.79s]
Epoch 0: 25%|██▍ | 3063/12384 [6:29:50<19:46:35, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=5.79s]
Epoch 0: 25%|██▍ | 3063/12384 [6:29:58<19:46:35, 7.64s/it, loss=0.0015, acc=0.9963, iter_time=9.36s]
Epoch 0: 25%|██▍ | 3064/12384 [6:29:58<19:44:39, 7.63s/it, loss=0.0015, acc=0.9963, iter_time=9.36s]
Epoch 0: 25%|██▍ | 3064/12384 [6:30:05<19:44:39, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=5.13s]
Epoch 0: 25%|██▍ | 3065/12384 [6:30:05<19:45:30, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=5.13s]
Epoch 0: 25%|██▍ | 3065/12384 [6:30:13<19:45:30, 7.63s/it, loss=0.0002, acc=0.9999, iter_time=10.18s]
Epoch 0: 25%|██▍ | 3066/12384 [6:30:13<19:43:47, 7.62s/it, loss=0.0002, acc=0.9999, iter_time=10.18s]
Epoch 0: 25%|██▍ | 3066/12384 [6:30:20<19:43:47, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 25%|██▍ | 3067/12384 [6:30:20<19:43:19, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 25%|██▍ | 3067/12384 [6:30:28<19:43:19, 7.62s/it, loss=0.0004, acc=1.0000, iter_time=7.62s]
Epoch 0: 25%|██▍ | 3068/12384 [6:30:28<19:43:42, 7.62s/it, loss=0.0004, acc=1.0000, iter_time=7.62s]
Epoch 0: 25%|██▍ | 3068/12384 [6:30:36<19:43:42, 7.62s/it, loss=0.0001, acc=0.9997, iter_time=7.63s]
Epoch 0: 25%|██▍ | 3069/12384 [6:30:36<19:43:39, 7.62s/it, loss=0.0001, acc=0.9997, iter_time=7.63s]
Epoch 0: 25%|██▍ | 3069/12384 [6:30:43<19:43:39, 7.62s/it, loss=0.0003, acc=0.9985, iter_time=6.09s]
Epoch 0: 25%|██▍ | 3070/12384 [6:30:43<19:42:12, 7.62s/it, loss=0.0003, acc=0.9985, iter_time=6.09s]
Epoch 0: 25%|██▍ | 3070/12384 [6:30:51<19:42:12, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=8.57s]
Epoch 0: 25%|██▍ | 3071/12384 [6:30:51<19:41:29, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=8.57s]
Epoch 0: 25%|██▍ | 3071/12384 [6:30:59<19:41:29, 7.61s/it, loss=0.0006, acc=0.9999, iter_time=8.55s]
Epoch 0: 25%|██▍ | 3072/12384 [6:30:59<19:40:56, 7.61s/it, loss=0.0006, acc=0.9999, iter_time=8.55s]
Epoch 0: 25%|██▍ | 3072/12384 [6:31:06<19:40:56, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=4.89s]
Epoch 0: 25%|██▍ | 3073/12384 [6:31:06<19:40:51, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=4.89s]
Epoch 0: 25%|██▍ | 3073/12384 [6:31:14<19:40:51, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.08s]
Epoch 0: 25%|██▍ | 3074/12384 [6:31:14<19:40:49, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.08s]
Epoch 0: 25%|██▍ | 3074/12384 [6:31:21<19:40:49, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.46s]
Epoch 0: 25%|██▍ | 3075/12384 [6:31:21<19:44:15, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=10.46s]
Epoch 0: 25%|██▍ | 3075/12384 [6:31:29<19:44:15, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.70s]
Epoch 0: 25%|██▍ | 3076/12384 [6:31:29<19:43:01, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.70s]
Epoch 0: 25%|██▍ | 3076/12384 [6:31:37<19:43:01, 7.63s/it, loss=0.0002, acc=0.9990, iter_time=7.60s]
Epoch 0: 25%|██▍ | 3077/12384 [6:31:37<19:41:13, 7.62s/it, loss=0.0002, acc=0.9990, iter_time=7.60s]
Epoch 0: 25%|██▍ | 3077/12384 [6:31:44<19:41:13, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=7.61s]
Epoch 0: 25%|██▍ | 3078/12384 [6:31:44<19:40:52, 7.61s/it, loss=0.0002, acc=0.9998, iter_time=7.61s]
Epoch 0: 25%|██▍ | 3078/12384 [6:31:52<19:40:52, 7.61s/it, loss=0.0003, acc=0.9977, iter_time=6.74s]
Epoch 0: 25%|██▍ | 3079/12384 [6:31:52<19:41:19, 7.62s/it, loss=0.0003, acc=0.9977, iter_time=6.74s]
Epoch 0: 25%|██▍ | 3079/12384 [6:32:00<19:41:19, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.88s]
Epoch 0: 25%|██▍ | 3080/12384 [6:32:00<19:40:48, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.88s]
Epoch 0: 25%|██▍ | 3080/12384 [6:32:07<19:40:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 25%|██▍ | 3081/12384 [6:32:07<19:40:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 25%|██▍ | 3081/12384 [6:32:15<19:40:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 0: 25%|██▍ | 3082/12384 [6:32:15<19:40:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 0: 25%|██▍ | 3082/12384 [6:32:22<19:40:02, 7.61s/it, loss=0.0014, acc=0.9967, iter_time=5.83s]
Epoch 0: 25%|██▍ | 3083/12384 [6:32:22<19:39:22, 7.61s/it, loss=0.0014, acc=0.9967, iter_time=5.83s]
Epoch 0: 25%|██▍ | 3083/12384 [6:32:30<19:39:22, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.63s]
Epoch 0: 25%|██▍ | 3084/12384 [6:32:30<19:40:14, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.63s]
Epoch 0: 25%|██▍ | 3084/12384 [6:32:38<19:40:14, 7.61s/it, loss=0.0002, acc=0.9999, iter_time=7.69s]
Epoch 0: 25%|██▍ | 3085/12384 [6:32:38<19:56:14, 7.72s/it, loss=0.0002, acc=0.9999, iter_time=7.69s]
Epoch 0: 25%|██▍ | 3085/12384 [6:32:46<19:56:14, 7.72s/it, loss=0.0004, acc=0.9998, iter_time=7.90s]
Epoch 0: 25%|██▍ | 3086/12384 [6:32:46<19:51:38, 7.69s/it, loss=0.0004, acc=0.9998, iter_time=7.90s]
Epoch 0: 25%|██▍ | 3086/12384 [6:32:53<19:51:38, 7.69s/it, loss=0.0003, acc=0.9991, iter_time=7.62s]
Epoch 0: 25%|██▍ | 3087/12384 [6:32:53<19:47:49, 7.67s/it, loss=0.0003, acc=0.9991, iter_time=7.62s]
Epoch 0: 25%|██▍ | 3087/12384 [6:33:01<19:47:49, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 25%|██▍ | 3088/12384 [6:33:01<19:46:17, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 25%|██▍ | 3088/12384 [6:33:08<19:46:17, 7.66s/it, loss=0.0005, acc=0.9960, iter_time=7.64s]
Epoch 0: 25%|██▍ | 3089/12384 [6:33:08<19:46:20, 7.66s/it, loss=0.0005, acc=0.9960, iter_time=7.64s]
Epoch 0: 25%|██▍ | 3089/12384 [6:33:16<19:46:20, 7.66s/it, loss=0.0005, acc=0.9989, iter_time=6.20s]
Epoch 0: 25%|██▍ | 3090/12384 [6:33:16<19:45:00, 7.65s/it, loss=0.0005, acc=0.9989, iter_time=6.20s]
Epoch 0: 25%|██▍ | 3090/12384 [6:33:24<19:45:00, 7.65s/it, loss=0.0003, acc=0.9999, iter_time=9.11s]
Epoch 0: 25%|██▍ | 3091/12384 [6:33:24<19:42:27, 7.63s/it, loss=0.0003, acc=0.9999, iter_time=9.11s]
Epoch 0: 25%|██▍ | 3091/12384 [6:33:31<19:42:27, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 25%|██▍ | 3092/12384 [6:33:31<19:40:43, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 25%|██▍ | 3092/12384 [6:33:39<19:40:43, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 25%|██▍ | 3093/12384 [6:33:39<19:40:27, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 25%|██▍ | 3093/12384 [6:33:47<19:40:27, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.88s]
Epoch 0: 25%|██▍ | 3094/12384 [6:33:47<19:40:09, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.88s]
Epoch 0: 25%|██▍ | 3094/12384 [6:33:54<19:40:09, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.35s]
Epoch 0: 25%|██▍ | 3095/12384 [6:33:54<19:38:03, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.35s]
Epoch 0: 25%|██▍ | 3095/12384 [6:34:02<19:38:03, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.98s]
Epoch 0: 25%|██▌ | 3096/12384 [6:34:02<19:38:13, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.98s]
Epoch 0: 25%|██▌ | 3096/12384 [6:34:09<19:38:13, 7.61s/it, loss=0.0008, acc=0.9987, iter_time=7.23s]
Epoch 0: 25%|██▌ | 3097/12384 [6:34:09<19:37:44, 7.61s/it, loss=0.0008, acc=0.9987, iter_time=7.23s]
Epoch 0: 25%|██▌ | 3097/12384 [6:34:17<19:37:44, 7.61s/it, loss=0.0001, acc=0.9997, iter_time=5.55s]
Epoch 0: 25%|██▌ | 3098/12384 [6:34:17<19:40:45, 7.63s/it, loss=0.0001, acc=0.9997, iter_time=5.55s]
Epoch 0: 25%|██▌ | 3098/12384 [6:34:25<19:40:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 25%|██▌ | 3099/12384 [6:34:25<19:39:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 25%|██▌ | 3099/12384 [6:34:32<19:39:47, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=10.55s]
Epoch 0: 25%|██▌ | 3100/12384 [6:34:32<19:38:48, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=10.55s]
Epoch 0: 25%|██▌ | 3100/12384 [6:34:40<19:38:48, 7.62s/it, loss=0.0035, acc=0.9950, iter_time=7.21s]
Epoch 0: 25%|██▌ | 3101/12384 [6:34:40<19:38:00, 7.61s/it, loss=0.0035, acc=0.9950, iter_time=7.21s]
Epoch 0: 25%|██▌ | 3101/12384 [6:34:47<19:38:00, 7.61s/it, loss=0.0004, acc=0.9993, iter_time=7.60s]
Epoch 0: 25%|██▌ | 3102/12384 [6:34:47<19:38:23, 7.62s/it, loss=0.0004, acc=0.9993, iter_time=7.60s]
Epoch 0: 25%|██▌ | 3102/12384 [6:34:55<19:38:23, 7.62s/it, loss=0.0004, acc=0.9985, iter_time=7.63s]
Epoch 0: 25%|██▌ | 3103/12384 [6:34:55<19:38:23, 7.62s/it, loss=0.0004, acc=0.9985, iter_time=7.63s]
Epoch 0: 25%|██▌ | 3103/12384 [6:35:03<19:38:23, 7.62s/it, loss=0.0003, acc=0.9984, iter_time=7.56s]
Epoch 0: 25%|██▌ | 3104/12384 [6:35:03<19:38:00, 7.62s/it, loss=0.0003, acc=0.9984, iter_time=7.56s]
Epoch 0: 25%|██▌ | 3104/12384 [6:35:10<19:38:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 0: 25%|██▌ | 3105/12384 [6:35:10<19:37:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 0: 25%|██▌ | 3105/12384 [6:35:18<19:37:44, 7.62s/it, loss=0.0002, acc=0.9994, iter_time=7.96s]
Epoch 0: 25%|██▌ | 3106/12384 [6:35:18<19:40:29, 7.63s/it, loss=0.0002, acc=0.9994, iter_time=7.96s]
Epoch 0: 25%|██▌ | 3106/12384 [6:35:26<19:40:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 0: 25%|██▌ | 3107/12384 [6:35:26<19:40:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 0: 25%|██▌ | 3107/12384 [6:35:33<19:40:43, 7.64s/it, loss=0.0002, acc=0.9987, iter_time=7.66s]
Epoch 0: 25%|██▌ | 3108/12384 [6:35:33<19:39:24, 7.63s/it, loss=0.0002, acc=0.9987, iter_time=7.66s]
Epoch 0: 25%|██▌ | 3108/12384 [6:35:41<19:39:24, 7.63s/it, loss=0.0030, acc=0.9922, iter_time=5.85s]
Epoch 0: 25%|██▌ | 3109/12384 [6:35:41<19:39:09, 7.63s/it, loss=0.0030, acc=0.9922, iter_time=5.85s]
Epoch 0: 25%|██▌ | 3109/12384 [6:35:48<19:39:09, 7.63s/it, loss=0.0009, acc=0.9975, iter_time=8.72s]
Epoch 0: 25%|██▌ | 3110/12384 [6:35:48<19:37:04, 7.62s/it, loss=0.0009, acc=0.9975, iter_time=8.72s]
Epoch 0: 25%|██▌ | 3110/12384 [6:35:56<19:37:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 0: 25%|██▌ | 3111/12384 [6:35:56<19:53:40, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 0: 25%|██▌ | 3111/12384 [6:36:04<19:53:40, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=8.30s]
Epoch 0: 25%|██▌ | 3112/12384 [6:36:04<19:48:42, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=8.30s]
Epoch 0: 25%|██▌ | 3112/12384 [6:36:12<19:48:42, 7.69s/it, loss=0.0005, acc=0.9994, iter_time=7.01s]
Epoch 0: 25%|██▌ | 3113/12384 [6:36:12<19:44:08, 7.66s/it, loss=0.0005, acc=0.9994, iter_time=7.01s]
Epoch 0: 25%|██▌ | 3113/12384 [6:36:19<19:44:08, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 25%|██▌ | 3114/12384 [6:36:19<19:42:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 25%|██▌ | 3114/12384 [6:36:27<19:42:00, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.84s]
Epoch 0: 25%|██▌ | 3115/12384 [6:36:27<19:40:00, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.84s]
Epoch 0: 25%|██▌ | 3115/12384 [6:36:34<19:40:00, 7.64s/it, loss=0.0009, acc=0.9973, iter_time=7.63s]
Epoch 0: 25%|██▌ | 3116/12384 [6:36:34<19:38:21, 7.63s/it, loss=0.0009, acc=0.9973, iter_time=7.63s]
Epoch 0: 25%|██▌ | 3116/12384 [6:36:42<19:38:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 0: 25%|██▌ | 3117/12384 [6:36:42<19:36:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 0: 25%|██▌ | 3117/12384 [6:36:50<19:36:59, 7.62s/it, loss=0.0022, acc=0.9940, iter_time=9.91s]
Epoch 0: 25%|██▌ | 3118/12384 [6:36:50<19:36:29, 7.62s/it, loss=0.0022, acc=0.9940, iter_time=9.91s]
Epoch 0: 25%|██▌ | 3118/12384 [6:36:57<19:36:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 25%|██▌ | 3119/12384 [6:36:57<19:40:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 25%|██▌ | 3119/12384 [6:37:05<19:40:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 25%|██▌ | 3120/12384 [6:37:05<19:38:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 25%|██▌ | 3120/12384 [6:37:13<19:38:23, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 25%|██▌ | 3121/12384 [6:37:13<19:37:51, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 25%|██▌ | 3121/12384 [6:37:20<19:37:51, 7.63s/it, loss=0.0010, acc=0.9982, iter_time=6.71s]
Epoch 0: 25%|██▌ | 3122/12384 [6:37:20<19:35:44, 7.62s/it, loss=0.0010, acc=0.9982, iter_time=6.71s]
Epoch 0: 25%|██▌ | 3122/12384 [6:37:28<19:35:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.97s]
Epoch 0: 25%|██▌ | 3123/12384 [6:37:28<19:35:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.97s]
Epoch 0: 25%|██▌ | 3123/12384 [6:37:35<19:35:54, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=8.70s]
Epoch 0: 25%|██▌ | 3124/12384 [6:37:35<19:34:37, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=8.70s]
Epoch 0: 25%|██▌ | 3124/12384 [6:37:43<19:34:37, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.28s]
Epoch 0: 25%|██▌ | 3125/12384 [6:37:43<19:34:47, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.28s]
Epoch 0: 25%|██▌ | 3125/12384 [6:37:51<19:34:47, 7.61s/it, loss=0.0005, acc=0.9988, iter_time=9.40s]
Epoch 0: 25%|██▌ | 3126/12384 [6:37:51<19:34:31, 7.61s/it, loss=0.0005, acc=0.9988, iter_time=9.40s]
Epoch 0: 25%|██▌ | 3126/12384 [6:37:58<19:34:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 25%|██▌ | 3127/12384 [6:37:58<19:34:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 25%|██▌ | 3127/12384 [6:38:06<19:34:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 25%|██▌ | 3128/12384 [6:38:06<19:34:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 25%|██▌ | 3128/12384 [6:38:13<19:34:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 0: 25%|██▌ | 3129/12384 [6:38:13<19:34:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 0: 25%|██▌ | 3129/12384 [6:38:21<19:34:35, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 25%|██▌ | 3130/12384 [6:38:21<19:34:43, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 25%|██▌ | 3130/12384 [6:38:29<19:34:43, 7.62s/it, loss=0.0002, acc=0.9983, iter_time=7.63s]
Epoch 0: 25%|██▌ | 3131/12384 [6:38:29<19:34:25, 7.62s/it, loss=0.0002, acc=0.9983, iter_time=7.63s]
Epoch 0: 25%|██▌ | 3131/12384 [6:38:36<19:34:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 0: 25%|██▌ | 3132/12384 [6:38:36<19:34:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 0: 25%|██▌ | 3132/12384 [6:38:44<19:34:57, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.66s]
Epoch 0: 25%|██▌ | 3133/12384 [6:38:44<19:33:38, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.66s]
Epoch 0: 25%|██▌ | 3133/12384 [6:38:52<19:33:38, 7.61s/it, loss=0.0005, acc=0.9997, iter_time=7.87s]
Epoch 0: 25%|██▌ | 3134/12384 [6:38:52<19:33:38, 7.61s/it, loss=0.0005, acc=0.9997, iter_time=7.87s]
Epoch 0: 25%|██▌ | 3134/12384 [6:38:59<19:33:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 0: 25%|██▌ | 3135/12384 [6:38:59<19:47:06, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 0: 25%|██▌ | 3135/12384 [6:39:07<19:47:06, 7.70s/it, loss=0.0003, acc=0.9993, iter_time=8.00s]
Epoch 0: 25%|██▌ | 3136/12384 [6:39:07<19:43:33, 7.68s/it, loss=0.0003, acc=0.9993, iter_time=8.00s]
Epoch 0: 25%|██▌ | 3136/12384 [6:39:15<19:43:33, 7.68s/it, loss=0.0002, acc=0.9999, iter_time=7.29s]
Epoch 0: 25%|██▌ | 3137/12384 [6:39:15<19:54:16, 7.75s/it, loss=0.0002, acc=0.9999, iter_time=7.29s]
Epoch 0: 25%|██▌ | 3137/12384 [6:39:23<19:54:16, 7.75s/it, loss=0.0007, acc=0.9969, iter_time=5.26s]
Epoch 0: 25%|██▌ | 3138/12384 [6:39:23<19:47:11, 7.70s/it, loss=0.0007, acc=0.9969, iter_time=5.26s]
Epoch 0: 25%|██▌ | 3138/12384 [6:39:30<19:47:11, 7.70s/it, loss=0.0003, acc=1.0000, iter_time=10.19s]
Epoch 0: 25%|██▌ | 3139/12384 [6:39:30<19:43:29, 7.68s/it, loss=0.0003, acc=1.0000, iter_time=10.19s]
Epoch 0: 25%|██▌ | 3139/12384 [6:39:38<19:43:29, 7.68s/it, loss=0.0002, acc=0.9983, iter_time=7.61s]
Epoch 0: 25%|██▌ | 3140/12384 [6:39:38<19:39:31, 7.66s/it, loss=0.0002, acc=0.9983, iter_time=7.61s]
Epoch 0: 25%|██▌ | 3140/12384 [6:39:45<19:39:31, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 25%|██▌ | 3141/12384 [6:39:45<19:37:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 25%|██▌ | 3141/12384 [6:39:53<19:37:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.02s]
Epoch 0: 25%|██▌ | 3142/12384 [6:39:53<19:36:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.02s]
Epoch 0: 25%|██▌ | 3142/12384 [6:40:01<19:36:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.20s]
Epoch 0: 25%|██▌ | 3143/12384 [6:40:01<19:39:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=11.20s]
Epoch 0: 25%|██▌ | 3143/12384 [6:40:08<19:39:29, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=8.09s]
Epoch 0: 25%|██▌ | 3144/12384 [6:40:08<19:37:31, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.09s]
Epoch 0: 25%|██▌ | 3144/12384 [6:40:16<19:37:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.97s]
Epoch 0: 25%|██▌ | 3145/12384 [6:40:16<19:35:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.97s]
Epoch 0: 25%|██▌ | 3145/12384 [6:40:24<19:35:15, 7.63s/it, loss=0.0008, acc=0.9981, iter_time=9.87s]
Epoch 0: 25%|██▌ | 3146/12384 [6:40:24<19:33:48, 7.62s/it, loss=0.0008, acc=0.9981, iter_time=9.87s]
Epoch 0: 25%|██▌ | 3146/12384 [6:40:31<19:33:48, 7.62s/it, loss=0.0008, acc=0.9977, iter_time=4.32s]
Epoch 0: 25%|██▌ | 3147/12384 [6:40:31<19:32:58, 7.62s/it, loss=0.0008, acc=0.9977, iter_time=4.32s]
Epoch 0: 25%|██▌ | 3147/12384 [6:40:39<19:32:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 0: 25%|██▌ | 3148/12384 [6:40:39<19:32:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 0: 25%|██▌ | 3148/12384 [6:40:46<19:32:47, 7.62s/it, loss=0.0002, acc=0.9995, iter_time=8.67s]
Epoch 0: 25%|██▌ | 3149/12384 [6:40:46<19:32:48, 7.62s/it, loss=0.0002, acc=0.9995, iter_time=8.67s]
Epoch 0: 25%|██▌ | 3149/12384 [6:40:54<19:32:48, 7.62s/it, loss=0.0009, acc=0.9982, iter_time=9.78s]
Epoch 0: 25%|██▌ | 3150/12384 [6:40:54<19:32:49, 7.62s/it, loss=0.0009, acc=0.9982, iter_time=9.78s]
Epoch 0: 25%|██▌ | 3150/12384 [6:41:02<19:32:49, 7.62s/it, loss=0.0003, acc=0.9984, iter_time=7.20s]
Epoch 0: 25%|██▌ | 3151/12384 [6:41:02<19:31:58, 7.62s/it, loss=0.0003, acc=0.9984, iter_time=7.20s]
Epoch 0: 25%|██▌ | 3151/12384 [6:41:09<19:31:58, 7.62s/it, loss=0.0003, acc=0.9983, iter_time=8.00s]
Epoch 0: 25%|██▌ | 3152/12384 [6:41:09<19:31:14, 7.61s/it, loss=0.0003, acc=0.9983, iter_time=8.00s]
Epoch 0: 25%|██▌ | 3152/12384 [6:41:17<19:31:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 0: 25%|██▌ | 3153/12384 [6:41:17<19:30:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 0: 25%|██▌ | 3153/12384 [6:41:24<19:30:53, 7.61s/it, loss=0.0002, acc=0.9994, iter_time=6.55s]
Epoch 0: 25%|██▌ | 3154/12384 [6:41:24<19:30:07, 7.61s/it, loss=0.0002, acc=0.9994, iter_time=6.55s]
Epoch 0: 25%|██▌ | 3154/12384 [6:41:32<19:30:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.99s]
Epoch 0: 25%|██▌ | 3155/12384 [6:41:32<19:29:36, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.99s]
Epoch 0: 25%|██▌ | 3155/12384 [6:41:40<19:29:36, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=11.21s]
Epoch 0: 25%|██▌ | 3156/12384 [6:41:40<19:29:13, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=11.21s]
Epoch 0: 25%|██▌ | 3156/12384 [6:41:47<19:29:13, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 25%|██▌ | 3157/12384 [6:41:47<19:28:38, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 25%|██▌ | 3157/12384 [6:41:55<19:28:38, 7.60s/it, loss=0.0001, acc=0.9998, iter_time=6.48s]
Epoch 0: 26%|██▌ | 3158/12384 [6:41:55<19:28:53, 7.60s/it, loss=0.0001, acc=0.9998, iter_time=6.48s]
Epoch 0: 26%|██▌ | 3158/12384 [6:42:02<19:28:53, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 0: 26%|██▌ | 3159/12384 [6:42:02<19:28:45, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 0: 26%|██▌ | 3159/12384 [6:42:10<19:28:45, 7.60s/it, loss=0.0002, acc=0.9999, iter_time=8.01s]
Epoch 0: 26%|██▌ | 3160/12384 [6:42:10<19:29:02, 7.60s/it, loss=0.0002, acc=0.9999, iter_time=8.01s]
Epoch 0: 26%|██▌ | 3160/12384 [6:42:18<19:29:02, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=3.63s]
Epoch 0: 26%|██▌ | 3161/12384 [6:42:18<19:29:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.63s]
Epoch 0: 26%|██▌ | 3161/12384 [6:42:25<19:29:22, 7.61s/it, loss=0.0005, acc=0.9981, iter_time=11.18s]
Epoch 0: 26%|██▌ | 3162/12384 [6:42:25<19:28:10, 7.60s/it, loss=0.0005, acc=0.9981, iter_time=11.18s]
Epoch 0: 26%|██▌ | 3162/12384 [6:42:33<19:28:10, 7.60s/it, loss=0.0010, acc=0.9973, iter_time=7.65s]
Epoch 0: 26%|██▌ | 3163/12384 [6:42:33<19:44:37, 7.71s/it, loss=0.0010, acc=0.9973, iter_time=7.65s]
Epoch 0: 26%|██▌ | 3163/12384 [6:42:41<19:44:37, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.90s]
Epoch 0: 26%|██▌ | 3164/12384 [6:42:41<19:38:48, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.90s]
Epoch 0: 26%|██▌ | 3164/12384 [6:42:48<19:38:48, 7.67s/it, loss=0.0003, acc=0.9999, iter_time=7.61s]
Epoch 0: 26%|██▌ | 3165/12384 [6:42:48<19:36:02, 7.65s/it, loss=0.0003, acc=0.9999, iter_time=7.61s]
Epoch 0: 26%|██▌ | 3165/12384 [6:42:56<19:36:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 0: 26%|██▌ | 3166/12384 [6:42:56<19:34:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 0: 26%|██▌ | 3166/12384 [6:43:04<19:34:22, 7.64s/it, loss=0.0005, acc=0.9982, iter_time=9.86s]
Epoch 0: 26%|██▌ | 3167/12384 [6:43:04<19:33:03, 7.64s/it, loss=0.0005, acc=0.9982, iter_time=9.86s]
Epoch 0: 26%|██▌ | 3167/12384 [6:43:11<19:33:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 26%|██▌ | 3168/12384 [6:43:11<19:32:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 26%|██▌ | 3168/12384 [6:43:19<19:32:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 26%|██▌ | 3169/12384 [6:43:19<19:33:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 26%|██▌ | 3169/12384 [6:43:27<19:33:27, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=4.32s]
Epoch 0: 26%|██▌ | 3170/12384 [6:43:27<19:31:22, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=4.32s]
Epoch 0: 26%|██▌ | 3170/12384 [6:43:34<19:31:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 0: 26%|██▌ | 3171/12384 [6:43:34<19:30:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 0: 26%|██▌ | 3171/12384 [6:43:42<19:30:47, 7.62s/it, loss=0.0003, acc=0.9986, iter_time=7.88s]
Epoch 0: 26%|██▌ | 3172/12384 [6:43:42<19:30:32, 7.62s/it, loss=0.0003, acc=0.9986, iter_time=7.88s]
Epoch 0: 26%|██▌ | 3172/12384 [6:43:49<19:30:32, 7.62s/it, loss=0.0019, acc=0.9952, iter_time=8.50s]
Epoch 0: 26%|██▌ | 3173/12384 [6:43:49<19:30:38, 7.63s/it, loss=0.0019, acc=0.9952, iter_time=8.50s]
Epoch 0: 26%|██▌ | 3173/12384 [6:43:57<19:30:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 0: 26%|██▌ | 3174/12384 [6:43:57<19:29:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 0: 26%|██▌ | 3174/12384 [6:44:05<19:29:45, 7.62s/it, loss=0.0002, acc=0.9996, iter_time=10.17s]
Epoch 0: 26%|██▌ | 3175/12384 [6:44:05<19:28:11, 7.61s/it, loss=0.0002, acc=0.9996, iter_time=10.17s]
Epoch 0: 26%|██▌ | 3175/12384 [6:44:12<19:28:11, 7.61s/it, loss=0.0018, acc=0.9956, iter_time=7.99s]
Epoch 0: 26%|██▌ | 3176/12384 [6:44:12<19:28:05, 7.61s/it, loss=0.0018, acc=0.9956, iter_time=7.99s]
Epoch 0: 26%|██▌ | 3176/12384 [6:44:20<19:28:05, 7.61s/it, loss=0.0017, acc=0.9955, iter_time=7.19s]
Epoch 0: 26%|██▌ | 3177/12384 [6:44:20<19:27:52, 7.61s/it, loss=0.0017, acc=0.9955, iter_time=7.19s]
Epoch 0: 26%|██▌ | 3177/12384 [6:44:27<19:27:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 26%|██▌ | 3178/12384 [6:44:27<19:28:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 26%|██▌ | 3178/12384 [6:44:35<19:28:52, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 26%|██▌ | 3179/12384 [6:44:35<19:28:14, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 26%|██▌ | 3179/12384 [6:44:43<19:28:14, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.45s]
Epoch 0: 26%|██▌ | 3180/12384 [6:44:43<19:28:08, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.45s]
Epoch 0: 26%|██▌ | 3180/12384 [6:44:50<19:28:08, 7.62s/it, loss=0.0011, acc=0.9978, iter_time=7.17s]
Epoch 0: 26%|██▌ | 3181/12384 [6:44:50<19:30:37, 7.63s/it, loss=0.0011, acc=0.9978, iter_time=7.17s]
Epoch 0: 26%|██▌ | 3181/12384 [6:44:58<19:30:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.23s]
Epoch 0: 26%|██▌ | 3182/12384 [6:44:58<19:28:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.23s]
Epoch 0: 26%|██▌ | 3182/12384 [6:45:06<19:28:29, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 26%|██▌ | 3183/12384 [6:45:06<19:27:36, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 26%|██▌ | 3183/12384 [6:45:13<19:27:36, 7.61s/it, loss=0.0059, acc=0.9883, iter_time=8.00s]
Epoch 0: 26%|██▌ | 3184/12384 [6:45:13<19:27:05, 7.61s/it, loss=0.0059, acc=0.9883, iter_time=8.00s]
Epoch 0: 26%|██▌ | 3184/12384 [6:45:21<19:27:05, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=6.60s]
Epoch 0: 26%|██▌ | 3185/12384 [6:45:21<19:26:23, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=6.60s]
Epoch 0: 26%|██▌ | 3185/12384 [6:45:28<19:26:23, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.71s]
Epoch 0: 26%|██▌ | 3186/12384 [6:45:28<19:26:14, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.71s]
Epoch 0: 26%|██▌ | 3186/12384 [6:45:36<19:26:14, 7.61s/it, loss=0.0008, acc=0.9964, iter_time=9.40s]
Epoch 0: 26%|██▌ | 3187/12384 [6:45:36<19:39:22, 7.69s/it, loss=0.0008, acc=0.9964, iter_time=9.40s]
Epoch 0: 26%|██▌ | 3187/12384 [6:45:44<19:39:22, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 26%|██▌ | 3188/12384 [6:45:44<19:35:56, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 26%|██▌ | 3188/12384 [6:45:52<19:35:56, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.67s]
Epoch 0: 26%|██▌ | 3189/12384 [6:45:52<19:48:27, 7.76s/it, loss=0.0001, acc=1.0000, iter_time=7.67s]
Epoch 0: 26%|██▌ | 3189/12384 [6:45:59<19:48:27, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 26%|██▌ | 3190/12384 [6:45:59<19:41:21, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 26%|██▌ | 3190/12384 [6:46:07<19:41:21, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=3.98s]
Epoch 0: 26%|██▌ | 3191/12384 [6:46:07<19:35:52, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=3.98s]
Epoch 0: 26%|██▌ | 3191/12384 [6:46:15<19:35:52, 7.67s/it, loss=0.0005, acc=0.9980, iter_time=11.58s]
Epoch 0: 26%|██▌ | 3192/12384 [6:46:15<19:32:15, 7.65s/it, loss=0.0005, acc=0.9980, iter_time=11.58s]
Epoch 0: 26%|██▌ | 3192/12384 [6:46:22<19:32:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.95s]
Epoch 0: 26%|██▌ | 3193/12384 [6:46:22<19:33:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.95s]
Epoch 0: 26%|██▌ | 3193/12384 [6:46:30<19:33:29, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=9.94s]
Epoch 0: 26%|██▌ | 3194/12384 [6:46:30<19:31:17, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=9.94s]
Epoch 0: 26%|██▌ | 3194/12384 [6:46:38<19:31:17, 7.65s/it, loss=0.0002, acc=0.9998, iter_time=5.32s]
Epoch 0: 26%|██▌ | 3195/12384 [6:46:38<19:28:19, 7.63s/it, loss=0.0002, acc=0.9998, iter_time=5.32s]
Epoch 0: 26%|██▌ | 3195/12384 [6:46:45<19:28:19, 7.63s/it, loss=0.0011, acc=0.9983, iter_time=7.81s]
Epoch 0: 26%|██▌ | 3196/12384 [6:46:45<19:27:09, 7.62s/it, loss=0.0011, acc=0.9983, iter_time=7.81s]
Epoch 0: 26%|██▌ | 3196/12384 [6:46:53<19:27:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 0: 26%|██▌ | 3197/12384 [6:46:53<19:29:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 0: 26%|██▌ | 3197/12384 [6:47:00<19:29:23, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.66s]
Epoch 0: 26%|██▌ | 3198/12384 [6:47:00<19:31:18, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.66s]
Epoch 0: 26%|██▌ | 3198/12384 [6:47:08<19:31:18, 7.65s/it, loss=0.0003, acc=0.9978, iter_time=7.38s]
Epoch 0: 26%|██▌ | 3199/12384 [6:47:08<19:27:49, 7.63s/it, loss=0.0003, acc=0.9978, iter_time=7.38s]
Epoch 0: 26%|██▌ | 3199/12384 [6:47:16<19:27:49, 7.63s/it, loss=0.0004, acc=0.9986, iter_time=8.29s]
Epoch 0: 26%|██▌ | 3200/12384 [6:47:16<19:26:38, 7.62s/it, loss=0.0004, acc=0.9986, iter_time=8.29s]
Epoch 0: 26%|██▌ | 3200/12384 [6:47:23<19:26:38, 7.62s/it, loss=0.0004, acc=0.9999, iter_time=7.21s]
Epoch 0: 26%|██▌ | 3201/12384 [6:47:23<19:30:02, 7.64s/it, loss=0.0004, acc=0.9999, iter_time=7.21s]
Epoch 0: 26%|██▌ | 3201/12384 [6:47:31<19:30:02, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=7.70s]
Epoch 0: 26%|██▌ | 3202/12384 [6:47:31<19:28:27, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=7.70s]
Epoch 0: 26%|██▌ | 3202/12384 [6:47:39<19:28:27, 7.64s/it, loss=0.0004, acc=0.9984, iter_time=7.62s]
Epoch 0: 26%|██▌ | 3203/12384 [6:47:39<19:26:57, 7.63s/it, loss=0.0004, acc=0.9984, iter_time=7.62s]
Epoch 0: 26%|██▌ | 3203/12384 [6:47:46<19:26:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 26%|██▌ | 3204/12384 [6:47:46<19:25:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 26%|██▌ | 3204/12384 [6:47:54<19:25:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 26%|██▌ | 3205/12384 [6:47:54<19:26:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 26%|██▌ | 3205/12384 [6:48:01<19:26:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.90s]
Epoch 0: 26%|██▌ | 3206/12384 [6:48:01<19:25:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.90s]
Epoch 0: 26%|██▌ | 3206/12384 [6:48:09<19:25:23, 7.62s/it, loss=0.0001, acc=0.9994, iter_time=8.06s]
Epoch 0: 26%|██▌ | 3207/12384 [6:48:09<19:25:08, 7.62s/it, loss=0.0001, acc=0.9994, iter_time=8.06s]
Epoch 0: 26%|██▌ | 3207/12384 [6:48:17<19:25:08, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=11.29s]
Epoch 0: 26%|██▌ | 3208/12384 [6:48:17<19:24:22, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=11.29s]
Epoch 0: 26%|██▌ | 3208/12384 [6:48:24<19:24:22, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=3.69s]
Epoch 0: 26%|██▌ | 3209/12384 [6:48:24<19:24:18, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=3.69s]
Epoch 0: 26%|██▌ | 3209/12384 [6:48:32<19:24:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.14s]
Epoch 0: 26%|██▌ | 3210/12384 [6:48:32<19:24:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.14s]
Epoch 0: 26%|██▌ | 3210/12384 [6:48:39<19:24:29, 7.62s/it, loss=0.0010, acc=0.9982, iter_time=6.69s]
Epoch 0: 26%|██▌ | 3211/12384 [6:48:39<19:23:42, 7.61s/it, loss=0.0010, acc=0.9982, iter_time=6.69s]
Epoch 0: 26%|██▌ | 3211/12384 [6:48:47<19:23:42, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.52s]
Epoch 0: 26%|██▌ | 3212/12384 [6:48:47<19:23:39, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.52s]
Epoch 0: 26%|██▌ | 3212/12384 [6:48:55<19:23:39, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.61s]
Epoch 0: 26%|██▌ | 3213/12384 [6:48:55<19:24:01, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.61s]
Epoch 0: 26%|██▌ | 3213/12384 [6:49:03<19:24:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 26%|██▌ | 3214/12384 [6:49:03<19:36:08, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 26%|██▌ | 3214/12384 [6:49:10<19:36:08, 7.70s/it, loss=0.0022, acc=0.9946, iter_time=5.79s]
Epoch 0: 26%|██▌ | 3215/12384 [6:49:10<19:31:56, 7.67s/it, loss=0.0022, acc=0.9946, iter_time=5.79s]
Epoch 0: 26%|██▌ | 3215/12384 [6:49:18<19:31:56, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=9.86s]
Epoch 0: 26%|██▌ | 3216/12384 [6:49:18<19:44:48, 7.75s/it, loss=0.0001, acc=1.0000, iter_time=9.86s]
Epoch 0: 26%|██▌ | 3216/12384 [6:49:26<19:44:48, 7.75s/it, loss=0.0005, acc=0.9974, iter_time=6.55s]
Epoch 0: 26%|██▌ | 3217/12384 [6:49:26<19:38:23, 7.71s/it, loss=0.0005, acc=0.9974, iter_time=6.55s]
Epoch 0: 26%|██▌ | 3217/12384 [6:49:33<19:38:23, 7.71s/it, loss=0.0003, acc=0.9974, iter_time=6.78s]
Epoch 0: 26%|██▌ | 3218/12384 [6:49:33<19:32:06, 7.67s/it, loss=0.0003, acc=0.9974, iter_time=6.78s]
Epoch 0: 26%|██▌ | 3218/12384 [6:49:41<19:32:06, 7.67s/it, loss=0.0001, acc=0.9990, iter_time=9.35s]
Epoch 0: 26%|██▌ | 3219/12384 [6:49:41<19:28:22, 7.65s/it, loss=0.0001, acc=0.9990, iter_time=9.35s]
Epoch 0: 26%|██▌ | 3219/12384 [6:49:49<19:28:22, 7.65s/it, loss=0.0002, acc=0.9995, iter_time=7.69s]
Epoch 0: 26%|██▌ | 3220/12384 [6:49:49<19:30:14, 7.66s/it, loss=0.0002, acc=0.9995, iter_time=7.69s]
Epoch 0: 26%|██▌ | 3220/12384 [6:49:56<19:30:14, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=5.08s]
Epoch 0: 26%|██▌ | 3221/12384 [6:49:56<19:26:45, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=5.08s]
Epoch 0: 26%|██▌ | 3221/12384 [6:50:04<19:26:45, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=9.54s]
Epoch 0: 26%|██▌ | 3222/12384 [6:50:04<19:25:03, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.54s]
Epoch 0: 26%|██▌ | 3222/12384 [6:50:11<19:25:03, 7.63s/it, loss=0.0005, acc=0.9957, iter_time=6.97s]
Epoch 0: 26%|██▌ | 3223/12384 [6:50:11<19:22:33, 7.61s/it, loss=0.0005, acc=0.9957, iter_time=6.97s]
Epoch 0: 26%|██▌ | 3223/12384 [6:50:19<19:22:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 0: 26%|██▌ | 3224/12384 [6:50:19<19:21:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 0: 26%|██▌ | 3224/12384 [6:50:27<19:21:43, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=6.28s]
Epoch 0: 26%|██▌ | 3225/12384 [6:50:27<19:21:45, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=6.28s]
Epoch 0: 26%|██▌ | 3225/12384 [6:50:34<19:21:45, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.78s]
Epoch 0: 26%|██▌ | 3226/12384 [6:50:34<19:21:49, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.78s]
Epoch 0: 26%|██▌ | 3226/12384 [6:50:42<19:21:49, 7.61s/it, loss=0.0009, acc=0.9980, iter_time=9.39s]
Epoch 0: 26%|██▌ | 3227/12384 [6:50:42<19:21:51, 7.61s/it, loss=0.0009, acc=0.9980, iter_time=9.39s]
Epoch 0: 26%|██▌ | 3227/12384 [6:50:50<19:21:51, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 26%|██▌ | 3228/12384 [6:50:50<19:23:07, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 26%|██▌ | 3228/12384 [6:50:57<19:23:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 26%|██▌ | 3229/12384 [6:50:57<19:22:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 26%|██▌ | 3229/12384 [6:51:05<19:22:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 0: 26%|██▌ | 3230/12384 [6:51:05<19:25:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 0: 26%|██▌ | 3230/12384 [6:51:12<19:25:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.01s]
Epoch 0: 26%|██▌ | 3231/12384 [6:51:12<19:24:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.01s]
Epoch 0: 26%|██▌ | 3231/12384 [6:51:20<19:24:06, 7.63s/it, loss=0.0006, acc=0.9997, iter_time=10.86s]
Epoch 0: 26%|██▌ | 3232/12384 [6:51:20<19:24:07, 7.63s/it, loss=0.0006, acc=0.9997, iter_time=10.86s]
Epoch 0: 26%|██▌ | 3232/12384 [6:51:28<19:24:07, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=5.79s]
Epoch 0: 26%|██▌ | 3233/12384 [6:51:28<19:23:13, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=5.79s]
Epoch 0: 26%|██▌ | 3233/12384 [6:51:35<19:23:13, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=9.07s]
Epoch 0: 26%|██▌ | 3234/12384 [6:51:35<19:22:51, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=9.07s]
Epoch 0: 26%|██▌ | 3234/12384 [6:51:43<19:22:51, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 26%|██▌ | 3235/12384 [6:51:43<19:21:48, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 26%|██▌ | 3235/12384 [6:51:51<19:21:48, 7.62s/it, loss=0.0003, acc=0.9997, iter_time=7.61s]
Epoch 0: 26%|██▌ | 3236/12384 [6:51:51<19:21:29, 7.62s/it, loss=0.0003, acc=0.9997, iter_time=7.61s]
Epoch 0: 26%|██▌ | 3236/12384 [6:51:58<19:21:29, 7.62s/it, loss=0.0100, acc=0.9850, iter_time=7.62s]
Epoch 0: 26%|██▌ | 3237/12384 [6:51:58<19:21:01, 7.62s/it, loss=0.0100, acc=0.9850, iter_time=7.62s]
Epoch 0: 26%|██▌ | 3237/12384 [6:52:06<19:21:01, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.03s]
Epoch 0: 26%|██▌ | 3238/12384 [6:52:06<19:19:42, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.03s]
Epoch 0: 26%|██▌ | 3238/12384 [6:52:13<19:19:42, 7.61s/it, loss=0.0002, acc=0.9986, iter_time=10.18s]
Epoch 0: 26%|██▌ | 3239/12384 [6:52:13<19:20:51, 7.62s/it, loss=0.0002, acc=0.9986, iter_time=10.18s]
Epoch 0: 26%|██▌ | 3239/12384 [6:52:21<19:20:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 26%|██▌ | 3240/12384 [6:52:21<19:21:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 26%|██▌ | 3240/12384 [6:52:29<19:21:02, 7.62s/it, loss=0.0030, acc=0.9952, iter_time=7.49s]
Epoch 0: 26%|██▌ | 3241/12384 [6:52:29<19:31:24, 7.69s/it, loss=0.0030, acc=0.9952, iter_time=7.49s]
Epoch 0: 26%|██▌ | 3241/12384 [6:52:37<19:31:24, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 0: 26%|██▌ | 3242/12384 [6:52:37<19:43:51, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 0: 26%|██▌ | 3242/12384 [6:52:44<19:43:51, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=10.04s]
Epoch 0: 26%|██▌ | 3243/12384 [6:52:44<19:37:25, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=10.04s]
Epoch 0: 26%|██▌ | 3243/12384 [6:52:52<19:37:25, 7.73s/it, loss=0.0013, acc=0.9969, iter_time=7.65s]
Epoch 0: 26%|██▌ | 3244/12384 [6:52:52<19:33:09, 7.70s/it, loss=0.0013, acc=0.9969, iter_time=7.65s]
Epoch 0: 26%|██▌ | 3244/12384 [6:53:00<19:33:09, 7.70s/it, loss=0.0009, acc=0.9998, iter_time=7.63s]
Epoch 0: 26%|██▌ | 3245/12384 [6:53:00<19:29:13, 7.68s/it, loss=0.0009, acc=0.9998, iter_time=7.63s]
Epoch 0: 26%|██▌ | 3245/12384 [6:53:07<19:29:13, 7.68s/it, loss=0.0007, acc=0.9975, iter_time=7.61s]
Epoch 0: 26%|██▌ | 3246/12384 [6:53:07<19:26:36, 7.66s/it, loss=0.0007, acc=0.9975, iter_time=7.61s]
Epoch 0: 26%|██▌ | 3246/12384 [6:53:15<19:26:36, 7.66s/it, loss=0.0003, acc=0.9994, iter_time=7.64s]
Epoch 0: 26%|██▌ | 3247/12384 [6:53:15<19:24:40, 7.65s/it, loss=0.0003, acc=0.9994, iter_time=7.64s]
Epoch 0: 26%|██▌ | 3247/12384 [6:53:23<19:24:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 26%|██▌ | 3248/12384 [6:53:23<19:22:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 26%|██▌ | 3248/12384 [6:53:30<19:22:55, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=4.52s]
Epoch 0: 26%|██▌ | 3249/12384 [6:53:30<19:20:19, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.52s]
Epoch 0: 26%|██▌ | 3249/12384 [6:53:38<19:20:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 0: 26%|██▌ | 3250/12384 [6:53:38<19:20:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 0: 26%|██▌ | 3250/12384 [6:53:45<19:20:13, 7.62s/it, loss=0.0004, acc=0.9985, iter_time=6.62s]
Epoch 0: 26%|██▋ | 3251/12384 [6:53:45<19:19:44, 7.62s/it, loss=0.0004, acc=0.9985, iter_time=6.62s]
Epoch 0: 26%|██▋ | 3251/12384 [6:53:53<19:19:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 0: 26%|██▋ | 3252/12384 [6:53:53<19:22:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 0: 26%|██▋ | 3252/12384 [6:54:01<19:22:49, 7.64s/it, loss=0.0001, acc=0.9989, iter_time=7.61s]
Epoch 0: 26%|██▋ | 3253/12384 [6:54:01<19:21:37, 7.63s/it, loss=0.0001, acc=0.9989, iter_time=7.61s]
Epoch 0: 26%|██▋ | 3253/12384 [6:54:08<19:21:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 26%|██▋ | 3254/12384 [6:54:08<19:24:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 26%|██▋ | 3254/12384 [6:54:16<19:24:15, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.67s]
Epoch 0: 26%|██▋ | 3255/12384 [6:54:16<19:23:02, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.67s]
Epoch 0: 26%|██▋ | 3255/12384 [6:54:24<19:23:02, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=7.72s]
Epoch 0: 26%|██▋ | 3256/12384 [6:54:24<19:22:03, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=7.72s]
Epoch 0: 26%|██▋ | 3256/12384 [6:54:31<19:22:03, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.54s]
Epoch 0: 26%|██▋ | 3257/12384 [6:54:31<19:21:13, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.54s]
Epoch 0: 26%|██▋ | 3257/12384 [6:54:39<19:21:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 26%|██▋ | 3258/12384 [6:54:39<19:21:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 26%|██▋ | 3258/12384 [6:54:46<19:21:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 26%|██▋ | 3259/12384 [6:54:46<19:19:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 26%|██▋ | 3259/12384 [6:54:54<19:19:49, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 26%|██▋ | 3260/12384 [6:54:54<19:19:00, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 26%|██▋ | 3260/12384 [6:55:02<19:19:00, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.81s]
Epoch 0: 26%|██▋ | 3261/12384 [6:55:02<19:18:48, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.81s]
Epoch 0: 26%|██▋ | 3261/12384 [6:55:09<19:18:48, 7.62s/it, loss=0.0036, acc=0.9926, iter_time=10.42s]
Epoch 0: 26%|██▋ | 3262/12384 [6:55:09<19:18:05, 7.62s/it, loss=0.0036, acc=0.9926, iter_time=10.42s]
Epoch 0: 26%|██▋ | 3262/12384 [6:55:17<19:18:05, 7.62s/it, loss=0.0002, acc=0.9997, iter_time=7.61s]
Epoch 0: 26%|██▋ | 3263/12384 [6:55:17<19:16:50, 7.61s/it, loss=0.0002, acc=0.9997, iter_time=7.61s]
Epoch 0: 26%|██▋ | 3263/12384 [6:55:24<19:16:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 26%|██▋ | 3264/12384 [6:55:24<19:16:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 26%|██▋ | 3264/12384 [6:55:32<19:16:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 0: 26%|██▋ | 3265/12384 [6:55:32<19:16:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 0: 26%|██▋ | 3265/12384 [6:55:40<19:16:39, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=8.19s]
Epoch 0: 26%|██▋ | 3266/12384 [6:55:40<19:16:34, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=8.19s]
Epoch 0: 26%|██▋ | 3266/12384 [6:55:48<19:16:34, 7.61s/it, loss=0.0006, acc=1.0000, iter_time=7.89s]
Epoch 0: 26%|██▋ | 3267/12384 [6:55:48<19:28:23, 7.69s/it, loss=0.0006, acc=1.0000, iter_time=7.89s]
Epoch 0: 26%|██▋ | 3267/12384 [6:55:55<19:28:23, 7.69s/it, loss=0.0010, acc=0.9976, iter_time=7.61s]
Epoch 0: 26%|██▋ | 3268/12384 [6:55:55<19:26:45, 7.68s/it, loss=0.0010, acc=0.9976, iter_time=7.61s]
Epoch 0: 26%|██▋ | 3268/12384 [6:56:03<19:26:45, 7.68s/it, loss=0.0002, acc=0.9997, iter_time=7.71s]
Epoch 0: 26%|██▋ | 3269/12384 [6:56:03<19:37:09, 7.75s/it, loss=0.0002, acc=0.9997, iter_time=7.71s]
Epoch 0: 26%|██▋ | 3269/12384 [6:56:11<19:37:09, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 0: 26%|██▋ | 3270/12384 [6:56:11<19:30:19, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 0: 26%|██▋ | 3270/12384 [6:56:18<19:30:19, 7.70s/it, loss=0.0001, acc=0.9996, iter_time=7.59s]
Epoch 0: 26%|██▋ | 3271/12384 [6:56:18<19:24:51, 7.67s/it, loss=0.0001, acc=0.9996, iter_time=7.59s]
Epoch 0: 26%|██▋ | 3271/12384 [6:56:26<19:24:51, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.57s]
Epoch 0: 26%|██▋ | 3272/12384 [6:56:26<19:22:52, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.57s]
Epoch 0: 26%|██▋ | 3272/12384 [6:56:34<19:22:52, 7.66s/it, loss=0.0001, acc=0.9996, iter_time=7.66s]
Epoch 0: 26%|██▋ | 3273/12384 [6:56:34<19:20:47, 7.64s/it, loss=0.0001, acc=0.9996, iter_time=7.66s]
Epoch 0: 26%|██▋ | 3273/12384 [6:56:41<19:20:47, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 26%|██▋ | 3274/12384 [6:56:41<19:19:03, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 26%|██▋ | 3274/12384 [6:56:49<19:19:03, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 26%|██▋ | 3275/12384 [6:56:49<19:17:12, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 26%|██▋ | 3275/12384 [6:56:56<19:17:12, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 26%|██▋ | 3276/12384 [6:56:56<19:16:01, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 26%|██▋ | 3276/12384 [6:57:04<19:16:01, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.28s]
Epoch 0: 26%|██▋ | 3277/12384 [6:57:04<19:15:53, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.28s]
Epoch 0: 26%|██▋ | 3277/12384 [6:57:12<19:15:53, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.94s]
Epoch 0: 26%|██▋ | 3278/12384 [6:57:12<19:14:53, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.94s]
Epoch 0: 26%|██▋ | 3278/12384 [6:57:19<19:14:53, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=4.30s]
Epoch 0: 26%|██▋ | 3279/12384 [6:57:19<19:14:05, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=4.30s]
Epoch 0: 26%|██▋ | 3279/12384 [6:57:27<19:14:05, 7.61s/it, loss=0.0003, acc=0.9998, iter_time=11.27s]
Epoch 0: 26%|██▋ | 3280/12384 [6:57:27<19:14:25, 7.61s/it, loss=0.0003, acc=0.9998, iter_time=11.27s]
Epoch 0: 26%|██▋ | 3280/12384 [6:57:34<19:14:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.93s]
Epoch 0: 26%|██▋ | 3281/12384 [6:57:34<19:13:23, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.93s]
Epoch 0: 26%|██▋ | 3281/12384 [6:57:42<19:13:23, 7.60s/it, loss=0.0004, acc=1.0000, iter_time=7.89s]
Epoch 0: 27%|██▋ | 3282/12384 [6:57:42<19:14:53, 7.61s/it, loss=0.0004, acc=1.0000, iter_time=7.89s]
Epoch 0: 27%|██▋ | 3282/12384 [6:57:50<19:14:53, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=7.65s]
Epoch 0: 27%|██▋ | 3283/12384 [6:57:50<19:14:22, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=7.65s]
Epoch 0: 27%|██▋ | 3283/12384 [6:57:57<19:14:22, 7.61s/it, loss=0.0002, acc=0.9986, iter_time=7.59s]
Epoch 0: 27%|██▋ | 3284/12384 [6:57:57<19:14:48, 7.61s/it, loss=0.0002, acc=0.9986, iter_time=7.59s]
Epoch 0: 27%|██▋ | 3284/12384 [6:58:05<19:14:48, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 27%|██▋ | 3285/12384 [6:58:05<19:13:52, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 27%|██▋ | 3285/12384 [6:58:12<19:13:52, 7.61s/it, loss=0.0004, acc=0.9987, iter_time=7.60s]
Epoch 0: 27%|██▋ | 3286/12384 [6:58:12<19:13:58, 7.61s/it, loss=0.0004, acc=0.9987, iter_time=7.60s]
Epoch 0: 27%|██▋ | 3286/12384 [6:58:20<19:13:58, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.42s]
Epoch 0: 27%|██▋ | 3287/12384 [6:58:20<19:12:46, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=6.42s]
Epoch 0: 27%|██▋ | 3287/12384 [6:58:28<19:12:46, 7.60s/it, loss=0.0015, acc=0.9977, iter_time=9.15s]
Epoch 0: 27%|██▋ | 3288/12384 [6:58:28<19:13:08, 7.61s/it, loss=0.0015, acc=0.9977, iter_time=9.15s]
Epoch 0: 27%|██▋ | 3288/12384 [6:58:35<19:13:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 27%|██▋ | 3289/12384 [6:58:35<19:12:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 27%|██▋ | 3289/12384 [6:58:43<19:12:55, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 27%|██▋ | 3290/12384 [6:58:43<19:12:16, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 27%|██▋ | 3290/12384 [6:58:50<19:12:16, 7.60s/it, loss=0.0010, acc=0.9970, iter_time=7.59s]
Epoch 0: 27%|██▋ | 3291/12384 [6:58:50<19:11:59, 7.60s/it, loss=0.0010, acc=0.9970, iter_time=7.59s]
Epoch 0: 27%|██▋ | 3291/12384 [6:58:58<19:11:59, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 27%|██▋ | 3292/12384 [6:58:58<19:17:03, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 27%|██▋ | 3292/12384 [6:59:06<19:17:03, 7.64s/it, loss=0.0003, acc=0.9990, iter_time=5.64s]
Epoch 0: 27%|██▋ | 3293/12384 [6:59:06<19:16:03, 7.63s/it, loss=0.0003, acc=0.9990, iter_time=5.64s]
Epoch 0: 27%|██▋ | 3293/12384 [6:59:13<19:16:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 0: 27%|██▋ | 3294/12384 [6:59:13<19:15:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 0: 27%|██▋ | 3294/12384 [6:59:21<19:15:20, 7.63s/it, loss=0.0005, acc=0.9976, iter_time=9.47s]
Epoch 0: 27%|██▋ | 3295/12384 [6:59:21<19:29:26, 7.72s/it, loss=0.0005, acc=0.9976, iter_time=9.47s]
Epoch 0: 27%|██▋ | 3295/12384 [6:59:29<19:29:26, 7.72s/it, loss=0.0009, acc=0.9978, iter_time=8.27s]
Epoch 0: 27%|██▋ | 3296/12384 [6:59:29<19:24:27, 7.69s/it, loss=0.0009, acc=0.9978, iter_time=8.27s]
Epoch 0: 27%|██▋ | 3296/12384 [6:59:37<19:24:27, 7.69s/it, loss=0.0008, acc=0.9969, iter_time=4.09s]
Epoch 0: 27%|██▋ | 3297/12384 [6:59:37<19:21:44, 7.67s/it, loss=0.0008, acc=0.9969, iter_time=4.09s]
Epoch 0: 27%|██▋ | 3297/12384 [6:59:44<19:21:44, 7.67s/it, loss=0.0001, acc=0.9995, iter_time=10.79s]
Epoch 0: 27%|██▋ | 3298/12384 [6:59:44<19:19:19, 7.66s/it, loss=0.0001, acc=0.9995, iter_time=10.79s]
Epoch 0: 27%|██▋ | 3298/12384 [6:59:52<19:19:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 27%|██▋ | 3299/12384 [6:59:52<19:16:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 27%|██▋ | 3299/12384 [6:59:59<19:16:48, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=8.03s]
Epoch 0: 27%|██▋ | 3300/12384 [6:59:59<19:16:25, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=8.03s]
Epoch 0: 27%|██▋ | 3300/12384 [7:00:07<19:16:25, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 0: 27%|██▋ | 3301/12384 [7:00:07<19:14:32, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 0: 27%|██▋ | 3301/12384 [7:00:15<19:14:32, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 27%|██▋ | 3302/12384 [7:00:15<19:14:09, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 27%|██▋ | 3302/12384 [7:00:22<19:14:09, 7.62s/it, loss=0.0015, acc=0.9976, iter_time=4.77s]
Epoch 0: 27%|██▋ | 3303/12384 [7:00:22<19:13:17, 7.62s/it, loss=0.0015, acc=0.9976, iter_time=4.77s]
Epoch 0: 27%|██▋ | 3303/12384 [7:00:30<19:13:17, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=10.84s]
Epoch 0: 27%|██▋ | 3304/12384 [7:00:30<19:13:50, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=10.84s]
Epoch 0: 27%|██▋ | 3304/12384 [7:00:38<19:13:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 0: 27%|██▋ | 3305/12384 [7:00:38<19:14:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 0: 27%|██▋ | 3305/12384 [7:00:45<19:14:47, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 27%|██▋ | 3306/12384 [7:00:45<19:13:24, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 27%|██▋ | 3306/12384 [7:00:53<19:13:24, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.64s]
Epoch 0: 27%|██▋ | 3307/12384 [7:00:53<19:13:19, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.64s]
Epoch 0: 27%|██▋ | 3307/12384 [7:01:00<19:13:19, 7.62s/it, loss=0.0004, acc=0.9984, iter_time=7.62s]
Epoch 0: 27%|██▋ | 3308/12384 [7:01:00<19:12:05, 7.62s/it, loss=0.0004, acc=0.9984, iter_time=7.62s]
Epoch 0: 27%|██▋ | 3308/12384 [7:01:08<19:12:05, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 27%|██▋ | 3309/12384 [7:01:08<19:12:05, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 27%|██▋ | 3309/12384 [7:01:16<19:12:05, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.35s]
Epoch 0: 27%|██▋ | 3310/12384 [7:01:16<19:10:49, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.35s]
Epoch 0: 27%|██▋ | 3310/12384 [7:01:23<19:10:49, 7.61s/it, loss=0.0002, acc=0.9998, iter_time=8.91s]
Epoch 0: 27%|██▋ | 3311/12384 [7:01:23<19:11:39, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=8.91s]
Epoch 0: 27%|██▋ | 3311/12384 [7:01:31<19:11:39, 7.62s/it, loss=0.0005, acc=0.9982, iter_time=8.96s]
Epoch 0: 27%|██▋ | 3312/12384 [7:01:31<19:11:18, 7.61s/it, loss=0.0005, acc=0.9982, iter_time=8.96s]
Epoch 0: 27%|██▋ | 3312/12384 [7:01:38<19:11:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.92s]
Epoch 0: 27%|██▋ | 3313/12384 [7:01:38<19:10:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.92s]
Epoch 0: 27%|██▋ | 3313/12384 [7:01:46<19:10:28, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.95s]
Epoch 0: 27%|██▋ | 3314/12384 [7:01:46<19:10:42, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.95s]
Epoch 0: 27%|██▋ | 3314/12384 [7:01:54<19:10:42, 7.61s/it, loss=0.0021, acc=0.9973, iter_time=5.95s]
Epoch 0: 27%|██▋ | 3315/12384 [7:01:54<19:09:52, 7.61s/it, loss=0.0021, acc=0.9973, iter_time=5.95s]
Epoch 0: 27%|██▋ | 3315/12384 [7:02:01<19:09:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 0: 27%|██▋ | 3316/12384 [7:02:01<19:10:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 0: 27%|██▋ | 3316/12384 [7:02:09<19:10:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.53s]
Epoch 0: 27%|██▋ | 3317/12384 [7:02:09<19:11:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.53s]
Epoch 0: 27%|██▋ | 3317/12384 [7:02:17<19:11:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 27%|██▋ | 3318/12384 [7:02:17<19:10:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 27%|██▋ | 3318/12384 [7:02:24<19:10:19, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.89s]
Epoch 0: 27%|██▋ | 3319/12384 [7:02:24<19:22:48, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.89s]
Epoch 0: 27%|██▋ | 3319/12384 [7:02:32<19:22:48, 7.70s/it, loss=0.0002, acc=1.0000, iter_time=7.99s]
Epoch 0: 27%|██▋ | 3320/12384 [7:02:32<19:19:32, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=7.99s]
Epoch 0: 27%|██▋ | 3320/12384 [7:02:40<19:19:32, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=7.26s]
Epoch 0: 27%|██▋ | 3321/12384 [7:02:40<19:30:40, 7.75s/it, loss=0.0002, acc=1.0000, iter_time=7.26s]
Epoch 0: 27%|██▋ | 3321/12384 [7:02:48<19:30:40, 7.75s/it, loss=0.0031, acc=0.9980, iter_time=7.89s]
Epoch 0: 27%|██▋ | 3322/12384 [7:02:48<19:24:50, 7.71s/it, loss=0.0031, acc=0.9980, iter_time=7.89s]
Epoch 0: 27%|██▋ | 3322/12384 [7:02:55<19:24:50, 7.71s/it, loss=0.0006, acc=1.0000, iter_time=7.64s]
Epoch 0: 27%|██▋ | 3323/12384 [7:02:55<19:21:29, 7.69s/it, loss=0.0006, acc=1.0000, iter_time=7.64s]
Epoch 0: 27%|██▋ | 3323/12384 [7:03:03<19:21:29, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 27%|██▋ | 3324/12384 [7:03:03<19:18:01, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 27%|██▋ | 3324/12384 [7:03:10<19:18:01, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=7.30s]
Epoch 0: 27%|██▋ | 3325/12384 [7:03:10<19:16:04, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.30s]
Epoch 0: 27%|██▋ | 3325/12384 [7:03:18<19:16:04, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.95s]
Epoch 0: 27%|██▋ | 3326/12384 [7:03:18<19:15:53, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.95s]
Epoch 0: 27%|██▋ | 3326/12384 [7:03:26<19:15:53, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 27%|██▋ | 3327/12384 [7:03:26<19:12:49, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 27%|██▋ | 3327/12384 [7:03:33<19:12:49, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 0: 27%|██▋ | 3328/12384 [7:03:33<19:14:39, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 0: 27%|██▋ | 3328/12384 [7:03:41<19:14:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 0: 27%|██▋ | 3329/12384 [7:03:41<19:12:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 0: 27%|██▋ | 3329/12384 [7:03:49<19:12:47, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=7.31s]
Epoch 0: 27%|██▋ | 3330/12384 [7:03:49<19:11:30, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=7.31s]
Epoch 0: 27%|██▋ | 3330/12384 [7:03:56<19:11:30, 7.63s/it, loss=0.0005, acc=0.9991, iter_time=7.90s]
Epoch 0: 27%|██▋ | 3331/12384 [7:03:56<19:09:52, 7.62s/it, loss=0.0005, acc=0.9991, iter_time=7.90s]
Epoch 0: 27%|██▋ | 3331/12384 [7:04:04<19:09:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 0: 27%|██▋ | 3332/12384 [7:04:04<19:10:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 0: 27%|██▋ | 3332/12384 [7:04:11<19:10:19, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.97s]
Epoch 0: 27%|██▋ | 3333/12384 [7:04:11<19:09:48, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.97s]
Epoch 0: 27%|██▋ | 3333/12384 [7:04:19<19:09:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 27%|██▋ | 3334/12384 [7:04:19<19:09:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 27%|██▋ | 3334/12384 [7:04:27<19:09:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 27%|██▋ | 3335/12384 [7:04:27<19:08:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 27%|██▋ | 3335/12384 [7:04:34<19:08:46, 7.62s/it, loss=0.0007, acc=0.9979, iter_time=8.03s]
Epoch 0: 27%|██▋ | 3336/12384 [7:04:34<19:08:50, 7.62s/it, loss=0.0007, acc=0.9979, iter_time=8.03s]
Epoch 0: 27%|██▋ | 3336/12384 [7:04:42<19:08:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.67s]
Epoch 0: 27%|██▋ | 3337/12384 [7:04:42<19:08:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.67s]
Epoch 0: 27%|██▋ | 3337/12384 [7:04:50<19:08:34, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.16s]
Epoch 0: 27%|██▋ | 3338/12384 [7:04:50<19:08:31, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.16s]
Epoch 0: 27%|██▋ | 3338/12384 [7:04:57<19:08:31, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=6.74s]
Epoch 0: 27%|██▋ | 3339/12384 [7:04:57<19:06:44, 7.61s/it, loss=0.0002, acc=0.9998, iter_time=6.74s]
Epoch 0: 27%|██▋ | 3339/12384 [7:05:05<19:06:44, 7.61s/it, loss=0.0002, acc=0.9979, iter_time=8.46s]
Epoch 0: 27%|██▋ | 3340/12384 [7:05:05<19:06:22, 7.61s/it, loss=0.0002, acc=0.9979, iter_time=8.46s]
Epoch 0: 27%|██▋ | 3340/12384 [7:05:12<19:06:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 27%|██▋ | 3341/12384 [7:05:12<19:07:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 27%|██▋ | 3341/12384 [7:05:20<19:07:39, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 27%|██▋ | 3342/12384 [7:05:20<19:06:59, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 27%|██▋ | 3342/12384 [7:05:28<19:06:59, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 27%|██▋ | 3343/12384 [7:05:28<19:07:28, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 27%|██▋ | 3343/12384 [7:05:35<19:07:28, 7.62s/it, loss=0.0002, acc=0.9988, iter_time=8.01s]
Epoch 0: 27%|██▋ | 3344/12384 [7:05:35<19:07:06, 7.61s/it, loss=0.0002, acc=0.9988, iter_time=8.01s]
Epoch 0: 27%|██▋ | 3344/12384 [7:05:43<19:07:06, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=6.91s]
Epoch 0: 27%|██▋ | 3345/12384 [7:05:43<19:07:07, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=6.91s]
Epoch 0: 27%|██▋ | 3345/12384 [7:05:50<19:07:07, 7.61s/it, loss=0.0001, acc=0.9994, iter_time=5.36s]
Epoch 0: 27%|██▋ | 3346/12384 [7:05:50<19:06:21, 7.61s/it, loss=0.0001, acc=0.9994, iter_time=5.36s]
Epoch 0: 27%|██▋ | 3346/12384 [7:05:58<19:06:21, 7.61s/it, loss=0.0022, acc=0.9937, iter_time=9.96s]
Epoch 0: 27%|██▋ | 3347/12384 [7:05:58<19:21:22, 7.71s/it, loss=0.0022, acc=0.9937, iter_time=9.96s]
Epoch 0: 27%|██▋ | 3347/12384 [7:06:06<19:21:22, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 0: 27%|██▋ | 3348/12384 [7:06:06<19:17:19, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 0: 27%|██▋ | 3348/12384 [7:06:14<19:17:19, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 0: 27%|██▋ | 3349/12384 [7:06:14<19:13:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 0: 27%|██▋ | 3349/12384 [7:06:21<19:13:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.36s]
Epoch 0: 27%|██▋ | 3350/12384 [7:06:21<19:11:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.36s]
Epoch 0: 27%|██▋ | 3350/12384 [7:06:29<19:11:16, 7.65s/it, loss=0.0003, acc=0.9988, iter_time=6.90s]
Epoch 0: 27%|██▋ | 3351/12384 [7:06:29<19:08:29, 7.63s/it, loss=0.0003, acc=0.9988, iter_time=6.90s]
Epoch 0: 27%|██▋ | 3351/12384 [7:06:36<19:08:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 0: 27%|██▋ | 3352/12384 [7:06:36<19:06:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 0: 27%|██▋ | 3352/12384 [7:06:44<19:06:58, 7.62s/it, loss=0.0003, acc=0.9989, iter_time=7.65s]
Epoch 0: 27%|██▋ | 3353/12384 [7:06:44<19:06:15, 7.62s/it, loss=0.0003, acc=0.9989, iter_time=7.65s]
Epoch 0: 27%|██▋ | 3353/12384 [7:06:52<19:06:15, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 27%|██▋ | 3354/12384 [7:06:52<19:04:58, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 27%|██▋ | 3354/12384 [7:06:59<19:04:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 27%|██▋ | 3355/12384 [7:06:59<19:05:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 27%|██▋ | 3355/12384 [7:07:07<19:05:23, 7.61s/it, loss=0.0003, acc=0.9985, iter_time=7.62s]
Epoch 0: 27%|██▋ | 3356/12384 [7:07:07<19:04:35, 7.61s/it, loss=0.0003, acc=0.9985, iter_time=7.62s]
Epoch 0: 27%|██▋ | 3356/12384 [7:07:14<19:04:35, 7.61s/it, loss=0.0003, acc=0.9987, iter_time=7.34s]
Epoch 0: 27%|██▋ | 3357/12384 [7:07:14<19:03:32, 7.60s/it, loss=0.0003, acc=0.9987, iter_time=7.34s]
Epoch 0: 27%|██▋ | 3357/12384 [7:07:22<19:03:32, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.86s]
Epoch 0: 27%|██▋ | 3358/12384 [7:07:22<19:04:01, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.86s]
Epoch 0: 27%|██▋ | 3358/12384 [7:07:30<19:04:01, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 27%|██▋ | 3359/12384 [7:07:30<19:04:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 27%|██▋ | 3359/12384 [7:07:37<19:04:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 27%|██▋ | 3360/12384 [7:07:37<19:04:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 27%|██▋ | 3360/12384 [7:07:45<19:04:09, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=7.65s]
Epoch 0: 27%|██▋ | 3361/12384 [7:07:45<19:03:34, 7.60s/it, loss=0.0003, acc=1.0000, iter_time=7.65s]
Epoch 0: 27%|██▋ | 3361/12384 [7:07:52<19:03:34, 7.60s/it, loss=0.0010, acc=0.9980, iter_time=7.61s]
Epoch 0: 27%|██▋ | 3362/12384 [7:07:52<19:03:27, 7.60s/it, loss=0.0010, acc=0.9980, iter_time=7.61s]
Epoch 0: 27%|██▋ | 3362/12384 [7:08:00<19:03:27, 7.60s/it, loss=0.0009, acc=0.9979, iter_time=5.55s]
Epoch 0: 27%|██▋ | 3363/12384 [7:08:00<19:03:08, 7.60s/it, loss=0.0009, acc=0.9979, iter_time=5.55s]
Epoch 0: 27%|██▋ | 3363/12384 [7:08:08<19:03:08, 7.60s/it, loss=0.0002, acc=0.9999, iter_time=9.64s]
Epoch 0: 27%|██▋ | 3364/12384 [7:08:08<19:03:29, 7.61s/it, loss=0.0002, acc=0.9999, iter_time=9.64s]
Epoch 0: 27%|██▋ | 3364/12384 [7:08:15<19:03:29, 7.61s/it, loss=0.0025, acc=0.9925, iter_time=5.08s]
Epoch 0: 27%|██▋ | 3365/12384 [7:08:15<19:03:22, 7.61s/it, loss=0.0025, acc=0.9925, iter_time=5.08s]
Epoch 0: 27%|██▋ | 3365/12384 [7:08:23<19:03:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 0: 27%|██▋ | 3366/12384 [7:08:23<19:03:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 0: 27%|██▋ | 3366/12384 [7:08:31<19:03:46, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.61s]
Epoch 0: 27%|██▋ | 3367/12384 [7:08:31<19:04:04, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.61s]
Epoch 0: 27%|██▋ | 3367/12384 [7:08:38<19:04:04, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 27%|██▋ | 3368/12384 [7:08:38<19:04:55, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 27%|██▋ | 3368/12384 [7:08:46<19:04:55, 7.62s/it, loss=0.0011, acc=0.9981, iter_time=7.41s]
Epoch 0: 27%|██▋ | 3369/12384 [7:08:46<19:05:14, 7.62s/it, loss=0.0011, acc=0.9981, iter_time=7.41s]
Epoch 0: 27%|██▋ | 3369/12384 [7:08:53<19:05:14, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.75s]
Epoch 0: 27%|██▋ | 3370/12384 [7:08:53<19:04:51, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.75s]
Epoch 0: 27%|██▋ | 3370/12384 [7:09:01<19:04:51, 7.62s/it, loss=0.0007, acc=0.9978, iter_time=11.04s]
Epoch 0: 27%|██▋ | 3371/12384 [7:09:01<19:17:08, 7.70s/it, loss=0.0007, acc=0.9978, iter_time=11.04s]
Epoch 0: 27%|██▋ | 3371/12384 [7:09:09<19:17:08, 7.70s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 27%|██▋ | 3372/12384 [7:09:09<19:12:16, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 27%|██▋ | 3372/12384 [7:09:17<19:12:16, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.03s]
Epoch 0: 27%|██▋ | 3373/12384 [7:09:17<19:25:31, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=4.03s]
Epoch 0: 27%|██▋ | 3373/12384 [7:09:24<19:25:31, 7.76s/it, loss=0.0005, acc=0.9972, iter_time=11.52s]
Epoch 0: 27%|██▋ | 3374/12384 [7:09:24<19:17:38, 7.71s/it, loss=0.0005, acc=0.9972, iter_time=11.52s]
Epoch 0: 27%|██▋ | 3374/12384 [7:09:32<19:17:38, 7.71s/it, loss=0.0002, acc=0.9994, iter_time=7.60s]
Epoch 0: 27%|██▋ | 3375/12384 [7:09:32<19:13:04, 7.68s/it, loss=0.0002, acc=0.9994, iter_time=7.60s]
Epoch 0: 27%|██▋ | 3375/12384 [7:09:40<19:13:04, 7.68s/it, loss=0.0096, acc=0.9879, iter_time=7.56s]
Epoch 0: 27%|██▋ | 3376/12384 [7:09:40<19:09:08, 7.65s/it, loss=0.0096, acc=0.9879, iter_time=7.56s]
Epoch 0: 27%|██▋ | 3376/12384 [7:09:47<19:09:08, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 27%|██▋ | 3377/12384 [7:09:47<19:07:44, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 27%|██▋ | 3377/12384 [7:09:55<19:07:44, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=6.10s]
Epoch 0: 27%|██▋ | 3378/12384 [7:09:55<19:04:24, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=6.10s]
Epoch 0: 27%|██▋ | 3378/12384 [7:10:02<19:04:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 0: 27%|██▋ | 3379/12384 [7:10:02<19:02:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 0: 27%|██▋ | 3379/12384 [7:10:10<19:02:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 27%|██▋ | 3380/12384 [7:10:10<19:06:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 27%|██▋ | 3380/12384 [7:10:18<19:06:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 27%|██▋ | 3381/12384 [7:10:18<19:04:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 27%|██▋ | 3381/12384 [7:10:25<19:04:09, 7.63s/it, loss=0.0004, acc=0.9978, iter_time=7.58s]
Epoch 0: 27%|██▋ | 3382/12384 [7:10:25<19:03:14, 7.62s/it, loss=0.0004, acc=0.9978, iter_time=7.58s]
Epoch 0: 27%|██▋ | 3382/12384 [7:10:33<19:03:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 27%|██▋ | 3383/12384 [7:10:33<19:02:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 27%|██▋ | 3383/12384 [7:10:41<19:02:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 27%|██▋ | 3384/12384 [7:10:41<19:02:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 27%|██▋ | 3384/12384 [7:10:48<19:02:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 0: 27%|██▋ | 3385/12384 [7:10:48<19:05:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 0: 27%|██▋ | 3385/12384 [7:10:56<19:05:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 27%|██▋ | 3386/12384 [7:10:56<19:04:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 27%|██▋ | 3386/12384 [7:11:03<19:04:31, 7.63s/it, loss=0.0006, acc=0.9997, iter_time=6.69s]
Epoch 0: 27%|██▋ | 3387/12384 [7:11:03<19:04:16, 7.63s/it, loss=0.0006, acc=0.9997, iter_time=6.69s]
Epoch 0: 27%|██▋ | 3387/12384 [7:11:11<19:04:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 0: 27%|██▋ | 3388/12384 [7:11:11<19:03:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 0: 27%|██▋ | 3388/12384 [7:11:19<19:03:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 27%|██▋ | 3389/12384 [7:11:19<19:01:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 27%|██▋ | 3389/12384 [7:11:26<19:01:33, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.28s]
Epoch 0: 27%|██▋ | 3390/12384 [7:11:26<19:01:05, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.28s]
Epoch 0: 27%|██▋ | 3390/12384 [7:11:34<19:01:05, 7.61s/it, loss=0.0020, acc=0.9965, iter_time=9.93s]
Epoch 0: 27%|██▋ | 3391/12384 [7:11:34<19:01:00, 7.61s/it, loss=0.0020, acc=0.9965, iter_time=9.93s]
Epoch 0: 27%|██▋ | 3391/12384 [7:11:42<19:01:00, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.58s]
Epoch 0: 27%|██▋ | 3392/12384 [7:11:42<19:01:50, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.58s]
Epoch 0: 27%|██▋ | 3392/12384 [7:11:49<19:01:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 27%|██▋ | 3393/12384 [7:11:49<18:59:14, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 27%|██▋ | 3393/12384 [7:11:57<18:59:14, 7.60s/it, loss=0.0005, acc=0.9995, iter_time=7.61s]
Epoch 0: 27%|██▋ | 3394/12384 [7:11:57<18:59:54, 7.61s/it, loss=0.0005, acc=0.9995, iter_time=7.61s]
Epoch 0: 27%|██▋ | 3394/12384 [7:12:04<18:59:54, 7.61s/it, loss=0.0002, acc=0.9998, iter_time=7.62s]
Epoch 0: 27%|██▋ | 3395/12384 [7:12:04<19:02:32, 7.63s/it, loss=0.0002, acc=0.9998, iter_time=7.62s]
Epoch 0: 27%|██▋ | 3395/12384 [7:12:12<19:02:32, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.36s]
Epoch 0: 27%|██▋ | 3396/12384 [7:12:12<19:00:40, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.36s]
Epoch 0: 27%|██▋ | 3396/12384 [7:12:20<19:00:40, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.89s]
Epoch 0: 27%|██▋ | 3397/12384 [7:12:20<19:00:03, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.89s]
Epoch 0: 27%|██▋ | 3397/12384 [7:12:27<19:00:03, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=6.96s]
Epoch 0: 27%|██▋ | 3398/12384 [7:12:27<19:00:25, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=6.96s]
Epoch 0: 27%|██▋ | 3398/12384 [7:12:35<19:00:25, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.26s]
Epoch 0: 27%|██▋ | 3399/12384 [7:12:35<18:59:16, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.26s]
Epoch 0: 27%|██▋ | 3399/12384 [7:12:43<18:59:16, 7.61s/it, loss=0.0005, acc=1.0000, iter_time=8.34s]
Epoch 0: 27%|██▋ | 3400/12384 [7:12:43<19:14:14, 7.71s/it, loss=0.0005, acc=1.0000, iter_time=8.34s]
Epoch 0: 27%|██▋ | 3400/12384 [7:12:50<19:14:14, 7.71s/it, loss=0.0002, acc=0.9999, iter_time=7.20s]
Epoch 0: 27%|██▋ | 3401/12384 [7:12:50<19:09:53, 7.68s/it, loss=0.0002, acc=0.9999, iter_time=7.20s]
Epoch 0: 27%|██▋ | 3401/12384 [7:12:58<19:09:53, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.63s]
Epoch 0: 27%|██▋ | 3402/12384 [7:12:58<19:05:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.63s]
Epoch 0: 27%|██▋ | 3402/12384 [7:13:06<19:05:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.57s]
Epoch 0: 27%|██▋ | 3403/12384 [7:13:06<19:03:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.57s]
Epoch 0: 27%|██▋ | 3403/12384 [7:13:13<19:03:33, 7.64s/it, loss=0.0001, acc=0.9999, iter_time=7.61s]
Epoch 0: 27%|██▋ | 3404/12384 [7:13:13<19:01:35, 7.63s/it, loss=0.0001, acc=0.9999, iter_time=7.61s]
Epoch 0: 27%|██▋ | 3404/12384 [7:13:21<19:01:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 27%|██▋ | 3405/12384 [7:13:21<19:00:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 27%|██▋ | 3405/12384 [7:13:28<19:00:10, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 28%|██▊ | 3406/12384 [7:13:28<19:00:13, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 28%|██▊ | 3406/12384 [7:13:36<19:00:13, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 28%|██▊ | 3407/12384 [7:13:36<19:02:17, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 28%|██▊ | 3407/12384 [7:13:44<19:02:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 28%|██▊ | 3408/12384 [7:13:44<19:02:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 28%|██▊ | 3408/12384 [7:13:51<19:02:27, 7.64s/it, loss=0.0005, acc=0.9984, iter_time=7.67s]
Epoch 0: 28%|██▊ | 3409/12384 [7:13:51<19:01:32, 7.63s/it, loss=0.0005, acc=0.9984, iter_time=7.67s]
Epoch 0: 28%|██▊ | 3409/12384 [7:13:59<19:01:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.33s]
Epoch 0: 28%|██▊ | 3410/12384 [7:13:59<18:59:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.33s]
Epoch 0: 28%|██▊ | 3410/12384 [7:14:07<18:59:22, 7.62s/it, loss=0.0001, acc=0.9997, iter_time=10.92s]
Epoch 0: 28%|██▊ | 3411/12384 [7:14:07<19:00:44, 7.63s/it, loss=0.0001, acc=0.9997, iter_time=10.92s]
Epoch 0: 28%|██▊ | 3411/12384 [7:14:14<19:00:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 28%|██▊ | 3412/12384 [7:14:14<18:59:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 28%|██▊ | 3412/12384 [7:14:22<18:59:29, 7.62s/it, loss=0.0026, acc=0.9968, iter_time=7.61s]
Epoch 0: 28%|██▊ | 3413/12384 [7:14:22<18:59:27, 7.62s/it, loss=0.0026, acc=0.9968, iter_time=7.61s]
Epoch 0: 28%|██▊ | 3413/12384 [7:14:29<18:59:27, 7.62s/it, loss=0.0007, acc=0.9973, iter_time=4.80s]
Epoch 0: 28%|██▊ | 3414/12384 [7:14:29<19:01:32, 7.64s/it, loss=0.0007, acc=0.9973, iter_time=4.80s]
Epoch 0: 28%|██▊ | 3414/12384 [7:14:37<19:01:32, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=10.48s]
Epoch 0: 28%|██▊ | 3415/12384 [7:14:37<19:00:56, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=10.48s]
Epoch 0: 28%|██▊ | 3415/12384 [7:14:45<19:00:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 28%|██▊ | 3416/12384 [7:14:45<18:59:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 28%|██▊ | 3416/12384 [7:14:52<18:59:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 28%|██▊ | 3417/12384 [7:14:52<18:58:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 28%|██▊ | 3417/12384 [7:15:00<18:58:27, 7.62s/it, loss=0.0003, acc=0.9991, iter_time=7.61s]
Epoch 0: 28%|██▊ | 3418/12384 [7:15:00<18:58:13, 7.62s/it, loss=0.0003, acc=0.9991, iter_time=7.61s]
Epoch 0: 28%|██▊ | 3418/12384 [7:15:07<18:58:13, 7.62s/it, loss=0.0001, acc=0.9990, iter_time=6.76s]
Epoch 0: 28%|██▊ | 3419/12384 [7:15:07<18:57:02, 7.61s/it, loss=0.0001, acc=0.9990, iter_time=6.76s]
Epoch 0: 28%|██▊ | 3419/12384 [7:15:15<18:57:02, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.47s]
Epoch 0: 28%|██▊ | 3420/12384 [7:15:15<18:58:11, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.47s]
Epoch 0: 28%|██▊ | 3420/12384 [7:15:23<18:58:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 28%|██▊ | 3421/12384 [7:15:23<18:59:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 28%|██▊ | 3421/12384 [7:15:30<18:59:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 0: 28%|██▊ | 3422/12384 [7:15:30<18:58:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 0: 28%|██▊ | 3422/12384 [7:15:38<18:58:01, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.94s]
Epoch 0: 28%|██▊ | 3423/12384 [7:15:38<18:57:58, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.94s]
Epoch 0: 28%|██▊ | 3423/12384 [7:15:46<18:57:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 0: 28%|██▊ | 3424/12384 [7:15:46<18:58:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 0: 28%|██▊ | 3424/12384 [7:15:53<18:58:01, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.93s]
Epoch 0: 28%|██▊ | 3425/12384 [7:15:53<19:09:10, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.93s]
Epoch 0: 28%|██▊ | 3425/12384 [7:16:01<19:09:10, 7.70s/it, loss=0.0009, acc=0.9974, iter_time=5.55s]
Epoch 0: 28%|██▊ | 3426/12384 [7:16:01<19:23:08, 7.79s/it, loss=0.0009, acc=0.9974, iter_time=5.55s]
Epoch 0: 28%|██▊ | 3426/12384 [7:16:09<19:23:08, 7.79s/it, loss=0.0004, acc=0.9996, iter_time=10.06s]
Epoch 0: 28%|██▊ | 3427/12384 [7:16:09<19:14:19, 7.73s/it, loss=0.0004, acc=0.9996, iter_time=10.06s]
Epoch 0: 28%|██▊ | 3427/12384 [7:16:17<19:14:19, 7.73s/it, loss=0.0001, acc=1.0000, iter_time=7.00s]
Epoch 0: 28%|██▊ | 3428/12384 [7:16:17<19:09:47, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.00s]
Epoch 0: 28%|██▊ | 3428/12384 [7:16:24<19:09:47, 7.70s/it, loss=0.0003, acc=0.9992, iter_time=6.18s]
Epoch 0: 28%|██▊ | 3429/12384 [7:16:24<19:06:14, 7.68s/it, loss=0.0003, acc=0.9992, iter_time=6.18s]
Epoch 0: 28%|██▊ | 3429/12384 [7:16:32<19:06:14, 7.68s/it, loss=0.0003, acc=0.9998, iter_time=9.71s]
Epoch 0: 28%|██▊ | 3430/12384 [7:16:32<19:04:06, 7.67s/it, loss=0.0003, acc=0.9998, iter_time=9.71s]
Epoch 0: 28%|██▊ | 3430/12384 [7:16:40<19:04:06, 7.67s/it, loss=0.0002, acc=0.9994, iter_time=7.30s]
Epoch 0: 28%|██▊ | 3431/12384 [7:16:40<19:00:09, 7.64s/it, loss=0.0002, acc=0.9994, iter_time=7.30s]
Epoch 0: 28%|██▊ | 3431/12384 [7:16:47<19:00:09, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.90s]
Epoch 0: 28%|██▊ | 3432/12384 [7:16:47<19:01:58, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.90s]
Epoch 0: 28%|██▊ | 3432/12384 [7:16:55<19:01:58, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 28%|██▊ | 3433/12384 [7:16:55<19:00:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 28%|██▊ | 3433/12384 [7:17:03<19:00:05, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=5.32s]
Epoch 0: 28%|██▊ | 3434/12384 [7:17:03<19:02:24, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=5.32s]
Epoch 0: 28%|██▊ | 3434/12384 [7:17:10<19:02:24, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=8.27s]
Epoch 0: 28%|██▊ | 3435/12384 [7:17:10<19:00:42, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.27s]
Epoch 0: 28%|██▊ | 3435/12384 [7:17:18<19:00:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 0: 28%|██▊ | 3436/12384 [7:17:18<18:58:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 0: 28%|██▊ | 3436/12384 [7:17:25<18:58:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 0: 28%|██▊ | 3437/12384 [7:17:25<18:57:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 0: 28%|██▊ | 3437/12384 [7:17:33<18:57:45, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.32s]
Epoch 0: 28%|██▊ | 3438/12384 [7:17:33<18:57:52, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.32s]
Epoch 0: 28%|██▊ | 3438/12384 [7:17:41<18:57:52, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.12s]
Epoch 0: 28%|██▊ | 3439/12384 [7:17:41<18:57:17, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.12s]
Epoch 0: 28%|██▊ | 3439/12384 [7:17:48<18:57:17, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=11.30s]
Epoch 0: 28%|██▊ | 3440/12384 [7:17:48<18:56:01, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=11.30s]
Epoch 0: 28%|██▊ | 3440/12384 [7:17:56<18:56:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 28%|██▊ | 3441/12384 [7:17:56<18:55:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 28%|██▊ | 3441/12384 [7:18:03<18:55:19, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=7.60s]
Epoch 0: 28%|██▊ | 3442/12384 [7:18:03<18:53:53, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=7.60s]
Epoch 0: 28%|██▊ | 3442/12384 [7:18:11<18:53:53, 7.61s/it, loss=0.0010, acc=0.9968, iter_time=7.62s]
Epoch 0: 28%|██▊ | 3443/12384 [7:18:11<18:56:42, 7.63s/it, loss=0.0010, acc=0.9968, iter_time=7.62s]
Epoch 0: 28%|██▊ | 3443/12384 [7:18:19<18:56:42, 7.63s/it, loss=0.0002, acc=0.9984, iter_time=7.64s]
Epoch 0: 28%|██▊ | 3444/12384 [7:18:19<18:54:43, 7.62s/it, loss=0.0002, acc=0.9984, iter_time=7.64s]
Epoch 0: 28%|██▊ | 3444/12384 [7:18:26<18:54:43, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.26s]
Epoch 0: 28%|██▊ | 3445/12384 [7:18:26<18:54:26, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.26s]
Epoch 0: 28%|██▊ | 3445/12384 [7:18:34<18:54:26, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=8.40s]
Epoch 0: 28%|██▊ | 3446/12384 [7:18:34<18:55:01, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=8.40s]
Epoch 0: 28%|██▊ | 3446/12384 [7:18:42<18:55:01, 7.62s/it, loss=0.0017, acc=0.9954, iter_time=9.18s]
Epoch 0: 28%|██▊ | 3447/12384 [7:18:42<18:58:27, 7.64s/it, loss=0.0017, acc=0.9954, iter_time=9.18s]
Epoch 0: 28%|██▊ | 3447/12384 [7:18:49<18:58:27, 7.64s/it, loss=0.0004, acc=0.9998, iter_time=8.07s]
Epoch 0: 28%|██▊ | 3448/12384 [7:18:49<18:56:59, 7.63s/it, loss=0.0004, acc=0.9998, iter_time=8.07s]
Epoch 0: 28%|██▊ | 3448/12384 [7:18:57<18:56:59, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.18s]
Epoch 0: 28%|██▊ | 3449/12384 [7:18:57<18:56:48, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.18s]
Epoch 0: 28%|██▊ | 3449/12384 [7:19:05<18:56:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 0: 28%|██▊ | 3450/12384 [7:19:05<18:57:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 0: 28%|██▊ | 3450/12384 [7:19:12<18:57:19, 7.64s/it, loss=0.0004, acc=1.0000, iter_time=5.42s]
Epoch 0: 28%|██▊ | 3451/12384 [7:19:12<18:54:28, 7.62s/it, loss=0.0004, acc=1.0000, iter_time=5.42s]
Epoch 0: 28%|██▊ | 3451/12384 [7:19:20<18:54:28, 7.62s/it, loss=0.0010, acc=0.9979, iter_time=9.35s]
Epoch 0: 28%|██▊ | 3452/12384 [7:19:20<18:53:22, 7.61s/it, loss=0.0010, acc=0.9979, iter_time=9.35s]
Epoch 0: 28%|██▊ | 3452/12384 [7:19:28<18:53:22, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 28%|██▊ | 3453/12384 [7:19:28<19:07:56, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 28%|██▊ | 3453/12384 [7:19:35<19:07:56, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.90s]
Epoch 0: 28%|██▊ | 3454/12384 [7:19:35<19:03:31, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.90s]
Epoch 0: 28%|██▊ | 3454/12384 [7:19:43<19:03:31, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 0: 28%|██▊ | 3455/12384 [7:19:43<18:58:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 0: 28%|██▊ | 3455/12384 [7:19:50<18:58:37, 7.65s/it, loss=0.0005, acc=0.9990, iter_time=8.89s]
Epoch 0: 28%|██▊ | 3456/12384 [7:19:50<18:56:40, 7.64s/it, loss=0.0005, acc=0.9990, iter_time=8.89s]
Epoch 0: 28%|██▊ | 3456/12384 [7:19:58<18:56:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 28%|██▊ | 3457/12384 [7:19:58<18:54:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 28%|██▊ | 3457/12384 [7:20:06<18:54:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 28%|██▊ | 3458/12384 [7:20:06<18:54:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 28%|██▊ | 3458/12384 [7:20:13<18:54:34, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 28%|██▊ | 3459/12384 [7:20:13<18:53:03, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 28%|██▊ | 3459/12384 [7:20:21<18:53:03, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 28%|██▊ | 3460/12384 [7:20:21<18:53:02, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 28%|██▊ | 3460/12384 [7:20:29<18:53:02, 7.62s/it, loss=0.0002, acc=0.9993, iter_time=7.28s]
Epoch 0: 28%|██▊ | 3461/12384 [7:20:29<18:53:11, 7.62s/it, loss=0.0002, acc=0.9993, iter_time=7.28s]
Epoch 0: 28%|██▊ | 3461/12384 [7:20:36<18:53:11, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.81s]
Epoch 0: 28%|██▊ | 3462/12384 [7:20:36<18:52:16, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.81s]
Epoch 0: 28%|██▊ | 3462/12384 [7:20:44<18:52:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.72s]
Epoch 0: 28%|██▊ | 3463/12384 [7:20:44<18:51:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.72s]
Epoch 0: 28%|██▊ | 3463/12384 [7:20:51<18:51:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 28%|██▊ | 3464/12384 [7:20:51<18:56:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 28%|██▊ | 3464/12384 [7:20:59<18:56:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 0: 28%|██▊ | 3465/12384 [7:20:59<18:54:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 0: 28%|██▊ | 3465/12384 [7:21:07<18:54:21, 7.63s/it, loss=0.0002, acc=0.9998, iter_time=7.61s]
Epoch 0: 28%|██▊ | 3466/12384 [7:21:07<18:53:16, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=7.61s]
Epoch 0: 28%|██▊ | 3466/12384 [7:21:14<18:53:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 28%|██▊ | 3467/12384 [7:21:14<18:52:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 28%|██▊ | 3467/12384 [7:21:22<18:52:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 28%|██▊ | 3468/12384 [7:21:22<18:52:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 28%|██▊ | 3468/12384 [7:21:30<18:52:15, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 28%|██▊ | 3469/12384 [7:21:30<18:52:10, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 28%|██▊ | 3469/12384 [7:21:37<18:52:10, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 28%|██▊ | 3470/12384 [7:21:37<18:53:25, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 28%|██▊ | 3470/12384 [7:21:45<18:53:25, 7.63s/it, loss=0.0012, acc=0.9977, iter_time=7.12s]
Epoch 0: 28%|██▊ | 3471/12384 [7:21:45<18:53:23, 7.63s/it, loss=0.0012, acc=0.9977, iter_time=7.12s]
Epoch 0: 28%|██▊ | 3471/12384 [7:21:52<18:53:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 0: 28%|██▊ | 3472/12384 [7:21:52<18:52:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 0: 28%|██▊ | 3472/12384 [7:22:00<18:52:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 28%|██▊ | 3473/12384 [7:22:00<18:51:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 28%|██▊ | 3473/12384 [7:22:08<18:51:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 28%|██▊ | 3474/12384 [7:22:08<18:50:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 28%|██▊ | 3474/12384 [7:22:15<18:50:30, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 28%|██▊ | 3475/12384 [7:22:15<18:55:03, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 28%|██▊ | 3475/12384 [7:22:23<18:55:03, 7.64s/it, loss=0.0003, acc=0.9976, iter_time=7.41s]
Epoch 0: 28%|██▊ | 3476/12384 [7:22:23<18:53:55, 7.64s/it, loss=0.0003, acc=0.9976, iter_time=7.41s]
Epoch 0: 28%|██▊ | 3476/12384 [7:22:31<18:53:55, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.20s]
Epoch 0: 28%|██▊ | 3477/12384 [7:22:31<19:04:10, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=8.20s]
Epoch 0: 28%|██▊ | 3477/12384 [7:22:39<19:04:10, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 28%|██▊ | 3478/12384 [7:22:39<19:02:19, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 28%|██▊ | 3478/12384 [7:22:46<19:02:19, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 0: 28%|██▊ | 3479/12384 [7:22:46<19:13:04, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 0: 28%|██▊ | 3479/12384 [7:22:54<19:13:04, 7.77s/it, loss=0.0001, acc=0.9998, iter_time=7.83s]
Epoch 0: 28%|██▊ | 3480/12384 [7:22:54<19:06:30, 7.73s/it, loss=0.0001, acc=0.9998, iter_time=7.83s]
Epoch 0: 28%|██▊ | 3480/12384 [7:23:02<19:06:30, 7.73s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 28%|██▊ | 3481/12384 [7:23:02<19:00:25, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 28%|██▊ | 3481/12384 [7:23:09<19:00:25, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 28%|██▊ | 3482/12384 [7:23:09<18:57:27, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 28%|██▊ | 3482/12384 [7:23:17<18:57:27, 7.67s/it, loss=0.0004, acc=1.0000, iter_time=7.63s]
Epoch 0: 28%|██▊ | 3483/12384 [7:23:17<18:55:14, 7.65s/it, loss=0.0004, acc=1.0000, iter_time=7.63s]
Epoch 0: 28%|██▊ | 3483/12384 [7:23:24<18:55:14, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 28%|██▊ | 3484/12384 [7:23:24<18:52:00, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 28%|██▊ | 3484/12384 [7:23:32<18:52:00, 7.63s/it, loss=0.0003, acc=0.9998, iter_time=6.66s]
Epoch 0: 28%|██▊ | 3485/12384 [7:23:32<18:49:08, 7.61s/it, loss=0.0003, acc=0.9998, iter_time=6.66s]
Epoch 0: 28%|██▊ | 3485/12384 [7:23:40<18:49:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 0: 28%|██▊ | 3486/12384 [7:23:40<18:49:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 0: 28%|██▊ | 3486/12384 [7:23:47<18:49:44, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 28%|██▊ | 3487/12384 [7:23:47<18:49:38, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 28%|██▊ | 3487/12384 [7:23:55<18:49:38, 7.62s/it, loss=0.0004, acc=0.9988, iter_time=8.02s]
Epoch 0: 28%|██▊ | 3488/12384 [7:23:55<18:50:53, 7.63s/it, loss=0.0004, acc=0.9988, iter_time=8.02s]
Epoch 0: 28%|██▊ | 3488/12384 [7:24:03<18:50:53, 7.63s/it, loss=0.0008, acc=0.9952, iter_time=5.47s]
Epoch 0: 28%|██▊ | 3489/12384 [7:24:03<18:49:46, 7.62s/it, loss=0.0008, acc=0.9952, iter_time=5.47s]
Epoch 0: 28%|██▊ | 3489/12384 [7:24:10<18:49:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 0: 28%|██▊ | 3490/12384 [7:24:10<18:48:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 0: 28%|██▊ | 3490/12384 [7:24:18<18:48:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 28%|██▊ | 3491/12384 [7:24:18<18:48:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 28%|██▊ | 3491/12384 [7:24:25<18:48:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.02s]
Epoch 0: 28%|██▊ | 3492/12384 [7:24:25<18:47:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.02s]
Epoch 0: 28%|██▊ | 3492/12384 [7:24:33<18:47:36, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=11.17s]
Epoch 0: 28%|██▊ | 3493/12384 [7:24:33<18:47:20, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=11.17s]
Epoch 0: 28%|██▊ | 3493/12384 [7:24:41<18:47:20, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.50s]
Epoch 0: 28%|██▊ | 3494/12384 [7:24:41<18:46:58, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.50s]
Epoch 0: 28%|██▊ | 3494/12384 [7:24:48<18:46:58, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.71s]
Epoch 0: 28%|██▊ | 3495/12384 [7:24:48<18:47:36, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.71s]
Epoch 0: 28%|██▊ | 3495/12384 [7:24:56<18:47:36, 7.61s/it, loss=0.0008, acc=0.9998, iter_time=8.03s]
Epoch 0: 28%|██▊ | 3496/12384 [7:24:56<18:52:58, 7.65s/it, loss=0.0008, acc=0.9998, iter_time=8.03s]
Epoch 0: 28%|██▊ | 3496/12384 [7:25:04<18:52:58, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 0: 28%|██▊ | 3497/12384 [7:25:04<18:51:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 0: 28%|██▊ | 3497/12384 [7:25:11<18:51:26, 7.64s/it, loss=0.0004, acc=0.9972, iter_time=6.08s]
Epoch 0: 28%|██▊ | 3498/12384 [7:25:11<18:50:00, 7.63s/it, loss=0.0004, acc=0.9972, iter_time=6.08s]
Epoch 0: 28%|██▊ | 3498/12384 [7:25:19<18:50:00, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 28%|██▊ | 3499/12384 [7:25:19<18:49:31, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 28%|██▊ | 3499/12384 [7:25:26<18:49:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.14s]
Epoch 0: 28%|██▊ | 3500/12384 [7:25:27<18:59:36, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=11.14s]
Epoch 0: 28%|██▊ | 3500/12384 [7:25:34<18:59:36, 7.70s/it, loss=0.0001, acc=0.9997, iter_time=7.38s]
Epoch 0: 28%|██▊ | 3501/12384 [7:25:34<18:53:49, 7.66s/it, loss=0.0001, acc=0.9997, iter_time=7.38s]
Epoch 0: 28%|██▊ | 3501/12384 [7:25:42<18:53:49, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 28%|██▊ | 3502/12384 [7:25:42<19:04:41, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 28%|██▊ | 3502/12384 [7:25:50<19:04:41, 7.73s/it, loss=0.0008, acc=0.9980, iter_time=7.60s]
Epoch 0: 28%|██▊ | 3503/12384 [7:25:50<19:01:01, 7.71s/it, loss=0.0008, acc=0.9980, iter_time=7.60s]
Epoch 0: 28%|██▊ | 3503/12384 [7:25:57<19:01:01, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=8.03s]
Epoch 0: 28%|██▊ | 3504/12384 [7:25:57<18:56:57, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=8.03s]
Epoch 0: 28%|██▊ | 3504/12384 [7:26:05<18:56:57, 7.68s/it, loss=0.0007, acc=0.9984, iter_time=3.91s]
Epoch 0: 28%|██▊ | 3505/12384 [7:26:05<19:08:54, 7.76s/it, loss=0.0007, acc=0.9984, iter_time=3.91s]
Epoch 0: 28%|██▊ | 3505/12384 [7:26:13<19:08:54, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=11.28s]
Epoch 0: 28%|██▊ | 3506/12384 [7:26:13<19:02:25, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=11.28s]
Epoch 0: 28%|██▊ | 3506/12384 [7:26:21<19:02:25, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 28%|██▊ | 3507/12384 [7:26:21<18:57:48, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 28%|██▊ | 3507/12384 [7:26:28<18:57:48, 7.69s/it, loss=0.0069, acc=0.9733, iter_time=6.67s]
Epoch 0: 28%|██▊ | 3508/12384 [7:26:28<18:54:02, 7.67s/it, loss=0.0069, acc=0.9733, iter_time=6.67s]
Epoch 0: 28%|██▊ | 3508/12384 [7:26:36<18:54:02, 7.67s/it, loss=0.0010, acc=0.9960, iter_time=8.23s]
Epoch 0: 28%|██▊ | 3509/12384 [7:26:36<18:50:58, 7.65s/it, loss=0.0010, acc=0.9960, iter_time=8.23s]
Epoch 0: 28%|██▊ | 3509/12384 [7:26:43<18:50:58, 7.65s/it, loss=0.0004, acc=0.9971, iter_time=7.93s]
Epoch 0: 28%|██▊ | 3510/12384 [7:26:43<18:50:43, 7.65s/it, loss=0.0004, acc=0.9971, iter_time=7.93s]
Epoch 0: 28%|██▊ | 3510/12384 [7:26:51<18:50:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 28%|██▊ | 3511/12384 [7:26:51<18:48:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 28%|██▊ | 3511/12384 [7:26:59<18:48:19, 7.63s/it, loss=0.0017, acc=0.9933, iter_time=7.97s]
Epoch 0: 28%|██▊ | 3512/12384 [7:26:59<18:47:37, 7.63s/it, loss=0.0017, acc=0.9933, iter_time=7.97s]
Epoch 0: 28%|██▊ | 3512/12384 [7:27:06<18:47:37, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.24s]
Epoch 0: 28%|██▊ | 3513/12384 [7:27:06<18:46:13, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.24s]
Epoch 0: 28%|██▊ | 3513/12384 [7:27:14<18:46:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 0: 28%|██▊ | 3514/12384 [7:27:14<18:46:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 0: 28%|██▊ | 3514/12384 [7:27:21<18:46:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.38s]
Epoch 0: 28%|██▊ | 3515/12384 [7:27:21<18:44:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.38s]
Epoch 0: 28%|██▊ | 3515/12384 [7:27:29<18:44:29, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=7.60s]
Epoch 0: 28%|██▊ | 3516/12384 [7:27:29<18:44:53, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=7.60s]
Epoch 0: 28%|██▊ | 3516/12384 [7:27:37<18:44:53, 7.61s/it, loss=0.0006, acc=0.9986, iter_time=6.11s]
Epoch 0: 28%|██▊ | 3517/12384 [7:27:37<18:44:40, 7.61s/it, loss=0.0006, acc=0.9986, iter_time=6.11s]
Epoch 0: 28%|██▊ | 3517/12384 [7:27:44<18:44:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 0: 28%|██▊ | 3518/12384 [7:27:44<18:44:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 0: 28%|██▊ | 3518/12384 [7:27:52<18:44:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 28%|██▊ | 3519/12384 [7:27:52<18:43:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 28%|██▊ | 3519/12384 [7:27:59<18:43:25, 7.60s/it, loss=0.0025, acc=0.9953, iter_time=7.68s]
Epoch 0: 28%|██▊ | 3520/12384 [7:27:59<18:42:55, 7.60s/it, loss=0.0025, acc=0.9953, iter_time=7.68s]
Epoch 0: 28%|██▊ | 3520/12384 [7:28:07<18:42:55, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.51s]
Epoch 0: 28%|██▊ | 3521/12384 [7:28:07<18:43:30, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.51s]
Epoch 0: 28%|██▊ | 3521/12384 [7:28:15<18:43:30, 7.61s/it, loss=0.0003, acc=0.9987, iter_time=7.62s]
Epoch 0: 28%|██▊ | 3522/12384 [7:28:15<18:44:05, 7.61s/it, loss=0.0003, acc=0.9987, iter_time=7.62s]
Epoch 0: 28%|██▊ | 3522/12384 [7:28:22<18:44:05, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=7.63s]
Epoch 0: 28%|██▊ | 3523/12384 [7:28:22<18:44:22, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=7.63s]
Epoch 0: 28%|██▊ | 3523/12384 [7:28:30<18:44:22, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.32s]
Epoch 0: 28%|██▊ | 3524/12384 [7:28:30<18:43:08, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.32s]
Epoch 0: 28%|██▊ | 3524/12384 [7:28:38<18:43:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 0: 28%|██▊ | 3525/12384 [7:28:38<18:42:43, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 0: 28%|██▊ | 3525/12384 [7:28:45<18:42:43, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 28%|██▊ | 3526/12384 [7:28:45<18:46:46, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 28%|██▊ | 3526/12384 [7:28:53<18:46:46, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.88s]
Epoch 0: 28%|██▊ | 3527/12384 [7:28:53<18:45:50, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.88s]
Epoch 0: 28%|██▊ | 3527/12384 [7:29:01<18:45:50, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=10.13s]
Epoch 0: 28%|██▊ | 3528/12384 [7:29:01<18:58:53, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=10.13s]
Epoch 0: 28%|██▊ | 3528/12384 [7:29:08<18:58:53, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=7.19s]
Epoch 0: 28%|██▊ | 3529/12384 [7:29:08<18:54:23, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.19s]
Epoch 0: 28%|██▊ | 3529/12384 [7:29:16<18:54:23, 7.69s/it, loss=0.0003, acc=1.0000, iter_time=3.83s]
Epoch 0: 29%|██▊ | 3530/12384 [7:29:16<18:49:49, 7.66s/it, loss=0.0003, acc=1.0000, iter_time=3.83s]
Epoch 0: 29%|██▊ | 3530/12384 [7:29:24<18:49:49, 7.66s/it, loss=0.0023, acc=0.9910, iter_time=7.91s]
Epoch 0: 29%|██▊ | 3531/12384 [7:29:24<19:02:13, 7.74s/it, loss=0.0023, acc=0.9910, iter_time=7.91s]
Epoch 0: 29%|██▊ | 3531/12384 [7:29:32<19:02:13, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=10.55s]
Epoch 0: 29%|██▊ | 3532/12384 [7:29:32<18:55:57, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.55s]
Epoch 0: 29%|██▊ | 3532/12384 [7:29:39<18:55:57, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=6.96s]
Epoch 0: 29%|██▊ | 3533/12384 [7:29:39<18:53:20, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=6.96s]
Epoch 0: 29%|██▊ | 3533/12384 [7:29:47<18:53:20, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=8.51s]
Epoch 0: 29%|██▊ | 3534/12384 [7:29:47<18:50:52, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=8.51s]
Epoch 0: 29%|██▊ | 3534/12384 [7:29:54<18:50:52, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=8.26s]
Epoch 0: 29%|██▊ | 3535/12384 [7:29:54<18:47:20, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=8.26s]
Epoch 0: 29%|██▊ | 3535/12384 [7:30:02<18:47:20, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 0: 29%|██▊ | 3536/12384 [7:30:02<18:45:36, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 0: 29%|██▊ | 3536/12384 [7:30:10<18:45:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.57s]
Epoch 0: 29%|██▊ | 3537/12384 [7:30:10<18:44:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.57s]
Epoch 0: 29%|██▊ | 3537/12384 [7:30:17<18:44:51, 7.63s/it, loss=0.0001, acc=0.9999, iter_time=8.27s]
Epoch 0: 29%|██▊ | 3538/12384 [7:30:17<18:43:23, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=8.27s]
Epoch 0: 29%|██▊ | 3538/12384 [7:30:25<18:43:23, 7.62s/it, loss=0.0030, acc=0.9907, iter_time=7.60s]
Epoch 0: 29%|██▊ | 3539/12384 [7:30:25<18:42:58, 7.62s/it, loss=0.0030, acc=0.9907, iter_time=7.60s]
Epoch 0: 29%|██▊ | 3539/12384 [7:30:32<18:42:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.11s]
Epoch 0: 29%|██▊ | 3540/12384 [7:30:32<18:43:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.11s]
Epoch 0: 29%|██▊ | 3540/12384 [7:30:40<18:43:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.27s]
Epoch 0: 29%|██▊ | 3541/12384 [7:30:40<18:42:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.27s]
Epoch 0: 29%|██▊ | 3541/12384 [7:30:48<18:42:03, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.09s]
Epoch 0: 29%|██▊ | 3542/12384 [7:30:48<18:42:30, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.09s]
Epoch 0: 29%|██▊ | 3542/12384 [7:30:55<18:42:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.06s]
Epoch 0: 29%|██▊ | 3543/12384 [7:30:55<18:43:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.06s]
Epoch 0: 29%|██▊ | 3543/12384 [7:31:03<18:43:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.96s]
Epoch 0: 29%|██▊ | 3544/12384 [7:31:03<18:42:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.96s]
Epoch 0: 29%|██▊ | 3544/12384 [7:31:11<18:42:49, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.01s]
Epoch 0: 29%|██▊ | 3545/12384 [7:31:11<18:41:32, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.01s]
Epoch 0: 29%|██▊ | 3545/12384 [7:31:18<18:41:32, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=8.81s]
Epoch 0: 29%|██▊ | 3546/12384 [7:31:18<18:41:06, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=8.81s]
Epoch 0: 29%|██▊ | 3546/12384 [7:31:26<18:41:06, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=7.02s]
Epoch 0: 29%|██▊ | 3547/12384 [7:31:26<18:41:40, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=7.02s]
Epoch 0: 29%|██▊ | 3547/12384 [7:31:33<18:41:40, 7.62s/it, loss=0.0009, acc=0.9967, iter_time=8.21s]
Epoch 0: 29%|██▊ | 3548/12384 [7:31:33<18:40:16, 7.61s/it, loss=0.0009, acc=0.9967, iter_time=8.21s]
Epoch 0: 29%|██▊ | 3548/12384 [7:31:41<18:40:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 0: 29%|██▊ | 3549/12384 [7:31:41<18:40:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 0: 29%|██▊ | 3549/12384 [7:31:49<18:40:18, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=11.53s]
Epoch 0: 29%|██▊ | 3550/12384 [7:31:49<18:40:02, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=11.53s]
Epoch 0: 29%|██▊ | 3550/12384 [7:31:56<18:40:02, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=5.41s]
Epoch 0: 29%|██▊ | 3551/12384 [7:31:56<18:44:33, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=5.41s]
Epoch 0: 29%|██▊ | 3551/12384 [7:32:04<18:44:33, 7.64s/it, loss=0.0031, acc=0.9884, iter_time=9.91s]
Epoch 0: 29%|██▊ | 3552/12384 [7:32:04<18:43:35, 7.63s/it, loss=0.0031, acc=0.9884, iter_time=9.91s]
Epoch 0: 29%|██▊ | 3552/12384 [7:32:12<18:43:35, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=4.60s]
Epoch 0: 29%|██▊ | 3553/12384 [7:32:12<18:43:37, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=4.60s]
Epoch 0: 29%|██▊ | 3553/12384 [7:32:19<18:43:37, 7.63s/it, loss=0.0002, acc=0.9999, iter_time=10.57s]
Epoch 0: 29%|██▊ | 3554/12384 [7:32:19<18:55:35, 7.72s/it, loss=0.0002, acc=0.9999, iter_time=10.57s]
Epoch 0: 29%|██▊ | 3554/12384 [7:32:27<18:55:35, 7.72s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 29%|██▊ | 3555/12384 [7:32:27<18:50:14, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 29%|██▊ | 3555/12384 [7:32:35<18:50:14, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 29%|██▊ | 3556/12384 [7:32:35<18:47:02, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 29%|██▊ | 3556/12384 [7:32:43<18:47:02, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 29%|██▊ | 3557/12384 [7:32:43<18:59:25, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 29%|██▊ | 3557/12384 [7:32:50<18:59:25, 7.74s/it, loss=0.0017, acc=0.9944, iter_time=7.91s]
Epoch 0: 29%|██▊ | 3558/12384 [7:32:50<18:54:06, 7.71s/it, loss=0.0017, acc=0.9944, iter_time=7.91s]
Epoch 0: 29%|██▊ | 3558/12384 [7:32:58<18:54:06, 7.71s/it, loss=0.0003, acc=1.0000, iter_time=7.60s]
Epoch 0: 29%|██▊ | 3559/12384 [7:32:58<18:50:08, 7.68s/it, loss=0.0003, acc=1.0000, iter_time=7.60s]
Epoch 0: 29%|██▊ | 3559/12384 [7:33:05<18:50:08, 7.68s/it, loss=0.0008, acc=0.9976, iter_time=8.01s]
Epoch 0: 29%|██▊ | 3560/12384 [7:33:05<18:46:42, 7.66s/it, loss=0.0008, acc=0.9976, iter_time=8.01s]
Epoch 0: 29%|██▊ | 3560/12384 [7:33:13<18:46:42, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 29%|██▉ | 3561/12384 [7:33:13<18:44:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 29%|██▉ | 3561/12384 [7:33:21<18:44:08, 7.64s/it, loss=0.0004, acc=0.9999, iter_time=6.08s]
Epoch 0: 29%|██▉ | 3562/12384 [7:33:21<18:42:27, 7.63s/it, loss=0.0004, acc=0.9999, iter_time=6.08s]
Epoch 0: 29%|██▉ | 3562/12384 [7:33:28<18:42:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 0: 29%|██▉ | 3563/12384 [7:33:28<18:41:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 0: 29%|██▉ | 3563/12384 [7:33:36<18:41:25, 7.63s/it, loss=0.0003, acc=0.9975, iter_time=9.70s]
Epoch 0: 29%|██▉ | 3564/12384 [7:33:36<18:40:49, 7.62s/it, loss=0.0003, acc=0.9975, iter_time=9.70s]
Epoch 0: 29%|██▉ | 3564/12384 [7:33:43<18:40:49, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 29%|██▉ | 3565/12384 [7:33:43<18:39:20, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 29%|██▉ | 3565/12384 [7:33:51<18:39:20, 7.62s/it, loss=0.0004, acc=0.9984, iter_time=7.61s]
Epoch 0: 29%|██▉ | 3566/12384 [7:33:51<18:39:44, 7.62s/it, loss=0.0004, acc=0.9984, iter_time=7.61s]
Epoch 0: 29%|██▉ | 3566/12384 [7:33:59<18:39:44, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 29%|██▉ | 3567/12384 [7:33:59<18:39:08, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 29%|██▉ | 3567/12384 [7:34:06<18:39:08, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.57s]
Epoch 0: 29%|██▉ | 3568/12384 [7:34:06<18:38:58, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.57s]
Epoch 0: 29%|██▉ | 3568/12384 [7:34:14<18:38:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 29%|██▉ | 3569/12384 [7:34:14<18:38:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 29%|██▉ | 3569/12384 [7:34:22<18:38:55, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 29%|██▉ | 3570/12384 [7:34:22<18:38:02, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 29%|██▉ | 3570/12384 [7:34:29<18:38:02, 7.61s/it, loss=0.0007, acc=0.9986, iter_time=7.59s]
Epoch 0: 29%|██▉ | 3571/12384 [7:34:29<18:37:17, 7.61s/it, loss=0.0007, acc=0.9986, iter_time=7.59s]
Epoch 0: 29%|██▉ | 3571/12384 [7:34:37<18:37:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 29%|██▉ | 3572/12384 [7:34:37<18:37:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 29%|██▉ | 3572/12384 [7:34:44<18:37:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 0: 29%|██▉ | 3573/12384 [7:34:44<18:36:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 0: 29%|██▉ | 3573/12384 [7:34:52<18:36:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 0: 29%|██▉ | 3574/12384 [7:34:52<18:36:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 0: 29%|██▉ | 3574/12384 [7:35:00<18:36:52, 7.61s/it, loss=0.0004, acc=0.9982, iter_time=10.47s]
Epoch 0: 29%|██▉ | 3575/12384 [7:35:00<18:37:16, 7.61s/it, loss=0.0004, acc=0.9982, iter_time=10.47s]
Epoch 0: 29%|██▉ | 3575/12384 [7:35:07<18:37:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 29%|██▉ | 3576/12384 [7:35:07<18:36:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 29%|██▉ | 3576/12384 [7:35:15<18:36:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 0: 29%|██▉ | 3577/12384 [7:35:15<18:37:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 0: 29%|██▉ | 3577/12384 [7:35:22<18:37:16, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.04s]
Epoch 0: 29%|██▉ | 3578/12384 [7:35:22<18:36:44, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.04s]
Epoch 0: 29%|██▉ | 3578/12384 [7:35:30<18:36:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 0: 29%|██▉ | 3579/12384 [7:35:30<18:36:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 0: 29%|██▉ | 3579/12384 [7:35:38<18:36:54, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=7.93s]
Epoch 0: 29%|██▉ | 3580/12384 [7:35:38<18:49:32, 7.70s/it, loss=0.0001, acc=0.9999, iter_time=7.93s]
Epoch 0: 29%|██▉ | 3580/12384 [7:35:46<18:49:32, 7.70s/it, loss=0.0002, acc=0.9999, iter_time=7.59s]
Epoch 0: 29%|██▉ | 3581/12384 [7:35:46<18:45:02, 7.67s/it, loss=0.0002, acc=0.9999, iter_time=7.59s]
Epoch 0: 29%|██▉ | 3581/12384 [7:35:53<18:45:02, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.58s]
Epoch 0: 29%|██▉ | 3582/12384 [7:35:53<18:42:25, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.58s]
Epoch 0: 29%|██▉ | 3582/12384 [7:36:01<18:42:25, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=4.77s]
Epoch 0: 29%|██▉ | 3583/12384 [7:36:01<18:40:16, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=4.77s]
Epoch 0: 29%|██▉ | 3583/12384 [7:36:09<18:40:16, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=10.92s]
Epoch 0: 29%|██▉ | 3584/12384 [7:36:09<18:53:47, 7.73s/it, loss=0.0002, acc=1.0000, iter_time=10.92s]
Epoch 0: 29%|██▉ | 3584/12384 [7:36:16<18:53:47, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.49s]
Epoch 0: 29%|██▉ | 3585/12384 [7:36:16<18:48:40, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.49s]
Epoch 0: 29%|██▉ | 3585/12384 [7:36:24<18:48:40, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 29%|██▉ | 3586/12384 [7:36:24<18:44:52, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 29%|██▉ | 3586/12384 [7:36:32<18:44:52, 7.67s/it, loss=0.0003, acc=0.9983, iter_time=7.62s]
Epoch 0: 29%|██▉ | 3587/12384 [7:36:32<18:41:44, 7.65s/it, loss=0.0003, acc=0.9983, iter_time=7.62s]
Epoch 0: 29%|██▉ | 3587/12384 [7:36:39<18:41:44, 7.65s/it, loss=0.0002, acc=0.9994, iter_time=7.59s]
Epoch 0: 29%|██▉ | 3588/12384 [7:36:39<18:39:31, 7.64s/it, loss=0.0002, acc=0.9994, iter_time=7.59s]
Epoch 0: 29%|██▉ | 3588/12384 [7:36:47<18:39:31, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 29%|██▉ | 3589/12384 [7:36:47<18:38:11, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 29%|██▉ | 3589/12384 [7:36:54<18:38:11, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.64s]
Epoch 0: 29%|██▉ | 3590/12384 [7:36:54<18:38:09, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.64s]
Epoch 0: 29%|██▉ | 3590/12384 [7:37:02<18:38:09, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 29%|██▉ | 3591/12384 [7:37:02<18:40:36, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 29%|██▉ | 3591/12384 [7:37:10<18:40:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 0: 29%|██▉ | 3592/12384 [7:37:10<18:39:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 0: 29%|██▉ | 3592/12384 [7:37:17<18:39:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 29%|██▉ | 3593/12384 [7:37:17<18:42:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 29%|██▉ | 3593/12384 [7:37:25<18:42:24, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=5.91s]
Epoch 0: 29%|██▉ | 3594/12384 [7:37:25<18:39:50, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=5.91s]
Epoch 0: 29%|██▉ | 3594/12384 [7:37:33<18:39:50, 7.64s/it, loss=0.0007, acc=0.9981, iter_time=9.41s]
Epoch 0: 29%|██▉ | 3595/12384 [7:37:33<18:38:39, 7.64s/it, loss=0.0007, acc=0.9981, iter_time=9.41s]
Epoch 0: 29%|██▉ | 3595/12384 [7:37:40<18:38:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 29%|██▉ | 3596/12384 [7:37:40<18:36:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 29%|██▉ | 3596/12384 [7:37:48<18:36:22, 7.62s/it, loss=0.0006, acc=0.9968, iter_time=4.98s]
Epoch 0: 29%|██▉ | 3597/12384 [7:37:48<18:34:44, 7.61s/it, loss=0.0006, acc=0.9968, iter_time=4.98s]
Epoch 0: 29%|██▉ | 3597/12384 [7:37:55<18:34:44, 7.61s/it, loss=0.0013, acc=0.9950, iter_time=10.18s]
Epoch 0: 29%|██▉ | 3598/12384 [7:37:55<18:34:46, 7.61s/it, loss=0.0013, acc=0.9950, iter_time=10.18s]
Epoch 0: 29%|██▉ | 3598/12384 [7:38:03<18:34:46, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=7.63s]
Epoch 0: 29%|██▉ | 3599/12384 [7:38:03<18:33:42, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=7.63s]
Epoch 0: 29%|██▉ | 3599/12384 [7:38:11<18:33:42, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.01s]
Epoch 0: 29%|██▉ | 3600/12384 [7:38:11<18:34:12, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.01s]
Epoch 0: 29%|██▉ | 3600/12384 [7:38:18<18:34:12, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.20s]
Epoch 0: 29%|██▉ | 3601/12384 [7:38:18<18:33:10, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.20s]
Epoch 0: 29%|██▉ | 3601/12384 [7:38:26<18:33:10, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=4.34s]
Epoch 0: 29%|██▉ | 3602/12384 [7:38:26<18:33:22, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.34s]
Epoch 0: 29%|██▉ | 3602/12384 [7:38:33<18:33:22, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.34s]
Epoch 0: 29%|██▉ | 3603/12384 [7:38:33<18:32:54, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=8.34s]
Epoch 0: 29%|██▉ | 3603/12384 [7:38:41<18:32:54, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=10.11s]
Epoch 0: 29%|██▉ | 3604/12384 [7:38:41<18:32:53, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.11s]
Epoch 0: 29%|██▉ | 3604/12384 [7:38:49<18:32:53, 7.61s/it, loss=0.0002, acc=0.9997, iter_time=7.62s]
Epoch 0: 29%|██▉ | 3605/12384 [7:38:49<18:32:35, 7.60s/it, loss=0.0002, acc=0.9997, iter_time=7.62s]
Epoch 0: 29%|██▉ | 3605/12384 [7:38:56<18:32:35, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=6.05s]
Epoch 0: 29%|██▉ | 3606/12384 [7:38:56<18:33:19, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.05s]
Epoch 0: 29%|██▉ | 3606/12384 [7:39:04<18:33:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.19s]
Epoch 0: 29%|██▉ | 3607/12384 [7:39:04<18:33:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.19s]
Epoch 0: 29%|██▉ | 3607/12384 [7:39:11<18:33:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 29%|██▉ | 3608/12384 [7:39:11<18:33:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 29%|██▉ | 3608/12384 [7:39:19<18:33:25, 7.61s/it, loss=0.0003, acc=0.9968, iter_time=5.76s]
Epoch 0: 29%|██▉ | 3609/12384 [7:39:19<18:35:15, 7.63s/it, loss=0.0003, acc=0.9968, iter_time=5.76s]
Epoch 0: 29%|██▉ | 3609/12384 [7:39:27<18:35:15, 7.63s/it, loss=0.0014, acc=0.9965, iter_time=7.40s]
Epoch 0: 29%|██▉ | 3610/12384 [7:39:27<18:50:14, 7.73s/it, loss=0.0014, acc=0.9965, iter_time=7.40s]
Epoch 0: 29%|██▉ | 3610/12384 [7:39:35<18:50:14, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 0: 29%|██▉ | 3611/12384 [7:39:35<18:45:43, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 0: 29%|██▉ | 3611/12384 [7:39:42<18:45:43, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 29%|██▉ | 3612/12384 [7:39:42<18:42:07, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 29%|██▉ | 3612/12384 [7:39:50<18:42:07, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 0: 29%|██▉ | 3613/12384 [7:39:50<18:38:58, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 0: 29%|██▉ | 3613/12384 [7:39:58<18:38:58, 7.65s/it, loss=0.0009, acc=0.9978, iter_time=7.36s]
Epoch 0: 29%|██▉ | 3614/12384 [7:39:58<18:38:16, 7.65s/it, loss=0.0009, acc=0.9978, iter_time=7.36s]
Epoch 0: 29%|██▉ | 3614/12384 [7:40:05<18:38:16, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=8.20s]
Epoch 0: 29%|██▉ | 3615/12384 [7:40:05<18:38:04, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=8.20s]
Epoch 0: 29%|██▉ | 3615/12384 [7:40:13<18:38:04, 7.65s/it, loss=0.0012, acc=0.9981, iter_time=8.01s]
Epoch 0: 29%|██▉ | 3616/12384 [7:40:13<18:35:22, 7.63s/it, loss=0.0012, acc=0.9981, iter_time=8.01s]
Epoch 0: 29%|██▉ | 3616/12384 [7:40:20<18:35:22, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=3.68s]
Epoch 0: 29%|██▉ | 3617/12384 [7:40:20<18:35:06, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=3.68s]
Epoch 0: 29%|██▉ | 3617/12384 [7:40:28<18:35:06, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.61s]
Epoch 0: 29%|██▉ | 3618/12384 [7:40:28<18:38:40, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=8.61s]
Epoch 0: 29%|██▉ | 3618/12384 [7:40:36<18:38:40, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.26s]
Epoch 0: 29%|██▉ | 3619/12384 [7:40:36<18:36:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.26s]
Epoch 0: 29%|██▉ | 3619/12384 [7:40:43<18:36:22, 7.64s/it, loss=0.0012, acc=0.9959, iter_time=7.60s]
Epoch 0: 29%|██▉ | 3620/12384 [7:40:43<18:35:10, 7.63s/it, loss=0.0012, acc=0.9959, iter_time=7.60s]
Epoch 0: 29%|██▉ | 3620/12384 [7:40:51<18:35:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 29%|██▉ | 3621/12384 [7:40:51<18:36:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 29%|██▉ | 3621/12384 [7:40:59<18:36:02, 7.64s/it, loss=0.0004, acc=0.9992, iter_time=7.60s]
Epoch 0: 29%|██▉ | 3622/12384 [7:40:59<18:35:49, 7.64s/it, loss=0.0004, acc=0.9992, iter_time=7.60s]
Epoch 0: 29%|██▉ | 3622/12384 [7:41:06<18:35:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 29%|██▉ | 3623/12384 [7:41:06<18:34:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 29%|██▉ | 3623/12384 [7:41:14<18:34:58, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 29%|██▉ | 3624/12384 [7:41:14<18:34:19, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 29%|██▉ | 3624/12384 [7:41:22<18:34:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.06s]
Epoch 0: 29%|██▉ | 3625/12384 [7:41:22<18:33:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.06s]
Epoch 0: 29%|██▉ | 3625/12384 [7:41:29<18:33:23, 7.63s/it, loss=0.0002, acc=0.9986, iter_time=11.20s]
Epoch 0: 29%|██▉ | 3626/12384 [7:41:29<18:32:05, 7.62s/it, loss=0.0002, acc=0.9986, iter_time=11.20s]
Epoch 0: 29%|██▉ | 3626/12384 [7:41:37<18:32:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 0: 29%|██▉ | 3627/12384 [7:41:37<18:31:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 0: 29%|██▉ | 3627/12384 [7:41:44<18:31:56, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=10.48s]
Epoch 0: 29%|██▉ | 3628/12384 [7:41:44<18:31:52, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=10.48s]
Epoch 0: 29%|██▉ | 3628/12384 [7:41:52<18:31:52, 7.62s/it, loss=0.0002, acc=0.9990, iter_time=6.42s]
Epoch 0: 29%|██▉ | 3629/12384 [7:41:52<18:31:23, 7.62s/it, loss=0.0002, acc=0.9990, iter_time=6.42s]
Epoch 0: 29%|██▉ | 3629/12384 [7:42:00<18:31:23, 7.62s/it, loss=0.0009, acc=0.9988, iter_time=8.81s]
Epoch 0: 29%|██▉ | 3630/12384 [7:42:00<18:31:05, 7.62s/it, loss=0.0009, acc=0.9988, iter_time=8.81s]
Epoch 0: 29%|██▉ | 3630/12384 [7:42:07<18:31:05, 7.62s/it, loss=0.0007, acc=0.9988, iter_time=7.31s]
Epoch 0: 29%|██▉ | 3631/12384 [7:42:07<18:30:03, 7.61s/it, loss=0.0007, acc=0.9988, iter_time=7.31s]
Epoch 0: 29%|██▉ | 3631/12384 [7:42:15<18:30:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 0: 29%|██▉ | 3632/12384 [7:42:15<18:30:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 0: 29%|██▉ | 3632/12384 [7:42:22<18:30:20, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.24s]
Epoch 0: 29%|██▉ | 3633/12384 [7:42:22<18:29:18, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.24s]
Epoch 0: 29%|██▉ | 3633/12384 [7:42:30<18:29:18, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=8.57s]
Epoch 0: 29%|██▉ | 3634/12384 [7:42:30<18:29:38, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=8.57s]
Epoch 0: 29%|██▉ | 3634/12384 [7:42:38<18:29:38, 7.61s/it, loss=0.0002, acc=0.9991, iter_time=7.62s]
Epoch 0: 29%|██▉ | 3635/12384 [7:42:38<18:28:52, 7.60s/it, loss=0.0002, acc=0.9991, iter_time=7.62s]
Epoch 0: 29%|██▉ | 3635/12384 [7:42:45<18:28:52, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 29%|██▉ | 3636/12384 [7:42:45<18:28:53, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 29%|██▉ | 3636/12384 [7:42:53<18:28:53, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=7.62s]
Epoch 0: 29%|██▉ | 3637/12384 [7:42:53<18:43:59, 7.71s/it, loss=0.0001, acc=0.9998, iter_time=7.62s]
Epoch 0: 29%|██▉ | 3637/12384 [7:43:01<18:43:59, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 0: 29%|██▉ | 3638/12384 [7:43:01<18:40:05, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 0: 29%|██▉ | 3638/12384 [7:43:08<18:40:05, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=10.50s]
Epoch 0: 29%|██▉ | 3639/12384 [7:43:08<18:39:07, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=10.50s]
Epoch 0: 29%|██▉ | 3639/12384 [7:43:16<18:39:07, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=8.01s]
Epoch 0: 29%|██▉ | 3640/12384 [7:43:16<18:41:19, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=8.01s]
Epoch 0: 29%|██▉ | 3640/12384 [7:43:24<18:41:19, 7.69s/it, loss=0.0002, acc=1.0000, iter_time=6.37s]
Epoch 0: 29%|██▉ | 3641/12384 [7:43:24<18:39:47, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=6.37s]
Epoch 0: 29%|██▉ | 3641/12384 [7:43:31<18:39:47, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 0: 29%|██▉ | 3642/12384 [7:43:31<18:35:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 0: 29%|██▉ | 3642/12384 [7:43:39<18:35:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 29%|██▉ | 3643/12384 [7:43:39<18:37:51, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 29%|██▉ | 3643/12384 [7:43:47<18:37:51, 7.67s/it, loss=0.0011, acc=0.9978, iter_time=4.58s]
Epoch 0: 29%|██▉ | 3644/12384 [7:43:47<18:36:58, 7.67s/it, loss=0.0011, acc=0.9978, iter_time=4.58s]
Epoch 0: 29%|██▉ | 3644/12384 [7:43:55<18:36:58, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.79s]
Epoch 0: 29%|██▉ | 3645/12384 [7:43:55<18:37:10, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.79s]
Epoch 0: 29%|██▉ | 3645/12384 [7:44:02<18:37:10, 7.67s/it, loss=0.0019, acc=0.9965, iter_time=7.67s]
Epoch 0: 29%|██▉ | 3646/12384 [7:44:02<18:33:37, 7.65s/it, loss=0.0019, acc=0.9965, iter_time=7.67s]
Epoch 0: 29%|██▉ | 3646/12384 [7:44:10<18:33:37, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=4.46s]
Epoch 0: 29%|██▉ | 3647/12384 [7:44:10<18:31:03, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=4.46s]
Epoch 0: 29%|██▉ | 3647/12384 [7:44:17<18:31:03, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=10.67s]
Epoch 0: 29%|██▉ | 3648/12384 [7:44:17<18:29:49, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.67s]
Epoch 0: 29%|██▉ | 3648/12384 [7:44:25<18:29:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 29%|██▉ | 3649/12384 [7:44:25<18:29:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 29%|██▉ | 3649/12384 [7:44:33<18:29:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 29%|██▉ | 3650/12384 [7:44:33<18:29:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 29%|██▉ | 3650/12384 [7:44:40<18:29:24, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.26s]
Epoch 0: 29%|██▉ | 3651/12384 [7:44:40<18:29:09, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.26s]
Epoch 0: 29%|██▉ | 3651/12384 [7:44:48<18:29:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 0: 29%|██▉ | 3652/12384 [7:44:48<18:28:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 0: 29%|██▉ | 3652/12384 [7:44:55<18:28:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 29%|██▉ | 3653/12384 [7:44:55<18:27:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 29%|██▉ | 3653/12384 [7:45:03<18:27:23, 7.61s/it, loss=0.0004, acc=0.9984, iter_time=7.61s]
Epoch 0: 30%|██▉ | 3654/12384 [7:45:03<18:27:04, 7.61s/it, loss=0.0004, acc=0.9984, iter_time=7.61s]
Epoch 0: 30%|██▉ | 3654/12384 [7:45:11<18:27:04, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 30%|██▉ | 3655/12384 [7:45:11<18:27:25, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 30%|██▉ | 3655/12384 [7:45:18<18:27:25, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.08s]
Epoch 0: 30%|██▉ | 3656/12384 [7:45:18<18:30:26, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.08s]
Epoch 0: 30%|██▉ | 3656/12384 [7:45:26<18:30:26, 7.63s/it, loss=0.0004, acc=0.9978, iter_time=7.21s]
Epoch 0: 30%|██▉ | 3657/12384 [7:45:26<18:29:15, 7.63s/it, loss=0.0004, acc=0.9978, iter_time=7.21s]
Epoch 0: 30%|██▉ | 3657/12384 [7:45:34<18:29:15, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 30%|██▉ | 3658/12384 [7:45:34<18:29:51, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 30%|██▉ | 3658/12384 [7:45:41<18:29:51, 7.63s/it, loss=0.0002, acc=0.9987, iter_time=7.93s]
Epoch 0: 30%|██▉ | 3659/12384 [7:45:41<18:40:55, 7.71s/it, loss=0.0002, acc=0.9987, iter_time=7.93s]
Epoch 0: 30%|██▉ | 3659/12384 [7:45:49<18:40:55, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 30%|██▉ | 3660/12384 [7:45:49<18:36:14, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 30%|██▉ | 3660/12384 [7:45:57<18:36:14, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 30%|██▉ | 3661/12384 [7:45:57<18:33:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 30%|██▉ | 3661/12384 [7:46:04<18:33:55, 7.66s/it, loss=0.0002, acc=0.9998, iter_time=7.62s]
Epoch 0: 30%|██▉ | 3662/12384 [7:46:04<18:31:56, 7.65s/it, loss=0.0002, acc=0.9998, iter_time=7.62s]
Epoch 0: 30%|██▉ | 3662/12384 [7:46:12<18:31:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 30%|██▉ | 3663/12384 [7:46:12<18:44:29, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 30%|██▉ | 3663/12384 [7:46:20<18:44:29, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 0: 30%|██▉ | 3664/12384 [7:46:20<18:39:36, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 0: 30%|██▉ | 3664/12384 [7:46:27<18:39:36, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=4.84s]
Epoch 0: 30%|██▉ | 3665/12384 [7:46:27<18:35:31, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=4.84s]
Epoch 0: 30%|██▉ | 3665/12384 [7:46:35<18:35:31, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 0: 30%|██▉ | 3666/12384 [7:46:35<18:32:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 0: 30%|██▉ | 3666/12384 [7:46:43<18:32:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.02s]
Epoch 0: 30%|██▉ | 3667/12384 [7:46:43<18:30:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.02s]
Epoch 0: 30%|██▉ | 3667/12384 [7:46:50<18:30:38, 7.64s/it, loss=0.0002, acc=0.9993, iter_time=11.23s]
Epoch 0: 30%|██▉ | 3668/12384 [7:46:50<18:30:07, 7.64s/it, loss=0.0002, acc=0.9993, iter_time=11.23s]
Epoch 0: 30%|██▉ | 3668/12384 [7:46:58<18:30:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 0: 30%|██▉ | 3669/12384 [7:46:58<18:28:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 0: 30%|██▉ | 3669/12384 [7:47:05<18:28:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 0: 30%|██▉ | 3670/12384 [7:47:05<18:26:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 0: 30%|██▉ | 3670/12384 [7:47:13<18:26:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 30%|██▉ | 3671/12384 [7:47:13<18:25:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 30%|██▉ | 3671/12384 [7:47:21<18:25:03, 7.61s/it, loss=0.0045, acc=0.9915, iter_time=7.57s]
Epoch 0: 30%|██▉ | 3672/12384 [7:47:21<18:25:34, 7.61s/it, loss=0.0045, acc=0.9915, iter_time=7.57s]
Epoch 0: 30%|██▉ | 3672/12384 [7:47:28<18:25:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 0: 30%|██▉ | 3673/12384 [7:47:28<18:24:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 0: 30%|██▉ | 3673/12384 [7:47:36<18:24:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 0: 30%|██▉ | 3674/12384 [7:47:36<18:29:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 0: 30%|██▉ | 3674/12384 [7:47:44<18:29:09, 7.64s/it, loss=0.0002, acc=0.9998, iter_time=7.68s]
Epoch 0: 30%|██▉ | 3675/12384 [7:47:44<18:28:52, 7.64s/it, loss=0.0002, acc=0.9998, iter_time=7.68s]
Epoch 0: 30%|██▉ | 3675/12384 [7:47:51<18:28:52, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=4.06s]
Epoch 0: 30%|██▉ | 3676/12384 [7:47:51<18:26:38, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.06s]
Epoch 0: 30%|██▉ | 3676/12384 [7:47:59<18:26:38, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.68s]
Epoch 0: 30%|██▉ | 3677/12384 [7:47:59<18:29:55, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=9.68s]
Epoch 0: 30%|██▉ | 3677/12384 [7:48:07<18:29:55, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=9.20s]
Epoch 0: 30%|██▉ | 3678/12384 [7:48:07<18:27:09, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.20s]
Epoch 0: 30%|██▉ | 3678/12384 [7:48:14<18:27:09, 7.63s/it, loss=0.0003, acc=0.9975, iter_time=5.79s]
Epoch 0: 30%|██▉ | 3679/12384 [7:48:14<18:26:30, 7.63s/it, loss=0.0003, acc=0.9975, iter_time=5.79s]
Epoch 0: 30%|██▉ | 3679/12384 [7:48:22<18:26:30, 7.63s/it, loss=0.0007, acc=0.9981, iter_time=9.38s]
Epoch 0: 30%|██▉ | 3680/12384 [7:48:22<18:25:35, 7.62s/it, loss=0.0007, acc=0.9981, iter_time=9.38s]
Epoch 0: 30%|██▉ | 3680/12384 [7:48:29<18:25:35, 7.62s/it, loss=0.0006, acc=0.9985, iter_time=7.04s]
Epoch 0: 30%|██▉ | 3681/12384 [7:48:29<18:25:02, 7.62s/it, loss=0.0006, acc=0.9985, iter_time=7.04s]
Epoch 0: 30%|██▉ | 3681/12384 [7:48:37<18:25:02, 7.62s/it, loss=0.0005, acc=0.9975, iter_time=7.63s]
Epoch 0: 30%|██▉ | 3682/12384 [7:48:37<18:25:23, 7.62s/it, loss=0.0005, acc=0.9975, iter_time=7.63s]
Epoch 0: 30%|██▉ | 3682/12384 [7:48:45<18:25:23, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.62s]
Epoch 0: 30%|██▉ | 3683/12384 [7:48:45<18:24:15, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.62s]
Epoch 0: 30%|██▉ | 3683/12384 [7:48:52<18:24:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 0: 30%|██▉ | 3684/12384 [7:48:52<18:23:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 0: 30%|██▉ | 3684/12384 [7:49:00<18:23:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 30%|██▉ | 3685/12384 [7:49:00<18:25:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 30%|██▉ | 3685/12384 [7:49:07<18:25:26, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.43s]
Epoch 0: 30%|██▉ | 3686/12384 [7:49:07<18:24:11, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.43s]
Epoch 0: 30%|██▉ | 3686/12384 [7:49:15<18:24:11, 7.62s/it, loss=0.0004, acc=0.9982, iter_time=8.22s]
Epoch 0: 30%|██▉ | 3687/12384 [7:49:15<18:23:03, 7.61s/it, loss=0.0004, acc=0.9982, iter_time=8.22s]
Epoch 0: 30%|██▉ | 3687/12384 [7:49:23<18:23:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 30%|██▉ | 3688/12384 [7:49:23<18:23:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 30%|██▉ | 3688/12384 [7:49:31<18:23:23, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=5.39s]
Epoch 0: 30%|██▉ | 3689/12384 [7:49:31<18:36:14, 7.70s/it, loss=0.0002, acc=1.0000, iter_time=5.39s]
Epoch 0: 30%|██▉ | 3689/12384 [7:49:38<18:36:14, 7.70s/it, loss=0.0002, acc=1.0000, iter_time=10.18s]
Epoch 0: 30%|██▉ | 3690/12384 [7:49:38<18:32:46, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=10.18s]
Epoch 0: 30%|██▉ | 3690/12384 [7:49:46<18:32:46, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 0: 30%|██▉ | 3691/12384 [7:49:46<18:28:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 0: 30%|██▉ | 3691/12384 [7:49:53<18:28:31, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=6.78s]
Epoch 0: 30%|██▉ | 3692/12384 [7:49:53<18:26:51, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.78s]
Epoch 0: 30%|██▉ | 3692/12384 [7:50:01<18:26:51, 7.64s/it, loss=0.0005, acc=1.0000, iter_time=6.61s]
Epoch 0: 30%|██▉ | 3693/12384 [7:50:01<18:25:17, 7.63s/it, loss=0.0005, acc=1.0000, iter_time=6.61s]
Epoch 0: 30%|██▉ | 3693/12384 [7:50:09<18:25:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 0: 30%|██▉ | 3694/12384 [7:50:09<18:23:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 0: 30%|██▉ | 3694/12384 [7:50:16<18:23:38, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.81s]
Epoch 0: 30%|██▉ | 3695/12384 [7:50:16<18:23:11, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.81s]
Epoch 0: 30%|██▉ | 3695/12384 [7:50:24<18:23:11, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.37s]
Epoch 0: 30%|██▉ | 3696/12384 [7:50:24<18:23:29, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.37s]
Epoch 0: 30%|██▉ | 3696/12384 [7:50:31<18:23:29, 7.62s/it, loss=0.0003, acc=0.9984, iter_time=7.64s]
Epoch 0: 30%|██▉ | 3697/12384 [7:50:32<18:49:41, 7.80s/it, loss=0.0003, acc=0.9984, iter_time=7.64s]
Epoch 0: 30%|██▉ | 3697/12384 [7:50:40<18:49:41, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 0: 30%|██▉ | 3698/12384 [7:50:40<18:40:53, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 0: 30%|██▉ | 3698/12384 [7:50:47<18:40:53, 7.74s/it, loss=0.0002, acc=0.9985, iter_time=7.60s]
Epoch 0: 30%|██▉ | 3699/12384 [7:50:47<18:35:42, 7.71s/it, loss=0.0002, acc=0.9985, iter_time=7.60s]
Epoch 0: 30%|██▉ | 3699/12384 [7:50:55<18:35:42, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=8.02s]
Epoch 0: 30%|██▉ | 3700/12384 [7:50:55<18:31:01, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=8.02s]
Epoch 0: 30%|██▉ | 3700/12384 [7:51:02<18:31:01, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 30%|██▉ | 3701/12384 [7:51:02<18:26:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 30%|██▉ | 3701/12384 [7:51:10<18:26:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 0: 30%|██▉ | 3702/12384 [7:51:10<18:23:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 0: 30%|██▉ | 3702/12384 [7:51:18<18:23:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.61s]
Epoch 0: 30%|██▉ | 3703/12384 [7:51:18<18:23:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.61s]
Epoch 0: 30%|██▉ | 3703/12384 [7:51:25<18:23:04, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=8.29s]
Epoch 0: 30%|██▉ | 3704/12384 [7:51:25<18:22:25, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=8.29s]
Epoch 0: 30%|██▉ | 3704/12384 [7:51:33<18:22:25, 7.62s/it, loss=0.0001, acc=0.9993, iter_time=7.22s]
Epoch 0: 30%|██▉ | 3705/12384 [7:51:33<18:22:05, 7.62s/it, loss=0.0001, acc=0.9993, iter_time=7.22s]
Epoch 0: 30%|██▉ | 3705/12384 [7:51:41<18:22:05, 7.62s/it, loss=0.0008, acc=0.9987, iter_time=4.76s]
Epoch 0: 30%|██▉ | 3706/12384 [7:51:41<18:20:37, 7.61s/it, loss=0.0008, acc=0.9987, iter_time=4.76s]
Epoch 0: 30%|██▉ | 3706/12384 [7:51:48<18:20:37, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=7.86s]
Epoch 0: 30%|██▉ | 3707/12384 [7:51:48<18:21:08, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=7.86s]
Epoch 0: 30%|██▉ | 3707/12384 [7:51:56<18:21:08, 7.61s/it, loss=0.0001, acc=0.9988, iter_time=10.22s]
Epoch 0: 30%|██▉ | 3708/12384 [7:51:56<18:21:11, 7.62s/it, loss=0.0001, acc=0.9988, iter_time=10.22s]
Epoch 0: 30%|██▉ | 3708/12384 [7:52:03<18:21:11, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=7.62s]
Epoch 0: 30%|██▉ | 3709/12384 [7:52:03<18:20:56, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=7.62s]
Epoch 0: 30%|██▉ | 3709/12384 [7:52:11<18:20:56, 7.61s/it, loss=0.0003, acc=0.9998, iter_time=7.61s]
Epoch 0: 30%|██▉ | 3710/12384 [7:52:11<18:20:04, 7.61s/it, loss=0.0003, acc=0.9998, iter_time=7.61s]
Epoch 0: 30%|██▉ | 3710/12384 [7:52:19<18:20:04, 7.61s/it, loss=0.0003, acc=0.9997, iter_time=7.91s]
Epoch 0: 30%|██▉ | 3711/12384 [7:52:19<18:32:46, 7.70s/it, loss=0.0003, acc=0.9997, iter_time=7.91s]
Epoch 0: 30%|██▉ | 3711/12384 [7:52:26<18:32:46, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 30%|██▉ | 3712/12384 [7:52:26<18:28:35, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 30%|██▉ | 3712/12384 [7:52:34<18:28:35, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.27s]
Epoch 0: 30%|██▉ | 3713/12384 [7:52:34<18:28:13, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.27s]
Epoch 0: 30%|██▉ | 3713/12384 [7:52:42<18:28:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 0: 30%|██▉ | 3714/12384 [7:52:42<18:25:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 0: 30%|██▉ | 3714/12384 [7:52:50<18:25:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 0: 30%|██▉ | 3715/12384 [7:52:50<18:38:11, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 0: 30%|██▉ | 3715/12384 [7:52:57<18:38:11, 7.74s/it, loss=0.0005, acc=0.9976, iter_time=9.67s]
Epoch 0: 30%|███ | 3716/12384 [7:52:57<18:33:45, 7.71s/it, loss=0.0005, acc=0.9976, iter_time=9.67s]
Epoch 0: 30%|███ | 3716/12384 [7:53:05<18:33:45, 7.71s/it, loss=0.0014, acc=0.9955, iter_time=7.65s]
Epoch 0: 30%|███ | 3717/12384 [7:53:05<18:29:18, 7.68s/it, loss=0.0014, acc=0.9955, iter_time=7.65s]
Epoch 0: 30%|███ | 3717/12384 [7:53:13<18:29:18, 7.68s/it, loss=0.0002, acc=0.9998, iter_time=5.80s]
Epoch 0: 30%|███ | 3718/12384 [7:53:13<18:26:19, 7.66s/it, loss=0.0002, acc=0.9998, iter_time=5.80s]
Epoch 0: 30%|███ | 3718/12384 [7:53:20<18:26:19, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.97s]
Epoch 0: 30%|███ | 3719/12384 [7:53:20<18:23:23, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.97s]
Epoch 0: 30%|███ | 3719/12384 [7:53:28<18:23:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 0: 30%|███ | 3720/12384 [7:53:28<18:22:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 0: 30%|███ | 3720/12384 [7:53:35<18:22:24, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 0: 30%|███ | 3721/12384 [7:53:35<18:20:44, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 0: 30%|███ | 3721/12384 [7:53:43<18:20:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 30%|███ | 3722/12384 [7:53:43<18:19:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 30%|███ | 3722/12384 [7:53:51<18:19:51, 7.62s/it, loss=0.0003, acc=0.9994, iter_time=7.60s]
Epoch 0: 30%|███ | 3723/12384 [7:53:51<18:20:11, 7.62s/it, loss=0.0003, acc=0.9994, iter_time=7.60s]
Epoch 0: 30%|███ | 3723/12384 [7:53:58<18:20:11, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.33s]
Epoch 0: 30%|███ | 3724/12384 [7:53:58<18:18:31, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.33s]
Epoch 0: 30%|███ | 3724/12384 [7:54:06<18:18:31, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.29s]
Epoch 0: 30%|███ | 3725/12384 [7:54:06<18:18:02, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.29s]
Epoch 0: 30%|███ | 3725/12384 [7:54:13<18:18:02, 7.61s/it, loss=0.0010, acc=0.9984, iter_time=8.19s]
Epoch 0: 30%|███ | 3726/12384 [7:54:13<18:18:23, 7.61s/it, loss=0.0010, acc=0.9984, iter_time=8.19s]
Epoch 0: 30%|███ | 3726/12384 [7:54:21<18:18:23, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 30%|███ | 3727/12384 [7:54:21<18:18:48, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 30%|███ | 3727/12384 [7:54:29<18:18:48, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.57s]
Epoch 0: 30%|███ | 3728/12384 [7:54:29<18:18:24, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.57s]
Epoch 0: 30%|███ | 3728/12384 [7:54:36<18:18:24, 7.61s/it, loss=0.0002, acc=0.9991, iter_time=7.64s]
Epoch 0: 30%|███ | 3729/12384 [7:54:36<18:17:25, 7.61s/it, loss=0.0002, acc=0.9991, iter_time=7.64s]
Epoch 0: 30%|███ | 3729/12384 [7:54:44<18:17:25, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 30%|███ | 3730/12384 [7:54:44<18:17:31, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 30%|███ | 3730/12384 [7:54:51<18:17:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.26s]
Epoch 0: 30%|███ | 3731/12384 [7:54:51<18:17:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.26s]
Epoch 0: 30%|███ | 3731/12384 [7:54:59<18:17:24, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=6.13s]
Epoch 0: 30%|███ | 3732/12384 [7:54:59<18:22:04, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=6.13s]
Epoch 0: 30%|███ | 3732/12384 [7:55:07<18:22:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.55s]
Epoch 0: 30%|███ | 3733/12384 [7:55:07<18:19:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.55s]
Epoch 0: 30%|███ | 3733/12384 [7:55:14<18:19:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 30%|███ | 3734/12384 [7:55:14<18:17:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 30%|███ | 3734/12384 [7:55:22<18:17:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 30%|███ | 3735/12384 [7:55:22<18:17:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 30%|███ | 3735/12384 [7:55:30<18:17:24, 7.61s/it, loss=0.0038, acc=0.9976, iter_time=7.99s]
Epoch 0: 30%|███ | 3736/12384 [7:55:30<18:18:07, 7.62s/it, loss=0.0038, acc=0.9976, iter_time=7.99s]
Epoch 0: 30%|███ | 3736/12384 [7:55:37<18:18:07, 7.62s/it, loss=0.0008, acc=0.9975, iter_time=6.54s]
Epoch 0: 30%|███ | 3737/12384 [7:55:37<18:17:25, 7.61s/it, loss=0.0008, acc=0.9975, iter_time=6.54s]
Epoch 0: 30%|███ | 3737/12384 [7:55:45<18:17:25, 7.61s/it, loss=0.0002, acc=0.9995, iter_time=6.53s]
Epoch 0: 30%|███ | 3738/12384 [7:55:45<18:17:55, 7.62s/it, loss=0.0002, acc=0.9995, iter_time=6.53s]
Epoch 0: 30%|███ | 3738/12384 [7:55:52<18:17:55, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=9.38s]
Epoch 0: 30%|███ | 3739/12384 [7:55:52<18:16:37, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=9.38s]
Epoch 0: 30%|███ | 3739/12384 [7:56:00<18:16:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 30%|███ | 3740/12384 [7:56:00<18:17:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 30%|███ | 3740/12384 [7:56:08<18:17:10, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.68s]
Epoch 0: 30%|███ | 3741/12384 [7:56:08<18:31:10, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.68s]
Epoch 0: 30%|███ | 3741/12384 [7:56:16<18:31:10, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 0: 30%|███ | 3742/12384 [7:56:16<18:26:50, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 0: 30%|███ | 3742/12384 [7:56:23<18:26:50, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=8.73s]
Epoch 0: 30%|███ | 3743/12384 [7:56:23<18:23:52, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=8.73s]
Epoch 0: 30%|███ | 3743/12384 [7:56:31<18:23:52, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 30%|███ | 3744/12384 [7:56:31<18:22:01, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 30%|███ | 3744/12384 [7:56:38<18:22:01, 7.65s/it, loss=0.0010, acc=0.9992, iter_time=7.64s]
Epoch 0: 30%|███ | 3745/12384 [7:56:38<18:20:24, 7.64s/it, loss=0.0010, acc=0.9992, iter_time=7.64s]
Epoch 0: 30%|███ | 3745/12384 [7:56:46<18:20:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 0: 30%|███ | 3746/12384 [7:56:46<18:18:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 0: 30%|███ | 3746/12384 [7:56:54<18:18:13, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.02s]
Epoch 0: 30%|███ | 3747/12384 [7:56:54<18:17:55, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.02s]
Epoch 0: 30%|███ | 3747/12384 [7:57:01<18:17:55, 7.63s/it, loss=0.0002, acc=0.9983, iter_time=9.40s]
Epoch 0: 30%|███ | 3748/12384 [7:57:01<18:18:08, 7.63s/it, loss=0.0002, acc=0.9983, iter_time=9.40s]
Epoch 0: 30%|███ | 3748/12384 [7:57:09<18:18:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.46s]
Epoch 0: 30%|███ | 3749/12384 [7:57:09<18:17:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.46s]
Epoch 0: 30%|███ | 3749/12384 [7:57:17<18:17:35, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.24s]
Epoch 0: 30%|███ | 3750/12384 [7:57:17<18:17:21, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.24s]
Epoch 0: 30%|███ | 3750/12384 [7:57:24<18:17:21, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.40s]
Epoch 0: 30%|███ | 3751/12384 [7:57:24<18:16:33, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.40s]
Epoch 0: 30%|███ | 3751/12384 [7:57:32<18:16:33, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.37s]
Epoch 0: 30%|███ | 3752/12384 [7:57:32<18:16:12, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.37s]
Epoch 0: 30%|███ | 3752/12384 [7:57:39<18:16:12, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 30%|███ | 3753/12384 [7:57:39<18:15:08, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 30%|███ | 3753/12384 [7:57:47<18:15:08, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 30%|███ | 3754/12384 [7:57:47<18:15:12, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 30%|███ | 3754/12384 [7:57:55<18:15:12, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 30%|███ | 3755/12384 [7:57:55<18:14:48, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 30%|███ | 3755/12384 [7:58:02<18:14:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 30%|███ | 3756/12384 [7:58:02<18:14:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 30%|███ | 3756/12384 [7:58:10<18:14:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 0: 30%|███ | 3757/12384 [7:58:10<18:13:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 0: 30%|███ | 3757/12384 [7:58:17<18:13:21, 7.60s/it, loss=0.0004, acc=0.9980, iter_time=4.97s]
Epoch 0: 30%|███ | 3758/12384 [7:58:17<18:12:43, 7.60s/it, loss=0.0004, acc=0.9980, iter_time=4.97s]
Epoch 0: 30%|███ | 3758/12384 [7:58:25<18:12:43, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.40s]
Epoch 0: 30%|███ | 3759/12384 [7:58:25<18:13:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.40s]
Epoch 0: 30%|███ | 3759/12384 [7:58:33<18:13:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 30%|███ | 3760/12384 [7:58:33<18:13:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 30%|███ | 3760/12384 [7:58:40<18:13:10, 7.61s/it, loss=0.0029, acc=0.9923, iter_time=6.45s]
Epoch 0: 30%|███ | 3761/12384 [7:58:40<18:13:35, 7.61s/it, loss=0.0029, acc=0.9923, iter_time=6.45s]
Epoch 0: 30%|███ | 3761/12384 [7:58:48<18:13:35, 7.61s/it, loss=0.0002, acc=0.9996, iter_time=8.81s]
Epoch 0: 30%|███ | 3762/12384 [7:58:48<18:12:35, 7.60s/it, loss=0.0002, acc=0.9996, iter_time=8.81s]
Epoch 0: 30%|███ | 3762/12384 [7:58:56<18:12:35, 7.60s/it, loss=0.0001, acc=0.9989, iter_time=7.91s]
Epoch 0: 30%|███ | 3763/12384 [7:58:56<18:25:25, 7.69s/it, loss=0.0001, acc=0.9989, iter_time=7.91s]
Epoch 0: 30%|███ | 3763/12384 [7:59:03<18:25:25, 7.69s/it, loss=0.0002, acc=1.0000, iter_time=7.59s]
Epoch 0: 30%|███ | 3764/12384 [7:59:03<18:21:22, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=7.59s]
Epoch 0: 30%|███ | 3764/12384 [7:59:11<18:21:22, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 30%|███ | 3765/12384 [7:59:11<18:24:01, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 30%|███ | 3765/12384 [7:59:19<18:24:01, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 0: 30%|███ | 3766/12384 [7:59:19<18:22:28, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 0: 30%|███ | 3766/12384 [7:59:26<18:22:28, 7.68s/it, loss=0.0001, acc=0.9997, iter_time=5.04s]
Epoch 0: 30%|███ | 3767/12384 [7:59:26<18:20:01, 7.66s/it, loss=0.0001, acc=0.9997, iter_time=5.04s]
Epoch 0: 30%|███ | 3767/12384 [7:59:34<18:20:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.53s]
Epoch 0: 30%|███ | 3768/12384 [7:59:34<18:33:08, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=10.53s]
Epoch 0: 30%|███ | 3768/12384 [7:59:42<18:33:08, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 30%|███ | 3769/12384 [7:59:42<18:26:59, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 30%|███ | 3769/12384 [7:59:50<18:26:59, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 30%|███ | 3770/12384 [7:59:50<18:25:27, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 30%|███ | 3770/12384 [7:59:57<18:25:27, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 30%|███ | 3771/12384 [7:59:57<18:21:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 30%|███ | 3771/12384 [8:00:05<18:21:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 0: 30%|███ | 3772/12384 [8:00:05<18:18:50, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 0: 30%|███ | 3772/12384 [8:00:12<18:18:50, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.35s]
Epoch 0: 30%|███ | 3773/12384 [8:00:12<18:17:12, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.35s]
Epoch 0: 30%|███ | 3773/12384 [8:00:20<18:17:12, 7.65s/it, loss=0.0030, acc=1.0000, iter_time=8.92s]
Epoch 0: 30%|███ | 3774/12384 [8:00:20<18:14:34, 7.63s/it, loss=0.0030, acc=1.0000, iter_time=8.92s]
Epoch 0: 30%|███ | 3774/12384 [8:00:28<18:14:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.57s]
Epoch 0: 30%|███ | 3775/12384 [8:00:28<18:13:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.57s]
Epoch 0: 30%|███ | 3775/12384 [8:00:35<18:13:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.52s]
Epoch 0: 30%|███ | 3776/12384 [8:00:35<18:13:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.52s]
Epoch 0: 30%|███ | 3776/12384 [8:00:43<18:13:41, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.26s]
Epoch 0: 30%|███ | 3777/12384 [8:00:43<18:12:56, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.26s]
Epoch 0: 30%|███ | 3777/12384 [8:00:51<18:12:56, 7.62s/it, loss=0.0002, acc=0.9986, iter_time=7.64s]
Epoch 0: 31%|███ | 3778/12384 [8:00:51<18:13:54, 7.63s/it, loss=0.0002, acc=0.9986, iter_time=7.64s]
Epoch 0: 31%|███ | 3778/12384 [8:00:58<18:13:54, 7.63s/it, loss=0.0004, acc=0.9988, iter_time=5.88s]
Epoch 0: 31%|███ | 3779/12384 [8:00:58<18:14:36, 7.63s/it, loss=0.0004, acc=0.9988, iter_time=5.88s]
Epoch 0: 31%|███ | 3779/12384 [8:01:06<18:14:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 0: 31%|███ | 3780/12384 [8:01:06<18:11:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 0: 31%|███ | 3780/12384 [8:01:13<18:11:58, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.58s]
Epoch 0: 31%|███ | 3781/12384 [8:01:13<18:10:20, 7.60s/it, loss=0.0002, acc=1.0000, iter_time=7.58s]
Epoch 0: 31%|███ | 3781/12384 [8:01:21<18:10:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 31%|███ | 3782/12384 [8:01:21<18:10:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 31%|███ | 3782/12384 [8:01:29<18:10:00, 7.60s/it, loss=0.0002, acc=0.9987, iter_time=7.61s]
Epoch 0: 31%|███ | 3783/12384 [8:01:29<18:10:47, 7.61s/it, loss=0.0002, acc=0.9987, iter_time=7.61s]
Epoch 0: 31%|███ | 3783/12384 [8:01:36<18:10:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 31%|███ | 3784/12384 [8:01:36<18:11:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 31%|███ | 3784/12384 [8:01:44<18:11:42, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=7.27s]
Epoch 0: 31%|███ | 3785/12384 [8:01:44<18:12:11, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=7.27s]
Epoch 0: 31%|███ | 3785/12384 [8:01:51<18:12:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 31%|███ | 3786/12384 [8:01:51<18:13:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 31%|███ | 3786/12384 [8:01:59<18:13:22, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.19s]
Epoch 0: 31%|███ | 3787/12384 [8:01:59<18:11:58, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.19s]
Epoch 0: 31%|███ | 3787/12384 [8:02:07<18:11:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 0: 31%|███ | 3788/12384 [8:02:07<18:10:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 0: 31%|███ | 3788/12384 [8:02:14<18:10:51, 7.61s/it, loss=0.0006, acc=0.9989, iter_time=7.29s]
Epoch 0: 31%|███ | 3789/12384 [8:02:14<18:10:03, 7.61s/it, loss=0.0006, acc=0.9989, iter_time=7.29s]
Epoch 0: 31%|███ | 3789/12384 [8:02:22<18:10:03, 7.61s/it, loss=0.0004, acc=1.0000, iter_time=6.07s]
Epoch 0: 31%|███ | 3790/12384 [8:02:22<18:09:24, 7.61s/it, loss=0.0004, acc=1.0000, iter_time=6.07s]
Epoch 0: 31%|███ | 3790/12384 [8:02:30<18:09:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.31s]
Epoch 0: 31%|███ | 3791/12384 [8:02:30<18:10:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.31s]
Epoch 0: 31%|███ | 3791/12384 [8:02:37<18:10:22, 7.61s/it, loss=0.0021, acc=0.9974, iter_time=11.15s]
Epoch 0: 31%|███ | 3792/12384 [8:02:37<18:10:10, 7.61s/it, loss=0.0021, acc=0.9974, iter_time=11.15s]
Epoch 0: 31%|███ | 3792/12384 [8:02:45<18:10:10, 7.61s/it, loss=0.0003, acc=0.9998, iter_time=7.20s]
Epoch 0: 31%|███ | 3793/12384 [8:02:45<18:09:09, 7.61s/it, loss=0.0003, acc=0.9998, iter_time=7.20s]
Epoch 0: 31%|███ | 3793/12384 [8:02:53<18:09:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 0: 31%|███ | 3794/12384 [8:02:53<18:23:05, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 0: 31%|███ | 3794/12384 [8:03:00<18:23:05, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 0: 31%|███ | 3795/12384 [8:03:00<18:17:22, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 0: 31%|███ | 3795/12384 [8:03:08<18:17:22, 7.67s/it, loss=0.0002, acc=0.9998, iter_time=7.59s]
Epoch 0: 31%|███ | 3796/12384 [8:03:08<18:14:46, 7.65s/it, loss=0.0002, acc=0.9998, iter_time=7.59s]
Epoch 0: 31%|███ | 3796/12384 [8:03:15<18:14:46, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=6.43s]
Epoch 0: 31%|███ | 3797/12384 [8:03:15<18:12:53, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.43s]
Epoch 0: 31%|███ | 3797/12384 [8:03:23<18:12:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 0: 31%|███ | 3798/12384 [8:03:23<18:11:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 0: 31%|███ | 3798/12384 [8:03:31<18:11:07, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=7.60s]
Epoch 0: 31%|███ | 3799/12384 [8:03:31<18:11:07, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=7.60s]
Epoch 0: 31%|███ | 3799/12384 [8:03:38<18:11:07, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.01s]
Epoch 0: 31%|███ | 3800/12384 [8:03:38<18:09:37, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.01s]
Epoch 0: 31%|███ | 3800/12384 [8:03:46<18:09:37, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=7.18s]
Epoch 0: 31%|███ | 3801/12384 [8:03:46<18:07:54, 7.61s/it, loss=0.0002, acc=0.9998, iter_time=7.18s]
Epoch 0: 31%|███ | 3801/12384 [8:03:54<18:07:54, 7.61s/it, loss=0.0016, acc=0.9968, iter_time=7.69s]
Epoch 0: 31%|███ | 3802/12384 [8:03:54<18:11:33, 7.63s/it, loss=0.0016, acc=0.9968, iter_time=7.69s]
Epoch 0: 31%|███ | 3802/12384 [8:04:01<18:11:33, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.50s]
Epoch 0: 31%|███ | 3803/12384 [8:04:01<18:11:48, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.50s]
Epoch 0: 31%|███ | 3803/12384 [8:04:09<18:11:48, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.71s]
Epoch 0: 31%|███ | 3804/12384 [8:04:09<18:10:34, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.71s]
Epoch 0: 31%|███ | 3804/12384 [8:04:16<18:10:34, 7.63s/it, loss=0.0003, acc=0.9999, iter_time=7.66s]
Epoch 0: 31%|███ | 3805/12384 [8:04:16<18:09:54, 7.62s/it, loss=0.0003, acc=0.9999, iter_time=7.66s]
Epoch 0: 31%|███ | 3805/12384 [8:04:24<18:09:54, 7.62s/it, loss=0.0011, acc=0.9975, iter_time=7.62s]
Epoch 0: 31%|███ | 3806/12384 [8:04:24<18:10:17, 7.63s/it, loss=0.0011, acc=0.9975, iter_time=7.62s]
Epoch 0: 31%|███ | 3806/12384 [8:04:32<18:10:17, 7.63s/it, loss=0.0014, acc=0.9951, iter_time=7.60s]
Epoch 0: 31%|███ | 3807/12384 [8:04:32<18:08:55, 7.62s/it, loss=0.0014, acc=0.9951, iter_time=7.60s]
Epoch 0: 31%|███ | 3807/12384 [8:04:39<18:08:55, 7.62s/it, loss=0.0012, acc=0.9949, iter_time=7.54s]
Epoch 0: 31%|███ | 3808/12384 [8:04:39<18:07:51, 7.61s/it, loss=0.0012, acc=0.9949, iter_time=7.54s]
Epoch 0: 31%|███ | 3808/12384 [8:04:47<18:07:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 31%|███ | 3809/12384 [8:04:47<18:07:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 31%|███ | 3809/12384 [8:04:54<18:07:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 31%|███ | 3810/12384 [8:04:54<18:08:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 31%|███ | 3810/12384 [8:05:02<18:08:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 0: 31%|███ | 3811/12384 [8:05:02<18:06:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 0: 31%|███ | 3811/12384 [8:05:10<18:06:46, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.83s]
Epoch 0: 31%|███ | 3812/12384 [8:05:10<18:07:02, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.83s]
Epoch 0: 31%|███ | 3812/12384 [8:05:17<18:07:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 0: 31%|███ | 3813/12384 [8:05:17<18:06:12, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 0: 31%|███ | 3813/12384 [8:05:25<18:06:12, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.94s]
Epoch 0: 31%|███ | 3814/12384 [8:05:25<18:06:07, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.94s]
Epoch 0: 31%|███ | 3814/12384 [8:05:32<18:06:07, 7.60s/it, loss=0.0002, acc=1.0000, iter_time=10.47s]
Epoch 0: 31%|███ | 3815/12384 [8:05:32<18:05:48, 7.60s/it, loss=0.0002, acc=1.0000, iter_time=10.47s]
Epoch 0: 31%|███ | 3815/12384 [8:05:40<18:05:48, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 0: 31%|███ | 3816/12384 [8:05:40<18:06:17, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 0: 31%|███ | 3816/12384 [8:05:48<18:06:17, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.49s]
Epoch 0: 31%|███ | 3817/12384 [8:05:48<18:06:56, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.49s]
Epoch 0: 31%|███ | 3817/12384 [8:05:55<18:06:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 0: 31%|███ | 3818/12384 [8:05:55<18:06:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 0: 31%|███ | 3818/12384 [8:06:03<18:06:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 0: 31%|███ | 3819/12384 [8:06:03<18:06:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 0: 31%|███ | 3819/12384 [8:06:11<18:06:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 0: 31%|███ | 3820/12384 [8:06:11<18:07:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 0: 31%|███ | 3820/12384 [8:06:18<18:07:40, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.69s]
Epoch 0: 31%|███ | 3821/12384 [8:06:18<18:20:20, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.69s]
Epoch 0: 31%|███ | 3821/12384 [8:06:26<18:20:20, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.87s]
Epoch 0: 31%|███ | 3822/12384 [8:06:26<18:15:47, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.87s]
Epoch 0: 31%|███ | 3822/12384 [8:06:34<18:15:47, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 0: 31%|███ | 3823/12384 [8:06:34<18:12:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 0: 31%|███ | 3823/12384 [8:06:41<18:12:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 0: 31%|███ | 3824/12384 [8:06:41<18:10:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 0: 31%|███ | 3824/12384 [8:06:49<18:10:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.77s]
Epoch 0: 31%|███ | 3825/12384 [8:06:49<18:09:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.77s]
Epoch 0: 31%|███ | 3825/12384 [8:06:57<18:09:11, 7.64s/it, loss=0.0006, acc=0.9986, iter_time=10.51s]
Epoch 0: 31%|███ | 3826/12384 [8:06:57<18:08:23, 7.63s/it, loss=0.0006, acc=0.9986, iter_time=10.51s]
Epoch 0: 31%|███ | 3826/12384 [8:07:04<18:08:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 31%|███ | 3827/12384 [8:07:04<18:07:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 31%|███ | 3827/12384 [8:07:12<18:07:37, 7.63s/it, loss=0.0013, acc=0.9960, iter_time=7.61s]
Epoch 0: 31%|███ | 3828/12384 [8:07:12<18:07:33, 7.63s/it, loss=0.0013, acc=0.9960, iter_time=7.61s]
Epoch 0: 31%|███ | 3828/12384 [8:07:19<18:07:33, 7.63s/it, loss=0.0006, acc=0.9993, iter_time=7.63s]
Epoch 0: 31%|███ | 3829/12384 [8:07:19<18:07:00, 7.62s/it, loss=0.0006, acc=0.9993, iter_time=7.63s]
Epoch 0: 31%|███ | 3829/12384 [8:07:27<18:07:00, 7.62s/it, loss=0.0004, acc=0.9979, iter_time=6.76s]
Epoch 0: 31%|███ | 3830/12384 [8:07:27<18:05:58, 7.62s/it, loss=0.0004, acc=0.9979, iter_time=6.76s]
Epoch 0: 31%|███ | 3830/12384 [8:07:35<18:05:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.46s]
Epoch 0: 31%|███ | 3831/12384 [8:07:35<18:05:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.46s]
Epoch 0: 31%|███ | 3831/12384 [8:07:42<18:05:40, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.55s]
Epoch 0: 31%|███ | 3832/12384 [8:07:42<18:04:45, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.55s]
Epoch 0: 31%|███ | 3832/12384 [8:07:50<18:04:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 31%|███ | 3833/12384 [8:07:50<18:05:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 31%|███ | 3833/12384 [8:07:57<18:05:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 31%|███ | 3834/12384 [8:07:57<18:05:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 31%|███ | 3834/12384 [8:08:05<18:05:10, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 31%|███ | 3835/12384 [8:08:05<18:04:32, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 31%|███ | 3835/12384 [8:08:13<18:04:32, 7.61s/it, loss=0.0003, acc=0.9979, iter_time=4.22s]
Epoch 0: 31%|███ | 3836/12384 [8:08:13<18:04:55, 7.62s/it, loss=0.0003, acc=0.9979, iter_time=4.22s]
Epoch 0: 31%|███ | 3836/12384 [8:08:20<18:04:55, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.99s]
Epoch 0: 31%|███ | 3837/12384 [8:08:20<18:03:51, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.99s]
Epoch 0: 31%|███ | 3837/12384 [8:08:28<18:03:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 0: 31%|███ | 3838/12384 [8:08:28<18:02:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 0: 31%|███ | 3838/12384 [8:08:35<18:02:55, 7.60s/it, loss=0.0009, acc=0.9990, iter_time=6.53s]
Epoch 0: 31%|███ | 3839/12384 [8:08:35<18:03:08, 7.61s/it, loss=0.0009, acc=0.9990, iter_time=6.53s]
Epoch 0: 31%|███ | 3839/12384 [8:08:43<18:03:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.30s]
Epoch 0: 31%|███ | 3840/12384 [8:08:43<18:03:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.30s]
Epoch 0: 31%|███ | 3840/12384 [8:08:51<18:03:37, 7.61s/it, loss=0.0004, acc=0.9998, iter_time=5.24s]
Epoch 0: 31%|███ | 3841/12384 [8:08:51<18:03:10, 7.61s/it, loss=0.0004, acc=0.9998, iter_time=5.24s]
Epoch 0: 31%|███ | 3841/12384 [8:08:58<18:03:10, 7.61s/it, loss=0.0002, acc=0.9980, iter_time=5.62s]
Epoch 0: 31%|███ | 3842/12384 [8:08:58<18:04:06, 7.61s/it, loss=0.0002, acc=0.9980, iter_time=5.62s]
Epoch 0: 31%|███ | 3842/12384 [8:09:06<18:04:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.91s]
Epoch 0: 31%|███ | 3843/12384 [8:09:06<18:15:46, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=11.91s]
Epoch 0: 31%|███ | 3843/12384 [8:09:14<18:15:46, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 0: 31%|███ | 3844/12384 [8:09:14<18:11:26, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 0: 31%|███ | 3844/12384 [8:09:21<18:11:26, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=10.16s]
Epoch 0: 31%|███ | 3845/12384 [8:09:21<18:07:06, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=10.16s]
Epoch 0: 31%|███ | 3845/12384 [8:09:29<18:07:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 0: 31%|███ | 3846/12384 [8:09:29<18:05:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 0: 31%|███ | 3846/12384 [8:09:37<18:05:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 0: 31%|███ | 3847/12384 [8:09:37<18:23:17, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 0: 31%|███ | 3847/12384 [8:09:45<18:23:17, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=9.72s]
Epoch 0: 31%|███ | 3848/12384 [8:09:45<18:16:25, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.72s]
Epoch 0: 31%|███ | 3848/12384 [8:09:52<18:16:25, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 31%|███ | 3849/12384 [8:09:52<18:12:38, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 31%|███ | 3849/12384 [8:10:00<18:12:38, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=8.04s]
Epoch 0: 31%|███ | 3850/12384 [8:10:00<18:09:52, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=8.04s]
Epoch 0: 31%|███ | 3850/12384 [8:10:07<18:09:52, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 31%|███ | 3851/12384 [8:10:07<18:06:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 31%|███ | 3851/12384 [8:10:15<18:06:55, 7.64s/it, loss=0.0002, acc=0.9998, iter_time=7.59s]
Epoch 0: 31%|███ | 3852/12384 [8:10:15<18:09:09, 7.66s/it, loss=0.0002, acc=0.9998, iter_time=7.59s]
Epoch 0: 31%|███ | 3852/12384 [8:10:23<18:09:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.56s]
Epoch 0: 31%|███ | 3853/12384 [8:10:23<18:08:52, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.56s]
Epoch 0: 31%|███ | 3853/12384 [8:10:30<18:08:52, 7.66s/it, loss=0.0003, acc=0.9996, iter_time=10.81s]
Epoch 0: 31%|███ | 3854/12384 [8:10:30<18:07:07, 7.65s/it, loss=0.0003, acc=0.9996, iter_time=10.81s]
Epoch 0: 31%|███ | 3854/12384 [8:10:38<18:07:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.33s]
Epoch 0: 31%|███ | 3855/12384 [8:10:38<18:05:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.33s]
Epoch 0: 31%|███ | 3855/12384 [8:10:46<18:05:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.28s]
Epoch 0: 31%|███ | 3856/12384 [8:10:46<18:04:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.28s]
Epoch 0: 31%|███ | 3856/12384 [8:10:53<18:04:54, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=5.43s]
Epoch 0: 31%|███ | 3857/12384 [8:10:53<18:03:19, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=5.43s]
Epoch 0: 31%|███ | 3857/12384 [8:11:01<18:03:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 31%|███ | 3858/12384 [8:11:01<18:03:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 31%|███ | 3858/12384 [8:11:09<18:03:32, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.06s]
Epoch 0: 31%|███ | 3859/12384 [8:11:09<18:03:28, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.06s]
Epoch 0: 31%|███ | 3859/12384 [8:11:16<18:03:28, 7.63s/it, loss=0.0002, acc=0.9998, iter_time=10.97s]
Epoch 0: 31%|███ | 3860/12384 [8:11:16<18:02:09, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=10.97s]
Epoch 0: 31%|███ | 3860/12384 [8:11:24<18:02:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 31%|███ | 3861/12384 [8:11:24<18:03:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 31%|███ | 3861/12384 [8:11:31<18:03:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 31%|███ | 3862/12384 [8:11:31<18:01:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 31%|███ | 3862/12384 [8:11:39<18:01:57, 7.62s/it, loss=0.0009, acc=0.9974, iter_time=5.02s]
Epoch 0: 31%|███ | 3863/12384 [8:11:39<18:01:02, 7.61s/it, loss=0.0009, acc=0.9974, iter_time=5.02s]
Epoch 0: 31%|███ | 3863/12384 [8:11:47<18:01:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.62s]
Epoch 0: 31%|███ | 3864/12384 [8:11:47<18:02:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.62s]
Epoch 0: 31%|███ | 3864/12384 [8:11:54<18:02:55, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.90s]
Epoch 0: 31%|███ | 3865/12384 [8:11:54<18:02:32, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.90s]
Epoch 0: 31%|███ | 3865/12384 [8:12:02<18:02:32, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.20s]
Epoch 0: 31%|███ | 3866/12384 [8:12:02<18:01:38, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.20s]
Epoch 0: 31%|███ | 3866/12384 [8:12:09<18:01:38, 7.62s/it, loss=0.0005, acc=0.9998, iter_time=11.34s]
Epoch 0: 31%|███ | 3867/12384 [8:12:09<18:02:27, 7.63s/it, loss=0.0005, acc=0.9998, iter_time=11.34s]
Epoch 0: 31%|███ | 3867/12384 [8:12:17<18:02:27, 7.63s/it, loss=0.0018, acc=0.9991, iter_time=5.84s]
Epoch 0: 31%|███ | 3868/12384 [8:12:17<18:01:08, 7.62s/it, loss=0.0018, acc=0.9991, iter_time=5.84s]
Epoch 0: 31%|███ | 3868/12384 [8:12:25<18:01:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 0: 31%|███ | 3869/12384 [8:12:25<18:11:52, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 0: 31%|███ | 3869/12384 [8:12:33<18:11:52, 7.69s/it, loss=0.0003, acc=0.9984, iter_time=7.60s]
Epoch 0: 31%|███▏ | 3870/12384 [8:12:33<18:08:40, 7.67s/it, loss=0.0003, acc=0.9984, iter_time=7.60s]
Epoch 0: 31%|███▏ | 3870/12384 [8:12:40<18:08:40, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 31%|███▏ | 3871/12384 [8:12:40<18:06:12, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 31%|███▏ | 3871/12384 [8:12:48<18:06:12, 7.66s/it, loss=0.0003, acc=0.9984, iter_time=7.59s]
Epoch 0: 31%|███▏ | 3872/12384 [8:12:48<18:04:45, 7.65s/it, loss=0.0003, acc=0.9984, iter_time=7.59s]
Epoch 0: 31%|███▏ | 3872/12384 [8:12:56<18:04:45, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=5.16s]
Epoch 0: 31%|███▏ | 3873/12384 [8:12:56<18:16:45, 7.73s/it, loss=0.0002, acc=1.0000, iter_time=5.16s]
Epoch 0: 31%|███▏ | 3873/12384 [8:13:03<18:16:45, 7.73s/it, loss=0.0011, acc=0.9950, iter_time=10.42s]
Epoch 0: 31%|███▏ | 3874/12384 [8:13:03<18:12:02, 7.70s/it, loss=0.0011, acc=0.9950, iter_time=10.42s]
Epoch 0: 31%|███▏ | 3874/12384 [8:13:11<18:12:02, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 0: 31%|███▏ | 3875/12384 [8:13:11<18:08:32, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 0: 31%|███▏ | 3875/12384 [8:13:19<18:08:32, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=9.73s]
Epoch 0: 31%|███▏ | 3876/12384 [8:13:19<18:07:00, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=9.73s]
Epoch 0: 31%|███▏ | 3876/12384 [8:13:26<18:07:00, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 0: 31%|███▏ | 3877/12384 [8:13:26<18:03:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 0: 31%|███▏ | 3877/12384 [8:13:34<18:03:49, 7.64s/it, loss=0.0010, acc=0.9956, iter_time=8.86s]
Epoch 0: 31%|███▏ | 3878/12384 [8:13:34<18:04:34, 7.65s/it, loss=0.0010, acc=0.9956, iter_time=8.86s]
Epoch 0: 31%|███▏ | 3878/12384 [8:13:41<18:04:34, 7.65s/it, loss=0.0005, acc=0.9971, iter_time=5.54s]
Epoch 0: 31%|███▏ | 3879/12384 [8:13:41<18:01:54, 7.63s/it, loss=0.0005, acc=0.9971, iter_time=5.54s]
Epoch 0: 31%|███▏ | 3879/12384 [8:13:49<18:01:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.61s]
Epoch 0: 31%|███▏ | 3880/12384 [8:13:49<18:00:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.61s]
Epoch 0: 31%|███▏ | 3880/12384 [8:13:57<18:00:39, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.57s]
Epoch 0: 31%|███▏ | 3881/12384 [8:13:57<18:00:32, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.57s]
Epoch 0: 31%|███▏ | 3881/12384 [8:14:04<18:00:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.57s]
Epoch 0: 31%|███▏ | 3882/12384 [8:14:04<17:59:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.57s]
Epoch 0: 31%|███▏ | 3882/12384 [8:14:12<17:59:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 0: 31%|███▏ | 3883/12384 [8:14:12<17:59:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 0: 31%|███▏ | 3883/12384 [8:14:20<17:59:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 31%|███▏ | 3884/12384 [8:14:20<17:59:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 31%|███▏ | 3884/12384 [8:14:27<17:59:21, 7.62s/it, loss=0.0002, acc=0.9997, iter_time=6.17s]
Epoch 0: 31%|███▏ | 3885/12384 [8:14:27<17:59:41, 7.62s/it, loss=0.0002, acc=0.9997, iter_time=6.17s]
Epoch 0: 31%|███▏ | 3885/12384 [8:14:35<17:59:41, 7.62s/it, loss=0.0003, acc=0.9986, iter_time=9.08s]
Epoch 0: 31%|███▏ | 3886/12384 [8:14:35<17:59:35, 7.62s/it, loss=0.0003, acc=0.9986, iter_time=9.08s]
Epoch 0: 31%|███▏ | 3886/12384 [8:14:42<17:59:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 31%|███▏ | 3887/12384 [8:14:42<18:01:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 31%|███▏ | 3887/12384 [8:14:50<18:01:13, 7.63s/it, loss=0.0002, acc=0.9998, iter_time=8.05s]
Epoch 0: 31%|███▏ | 3888/12384 [8:14:50<18:00:24, 7.63s/it, loss=0.0002, acc=0.9998, iter_time=8.05s]
Epoch 0: 31%|███▏ | 3888/12384 [8:14:58<18:00:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 31%|███▏ | 3889/12384 [8:14:58<17:58:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 31%|███▏ | 3889/12384 [8:15:05<17:58:46, 7.62s/it, loss=0.0015, acc=0.9967, iter_time=6.11s]
Epoch 0: 31%|███▏ | 3890/12384 [8:15:05<17:58:39, 7.62s/it, loss=0.0015, acc=0.9967, iter_time=6.11s]
Epoch 0: 31%|███▏ | 3890/12384 [8:15:13<17:58:39, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.11s]
Epoch 0: 31%|███▏ | 3891/12384 [8:15:13<17:56:53, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.11s]
Epoch 0: 31%|███▏ | 3891/12384 [8:15:21<17:56:53, 7.61s/it, loss=0.0005, acc=0.9980, iter_time=6.37s]
Epoch 0: 31%|███▏ | 3892/12384 [8:15:21<17:57:17, 7.61s/it, loss=0.0005, acc=0.9980, iter_time=6.37s]
Epoch 0: 31%|███▏ | 3892/12384 [8:15:28<17:57:17, 7.61s/it, loss=0.0003, acc=0.9991, iter_time=8.85s]
Epoch 0: 31%|███▏ | 3893/12384 [8:15:28<17:56:59, 7.61s/it, loss=0.0003, acc=0.9991, iter_time=8.85s]
Epoch 0: 31%|███▏ | 3893/12384 [8:15:36<17:56:59, 7.61s/it, loss=0.0010, acc=0.9983, iter_time=7.60s]
Epoch 0: 31%|███▏ | 3894/12384 [8:15:36<17:56:24, 7.61s/it, loss=0.0010, acc=0.9983, iter_time=7.60s]
Epoch 0: 31%|███▏ | 3894/12384 [8:15:44<17:56:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 31%|███▏ | 3895/12384 [8:15:44<18:08:04, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 31%|███▏ | 3895/12384 [8:15:51<18:08:04, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 31%|███▏ | 3896/12384 [8:15:51<18:05:22, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 31%|███▏ | 3896/12384 [8:15:59<18:05:22, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 0: 31%|███▏ | 3897/12384 [8:15:59<18:02:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 0: 31%|███▏ | 3897/12384 [8:16:06<18:02:32, 7.65s/it, loss=0.0002, acc=0.9990, iter_time=7.92s]
Epoch 0: 31%|███▏ | 3898/12384 [8:16:06<18:00:35, 7.64s/it, loss=0.0002, acc=0.9990, iter_time=7.92s]
Epoch 0: 31%|███▏ | 3898/12384 [8:16:14<18:00:35, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=5.10s]
Epoch 0: 31%|███▏ | 3899/12384 [8:16:14<18:12:35, 7.73s/it, loss=0.0001, acc=1.0000, iter_time=5.10s]
Epoch 0: 31%|███▏ | 3899/12384 [8:16:22<18:12:35, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=10.83s]
Epoch 0: 31%|███▏ | 3900/12384 [8:16:22<18:06:51, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.83s]
Epoch 0: 31%|███▏ | 3900/12384 [8:16:30<18:06:51, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 32%|███▏ | 3901/12384 [8:16:30<18:03:47, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 32%|███▏ | 3901/12384 [8:16:37<18:03:47, 7.67s/it, loss=0.0008, acc=0.9950, iter_time=5.07s]
Epoch 0: 32%|███▏ | 3902/12384 [8:16:37<18:01:46, 7.65s/it, loss=0.0008, acc=0.9950, iter_time=5.07s]
Epoch 0: 32%|███▏ | 3902/12384 [8:16:45<18:01:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 0: 32%|███▏ | 3903/12384 [8:16:45<18:00:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 0: 32%|███▏ | 3903/12384 [8:16:52<18:00:15, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.02s]
Epoch 0: 32%|███▏ | 3904/12384 [8:16:52<17:59:22, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.02s]
Epoch 0: 32%|███▏ | 3904/12384 [8:17:00<17:59:22, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.24s]
Epoch 0: 32%|███▏ | 3905/12384 [8:17:00<17:58:21, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.24s]
Epoch 0: 32%|███▏ | 3905/12384 [8:17:08<17:58:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 32%|███▏ | 3906/12384 [8:17:08<17:57:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 32%|███▏ | 3906/12384 [8:17:15<17:57:47, 7.63s/it, loss=0.0005, acc=0.9978, iter_time=6.69s]
Epoch 0: 32%|███▏ | 3907/12384 [8:17:15<17:57:20, 7.63s/it, loss=0.0005, acc=0.9978, iter_time=6.69s]
Epoch 0: 32%|███▏ | 3907/12384 [8:17:23<17:57:20, 7.63s/it, loss=0.0009, acc=0.9978, iter_time=8.56s]
Epoch 0: 32%|███▏ | 3908/12384 [8:17:23<17:56:54, 7.62s/it, loss=0.0009, acc=0.9978, iter_time=8.56s]
Epoch 0: 32%|███▏ | 3908/12384 [8:17:31<17:56:54, 7.62s/it, loss=0.0007, acc=0.9956, iter_time=4.25s]
Epoch 0: 32%|███▏ | 3909/12384 [8:17:31<17:56:14, 7.62s/it, loss=0.0007, acc=0.9956, iter_time=4.25s]
Epoch 0: 32%|███▏ | 3909/12384 [8:17:38<17:56:14, 7.62s/it, loss=0.0027, acc=0.9949, iter_time=9.77s]
Epoch 0: 32%|███▏ | 3910/12384 [8:17:38<17:54:34, 7.61s/it, loss=0.0027, acc=0.9949, iter_time=9.77s]
Epoch 0: 32%|███▏ | 3910/12384 [8:17:46<17:54:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 0: 32%|███▏ | 3911/12384 [8:17:46<17:54:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 0: 32%|███▏ | 3911/12384 [8:17:53<17:54:10, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 0: 32%|███▏ | 3912/12384 [8:17:53<17:54:35, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 0: 32%|███▏ | 3912/12384 [8:18:01<17:54:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 32%|███▏ | 3913/12384 [8:18:01<17:55:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 32%|███▏ | 3913/12384 [8:18:09<17:55:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 32%|███▏ | 3914/12384 [8:18:09<17:55:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 32%|███▏ | 3914/12384 [8:18:16<17:55:19, 7.62s/it, loss=0.0003, acc=0.9985, iter_time=7.61s]
Epoch 0: 32%|███▏ | 3915/12384 [8:18:16<17:55:06, 7.62s/it, loss=0.0003, acc=0.9985, iter_time=7.61s]
Epoch 0: 32%|███▏ | 3915/12384 [8:18:24<17:55:06, 7.62s/it, loss=0.0006, acc=0.9979, iter_time=7.62s]
Epoch 0: 32%|███▏ | 3916/12384 [8:18:24<17:55:08, 7.62s/it, loss=0.0006, acc=0.9979, iter_time=7.62s]
Epoch 0: 32%|███▏ | 3916/12384 [8:18:31<17:55:08, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 32%|███▏ | 3917/12384 [8:18:31<17:55:11, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 32%|███▏ | 3917/12384 [8:18:39<17:55:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 32%|███▏ | 3918/12384 [8:18:39<17:54:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 32%|███▏ | 3918/12384 [8:18:47<17:54:31, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 32%|███▏ | 3919/12384 [8:18:47<17:54:05, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 32%|███▏ | 3919/12384 [8:18:54<17:54:05, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.02s]
Epoch 0: 32%|███▏ | 3920/12384 [8:18:54<17:54:17, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.02s]
Epoch 0: 32%|███▏ | 3920/12384 [8:19:02<17:54:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.17s]
Epoch 0: 32%|███▏ | 3921/12384 [8:19:02<17:53:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.17s]
Epoch 0: 32%|███▏ | 3921/12384 [8:19:10<17:53:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.79s]
Epoch 0: 32%|███▏ | 3922/12384 [8:19:10<17:56:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.79s]
Epoch 0: 32%|███▏ | 3922/12384 [8:19:17<17:56:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.54s]
Epoch 0: 32%|███▏ | 3923/12384 [8:19:17<17:54:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.54s]
Epoch 0: 32%|███▏ | 3923/12384 [8:19:25<17:54:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 32%|███▏ | 3924/12384 [8:19:25<17:54:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 32%|███▏ | 3924/12384 [8:19:33<17:54:04, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=5.31s]
Epoch 0: 32%|███▏ | 3925/12384 [8:19:33<18:08:48, 7.72s/it, loss=0.0002, acc=0.9998, iter_time=5.31s]
Epoch 0: 32%|███▏ | 3925/12384 [8:19:40<18:08:48, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 0: 32%|███▏ | 3926/12384 [8:19:40<18:04:22, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 0: 32%|███▏ | 3926/12384 [8:19:48<18:04:22, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 0: 32%|███▏ | 3927/12384 [8:19:48<18:01:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 0: 32%|███▏ | 3927/12384 [8:19:56<18:01:13, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=9.80s]
Epoch 0: 32%|███▏ | 3928/12384 [8:19:56<17:59:06, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=9.80s]
Epoch 0: 32%|███▏ | 3928/12384 [8:20:03<17:59:06, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 0: 32%|███▏ | 3929/12384 [8:20:03<17:56:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 0: 32%|███▏ | 3929/12384 [8:20:11<17:56:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.69s]
Epoch 0: 32%|███▏ | 3930/12384 [8:20:11<17:55:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.69s]
Epoch 0: 32%|███▏ | 3930/12384 [8:20:18<17:55:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 32%|███▏ | 3931/12384 [8:20:18<17:54:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 32%|███▏ | 3931/12384 [8:20:26<17:54:51, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.68s]
Epoch 0: 32%|███▏ | 3932/12384 [8:20:26<17:53:16, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.68s]
Epoch 0: 32%|███▏ | 3932/12384 [8:20:34<17:53:16, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.20s]
Epoch 0: 32%|███▏ | 3933/12384 [8:20:34<17:53:30, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.20s]
Epoch 0: 32%|███▏ | 3933/12384 [8:20:41<17:53:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.82s]
Epoch 0: 32%|███▏ | 3934/12384 [8:20:41<17:56:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.82s]
Epoch 0: 32%|███▏ | 3934/12384 [8:20:49<17:56:44, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=10.91s]
Epoch 0: 32%|███▏ | 3935/12384 [8:20:49<17:57:59, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=10.91s]
Epoch 0: 32%|███▏ | 3935/12384 [8:20:57<17:57:59, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 32%|███▏ | 3936/12384 [8:20:57<17:56:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 32%|███▏ | 3936/12384 [8:21:04<17:56:12, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 32%|███▏ | 3937/12384 [8:21:04<17:54:42, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 32%|███▏ | 3937/12384 [8:21:12<17:54:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 0: 32%|███▏ | 3938/12384 [8:21:12<17:52:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 0: 32%|███▏ | 3938/12384 [8:21:20<17:52:58, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=8.21s]
Epoch 0: 32%|███▏ | 3939/12384 [8:21:20<17:52:35, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=8.21s]
Epoch 0: 32%|███▏ | 3939/12384 [8:21:27<17:52:35, 7.62s/it, loss=0.0008, acc=0.9949, iter_time=7.62s]
Epoch 0: 32%|███▏ | 3940/12384 [8:21:27<17:53:42, 7.63s/it, loss=0.0008, acc=0.9949, iter_time=7.62s]
Epoch 0: 32%|███▏ | 3940/12384 [8:21:35<17:53:42, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 32%|███▏ | 3941/12384 [8:21:35<17:52:56, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 32%|███▏ | 3941/12384 [8:21:42<17:52:56, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=5.35s]
Epoch 0: 32%|███▏ | 3942/12384 [8:21:42<17:51:13, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=5.35s]
Epoch 0: 32%|███▏ | 3942/12384 [8:21:50<17:51:13, 7.61s/it, loss=0.0005, acc=0.9970, iter_time=9.83s]
Epoch 0: 32%|███▏ | 3943/12384 [8:21:50<17:51:38, 7.62s/it, loss=0.0005, acc=0.9970, iter_time=9.83s]
Epoch 0: 32%|███▏ | 3943/12384 [8:21:58<17:51:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 32%|███▏ | 3944/12384 [8:21:58<17:51:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 32%|███▏ | 3944/12384 [8:22:05<17:51:59, 7.62s/it, loss=0.0002, acc=0.9990, iter_time=7.03s]
Epoch 0: 32%|███▏ | 3945/12384 [8:22:05<17:50:24, 7.61s/it, loss=0.0002, acc=0.9990, iter_time=7.03s]
Epoch 0: 32%|███▏ | 3945/12384 [8:22:13<17:50:24, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.24s]
Epoch 0: 32%|███▏ | 3946/12384 [8:22:13<17:50:02, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.24s]
Epoch 0: 32%|███▏ | 3946/12384 [8:22:21<17:50:02, 7.61s/it, loss=0.0009, acc=0.9998, iter_time=11.88s]
Epoch 0: 32%|███▏ | 3947/12384 [8:22:21<18:01:51, 7.69s/it, loss=0.0009, acc=0.9998, iter_time=11.88s]
Epoch 0: 32%|███▏ | 3947/12384 [8:22:28<18:01:51, 7.69s/it, loss=0.0001, acc=0.9995, iter_time=7.59s]
Epoch 0: 32%|███▏ | 3948/12384 [8:22:28<17:58:32, 7.67s/it, loss=0.0001, acc=0.9995, iter_time=7.59s]
Epoch 0: 32%|███▏ | 3948/12384 [8:22:36<17:58:32, 7.67s/it, loss=0.0006, acc=0.9978, iter_time=7.63s]
Epoch 0: 32%|███▏ | 3949/12384 [8:22:36<17:55:57, 7.65s/it, loss=0.0006, acc=0.9978, iter_time=7.63s]
Epoch 0: 32%|███▏ | 3949/12384 [8:22:44<17:55:57, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.02s]
Epoch 0: 32%|███▏ | 3950/12384 [8:22:44<17:54:30, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.02s]
Epoch 0: 32%|███▏ | 3950/12384 [8:22:51<17:54:30, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.90s]
Epoch 0: 32%|███▏ | 3951/12384 [8:22:51<17:53:18, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.90s]
Epoch 0: 32%|███▏ | 3951/12384 [8:22:59<17:53:18, 7.64s/it, loss=0.0004, acc=0.9981, iter_time=8.39s]
Epoch 0: 32%|███▏ | 3952/12384 [8:22:59<18:06:25, 7.73s/it, loss=0.0004, acc=0.9981, iter_time=8.39s]
Epoch 0: 32%|███▏ | 3952/12384 [8:23:07<18:06:25, 7.73s/it, loss=0.0001, acc=1.0000, iter_time=7.48s]
Epoch 0: 32%|███▏ | 3953/12384 [8:23:07<18:00:34, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.48s]
Epoch 0: 32%|███▏ | 3953/12384 [8:23:14<18:00:34, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 0: 32%|███▏ | 3954/12384 [8:23:14<17:56:02, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 0: 32%|███▏ | 3954/12384 [8:23:22<17:56:02, 7.66s/it, loss=0.0002, acc=0.9995, iter_time=11.09s]
Epoch 0: 32%|███▏ | 3955/12384 [8:23:22<17:53:11, 7.64s/it, loss=0.0002, acc=0.9995, iter_time=11.09s]
Epoch 0: 32%|███▏ | 3955/12384 [8:23:29<17:53:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 32%|███▏ | 3956/12384 [8:23:29<17:51:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 32%|███▏ | 3956/12384 [8:23:37<17:51:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 32%|███▏ | 3957/12384 [8:23:37<17:50:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 32%|███▏ | 3957/12384 [8:23:45<17:50:45, 7.62s/it, loss=0.0009, acc=0.9983, iter_time=7.61s]
Epoch 0: 32%|███▏ | 3958/12384 [8:23:45<17:52:03, 7.63s/it, loss=0.0009, acc=0.9983, iter_time=7.61s]
Epoch 0: 32%|███▏ | 3958/12384 [8:23:52<17:52:03, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.68s]
Epoch 0: 32%|███▏ | 3959/12384 [8:23:52<17:53:34, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=7.68s]
Epoch 0: 32%|███▏ | 3959/12384 [8:24:00<17:53:34, 7.65s/it, loss=0.0004, acc=0.9990, iter_time=8.03s]
Epoch 0: 32%|███▏ | 3960/12384 [8:24:00<17:52:09, 7.64s/it, loss=0.0004, acc=0.9990, iter_time=8.03s]
Epoch 0: 32%|███▏ | 3960/12384 [8:24:08<17:52:09, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.23s]
Epoch 0: 32%|███▏ | 3961/12384 [8:24:08<17:50:48, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.23s]
Epoch 0: 32%|███▏ | 3961/12384 [8:24:15<17:50:48, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 32%|███▏ | 3962/12384 [8:24:15<17:49:32, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 32%|███▏ | 3962/12384 [8:24:23<17:49:32, 7.62s/it, loss=0.0003, acc=0.9999, iter_time=7.63s]
Epoch 0: 32%|███▏ | 3963/12384 [8:24:23<17:48:52, 7.62s/it, loss=0.0003, acc=0.9999, iter_time=7.63s]
Epoch 0: 32%|███▏ | 3963/12384 [8:24:30<17:48:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 32%|███▏ | 3964/12384 [8:24:30<17:48:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 32%|███▏ | 3964/12384 [8:24:38<17:48:36, 7.61s/it, loss=0.0004, acc=0.9997, iter_time=4.75s]
Epoch 0: 32%|███▏ | 3965/12384 [8:24:38<17:52:49, 7.65s/it, loss=0.0004, acc=0.9997, iter_time=4.75s]
Epoch 0: 32%|███▏ | 3965/12384 [8:24:46<17:52:49, 7.65s/it, loss=0.0004, acc=0.9993, iter_time=10.55s]
Epoch 0: 32%|███▏ | 3966/12384 [8:24:46<17:53:50, 7.65s/it, loss=0.0004, acc=0.9993, iter_time=10.55s]
Epoch 0: 32%|███▏ | 3966/12384 [8:24:53<17:53:50, 7.65s/it, loss=0.0008, acc=0.9979, iter_time=7.69s]
Epoch 0: 32%|███▏ | 3967/12384 [8:24:53<17:51:45, 7.64s/it, loss=0.0008, acc=0.9979, iter_time=7.69s]
Epoch 0: 32%|███▏ | 3967/12384 [8:25:01<17:51:45, 7.64s/it, loss=0.0005, acc=0.9980, iter_time=8.00s]
Epoch 0: 32%|███▏ | 3968/12384 [8:25:01<17:52:37, 7.65s/it, loss=0.0005, acc=0.9980, iter_time=8.00s]
Epoch 0: 32%|███▏ | 3968/12384 [8:25:09<17:52:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 0: 32%|███▏ | 3969/12384 [8:25:09<17:50:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 0: 32%|███▏ | 3969/12384 [8:25:16<17:50:01, 7.63s/it, loss=0.0176, acc=0.9900, iter_time=7.60s]
Epoch 0: 32%|███▏ | 3970/12384 [8:25:16<17:49:14, 7.62s/it, loss=0.0176, acc=0.9900, iter_time=7.60s]
Epoch 0: 32%|███▏ | 3970/12384 [8:25:24<17:49:14, 7.62s/it, loss=0.0003, acc=0.9991, iter_time=7.61s]
Epoch 0: 32%|███▏ | 3971/12384 [8:25:24<17:47:51, 7.62s/it, loss=0.0003, acc=0.9991, iter_time=7.61s]
Epoch 0: 32%|███▏ | 3971/12384 [8:25:32<17:47:51, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.47s]
Epoch 0: 32%|███▏ | 3972/12384 [8:25:32<17:47:05, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.47s]
Epoch 0: 32%|███▏ | 3972/12384 [8:25:39<17:47:05, 7.61s/it, loss=0.0007, acc=0.9983, iter_time=7.78s]
Epoch 0: 32%|███▏ | 3973/12384 [8:25:39<17:46:41, 7.61s/it, loss=0.0007, acc=0.9983, iter_time=7.78s]
Epoch 0: 32%|███▏ | 3973/12384 [8:25:47<17:46:41, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=8.84s]
Epoch 0: 32%|███▏ | 3974/12384 [8:25:47<17:58:23, 7.69s/it, loss=0.0002, acc=1.0000, iter_time=8.84s]
Epoch 0: 32%|███▏ | 3974/12384 [8:25:55<17:58:23, 7.69s/it, loss=0.0002, acc=1.0000, iter_time=7.59s]
Epoch 0: 32%|███▏ | 3975/12384 [8:25:55<17:54:01, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.59s]
Epoch 0: 32%|███▏ | 3975/12384 [8:26:02<17:54:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 0: 32%|███▏ | 3976/12384 [8:26:02<17:53:45, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 0: 32%|███▏ | 3976/12384 [8:26:10<17:53:45, 7.66s/it, loss=0.0005, acc=1.0000, iter_time=6.92s]
Epoch 0: 32%|███▏ | 3977/12384 [8:26:10<17:52:06, 7.65s/it, loss=0.0005, acc=1.0000, iter_time=6.92s]
Epoch 0: 32%|███▏ | 3977/12384 [8:26:18<17:52:06, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.97s]
Epoch 0: 32%|███▏ | 3978/12384 [8:26:18<18:01:52, 7.72s/it, loss=0.0002, acc=1.0000, iter_time=7.97s]
Epoch 0: 32%|███▏ | 3978/12384 [8:26:25<18:01:52, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 0: 32%|███▏ | 3979/12384 [8:26:25<17:57:20, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 0: 32%|███▏ | 3979/12384 [8:26:33<17:57:20, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 32%|███▏ | 3980/12384 [8:26:33<17:57:04, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 32%|███▏ | 3980/12384 [8:26:41<17:57:04, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 32%|███▏ | 3981/12384 [8:26:41<17:54:11, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 32%|███▏ | 3981/12384 [8:26:48<17:54:11, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=6.68s]
Epoch 0: 32%|███▏ | 3982/12384 [8:26:48<17:51:56, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=6.68s]
Epoch 0: 32%|███▏ | 3982/12384 [8:26:56<17:51:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 0: 32%|███▏ | 3983/12384 [8:26:56<17:50:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 0: 32%|███▏ | 3983/12384 [8:27:04<17:50:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 0: 32%|███▏ | 3984/12384 [8:27:04<17:48:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 0: 32%|███▏ | 3984/12384 [8:27:11<17:48:57, 7.64s/it, loss=0.0005, acc=0.9986, iter_time=7.65s]
Epoch 0: 32%|███▏ | 3985/12384 [8:27:11<17:46:55, 7.62s/it, loss=0.0005, acc=0.9986, iter_time=7.65s]
Epoch 0: 32%|███▏ | 3985/12384 [8:27:19<17:46:55, 7.62s/it, loss=0.0002, acc=0.9999, iter_time=7.61s]
Epoch 0: 32%|███▏ | 3986/12384 [8:27:19<17:46:41, 7.62s/it, loss=0.0002, acc=0.9999, iter_time=7.61s]
Epoch 0: 32%|███▏ | 3986/12384 [8:27:26<17:46:41, 7.62s/it, loss=0.0030, acc=0.9971, iter_time=7.61s]
Epoch 0: 32%|███▏ | 3987/12384 [8:27:26<17:45:26, 7.61s/it, loss=0.0030, acc=0.9971, iter_time=7.61s]
Epoch 0: 32%|███▏ | 3987/12384 [8:27:34<17:45:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 32%|███▏ | 3988/12384 [8:27:34<17:45:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 32%|███▏ | 3988/12384 [8:27:42<17:45:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 0: 32%|███▏ | 3989/12384 [8:27:42<17:44:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 0: 32%|███▏ | 3989/12384 [8:27:49<17:44:20, 7.61s/it, loss=0.0005, acc=0.9982, iter_time=8.82s]
Epoch 0: 32%|███▏ | 3990/12384 [8:27:49<17:44:09, 7.61s/it, loss=0.0005, acc=0.9982, iter_time=8.82s]
Epoch 0: 32%|███▏ | 3990/12384 [8:27:57<17:44:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 32%|███▏ | 3991/12384 [8:27:57<17:47:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 32%|███▏ | 3991/12384 [8:28:05<17:47:17, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 0: 32%|███▏ | 3992/12384 [8:28:05<17:46:54, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 0: 32%|███▏ | 3992/12384 [8:28:12<17:46:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.36s]
Epoch 0: 32%|███▏ | 3993/12384 [8:28:12<17:46:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.36s]
Epoch 0: 32%|███▏ | 3993/12384 [8:28:20<17:46:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.90s]
Epoch 0: 32%|███▏ | 3994/12384 [8:28:20<17:45:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.90s]
Epoch 0: 32%|███▏ | 3994/12384 [8:28:27<17:45:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 0: 32%|███▏ | 3995/12384 [8:28:27<17:45:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 0: 32%|███▏ | 3995/12384 [8:28:35<17:45:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.98s]
Epoch 0: 32%|███▏ | 3996/12384 [8:28:35<17:47:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.98s]
Epoch 0: 32%|███▏ | 3996/12384 [8:28:43<17:47:16, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 32%|███▏ | 3997/12384 [8:28:43<17:46:16, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 32%|███▏ | 3997/12384 [8:28:50<17:46:16, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.63s]
Epoch 0: 32%|███▏ | 3998/12384 [8:28:50<17:44:44, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.63s]
Epoch 0: 32%|███▏ | 3998/12384 [8:28:58<17:44:44, 7.62s/it, loss=0.0003, acc=0.9988, iter_time=7.60s]
Epoch 0: 32%|███▏ | 3999/12384 [8:28:58<17:44:52, 7.62s/it, loss=0.0003, acc=0.9988, iter_time=7.60s]
Epoch 0: 32%|███▏ | 3999/12384 [8:29:06<17:44:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 0: 32%|███▏ | 4000/12384 [8:29:06<17:55:27, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 0: 32%|███▏ | 4000/12384 [8:29:14<17:55:27, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 32%|███▏ | 4001/12384 [8:29:14<18:03:28, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 32%|███▏ | 4001/12384 [8:29:21<18:03:28, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 32%|███▏ | 4002/12384 [8:29:21<18:01:17, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 32%|███▏ | 4002/12384 [8:29:29<18:01:17, 7.74s/it, loss=0.0004, acc=0.9992, iter_time=5.62s]
Epoch 0: 32%|███▏ | 4003/12384 [8:29:29<17:54:59, 7.70s/it, loss=0.0004, acc=0.9992, iter_time=5.62s]
Epoch 0: 32%|███▏ | 4003/12384 [8:29:37<17:54:59, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=9.68s]
Epoch 0: 32%|███▏ | 4004/12384 [8:29:37<17:51:07, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=9.68s]
Epoch 0: 32%|███▏ | 4004/12384 [8:29:44<17:51:07, 7.67s/it, loss=0.0008, acc=1.0000, iter_time=7.64s]
Epoch 0: 32%|███▏ | 4005/12384 [8:29:44<18:00:25, 7.74s/it, loss=0.0008, acc=1.0000, iter_time=7.64s]
Epoch 0: 32%|███▏ | 4005/12384 [8:29:52<18:00:25, 7.74s/it, loss=0.0007, acc=0.9976, iter_time=7.86s]
Epoch 0: 32%|███▏ | 4006/12384 [8:29:52<17:54:33, 7.70s/it, loss=0.0007, acc=0.9976, iter_time=7.86s]
Epoch 0: 32%|███▏ | 4006/12384 [8:30:00<17:54:33, 7.70s/it, loss=0.0002, acc=0.9994, iter_time=7.62s]
Epoch 0: 32%|███▏ | 4007/12384 [8:30:00<17:53:01, 7.69s/it, loss=0.0002, acc=0.9994, iter_time=7.62s]
Epoch 0: 32%|███▏ | 4007/12384 [8:30:07<17:53:01, 7.69s/it, loss=0.0003, acc=0.9997, iter_time=7.60s]
Epoch 0: 32%|███▏ | 4008/12384 [8:30:07<17:50:02, 7.67s/it, loss=0.0003, acc=0.9997, iter_time=7.60s]
Epoch 0: 32%|███▏ | 4008/12384 [8:30:15<17:50:02, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=6.20s]
Epoch 0: 32%|███▏ | 4009/12384 [8:30:15<17:46:12, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.20s]
Epoch 0: 32%|███▏ | 4009/12384 [8:30:22<17:46:12, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=5.92s]
Epoch 0: 32%|███▏ | 4010/12384 [8:30:22<17:45:23, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.92s]
Epoch 0: 32%|███▏ | 4010/12384 [8:30:30<17:45:23, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=10.74s]
Epoch 0: 32%|███▏ | 4011/12384 [8:30:30<17:43:56, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.74s]
Epoch 0: 32%|███▏ | 4011/12384 [8:30:38<17:43:56, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.61s]
Epoch 0: 32%|███▏ | 4012/12384 [8:30:38<17:43:12, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.61s]
Epoch 0: 32%|███▏ | 4012/12384 [8:30:45<17:43:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 32%|███▏ | 4013/12384 [8:30:45<17:42:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 32%|███▏ | 4013/12384 [8:30:53<17:42:40, 7.62s/it, loss=0.0005, acc=0.9994, iter_time=7.60s]
Epoch 0: 32%|███▏ | 4014/12384 [8:30:53<17:42:20, 7.62s/it, loss=0.0005, acc=0.9994, iter_time=7.60s]
Epoch 0: 32%|███▏ | 4014/12384 [8:31:01<17:42:20, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 32%|███▏ | 4015/12384 [8:31:01<17:42:37, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 32%|███▏ | 4015/12384 [8:31:08<17:42:37, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=7.99s]
Epoch 0: 32%|███▏ | 4016/12384 [8:31:08<17:45:18, 7.64s/it, loss=0.0001, acc=0.9999, iter_time=7.99s]
Epoch 0: 32%|███▏ | 4016/12384 [8:31:16<17:45:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.91s]
Epoch 0: 32%|███▏ | 4017/12384 [8:31:16<17:45:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.91s]
Epoch 0: 32%|███▏ | 4017/12384 [8:31:24<17:45:25, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=11.02s]
Epoch 0: 32%|███▏ | 4018/12384 [8:31:24<17:44:59, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=11.02s]
Epoch 0: 32%|███▏ | 4018/12384 [8:31:31<17:44:59, 7.64s/it, loss=0.0008, acc=0.9982, iter_time=7.65s]
Epoch 0: 32%|███▏ | 4019/12384 [8:31:31<17:44:08, 7.63s/it, loss=0.0008, acc=0.9982, iter_time=7.65s]
Epoch 0: 32%|███▏ | 4019/12384 [8:31:39<17:44:08, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 32%|███▏ | 4020/12384 [8:31:39<17:43:00, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 32%|███▏ | 4020/12384 [8:31:46<17:43:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 32%|███▏ | 4021/12384 [8:31:46<17:43:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 32%|███▏ | 4021/12384 [8:31:54<17:43:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 32%|███▏ | 4022/12384 [8:31:54<17:41:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 32%|███▏ | 4022/12384 [8:32:02<17:41:33, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 32%|███▏ | 4023/12384 [8:32:02<17:41:46, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 32%|███▏ | 4023/12384 [8:32:09<17:41:46, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.71s]
Epoch 0: 32%|███▏ | 4024/12384 [8:32:09<17:41:49, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.71s]
Epoch 0: 32%|███▏ | 4024/12384 [8:32:17<17:41:49, 7.62s/it, loss=0.0006, acc=0.9994, iter_time=7.53s]
Epoch 0: 33%|███▎ | 4025/12384 [8:32:17<17:40:49, 7.61s/it, loss=0.0006, acc=0.9994, iter_time=7.53s]
Epoch 0: 33%|███▎ | 4025/12384 [8:32:24<17:40:49, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=6.42s]
Epoch 0: 33%|███▎ | 4026/12384 [8:32:24<17:40:55, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=6.42s]
Epoch 0: 33%|███▎ | 4026/12384 [8:32:32<17:40:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 0: 33%|███▎ | 4027/12384 [8:32:32<17:40:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 0: 33%|███▎ | 4027/12384 [8:32:40<17:40:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 0: 33%|███▎ | 4028/12384 [8:32:40<17:51:27, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 0: 33%|███▎ | 4028/12384 [8:32:48<17:51:27, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 0: 33%|███▎ | 4029/12384 [8:32:48<17:50:17, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 0: 33%|███▎ | 4029/12384 [8:32:55<17:50:17, 7.69s/it, loss=0.0004, acc=0.9993, iter_time=9.95s]
Epoch 0: 33%|███▎ | 4030/12384 [8:32:55<17:47:21, 7.67s/it, loss=0.0004, acc=0.9993, iter_time=9.95s]
Epoch 0: 33%|███▎ | 4030/12384 [8:33:03<17:47:21, 7.67s/it, loss=0.0001, acc=0.9998, iter_time=6.54s]
Epoch 0: 33%|███▎ | 4031/12384 [8:33:03<17:57:33, 7.74s/it, loss=0.0001, acc=0.9998, iter_time=6.54s]
Epoch 0: 33%|███▎ | 4031/12384 [8:33:11<17:57:33, 7.74s/it, loss=0.0001, acc=1.0000, iter_time=8.93s]
Epoch 0: 33%|███▎ | 4032/12384 [8:33:11<17:51:29, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=8.93s]
Epoch 0: 33%|███▎ | 4032/12384 [8:33:18<17:51:29, 7.70s/it, loss=0.0008, acc=0.9985, iter_time=7.65s]
Epoch 0: 33%|███▎ | 4033/12384 [8:33:18<17:47:41, 7.67s/it, loss=0.0008, acc=0.9985, iter_time=7.65s]
Epoch 0: 33%|███▎ | 4033/12384 [8:33:26<17:47:41, 7.67s/it, loss=0.0005, acc=1.0000, iter_time=4.77s]
Epoch 0: 33%|███▎ | 4034/12384 [8:33:26<17:44:30, 7.65s/it, loss=0.0005, acc=1.0000, iter_time=4.77s]
Epoch 0: 33%|███▎ | 4034/12384 [8:33:34<17:44:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.93s]
Epoch 0: 33%|███▎ | 4035/12384 [8:33:34<17:42:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.93s]
Epoch 0: 33%|███▎ | 4035/12384 [8:33:41<17:42:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 0: 33%|███▎ | 4036/12384 [8:33:41<17:42:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 0: 33%|███▎ | 4036/12384 [8:33:49<17:42:05, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.42s]
Epoch 0: 33%|███▎ | 4037/12384 [8:33:49<17:41:50, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.42s]
Epoch 0: 33%|███▎ | 4037/12384 [8:33:56<17:41:50, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=5.47s]
Epoch 0: 33%|███▎ | 4038/12384 [8:33:56<17:40:42, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=5.47s]
Epoch 0: 33%|███▎ | 4038/12384 [8:34:04<17:40:42, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=10.98s]
Epoch 0: 33%|███▎ | 4039/12384 [8:34:04<17:44:39, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=10.98s]
Epoch 0: 33%|███▎ | 4039/12384 [8:34:12<17:44:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 0: 33%|███▎ | 4040/12384 [8:34:12<17:43:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 0: 33%|███▎ | 4040/12384 [8:34:19<17:43:24, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.24s]
Epoch 0: 33%|███▎ | 4041/12384 [8:34:19<17:41:42, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.24s]
Epoch 0: 33%|███▎ | 4041/12384 [8:34:27<17:41:42, 7.64s/it, loss=0.0002, acc=0.9989, iter_time=6.07s]
Epoch 0: 33%|███▎ | 4042/12384 [8:34:27<17:42:07, 7.64s/it, loss=0.0002, acc=0.9989, iter_time=6.07s]
Epoch 0: 33%|███▎ | 4042/12384 [8:34:35<17:42:07, 7.64s/it, loss=0.0013, acc=0.9970, iter_time=7.96s]
Epoch 0: 33%|███▎ | 4043/12384 [8:34:35<17:41:03, 7.63s/it, loss=0.0013, acc=0.9970, iter_time=7.96s]
Epoch 0: 33%|███▎ | 4043/12384 [8:34:42<17:41:03, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.84s]
Epoch 0: 33%|███▎ | 4044/12384 [8:34:42<17:40:35, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.84s]
Epoch 0: 33%|███▎ | 4044/12384 [8:34:50<17:40:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 33%|███▎ | 4045/12384 [8:34:50<17:39:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 33%|███▎ | 4045/12384 [8:34:58<17:39:22, 7.62s/it, loss=0.0004, acc=0.9975, iter_time=7.59s]
Epoch 0: 33%|███▎ | 4046/12384 [8:34:58<17:43:46, 7.65s/it, loss=0.0004, acc=0.9975, iter_time=7.59s]
Epoch 0: 33%|███▎ | 4046/12384 [8:35:05<17:43:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 0: 33%|███▎ | 4047/12384 [8:35:05<17:41:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 0: 33%|███▎ | 4047/12384 [8:35:13<17:41:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 33%|███▎ | 4048/12384 [8:35:13<17:40:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 33%|███▎ | 4048/12384 [8:35:20<17:40:48, 7.64s/it, loss=0.0003, acc=0.9998, iter_time=7.65s]
Epoch 0: 33%|███▎ | 4049/12384 [8:35:20<17:39:16, 7.63s/it, loss=0.0003, acc=0.9998, iter_time=7.65s]
Epoch 0: 33%|███▎ | 4049/12384 [8:35:28<17:39:16, 7.63s/it, loss=0.0002, acc=0.9988, iter_time=8.03s]
Epoch 0: 33%|███▎ | 4050/12384 [8:35:28<17:39:04, 7.62s/it, loss=0.0002, acc=0.9988, iter_time=8.03s]
Epoch 0: 33%|███▎ | 4050/12384 [8:35:36<17:39:04, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 0: 33%|███▎ | 4051/12384 [8:35:36<17:37:46, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 0: 33%|███▎ | 4051/12384 [8:35:43<17:37:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.02s]
Epoch 0: 33%|███▎ | 4052/12384 [8:35:43<17:36:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.02s]
Epoch 0: 33%|███▎ | 4052/12384 [8:35:51<17:36:56, 7.61s/it, loss=0.0032, acc=0.9967, iter_time=11.18s]
Epoch 0: 33%|███▎ | 4053/12384 [8:35:51<17:36:49, 7.61s/it, loss=0.0032, acc=0.9967, iter_time=11.18s]
Epoch 0: 33%|███▎ | 4053/12384 [8:35:59<17:36:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 0: 33%|███▎ | 4054/12384 [8:35:59<17:51:02, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 0: 33%|███▎ | 4054/12384 [8:36:06<17:51:02, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.30s]
Epoch 0: 33%|███▎ | 4055/12384 [8:36:06<17:46:26, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.30s]
Epoch 0: 33%|███▎ | 4055/12384 [8:36:14<17:46:26, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 0: 33%|███▎ | 4056/12384 [8:36:14<17:43:20, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 0: 33%|███▎ | 4056/12384 [8:36:22<17:43:20, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 0: 33%|███▎ | 4057/12384 [8:36:22<17:54:44, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 0: 33%|███▎ | 4057/12384 [8:36:30<17:54:44, 7.74s/it, loss=0.0001, acc=1.0000, iter_time=7.39s]
Epoch 0: 33%|███▎ | 4058/12384 [8:36:30<17:48:18, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.39s]
Epoch 0: 33%|███▎ | 4058/12384 [8:36:37<17:48:18, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.97s]
Epoch 0: 33%|███▎ | 4059/12384 [8:36:37<17:44:45, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.97s]
Epoch 0: 33%|███▎ | 4059/12384 [8:36:45<17:44:45, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 33%|███▎ | 4060/12384 [8:36:45<17:40:59, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 33%|███▎ | 4060/12384 [8:36:52<17:40:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 33%|███▎ | 4061/12384 [8:36:52<17:39:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 33%|███▎ | 4061/12384 [8:37:00<17:39:24, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 33%|███▎ | 4062/12384 [8:37:00<17:37:25, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 33%|███▎ | 4062/12384 [8:37:08<17:37:25, 7.62s/it, loss=0.0005, acc=0.9996, iter_time=7.00s]
Epoch 0: 33%|███▎ | 4063/12384 [8:37:08<17:36:36, 7.62s/it, loss=0.0005, acc=0.9996, iter_time=7.00s]
Epoch 0: 33%|███▎ | 4063/12384 [8:37:15<17:36:36, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.57s]
Epoch 0: 33%|███▎ | 4064/12384 [8:37:15<17:35:26, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.57s]
Epoch 0: 33%|███▎ | 4064/12384 [8:37:23<17:35:26, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.22s]
Epoch 0: 33%|███▎ | 4065/12384 [8:37:23<17:34:49, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.22s]
Epoch 0: 33%|███▎ | 4065/12384 [8:37:30<17:34:49, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.73s]
Epoch 0: 33%|███▎ | 4066/12384 [8:37:30<17:34:28, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.73s]
Epoch 0: 33%|███▎ | 4066/12384 [8:37:38<17:34:28, 7.61s/it, loss=0.0005, acc=0.9988, iter_time=10.48s]
Epoch 0: 33%|███▎ | 4067/12384 [8:37:38<17:35:12, 7.61s/it, loss=0.0005, acc=0.9988, iter_time=10.48s]
Epoch 0: 33%|███▎ | 4067/12384 [8:37:46<17:35:12, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.89s]
Epoch 0: 33%|███▎ | 4068/12384 [8:37:46<17:35:22, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.89s]
Epoch 0: 33%|███▎ | 4068/12384 [8:37:53<17:35:22, 7.61s/it, loss=0.0002, acc=0.9997, iter_time=9.35s]
Epoch 0: 33%|███▎ | 4069/12384 [8:37:53<17:35:31, 7.62s/it, loss=0.0002, acc=0.9997, iter_time=9.35s]
Epoch 0: 33%|███▎ | 4069/12384 [8:38:01<17:35:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 33%|███▎ | 4070/12384 [8:38:01<17:35:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 33%|███▎ | 4070/12384 [8:38:08<17:35:29, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 33%|███▎ | 4071/12384 [8:38:08<17:34:48, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 33%|███▎ | 4071/12384 [8:38:16<17:34:48, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=7.56s]
Epoch 0: 33%|███▎ | 4072/12384 [8:38:16<17:33:52, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=7.56s]
Epoch 0: 33%|███▎ | 4072/12384 [8:38:24<17:33:52, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 33%|███▎ | 4073/12384 [8:38:24<17:33:38, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 33%|███▎ | 4073/12384 [8:38:31<17:33:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 33%|███▎ | 4074/12384 [8:38:31<17:33:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 33%|███▎ | 4074/12384 [8:38:39<17:33:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 33%|███▎ | 4075/12384 [8:38:39<17:37:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 33%|███▎ | 4075/12384 [8:38:47<17:37:09, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.70s]
Epoch 0: 33%|███▎ | 4076/12384 [8:38:47<17:36:56, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.70s]
Epoch 0: 33%|███▎ | 4076/12384 [8:38:54<17:36:56, 7.63s/it, loss=0.0012, acc=0.9980, iter_time=7.61s]
Epoch 0: 33%|███▎ | 4077/12384 [8:38:54<17:35:42, 7.63s/it, loss=0.0012, acc=0.9980, iter_time=7.61s]
Epoch 0: 33%|███▎ | 4077/12384 [8:39:02<17:35:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 0: 33%|███▎ | 4078/12384 [8:39:02<17:34:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 0: 33%|███▎ | 4078/12384 [8:39:09<17:34:46, 7.62s/it, loss=0.0006, acc=0.9967, iter_time=8.83s]
Epoch 0: 33%|███▎ | 4079/12384 [8:39:09<17:34:07, 7.62s/it, loss=0.0006, acc=0.9967, iter_time=8.83s]
Epoch 0: 33%|███▎ | 4079/12384 [8:39:17<17:34:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 33%|███▎ | 4080/12384 [8:39:17<17:33:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 33%|███▎ | 4080/12384 [8:39:25<17:33:53, 7.61s/it, loss=0.0003, acc=0.9986, iter_time=7.67s]
Epoch 0: 33%|███▎ | 4081/12384 [8:39:25<17:37:43, 7.64s/it, loss=0.0003, acc=0.9986, iter_time=7.67s]
Epoch 0: 33%|███▎ | 4081/12384 [8:39:32<17:37:43, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.71s]
Epoch 0: 33%|███▎ | 4082/12384 [8:39:32<17:36:31, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.71s]
Epoch 0: 33%|███▎ | 4082/12384 [8:39:40<17:36:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 33%|███▎ | 4083/12384 [8:39:40<17:48:09, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 33%|███▎ | 4083/12384 [8:39:48<17:48:09, 7.72s/it, loss=0.0016, acc=0.9961, iter_time=4.74s]
Epoch 0: 33%|███▎ | 4084/12384 [8:39:48<17:48:01, 7.72s/it, loss=0.0016, acc=0.9961, iter_time=4.74s]
Epoch 0: 33%|███▎ | 4084/12384 [8:39:56<17:48:01, 7.72s/it, loss=0.0002, acc=0.9994, iter_time=10.83s]
Epoch 0: 33%|███▎ | 4085/12384 [8:39:56<17:42:38, 7.68s/it, loss=0.0002, acc=0.9994, iter_time=10.83s]
Epoch 0: 33%|███▎ | 4085/12384 [8:40:03<17:42:38, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=3.79s]
Epoch 0: 33%|███▎ | 4086/12384 [8:40:03<17:40:06, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=3.79s]
Epoch 0: 33%|███▎ | 4086/12384 [8:40:11<17:40:06, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=11.45s]
Epoch 0: 33%|███▎ | 4087/12384 [8:40:11<17:37:48, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=11.45s]
Epoch 0: 33%|███▎ | 4087/12384 [8:40:18<17:37:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 33%|███▎ | 4088/12384 [8:40:18<17:38:42, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 33%|███▎ | 4088/12384 [8:40:26<17:38:42, 7.66s/it, loss=0.0005, acc=0.9976, iter_time=5.32s]
Epoch 0: 33%|███▎ | 4089/12384 [8:40:26<17:36:46, 7.64s/it, loss=0.0005, acc=0.9976, iter_time=5.32s]
Epoch 0: 33%|███▎ | 4089/12384 [8:40:34<17:36:46, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=9.96s]
Epoch 0: 33%|███▎ | 4090/12384 [8:40:34<17:35:38, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=9.96s]
Epoch 0: 33%|███▎ | 4090/12384 [8:40:41<17:35:38, 7.64s/it, loss=0.0003, acc=0.9979, iter_time=7.33s]
Epoch 0: 33%|███▎ | 4091/12384 [8:40:41<17:36:21, 7.64s/it, loss=0.0003, acc=0.9979, iter_time=7.33s]
Epoch 0: 33%|███▎ | 4091/12384 [8:40:49<17:36:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 0: 33%|███▎ | 4092/12384 [8:40:49<17:33:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 0: 33%|███▎ | 4092/12384 [8:40:57<17:33:52, 7.63s/it, loss=0.0002, acc=0.9998, iter_time=7.60s]
Epoch 0: 33%|███▎ | 4093/12384 [8:40:57<17:33:29, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=7.60s]
Epoch 0: 33%|███▎ | 4093/12384 [8:41:04<17:33:29, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.08s]
Epoch 0: 33%|███▎ | 4094/12384 [8:41:04<17:35:36, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.08s]
Epoch 0: 33%|███▎ | 4094/12384 [8:41:12<17:35:36, 7.64s/it, loss=0.0002, acc=0.9998, iter_time=8.62s]
Epoch 0: 33%|███▎ | 4095/12384 [8:41:12<17:34:37, 7.63s/it, loss=0.0002, acc=0.9998, iter_time=8.62s]
Epoch 0: 33%|███▎ | 4095/12384 [8:41:20<17:34:37, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.61s]
Epoch 0: 33%|███▎ | 4096/12384 [8:41:20<17:34:05, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.61s]
Epoch 0: 33%|███▎ | 4096/12384 [8:41:27<17:34:05, 7.63s/it, loss=0.0014, acc=0.9971, iter_time=7.21s]
Epoch 0: 33%|███▎ | 4097/12384 [8:41:27<17:32:11, 7.62s/it, loss=0.0014, acc=0.9971, iter_time=7.21s]
Epoch 0: 33%|███▎ | 4097/12384 [8:41:35<17:32:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 33%|███▎ | 4098/12384 [8:41:35<17:31:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 33%|███▎ | 4098/12384 [8:41:42<17:31:56, 7.62s/it, loss=0.0103, acc=0.9903, iter_time=7.64s]
Epoch 0: 33%|███▎ | 4099/12384 [8:41:42<17:31:42, 7.62s/it, loss=0.0103, acc=0.9903, iter_time=7.64s]
Epoch 0: 33%|███▎ | 4099/12384 [8:41:50<17:31:42, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=8.01s]
Epoch 0: 33%|███▎ | 4100/12384 [8:41:50<17:31:47, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=8.01s]
Epoch 0: 33%|███▎ | 4100/12384 [8:41:58<17:31:47, 7.62s/it, loss=0.0005, acc=0.9987, iter_time=7.21s]
Epoch 0: 33%|███▎ | 4101/12384 [8:41:58<17:31:42, 7.62s/it, loss=0.0005, acc=0.9987, iter_time=7.21s]
Epoch 0: 33%|███▎ | 4101/12384 [8:42:05<17:31:42, 7.62s/it, loss=0.0002, acc=0.9986, iter_time=7.61s]
Epoch 0: 33%|███▎ | 4102/12384 [8:42:05<17:30:31, 7.61s/it, loss=0.0002, acc=0.9986, iter_time=7.61s]
Epoch 0: 33%|███▎ | 4102/12384 [8:42:13<17:30:31, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=3.58s]
Epoch 0: 33%|███▎ | 4103/12384 [8:42:13<17:29:53, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=3.58s]
Epoch 0: 33%|███▎ | 4103/12384 [8:42:20<17:29:53, 7.61s/it, loss=0.0002, acc=0.9995, iter_time=12.00s]
Epoch 0: 33%|███▎ | 4104/12384 [8:42:20<17:29:24, 7.60s/it, loss=0.0002, acc=0.9995, iter_time=12.00s]
Epoch 0: 33%|███▎ | 4104/12384 [8:42:28<17:29:24, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.51s]
Epoch 0: 33%|███▎ | 4105/12384 [8:42:28<17:41:28, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.51s]
Epoch 0: 33%|███▎ | 4105/12384 [8:42:36<17:41:28, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 33%|███▎ | 4106/12384 [8:42:36<17:37:57, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 33%|███▎ | 4106/12384 [8:42:44<17:37:57, 7.67s/it, loss=0.0012, acc=0.9964, iter_time=7.59s]
Epoch 0: 33%|███▎ | 4107/12384 [8:42:44<17:38:42, 7.67s/it, loss=0.0012, acc=0.9964, iter_time=7.59s]
Epoch 0: 33%|███▎ | 4107/12384 [8:42:51<17:38:42, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 33%|███▎ | 4108/12384 [8:42:51<17:38:01, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 33%|███▎ | 4108/12384 [8:42:59<17:38:01, 7.67s/it, loss=0.0003, acc=0.9975, iter_time=7.80s]
Epoch 0: 33%|███▎ | 4109/12384 [8:42:59<17:49:05, 7.75s/it, loss=0.0003, acc=0.9975, iter_time=7.80s]
Epoch 0: 33%|███▎ | 4109/12384 [8:43:07<17:49:05, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.82s]
Epoch 0: 33%|███▎ | 4110/12384 [8:43:07<17:42:59, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.82s]
Epoch 0: 33%|███▎ | 4110/12384 [8:43:14<17:42:59, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 33%|███▎ | 4111/12384 [8:43:14<17:38:27, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 33%|███▎ | 4111/12384 [8:43:22<17:38:27, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 33%|███▎ | 4112/12384 [8:43:22<17:36:08, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 33%|███▎ | 4112/12384 [8:43:30<17:36:08, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 33%|███▎ | 4113/12384 [8:43:30<17:33:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 33%|███▎ | 4113/12384 [8:43:37<17:33:41, 7.64s/it, loss=0.0003, acc=0.9985, iter_time=7.63s]
Epoch 0: 33%|███▎ | 4114/12384 [8:43:37<17:32:37, 7.64s/it, loss=0.0003, acc=0.9985, iter_time=7.63s]
Epoch 0: 33%|███▎ | 4114/12384 [8:43:45<17:32:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 0: 33%|███▎ | 4115/12384 [8:43:45<17:31:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 0: 33%|███▎ | 4115/12384 [8:43:52<17:31:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 33%|███▎ | 4116/12384 [8:43:52<17:29:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 33%|███▎ | 4116/12384 [8:44:00<17:29:59, 7.62s/it, loss=0.0043, acc=0.9911, iter_time=6.08s]
Epoch 0: 33%|███▎ | 4117/12384 [8:44:00<17:29:51, 7.62s/it, loss=0.0043, acc=0.9911, iter_time=6.08s]
Epoch 0: 33%|███▎ | 4117/12384 [8:44:08<17:29:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 0: 33%|███▎ | 4118/12384 [8:44:08<17:28:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 0: 33%|███▎ | 4118/12384 [8:44:15<17:28:54, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 33%|███▎ | 4119/12384 [8:44:15<17:29:05, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 33%|███▎ | 4119/12384 [8:44:23<17:29:05, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.00s]
Epoch 0: 33%|███▎ | 4120/12384 [8:44:23<17:29:16, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.00s]
Epoch 0: 33%|███▎ | 4120/12384 [8:44:31<17:29:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 33%|███▎ | 4121/12384 [8:44:31<17:30:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 33%|███▎ | 4121/12384 [8:44:38<17:30:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 0: 33%|███▎ | 4122/12384 [8:44:38<17:35:25, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 0: 33%|███▎ | 4122/12384 [8:44:46<17:35:25, 7.66s/it, loss=0.0019, acc=0.9980, iter_time=7.61s]
Epoch 0: 33%|███▎ | 4123/12384 [8:44:46<17:32:59, 7.65s/it, loss=0.0019, acc=0.9980, iter_time=7.61s]
Epoch 0: 33%|███▎ | 4123/12384 [8:44:54<17:32:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 33%|███▎ | 4124/12384 [8:44:54<17:34:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 33%|███▎ | 4124/12384 [8:45:01<17:34:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 33%|███▎ | 4125/12384 [8:45:01<17:31:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 33%|███▎ | 4125/12384 [8:45:09<17:31:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 0: 33%|███▎ | 4126/12384 [8:45:09<17:29:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 0: 33%|███▎ | 4126/12384 [8:45:16<17:29:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 0: 33%|███▎ | 4127/12384 [8:45:16<17:29:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 0: 33%|███▎ | 4127/12384 [8:45:24<17:29:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.22s]
Epoch 0: 33%|███▎ | 4128/12384 [8:45:24<17:29:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.22s]
Epoch 0: 33%|███▎ | 4128/12384 [8:45:32<17:29:11, 7.62s/it, loss=0.0006, acc=0.9975, iter_time=7.31s]
Epoch 0: 33%|███▎ | 4129/12384 [8:45:32<17:28:19, 7.62s/it, loss=0.0006, acc=0.9975, iter_time=7.31s]
Epoch 0: 33%|███▎ | 4129/12384 [8:45:40<17:28:19, 7.62s/it, loss=0.0008, acc=1.0000, iter_time=8.13s]
Epoch 0: 33%|███▎ | 4130/12384 [8:45:40<17:38:52, 7.70s/it, loss=0.0008, acc=1.0000, iter_time=8.13s]
Epoch 0: 33%|███▎ | 4130/12384 [8:45:47<17:38:52, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 33%|███▎ | 4131/12384 [8:45:47<17:34:41, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 33%|███▎ | 4131/12384 [8:45:55<17:34:41, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 0: 33%|███▎ | 4132/12384 [8:45:55<17:31:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 0: 33%|███▎ | 4132/12384 [8:46:02<17:31:12, 7.64s/it, loss=0.0023, acc=0.9976, iter_time=7.60s]
Epoch 0: 33%|███▎ | 4133/12384 [8:46:02<17:29:58, 7.64s/it, loss=0.0023, acc=0.9976, iter_time=7.60s]
Epoch 0: 33%|███▎ | 4133/12384 [8:46:10<17:29:58, 7.64s/it, loss=0.0013, acc=0.9955, iter_time=9.40s]
Epoch 0: 33%|███▎ | 4134/12384 [8:46:10<17:28:29, 7.63s/it, loss=0.0013, acc=0.9955, iter_time=9.40s]
Epoch 0: 33%|███▎ | 4134/12384 [8:46:18<17:28:29, 7.63s/it, loss=0.0002, acc=0.9985, iter_time=7.61s]
Epoch 0: 33%|███▎ | 4135/12384 [8:46:18<17:28:01, 7.62s/it, loss=0.0002, acc=0.9985, iter_time=7.61s]
Epoch 0: 33%|███▎ | 4135/12384 [8:46:25<17:28:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 0: 33%|███▎ | 4136/12384 [8:46:25<17:40:53, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 0: 33%|███▎ | 4136/12384 [8:46:33<17:40:53, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 0: 33%|███▎ | 4137/12384 [8:46:33<17:36:47, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 0: 33%|███▎ | 4137/12384 [8:46:41<17:36:47, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=6.48s]
Epoch 0: 33%|███▎ | 4138/12384 [8:46:41<17:32:24, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=6.48s]
Epoch 0: 33%|███▎ | 4138/12384 [8:46:48<17:32:24, 7.66s/it, loss=0.0003, acc=1.0000, iter_time=8.71s]
Epoch 0: 33%|███▎ | 4139/12384 [8:46:48<17:30:56, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=8.71s]
Epoch 0: 33%|███▎ | 4139/12384 [8:46:56<17:30:56, 7.65s/it, loss=0.0005, acc=0.9987, iter_time=7.63s]
Epoch 0: 33%|███▎ | 4140/12384 [8:46:56<17:29:47, 7.64s/it, loss=0.0005, acc=0.9987, iter_time=7.63s]
Epoch 0: 33%|███▎ | 4140/12384 [8:47:04<17:29:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 33%|███▎ | 4141/12384 [8:47:04<17:32:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 33%|███▎ | 4141/12384 [8:47:11<17:32:22, 7.66s/it, loss=0.0001, acc=0.9999, iter_time=7.73s]
Epoch 0: 33%|███▎ | 4142/12384 [8:47:11<17:34:43, 7.68s/it, loss=0.0001, acc=0.9999, iter_time=7.73s]
Epoch 0: 33%|███▎ | 4142/12384 [8:47:19<17:34:43, 7.68s/it, loss=0.0005, acc=0.9993, iter_time=7.70s]
Epoch 0: 33%|███▎ | 4143/12384 [8:47:19<17:31:50, 7.66s/it, loss=0.0005, acc=0.9993, iter_time=7.70s]
Epoch 0: 33%|███▎ | 4143/12384 [8:47:27<17:31:50, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 33%|███▎ | 4144/12384 [8:47:27<17:30:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 33%|███▎ | 4144/12384 [8:47:34<17:30:21, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=4.34s]
Epoch 0: 33%|███▎ | 4145/12384 [8:47:34<17:28:34, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=4.34s]
Epoch 0: 33%|███▎ | 4145/12384 [8:47:42<17:28:34, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=10.93s]
Epoch 0: 33%|███▎ | 4146/12384 [8:47:42<17:26:47, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.93s]
Epoch 0: 33%|███▎ | 4146/12384 [8:47:49<17:26:47, 7.62s/it, loss=0.0016, acc=0.9984, iter_time=7.62s]
Epoch 0: 33%|███▎ | 4147/12384 [8:47:49<17:26:21, 7.62s/it, loss=0.0016, acc=0.9984, iter_time=7.62s]
Epoch 0: 33%|███▎ | 4147/12384 [8:47:57<17:26:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.99s]
Epoch 0: 33%|███▎ | 4148/12384 [8:47:57<17:26:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.99s]
Epoch 0: 33%|███▎ | 4148/12384 [8:48:05<17:26:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 0: 34%|███▎ | 4149/12384 [8:48:05<17:25:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 0: 34%|███▎ | 4149/12384 [8:48:12<17:25:53, 7.62s/it, loss=0.0004, acc=0.9987, iter_time=8.01s]
Epoch 0: 34%|███▎ | 4150/12384 [8:48:12<17:24:25, 7.61s/it, loss=0.0004, acc=0.9987, iter_time=8.01s]
Epoch 0: 34%|███▎ | 4150/12384 [8:48:20<17:24:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.46s]
Epoch 0: 34%|███▎ | 4151/12384 [8:48:20<17:24:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.46s]
Epoch 0: 34%|███▎ | 4151/12384 [8:48:27<17:24:15, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=9.29s]
Epoch 0: 34%|███▎ | 4152/12384 [8:48:27<17:23:47, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=9.29s]
Epoch 0: 34%|███▎ | 4152/12384 [8:48:35<17:23:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 34%|███▎ | 4153/12384 [8:48:35<17:23:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 34%|███▎ | 4153/12384 [8:48:43<17:23:35, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.82s]
Epoch 0: 34%|███▎ | 4154/12384 [8:48:43<17:25:16, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.82s]
Epoch 0: 34%|███▎ | 4154/12384 [8:48:50<17:25:16, 7.62s/it, loss=0.0003, acc=0.9994, iter_time=9.45s]
Epoch 0: 34%|███▎ | 4155/12384 [8:48:50<17:23:57, 7.61s/it, loss=0.0003, acc=0.9994, iter_time=9.45s]
Epoch 0: 34%|███▎ | 4155/12384 [8:48:58<17:23:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 34%|███▎ | 4156/12384 [8:48:58<17:35:12, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 34%|███▎ | 4156/12384 [8:49:06<17:35:12, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 0: 34%|███▎ | 4157/12384 [8:49:06<17:32:05, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 0: 34%|███▎ | 4157/12384 [8:49:13<17:32:05, 7.67s/it, loss=0.0002, acc=0.9987, iter_time=8.84s]
Epoch 0: 34%|███▎ | 4158/12384 [8:49:13<17:28:50, 7.65s/it, loss=0.0002, acc=0.9987, iter_time=8.84s]
Epoch 0: 34%|███▎ | 4158/12384 [8:49:21<17:28:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 0: 34%|███▎ | 4159/12384 [8:49:21<17:25:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 0: 34%|███▎ | 4159/12384 [8:49:29<17:25:47, 7.63s/it, loss=0.0009, acc=0.9993, iter_time=9.79s]
Epoch 0: 34%|███▎ | 4160/12384 [8:49:29<17:26:15, 7.63s/it, loss=0.0009, acc=0.9993, iter_time=9.79s]
Epoch 0: 34%|███▎ | 4160/12384 [8:49:36<17:26:15, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.24s]
Epoch 0: 34%|███▎ | 4161/12384 [8:49:36<17:25:08, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.24s]
Epoch 0: 34%|███▎ | 4161/12384 [8:49:44<17:25:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 0: 34%|███▎ | 4162/12384 [8:49:44<17:40:26, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 0: 34%|███▎ | 4162/12384 [8:49:52<17:40:26, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 0: 34%|███▎ | 4163/12384 [8:49:52<17:34:04, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 0: 34%|███▎ | 4163/12384 [8:49:59<17:34:04, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 34%|███▎ | 4164/12384 [8:49:59<17:31:08, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 34%|███▎ | 4164/12384 [8:50:07<17:31:08, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 0: 34%|███▎ | 4165/12384 [8:50:07<17:31:57, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 0: 34%|███▎ | 4165/12384 [8:50:15<17:31:57, 7.68s/it, loss=0.0001, acc=0.9999, iter_time=9.26s]
Epoch 0: 34%|███▎ | 4166/12384 [8:50:15<17:31:19, 7.68s/it, loss=0.0001, acc=0.9999, iter_time=9.26s]
Epoch 0: 34%|███▎ | 4166/12384 [8:50:22<17:31:19, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=5.61s]
Epoch 0: 34%|███▎ | 4167/12384 [8:50:22<17:28:12, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=5.61s]
Epoch 0: 34%|███▎ | 4167/12384 [8:50:30<17:28:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 0: 34%|███▎ | 4168/12384 [8:50:30<17:27:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 0: 34%|███▎ | 4168/12384 [8:50:38<17:27:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.41s]
Epoch 0: 34%|███▎ | 4169/12384 [8:50:38<17:25:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.41s]
Epoch 0: 34%|███▎ | 4169/12384 [8:50:45<17:25:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.72s]
Epoch 0: 34%|███▎ | 4170/12384 [8:50:45<17:23:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.72s]
Epoch 0: 34%|███▎ | 4170/12384 [8:50:53<17:23:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.41s]
Epoch 0: 34%|███▎ | 4171/12384 [8:50:53<17:23:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.41s]
Epoch 0: 34%|███▎ | 4171/12384 [8:51:01<17:23:39, 7.62s/it, loss=0.0006, acc=0.9978, iter_time=8.32s]
Epoch 0: 34%|███▎ | 4172/12384 [8:51:01<17:27:12, 7.65s/it, loss=0.0006, acc=0.9978, iter_time=8.32s]
Epoch 0: 34%|███▎ | 4172/12384 [8:51:08<17:27:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 0: 34%|███▎ | 4173/12384 [8:51:08<17:26:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 0: 34%|███▎ | 4173/12384 [8:51:16<17:26:07, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=5.53s]
Epoch 0: 34%|███▎ | 4174/12384 [8:51:16<17:23:53, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=5.53s]
Epoch 0: 34%|███▎ | 4174/12384 [8:51:23<17:23:53, 7.63s/it, loss=0.0016, acc=0.9973, iter_time=9.69s]
Epoch 0: 34%|███▎ | 4175/12384 [8:51:23<17:23:47, 7.63s/it, loss=0.0016, acc=0.9973, iter_time=9.69s]
Epoch 0: 34%|███▎ | 4175/12384 [8:51:31<17:23:47, 7.63s/it, loss=0.0002, acc=0.9993, iter_time=8.00s]
Epoch 0: 34%|███▎ | 4176/12384 [8:51:31<17:22:05, 7.62s/it, loss=0.0002, acc=0.9993, iter_time=8.00s]
Epoch 0: 34%|███▎ | 4176/12384 [8:51:39<17:22:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 34%|███▎ | 4177/12384 [8:51:39<17:22:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 34%|███▎ | 4177/12384 [8:51:46<17:22:59, 7.63s/it, loss=0.0003, acc=0.9997, iter_time=7.33s]
Epoch 0: 34%|███▎ | 4178/12384 [8:51:46<17:22:23, 7.62s/it, loss=0.0003, acc=0.9997, iter_time=7.33s]
Epoch 0: 34%|███▎ | 4178/12384 [8:51:54<17:22:23, 7.62s/it, loss=0.0007, acc=0.9998, iter_time=7.62s]
Epoch 0: 34%|███▎ | 4179/12384 [8:51:54<17:22:39, 7.62s/it, loss=0.0007, acc=0.9998, iter_time=7.62s]
Epoch 0: 34%|███▎ | 4179/12384 [8:52:02<17:22:39, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.93s]
Epoch 0: 34%|███▍ | 4180/12384 [8:52:02<17:22:53, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.93s]
Epoch 0: 34%|███▍ | 4180/12384 [8:52:09<17:22:53, 7.63s/it, loss=0.0001, acc=0.9994, iter_time=7.65s]
Epoch 0: 34%|███▍ | 4181/12384 [8:52:09<17:21:49, 7.62s/it, loss=0.0001, acc=0.9994, iter_time=7.65s]
Epoch 0: 34%|███▍ | 4181/12384 [8:52:17<17:21:49, 7.62s/it, loss=0.0004, acc=0.9993, iter_time=7.30s]
Epoch 0: 34%|███▍ | 4182/12384 [8:52:17<17:21:15, 7.62s/it, loss=0.0004, acc=0.9993, iter_time=7.30s]
Epoch 0: 34%|███▍ | 4182/12384 [8:52:24<17:21:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 34%|███▍ | 4183/12384 [8:52:24<17:24:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 34%|███▍ | 4183/12384 [8:52:32<17:24:50, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 0: 34%|███▍ | 4184/12384 [8:52:32<17:24:04, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 0: 34%|███▍ | 4184/12384 [8:52:40<17:24:04, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=7.65s]
Epoch 0: 34%|███▍ | 4185/12384 [8:52:40<17:22:15, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=7.65s]
Epoch 0: 34%|███▍ | 4185/12384 [8:52:47<17:22:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 0: 34%|███▍ | 4186/12384 [8:52:47<17:22:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 0: 34%|███▍ | 4186/12384 [8:52:55<17:22:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.44s]
Epoch 0: 34%|███▍ | 4187/12384 [8:52:55<17:22:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.44s]
Epoch 0: 34%|███▍ | 4187/12384 [8:53:03<17:22:17, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=4.05s]
Epoch 0: 34%|███▍ | 4188/12384 [8:53:03<17:20:32, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=4.05s]
Epoch 0: 34%|███▍ | 4188/12384 [8:53:11<17:20:32, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=11.22s]
Epoch 0: 34%|███▍ | 4189/12384 [8:53:11<17:35:45, 7.73s/it, loss=0.0002, acc=1.0000, iter_time=11.22s]
Epoch 0: 34%|███▍ | 4189/12384 [8:53:18<17:35:45, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 0: 34%|███▍ | 4190/12384 [8:53:18<17:31:14, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 0: 34%|███▍ | 4190/12384 [8:53:26<17:31:14, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 34%|███▍ | 4191/12384 [8:53:26<17:27:56, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 34%|███▍ | 4191/12384 [8:53:33<17:27:56, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 34%|███▍ | 4192/12384 [8:53:33<17:25:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 34%|███▍ | 4192/12384 [8:53:41<17:25:07, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.20s]
Epoch 0: 34%|███▍ | 4193/12384 [8:53:41<17:23:30, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.20s]
Epoch 0: 34%|███▍ | 4193/12384 [8:53:49<17:23:30, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 34%|███▍ | 4194/12384 [8:53:49<17:22:25, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 34%|███▍ | 4194/12384 [8:53:56<17:22:25, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.68s]
Epoch 0: 34%|███▍ | 4195/12384 [8:53:56<17:21:44, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.68s]
Epoch 0: 34%|███▍ | 4195/12384 [8:54:04<17:21:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 0: 34%|███▍ | 4196/12384 [8:54:04<17:21:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 0: 34%|███▍ | 4196/12384 [8:54:12<17:21:41, 7.63s/it, loss=0.0006, acc=0.9981, iter_time=6.15s]
Epoch 0: 34%|███▍ | 4197/12384 [8:54:12<17:20:47, 7.63s/it, loss=0.0006, acc=0.9981, iter_time=6.15s]
Epoch 0: 34%|███▍ | 4197/12384 [8:54:19<17:20:47, 7.63s/it, loss=0.0005, acc=0.9976, iter_time=7.59s]
Epoch 0: 34%|███▍ | 4198/12384 [8:54:19<17:21:10, 7.63s/it, loss=0.0005, acc=0.9976, iter_time=7.59s]
Epoch 0: 34%|███▍ | 4198/12384 [8:54:27<17:21:10, 7.63s/it, loss=0.0010, acc=0.9977, iter_time=9.14s]
Epoch 0: 34%|███▍ | 4199/12384 [8:54:27<17:20:52, 7.63s/it, loss=0.0010, acc=0.9977, iter_time=9.14s]
Epoch 0: 34%|███▍ | 4199/12384 [8:54:34<17:20:52, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=8.65s]
Epoch 0: 34%|███▍ | 4200/12384 [8:54:34<17:20:32, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=8.65s]
Epoch 0: 34%|███▍ | 4200/12384 [8:54:42<17:20:32, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=4.62s]
Epoch 0: 34%|███▍ | 4201/12384 [8:54:42<17:19:09, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.62s]
Epoch 0: 34%|███▍ | 4201/12384 [8:54:50<17:19:09, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.18s]
Epoch 0: 34%|███▍ | 4202/12384 [8:54:50<17:18:53, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.18s]
Epoch 0: 34%|███▍ | 4202/12384 [8:54:57<17:18:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 0: 34%|███▍ | 4203/12384 [8:54:57<17:18:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 0: 34%|███▍ | 4203/12384 [8:55:05<17:18:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 0: 34%|███▍ | 4204/12384 [8:55:05<17:18:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 0: 34%|███▍ | 4204/12384 [8:55:12<17:18:59, 7.62s/it, loss=0.0003, acc=0.9996, iter_time=10.76s]
Epoch 0: 34%|███▍ | 4205/12384 [8:55:12<17:18:39, 7.62s/it, loss=0.0003, acc=0.9996, iter_time=10.76s]
Epoch 0: 34%|███▍ | 4205/12384 [8:55:20<17:18:39, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 34%|███▍ | 4206/12384 [8:55:20<17:18:44, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 34%|███▍ | 4206/12384 [8:55:28<17:18:44, 7.62s/it, loss=0.0006, acc=0.9978, iter_time=7.63s]
Epoch 0: 34%|███▍ | 4207/12384 [8:55:28<17:18:26, 7.62s/it, loss=0.0006, acc=0.9978, iter_time=7.63s]
Epoch 0: 34%|███▍ | 4207/12384 [8:55:35<17:18:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 0: 34%|███▍ | 4208/12384 [8:55:35<17:17:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 0: 34%|███▍ | 4208/12384 [8:55:43<17:17:07, 7.61s/it, loss=0.0007, acc=0.9974, iter_time=6.46s]
Epoch 0: 34%|███▍ | 4209/12384 [8:55:43<17:16:18, 7.61s/it, loss=0.0007, acc=0.9974, iter_time=6.46s]
Epoch 0: 34%|███▍ | 4209/12384 [8:55:51<17:16:18, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.01s]
Epoch 0: 34%|███▍ | 4210/12384 [8:55:51<17:16:11, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.01s]
Epoch 0: 34%|███▍ | 4210/12384 [8:55:58<17:16:11, 7.61s/it, loss=0.0005, acc=1.0000, iter_time=10.38s]
Epoch 0: 34%|███▍ | 4211/12384 [8:55:58<17:16:40, 7.61s/it, loss=0.0005, acc=1.0000, iter_time=10.38s]
Epoch 0: 34%|███▍ | 4211/12384 [8:56:06<17:16:40, 7.61s/it, loss=0.0002, acc=0.9998, iter_time=7.63s]
Epoch 0: 34%|███▍ | 4212/12384 [8:56:06<17:17:22, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=7.63s]
Epoch 0: 34%|███▍ | 4212/12384 [8:56:13<17:17:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 34%|███▍ | 4213/12384 [8:56:13<17:16:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 34%|███▍ | 4213/12384 [8:56:21<17:16:52, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 34%|███▍ | 4214/12384 [8:56:21<17:17:25, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 34%|███▍ | 4214/12384 [8:56:29<17:17:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 34%|███▍ | 4215/12384 [8:56:29<17:28:59, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 34%|███▍ | 4215/12384 [8:56:37<17:28:59, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 0: 34%|███▍ | 4216/12384 [8:56:37<17:25:20, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 0: 34%|███▍ | 4216/12384 [8:56:44<17:25:20, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=3.84s]
Epoch 0: 34%|███▍ | 4217/12384 [8:56:44<17:22:11, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=3.84s]
Epoch 0: 34%|███▍ | 4217/12384 [8:56:52<17:22:11, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=10.96s]
Epoch 0: 34%|███▍ | 4218/12384 [8:56:52<17:20:19, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=10.96s]
Epoch 0: 34%|███▍ | 4218/12384 [8:56:59<17:20:19, 7.64s/it, loss=0.0001, acc=0.9999, iter_time=7.64s]
Epoch 0: 34%|███▍ | 4219/12384 [8:56:59<17:19:10, 7.64s/it, loss=0.0001, acc=0.9999, iter_time=7.64s]
Epoch 0: 34%|███▍ | 4219/12384 [8:57:07<17:19:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 34%|███▍ | 4220/12384 [8:57:07<17:22:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 34%|███▍ | 4220/12384 [8:57:15<17:22:09, 7.66s/it, loss=0.0003, acc=1.0000, iter_time=7.72s]
Epoch 0: 34%|███▍ | 4221/12384 [8:57:15<17:20:51, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=7.72s]
Epoch 0: 34%|███▍ | 4221/12384 [8:57:22<17:20:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 0: 34%|███▍ | 4222/12384 [8:57:22<17:18:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 0: 34%|███▍ | 4222/12384 [8:57:30<17:18:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 0: 34%|███▍ | 4223/12384 [8:57:30<17:17:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 0: 34%|███▍ | 4223/12384 [8:57:38<17:17:53, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=8.00s]
Epoch 0: 34%|███▍ | 4224/12384 [8:57:38<17:17:07, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=8.00s]
Epoch 0: 34%|███▍ | 4224/12384 [8:57:45<17:17:07, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.25s]
Epoch 0: 34%|███▍ | 4225/12384 [8:57:45<17:17:27, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.25s]
Epoch 0: 34%|███▍ | 4225/12384 [8:57:53<17:17:27, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=4.48s]
Epoch 0: 34%|███▍ | 4226/12384 [8:57:53<17:16:33, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.48s]
Epoch 0: 34%|███▍ | 4226/12384 [8:58:00<17:16:33, 7.62s/it, loss=0.0002, acc=0.9993, iter_time=9.81s]
Epoch 0: 34%|███▍ | 4227/12384 [8:58:00<17:15:49, 7.62s/it, loss=0.0002, acc=0.9993, iter_time=9.81s]
Epoch 0: 34%|███▍ | 4227/12384 [8:58:08<17:15:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 0: 34%|███▍ | 4228/12384 [8:58:08<17:14:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 0: 34%|███▍ | 4228/12384 [8:58:16<17:14:37, 7.61s/it, loss=0.0005, acc=0.9984, iter_time=7.60s]
Epoch 0: 34%|███▍ | 4229/12384 [8:58:16<17:14:21, 7.61s/it, loss=0.0005, acc=0.9984, iter_time=7.60s]
Epoch 0: 34%|███▍ | 4229/12384 [8:58:23<17:14:21, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.59s]
Epoch 0: 34%|███▍ | 4230/12384 [8:58:23<17:13:55, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.59s]
Epoch 0: 34%|███▍ | 4230/12384 [8:58:31<17:13:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 0: 34%|███▍ | 4231/12384 [8:58:31<17:13:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 0: 34%|███▍ | 4231/12384 [8:58:38<17:13:31, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.43s]
Epoch 0: 34%|███▍ | 4232/12384 [8:58:38<17:13:40, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.43s]
Epoch 0: 34%|███▍ | 4232/12384 [8:58:46<17:13:40, 7.61s/it, loss=0.0009, acc=0.9978, iter_time=7.66s]
Epoch 0: 34%|███▍ | 4233/12384 [8:58:46<17:13:32, 7.61s/it, loss=0.0009, acc=0.9978, iter_time=7.66s]
Epoch 0: 34%|███▍ | 4233/12384 [8:58:54<17:13:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 34%|███▍ | 4234/12384 [8:58:54<17:13:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 34%|███▍ | 4234/12384 [8:59:01<17:13:58, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=5.64s]
Epoch 0: 34%|███▍ | 4235/12384 [8:59:01<17:12:36, 7.60s/it, loss=0.0002, acc=1.0000, iter_time=5.64s]
Epoch 0: 34%|███▍ | 4235/12384 [8:59:09<17:12:36, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.58s]
Epoch 0: 34%|███▍ | 4236/12384 [8:59:09<17:15:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.58s]
Epoch 0: 34%|███▍ | 4236/12384 [8:59:17<17:15:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 34%|███▍ | 4237/12384 [8:59:17<17:14:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 34%|███▍ | 4237/12384 [8:59:24<17:14:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 34%|███▍ | 4238/12384 [8:59:24<17:14:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 34%|███▍ | 4238/12384 [8:59:32<17:14:51, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 34%|███▍ | 4239/12384 [8:59:32<17:18:25, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 34%|███▍ | 4239/12384 [8:59:39<17:18:25, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.12s]
Epoch 0: 34%|███▍ | 4240/12384 [8:59:39<17:16:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.12s]
Epoch 0: 34%|███▍ | 4240/12384 [8:59:47<17:16:41, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=3.94s]
Epoch 0: 34%|███▍ | 4241/12384 [8:59:47<17:28:55, 7.73s/it, loss=0.0001, acc=1.0000, iter_time=3.94s]
Epoch 0: 34%|███▍ | 4241/12384 [8:59:55<17:28:55, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 0: 34%|███▍ | 4242/12384 [8:59:55<17:23:32, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 0: 34%|███▍ | 4242/12384 [9:00:03<17:23:32, 7.69s/it, loss=0.0001, acc=0.9998, iter_time=9.71s]
Epoch 0: 34%|███▍ | 4243/12384 [9:00:03<17:20:29, 7.67s/it, loss=0.0001, acc=0.9998, iter_time=9.71s]
Epoch 0: 34%|███▍ | 4243/12384 [9:00:10<17:20:29, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=5.70s]
Epoch 0: 34%|███▍ | 4244/12384 [9:00:10<17:17:56, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=5.70s]
Epoch 0: 34%|███▍ | 4244/12384 [9:00:18<17:17:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 0: 34%|███▍ | 4245/12384 [9:00:18<17:16:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 0: 34%|███▍ | 4245/12384 [9:00:25<17:16:07, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 34%|███▍ | 4246/12384 [9:00:25<17:14:36, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 34%|███▍ | 4246/12384 [9:00:33<17:14:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 0: 34%|███▍ | 4247/12384 [9:00:33<17:13:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 0: 34%|███▍ | 4247/12384 [9:00:41<17:13:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 0: 34%|███▍ | 4248/12384 [9:00:41<17:12:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 0: 34%|███▍ | 4248/12384 [9:00:48<17:12:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 34%|███▍ | 4249/12384 [9:00:48<17:12:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 34%|███▍ | 4249/12384 [9:00:56<17:12:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 0: 34%|███▍ | 4250/12384 [9:00:56<17:12:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 0: 34%|███▍ | 4250/12384 [9:01:04<17:12:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.15s]
Epoch 0: 34%|███▍ | 4251/12384 [9:01:04<17:12:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.15s]
Epoch 0: 34%|███▍ | 4251/12384 [9:01:11<17:12:01, 7.61s/it, loss=0.0003, acc=0.9998, iter_time=6.88s]
Epoch 0: 34%|███▍ | 4252/12384 [9:01:11<17:12:24, 7.62s/it, loss=0.0003, acc=0.9998, iter_time=6.88s]
Epoch 0: 34%|███▍ | 4252/12384 [9:01:19<17:12:24, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.39s]
Epoch 0: 34%|███▍ | 4253/12384 [9:01:19<17:12:15, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.39s]
Epoch 0: 34%|███▍ | 4253/12384 [9:01:26<17:12:15, 7.62s/it, loss=0.0002, acc=0.9982, iter_time=7.62s]
Epoch 0: 34%|███▍ | 4254/12384 [9:01:26<17:12:47, 7.62s/it, loss=0.0002, acc=0.9982, iter_time=7.62s]
Epoch 0: 34%|███▍ | 4254/12384 [9:01:34<17:12:47, 7.62s/it, loss=0.0033, acc=0.9961, iter_time=7.66s]
Epoch 0: 34%|███▍ | 4255/12384 [9:01:34<17:12:53, 7.62s/it, loss=0.0033, acc=0.9961, iter_time=7.66s]
Epoch 0: 34%|███▍ | 4255/12384 [9:01:42<17:12:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 34%|███▍ | 4256/12384 [9:01:42<17:11:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 34%|███▍ | 4256/12384 [9:01:49<17:11:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 34%|███▍ | 4257/12384 [9:01:49<17:15:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 34%|███▍ | 4257/12384 [9:01:57<17:15:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.59s]
Epoch 0: 34%|███▍ | 4258/12384 [9:01:57<17:13:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.59s]
Epoch 0: 34%|███▍ | 4258/12384 [9:02:05<17:13:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 0: 34%|███▍ | 4259/12384 [9:02:05<17:13:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 0: 34%|███▍ | 4259/12384 [9:02:12<17:13:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.49s]
Epoch 0: 34%|███▍ | 4260/12384 [9:02:12<17:14:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.49s]
Epoch 0: 34%|███▍ | 4260/12384 [9:02:20<17:14:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.05s]
Epoch 0: 34%|███▍ | 4261/12384 [9:02:20<17:26:13, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=11.05s]
Epoch 0: 34%|███▍ | 4261/12384 [9:02:28<17:26:13, 7.73s/it, loss=0.0023, acc=0.9980, iter_time=6.11s]
Epoch 0: 34%|███▍ | 4262/12384 [9:02:28<17:21:52, 7.70s/it, loss=0.0023, acc=0.9980, iter_time=6.11s]
Epoch 0: 34%|███▍ | 4262/12384 [9:02:35<17:21:52, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 0: 34%|███▍ | 4263/12384 [9:02:35<17:18:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 0: 34%|███▍ | 4263/12384 [9:02:43<17:18:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 34%|███▍ | 4264/12384 [9:02:43<17:15:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 34%|███▍ | 4264/12384 [9:02:51<17:15:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 34%|███▍ | 4265/12384 [9:02:51<17:12:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 34%|███▍ | 4265/12384 [9:02:58<17:12:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 0: 34%|███▍ | 4266/12384 [9:02:58<17:11:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 0: 34%|███▍ | 4266/12384 [9:03:06<17:11:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 0: 34%|███▍ | 4267/12384 [9:03:06<17:23:21, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 0: 34%|███▍ | 4267/12384 [9:03:14<17:23:21, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.25s]
Epoch 0: 34%|███▍ | 4268/12384 [9:03:14<17:20:07, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.25s]
Epoch 0: 34%|███▍ | 4268/12384 [9:03:21<17:20:07, 7.69s/it, loss=0.0007, acc=0.9975, iter_time=8.55s]
Epoch 0: 34%|███▍ | 4269/12384 [9:03:21<17:16:05, 7.66s/it, loss=0.0007, acc=0.9975, iter_time=8.55s]
Epoch 0: 34%|███▍ | 4269/12384 [9:03:29<17:16:05, 7.66s/it, loss=0.0007, acc=0.9982, iter_time=7.61s]
Epoch 0: 34%|███▍ | 4270/12384 [9:03:29<17:13:51, 7.64s/it, loss=0.0007, acc=0.9982, iter_time=7.61s]
Epoch 0: 34%|███▍ | 4270/12384 [9:03:37<17:13:51, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 34%|███▍ | 4271/12384 [9:03:37<17:11:37, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 34%|███▍ | 4271/12384 [9:03:44<17:11:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 34%|███▍ | 4272/12384 [9:03:44<17:11:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 34%|███▍ | 4272/12384 [9:03:52<17:11:10, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=4.88s]
Epoch 0: 35%|███▍ | 4273/12384 [9:03:52<17:10:49, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=4.88s]
Epoch 0: 35%|███▍ | 4273/12384 [9:03:59<17:10:49, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.95s]
Epoch 0: 35%|███▍ | 4274/12384 [9:03:59<17:10:15, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.95s]
Epoch 0: 35%|███▍ | 4274/12384 [9:04:07<17:10:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.60s]
Epoch 0: 35%|███▍ | 4275/12384 [9:04:07<17:09:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.60s]
Epoch 0: 35%|███▍ | 4275/12384 [9:04:15<17:09:35, 7.62s/it, loss=0.0003, acc=0.9998, iter_time=10.63s]
Epoch 0: 35%|███▍ | 4276/12384 [9:04:15<17:08:25, 7.61s/it, loss=0.0003, acc=0.9998, iter_time=10.63s]
Epoch 0: 35%|███▍ | 4276/12384 [9:04:22<17:08:25, 7.61s/it, loss=0.0003, acc=0.9980, iter_time=7.59s]
Epoch 0: 35%|███▍ | 4277/12384 [9:04:22<17:07:26, 7.60s/it, loss=0.0003, acc=0.9980, iter_time=7.59s]
Epoch 0: 35%|███▍ | 4277/12384 [9:04:30<17:07:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.54s]
Epoch 0: 35%|███▍ | 4278/12384 [9:04:30<17:07:04, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.54s]
Epoch 0: 35%|███▍ | 4278/12384 [9:04:37<17:07:04, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.67s]
Epoch 0: 35%|███▍ | 4279/12384 [9:04:37<17:07:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.67s]
Epoch 0: 35%|███▍ | 4279/12384 [9:04:45<17:07:18, 7.60s/it, loss=0.0002, acc=0.9984, iter_time=7.54s]
Epoch 0: 35%|███▍ | 4280/12384 [9:04:45<17:06:28, 7.60s/it, loss=0.0002, acc=0.9984, iter_time=7.54s]
Epoch 0: 35%|███▍ | 4280/12384 [9:04:53<17:06:28, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=4.87s]
Epoch 0: 35%|███▍ | 4281/12384 [9:04:53<17:07:02, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=4.87s]
Epoch 0: 35%|███▍ | 4281/12384 [9:05:00<17:07:02, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.41s]
Epoch 0: 35%|███▍ | 4282/12384 [9:05:00<17:07:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.41s]
Epoch 0: 35%|███▍ | 4282/12384 [9:05:08<17:07:03, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 35%|███▍ | 4283/12384 [9:05:08<17:06:41, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 35%|███▍ | 4283/12384 [9:05:15<17:06:41, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 35%|███▍ | 4284/12384 [9:05:15<17:06:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 35%|███▍ | 4284/12384 [9:05:23<17:06:09, 7.60s/it, loss=0.0003, acc=0.9993, iter_time=6.13s]
Epoch 0: 35%|███▍ | 4285/12384 [9:05:23<17:06:42, 7.61s/it, loss=0.0003, acc=0.9993, iter_time=6.13s]
Epoch 0: 35%|███▍ | 4285/12384 [9:05:31<17:06:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 0: 35%|███▍ | 4286/12384 [9:05:31<17:06:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 0: 35%|███▍ | 4286/12384 [9:05:38<17:06:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.35s]
Epoch 0: 35%|███▍ | 4287/12384 [9:05:38<17:06:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.35s]
Epoch 0: 35%|███▍ | 4287/12384 [9:05:46<17:06:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.26s]
Epoch 0: 35%|███▍ | 4288/12384 [9:05:46<17:07:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.26s]
Epoch 0: 35%|███▍ | 4288/12384 [9:05:53<17:07:13, 7.61s/it, loss=0.0005, acc=0.9985, iter_time=7.02s]
Epoch 0: 35%|███▍ | 4289/12384 [9:05:53<17:07:32, 7.62s/it, loss=0.0005, acc=0.9985, iter_time=7.02s]
Epoch 0: 35%|███▍ | 4289/12384 [9:06:01<17:07:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 0: 35%|███▍ | 4290/12384 [9:06:01<17:06:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 0: 35%|███▍ | 4290/12384 [9:06:09<17:06:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 0: 35%|███▍ | 4291/12384 [9:06:09<17:05:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 0: 35%|███▍ | 4291/12384 [9:06:16<17:05:57, 7.61s/it, loss=0.0002, acc=0.9994, iter_time=10.17s]
Epoch 0: 35%|███▍ | 4292/12384 [9:06:16<17:05:50, 7.61s/it, loss=0.0002, acc=0.9994, iter_time=10.17s]
Epoch 0: 35%|███▍ | 4292/12384 [9:06:24<17:05:50, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 35%|███▍ | 4293/12384 [9:06:24<17:19:38, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 35%|███▍ | 4293/12384 [9:06:32<17:19:38, 7.71s/it, loss=0.0027, acc=0.9933, iter_time=6.80s]
Epoch 0: 35%|███▍ | 4294/12384 [9:06:32<17:15:33, 7.68s/it, loss=0.0027, acc=0.9933, iter_time=6.80s]
Epoch 0: 35%|███▍ | 4294/12384 [9:06:39<17:15:33, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.87s]
Epoch 0: 35%|███▍ | 4295/12384 [9:06:39<17:12:26, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.87s]
Epoch 0: 35%|███▍ | 4295/12384 [9:06:47<17:12:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.42s]
Epoch 0: 35%|███▍ | 4296/12384 [9:06:47<17:10:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.42s]
Epoch 0: 35%|███▍ | 4296/12384 [9:06:55<17:10:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 0: 35%|███▍ | 4297/12384 [9:06:55<17:07:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 0: 35%|███▍ | 4297/12384 [9:07:02<17:07:41, 7.62s/it, loss=0.0007, acc=0.9981, iter_time=8.18s]
Epoch 0: 35%|███▍ | 4298/12384 [9:07:02<17:07:01, 7.62s/it, loss=0.0007, acc=0.9981, iter_time=8.18s]
Epoch 0: 35%|███▍ | 4298/12384 [9:07:10<17:07:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 35%|███▍ | 4299/12384 [9:07:10<17:06:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 35%|███▍ | 4299/12384 [9:07:18<17:06:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 0: 35%|███▍ | 4300/12384 [9:07:18<17:07:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 0: 35%|███▍ | 4300/12384 [9:07:25<17:07:56, 7.63s/it, loss=0.0002, acc=0.9989, iter_time=7.19s]
Epoch 0: 35%|███▍ | 4301/12384 [9:07:25<17:06:21, 7.62s/it, loss=0.0002, acc=0.9989, iter_time=7.19s]
Epoch 0: 35%|███▍ | 4301/12384 [9:07:33<17:06:21, 7.62s/it, loss=0.0006, acc=0.9972, iter_time=7.64s]
Epoch 0: 35%|███▍ | 4302/12384 [9:07:33<17:06:31, 7.62s/it, loss=0.0006, acc=0.9972, iter_time=7.64s]
Epoch 0: 35%|███▍ | 4302/12384 [9:07:40<17:06:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 35%|███▍ | 4303/12384 [9:07:40<17:06:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 35%|███▍ | 4303/12384 [9:07:48<17:06:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 35%|███▍ | 4304/12384 [9:07:48<17:06:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 35%|███▍ | 4304/12384 [9:07:56<17:06:16, 7.62s/it, loss=0.0022, acc=0.9982, iter_time=7.66s]
Epoch 0: 35%|███▍ | 4305/12384 [9:07:56<17:05:27, 7.62s/it, loss=0.0022, acc=0.9982, iter_time=7.66s]
Epoch 0: 35%|███▍ | 4305/12384 [9:08:03<17:05:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 35%|███▍ | 4306/12384 [9:08:03<17:05:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 35%|███▍ | 4306/12384 [9:08:11<17:05:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 0: 35%|███▍ | 4307/12384 [9:08:11<17:04:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 0: 35%|███▍ | 4307/12384 [9:08:18<17:04:46, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.18s]
Epoch 0: 35%|███▍ | 4308/12384 [9:08:18<17:05:15, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.18s]
Epoch 0: 35%|███▍ | 4308/12384 [9:08:26<17:05:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.15s]
Epoch 0: 35%|███▍ | 4309/12384 [9:08:26<17:04:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.15s]
Epoch 0: 35%|███▍ | 4309/12384 [9:08:34<17:04:12, 7.61s/it, loss=0.0011, acc=0.9979, iter_time=7.61s]
Epoch 0: 35%|███▍ | 4310/12384 [9:08:34<17:06:30, 7.63s/it, loss=0.0011, acc=0.9979, iter_time=7.61s]
Epoch 0: 35%|███▍ | 4310/12384 [9:08:41<17:06:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 35%|███▍ | 4311/12384 [9:08:41<17:06:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 35%|███▍ | 4311/12384 [9:08:49<17:06:25, 7.63s/it, loss=0.0008, acc=0.9982, iter_time=7.99s]
Epoch 0: 35%|███▍ | 4312/12384 [9:08:49<17:05:22, 7.62s/it, loss=0.0008, acc=0.9982, iter_time=7.99s]
Epoch 0: 35%|███▍ | 4312/12384 [9:08:57<17:05:22, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.49s]
Epoch 0: 35%|███▍ | 4313/12384 [9:08:57<17:15:20, 7.70s/it, loss=0.0002, acc=1.0000, iter_time=7.49s]
Epoch 0: 35%|███▍ | 4313/12384 [9:09:04<17:15:20, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 35%|███▍ | 4314/12384 [9:09:04<17:12:23, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 35%|███▍ | 4314/12384 [9:09:12<17:12:23, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 35%|███▍ | 4315/12384 [9:09:12<17:08:58, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 35%|███▍ | 4315/12384 [9:09:20<17:08:58, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 35%|███▍ | 4316/12384 [9:09:20<17:08:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 35%|███▍ | 4316/12384 [9:09:27<17:08:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 0: 35%|███▍ | 4317/12384 [9:09:27<17:05:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 0: 35%|███▍ | 4317/12384 [9:09:35<17:05:54, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.10s]
Epoch 0: 35%|███▍ | 4318/12384 [9:09:35<17:04:48, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.10s]
Epoch 0: 35%|███▍ | 4318/12384 [9:09:42<17:04:48, 7.62s/it, loss=0.0004, acc=0.9996, iter_time=5.61s]
Epoch 0: 35%|███▍ | 4319/12384 [9:09:42<17:04:06, 7.62s/it, loss=0.0004, acc=0.9996, iter_time=5.61s]
Epoch 0: 35%|███▍ | 4319/12384 [9:09:50<17:04:06, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=10.07s]
Epoch 0: 35%|███▍ | 4320/12384 [9:09:50<17:18:07, 7.72s/it, loss=0.0001, acc=0.9998, iter_time=10.07s]
Epoch 0: 35%|███▍ | 4320/12384 [9:09:58<17:18:07, 7.72s/it, loss=0.0002, acc=1.0000, iter_time=7.51s]
Epoch 0: 35%|███▍ | 4321/12384 [9:09:58<17:13:20, 7.69s/it, loss=0.0002, acc=1.0000, iter_time=7.51s]
Epoch 0: 35%|███▍ | 4321/12384 [9:10:06<17:13:20, 7.69s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 35%|███▍ | 4322/12384 [9:10:06<17:10:33, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 35%|███▍ | 4322/12384 [9:10:13<17:10:33, 7.67s/it, loss=0.0014, acc=0.9959, iter_time=3.80s]
Epoch 0: 35%|███▍ | 4323/12384 [9:10:13<17:07:40, 7.65s/it, loss=0.0014, acc=0.9959, iter_time=3.80s]
Epoch 0: 35%|███▍ | 4323/12384 [9:10:21<17:07:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.41s]
Epoch 0: 35%|███▍ | 4324/12384 [9:10:21<17:06:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.41s]
Epoch 0: 35%|███▍ | 4324/12384 [9:10:29<17:06:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.90s]
Epoch 0: 35%|███▍ | 4325/12384 [9:10:29<17:05:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.90s]
Epoch 0: 35%|███▍ | 4325/12384 [9:10:36<17:05:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.11s]
Epoch 0: 35%|███▍ | 4326/12384 [9:10:36<17:04:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.11s]
Epoch 0: 35%|███▍ | 4326/12384 [9:10:44<17:04:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 0: 35%|███▍ | 4327/12384 [9:10:44<17:03:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 0: 35%|███▍ | 4327/12384 [9:10:51<17:03:50, 7.62s/it, loss=0.0001, acc=0.9997, iter_time=7.58s]
Epoch 0: 35%|███▍ | 4328/12384 [9:10:51<17:03:07, 7.62s/it, loss=0.0001, acc=0.9997, iter_time=7.58s]
Epoch 0: 35%|███▍ | 4328/12384 [9:10:59<17:03:07, 7.62s/it, loss=0.0003, acc=0.9999, iter_time=7.64s]
Epoch 0: 35%|███▍ | 4329/12384 [9:10:59<17:02:08, 7.61s/it, loss=0.0003, acc=0.9999, iter_time=7.64s]
Epoch 0: 35%|███▍ | 4329/12384 [9:11:07<17:02:08, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 35%|███▍ | 4330/12384 [9:11:07<17:02:21, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 35%|███▍ | 4330/12384 [9:11:14<17:02:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 35%|███▍ | 4331/12384 [9:11:14<17:01:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 35%|███▍ | 4331/12384 [9:11:22<17:01:55, 7.61s/it, loss=0.0002, acc=0.9990, iter_time=7.60s]
Epoch 0: 35%|███▍ | 4332/12384 [9:11:22<17:02:23, 7.62s/it, loss=0.0002, acc=0.9990, iter_time=7.60s]
Epoch 0: 35%|███▍ | 4332/12384 [9:11:29<17:02:23, 7.62s/it, loss=0.0002, acc=0.9979, iter_time=7.61s]
Epoch 0: 35%|███▍ | 4333/12384 [9:11:29<17:02:08, 7.62s/it, loss=0.0002, acc=0.9979, iter_time=7.61s]
Epoch 0: 35%|███▍ | 4333/12384 [9:11:37<17:02:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 35%|███▍ | 4334/12384 [9:11:37<17:03:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 35%|███▍ | 4334/12384 [9:11:45<17:03:50, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 35%|███▌ | 4335/12384 [9:11:45<17:02:51, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 35%|███▌ | 4335/12384 [9:11:52<17:02:51, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=7.99s]
Epoch 0: 35%|███▌ | 4336/12384 [9:11:52<17:01:36, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=7.99s]
Epoch 0: 35%|███▌ | 4336/12384 [9:12:00<17:01:36, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.22s]
Epoch 0: 35%|███▌ | 4337/12384 [9:12:00<17:05:42, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.22s]
Epoch 0: 35%|███▌ | 4337/12384 [9:12:08<17:05:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 0: 35%|███▌ | 4338/12384 [9:12:08<17:03:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 0: 35%|███▌ | 4338/12384 [9:12:16<17:03:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.74s]
Epoch 0: 35%|███▌ | 4339/12384 [9:12:16<17:14:50, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.74s]
Epoch 0: 35%|███▌ | 4339/12384 [9:12:23<17:14:50, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=7.31s]
Epoch 0: 35%|███▌ | 4340/12384 [9:12:23<17:10:19, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.31s]
Epoch 0: 35%|███▌ | 4340/12384 [9:12:31<17:10:19, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.90s]
Epoch 0: 35%|███▌ | 4341/12384 [9:12:31<17:06:50, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.90s]
Epoch 0: 35%|███▌ | 4341/12384 [9:12:38<17:06:50, 7.66s/it, loss=0.0002, acc=0.9997, iter_time=7.64s]
Epoch 0: 35%|███▌ | 4342/12384 [9:12:38<17:05:44, 7.65s/it, loss=0.0002, acc=0.9997, iter_time=7.64s]
Epoch 0: 35%|███▌ | 4342/12384 [9:12:46<17:05:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 0: 35%|███▌ | 4343/12384 [9:12:46<17:03:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 0: 35%|███▌ | 4343/12384 [9:12:54<17:03:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 0: 35%|███▌ | 4344/12384 [9:12:54<17:03:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 0: 35%|███▌ | 4344/12384 [9:13:01<17:03:34, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=6.65s]
Epoch 0: 35%|███▌ | 4345/12384 [9:13:01<17:02:32, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=6.65s]
Epoch 0: 35%|███▌ | 4345/12384 [9:13:09<17:02:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 0: 35%|███▌ | 4346/12384 [9:13:09<17:15:54, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 0: 35%|███▌ | 4346/12384 [9:13:17<17:15:54, 7.73s/it, loss=0.0007, acc=0.9996, iter_time=7.01s]
Epoch 0: 35%|███▌ | 4347/12384 [9:13:17<17:10:55, 7.70s/it, loss=0.0007, acc=0.9996, iter_time=7.01s]
Epoch 0: 35%|███▌ | 4347/12384 [9:13:24<17:10:55, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 0: 35%|███▌ | 4348/12384 [9:13:24<17:07:00, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 0: 35%|███▌ | 4348/12384 [9:13:32<17:07:00, 7.67s/it, loss=0.0007, acc=0.9976, iter_time=9.13s]
Epoch 0: 35%|███▌ | 4349/12384 [9:13:32<17:07:22, 7.67s/it, loss=0.0007, acc=0.9976, iter_time=9.13s]
Epoch 0: 35%|███▌ | 4349/12384 [9:13:40<17:07:22, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 0: 35%|███▌ | 4350/12384 [9:13:40<17:04:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 0: 35%|███▌ | 4350/12384 [9:13:47<17:04:53, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.22s]
Epoch 0: 35%|███▌ | 4351/12384 [9:13:47<17:03:10, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.22s]
Epoch 0: 35%|███▌ | 4351/12384 [9:13:55<17:03:10, 7.64s/it, loss=0.0001, acc=0.9989, iter_time=8.03s]
Epoch 0: 35%|███▌ | 4352/12384 [9:13:55<17:05:01, 7.66s/it, loss=0.0001, acc=0.9989, iter_time=8.03s]
Epoch 0: 35%|███▌ | 4352/12384 [9:14:03<17:05:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 0: 35%|███▌ | 4353/12384 [9:14:03<17:07:02, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 0: 35%|███▌ | 4353/12384 [9:14:10<17:07:02, 7.67s/it, loss=0.0003, acc=1.0000, iter_time=5.16s]
Epoch 0: 35%|███▌ | 4354/12384 [9:14:10<17:04:18, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=5.16s]
Epoch 0: 35%|███▌ | 4354/12384 [9:14:18<17:04:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 0: 35%|███▌ | 4355/12384 [9:14:18<17:02:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 0: 35%|███▌ | 4355/12384 [9:14:26<17:02:24, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.00s]
Epoch 0: 35%|███▌ | 4356/12384 [9:14:26<17:00:22, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.00s]
Epoch 0: 35%|███▌ | 4356/12384 [9:14:33<17:00:22, 7.63s/it, loss=0.0003, acc=0.9994, iter_time=8.18s]
Epoch 0: 35%|███▌ | 4357/12384 [9:14:33<16:59:25, 7.62s/it, loss=0.0003, acc=0.9994, iter_time=8.18s]
Epoch 0: 35%|███▌ | 4357/12384 [9:14:41<16:59:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 0: 35%|███▌ | 4358/12384 [9:14:41<16:59:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 0: 35%|███▌ | 4358/12384 [9:14:48<16:59:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 0: 35%|███▌ | 4359/12384 [9:14:48<16:58:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 0: 35%|███▌ | 4359/12384 [9:14:56<16:58:32, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=8.01s]
Epoch 0: 35%|███▌ | 4360/12384 [9:14:56<16:58:27, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=8.01s]
Epoch 0: 35%|███▌ | 4360/12384 [9:15:04<16:58:27, 7.62s/it, loss=0.0012, acc=0.9973, iter_time=5.68s]
Epoch 0: 35%|███▌ | 4361/12384 [9:15:04<16:58:29, 7.62s/it, loss=0.0012, acc=0.9973, iter_time=5.68s]
Epoch 0: 35%|███▌ | 4361/12384 [9:15:11<16:58:29, 7.62s/it, loss=0.0012, acc=0.9964, iter_time=9.18s]
Epoch 0: 35%|███▌ | 4362/12384 [9:15:11<16:58:36, 7.62s/it, loss=0.0012, acc=0.9964, iter_time=9.18s]
Epoch 0: 35%|███▌ | 4362/12384 [9:15:19<16:58:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.54s]
Epoch 0: 35%|███▌ | 4363/12384 [9:15:19<16:57:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.54s]
Epoch 0: 35%|███▌ | 4363/12384 [9:15:26<16:57:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 0: 35%|███▌ | 4364/12384 [9:15:26<16:56:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 0: 35%|███▌ | 4364/12384 [9:15:34<16:56:40, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.68s]
Epoch 0: 35%|███▌ | 4365/12384 [9:15:34<16:57:24, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.68s]
Epoch 0: 35%|███▌ | 4365/12384 [9:15:42<16:57:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 35%|███▌ | 4366/12384 [9:15:42<17:08:17, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 35%|███▌ | 4366/12384 [9:15:50<17:08:17, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 0: 35%|███▌ | 4367/12384 [9:15:50<17:04:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 0: 35%|███▌ | 4367/12384 [9:15:57<17:04:09, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=10.53s]
Epoch 0: 35%|███▌ | 4368/12384 [9:15:57<17:02:27, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=10.53s]
Epoch 0: 35%|███▌ | 4368/12384 [9:16:05<17:02:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.30s]
Epoch 0: 35%|███▌ | 4369/12384 [9:16:05<17:00:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.30s]
Epoch 0: 35%|███▌ | 4369/12384 [9:16:12<17:00:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 0: 35%|███▌ | 4370/12384 [9:16:12<16:59:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 0: 35%|███▌ | 4370/12384 [9:16:20<16:59:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 35%|███▌ | 4371/12384 [9:16:20<16:58:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 35%|███▌ | 4371/12384 [9:16:28<16:58:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 0: 35%|███▌ | 4372/12384 [9:16:28<16:58:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 0: 35%|███▌ | 4372/12384 [9:16:36<16:58:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 35%|███▌ | 4373/12384 [9:16:36<17:10:53, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 35%|███▌ | 4373/12384 [9:16:43<17:10:53, 7.72s/it, loss=0.0013, acc=0.9964, iter_time=7.86s]
Epoch 0: 35%|███▌ | 4374/12384 [9:16:43<17:06:36, 7.69s/it, loss=0.0013, acc=0.9964, iter_time=7.86s]
Epoch 0: 35%|███▌ | 4374/12384 [9:16:51<17:06:36, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 35%|███▌ | 4375/12384 [9:16:51<17:03:46, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 35%|███▌ | 4375/12384 [9:16:58<17:03:46, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 35%|███▌ | 4376/12384 [9:16:58<17:01:50, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 35%|███▌ | 4376/12384 [9:17:06<17:01:50, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=4.89s]
Epoch 0: 35%|███▌ | 4377/12384 [9:17:06<17:00:03, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=4.89s]
Epoch 0: 35%|███▌ | 4377/12384 [9:17:14<17:00:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 0: 35%|███▌ | 4378/12384 [9:17:14<16:58:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 0: 35%|███▌ | 4378/12384 [9:17:21<16:58:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 0: 35%|███▌ | 4379/12384 [9:17:21<16:57:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 0: 35%|███▌ | 4379/12384 [9:17:29<16:57:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 0: 35%|███▌ | 4380/12384 [9:17:29<16:57:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 0: 35%|███▌ | 4380/12384 [9:17:37<16:57:11, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.96s]
Epoch 0: 35%|███▌ | 4381/12384 [9:17:37<16:56:53, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.96s]
Epoch 0: 35%|███▌ | 4381/12384 [9:17:44<16:56:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 0: 35%|███▌ | 4382/12384 [9:17:44<16:56:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 0: 35%|███▌ | 4382/12384 [9:17:52<16:56:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 0: 35%|███▌ | 4383/12384 [9:17:52<16:56:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 0: 35%|███▌ | 4383/12384 [9:17:59<16:56:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 35%|███▌ | 4384/12384 [9:17:59<16:56:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 35%|███▌ | 4384/12384 [9:18:07<16:56:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 0: 35%|███▌ | 4385/12384 [9:18:07<16:55:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 0: 35%|███▌ | 4385/12384 [9:18:15<16:55:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 0: 35%|███▌ | 4386/12384 [9:18:15<16:54:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 0: 35%|███▌ | 4386/12384 [9:18:22<16:54:57, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 35%|███▌ | 4387/12384 [9:18:22<16:54:46, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 35%|███▌ | 4387/12384 [9:18:30<16:54:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 0: 35%|███▌ | 4388/12384 [9:18:30<16:55:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 0: 35%|███▌ | 4388/12384 [9:18:37<16:55:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 0: 35%|███▌ | 4389/12384 [9:18:37<16:54:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 0: 35%|███▌ | 4389/12384 [9:18:45<16:54:00, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 35%|███▌ | 4390/12384 [9:18:45<16:53:44, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 35%|███▌ | 4390/12384 [9:18:53<16:53:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 0: 35%|███▌ | 4391/12384 [9:18:53<16:55:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 0: 35%|███▌ | 4391/12384 [9:19:00<16:55:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 0: 35%|███▌ | 4392/12384 [9:19:00<16:54:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 0: 35%|███▌ | 4392/12384 [9:19:08<16:54:12, 7.61s/it, loss=0.0007, acc=0.9981, iter_time=7.56s]
Epoch 0: 35%|███▌ | 4393/12384 [9:19:08<17:07:21, 7.71s/it, loss=0.0007, acc=0.9981, iter_time=7.56s]
Epoch 0: 35%|███▌ | 4393/12384 [9:19:16<17:07:21, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 35%|███▌ | 4394/12384 [9:19:16<17:06:04, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 35%|███▌ | 4394/12384 [9:19:24<17:06:04, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 0: 35%|███▌ | 4395/12384 [9:19:24<17:05:23, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 0: 35%|███▌ | 4395/12384 [9:19:31<17:05:23, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 0: 35%|███▌ | 4396/12384 [9:19:31<17:05:03, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 0: 35%|███▌ | 4396/12384 [9:19:39<17:05:03, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=8.47s]
Epoch 0: 36%|███▌ | 4397/12384 [9:19:39<17:01:30, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=8.47s]
Epoch 0: 36%|███▌ | 4397/12384 [9:19:47<17:01:30, 7.67s/it, loss=0.0003, acc=0.9996, iter_time=10.47s]
Epoch 0: 36%|███▌ | 4398/12384 [9:19:47<16:58:39, 7.65s/it, loss=0.0003, acc=0.9996, iter_time=10.47s]
Epoch 0: 36%|███▌ | 4398/12384 [9:19:54<16:58:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 36%|███▌ | 4399/12384 [9:19:54<17:10:39, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 36%|███▌ | 4399/12384 [9:20:02<17:10:39, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.33s]
Epoch 0: 36%|███▌ | 4400/12384 [9:20:02<17:06:04, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.33s]
Epoch 0: 36%|███▌ | 4400/12384 [9:20:10<17:06:04, 7.71s/it, loss=0.0003, acc=0.9999, iter_time=7.20s]
Epoch 0: 36%|███▌ | 4401/12384 [9:20:10<17:02:38, 7.69s/it, loss=0.0003, acc=0.9999, iter_time=7.20s]
Epoch 0: 36%|███▌ | 4401/12384 [9:20:17<17:02:38, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 36%|███▌ | 4402/12384 [9:20:17<16:58:52, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 36%|███▌ | 4402/12384 [9:20:25<16:58:52, 7.66s/it, loss=0.0011, acc=0.9986, iter_time=7.63s]
Epoch 0: 36%|███▌ | 4403/12384 [9:20:25<16:56:59, 7.65s/it, loss=0.0011, acc=0.9986, iter_time=7.63s]
Epoch 0: 36%|███▌ | 4403/12384 [9:20:33<16:56:59, 7.65s/it, loss=0.0002, acc=0.9998, iter_time=7.59s]
Epoch 0: 36%|███▌ | 4404/12384 [9:20:33<16:54:38, 7.63s/it, loss=0.0002, acc=0.9998, iter_time=7.59s]
Epoch 0: 36%|███▌ | 4404/12384 [9:20:40<16:54:38, 7.63s/it, loss=0.0006, acc=0.9985, iter_time=7.62s]
Epoch 0: 36%|███▌ | 4405/12384 [9:20:40<16:54:11, 7.63s/it, loss=0.0006, acc=0.9985, iter_time=7.62s]
Epoch 0: 36%|███▌ | 4405/12384 [9:20:48<16:54:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 36%|███▌ | 4406/12384 [9:20:48<16:53:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 36%|███▌ | 4406/12384 [9:20:55<16:53:20, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.74s]
Epoch 0: 36%|███▌ | 4407/12384 [9:20:55<16:52:01, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.74s]
Epoch 0: 36%|███▌ | 4407/12384 [9:21:03<16:52:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.83s]
Epoch 0: 36%|███▌ | 4408/12384 [9:21:03<16:52:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.83s]
Epoch 0: 36%|███▌ | 4408/12384 [9:21:11<16:52:17, 7.62s/it, loss=0.0001, acc=0.9994, iter_time=5.16s]
Epoch 0: 36%|███▌ | 4409/12384 [9:21:11<16:51:19, 7.61s/it, loss=0.0001, acc=0.9994, iter_time=5.16s]
Epoch 0: 36%|███▌ | 4409/12384 [9:21:18<16:51:19, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=9.11s]
Epoch 0: 36%|███▌ | 4410/12384 [9:21:18<16:51:16, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=9.11s]
Epoch 0: 36%|███▌ | 4410/12384 [9:21:26<16:51:16, 7.61s/it, loss=0.0001, acc=0.9997, iter_time=8.17s]
Epoch 0: 36%|███▌ | 4411/12384 [9:21:26<16:50:35, 7.61s/it, loss=0.0001, acc=0.9997, iter_time=8.17s]
Epoch 0: 36%|███▌ | 4411/12384 [9:21:33<16:50:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 0: 36%|███▌ | 4412/12384 [9:21:33<16:52:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 0: 36%|███▌ | 4412/12384 [9:21:41<16:52:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 0: 36%|███▌ | 4413/12384 [9:21:41<16:51:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 0: 36%|███▌ | 4413/12384 [9:21:49<16:51:22, 7.61s/it, loss=0.0002, acc=0.9991, iter_time=9.34s]
Epoch 0: 36%|███▌ | 4414/12384 [9:21:49<16:50:43, 7.61s/it, loss=0.0002, acc=0.9991, iter_time=9.34s]
Epoch 0: 36%|███▌ | 4414/12384 [9:21:56<16:50:43, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.31s]
Epoch 0: 36%|███▌ | 4415/12384 [9:21:56<16:51:17, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.31s]
Epoch 0: 36%|███▌ | 4415/12384 [9:22:04<16:51:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 0: 36%|███▌ | 4416/12384 [9:22:04<16:52:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 0: 36%|███▌ | 4416/12384 [9:22:12<16:52:47, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.28s]
Epoch 0: 36%|███▌ | 4417/12384 [9:22:12<16:51:25, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.28s]
Epoch 0: 36%|███▌ | 4417/12384 [9:22:19<16:51:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 36%|███▌ | 4418/12384 [9:22:19<16:51:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 36%|███▌ | 4418/12384 [9:22:27<16:51:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 0: 36%|███▌ | 4419/12384 [9:22:27<17:01:31, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 0: 36%|███▌ | 4419/12384 [9:22:35<17:01:31, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=6.95s]
Epoch 0: 36%|███▌ | 4420/12384 [9:22:35<16:57:34, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=6.95s]
Epoch 0: 36%|███▌ | 4420/12384 [9:22:42<16:57:34, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.68s]
Epoch 0: 36%|███▌ | 4421/12384 [9:22:42<16:54:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.68s]
Epoch 0: 36%|███▌ | 4421/12384 [9:22:50<16:54:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 0: 36%|███▌ | 4422/12384 [9:22:50<16:52:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 0: 36%|███▌ | 4422/12384 [9:22:57<16:52:35, 7.63s/it, loss=0.0003, acc=0.9990, iter_time=7.62s]
Epoch 0: 36%|███▌ | 4423/12384 [9:22:57<16:51:03, 7.62s/it, loss=0.0003, acc=0.9990, iter_time=7.62s]
Epoch 0: 36%|███▌ | 4423/12384 [9:23:05<16:51:03, 7.62s/it, loss=0.0002, acc=0.9999, iter_time=7.55s]
Epoch 0: 36%|███▌ | 4424/12384 [9:23:05<16:50:50, 7.62s/it, loss=0.0002, acc=0.9999, iter_time=7.55s]
Epoch 0: 36%|███▌ | 4424/12384 [9:23:13<16:50:50, 7.62s/it, loss=0.0009, acc=0.9989, iter_time=7.70s]
Epoch 0: 36%|███▌ | 4425/12384 [9:23:13<17:06:51, 7.74s/it, loss=0.0009, acc=0.9989, iter_time=7.70s]
Epoch 0: 36%|███▌ | 4425/12384 [9:23:21<17:06:51, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 0: 36%|███▌ | 4426/12384 [9:23:21<17:01:01, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 0: 36%|███▌ | 4426/12384 [9:23:28<17:01:01, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 36%|███▌ | 4427/12384 [9:23:28<16:59:45, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 36%|███▌ | 4427/12384 [9:23:36<16:59:45, 7.69s/it, loss=0.0002, acc=1.0000, iter_time=4.64s]
Epoch 0: 36%|███▌ | 4428/12384 [9:23:36<16:55:40, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=4.64s]
Epoch 0: 36%|███▌ | 4428/12384 [9:23:44<16:55:40, 7.66s/it, loss=0.0002, acc=0.9992, iter_time=8.87s]
Epoch 0: 36%|███▌ | 4429/12384 [9:23:44<16:53:35, 7.64s/it, loss=0.0002, acc=0.9992, iter_time=8.87s]
Epoch 0: 36%|███▌ | 4429/12384 [9:23:51<16:53:35, 7.64s/it, loss=0.0004, acc=0.9968, iter_time=9.03s]
Epoch 0: 36%|███▌ | 4430/12384 [9:23:51<16:52:03, 7.63s/it, loss=0.0004, acc=0.9968, iter_time=9.03s]
Epoch 0: 36%|███▌ | 4430/12384 [9:23:59<16:52:03, 7.63s/it, loss=0.0004, acc=0.9982, iter_time=5.68s]
Epoch 0: 36%|███▌ | 4431/12384 [9:23:59<16:52:52, 7.64s/it, loss=0.0004, acc=0.9982, iter_time=5.68s]
Epoch 0: 36%|███▌ | 4431/12384 [9:24:06<16:52:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.31s]
Epoch 0: 36%|███▌ | 4432/12384 [9:24:06<16:51:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.31s]
Epoch 0: 36%|███▌ | 4432/12384 [9:24:14<16:51:42, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.90s]
Epoch 0: 36%|███▌ | 4433/12384 [9:24:14<16:50:07, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.90s]
Epoch 0: 36%|███▌ | 4433/12384 [9:24:22<16:50:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 0: 36%|███▌ | 4434/12384 [9:24:22<16:49:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 0: 36%|███▌ | 4434/12384 [9:24:29<16:49:59, 7.62s/it, loss=0.0013, acc=0.9974, iter_time=8.74s]
Epoch 0: 36%|███▌ | 4435/12384 [9:24:29<16:49:41, 7.62s/it, loss=0.0013, acc=0.9974, iter_time=8.74s]
Epoch 0: 36%|███▌ | 4435/12384 [9:24:37<16:49:41, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.55s]
Epoch 0: 36%|███▌ | 4436/12384 [9:24:37<16:49:28, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.55s]
Epoch 0: 36%|███▌ | 4436/12384 [9:24:44<16:49:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 0: 36%|███▌ | 4437/12384 [9:24:44<16:50:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 0: 36%|███▌ | 4437/12384 [9:24:52<16:50:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 0: 36%|███▌ | 4438/12384 [9:24:52<16:49:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 0: 36%|███▌ | 4438/12384 [9:25:00<16:49:48, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 36%|███▌ | 4439/12384 [9:25:00<16:49:07, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 36%|███▌ | 4439/12384 [9:25:07<16:49:07, 7.62s/it, loss=0.0002, acc=0.9994, iter_time=7.56s]
Epoch 0: 36%|███▌ | 4440/12384 [9:25:07<16:48:34, 7.62s/it, loss=0.0002, acc=0.9994, iter_time=7.56s]
Epoch 0: 36%|███▌ | 4440/12384 [9:25:15<16:48:34, 7.62s/it, loss=0.0007, acc=0.9990, iter_time=7.06s]
Epoch 0: 36%|███▌ | 4441/12384 [9:25:15<16:48:02, 7.61s/it, loss=0.0007, acc=0.9990, iter_time=7.06s]
Epoch 0: 36%|███▌ | 4441/12384 [9:25:23<16:48:02, 7.61s/it, loss=0.0004, acc=0.9982, iter_time=8.21s]
Epoch 0: 36%|███▌ | 4442/12384 [9:25:23<16:48:57, 7.62s/it, loss=0.0004, acc=0.9982, iter_time=8.21s]
Epoch 0: 36%|███▌ | 4442/12384 [9:25:30<16:48:57, 7.62s/it, loss=0.0009, acc=0.9980, iter_time=7.65s]
Epoch 0: 36%|███▌ | 4443/12384 [9:25:30<16:48:11, 7.62s/it, loss=0.0009, acc=0.9980, iter_time=7.65s]
Epoch 0: 36%|███▌ | 4443/12384 [9:25:38<16:48:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 36%|███▌ | 4444/12384 [9:25:38<16:50:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 36%|███▌ | 4444/12384 [9:25:46<16:50:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 36%|███▌ | 4445/12384 [9:25:46<17:00:35, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 36%|███▌ | 4445/12384 [9:25:53<17:00:35, 7.71s/it, loss=0.0002, acc=1.0000, iter_time=7.59s]
Epoch 0: 36%|███▌ | 4446/12384 [9:25:53<16:55:58, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=7.59s]
Epoch 0: 36%|███▌ | 4446/12384 [9:26:01<16:55:58, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 36%|███▌ | 4447/12384 [9:26:01<16:53:49, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 36%|███▌ | 4447/12384 [9:26:09<16:53:49, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=8.02s]
Epoch 0: 36%|███▌ | 4448/12384 [9:26:09<16:51:37, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.02s]
Epoch 0: 36%|███▌ | 4448/12384 [9:26:16<16:51:37, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=6.91s]
Epoch 0: 36%|███▌ | 4449/12384 [9:26:16<16:49:28, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=6.91s]
Epoch 0: 36%|███▌ | 4449/12384 [9:26:24<16:49:28, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=8.27s]
Epoch 0: 36%|███▌ | 4450/12384 [9:26:24<16:47:22, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=8.27s]
Epoch 0: 36%|███▌ | 4450/12384 [9:26:32<16:47:22, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.66s]
Epoch 0: 36%|███▌ | 4451/12384 [9:26:32<17:00:38, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=4.66s]
Epoch 0: 36%|███▌ | 4451/12384 [9:26:39<17:00:38, 7.72s/it, loss=0.0003, acc=0.9999, iter_time=10.51s]
Epoch 0: 36%|███▌ | 4452/12384 [9:26:39<16:56:09, 7.69s/it, loss=0.0003, acc=0.9999, iter_time=10.51s]
Epoch 0: 36%|███▌ | 4452/12384 [9:26:47<16:56:09, 7.69s/it, loss=0.0023, acc=0.9976, iter_time=6.08s]
Epoch 0: 36%|███▌ | 4453/12384 [9:26:47<16:53:33, 7.67s/it, loss=0.0023, acc=0.9976, iter_time=6.08s]
Epoch 0: 36%|███▌ | 4453/12384 [9:26:55<16:53:33, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 0: 36%|███▌ | 4454/12384 [9:26:55<16:50:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 0: 36%|███▌ | 4454/12384 [9:27:02<16:50:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 36%|███▌ | 4455/12384 [9:27:02<16:49:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 36%|███▌ | 4455/12384 [9:27:10<16:49:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 36%|███▌ | 4456/12384 [9:27:10<16:48:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 36%|███▌ | 4456/12384 [9:27:17<16:48:10, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=3.23s]
Epoch 0: 36%|███▌ | 4457/12384 [9:27:17<16:47:21, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=3.23s]
Epoch 0: 36%|███▌ | 4457/12384 [9:27:25<16:47:21, 7.62s/it, loss=0.0018, acc=0.9974, iter_time=11.58s]
Epoch 0: 36%|███▌ | 4458/12384 [9:27:25<16:47:03, 7.62s/it, loss=0.0018, acc=0.9974, iter_time=11.58s]
Epoch 0: 36%|███▌ | 4458/12384 [9:27:33<16:47:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.78s]
Epoch 0: 36%|███▌ | 4459/12384 [9:27:33<16:45:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.78s]
Epoch 0: 36%|███▌ | 4459/12384 [9:27:40<16:45:46, 7.61s/it, loss=0.0001, acc=0.9997, iter_time=7.84s]
Epoch 0: 36%|███▌ | 4460/12384 [9:27:40<16:44:51, 7.61s/it, loss=0.0001, acc=0.9997, iter_time=7.84s]
Epoch 0: 36%|███▌ | 4460/12384 [9:27:48<16:44:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 0: 36%|███▌ | 4461/12384 [9:27:48<16:44:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 0: 36%|███▌ | 4461/12384 [9:27:55<16:44:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 36%|███▌ | 4462/12384 [9:27:55<16:44:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 36%|███▌ | 4462/12384 [9:28:03<16:44:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.13s]
Epoch 0: 36%|███▌ | 4463/12384 [9:28:03<16:44:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.13s]
Epoch 0: 36%|███▌ | 4463/12384 [9:28:11<16:44:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 0: 36%|███▌ | 4464/12384 [9:28:11<16:45:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 0: 36%|███▌ | 4464/12384 [9:28:18<16:45:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 36%|███▌ | 4465/12384 [9:28:18<16:44:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 36%|███▌ | 4465/12384 [9:28:26<16:44:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 36%|███▌ | 4466/12384 [9:28:26<16:44:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 36%|███▌ | 4466/12384 [9:28:33<16:44:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 0: 36%|███▌ | 4467/12384 [9:28:33<16:43:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 0: 36%|███▌ | 4467/12384 [9:28:41<16:43:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 0: 36%|███▌ | 4468/12384 [9:28:41<16:44:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 0: 36%|███▌ | 4468/12384 [9:28:49<16:44:23, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.31s]
Epoch 0: 36%|███▌ | 4469/12384 [9:28:49<16:43:09, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=5.31s]
Epoch 0: 36%|███▌ | 4469/12384 [9:28:56<16:43:09, 7.60s/it, loss=0.0002, acc=1.0000, iter_time=8.41s]
Epoch 0: 36%|███▌ | 4470/12384 [9:28:56<16:43:12, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=8.41s]
Epoch 0: 36%|███▌ | 4470/12384 [9:29:04<16:43:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 0: 36%|███▌ | 4471/12384 [9:29:04<16:54:40, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 0: 36%|███▌ | 4471/12384 [9:29:12<16:54:40, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 36%|███▌ | 4472/12384 [9:29:12<16:51:27, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 36%|███▌ | 4472/12384 [9:29:19<16:51:27, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.99s]
Epoch 0: 36%|███▌ | 4473/12384 [9:29:19<16:48:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.99s]
Epoch 0: 36%|███▌ | 4473/12384 [9:29:27<16:48:28, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.83s]
Epoch 0: 36%|███▌ | 4474/12384 [9:29:27<16:47:12, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.83s]
Epoch 0: 36%|███▌ | 4474/12384 [9:29:35<16:47:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 0: 36%|███▌ | 4475/12384 [9:29:35<16:46:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 0: 36%|███▌ | 4475/12384 [9:29:42<16:46:14, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.30s]
Epoch 0: 36%|███▌ | 4476/12384 [9:29:42<16:45:36, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.30s]
Epoch 0: 36%|███▌ | 4476/12384 [9:29:50<16:45:36, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.31s]
Epoch 0: 36%|███▌ | 4477/12384 [9:29:50<17:00:29, 7.74s/it, loss=0.0001, acc=1.0000, iter_time=8.31s]
Epoch 0: 36%|███▌ | 4477/12384 [9:29:58<17:00:29, 7.74s/it, loss=0.0001, acc=1.0000, iter_time=7.96s]
Epoch 0: 36%|███▌ | 4478/12384 [9:29:58<16:55:29, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.96s]
Epoch 0: 36%|███▌ | 4478/12384 [9:30:06<16:55:29, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 36%|███▌ | 4479/12384 [9:30:06<16:51:46, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 36%|███▌ | 4479/12384 [9:30:13<16:51:46, 7.68s/it, loss=0.0008, acc=0.9998, iter_time=8.01s]
Epoch 0: 36%|███▌ | 4480/12384 [9:30:13<16:48:41, 7.66s/it, loss=0.0008, acc=0.9998, iter_time=8.01s]
Epoch 0: 36%|███▌ | 4480/12384 [9:30:21<16:48:41, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 36%|███▌ | 4481/12384 [9:30:21<16:46:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 36%|███▌ | 4481/12384 [9:30:28<16:46:08, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.99s]
Epoch 0: 36%|███▌ | 4482/12384 [9:30:28<16:45:02, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.99s]
Epoch 0: 36%|███▌ | 4482/12384 [9:30:36<16:45:02, 7.63s/it, loss=0.0000, acc=0.9999, iter_time=8.24s]
Epoch 0: 36%|███▌ | 4483/12384 [9:30:36<16:44:22, 7.63s/it, loss=0.0000, acc=0.9999, iter_time=8.24s]
Epoch 0: 36%|███▌ | 4483/12384 [9:30:44<16:44:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 0: 36%|███▌ | 4484/12384 [9:30:44<16:44:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 0: 36%|███▌ | 4484/12384 [9:30:51<16:44:00, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 36%|███▌ | 4485/12384 [9:30:51<16:43:38, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 36%|███▌ | 4485/12384 [9:30:59<16:43:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 0: 36%|███▌ | 4486/12384 [9:30:59<16:44:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 0: 36%|███▌ | 4486/12384 [9:31:06<16:44:16, 7.63s/it, loss=0.0002, acc=0.9999, iter_time=7.64s]
Epoch 0: 36%|███▌ | 4487/12384 [9:31:06<16:43:34, 7.63s/it, loss=0.0002, acc=0.9999, iter_time=7.64s]
Epoch 0: 36%|███▌ | 4487/12384 [9:31:14<16:43:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 36%|███▌ | 4488/12384 [9:31:14<16:43:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 36%|███▌ | 4488/12384 [9:31:22<16:43:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 36%|███▌ | 4489/12384 [9:31:22<16:42:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 36%|███▌ | 4489/12384 [9:31:29<16:42:39, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 36%|███▋ | 4490/12384 [9:31:29<16:42:07, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 36%|███▋ | 4490/12384 [9:31:37<16:42:07, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 36%|███▋ | 4491/12384 [9:31:37<16:41:27, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 36%|███▋ | 4491/12384 [9:31:44<16:41:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.25s]
Epoch 0: 36%|███▋ | 4492/12384 [9:31:44<16:40:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.25s]
Epoch 0: 36%|███▋ | 4492/12384 [9:31:52<16:40:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.90s]
Epoch 0: 36%|███▋ | 4493/12384 [9:31:52<16:41:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.90s]
Epoch 0: 36%|███▋ | 4493/12384 [9:32:00<16:41:02, 7.61s/it, loss=0.0003, acc=0.9981, iter_time=9.73s]
Epoch 0: 36%|███▋ | 4494/12384 [9:32:00<16:40:13, 7.61s/it, loss=0.0003, acc=0.9981, iter_time=9.73s]
Epoch 0: 36%|███▋ | 4494/12384 [9:32:07<16:40:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 36%|███▋ | 4495/12384 [9:32:07<16:40:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 36%|███▋ | 4495/12384 [9:32:15<16:40:11, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=8.49s]
Epoch 0: 36%|███▋ | 4496/12384 [9:32:15<16:39:49, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=8.49s]
Epoch 0: 36%|███▋ | 4496/12384 [9:32:23<16:39:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 0: 36%|███▋ | 4497/12384 [9:32:23<16:50:26, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 0: 36%|███▋ | 4497/12384 [9:32:30<16:50:26, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 36%|███▋ | 4498/12384 [9:32:30<16:49:17, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 36%|███▋ | 4498/12384 [9:32:38<16:49:17, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 0: 36%|███▋ | 4499/12384 [9:32:38<16:45:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 0: 36%|███▋ | 4499/12384 [9:32:46<16:45:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.29s]
Epoch 0: 36%|███▋ | 4500/12384 [9:32:46<16:51:33, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.29s]
Epoch 0: 36%|███▋ | 4500/12384 [9:32:53<16:51:33, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 0: 36%|███▋ | 4501/12384 [9:32:53<16:48:28, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 0: 36%|███▋ | 4501/12384 [9:33:01<16:48:28, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 36%|███▋ | 4502/12384 [9:33:01<16:45:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 36%|███▋ | 4502/12384 [9:33:09<16:45:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 36%|███▋ | 4503/12384 [9:33:09<16:43:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 36%|███▋ | 4503/12384 [9:33:17<16:43:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 0: 36%|███▋ | 4504/12384 [9:33:17<16:55:03, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 0: 36%|███▋ | 4504/12384 [9:33:24<16:55:03, 7.73s/it, loss=0.0001, acc=0.9998, iter_time=5.17s]
Epoch 0: 36%|███▋ | 4505/12384 [9:33:24<16:52:25, 7.71s/it, loss=0.0001, acc=0.9998, iter_time=5.17s]
Epoch 0: 36%|███▋ | 4505/12384 [9:33:32<16:52:25, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.98s]
Epoch 0: 36%|███▋ | 4506/12384 [9:33:32<16:48:38, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.98s]
Epoch 0: 36%|███▋ | 4506/12384 [9:33:40<16:48:38, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 36%|███▋ | 4507/12384 [9:33:40<16:46:13, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 36%|███▋ | 4507/12384 [9:33:47<16:46:13, 7.66s/it, loss=0.0002, acc=0.9984, iter_time=7.62s]
Epoch 0: 36%|███▋ | 4508/12384 [9:33:47<16:44:12, 7.65s/it, loss=0.0002, acc=0.9984, iter_time=7.62s]
Epoch 0: 36%|███▋ | 4508/12384 [9:33:55<16:44:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 0: 36%|███▋ | 4509/12384 [9:33:55<16:43:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 0: 36%|███▋ | 4509/12384 [9:34:02<16:43:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 0: 36%|███▋ | 4510/12384 [9:34:02<16:41:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 0: 36%|███▋ | 4510/12384 [9:34:10<16:41:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 36%|███▋ | 4511/12384 [9:34:10<16:40:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 36%|███▋ | 4511/12384 [9:34:18<16:40:24, 7.62s/it, loss=0.0003, acc=0.9990, iter_time=8.00s]
Epoch 0: 36%|███▋ | 4512/12384 [9:34:18<16:42:25, 7.64s/it, loss=0.0003, acc=0.9990, iter_time=8.00s]
Epoch 0: 36%|███▋ | 4512/12384 [9:34:25<16:42:25, 7.64s/it, loss=0.0001, acc=0.9999, iter_time=7.30s]
Epoch 0: 36%|███▋ | 4513/12384 [9:34:25<16:41:12, 7.63s/it, loss=0.0001, acc=0.9999, iter_time=7.30s]
Epoch 0: 36%|███▋ | 4513/12384 [9:34:33<16:41:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 36%|███▋ | 4514/12384 [9:34:33<16:42:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 36%|███▋ | 4514/12384 [9:34:41<16:42:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 36%|███▋ | 4515/12384 [9:34:41<16:41:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 36%|███▋ | 4515/12384 [9:34:48<16:41:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 36%|███▋ | 4516/12384 [9:34:48<16:40:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 36%|███▋ | 4516/12384 [9:34:56<16:40:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 0: 36%|███▋ | 4517/12384 [9:34:56<16:40:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 0: 36%|███▋ | 4517/12384 [9:35:03<16:40:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.50s]
Epoch 0: 36%|███▋ | 4518/12384 [9:35:03<16:39:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.50s]
Epoch 0: 36%|███▋ | 4518/12384 [9:35:11<16:39:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 36%|███▋ | 4519/12384 [9:35:11<16:38:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 36%|███▋ | 4519/12384 [9:35:19<16:38:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 36%|███▋ | 4520/12384 [9:35:19<16:38:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 36%|███▋ | 4520/12384 [9:35:26<16:38:41, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.23s]
Epoch 0: 37%|███▋ | 4521/12384 [9:35:26<16:37:41, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.23s]
Epoch 0: 37%|███▋ | 4521/12384 [9:35:34<16:37:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 37%|███▋ | 4522/12384 [9:35:34<16:37:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 37%|███▋ | 4522/12384 [9:35:42<16:37:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 37%|███▋ | 4523/12384 [9:35:42<16:48:31, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 37%|███▋ | 4523/12384 [9:35:49<16:48:31, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 37%|███▋ | 4524/12384 [9:35:49<16:44:43, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 37%|███▋ | 4524/12384 [9:35:57<16:44:43, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 37%|███▋ | 4525/12384 [9:35:57<16:41:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 37%|███▋ | 4525/12384 [9:36:05<16:41:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 0: 37%|███▋ | 4526/12384 [9:36:05<16:40:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 0: 37%|███▋ | 4526/12384 [9:36:12<16:40:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.96s]
Epoch 0: 37%|███▋ | 4527/12384 [9:36:12<16:39:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.96s]
Epoch 0: 37%|███▋ | 4527/12384 [9:36:20<16:39:14, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=10.52s]
Epoch 0: 37%|███▋ | 4528/12384 [9:36:20<16:38:54, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=10.52s]
Epoch 0: 37%|███▋ | 4528/12384 [9:36:27<16:38:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 37%|███▋ | 4529/12384 [9:36:27<16:37:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 37%|███▋ | 4529/12384 [9:36:35<16:37:48, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.28s]
Epoch 0: 37%|███▋ | 4530/12384 [9:36:35<16:50:32, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=4.28s]
Epoch 0: 37%|███▋ | 4530/12384 [9:36:43<16:50:32, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.12s]
Epoch 0: 37%|███▋ | 4531/12384 [9:36:43<16:46:32, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.12s]
Epoch 0: 37%|███▋ | 4531/12384 [9:36:51<16:46:32, 7.69s/it, loss=0.0001, acc=0.9999, iter_time=11.81s]
Epoch 0: 37%|███▋ | 4532/12384 [9:36:51<16:43:05, 7.67s/it, loss=0.0001, acc=0.9999, iter_time=11.81s]
Epoch 0: 37%|███▋ | 4532/12384 [9:36:58<16:43:05, 7.67s/it, loss=0.0004, acc=0.9997, iter_time=6.41s]
Epoch 0: 37%|███▋ | 4533/12384 [9:36:58<16:40:52, 7.65s/it, loss=0.0004, acc=0.9997, iter_time=6.41s]
Epoch 0: 37%|███▋ | 4533/12384 [9:37:06<16:40:52, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.79s]
Epoch 0: 37%|███▋ | 4534/12384 [9:37:06<16:39:46, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.79s]
Epoch 0: 37%|███▋ | 4534/12384 [9:37:13<16:39:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 37%|███▋ | 4535/12384 [9:37:13<16:38:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 37%|███▋ | 4535/12384 [9:37:21<16:38:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 37%|███▋ | 4536/12384 [9:37:21<16:40:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 37%|███▋ | 4536/12384 [9:37:29<16:40:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 37%|███▋ | 4537/12384 [9:37:29<16:39:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 37%|███▋ | 4537/12384 [9:37:36<16:39:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 37%|███▋ | 4538/12384 [9:37:36<16:38:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 37%|███▋ | 4538/12384 [9:37:44<16:38:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 37%|███▋ | 4539/12384 [9:37:44<16:37:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 37%|███▋ | 4539/12384 [9:37:52<16:37:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 37%|███▋ | 4540/12384 [9:37:52<16:37:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 37%|███▋ | 4540/12384 [9:37:59<16:37:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 37%|███▋ | 4541/12384 [9:37:59<16:36:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 37%|███▋ | 4541/12384 [9:38:07<16:36:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 37%|███▋ | 4542/12384 [9:38:07<16:35:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 37%|███▋ | 4542/12384 [9:38:14<16:35:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 0: 37%|███▋ | 4543/12384 [9:38:14<16:35:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 0: 37%|███▋ | 4543/12384 [9:38:22<16:35:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 0: 37%|███▋ | 4544/12384 [9:38:22<16:35:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 0: 37%|███▋ | 4544/12384 [9:38:30<16:35:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.00s]
Epoch 0: 37%|███▋ | 4545/12384 [9:38:30<16:34:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.00s]
Epoch 0: 37%|███▋ | 4545/12384 [9:38:37<16:34:29, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.83s]
Epoch 0: 37%|███▋ | 4546/12384 [9:38:37<16:33:44, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.83s]
Epoch 0: 37%|███▋ | 4546/12384 [9:38:45<16:33:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 0: 37%|███▋ | 4547/12384 [9:38:45<16:37:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 0: 37%|███▋ | 4547/12384 [9:38:53<16:37:54, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=10.83s]
Epoch 0: 37%|███▋ | 4548/12384 [9:38:53<16:36:53, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=10.83s]
Epoch 0: 37%|███▋ | 4548/12384 [9:39:00<16:36:53, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.93s]
Epoch 0: 37%|███▋ | 4549/12384 [9:39:00<16:47:12, 7.71s/it, loss=0.0003, acc=1.0000, iter_time=7.93s]
Epoch 0: 37%|███▋ | 4549/12384 [9:39:08<16:47:12, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 37%|███▋ | 4550/12384 [9:39:08<16:42:41, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 37%|███▋ | 4550/12384 [9:39:16<16:42:41, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 0: 37%|███▋ | 4551/12384 [9:39:16<16:39:50, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 0: 37%|███▋ | 4551/12384 [9:39:23<16:39:50, 7.66s/it, loss=0.0003, acc=0.9998, iter_time=7.57s]
Epoch 0: 37%|███▋ | 4552/12384 [9:39:23<16:38:21, 7.65s/it, loss=0.0003, acc=0.9998, iter_time=7.57s]
Epoch 0: 37%|███▋ | 4552/12384 [9:39:31<16:38:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 0: 37%|███▋ | 4553/12384 [9:39:31<16:36:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 0: 37%|███▋ | 4553/12384 [9:39:39<16:36:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 0: 37%|███▋ | 4554/12384 [9:39:39<16:35:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 0: 37%|███▋ | 4554/12384 [9:39:46<16:35:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 0: 37%|███▋ | 4555/12384 [9:39:46<16:33:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 0: 37%|███▋ | 4555/12384 [9:39:54<16:33:46, 7.62s/it, loss=0.0003, acc=0.9999, iter_time=7.32s]
Epoch 0: 37%|███▋ | 4556/12384 [9:39:54<16:33:45, 7.62s/it, loss=0.0003, acc=0.9999, iter_time=7.32s]
Epoch 0: 37%|███▋ | 4556/12384 [9:40:02<16:33:45, 7.62s/it, loss=0.0006, acc=1.0000, iter_time=9.16s]
Epoch 0: 37%|███▋ | 4557/12384 [9:40:02<16:46:45, 7.72s/it, loss=0.0006, acc=1.0000, iter_time=9.16s]
Epoch 0: 37%|███▋ | 4557/12384 [9:40:09<16:46:45, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 0: 37%|███▋ | 4558/12384 [9:40:09<16:44:03, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 0: 37%|███▋ | 4558/12384 [9:40:17<16:44:03, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 0: 37%|███▋ | 4559/12384 [9:40:17<16:40:42, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 0: 37%|███▋ | 4559/12384 [9:40:25<16:40:42, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 0: 37%|███▋ | 4560/12384 [9:40:25<16:36:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 0: 37%|███▋ | 4560/12384 [9:40:32<16:36:35, 7.64s/it, loss=0.0003, acc=0.9980, iter_time=7.65s]
Epoch 0: 37%|███▋ | 4561/12384 [9:40:32<16:34:33, 7.63s/it, loss=0.0003, acc=0.9980, iter_time=7.65s]
Epoch 0: 37%|███▋ | 4561/12384 [9:40:40<16:34:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 0: 37%|███▋ | 4562/12384 [9:40:40<16:33:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 0: 37%|███▋ | 4562/12384 [9:40:47<16:33:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 0: 37%|███▋ | 4563/12384 [9:40:47<16:35:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 0: 37%|███▋ | 4563/12384 [9:40:55<16:35:29, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 0: 37%|███▋ | 4564/12384 [9:40:55<16:33:51, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 0: 37%|███▋ | 4564/12384 [9:41:03<16:33:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 37%|███▋ | 4565/12384 [9:41:03<16:32:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 37%|███▋ | 4565/12384 [9:41:10<16:32:35, 7.62s/it, loss=0.0013, acc=0.9962, iter_time=5.80s]
Epoch 0: 37%|███▋ | 4566/12384 [9:41:10<16:32:38, 7.62s/it, loss=0.0013, acc=0.9962, iter_time=5.80s]
Epoch 0: 37%|███▋ | 4566/12384 [9:41:18<16:32:38, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=9.43s]
Epoch 0: 37%|███▋ | 4567/12384 [9:41:18<16:32:32, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=9.43s]
Epoch 0: 37%|███▋ | 4567/12384 [9:41:25<16:32:32, 7.62s/it, loss=0.0005, acc=0.9973, iter_time=7.54s]
Epoch 0: 37%|███▋ | 4568/12384 [9:41:25<16:31:06, 7.61s/it, loss=0.0005, acc=0.9973, iter_time=7.54s]
Epoch 0: 37%|███▋ | 4568/12384 [9:41:33<16:31:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 37%|███▋ | 4569/12384 [9:41:33<16:30:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 37%|███▋ | 4569/12384 [9:41:41<16:30:49, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.66s]
Epoch 0: 37%|███▋ | 4570/12384 [9:41:41<16:29:40, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=6.66s]
Epoch 0: 37%|███▋ | 4570/12384 [9:41:48<16:29:40, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 0: 37%|███▋ | 4571/12384 [9:41:48<16:30:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 0: 37%|███▋ | 4571/12384 [9:41:56<16:30:06, 7.60s/it, loss=0.0002, acc=0.9998, iter_time=5.77s]
Epoch 0: 37%|███▋ | 4572/12384 [9:41:56<16:30:29, 7.61s/it, loss=0.0002, acc=0.9998, iter_time=5.77s]
Epoch 0: 37%|███▋ | 4572/12384 [9:42:03<16:30:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.32s]
Epoch 0: 37%|███▋ | 4573/12384 [9:42:03<16:30:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.32s]
Epoch 0: 37%|███▋ | 4573/12384 [9:42:11<16:30:52, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.95s]
Epoch 0: 37%|███▋ | 4574/12384 [9:42:11<16:32:28, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.95s]
Epoch 0: 37%|███▋ | 4574/12384 [9:42:19<16:32:28, 7.62s/it, loss=0.0005, acc=0.9992, iter_time=7.93s]
Epoch 0: 37%|███▋ | 4575/12384 [9:42:19<16:41:52, 7.70s/it, loss=0.0005, acc=0.9992, iter_time=7.93s]
Epoch 0: 37%|███▋ | 4575/12384 [9:42:27<16:41:52, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.57s]
Epoch 0: 37%|███▋ | 4576/12384 [9:42:27<16:39:14, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.57s]
Epoch 0: 37%|███▋ | 4576/12384 [9:42:34<16:39:14, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 37%|███▋ | 4577/12384 [9:42:34<16:36:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 37%|███▋ | 4577/12384 [9:42:42<16:36:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 37%|███▋ | 4578/12384 [9:42:42<16:33:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 37%|███▋ | 4578/12384 [9:42:49<16:33:47, 7.64s/it, loss=0.0003, acc=0.9983, iter_time=6.38s]
Epoch 0: 37%|███▋ | 4579/12384 [9:42:49<16:32:35, 7.63s/it, loss=0.0003, acc=0.9983, iter_time=6.38s]
Epoch 0: 37%|███▋ | 4579/12384 [9:42:57<16:32:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 0: 37%|███▋ | 4580/12384 [9:42:57<16:31:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 0: 37%|███▋ | 4580/12384 [9:43:05<16:31:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 0: 37%|███▋ | 4581/12384 [9:43:05<16:30:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 0: 37%|███▋ | 4581/12384 [9:43:12<16:30:45, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=9.43s]
Epoch 0: 37%|███▋ | 4582/12384 [9:43:12<16:30:39, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=9.43s]
Epoch 0: 37%|███▋ | 4582/12384 [9:43:20<16:30:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 37%|███▋ | 4583/12384 [9:43:20<16:43:08, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 37%|███▋ | 4583/12384 [9:43:28<16:43:08, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 0: 37%|███▋ | 4584/12384 [9:43:28<16:39:14, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 0: 37%|███▋ | 4584/12384 [9:43:35<16:39:14, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.47s]
Epoch 0: 37%|███▋ | 4585/12384 [9:43:35<16:36:30, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.47s]
Epoch 0: 37%|███▋ | 4585/12384 [9:43:43<16:36:30, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 0: 37%|███▋ | 4586/12384 [9:43:43<16:34:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 0: 37%|███▋ | 4586/12384 [9:43:51<16:34:31, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=5.62s]
Epoch 0: 37%|███▋ | 4587/12384 [9:43:51<16:32:40, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=5.62s]
Epoch 0: 37%|███▋ | 4587/12384 [9:43:58<16:32:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.14s]
Epoch 0: 37%|███▋ | 4588/12384 [9:43:58<16:30:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.14s]
Epoch 0: 37%|███▋ | 4588/12384 [9:44:06<16:30:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 37%|███▋ | 4589/12384 [9:44:06<16:30:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 37%|███▋ | 4589/12384 [9:44:13<16:30:05, 7.62s/it, loss=0.0009, acc=0.9974, iter_time=7.00s]
Epoch 0: 37%|███▋ | 4590/12384 [9:44:13<16:29:24, 7.62s/it, loss=0.0009, acc=0.9974, iter_time=7.00s]
Epoch 0: 37%|███▋ | 4590/12384 [9:44:21<16:29:24, 7.62s/it, loss=0.0008, acc=0.9968, iter_time=7.00s]
Epoch 0: 37%|███▋ | 4591/12384 [9:44:21<16:28:11, 7.61s/it, loss=0.0008, acc=0.9968, iter_time=7.00s]
Epoch 0: 37%|███▋ | 4591/12384 [9:44:29<16:28:11, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.18s]
Epoch 0: 37%|███▋ | 4592/12384 [9:44:29<16:27:57, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.18s]
Epoch 0: 37%|███▋ | 4592/12384 [9:44:36<16:27:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 37%|███▋ | 4593/12384 [9:44:36<16:29:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 37%|███▋ | 4593/12384 [9:44:44<16:29:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 0: 37%|███▋ | 4594/12384 [9:44:44<16:29:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 0: 37%|███▋ | 4594/12384 [9:44:52<16:29:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 0: 37%|███▋ | 4595/12384 [9:44:52<16:28:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 0: 37%|███▋ | 4595/12384 [9:44:59<16:28:06, 7.61s/it, loss=0.0003, acc=0.9994, iter_time=4.82s]
Epoch 0: 37%|███▋ | 4596/12384 [9:44:59<16:27:19, 7.61s/it, loss=0.0003, acc=0.9994, iter_time=4.82s]
Epoch 0: 37%|███▋ | 4596/12384 [9:45:07<16:27:19, 7.61s/it, loss=0.0002, acc=0.9991, iter_time=10.36s]
Epoch 0: 37%|███▋ | 4597/12384 [9:45:07<16:28:18, 7.62s/it, loss=0.0002, acc=0.9991, iter_time=10.36s]
Epoch 0: 37%|███▋ | 4597/12384 [9:45:14<16:28:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 37%|███▋ | 4598/12384 [9:45:14<16:27:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 37%|███▋ | 4598/12384 [9:45:22<16:27:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 37%|███▋ | 4599/12384 [9:45:22<16:27:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 37%|███▋ | 4599/12384 [9:45:30<16:27:09, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.01s]
Epoch 0: 37%|███▋ | 4600/12384 [9:45:30<16:27:27, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.01s]
Epoch 0: 37%|███▋ | 4600/12384 [9:45:37<16:27:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 37%|███▋ | 4601/12384 [9:45:37<16:27:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 37%|███▋ | 4601/12384 [9:45:45<16:27:04, 7.61s/it, loss=0.0005, acc=0.9998, iter_time=7.03s]
Epoch 0: 37%|███▋ | 4602/12384 [9:45:45<16:29:53, 7.63s/it, loss=0.0005, acc=0.9998, iter_time=7.03s]
Epoch 0: 37%|███▋ | 4602/12384 [9:45:53<16:29:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 0: 37%|███▋ | 4603/12384 [9:45:53<16:29:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 0: 37%|███▋ | 4603/12384 [9:46:00<16:29:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 37%|███▋ | 4604/12384 [9:46:00<16:29:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 37%|███▋ | 4604/12384 [9:46:08<16:29:00, 7.63s/it, loss=0.0002, acc=0.9984, iter_time=7.63s]
Epoch 0: 37%|███▋ | 4605/12384 [9:46:08<16:28:39, 7.63s/it, loss=0.0002, acc=0.9984, iter_time=7.63s]
Epoch 0: 37%|███▋ | 4605/12384 [9:46:15<16:28:39, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 37%|███▋ | 4606/12384 [9:46:15<16:27:31, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 37%|███▋ | 4606/12384 [9:46:23<16:27:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 0: 37%|███▋ | 4607/12384 [9:46:23<16:27:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 0: 37%|███▋ | 4607/12384 [9:46:31<16:27:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 0: 37%|███▋ | 4608/12384 [9:46:31<16:27:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 0: 37%|███▋ | 4608/12384 [9:46:39<16:27:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 0: 37%|███▋ | 4609/12384 [9:46:39<16:39:45, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 0: 37%|███▋ | 4609/12384 [9:46:46<16:39:45, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=7.90s]
Epoch 0: 37%|███▋ | 4610/12384 [9:46:46<16:34:44, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.90s]
Epoch 0: 37%|███▋ | 4610/12384 [9:46:54<16:34:44, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 0: 37%|███▋ | 4611/12384 [9:46:54<16:31:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 0: 37%|███▋ | 4611/12384 [9:47:01<16:31:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 0: 37%|███▋ | 4612/12384 [9:47:01<16:29:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 0: 37%|███▋ | 4612/12384 [9:47:09<16:29:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 37%|███▋ | 4613/12384 [9:47:09<16:27:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 37%|███▋ | 4613/12384 [9:47:17<16:27:46, 7.63s/it, loss=0.0002, acc=0.9984, iter_time=7.61s]
Epoch 0: 37%|███▋ | 4614/12384 [9:47:17<16:26:58, 7.62s/it, loss=0.0002, acc=0.9984, iter_time=7.61s]
Epoch 0: 37%|███▋ | 4614/12384 [9:47:24<16:26:58, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 37%|███▋ | 4615/12384 [9:47:24<16:26:45, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 37%|███▋ | 4615/12384 [9:47:32<16:26:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 0: 37%|███▋ | 4616/12384 [9:47:32<16:25:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 0: 37%|███▋ | 4616/12384 [9:47:39<16:25:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 0: 37%|███▋ | 4617/12384 [9:47:39<16:24:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 0: 37%|███▋ | 4617/12384 [9:47:47<16:24:32, 7.61s/it, loss=0.0025, acc=0.9952, iter_time=9.90s]
Epoch 0: 37%|███▋ | 4618/12384 [9:47:47<16:24:24, 7.61s/it, loss=0.0025, acc=0.9952, iter_time=9.90s]
Epoch 0: 37%|███▋ | 4618/12384 [9:47:55<16:24:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 37%|███▋ | 4619/12384 [9:47:55<16:27:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 37%|███▋ | 4619/12384 [9:48:02<16:27:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 0: 37%|███▋ | 4620/12384 [9:48:02<16:26:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 0: 37%|███▋ | 4620/12384 [9:48:10<16:26:13, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.91s]
Epoch 0: 37%|███▋ | 4621/12384 [9:48:10<16:24:52, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.91s]
Epoch 0: 37%|███▋ | 4621/12384 [9:48:17<16:24:52, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.88s]
Epoch 0: 37%|███▋ | 4622/12384 [9:48:17<16:23:38, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.88s]
Epoch 0: 37%|███▋ | 4622/12384 [9:48:25<16:23:38, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=5.50s]
Epoch 0: 37%|███▋ | 4623/12384 [9:48:25<16:23:20, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=5.50s]
Epoch 0: 37%|███▋ | 4623/12384 [9:48:33<16:23:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 0: 37%|███▋ | 4624/12384 [9:48:33<16:23:34, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 0: 37%|███▋ | 4624/12384 [9:48:40<16:23:34, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 0: 37%|███▋ | 4625/12384 [9:48:40<16:23:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 0: 37%|███▋ | 4625/12384 [9:48:48<16:23:59, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.72s]
Epoch 0: 37%|███▋ | 4626/12384 [9:48:48<16:23:21, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.72s]
Epoch 0: 37%|███▋ | 4626/12384 [9:48:55<16:23:21, 7.61s/it, loss=0.0008, acc=0.9981, iter_time=7.36s]
Epoch 0: 37%|███▋ | 4627/12384 [9:48:55<16:22:49, 7.60s/it, loss=0.0008, acc=0.9981, iter_time=7.36s]
Epoch 0: 37%|███▋ | 4627/12384 [9:49:03<16:22:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.13s]
Epoch 0: 37%|███▋ | 4628/12384 [9:49:03<16:22:51, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.13s]
Epoch 0: 37%|███▋ | 4628/12384 [9:49:11<16:22:51, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 0: 37%|███▋ | 4629/12384 [9:49:11<16:23:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 0: 37%|███▋ | 4629/12384 [9:49:18<16:23:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.46s]
Epoch 0: 37%|███▋ | 4630/12384 [9:49:18<16:23:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.46s]
Epoch 0: 37%|███▋ | 4630/12384 [9:49:26<16:23:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 37%|███▋ | 4631/12384 [9:49:26<16:25:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 37%|███▋ | 4631/12384 [9:49:34<16:25:47, 7.63s/it, loss=0.0002, acc=0.9993, iter_time=10.69s]
Epoch 0: 37%|███▋ | 4632/12384 [9:49:34<16:25:20, 7.63s/it, loss=0.0002, acc=0.9993, iter_time=10.69s]
Epoch 0: 37%|███▋ | 4632/12384 [9:49:41<16:25:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 37%|███▋ | 4633/12384 [9:49:41<16:24:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 37%|███▋ | 4633/12384 [9:49:49<16:24:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 37%|███▋ | 4634/12384 [9:49:49<16:24:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 37%|███▋ | 4634/12384 [9:49:57<16:24:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 0: 37%|███▋ | 4635/12384 [9:49:57<16:37:31, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 0: 37%|███▋ | 4635/12384 [9:50:04<16:37:31, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=7.05s]
Epoch 0: 37%|███▋ | 4636/12384 [9:50:04<16:33:27, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.05s]
Epoch 0: 37%|███▋ | 4636/12384 [9:50:12<16:33:27, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.28s]
Epoch 0: 37%|███▋ | 4637/12384 [9:50:12<16:30:32, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.28s]
Epoch 0: 37%|███▋ | 4637/12384 [9:50:20<16:30:32, 7.67s/it, loss=0.0001, acc=0.9998, iter_time=8.69s]
Epoch 0: 37%|███▋ | 4638/12384 [9:50:20<16:28:15, 7.65s/it, loss=0.0001, acc=0.9998, iter_time=8.69s]
Epoch 0: 37%|███▋ | 4638/12384 [9:50:27<16:28:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 0: 37%|███▋ | 4639/12384 [9:50:27<16:26:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 0: 37%|███▋ | 4639/12384 [9:50:35<16:26:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 37%|███▋ | 4640/12384 [9:50:35<16:26:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 37%|███▋ | 4640/12384 [9:50:42<16:26:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 37%|███▋ | 4641/12384 [9:50:42<16:24:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 37%|███▋ | 4641/12384 [9:50:50<16:24:45, 7.63s/it, loss=0.0001, acc=0.9999, iter_time=7.63s]
Epoch 0: 37%|███▋ | 4642/12384 [9:50:50<16:24:22, 7.63s/it, loss=0.0001, acc=0.9999, iter_time=7.63s]
Epoch 0: 37%|███▋ | 4642/12384 [9:50:58<16:24:22, 7.63s/it, loss=0.0014, acc=0.9965, iter_time=7.63s]
Epoch 0: 37%|███▋ | 4643/12384 [9:50:58<16:23:48, 7.63s/it, loss=0.0014, acc=0.9965, iter_time=7.63s]
Epoch 0: 37%|███▋ | 4643/12384 [9:51:05<16:23:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 38%|███▊ | 4644/12384 [9:51:05<16:23:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 38%|███▊ | 4644/12384 [9:51:13<16:23:26, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 38%|███▊ | 4645/12384 [9:51:13<16:25:00, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 38%|███▊ | 4645/12384 [9:51:21<16:25:00, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=7.66s]
Epoch 0: 38%|███▊ | 4646/12384 [9:51:21<16:24:18, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=7.66s]
Epoch 0: 38%|███▊ | 4646/12384 [9:51:28<16:24:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 0: 38%|███▊ | 4647/12384 [9:51:28<16:23:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 0: 38%|███▊ | 4647/12384 [9:51:36<16:23:25, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.31s]
Epoch 0: 38%|███▊ | 4648/12384 [9:51:36<16:23:07, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.31s]
Epoch 0: 38%|███▊ | 4648/12384 [9:51:43<16:23:07, 7.63s/it, loss=0.0002, acc=0.9988, iter_time=7.24s]
Epoch 0: 38%|███▊ | 4649/12384 [9:51:43<16:22:11, 7.62s/it, loss=0.0002, acc=0.9988, iter_time=7.24s]
Epoch 0: 38%|███▊ | 4649/12384 [9:51:51<16:22:11, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.09s]
Epoch 0: 38%|███▊ | 4650/12384 [9:51:51<16:24:53, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.09s]
Epoch 0: 38%|███▊ | 4650/12384 [9:51:59<16:24:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 38%|███▊ | 4651/12384 [9:51:59<16:22:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 38%|███▊ | 4651/12384 [9:52:06<16:22:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 38%|███▊ | 4652/12384 [9:52:06<16:21:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 38%|███▊ | 4652/12384 [9:52:14<16:21:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 38%|███▊ | 4653/12384 [9:52:14<16:20:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 38%|███▊ | 4653/12384 [9:52:22<16:20:54, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.09s]
Epoch 0: 38%|███▊ | 4654/12384 [9:52:22<16:20:33, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.09s]
Epoch 0: 38%|███▊ | 4654/12384 [9:52:29<16:20:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 0: 38%|███▊ | 4655/12384 [9:52:29<16:22:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 0: 38%|███▊ | 4655/12384 [9:52:37<16:22:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 38%|███▊ | 4656/12384 [9:52:37<16:21:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 38%|███▊ | 4656/12384 [9:52:44<16:21:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 0: 38%|███▊ | 4657/12384 [9:52:44<16:21:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 0: 38%|███▊ | 4657/12384 [9:52:52<16:21:17, 7.62s/it, loss=0.0009, acc=0.9975, iter_time=8.85s]
Epoch 0: 38%|███▊ | 4658/12384 [9:52:52<16:20:26, 7.61s/it, loss=0.0009, acc=0.9975, iter_time=8.85s]
Epoch 0: 38%|███▊ | 4658/12384 [9:53:00<16:20:26, 7.61s/it, loss=0.0002, acc=0.9986, iter_time=6.97s]
Epoch 0: 38%|███▊ | 4659/12384 [9:53:00<16:20:34, 7.62s/it, loss=0.0002, acc=0.9986, iter_time=6.97s]
Epoch 0: 38%|███▊ | 4659/12384 [9:53:07<16:20:34, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=8.25s]
Epoch 0: 38%|███▊ | 4660/12384 [9:53:07<16:20:15, 7.61s/it, loss=0.0002, acc=0.9998, iter_time=8.25s]
Epoch 0: 38%|███▊ | 4660/12384 [9:53:15<16:20:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 0: 38%|███▊ | 4661/12384 [9:53:15<16:34:25, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 0: 38%|███▊ | 4661/12384 [9:53:23<16:34:25, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 0: 38%|███▊ | 4662/12384 [9:53:23<16:30:18, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 0: 38%|███▊ | 4662/12384 [9:53:30<16:30:18, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.43s]
Epoch 0: 38%|███▊ | 4663/12384 [9:53:30<16:26:24, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.43s]
Epoch 0: 38%|███▊ | 4663/12384 [9:53:38<16:26:24, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 0: 38%|███▊ | 4664/12384 [9:53:38<16:24:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 0: 38%|███▊ | 4664/12384 [9:53:46<16:24:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 38%|███▊ | 4665/12384 [9:53:46<16:22:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 38%|███▊ | 4665/12384 [9:53:53<16:22:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 38%|███▊ | 4666/12384 [9:53:53<16:21:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 38%|███▊ | 4666/12384 [9:54:01<16:21:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.86s]
Epoch 0: 38%|███▊ | 4667/12384 [9:54:01<16:20:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.86s]
Epoch 0: 38%|███▊ | 4667/12384 [9:54:08<16:20:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.36s]
Epoch 0: 38%|███▊ | 4668/12384 [9:54:08<16:18:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.36s]
Epoch 0: 38%|███▊ | 4668/12384 [9:54:16<16:18:59, 7.61s/it, loss=0.0004, acc=0.9983, iter_time=4.31s]
Epoch 0: 38%|███▊ | 4669/12384 [9:54:16<16:18:55, 7.61s/it, loss=0.0004, acc=0.9983, iter_time=4.31s]
Epoch 0: 38%|███▊ | 4669/12384 [9:54:24<16:18:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.91s]
Epoch 0: 38%|███▊ | 4670/12384 [9:54:24<16:19:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.91s]
Epoch 0: 38%|███▊ | 4670/12384 [9:54:31<16:19:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 0: 38%|███▊ | 4671/12384 [9:54:31<16:19:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 0: 38%|███▊ | 4671/12384 [9:54:39<16:19:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.86s]
Epoch 0: 38%|███▊ | 4672/12384 [9:54:39<16:18:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.86s]
Epoch 0: 38%|███▊ | 4672/12384 [9:54:47<16:18:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 38%|███▊ | 4673/12384 [9:54:47<16:17:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 38%|███▊ | 4673/12384 [9:54:54<16:17:42, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.29s]
Epoch 0: 38%|███▊ | 4674/12384 [9:54:54<16:18:05, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.29s]
Epoch 0: 38%|███▊ | 4674/12384 [9:55:02<16:18:05, 7.61s/it, loss=0.0001, acc=0.9996, iter_time=9.93s]
Epoch 0: 38%|███▊ | 4675/12384 [9:55:02<16:20:46, 7.63s/it, loss=0.0001, acc=0.9996, iter_time=9.93s]
Epoch 0: 38%|███▊ | 4675/12384 [9:55:09<16:20:46, 7.63s/it, loss=0.0003, acc=0.9998, iter_time=6.48s]
Epoch 0: 38%|███▊ | 4676/12384 [9:55:09<16:19:16, 7.62s/it, loss=0.0003, acc=0.9998, iter_time=6.48s]
Epoch 0: 38%|███▊ | 4676/12384 [9:55:17<16:19:16, 7.62s/it, loss=0.0017, acc=0.9959, iter_time=8.79s]
Epoch 0: 38%|███▊ | 4677/12384 [9:55:17<16:18:58, 7.62s/it, loss=0.0017, acc=0.9959, iter_time=8.79s]
Epoch 0: 38%|███▊ | 4677/12384 [9:55:25<16:18:58, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 38%|███▊ | 4678/12384 [9:55:25<16:17:37, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 38%|███▊ | 4678/12384 [9:55:32<16:17:37, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=7.61s]
Epoch 0: 38%|███▊ | 4679/12384 [9:55:32<16:17:57, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=7.61s]
Epoch 0: 38%|███▊ | 4679/12384 [9:55:40<16:17:57, 7.62s/it, loss=0.0007, acc=0.9985, iter_time=8.31s]
Epoch 0: 38%|███▊ | 4680/12384 [9:55:40<16:29:11, 7.70s/it, loss=0.0007, acc=0.9985, iter_time=8.31s]
Epoch 0: 38%|███▊ | 4680/12384 [9:55:48<16:29:11, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 38%|███▊ | 4681/12384 [9:55:48<16:25:16, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 38%|███▊ | 4681/12384 [9:55:55<16:25:16, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 38%|███▊ | 4682/12384 [9:55:55<16:23:08, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 38%|███▊ | 4682/12384 [9:56:03<16:23:08, 7.66s/it, loss=0.0002, acc=0.9997, iter_time=7.61s]
Epoch 0: 38%|███▊ | 4683/12384 [9:56:03<16:20:58, 7.64s/it, loss=0.0002, acc=0.9997, iter_time=7.61s]
Epoch 0: 38%|███▊ | 4683/12384 [9:56:11<16:20:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 38%|███▊ | 4684/12384 [9:56:11<16:20:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 38%|███▊ | 4684/12384 [9:56:18<16:20:04, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 38%|███▊ | 4685/12384 [9:56:18<16:18:54, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 38%|███▊ | 4685/12384 [9:56:26<16:18:54, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=4.76s]
Epoch 0: 38%|███▊ | 4686/12384 [9:56:26<16:17:05, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.76s]
Epoch 0: 38%|███▊ | 4686/12384 [9:56:33<16:17:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.43s]
Epoch 0: 38%|███▊ | 4687/12384 [9:56:33<16:17:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.43s]
Epoch 0: 38%|███▊ | 4687/12384 [9:56:41<16:17:54, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.11s]
Epoch 0: 38%|███▊ | 4688/12384 [9:56:41<16:29:43, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=8.11s]
Epoch 0: 38%|███▊ | 4688/12384 [9:56:49<16:29:43, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.47s]
Epoch 0: 38%|███▊ | 4689/12384 [9:56:49<16:25:39, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.47s]
Epoch 0: 38%|███▊ | 4689/12384 [9:56:57<16:25:39, 7.69s/it, loss=0.0002, acc=0.9981, iter_time=7.62s]
Epoch 0: 38%|███▊ | 4690/12384 [9:56:57<16:22:24, 7.66s/it, loss=0.0002, acc=0.9981, iter_time=7.62s]
Epoch 0: 38%|███▊ | 4690/12384 [9:57:04<16:22:24, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 38%|███▊ | 4691/12384 [9:57:04<16:19:42, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 38%|███▊ | 4691/12384 [9:57:12<16:19:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 38%|███▊ | 4692/12384 [9:57:12<16:17:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 38%|███▊ | 4692/12384 [9:57:19<16:17:28, 7.62s/it, loss=0.0057, acc=0.9956, iter_time=7.61s]
Epoch 0: 38%|███▊ | 4693/12384 [9:57:19<16:16:49, 7.62s/it, loss=0.0057, acc=0.9956, iter_time=7.61s]
Epoch 0: 38%|███▊ | 4693/12384 [9:57:27<16:16:49, 7.62s/it, loss=0.0005, acc=0.9978, iter_time=3.66s]
Epoch 0: 38%|███▊ | 4694/12384 [9:57:27<16:16:43, 7.62s/it, loss=0.0005, acc=0.9978, iter_time=3.66s]
Epoch 0: 38%|███▊ | 4694/12384 [9:57:35<16:16:43, 7.62s/it, loss=0.0002, acc=0.9987, iter_time=11.56s]
Epoch 0: 38%|███▊ | 4695/12384 [9:57:35<16:16:10, 7.62s/it, loss=0.0002, acc=0.9987, iter_time=11.56s]
Epoch 0: 38%|███▊ | 4695/12384 [9:57:42<16:16:10, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 0: 38%|███▊ | 4696/12384 [9:57:42<16:15:28, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 0: 38%|███▊ | 4696/12384 [9:57:50<16:15:28, 7.61s/it, loss=0.0015, acc=0.9950, iter_time=7.23s]
Epoch 0: 38%|███▊ | 4697/12384 [9:57:50<16:15:10, 7.61s/it, loss=0.0015, acc=0.9950, iter_time=7.23s]
Epoch 0: 38%|███▊ | 4697/12384 [9:57:57<16:15:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 0: 38%|███▊ | 4698/12384 [9:57:57<16:14:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 0: 38%|███▊ | 4698/12384 [9:58:05<16:14:38, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.81s]
Epoch 0: 38%|███▊ | 4699/12384 [9:58:05<16:14:51, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.81s]
Epoch 0: 38%|███▊ | 4699/12384 [9:58:13<16:14:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 38%|███▊ | 4700/12384 [9:58:13<16:14:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 38%|███▊ | 4700/12384 [9:58:20<16:14:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 38%|███▊ | 4701/12384 [9:58:20<16:15:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 38%|███▊ | 4701/12384 [9:58:28<16:15:45, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 38%|███▊ | 4702/12384 [9:58:28<16:17:39, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 38%|███▊ | 4702/12384 [9:58:36<16:17:39, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.06s]
Epoch 0: 38%|███▊ | 4703/12384 [9:58:36<16:17:01, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.06s]
Epoch 0: 38%|███▊ | 4703/12384 [9:58:43<16:17:01, 7.63s/it, loss=0.0022, acc=0.9974, iter_time=8.63s]
Epoch 0: 38%|███▊ | 4704/12384 [9:58:43<16:18:19, 7.64s/it, loss=0.0022, acc=0.9974, iter_time=8.63s]
Epoch 0: 38%|███▊ | 4704/12384 [9:58:51<16:18:19, 7.64s/it, loss=0.0001, acc=0.9994, iter_time=4.94s]
Epoch 0: 38%|███▊ | 4705/12384 [9:58:51<16:17:44, 7.64s/it, loss=0.0001, acc=0.9994, iter_time=4.94s]
Epoch 0: 38%|███▊ | 4705/12384 [9:58:59<16:17:44, 7.64s/it, loss=0.0005, acc=0.9973, iter_time=10.26s]
Epoch 0: 38%|███▊ | 4706/12384 [9:58:59<16:26:51, 7.71s/it, loss=0.0005, acc=0.9973, iter_time=10.26s]
Epoch 0: 38%|███▊ | 4706/12384 [9:59:06<16:26:51, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 0: 38%|███▊ | 4707/12384 [9:59:06<16:23:13, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 0: 38%|███▊ | 4707/12384 [9:59:14<16:23:13, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 38%|███▊ | 4708/12384 [9:59:14<16:20:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 38%|███▊ | 4708/12384 [9:59:22<16:20:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 0: 38%|███▊ | 4709/12384 [9:59:22<16:17:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 0: 38%|███▊ | 4709/12384 [9:59:29<16:17:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 0: 38%|███▊ | 4710/12384 [9:59:29<16:15:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 0: 38%|███▊ | 4710/12384 [9:59:37<16:15:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 38%|███▊ | 4711/12384 [9:59:37<16:14:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 38%|███▊ | 4711/12384 [9:59:45<16:14:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 38%|███▊ | 4712/12384 [9:59:45<16:16:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 38%|███▊ | 4712/12384 [9:59:52<16:16:13, 7.63s/it, loss=0.0052, acc=0.9958, iter_time=6.33s]
Epoch 0: 38%|███▊ | 4713/12384 [9:59:52<16:15:10, 7.63s/it, loss=0.0052, acc=0.9958, iter_time=6.33s]
Epoch 0: 38%|███▊ | 4713/12384 [10:00:00<16:15:10, 7.63s/it, loss=0.0007, acc=0.9989, iter_time=7.42s]
Epoch 0: 38%|███▊ | 4714/12384 [10:00:00<16:25:35, 7.71s/it, loss=0.0007, acc=0.9989, iter_time=7.42s]
Epoch 0: 38%|███▊ | 4714/12384 [10:00:08<16:25:35, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 38%|███▊ | 4715/12384 [10:00:08<16:20:33, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 38%|███▊ | 4715/12384 [10:00:15<16:20:33, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.55s]
Epoch 0: 38%|███▊ | 4716/12384 [10:00:15<16:17:19, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.55s]
Epoch 0: 38%|███▊ | 4716/12384 [10:00:23<16:17:19, 7.65s/it, loss=0.0006, acc=0.9971, iter_time=9.06s]
Epoch 0: 38%|███▊ | 4717/12384 [10:00:23<16:15:28, 7.63s/it, loss=0.0006, acc=0.9971, iter_time=9.06s]
Epoch 0: 38%|███▊ | 4717/12384 [10:00:30<16:15:28, 7.63s/it, loss=0.0002, acc=0.9998, iter_time=7.62s]
Epoch 0: 38%|███▊ | 4718/12384 [10:00:30<16:13:55, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=7.62s]
Epoch 0: 38%|███▊ | 4718/12384 [10:00:38<16:13:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 38%|███▊ | 4719/12384 [10:00:38<16:13:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 38%|███▊ | 4719/12384 [10:00:46<16:13:31, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.53s]
Epoch 0: 38%|███▊ | 4720/12384 [10:00:46<16:12:12, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.53s]
Epoch 0: 38%|███▊ | 4720/12384 [10:00:53<16:12:12, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 38%|███▊ | 4721/12384 [10:00:53<16:12:32, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 38%|███▊ | 4721/12384 [10:01:01<16:12:32, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.70s]
Epoch 0: 38%|███▊ | 4722/12384 [10:01:01<16:12:19, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.70s]
Epoch 0: 38%|███▊ | 4722/12384 [10:01:08<16:12:19, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=8.54s]
Epoch 0: 38%|███▊ | 4723/12384 [10:01:08<16:11:56, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=8.54s]
Epoch 0: 38%|███▊ | 4723/12384 [10:01:16<16:11:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 38%|███▊ | 4724/12384 [10:01:16<16:12:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 38%|███▊ | 4724/12384 [10:01:24<16:12:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 38%|███▊ | 4725/12384 [10:01:24<16:12:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 38%|███▊ | 4725/12384 [10:01:31<16:12:14, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.61s]
Epoch 0: 38%|███▊ | 4726/12384 [10:01:31<16:12:22, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.61s]
Epoch 0: 38%|███▊ | 4726/12384 [10:01:39<16:12:22, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 38%|███▊ | 4727/12384 [10:01:39<16:11:00, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 38%|███▊ | 4727/12384 [10:01:47<16:11:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 38%|███▊ | 4728/12384 [10:01:47<16:10:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 38%|███▊ | 4728/12384 [10:01:54<16:10:46, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=4.91s]
Epoch 0: 38%|███▊ | 4729/12384 [10:01:54<16:10:23, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=4.91s]
Epoch 0: 38%|███▊ | 4729/12384 [10:02:02<16:10:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 0: 38%|███▊ | 4730/12384 [10:02:02<16:09:44, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 0: 38%|███▊ | 4730/12384 [10:02:09<16:09:44, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 38%|███▊ | 4731/12384 [10:02:09<16:13:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 38%|███▊ | 4731/12384 [10:02:17<16:13:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 0: 38%|███▊ | 4732/12384 [10:02:17<16:22:34, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 0: 38%|███▊ | 4732/12384 [10:02:25<16:22:34, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 38%|███▊ | 4733/12384 [10:02:25<16:21:21, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 38%|███▊ | 4733/12384 [10:02:33<16:21:21, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 38%|███▊ | 4734/12384 [10:02:33<16:18:22, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 38%|███▊ | 4734/12384 [10:02:40<16:18:22, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.52s]
Epoch 0: 38%|███▊ | 4735/12384 [10:02:40<16:15:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.52s]
Epoch 0: 38%|███▊ | 4735/12384 [10:02:48<16:15:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.79s]
Epoch 0: 38%|███▊ | 4736/12384 [10:02:48<16:13:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.79s]
Epoch 0: 38%|███▊ | 4736/12384 [10:02:55<16:13:43, 7.64s/it, loss=0.0004, acc=0.9988, iter_time=6.09s]
Epoch 0: 38%|███▊ | 4737/12384 [10:02:55<16:16:00, 7.66s/it, loss=0.0004, acc=0.9988, iter_time=6.09s]
Epoch 0: 38%|███▊ | 4737/12384 [10:03:03<16:16:00, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=9.14s]
Epoch 0: 38%|███▊ | 4738/12384 [10:03:03<16:14:04, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=9.14s]
Epoch 0: 38%|███▊ | 4738/12384 [10:03:11<16:14:04, 7.64s/it, loss=0.0000, acc=0.9999, iter_time=7.63s]
Epoch 0: 38%|███▊ | 4739/12384 [10:03:11<16:13:01, 7.64s/it, loss=0.0000, acc=0.9999, iter_time=7.63s]
Epoch 0: 38%|███▊ | 4739/12384 [10:03:18<16:13:01, 7.64s/it, loss=0.0006, acc=0.9983, iter_time=7.61s]
Epoch 0: 38%|███▊ | 4740/12384 [10:03:18<16:11:54, 7.63s/it, loss=0.0006, acc=0.9983, iter_time=7.61s]
Epoch 0: 38%|███▊ | 4740/12384 [10:03:26<16:11:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 38%|███▊ | 4741/12384 [10:03:26<16:22:59, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 38%|███▊ | 4741/12384 [10:03:34<16:22:59, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 0: 38%|███▊ | 4742/12384 [10:03:34<16:18:14, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 0: 38%|███▊ | 4742/12384 [10:03:41<16:18:14, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=8.81s]
Epoch 0: 38%|███▊ | 4743/12384 [10:03:41<16:14:02, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.81s]
Epoch 0: 38%|███▊ | 4743/12384 [10:03:49<16:14:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 0: 38%|███▊ | 4744/12384 [10:03:49<16:13:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 0: 38%|███▊ | 4744/12384 [10:03:57<16:13:00, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 38%|███▊ | 4745/12384 [10:03:57<16:11:27, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 38%|███▊ | 4745/12384 [10:04:04<16:11:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 0: 38%|███▊ | 4746/12384 [10:04:04<16:10:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 0: 38%|███▊ | 4746/12384 [10:04:12<16:10:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 0: 38%|███▊ | 4747/12384 [10:04:12<16:10:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 0: 38%|███▊ | 4747/12384 [10:04:19<16:10:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 0: 38%|███▊ | 4748/12384 [10:04:19<16:10:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 0: 38%|███▊ | 4748/12384 [10:04:27<16:10:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 0: 38%|███▊ | 4749/12384 [10:04:27<16:09:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 0: 38%|███▊ | 4749/12384 [10:04:35<16:09:56, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=8.03s]
Epoch 0: 38%|███▊ | 4750/12384 [10:04:35<16:09:24, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=8.03s]
Epoch 0: 38%|███▊ | 4750/12384 [10:04:42<16:09:24, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=6.91s]
Epoch 0: 38%|███▊ | 4751/12384 [10:04:42<16:09:44, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=6.91s]
Epoch 0: 38%|███▊ | 4751/12384 [10:04:50<16:09:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 0: 38%|███▊ | 4752/12384 [10:04:50<16:08:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 0: 38%|███▊ | 4752/12384 [10:04:58<16:08:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 0: 38%|███▊ | 4753/12384 [10:04:58<16:08:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 0: 38%|███▊ | 4753/12384 [10:05:05<16:08:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 0: 38%|███▊ | 4754/12384 [10:05:05<16:08:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 0: 38%|███▊ | 4754/12384 [10:05:13<16:08:33, 7.62s/it, loss=0.0006, acc=0.9978, iter_time=7.61s]
Epoch 0: 38%|███▊ | 4755/12384 [10:05:13<16:08:18, 7.62s/it, loss=0.0006, acc=0.9978, iter_time=7.61s]
Epoch 0: 38%|███▊ | 4755/12384 [10:05:20<16:08:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 38%|███▊ | 4756/12384 [10:05:20<16:08:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 38%|███▊ | 4756/12384 [10:05:28<16:08:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 0: 38%|███▊ | 4757/12384 [10:05:28<16:07:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 0: 38%|███▊ | 4757/12384 [10:05:36<16:07:55, 7.61s/it, loss=0.0010, acc=0.9968, iter_time=5.23s]
Epoch 0: 38%|███▊ | 4758/12384 [10:05:36<16:07:59, 7.62s/it, loss=0.0010, acc=0.9968, iter_time=5.23s]
Epoch 0: 38%|███▊ | 4758/12384 [10:05:43<16:07:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 0: 38%|███▊ | 4759/12384 [10:05:43<16:07:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 0: 38%|███▊ | 4759/12384 [10:05:51<16:07:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 38%|███▊ | 4760/12384 [10:05:51<16:06:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 38%|███▊ | 4760/12384 [10:05:58<16:06:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 38%|███▊ | 4761/12384 [10:05:58<16:06:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 38%|███▊ | 4761/12384 [10:06:06<16:06:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 0: 38%|███▊ | 4762/12384 [10:06:06<16:06:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 0: 38%|███▊ | 4762/12384 [10:06:14<16:06:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.62s]
Epoch 0: 38%|███▊ | 4763/12384 [10:06:14<16:06:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.62s]
Epoch 0: 38%|███▊ | 4763/12384 [10:06:21<16:06:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.22s]
Epoch 0: 38%|███▊ | 4764/12384 [10:06:21<16:06:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.22s]
Epoch 0: 38%|███▊ | 4764/12384 [10:06:29<16:06:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 38%|███▊ | 4765/12384 [10:06:29<16:07:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 38%|███▊ | 4765/12384 [10:06:37<16:07:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 0: 38%|███▊ | 4766/12384 [10:06:37<16:07:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 0: 38%|███▊ | 4766/12384 [10:06:44<16:07:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.97s]
Epoch 0: 38%|███▊ | 4767/12384 [10:06:44<16:18:25, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.97s]
Epoch 0: 38%|███▊ | 4767/12384 [10:06:52<16:18:25, 7.71s/it, loss=0.0003, acc=0.9994, iter_time=8.27s]
Epoch 0: 39%|███▊ | 4768/12384 [10:06:52<16:17:40, 7.70s/it, loss=0.0003, acc=0.9994, iter_time=8.27s]
Epoch 0: 39%|███▊ | 4768/12384 [10:07:00<16:17:40, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.30s]
Epoch 0: 39%|███▊ | 4769/12384 [10:07:00<16:15:28, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.30s]
Epoch 0: 39%|███▊ | 4769/12384 [10:07:07<16:15:28, 7.69s/it, loss=0.0007, acc=0.9995, iter_time=3.84s]
Epoch 0: 39%|███▊ | 4770/12384 [10:07:07<16:12:00, 7.66s/it, loss=0.0007, acc=0.9995, iter_time=3.84s]
Epoch 0: 39%|███▊ | 4770/12384 [10:07:15<16:12:00, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 0: 39%|███▊ | 4771/12384 [10:07:15<16:10:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 0: 39%|███▊ | 4771/12384 [10:07:23<16:10:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 0: 39%|███▊ | 4772/12384 [10:07:23<16:08:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 0: 39%|███▊ | 4772/12384 [10:07:30<16:08:40, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 39%|███▊ | 4773/12384 [10:07:30<16:10:42, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 39%|███▊ | 4773/12384 [10:07:38<16:10:42, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.72s]
Epoch 0: 39%|███▊ | 4774/12384 [10:07:38<16:08:53, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.72s]
Epoch 0: 39%|███▊ | 4774/12384 [10:07:46<16:08:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 39%|███▊ | 4775/12384 [10:07:46<16:07:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 39%|███▊ | 4775/12384 [10:07:53<16:07:14, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.98s]
Epoch 0: 39%|███▊ | 4776/12384 [10:07:53<16:07:38, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.98s]
Epoch 0: 39%|███▊ | 4776/12384 [10:08:01<16:07:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 39%|███▊ | 4777/12384 [10:08:01<16:06:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 39%|███▊ | 4777/12384 [10:08:08<16:06:59, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.62s]
Epoch 0: 39%|███▊ | 4778/12384 [10:08:08<16:09:18, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=7.62s]
Epoch 0: 39%|███▊ | 4778/12384 [10:08:16<16:09:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 39%|███▊ | 4779/12384 [10:08:16<16:08:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 39%|███▊ | 4779/12384 [10:08:24<16:08:31, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.70s]
Epoch 0: 39%|███▊ | 4780/12384 [10:08:24<16:09:14, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=6.70s]
Epoch 0: 39%|███▊ | 4780/12384 [10:08:31<16:09:14, 7.65s/it, loss=0.0006, acc=0.9982, iter_time=7.64s]
Epoch 0: 39%|███▊ | 4781/12384 [10:08:31<16:06:16, 7.63s/it, loss=0.0006, acc=0.9982, iter_time=7.64s]
Epoch 0: 39%|███▊ | 4781/12384 [10:08:39<16:06:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 39%|███▊ | 4782/12384 [10:08:39<16:06:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 39%|███▊ | 4782/12384 [10:08:47<16:06:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 0: 39%|███▊ | 4783/12384 [10:08:47<16:06:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 0: 39%|███▊ | 4783/12384 [10:08:54<16:06:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.39s]
Epoch 0: 39%|███▊ | 4784/12384 [10:08:54<16:05:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.39s]
Epoch 0: 39%|███▊ | 4784/12384 [10:09:02<16:05:37, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.02s]
Epoch 0: 39%|███▊ | 4785/12384 [10:09:02<16:04:37, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.02s]
Epoch 0: 39%|███▊ | 4785/12384 [10:09:09<16:04:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 39%|███▊ | 4786/12384 [10:09:09<16:04:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 39%|███▊ | 4786/12384 [10:09:17<16:04:07, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=8.26s]
Epoch 0: 39%|███▊ | 4787/12384 [10:09:17<16:03:57, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=8.26s]
Epoch 0: 39%|███▊ | 4787/12384 [10:09:25<16:03:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 39%|███▊ | 4788/12384 [10:09:25<16:03:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 39%|███▊ | 4788/12384 [10:09:32<16:03:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.06s]
Epoch 0: 39%|███▊ | 4789/12384 [10:09:32<16:03:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.06s]
Epoch 0: 39%|███▊ | 4789/12384 [10:09:40<16:03:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.95s]
Epoch 0: 39%|███▊ | 4790/12384 [10:09:40<16:01:53, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.95s]
Epoch 0: 39%|███▊ | 4790/12384 [10:09:47<16:01:53, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.65s]
Epoch 0: 39%|███▊ | 4791/12384 [10:09:47<16:02:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.65s]
Epoch 0: 39%|███▊ | 4791/12384 [10:09:55<16:02:32, 7.61s/it, loss=0.0001, acc=0.9997, iter_time=10.71s]
Epoch 0: 39%|███▊ | 4792/12384 [10:09:55<16:03:05, 7.61s/it, loss=0.0001, acc=0.9997, iter_time=10.71s]
Epoch 0: 39%|███▊ | 4792/12384 [10:10:03<16:03:05, 7.61s/it, loss=0.0036, acc=0.9864, iter_time=7.69s]
Epoch 0: 39%|███▊ | 4793/12384 [10:10:03<16:17:49, 7.73s/it, loss=0.0036, acc=0.9864, iter_time=7.69s]
Epoch 0: 39%|███▊ | 4793/12384 [10:10:11<16:17:49, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 0: 39%|███▊ | 4794/12384 [10:10:11<16:13:18, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 0: 39%|███▊ | 4794/12384 [10:10:18<16:13:18, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 0: 39%|███▊ | 4795/12384 [10:10:18<16:10:29, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 0: 39%|███▊ | 4795/12384 [10:10:26<16:10:29, 7.67s/it, loss=0.0003, acc=1.0000, iter_time=9.68s]
Epoch 0: 39%|███▊ | 4796/12384 [10:10:26<16:08:14, 7.66s/it, loss=0.0003, acc=1.0000, iter_time=9.68s]
Epoch 0: 39%|███▊ | 4796/12384 [10:10:34<16:08:14, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 39%|███▊ | 4797/12384 [10:10:34<16:06:14, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 39%|███▊ | 4797/12384 [10:10:41<16:06:14, 7.64s/it, loss=0.0007, acc=0.9983, iter_time=5.35s]
Epoch 0: 39%|███▊ | 4798/12384 [10:10:41<16:04:45, 7.63s/it, loss=0.0007, acc=0.9983, iter_time=5.35s]
Epoch 0: 39%|███▊ | 4798/12384 [10:10:49<16:04:45, 7.63s/it, loss=0.0010, acc=0.9974, iter_time=9.83s]
Epoch 0: 39%|███▉ | 4799/12384 [10:10:49<16:03:26, 7.62s/it, loss=0.0010, acc=0.9974, iter_time=9.83s]
Epoch 0: 39%|███▉ | 4799/12384 [10:10:56<16:03:26, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.04s]
Epoch 0: 39%|███▉ | 4800/12384 [10:10:56<16:03:09, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.04s]
Epoch 0: 39%|███▉ | 4800/12384 [10:11:04<16:03:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 39%|███▉ | 4801/12384 [10:11:04<16:06:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 39%|███▉ | 4801/12384 [10:11:12<16:06:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 39%|███▉ | 4802/12384 [10:11:12<16:05:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 39%|███▉ | 4802/12384 [10:11:19<16:05:25, 7.64s/it, loss=0.0018, acc=0.9960, iter_time=7.62s]
Epoch 0: 39%|███▉ | 4803/12384 [10:11:19<16:03:55, 7.63s/it, loss=0.0018, acc=0.9960, iter_time=7.62s]
Epoch 0: 39%|███▉ | 4803/12384 [10:11:27<16:03:55, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 39%|███▉ | 4804/12384 [10:11:27<16:02:44, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 39%|███▉ | 4804/12384 [10:11:35<16:02:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 39%|███▉ | 4805/12384 [10:11:35<16:02:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 39%|███▉ | 4805/12384 [10:11:42<16:02:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 39%|███▉ | 4806/12384 [10:11:42<16:02:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 39%|███▉ | 4806/12384 [10:11:50<16:02:22, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.68s]
Epoch 0: 39%|███▉ | 4807/12384 [10:11:50<16:04:04, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.68s]
Epoch 0: 39%|███▉ | 4807/12384 [10:11:57<16:04:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 39%|███▉ | 4808/12384 [10:11:57<16:03:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 39%|███▉ | 4808/12384 [10:12:05<16:03:59, 7.63s/it, loss=0.0003, acc=0.9999, iter_time=7.25s]
Epoch 0: 39%|███▉ | 4809/12384 [10:12:05<16:03:06, 7.63s/it, loss=0.0003, acc=0.9999, iter_time=7.25s]
Epoch 0: 39%|███▉ | 4809/12384 [10:12:13<16:03:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.24s]
Epoch 0: 39%|███▉ | 4810/12384 [10:12:13<16:01:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.24s]
Epoch 0: 39%|███▉ | 4810/12384 [10:12:21<16:01:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.27s]
Epoch 0: 39%|███▉ | 4811/12384 [10:12:21<16:12:48, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=11.27s]
Epoch 0: 39%|███▉ | 4811/12384 [10:12:28<16:12:48, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 39%|███▉ | 4812/12384 [10:12:28<16:08:39, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 39%|███▉ | 4812/12384 [10:12:36<16:08:39, 7.68s/it, loss=0.0001, acc=0.9994, iter_time=4.29s]
Epoch 0: 39%|███▉ | 4813/12384 [10:12:36<16:05:06, 7.65s/it, loss=0.0001, acc=0.9994, iter_time=4.29s]
Epoch 0: 39%|███▉ | 4813/12384 [10:12:43<16:05:06, 7.65s/it, loss=0.0004, acc=0.9974, iter_time=8.89s]
Epoch 0: 39%|███▉ | 4814/12384 [10:12:43<16:03:35, 7.64s/it, loss=0.0004, acc=0.9974, iter_time=8.89s]
Epoch 0: 39%|███▉ | 4814/12384 [10:12:51<16:03:35, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=9.61s]
Epoch 0: 39%|███▉ | 4815/12384 [10:12:51<16:02:09, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.61s]
Epoch 0: 39%|███▉ | 4815/12384 [10:12:59<16:02:09, 7.63s/it, loss=0.0017, acc=0.9955, iter_time=7.56s]
Epoch 0: 39%|███▉ | 4816/12384 [10:12:59<16:01:07, 7.62s/it, loss=0.0017, acc=0.9955, iter_time=7.56s]
Epoch 0: 39%|███▉ | 4816/12384 [10:13:06<16:01:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 39%|███▉ | 4817/12384 [10:13:06<16:01:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 39%|███▉ | 4817/12384 [10:13:14<16:01:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 39%|███▉ | 4818/12384 [10:13:14<16:01:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 39%|███▉ | 4818/12384 [10:13:22<16:01:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 0: 39%|███▉ | 4819/12384 [10:13:22<16:15:59, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 0: 39%|███▉ | 4819/12384 [10:13:29<16:15:59, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=6.90s]
Epoch 0: 39%|███▉ | 4820/12384 [10:13:29<16:11:23, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.90s]
Epoch 0: 39%|███▉ | 4820/12384 [10:13:37<16:11:23, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 0: 39%|███▉ | 4821/12384 [10:13:37<16:07:20, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 0: 39%|███▉ | 4821/12384 [10:13:45<16:07:20, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 39%|███▉ | 4822/12384 [10:13:45<16:04:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 39%|███▉ | 4822/12384 [10:13:52<16:04:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=3.99s]
Epoch 0: 39%|███▉ | 4823/12384 [10:13:52<16:02:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.99s]
Epoch 0: 39%|███▉ | 4823/12384 [10:14:00<16:02:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.19s]
Epoch 0: 39%|███▉ | 4824/12384 [10:14:00<16:02:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.19s]
Epoch 0: 39%|███▉ | 4824/12384 [10:14:07<16:02:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 0: 39%|███▉ | 4825/12384 [10:14:07<16:00:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 0: 39%|███▉ | 4825/12384 [10:14:15<16:00:08, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.18s]
Epoch 0: 39%|███▉ | 4826/12384 [10:14:15<15:58:50, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.18s]
Epoch 0: 39%|███▉ | 4826/12384 [10:14:23<15:58:50, 7.61s/it, loss=0.0005, acc=0.9989, iter_time=7.59s]
Epoch 0: 39%|███▉ | 4827/12384 [10:14:23<15:58:41, 7.61s/it, loss=0.0005, acc=0.9989, iter_time=7.59s]
Epoch 0: 39%|███▉ | 4827/12384 [10:14:30<15:58:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 39%|███▉ | 4828/12384 [10:14:30<16:01:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 39%|███▉ | 4828/12384 [10:14:38<16:01:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 39%|███▉ | 4829/12384 [10:14:38<15:59:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 39%|███▉ | 4829/12384 [10:14:46<15:59:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 39%|███▉ | 4830/12384 [10:14:46<15:58:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 39%|███▉ | 4830/12384 [10:14:53<15:58:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.03s]
Epoch 0: 39%|███▉ | 4831/12384 [10:14:53<15:57:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.03s]
Epoch 0: 39%|███▉ | 4831/12384 [10:15:01<15:57:57, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=11.57s]
Epoch 0: 39%|███▉ | 4832/12384 [10:15:01<15:57:34, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=11.57s]
Epoch 0: 39%|███▉ | 4832/12384 [10:15:08<15:57:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 39%|███▉ | 4833/12384 [10:15:08<15:57:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 39%|███▉ | 4833/12384 [10:15:16<15:57:03, 7.60s/it, loss=0.0032, acc=0.9976, iter_time=6.66s]
Epoch 0: 39%|███▉ | 4834/12384 [10:15:16<15:57:32, 7.61s/it, loss=0.0032, acc=0.9976, iter_time=6.66s]
Epoch 0: 39%|███▉ | 4834/12384 [10:15:24<15:57:32, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.56s]
Epoch 0: 39%|███▉ | 4835/12384 [10:15:24<15:58:09, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.56s]
Epoch 0: 39%|███▉ | 4835/12384 [10:15:31<15:58:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 0: 39%|███▉ | 4836/12384 [10:15:31<15:56:35, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 0: 39%|███▉ | 4836/12384 [10:15:39<15:56:35, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.30s]
Epoch 0: 39%|███▉ | 4837/12384 [10:15:39<15:55:43, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.30s]
Epoch 0: 39%|███▉ | 4837/12384 [10:15:46<15:55:43, 7.60s/it, loss=0.0004, acc=0.9991, iter_time=9.66s]
Epoch 0: 39%|███▉ | 4838/12384 [10:15:46<15:56:21, 7.60s/it, loss=0.0004, acc=0.9991, iter_time=9.66s]
Epoch 0: 39%|███▉ | 4838/12384 [10:15:54<15:56:21, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 39%|███▉ | 4839/12384 [10:15:54<15:56:11, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 39%|███▉ | 4839/12384 [10:16:02<15:56:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 39%|███▉ | 4840/12384 [10:16:02<15:57:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 39%|███▉ | 4840/12384 [10:16:09<15:57:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 39%|███▉ | 4841/12384 [10:16:09<15:57:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 39%|███▉ | 4841/12384 [10:16:17<15:57:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 0: 39%|███▉ | 4842/12384 [10:16:17<15:56:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 0: 39%|███▉ | 4842/12384 [10:16:24<15:56:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.95s]
Epoch 0: 39%|███▉ | 4843/12384 [10:16:24<15:56:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.95s]
Epoch 0: 39%|███▉ | 4843/12384 [10:16:32<15:56:09, 7.61s/it, loss=0.0004, acc=0.9994, iter_time=7.59s]
Epoch 0: 39%|███▉ | 4844/12384 [10:16:32<15:56:28, 7.61s/it, loss=0.0004, acc=0.9994, iter_time=7.59s]
Epoch 0: 39%|███▉ | 4844/12384 [10:16:40<15:56:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 0: 39%|███▉ | 4845/12384 [10:16:40<16:07:06, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 0: 39%|███▉ | 4845/12384 [10:16:48<16:07:06, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 0: 39%|███▉ | 4846/12384 [10:16:48<16:03:50, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 0: 39%|███▉ | 4846/12384 [10:16:55<16:03:50, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=6.14s]
Epoch 0: 39%|███▉ | 4847/12384 [10:16:55<16:00:25, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=6.14s]
Epoch 0: 39%|███▉ | 4847/12384 [10:17:03<16:00:25, 7.65s/it, loss=0.0020, acc=1.0000, iter_time=9.45s]
Epoch 0: 39%|███▉ | 4848/12384 [10:17:03<15:58:48, 7.63s/it, loss=0.0020, acc=1.0000, iter_time=9.45s]
Epoch 0: 39%|███▉ | 4848/12384 [10:17:10<15:58:48, 7.63s/it, loss=0.0002, acc=0.9981, iter_time=4.35s]
Epoch 0: 39%|███▉ | 4849/12384 [10:17:10<15:57:48, 7.63s/it, loss=0.0002, acc=0.9981, iter_time=4.35s]
Epoch 0: 39%|███▉ | 4849/12384 [10:17:18<15:57:48, 7.63s/it, loss=0.0004, acc=0.9980, iter_time=10.88s]
Epoch 0: 39%|███▉ | 4850/12384 [10:17:18<15:56:45, 7.62s/it, loss=0.0004, acc=0.9980, iter_time=10.88s]
Epoch 0: 39%|███▉ | 4850/12384 [10:17:26<15:56:45, 7.62s/it, loss=0.0006, acc=0.9984, iter_time=4.14s]
Epoch 0: 39%|███▉ | 4851/12384 [10:17:26<15:57:09, 7.62s/it, loss=0.0006, acc=0.9984, iter_time=4.14s]
Epoch 0: 39%|███▉ | 4851/12384 [10:17:33<15:57:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.68s]
Epoch 0: 39%|███▉ | 4852/12384 [10:17:33<15:56:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.68s]
Epoch 0: 39%|███▉ | 4852/12384 [10:17:41<15:56:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 0: 39%|███▉ | 4853/12384 [10:17:41<15:55:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 0: 39%|███▉ | 4853/12384 [10:17:48<15:55:48, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.75s]
Epoch 0: 39%|███▉ | 4854/12384 [10:17:48<15:55:50, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.75s]
Epoch 0: 39%|███▉ | 4854/12384 [10:17:56<15:55:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 39%|███▉ | 4855/12384 [10:17:56<15:56:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 39%|███▉ | 4855/12384 [10:18:04<15:56:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.76s]
Epoch 0: 39%|███▉ | 4856/12384 [10:18:04<15:54:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.76s]
Epoch 0: 39%|███▉ | 4856/12384 [10:18:11<15:54:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.42s]
Epoch 0: 39%|███▉ | 4857/12384 [10:18:11<15:53:59, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.42s]
Epoch 0: 39%|███▉ | 4857/12384 [10:18:19<15:53:59, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 39%|███▉ | 4858/12384 [10:18:19<15:53:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 39%|███▉ | 4858/12384 [10:18:26<15:53:22, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=4.75s]
Epoch 0: 39%|███▉ | 4859/12384 [10:18:26<15:53:58, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.75s]
Epoch 0: 39%|███▉ | 4859/12384 [10:18:34<15:53:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.61s]
Epoch 0: 39%|███▉ | 4860/12384 [10:18:34<15:53:36, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.61s]
Epoch 0: 39%|███▉ | 4860/12384 [10:18:42<15:53:36, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 0: 39%|███▉ | 4861/12384 [10:18:42<15:53:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 0: 39%|███▉ | 4861/12384 [10:18:49<15:53:56, 7.61s/it, loss=0.0006, acc=0.9985, iter_time=9.92s]
Epoch 0: 39%|███▉ | 4862/12384 [10:18:49<15:54:16, 7.61s/it, loss=0.0006, acc=0.9985, iter_time=9.92s]
Epoch 0: 39%|███▉ | 4862/12384 [10:18:57<15:54:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 39%|███▉ | 4863/12384 [10:18:57<16:04:33, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 39%|███▉ | 4863/12384 [10:19:05<16:04:33, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 39%|███▉ | 4864/12384 [10:19:05<16:02:10, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 39%|███▉ | 4864/12384 [10:19:12<16:02:10, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 39%|███▉ | 4865/12384 [10:19:12<15:59:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 39%|███▉ | 4865/12384 [10:19:20<15:59:06, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 39%|███▉ | 4866/12384 [10:19:20<15:57:14, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 39%|███▉ | 4866/12384 [10:19:28<15:57:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 39%|███▉ | 4867/12384 [10:19:28<15:55:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 39%|███▉ | 4867/12384 [10:19:35<15:55:47, 7.63s/it, loss=0.0010, acc=0.9967, iter_time=7.60s]
Epoch 0: 39%|███▉ | 4868/12384 [10:19:35<15:56:59, 7.64s/it, loss=0.0010, acc=0.9967, iter_time=7.60s]
Epoch 0: 39%|███▉ | 4868/12384 [10:19:43<15:56:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 39%|███▉ | 4869/12384 [10:19:43<15:54:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 39%|███▉ | 4869/12384 [10:19:51<15:54:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 0: 39%|███▉ | 4870/12384 [10:19:51<15:54:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 0: 39%|███▉ | 4870/12384 [10:19:58<15:54:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 0: 39%|███▉ | 4871/12384 [10:19:58<15:52:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 0: 39%|███▉ | 4871/12384 [10:20:06<15:52:53, 7.61s/it, loss=0.0002, acc=0.9987, iter_time=8.06s]
Epoch 0: 39%|███▉ | 4872/12384 [10:20:06<16:06:15, 7.72s/it, loss=0.0002, acc=0.9987, iter_time=8.06s]
Epoch 0: 39%|███▉ | 4872/12384 [10:20:14<16:06:15, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 0: 39%|███▉ | 4873/12384 [10:20:14<16:01:49, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 0: 39%|███▉ | 4873/12384 [10:20:21<16:01:49, 7.68s/it, loss=0.0010, acc=0.9940, iter_time=5.06s]
Epoch 0: 39%|███▉ | 4874/12384 [10:20:21<15:58:23, 7.66s/it, loss=0.0010, acc=0.9940, iter_time=5.06s]
Epoch 0: 39%|███▉ | 4874/12384 [10:20:29<15:58:23, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=10.14s]
Epoch 0: 39%|███▉ | 4875/12384 [10:20:29<15:55:52, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=10.14s]
Epoch 0: 39%|███▉ | 4875/12384 [10:20:36<15:55:52, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 39%|███▉ | 4876/12384 [10:20:36<15:54:09, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 39%|███▉ | 4876/12384 [10:20:44<15:54:09, 7.63s/it, loss=0.0017, acc=0.9964, iter_time=5.87s]
Epoch 0: 39%|███▉ | 4877/12384 [10:20:44<15:51:58, 7.61s/it, loss=0.0017, acc=0.9964, iter_time=5.87s]
Epoch 0: 39%|███▉ | 4877/12384 [10:20:52<15:51:58, 7.61s/it, loss=0.0000, acc=0.9999, iter_time=9.30s]
Epoch 0: 39%|███▉ | 4878/12384 [10:20:52<15:51:35, 7.61s/it, loss=0.0000, acc=0.9999, iter_time=9.30s]
Epoch 0: 39%|███▉ | 4878/12384 [10:20:59<15:51:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.48s]
Epoch 0: 39%|███▉ | 4879/12384 [10:20:59<15:51:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.48s]
Epoch 0: 39%|███▉ | 4879/12384 [10:21:07<15:51:17, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.09s]
Epoch 0: 39%|███▉ | 4880/12384 [10:21:07<15:50:22, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=10.09s]
Epoch 0: 39%|███▉ | 4880/12384 [10:21:14<15:50:22, 7.60s/it, loss=0.0002, acc=0.9997, iter_time=7.21s]
Epoch 0: 39%|███▉ | 4881/12384 [10:21:14<15:51:12, 7.61s/it, loss=0.0002, acc=0.9997, iter_time=7.21s]
Epoch 0: 39%|███▉ | 4881/12384 [10:21:22<15:51:12, 7.61s/it, loss=0.0004, acc=1.0000, iter_time=4.85s]
Epoch 0: 39%|███▉ | 4882/12384 [10:21:22<15:51:30, 7.61s/it, loss=0.0004, acc=1.0000, iter_time=4.85s]
Epoch 0: 39%|███▉ | 4882/12384 [10:21:30<15:51:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.61s]
Epoch 0: 39%|███▉ | 4883/12384 [10:21:30<15:51:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.61s]
Epoch 0: 39%|███▉ | 4883/12384 [10:21:37<15:51:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 0: 39%|███▉ | 4884/12384 [10:21:37<15:50:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 0: 39%|███▉ | 4884/12384 [10:21:45<15:50:56, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 39%|███▉ | 4885/12384 [10:21:45<15:53:42, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 39%|███▉ | 4885/12384 [10:21:53<15:53:42, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.69s]
Epoch 0: 39%|███▉ | 4886/12384 [10:21:53<15:55:43, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.69s]
Epoch 0: 39%|███▉ | 4886/12384 [10:22:00<15:55:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 39%|███▉ | 4887/12384 [10:22:00<15:54:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 39%|███▉ | 4887/12384 [10:22:08<15:54:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 0: 39%|███▉ | 4888/12384 [10:22:08<15:53:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 0: 39%|███▉ | 4888/12384 [10:22:15<15:53:37, 7.63s/it, loss=0.0008, acc=0.9979, iter_time=5.98s]
Epoch 0: 39%|███▉ | 4889/12384 [10:22:15<15:52:28, 7.62s/it, loss=0.0008, acc=0.9979, iter_time=5.98s]
Epoch 0: 39%|███▉ | 4889/12384 [10:22:23<15:52:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 0: 39%|███▉ | 4890/12384 [10:22:23<15:51:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 0: 39%|███▉ | 4890/12384 [10:22:31<15:51:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 0: 39%|███▉ | 4891/12384 [10:22:31<15:52:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 0: 39%|███▉ | 4891/12384 [10:22:38<15:52:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 40%|███▉ | 4892/12384 [10:22:38<15:51:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 40%|███▉ | 4892/12384 [10:22:46<15:51:28, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 40%|███▉ | 4893/12384 [10:22:46<15:50:36, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 40%|███▉ | 4893/12384 [10:22:54<15:50:36, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=7.65s]
Epoch 0: 40%|███▉ | 4894/12384 [10:22:54<15:52:13, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.65s]
Epoch 0: 40%|███▉ | 4894/12384 [10:23:01<15:52:13, 7.63s/it, loss=0.0008, acc=0.9972, iter_time=7.61s]
Epoch 0: 40%|███▉ | 4895/12384 [10:23:01<15:53:16, 7.64s/it, loss=0.0008, acc=0.9972, iter_time=7.61s]
Epoch 0: 40%|███▉ | 4895/12384 [10:23:09<15:53:16, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.06s]
Epoch 0: 40%|███▉ | 4896/12384 [10:23:09<15:54:56, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.06s]
Epoch 0: 40%|███▉ | 4896/12384 [10:23:17<15:54:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.42s]
Epoch 0: 40%|███▉ | 4897/12384 [10:23:17<15:53:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.42s]
Epoch 0: 40%|███▉ | 4897/12384 [10:23:25<15:53:23, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=10.50s]
Epoch 0: 40%|███▉ | 4898/12384 [10:23:25<16:04:50, 7.73s/it, loss=0.0001, acc=1.0000, iter_time=10.50s]
Epoch 0: 40%|███▉ | 4898/12384 [10:23:32<16:04:50, 7.73s/it, loss=0.0007, acc=0.9965, iter_time=6.97s]
Epoch 0: 40%|███▉ | 4899/12384 [10:23:32<15:59:16, 7.69s/it, loss=0.0007, acc=0.9965, iter_time=6.97s]
Epoch 0: 40%|███▉ | 4899/12384 [10:23:40<15:59:16, 7.69s/it, loss=0.0002, acc=0.9992, iter_time=8.94s]
Epoch 0: 40%|███▉ | 4900/12384 [10:23:40<15:56:11, 7.67s/it, loss=0.0002, acc=0.9992, iter_time=8.94s]
Epoch 0: 40%|███▉ | 4900/12384 [10:23:47<15:56:11, 7.67s/it, loss=0.0001, acc=0.9999, iter_time=7.21s]
Epoch 0: 40%|███▉ | 4901/12384 [10:23:47<15:54:40, 7.65s/it, loss=0.0001, acc=0.9999, iter_time=7.21s]
Epoch 0: 40%|███▉ | 4901/12384 [10:23:55<15:54:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 40%|███▉ | 4902/12384 [10:23:55<15:54:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 40%|███▉ | 4902/12384 [10:24:03<15:54:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 40%|███▉ | 4903/12384 [10:24:03<15:52:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 40%|███▉ | 4903/12384 [10:24:10<15:52:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 40%|███▉ | 4904/12384 [10:24:10<15:51:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 40%|███▉ | 4904/12384 [10:24:18<15:51:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 0: 40%|███▉ | 4905/12384 [10:24:18<15:54:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 0: 40%|███▉ | 4905/12384 [10:24:26<15:54:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 40%|███▉ | 4906/12384 [10:24:26<15:52:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 40%|███▉ | 4906/12384 [10:24:33<15:52:22, 7.64s/it, loss=0.0006, acc=0.9975, iter_time=7.59s]
Epoch 0: 40%|███▉ | 4907/12384 [10:24:33<15:50:02, 7.62s/it, loss=0.0006, acc=0.9975, iter_time=7.59s]
Epoch 0: 40%|███▉ | 4907/12384 [10:24:41<15:50:02, 7.62s/it, loss=0.0003, acc=0.9994, iter_time=7.60s]
Epoch 0: 40%|███▉ | 4908/12384 [10:24:41<15:49:38, 7.62s/it, loss=0.0003, acc=0.9994, iter_time=7.60s]
Epoch 0: 40%|███▉ | 4908/12384 [10:24:48<15:49:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 40%|███▉ | 4909/12384 [10:24:48<15:48:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 40%|███▉ | 4909/12384 [10:24:56<15:48:18, 7.61s/it, loss=0.0004, acc=0.9986, iter_time=4.58s]
Epoch 0: 40%|███▉ | 4910/12384 [10:24:56<15:49:38, 7.62s/it, loss=0.0004, acc=0.9986, iter_time=4.58s]
Epoch 0: 40%|███▉ | 4910/12384 [10:25:04<15:49:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.68s]
Epoch 0: 40%|███▉ | 4911/12384 [10:25:04<15:48:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.68s]
Epoch 0: 40%|███▉ | 4911/12384 [10:25:11<15:48:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 0: 40%|███▉ | 4912/12384 [10:25:11<15:48:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 0: 40%|███▉ | 4912/12384 [10:25:19<15:48:10, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 0: 40%|███▉ | 4913/12384 [10:25:19<15:51:02, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 0: 40%|███▉ | 4913/12384 [10:25:26<15:51:02, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.23s]
Epoch 0: 40%|███▉ | 4914/12384 [10:25:26<15:49:25, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.23s]
Epoch 0: 40%|███▉ | 4914/12384 [10:25:34<15:49:25, 7.63s/it, loss=0.0004, acc=0.9974, iter_time=8.44s]
Epoch 0: 40%|███▉ | 4915/12384 [10:25:34<15:48:27, 7.62s/it, loss=0.0004, acc=0.9974, iter_time=8.44s]
Epoch 0: 40%|███▉ | 4915/12384 [10:25:42<15:48:27, 7.62s/it, loss=0.0011, acc=0.9983, iter_time=8.26s]
Epoch 0: 40%|███▉ | 4916/12384 [10:25:42<15:48:13, 7.62s/it, loss=0.0011, acc=0.9983, iter_time=8.26s]
Epoch 0: 40%|███▉ | 4916/12384 [10:25:49<15:48:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 40%|███▉ | 4917/12384 [10:25:49<15:47:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 40%|███▉ | 4917/12384 [10:25:57<15:47:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 0: 40%|███▉ | 4918/12384 [10:25:57<15:46:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 0: 40%|███▉ | 4918/12384 [10:26:05<15:46:55, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=9.11s]
Epoch 0: 40%|███▉ | 4919/12384 [10:26:05<15:51:29, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=9.11s]
Epoch 0: 40%|███▉ | 4919/12384 [10:26:12<15:51:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 40%|███▉ | 4920/12384 [10:26:12<15:50:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 40%|███▉ | 4920/12384 [10:26:20<15:50:45, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 40%|███▉ | 4921/12384 [10:26:20<15:48:36, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 40%|███▉ | 4921/12384 [10:26:27<15:48:36, 7.63s/it, loss=0.0002, acc=0.9986, iter_time=6.41s]
Epoch 0: 40%|███▉ | 4922/12384 [10:26:27<15:48:20, 7.63s/it, loss=0.0002, acc=0.9986, iter_time=6.41s]
Epoch 0: 40%|███▉ | 4922/12384 [10:26:35<15:48:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 0: 40%|███▉ | 4923/12384 [10:26:35<15:47:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 0: 40%|███▉ | 4923/12384 [10:26:43<15:47:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 0: 40%|███▉ | 4924/12384 [10:26:43<15:47:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 0: 40%|███▉ | 4924/12384 [10:26:51<15:47:03, 7.62s/it, loss=0.0002, acc=0.9986, iter_time=7.67s]
Epoch 0: 40%|███▉ | 4925/12384 [10:26:51<15:57:41, 7.70s/it, loss=0.0002, acc=0.9986, iter_time=7.67s]
Epoch 0: 40%|███▉ | 4925/12384 [10:26:58<15:57:41, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 0: 40%|███▉ | 4926/12384 [10:26:58<15:53:36, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 0: 40%|███▉ | 4926/12384 [10:27:06<15:53:36, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.66s]
Epoch 0: 40%|███▉ | 4927/12384 [10:27:06<15:50:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.66s]
Epoch 0: 40%|███▉ | 4927/12384 [10:27:13<15:50:50, 7.65s/it, loss=0.0002, acc=0.9995, iter_time=7.99s]
Epoch 0: 40%|███▉ | 4928/12384 [10:27:14<15:53:52, 7.68s/it, loss=0.0002, acc=0.9995, iter_time=7.99s]
Epoch 0: 40%|███▉ | 4928/12384 [10:27:21<15:53:52, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 0: 40%|███▉ | 4929/12384 [10:27:21<15:50:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 0: 40%|███▉ | 4929/12384 [10:27:29<15:50:32, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.61s]
Epoch 0: 40%|███▉ | 4930/12384 [10:27:29<15:51:27, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.61s]
Epoch 0: 40%|███▉ | 4930/12384 [10:27:36<15:51:27, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 0: 40%|███▉ | 4931/12384 [10:27:36<15:52:41, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 0: 40%|███▉ | 4931/12384 [10:27:44<15:52:41, 7.67s/it, loss=0.0007, acc=0.9981, iter_time=7.63s]
Epoch 0: 40%|███▉ | 4932/12384 [10:27:44<15:51:01, 7.66s/it, loss=0.0007, acc=0.9981, iter_time=7.63s]
Epoch 0: 40%|███▉ | 4932/12384 [10:27:52<15:51:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 0: 40%|███▉ | 4933/12384 [10:27:52<15:49:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 0: 40%|███▉ | 4933/12384 [10:27:59<15:49:06, 7.64s/it, loss=0.0004, acc=0.9982, iter_time=10.00s]
Epoch 0: 40%|███▉ | 4934/12384 [10:27:59<15:48:00, 7.64s/it, loss=0.0004, acc=0.9982, iter_time=10.00s]
Epoch 0: 40%|███▉ | 4934/12384 [10:28:07<15:48:00, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.54s]
Epoch 0: 40%|███▉ | 4935/12384 [10:28:07<15:47:14, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.54s]
Epoch 0: 40%|███▉ | 4935/12384 [10:28:15<15:47:14, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=7.57s]
Epoch 0: 40%|███▉ | 4936/12384 [10:28:15<15:46:41, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=7.57s]
Epoch 0: 40%|███▉ | 4936/12384 [10:28:22<15:46:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 40%|███▉ | 4937/12384 [10:28:22<15:47:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 40%|███▉ | 4937/12384 [10:28:30<15:47:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 0: 40%|███▉ | 4938/12384 [10:28:30<15:46:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 0: 40%|███▉ | 4938/12384 [10:28:37<15:46:26, 7.63s/it, loss=0.0004, acc=0.9988, iter_time=8.50s]
Epoch 0: 40%|███▉ | 4939/12384 [10:28:37<15:47:05, 7.63s/it, loss=0.0004, acc=0.9988, iter_time=8.50s]
Epoch 0: 40%|███▉ | 4939/12384 [10:28:45<15:47:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 40%|███▉ | 4940/12384 [10:28:45<15:46:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 40%|███▉ | 4940/12384 [10:28:53<15:46:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 40%|███▉ | 4941/12384 [10:28:53<15:45:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 40%|███▉ | 4941/12384 [10:29:01<15:45:47, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.92s]
Epoch 0: 40%|███▉ | 4942/12384 [10:29:01<15:56:24, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.92s]
Epoch 0: 40%|███▉ | 4942/12384 [10:29:08<15:56:24, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 40%|███▉ | 4943/12384 [10:29:08<15:52:42, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 40%|███▉ | 4943/12384 [10:29:16<15:52:42, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 40%|███▉ | 4944/12384 [10:29:16<15:50:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 40%|███▉ | 4944/12384 [10:29:24<15:50:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 40%|███▉ | 4945/12384 [10:29:24<15:49:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 40%|███▉ | 4945/12384 [10:29:31<15:49:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 0: 40%|███▉ | 4946/12384 [10:29:31<15:47:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 0: 40%|███▉ | 4946/12384 [10:29:39<15:47:30, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=9.90s]
Epoch 0: 40%|███▉ | 4947/12384 [10:29:39<15:45:36, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=9.90s]
Epoch 0: 40%|███▉ | 4947/12384 [10:29:46<15:45:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.53s]
Epoch 0: 40%|███▉ | 4948/12384 [10:29:46<15:43:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.53s]
Epoch 0: 40%|███▉ | 4948/12384 [10:29:54<15:43:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 0: 40%|███▉ | 4949/12384 [10:29:54<15:31:21, 7.52s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 0: 40%|███▉ | 4949/12384 [10:30:01<15:31:21, 7.52s/it, loss=0.0002, acc=1.0000, iter_time=11.10s]
Epoch 0: 40%|███▉ | 4950/12384 [10:30:01<15:38:27, 7.57s/it, loss=0.0002, acc=1.0000, iter_time=11.10s]
Epoch 0: 40%|███▉ | 4950/12384 [10:30:09<15:38:27, 7.57s/it, loss=0.0001, acc=0.9999, iter_time=7.26s]
Epoch 0: 40%|███▉ | 4951/12384 [10:30:09<15:52:28, 7.69s/it, loss=0.0001, acc=0.9999, iter_time=7.26s]
Epoch 0: 40%|███▉ | 4951/12384 [10:30:17<15:52:28, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 0: 40%|███▉ | 4952/12384 [10:30:17<15:49:57, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 0: 40%|███▉ | 4952/12384 [10:30:24<15:49:57, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 40%|███▉ | 4953/12384 [10:30:24<15:47:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 40%|███▉ | 4953/12384 [10:30:32<15:47:53, 7.65s/it, loss=0.0004, acc=0.9988, iter_time=5.06s]
Epoch 0: 40%|████ | 4954/12384 [10:30:32<15:46:25, 7.64s/it, loss=0.0004, acc=0.9988, iter_time=5.06s]
Epoch 0: 40%|████ | 4954/12384 [10:30:40<15:46:25, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=10.16s]
Epoch 0: 40%|████ | 4955/12384 [10:30:40<15:44:45, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=10.16s]
Epoch 0: 40%|████ | 4955/12384 [10:30:47<15:44:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 0: 40%|████ | 4956/12384 [10:30:47<15:43:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 0: 40%|████ | 4956/12384 [10:30:55<15:43:36, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.60s]
Epoch 0: 40%|████ | 4957/12384 [10:30:55<15:42:46, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.60s]
Epoch 0: 40%|████ | 4957/12384 [10:31:03<15:42:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.29s]
Epoch 0: 40%|████ | 4958/12384 [10:31:03<15:42:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.29s]
Epoch 0: 40%|████ | 4958/12384 [10:31:10<15:42:30, 7.62s/it, loss=0.0002, acc=0.9996, iter_time=10.92s]
Epoch 0: 40%|████ | 4959/12384 [10:31:10<15:42:33, 7.62s/it, loss=0.0002, acc=0.9996, iter_time=10.92s]
Epoch 0: 40%|████ | 4959/12384 [10:31:18<15:42:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 40%|████ | 4960/12384 [10:31:18<15:42:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 40%|████ | 4960/12384 [10:31:25<15:42:04, 7.61s/it, loss=0.0003, acc=0.9999, iter_time=6.10s]
Epoch 0: 40%|████ | 4961/12384 [10:31:25<15:41:34, 7.61s/it, loss=0.0003, acc=0.9999, iter_time=6.10s]
Epoch 0: 40%|████ | 4961/12384 [10:31:33<15:41:34, 7.61s/it, loss=0.0009, acc=0.9965, iter_time=6.93s]
Epoch 0: 40%|████ | 4962/12384 [10:31:33<15:41:31, 7.61s/it, loss=0.0009, acc=0.9965, iter_time=6.93s]
Epoch 0: 40%|████ | 4962/12384 [10:31:41<15:41:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 0: 40%|████ | 4963/12384 [10:31:41<15:42:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 0: 40%|████ | 4963/12384 [10:31:48<15:42:05, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 40%|████ | 4964/12384 [10:31:48<15:42:16, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 40%|████ | 4964/12384 [10:31:56<15:42:16, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=7.62s]
Epoch 0: 40%|████ | 4965/12384 [10:31:56<15:42:17, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=7.62s]
Epoch 0: 40%|████ | 4965/12384 [10:32:03<15:42:17, 7.62s/it, loss=0.0004, acc=1.0000, iter_time=7.62s]
Epoch 0: 40%|████ | 4966/12384 [10:32:03<15:41:12, 7.61s/it, loss=0.0004, acc=1.0000, iter_time=7.62s]
Epoch 0: 40%|████ | 4966/12384 [10:32:11<15:41:12, 7.61s/it, loss=0.0002, acc=0.9987, iter_time=7.59s]
Epoch 0: 40%|████ | 4967/12384 [10:32:11<15:39:57, 7.60s/it, loss=0.0002, acc=0.9987, iter_time=7.59s]
Epoch 0: 40%|████ | 4967/12384 [10:32:19<15:39:57, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.55s]
Epoch 0: 40%|████ | 4968/12384 [10:32:19<15:40:11, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.55s]
Epoch 0: 40%|████ | 4968/12384 [10:32:26<15:40:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 0: 40%|████ | 4969/12384 [10:32:26<15:40:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 0: 40%|████ | 4969/12384 [10:32:34<15:40:05, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.57s]
Epoch 0: 40%|████ | 4970/12384 [10:32:34<15:40:10, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.57s]
Epoch 0: 40%|████ | 4970/12384 [10:32:41<15:40:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 0: 40%|████ | 4971/12384 [10:32:41<15:40:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 0: 40%|████ | 4971/12384 [10:32:49<15:40:51, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.88s]
Epoch 0: 40%|████ | 4972/12384 [10:32:49<15:40:48, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.88s]
Epoch 0: 40%|████ | 4972/12384 [10:32:57<15:40:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 40%|████ | 4973/12384 [10:32:57<15:40:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 40%|████ | 4973/12384 [10:33:04<15:40:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 0: 40%|████ | 4974/12384 [10:33:04<15:40:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 0: 40%|████ | 4974/12384 [10:33:12<15:40:55, 7.62s/it, loss=0.0001, acc=0.9996, iter_time=10.65s]
Epoch 0: 40%|████ | 4975/12384 [10:33:12<15:40:10, 7.61s/it, loss=0.0001, acc=0.9996, iter_time=10.65s]
Epoch 0: 40%|████ | 4975/12384 [10:33:20<15:40:10, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=7.98s]
Epoch 0: 40%|████ | 4976/12384 [10:33:20<15:40:17, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=7.98s]
Epoch 0: 40%|████ | 4976/12384 [10:33:28<15:40:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 0: 40%|████ | 4977/12384 [10:33:28<15:52:23, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 0: 40%|████ | 4977/12384 [10:33:35<15:52:23, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 0: 40%|████ | 4978/12384 [10:33:35<15:47:50, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 0: 40%|████ | 4978/12384 [10:33:43<15:47:50, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.04s]
Epoch 0: 40%|████ | 4979/12384 [10:33:43<15:44:52, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.04s]
Epoch 0: 40%|████ | 4979/12384 [10:33:50<15:44:52, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 40%|████ | 4980/12384 [10:33:50<15:43:08, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 40%|████ | 4980/12384 [10:33:58<15:43:08, 7.64s/it, loss=0.0002, acc=0.9993, iter_time=7.60s]
Epoch 0: 40%|████ | 4981/12384 [10:33:58<15:41:27, 7.63s/it, loss=0.0002, acc=0.9993, iter_time=7.60s]
Epoch 0: 40%|████ | 4981/12384 [10:34:06<15:41:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 40%|████ | 4982/12384 [10:34:06<15:42:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 40%|████ | 4982/12384 [10:34:13<15:42:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 40%|████ | 4983/12384 [10:34:13<15:41:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 40%|████ | 4983/12384 [10:34:21<15:41:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 40%|████ | 4984/12384 [10:34:21<15:40:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 40%|████ | 4984/12384 [10:34:29<15:40:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 40%|████ | 4985/12384 [10:34:29<15:43:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 40%|████ | 4985/12384 [10:34:36<15:43:29, 7.65s/it, loss=0.0002, acc=0.9992, iter_time=7.72s]
Epoch 0: 40%|████ | 4986/12384 [10:34:36<15:42:11, 7.64s/it, loss=0.0002, acc=0.9992, iter_time=7.72s]
Epoch 0: 40%|████ | 4986/12384 [10:34:44<15:42:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 0: 40%|████ | 4987/12384 [10:34:44<15:40:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 0: 40%|████ | 4987/12384 [10:34:51<15:40:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 0: 40%|████ | 4988/12384 [10:34:51<15:39:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 0: 40%|████ | 4988/12384 [10:34:59<15:39:34, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 40%|████ | 4989/12384 [10:34:59<15:38:35, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 40%|████ | 4989/12384 [10:35:07<15:38:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 40%|████ | 4990/12384 [10:35:07<15:37:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 40%|████ | 4990/12384 [10:35:14<15:37:59, 7.61s/it, loss=0.0024, acc=0.9951, iter_time=6.66s]
Epoch 0: 40%|████ | 4991/12384 [10:35:14<15:37:05, 7.61s/it, loss=0.0024, acc=0.9951, iter_time=6.66s]
Epoch 0: 40%|████ | 4991/12384 [10:35:22<15:37:05, 7.61s/it, loss=0.0001, acc=0.9997, iter_time=8.92s]
Epoch 0: 40%|████ | 4992/12384 [10:35:22<15:37:15, 7.61s/it, loss=0.0001, acc=0.9997, iter_time=8.92s]
Epoch 0: 40%|████ | 4992/12384 [10:35:29<15:37:15, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.42s]
Epoch 0: 40%|████ | 4993/12384 [10:35:29<15:37:04, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.42s]
Epoch 0: 40%|████ | 4993/12384 [10:35:37<15:37:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.41s]
Epoch 0: 40%|████ | 4994/12384 [10:35:37<15:36:17, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.41s]
Epoch 0: 40%|████ | 4994/12384 [10:35:45<15:36:17, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 40%|████ | 4995/12384 [10:35:45<15:37:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 40%|████ | 4995/12384 [10:35:52<15:37:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 40%|████ | 4996/12384 [10:35:52<15:37:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 40%|████ | 4996/12384 [10:36:00<15:37:22, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.84s]
Epoch 0: 40%|████ | 4997/12384 [10:36:00<15:37:32, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.84s]
Epoch 0: 40%|████ | 4997/12384 [10:36:07<15:37:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 0: 40%|████ | 4998/12384 [10:36:07<15:37:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 0: 40%|████ | 4998/12384 [10:36:15<15:37:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 40%|████ | 4999/12384 [10:36:15<15:37:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 40%|████ | 4999/12384 [10:36:23<15:37:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 40%|████ | 5000/12384 [10:36:23<15:43:55, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 40%|████ | 5000/12384 [10:36:30<15:43:55, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 0: 40%|████ | 5001/12384 [10:36:30<15:41:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 0: 40%|████ | 5001/12384 [10:36:38<15:41:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.95s]
Epoch 0: 40%|████ | 5002/12384 [10:36:38<15:40:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.95s]
Epoch 0: 40%|████ | 5002/12384 [10:36:46<15:40:54, 7.65s/it, loss=0.0016, acc=0.9922, iter_time=7.67s]
Epoch 0: 40%|████ | 5003/12384 [10:36:46<15:52:17, 7.74s/it, loss=0.0016, acc=0.9922, iter_time=7.67s]
Epoch 0: 40%|████ | 5003/12384 [10:36:54<15:52:17, 7.74s/it, loss=0.0004, acc=0.9998, iter_time=7.96s]
Epoch 0: 40%|████ | 5004/12384 [10:36:54<15:49:01, 7.72s/it, loss=0.0004, acc=0.9998, iter_time=7.96s]
Epoch 0: 40%|████ | 5004/12384 [10:37:01<15:49:01, 7.72s/it, loss=0.0002, acc=1.0000, iter_time=7.61s]
Epoch 0: 40%|████ | 5005/12384 [10:37:01<15:44:41, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=7.61s]
Epoch 0: 40%|████ | 5005/12384 [10:37:09<15:44:41, 7.68s/it, loss=0.0001, acc=0.9999, iter_time=7.60s]
Epoch 0: 40%|████ | 5006/12384 [10:37:09<15:42:19, 7.66s/it, loss=0.0001, acc=0.9999, iter_time=7.60s]
Epoch 0: 40%|████ | 5006/12384 [10:37:17<15:42:19, 7.66s/it, loss=0.0005, acc=0.9979, iter_time=5.09s]
Epoch 0: 40%|████ | 5007/12384 [10:37:17<15:39:26, 7.64s/it, loss=0.0005, acc=0.9979, iter_time=5.09s]
Epoch 0: 40%|████ | 5007/12384 [10:37:24<15:39:26, 7.64s/it, loss=0.0005, acc=0.9990, iter_time=10.06s]
Epoch 0: 40%|████ | 5008/12384 [10:37:24<15:37:42, 7.63s/it, loss=0.0005, acc=0.9990, iter_time=10.06s]
Epoch 0: 40%|████ | 5008/12384 [10:37:32<15:37:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 40%|████ | 5009/12384 [10:37:32<15:36:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 40%|████ | 5009/12384 [10:37:39<15:36:51, 7.62s/it, loss=0.0006, acc=0.9991, iter_time=6.67s]
Epoch 0: 40%|████ | 5010/12384 [10:37:39<15:36:30, 7.62s/it, loss=0.0006, acc=0.9991, iter_time=6.67s]
Epoch 0: 40%|████ | 5010/12384 [10:37:47<15:36:30, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.55s]
Epoch 0: 40%|████ | 5011/12384 [10:37:47<15:35:39, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.55s]
Epoch 0: 40%|████ | 5011/12384 [10:37:55<15:35:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 0: 40%|████ | 5012/12384 [10:37:55<15:35:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 0: 40%|████ | 5012/12384 [10:38:02<15:35:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.61s]
Epoch 0: 40%|████ | 5013/12384 [10:38:02<15:34:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.61s]
Epoch 0: 40%|████ | 5013/12384 [10:38:10<15:34:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.63s]
Epoch 0: 40%|████ | 5014/12384 [10:38:10<15:33:59, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.63s]
Epoch 0: 40%|████ | 5014/12384 [10:38:17<15:33:59, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 40%|████ | 5015/12384 [10:38:17<15:33:25, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 40%|████ | 5015/12384 [10:38:25<15:33:25, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=9.75s]
Epoch 0: 41%|████ | 5016/12384 [10:38:25<15:33:51, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=9.75s]
Epoch 0: 41%|████ | 5016/12384 [10:38:33<15:33:51, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 41%|████ | 5017/12384 [10:38:33<15:34:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 41%|████ | 5017/12384 [10:38:40<15:34:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 41%|████ | 5018/12384 [10:38:40<15:34:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 41%|████ | 5018/12384 [10:38:48<15:34:40, 7.61s/it, loss=0.0009, acc=0.9975, iter_time=6.14s]
Epoch 0: 41%|████ | 5019/12384 [10:38:48<15:33:24, 7.60s/it, loss=0.0009, acc=0.9975, iter_time=6.14s]
Epoch 0: 41%|████ | 5019/12384 [10:38:55<15:33:24, 7.60s/it, loss=0.0035, acc=0.9909, iter_time=7.24s]
Epoch 0: 41%|████ | 5020/12384 [10:38:55<15:36:01, 7.63s/it, loss=0.0035, acc=0.9909, iter_time=7.24s]
Epoch 0: 41%|████ | 5020/12384 [10:39:03<15:36:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 0: 41%|████ | 5021/12384 [10:39:03<15:34:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 0: 41%|████ | 5021/12384 [10:39:11<15:34:38, 7.62s/it, loss=0.0002, acc=0.9990, iter_time=9.33s]
Epoch 0: 41%|████ | 5022/12384 [10:39:11<15:34:01, 7.61s/it, loss=0.0002, acc=0.9990, iter_time=9.33s]
Epoch 0: 41%|████ | 5022/12384 [10:39:18<15:34:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 41%|████ | 5023/12384 [10:39:18<15:34:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 41%|████ | 5023/12384 [10:39:26<15:34:16, 7.62s/it, loss=0.0003, acc=0.9993, iter_time=8.00s]
Epoch 0: 41%|████ | 5024/12384 [10:39:26<15:34:31, 7.62s/it, loss=0.0003, acc=0.9993, iter_time=8.00s]
Epoch 0: 41%|████ | 5024/12384 [10:39:34<15:34:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.62s]
Epoch 0: 41%|████ | 5025/12384 [10:39:34<15:33:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.62s]
Epoch 0: 41%|████ | 5025/12384 [10:39:41<15:33:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.26s]
Epoch 0: 41%|████ | 5026/12384 [10:39:41<15:32:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.26s]
Epoch 0: 41%|████ | 5026/12384 [10:39:49<15:32:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 0: 41%|████ | 5027/12384 [10:39:49<15:32:23, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 0: 41%|████ | 5027/12384 [10:39:56<15:32:23, 7.60s/it, loss=0.0003, acc=1.0000, iter_time=7.59s]
Epoch 0: 41%|████ | 5028/12384 [10:39:56<15:32:13, 7.60s/it, loss=0.0003, acc=1.0000, iter_time=7.59s]
Epoch 0: 41%|████ | 5028/12384 [10:40:04<15:32:13, 7.60s/it, loss=0.0002, acc=1.0000, iter_time=7.68s]
Epoch 0: 41%|████ | 5029/12384 [10:40:04<15:45:25, 7.71s/it, loss=0.0002, acc=1.0000, iter_time=7.68s]
Epoch 0: 41%|████ | 5029/12384 [10:40:12<15:45:25, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 41%|████ | 5030/12384 [10:40:12<15:41:54, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 41%|████ | 5030/12384 [10:40:19<15:41:54, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 0: 41%|████ | 5031/12384 [10:40:19<15:39:02, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 0: 41%|████ | 5031/12384 [10:40:27<15:39:02, 7.66s/it, loss=0.0003, acc=0.9994, iter_time=11.09s]
Epoch 0: 41%|████ | 5032/12384 [10:40:27<15:37:55, 7.65s/it, loss=0.0003, acc=0.9994, iter_time=11.09s]
Epoch 0: 41%|████ | 5032/12384 [10:40:35<15:37:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 41%|████ | 5033/12384 [10:40:35<15:35:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 41%|████ | 5033/12384 [10:40:42<15:35:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 41%|████ | 5034/12384 [10:40:42<15:33:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 41%|████ | 5034/12384 [10:40:50<15:33:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 0: 41%|████ | 5035/12384 [10:40:50<15:31:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 0: 41%|████ | 5035/12384 [10:40:58<15:31:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.60s]
Epoch 0: 41%|████ | 5036/12384 [10:40:58<15:32:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.60s]
Epoch 0: 41%|████ | 5036/12384 [10:41:05<15:32:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 0: 41%|████ | 5037/12384 [10:41:05<15:31:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 0: 41%|████ | 5037/12384 [10:41:13<15:31:58, 7.61s/it, loss=0.0001, acc=0.9995, iter_time=9.91s]
Epoch 0: 41%|████ | 5038/12384 [10:41:13<15:31:02, 7.60s/it, loss=0.0001, acc=0.9995, iter_time=9.91s]
Epoch 0: 41%|████ | 5038/12384 [10:41:20<15:31:02, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 41%|████ | 5039/12384 [10:41:20<15:31:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 41%|████ | 5039/12384 [10:41:28<15:31:02, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.98s]
Epoch 0: 41%|████ | 5040/12384 [10:41:28<15:32:56, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.98s]
Epoch 0: 41%|████ | 5040/12384 [10:41:36<15:32:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 0: 41%|████ | 5041/12384 [10:41:36<15:32:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 0: 41%|████ | 5041/12384 [10:41:43<15:32:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 0: 41%|████ | 5042/12384 [10:41:43<15:31:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 0: 41%|████ | 5042/12384 [10:41:51<15:31:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 0: 41%|████ | 5043/12384 [10:41:51<15:30:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 0: 41%|████ | 5043/12384 [10:41:58<15:30:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.64s]
Epoch 0: 41%|████ | 5044/12384 [10:41:58<15:31:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.64s]
Epoch 0: 41%|████ | 5044/12384 [10:42:06<15:31:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.58s]
Epoch 0: 41%|████ | 5045/12384 [10:42:06<15:31:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.58s]
Epoch 0: 41%|████ | 5045/12384 [10:42:14<15:31:07, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=8.21s]
Epoch 0: 41%|████ | 5046/12384 [10:42:14<15:41:08, 7.70s/it, loss=0.0002, acc=1.0000, iter_time=8.21s]
Epoch 0: 41%|████ | 5046/12384 [10:42:22<15:41:08, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 0: 41%|████ | 5047/12384 [10:42:22<15:37:35, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 0: 41%|████ | 5047/12384 [10:42:29<15:37:35, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 0: 41%|████ | 5048/12384 [10:42:29<15:35:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 0: 41%|████ | 5048/12384 [10:42:37<15:35:49, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=4.59s]
Epoch 0: 41%|████ | 5049/12384 [10:42:37<15:32:55, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=4.59s]
Epoch 0: 41%|████ | 5049/12384 [10:42:44<15:32:55, 7.63s/it, loss=0.0004, acc=1.0000, iter_time=11.12s]
Epoch 0: 41%|████ | 5050/12384 [10:42:44<15:34:36, 7.65s/it, loss=0.0004, acc=1.0000, iter_time=11.12s]
Epoch 0: 41%|████ | 5050/12384 [10:42:52<15:34:36, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=4.18s]
Epoch 0: 41%|████ | 5051/12384 [10:42:52<15:35:09, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=4.18s]
Epoch 0: 41%|████ | 5051/12384 [10:43:00<15:35:09, 7.65s/it, loss=0.0001, acc=0.9998, iter_time=8.59s]
Epoch 0: 41%|████ | 5052/12384 [10:43:00<15:33:20, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=8.59s]
Epoch 0: 41%|████ | 5052/12384 [10:43:07<15:33:20, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.78s]
Epoch 0: 41%|████ | 5053/12384 [10:43:07<15:32:50, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.78s]
Epoch 0: 41%|████ | 5053/12384 [10:43:15<15:32:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 0: 41%|████ | 5054/12384 [10:43:15<15:32:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 0: 41%|████ | 5054/12384 [10:43:23<15:32:07, 7.63s/it, loss=0.0012, acc=0.9981, iter_time=9.38s]
Epoch 0: 41%|████ | 5055/12384 [10:43:23<15:31:43, 7.63s/it, loss=0.0012, acc=0.9981, iter_time=9.38s]
Epoch 0: 41%|████ | 5055/12384 [10:43:31<15:31:43, 7.63s/it, loss=0.0002, acc=0.9992, iter_time=9.62s]
Epoch 0: 41%|████ | 5056/12384 [10:43:31<15:46:18, 7.75s/it, loss=0.0002, acc=0.9992, iter_time=9.62s]
Epoch 0: 41%|████ | 5056/12384 [10:43:38<15:46:18, 7.75s/it, loss=0.0003, acc=0.9990, iter_time=7.57s]
Epoch 0: 41%|████ | 5057/12384 [10:43:38<15:42:08, 7.72s/it, loss=0.0003, acc=0.9990, iter_time=7.57s]
Epoch 0: 41%|████ | 5057/12384 [10:43:46<15:42:08, 7.72s/it, loss=0.0017, acc=0.9965, iter_time=7.62s]
Epoch 0: 41%|████ | 5058/12384 [10:43:46<15:37:30, 7.68s/it, loss=0.0017, acc=0.9965, iter_time=7.62s]
Epoch 0: 41%|████ | 5058/12384 [10:43:53<15:37:30, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 41%|████ | 5059/12384 [10:43:53<15:34:26, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 41%|████ | 5059/12384 [10:44:01<15:34:26, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=5.79s]
Epoch 0: 41%|████ | 5060/12384 [10:44:01<15:32:09, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=5.79s]
Epoch 0: 41%|████ | 5060/12384 [10:44:09<15:32:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 0: 41%|████ | 5061/12384 [10:44:09<15:33:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 0: 41%|████ | 5061/12384 [10:44:16<15:33:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 41%|████ | 5062/12384 [10:44:16<15:32:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 41%|████ | 5062/12384 [10:44:24<15:32:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 0: 41%|████ | 5063/12384 [10:44:24<15:31:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 0: 41%|████ | 5063/12384 [10:44:32<15:31:15, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.49s]
Epoch 0: 41%|████ | 5064/12384 [10:44:32<15:32:59, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.49s]
Epoch 0: 41%|████ | 5064/12384 [10:44:39<15:32:59, 7.65s/it, loss=0.0013, acc=0.9991, iter_time=7.65s]
Epoch 0: 41%|████ | 5065/12384 [10:44:39<15:31:23, 7.64s/it, loss=0.0013, acc=0.9991, iter_time=7.65s]
Epoch 0: 41%|████ | 5065/12384 [10:44:47<15:31:23, 7.64s/it, loss=0.0001, acc=0.9999, iter_time=5.65s]
Epoch 0: 41%|████ | 5066/12384 [10:44:47<15:30:49, 7.63s/it, loss=0.0001, acc=0.9999, iter_time=5.65s]
Epoch 0: 41%|████ | 5066/12384 [10:44:54<15:30:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.61s]
Epoch 0: 41%|████ | 5067/12384 [10:44:54<15:32:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.61s]
Epoch 0: 41%|████ | 5067/12384 [10:45:02<15:32:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 41%|████ | 5068/12384 [10:45:02<15:31:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 41%|████ | 5068/12384 [10:45:10<15:31:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 41%|████ | 5069/12384 [10:45:10<15:31:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 41%|████ | 5069/12384 [10:45:17<15:31:22, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.64s]
Epoch 0: 41%|████ | 5070/12384 [10:45:17<15:30:20, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.64s]
Epoch 0: 41%|████ | 5070/12384 [10:45:25<15:30:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 41%|████ | 5071/12384 [10:45:25<15:28:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 41%|████ | 5071/12384 [10:45:33<15:28:40, 7.62s/it, loss=0.0002, acc=0.9980, iter_time=7.54s]
Epoch 0: 41%|████ | 5072/12384 [10:45:33<15:27:37, 7.61s/it, loss=0.0002, acc=0.9980, iter_time=7.54s]
Epoch 0: 41%|████ | 5072/12384 [10:45:40<15:27:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 41%|████ | 5073/12384 [10:45:40<15:27:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 41%|████ | 5073/12384 [10:45:48<15:27:22, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.71s]
Epoch 0: 41%|████ | 5074/12384 [10:45:48<15:29:35, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.71s]
Epoch 0: 41%|████ | 5074/12384 [10:45:55<15:29:35, 7.63s/it, loss=0.0003, acc=0.9986, iter_time=6.99s]
Epoch 0: 41%|████ | 5075/12384 [10:45:55<15:28:36, 7.62s/it, loss=0.0003, acc=0.9986, iter_time=6.99s]
Epoch 0: 41%|████ | 5075/12384 [10:46:03<15:28:36, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=7.99s]
Epoch 0: 41%|████ | 5076/12384 [10:46:03<15:27:15, 7.61s/it, loss=0.0002, acc=0.9998, iter_time=7.99s]
Epoch 0: 41%|████ | 5076/12384 [10:46:11<15:27:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 0: 41%|████ | 5077/12384 [10:46:11<15:26:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 0: 41%|████ | 5077/12384 [10:46:18<15:26:23, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 41%|████ | 5078/12384 [10:46:18<15:26:54, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 41%|████ | 5078/12384 [10:46:26<15:26:54, 7.61s/it, loss=0.0005, acc=0.9976, iter_time=7.61s]
Epoch 0: 41%|████ | 5079/12384 [10:46:26<15:26:19, 7.61s/it, loss=0.0005, acc=0.9976, iter_time=7.61s]
Epoch 0: 41%|████ | 5079/12384 [10:46:33<15:26:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 41%|████ | 5080/12384 [10:46:33<15:26:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 41%|████ | 5080/12384 [10:46:41<15:26:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 0: 41%|████ | 5081/12384 [10:46:41<15:25:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 0: 41%|████ | 5081/12384 [10:46:49<15:25:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 0: 41%|████ | 5082/12384 [10:46:49<15:36:06, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 0: 41%|████ | 5082/12384 [10:46:57<15:36:06, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 0: 41%|████ | 5083/12384 [10:46:57<15:33:14, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 0: 41%|████ | 5083/12384 [10:47:04<15:33:14, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 0: 41%|████ | 5084/12384 [10:47:04<15:30:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 0: 41%|████ | 5084/12384 [10:47:12<15:30:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 41%|████ | 5085/12384 [10:47:12<15:29:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 41%|████ | 5085/12384 [10:47:19<15:29:34, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.61s]
Epoch 0: 41%|████ | 5086/12384 [10:47:19<15:31:51, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.61s]
Epoch 0: 41%|████ | 5086/12384 [10:47:27<15:31:51, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 41%|████ | 5087/12384 [10:47:27<15:29:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 41%|████ | 5087/12384 [10:47:35<15:29:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 41%|████ | 5088/12384 [10:47:35<15:31:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 41%|████ | 5088/12384 [10:47:42<15:31:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 0: 41%|████ | 5089/12384 [10:47:42<15:29:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 0: 41%|████ | 5089/12384 [10:47:50<15:29:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 41%|████ | 5090/12384 [10:47:50<15:27:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 41%|████ | 5090/12384 [10:47:58<15:27:24, 7.63s/it, loss=0.0016, acc=0.9973, iter_time=5.05s]
Epoch 0: 41%|████ | 5091/12384 [10:47:58<15:27:22, 7.63s/it, loss=0.0016, acc=0.9973, iter_time=5.05s]
Epoch 0: 41%|████ | 5091/12384 [10:48:05<15:27:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 0: 41%|████ | 5092/12384 [10:48:05<15:27:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 0: 41%|████ | 5092/12384 [10:48:13<15:27:19, 7.63s/it, loss=0.0004, acc=0.9993, iter_time=5.90s]
Epoch 0: 41%|████ | 5093/12384 [10:48:13<15:27:07, 7.63s/it, loss=0.0004, acc=0.9993, iter_time=5.90s]
Epoch 0: 41%|████ | 5093/12384 [10:48:21<15:27:07, 7.63s/it, loss=0.0003, acc=0.9999, iter_time=9.37s]
Epoch 0: 41%|████ | 5094/12384 [10:48:21<15:26:58, 7.63s/it, loss=0.0003, acc=0.9999, iter_time=9.37s]
Epoch 0: 41%|████ | 5094/12384 [10:48:28<15:26:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 41%|████ | 5095/12384 [10:48:28<15:25:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 41%|████ | 5095/12384 [10:48:36<15:25:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 41%|████ | 5096/12384 [10:48:36<15:26:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 41%|████ | 5096/12384 [10:48:43<15:26:09, 7.62s/it, loss=0.0012, acc=0.9968, iter_time=6.70s]
Epoch 0: 41%|████ | 5097/12384 [10:48:43<15:24:53, 7.62s/it, loss=0.0012, acc=0.9968, iter_time=6.70s]
Epoch 0: 41%|████ | 5097/12384 [10:48:51<15:24:53, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.84s]
Epoch 0: 41%|████ | 5098/12384 [10:48:51<15:34:38, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=8.84s]
Epoch 0: 41%|████ | 5098/12384 [10:48:59<15:34:38, 7.70s/it, loss=0.0003, acc=0.9980, iter_time=7.58s]
Epoch 0: 41%|████ | 5099/12384 [10:48:59<15:30:54, 7.67s/it, loss=0.0003, acc=0.9980, iter_time=7.58s]
Epoch 0: 41%|████ | 5099/12384 [10:49:07<15:30:54, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=8.10s]
Epoch 0: 41%|████ | 5100/12384 [10:49:07<15:31:48, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=8.10s]
Epoch 0: 41%|████ | 5100/12384 [10:49:14<15:31:48, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=3.92s]
Epoch 0: 41%|████ | 5101/12384 [10:49:14<15:28:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=3.92s]
Epoch 0: 41%|████ | 5101/12384 [10:49:22<15:28:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 0: 41%|████ | 5102/12384 [10:49:22<15:25:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 0: 41%|████ | 5102/12384 [10:49:29<15:25:38, 7.63s/it, loss=0.0003, acc=0.9992, iter_time=6.51s]
Epoch 0: 41%|████ | 5103/12384 [10:49:29<15:25:20, 7.63s/it, loss=0.0003, acc=0.9992, iter_time=6.51s]
Epoch 0: 41%|████ | 5103/12384 [10:49:37<15:25:20, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=10.86s]
Epoch 0: 41%|████ | 5104/12384 [10:49:37<15:25:00, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.86s]
Epoch 0: 41%|████ | 5104/12384 [10:49:44<15:25:00, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.38s]
Epoch 0: 41%|████ | 5105/12384 [10:49:44<14:47:27, 7.32s/it, loss=0.0001, acc=1.0000, iter_time=5.38s]
Epoch 0: 41%|████ | 5105/12384 [10:49:51<14:47:27, 7.32s/it, loss=0.0001, acc=1.0000, iter_time=5.96s]
Epoch 0: 41%|████ | 5106/12384 [10:49:51<14:58:02, 7.40s/it, loss=0.0001, acc=1.0000, iter_time=5.96s]
Epoch 0: 41%|████ | 5106/12384 [10:49:59<14:58:02, 7.40s/it, loss=0.0001, acc=1.0000, iter_time=10.11s]
Epoch 0: 41%|████ | 5107/12384 [10:49:59<15:05:09, 7.46s/it, loss=0.0001, acc=1.0000, iter_time=10.11s]
Epoch 0: 41%|████ | 5107/12384 [10:50:06<15:05:09, 7.46s/it, loss=0.0001, acc=0.9998, iter_time=7.60s]
Epoch 0: 41%|████ | 5108/12384 [10:50:06<15:10:37, 7.51s/it, loss=0.0001, acc=0.9998, iter_time=7.60s]
Epoch 0: 41%|████ | 5108/12384 [10:50:14<15:10:37, 7.51s/it, loss=0.0000, acc=1.0000, iter_time=4.62s]
Epoch 0: 41%|████▏ | 5109/12384 [10:50:14<15:27:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.62s]
Epoch 0: 41%|████▏ | 5109/12384 [10:50:22<15:27:17, 7.65s/it, loss=0.0003, acc=0.9998, iter_time=8.69s]
Epoch 0: 41%|████▏ | 5110/12384 [10:50:22<15:27:49, 7.65s/it, loss=0.0003, acc=0.9998, iter_time=8.69s]
Epoch 0: 41%|████▏ | 5110/12384 [10:50:30<15:27:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 0: 41%|████▏ | 5111/12384 [10:50:30<15:27:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 0: 41%|████▏ | 5111/12384 [10:50:37<15:27:12, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=7.59s]
Epoch 0: 41%|████▏ | 5112/12384 [10:50:37<15:26:04, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=7.59s]
Epoch 0: 41%|████▏ | 5112/12384 [10:50:45<15:26:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 41%|████▏ | 5113/12384 [10:50:45<15:26:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 41%|████▏ | 5113/12384 [10:50:53<15:26:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 41%|████▏ | 5114/12384 [10:50:53<15:25:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 41%|████▏ | 5114/12384 [10:51:00<15:25:00, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.30s]
Epoch 0: 41%|████▏ | 5115/12384 [10:51:00<15:23:50, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.30s]
Epoch 0: 41%|████▏ | 5115/12384 [10:51:08<15:23:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.55s]
Epoch 0: 41%|████▏ | 5116/12384 [10:51:08<15:22:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.55s]
Epoch 0: 41%|████▏ | 5116/12384 [10:51:15<15:22:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.96s]
Epoch 0: 41%|████▏ | 5117/12384 [10:51:15<15:22:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.96s]
Epoch 0: 41%|████▏ | 5117/12384 [10:51:23<15:22:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 0: 41%|████▏ | 5118/12384 [10:51:23<15:26:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 0: 41%|████▏ | 5118/12384 [10:51:31<15:26:12, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=10.25s]
Epoch 0: 41%|████▏ | 5119/12384 [10:51:31<15:25:29, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=10.25s]
Epoch 0: 41%|████▏ | 5119/12384 [10:51:38<15:25:29, 7.64s/it, loss=0.0001, acc=0.9999, iter_time=8.04s]
Epoch 0: 41%|████▏ | 5120/12384 [10:51:38<15:26:45, 7.65s/it, loss=0.0001, acc=0.9999, iter_time=8.04s]
Epoch 0: 41%|████▏ | 5120/12384 [10:51:46<15:26:45, 7.65s/it, loss=0.0008, acc=0.9973, iter_time=4.72s]
Epoch 0: 41%|████▏ | 5121/12384 [10:51:46<15:25:06, 7.64s/it, loss=0.0008, acc=0.9973, iter_time=4.72s]
Epoch 0: 41%|████▏ | 5121/12384 [10:51:54<15:25:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 0: 41%|████▏ | 5122/12384 [10:51:54<15:24:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 0: 41%|████▏ | 5122/12384 [10:52:01<15:24:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 41%|████▏ | 5123/12384 [10:52:01<15:24:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 41%|████▏ | 5123/12384 [10:52:09<15:24:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 0: 41%|████▏ | 5124/12384 [10:52:09<15:34:20, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 0: 41%|████▏ | 5124/12384 [10:52:17<15:34:20, 7.72s/it, loss=0.0006, acc=0.9980, iter_time=4.77s]
Epoch 0: 41%|████▏ | 5125/12384 [10:52:17<15:29:56, 7.69s/it, loss=0.0006, acc=0.9980, iter_time=4.77s]
Epoch 0: 41%|████▏ | 5125/12384 [10:52:24<15:29:56, 7.69s/it, loss=0.0002, acc=0.9997, iter_time=10.42s]
Epoch 0: 41%|████▏ | 5126/12384 [10:52:24<15:27:48, 7.67s/it, loss=0.0002, acc=0.9997, iter_time=10.42s]
Epoch 0: 41%|████▏ | 5126/12384 [10:52:32<15:27:48, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 0: 41%|████▏ | 5127/12384 [10:52:32<15:25:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 0: 41%|████▏ | 5127/12384 [10:52:40<15:25:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 0: 41%|████▏ | 5128/12384 [10:52:40<15:23:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 0: 41%|████▏ | 5128/12384 [10:52:47<15:23:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 0: 41%|████▏ | 5129/12384 [10:52:47<15:23:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 0: 41%|████▏ | 5129/12384 [10:52:55<15:23:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 0: 41%|████▏ | 5130/12384 [10:52:55<15:21:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 0: 41%|████▏ | 5130/12384 [10:53:02<15:21:55, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 41%|████▏ | 5131/12384 [10:53:02<15:21:16, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 41%|████▏ | 5131/12384 [10:53:10<15:21:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 0: 41%|████▏ | 5132/12384 [10:53:10<15:22:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 0: 41%|████▏ | 5132/12384 [10:53:18<15:22:08, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.11s]
Epoch 0: 41%|████▏ | 5133/12384 [10:53:18<15:21:28, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.11s]
Epoch 0: 41%|████▏ | 5133/12384 [10:53:25<15:21:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 41%|████▏ | 5134/12384 [10:53:25<15:20:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 41%|████▏ | 5134/12384 [10:53:33<15:20:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 0: 41%|████▏ | 5135/12384 [10:53:33<15:32:22, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 0: 41%|████▏ | 5135/12384 [10:53:41<15:32:22, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.85s]
Epoch 0: 41%|████▏ | 5136/12384 [10:53:41<15:28:53, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.85s]
Epoch 0: 41%|████▏ | 5136/12384 [10:53:49<15:28:53, 7.69s/it, loss=0.0002, acc=0.9989, iter_time=7.23s]
Epoch 0: 41%|████▏ | 5137/12384 [10:53:49<15:25:25, 7.66s/it, loss=0.0002, acc=0.9989, iter_time=7.23s]
Epoch 0: 41%|████▏ | 5137/12384 [10:53:56<15:25:25, 7.66s/it, loss=0.0006, acc=0.9983, iter_time=7.60s]
Epoch 0: 41%|████▏ | 5138/12384 [10:53:56<15:23:44, 7.65s/it, loss=0.0006, acc=0.9983, iter_time=7.60s]
Epoch 0: 41%|████▏ | 5138/12384 [10:54:04<15:23:44, 7.65s/it, loss=0.0007, acc=1.0000, iter_time=7.62s]
Epoch 0: 41%|████▏ | 5139/12384 [10:54:04<15:22:35, 7.64s/it, loss=0.0007, acc=1.0000, iter_time=7.62s]
Epoch 0: 41%|████▏ | 5139/12384 [10:54:11<15:22:35, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 42%|████▏ | 5140/12384 [10:54:11<15:23:07, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 42%|████▏ | 5140/12384 [10:54:19<15:23:07, 7.65s/it, loss=0.0003, acc=0.9999, iter_time=7.66s]
Epoch 0: 42%|████▏ | 5141/12384 [10:54:19<15:21:42, 7.64s/it, loss=0.0003, acc=0.9999, iter_time=7.66s]
Epoch 0: 42%|████▏ | 5141/12384 [10:54:27<15:21:42, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=4.55s]
Epoch 0: 42%|████▏ | 5142/12384 [10:54:27<15:20:41, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=4.55s]
Epoch 0: 42%|████▏ | 5142/12384 [10:54:34<15:20:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.67s]
Epoch 0: 42%|████▏ | 5143/12384 [10:54:34<15:22:58, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.67s]
Epoch 0: 42%|████▏ | 5143/12384 [10:54:42<15:22:58, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 0: 42%|████▏ | 5144/12384 [10:54:42<15:21:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 0: 42%|████▏ | 5144/12384 [10:54:50<15:21:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 42%|████▏ | 5145/12384 [10:54:50<15:20:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 42%|████▏ | 5145/12384 [10:54:57<15:20:31, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 42%|████▏ | 5146/12384 [10:54:57<15:20:01, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 42%|████▏ | 5146/12384 [10:55:05<15:20:01, 7.63s/it, loss=0.0003, acc=0.9987, iter_time=5.33s]
Epoch 0: 42%|████▏ | 5147/12384 [10:55:05<15:19:42, 7.63s/it, loss=0.0003, acc=0.9987, iter_time=5.33s]
Epoch 0: 42%|████▏ | 5147/12384 [10:55:12<15:19:42, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.90s]
Epoch 0: 42%|████▏ | 5148/12384 [10:55:12<15:20:09, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.90s]
Epoch 0: 42%|████▏ | 5148/12384 [10:55:20<15:20:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 42%|████▏ | 5149/12384 [10:55:20<15:18:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 42%|████▏ | 5149/12384 [10:55:28<15:18:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 0: 42%|████▏ | 5150/12384 [10:55:28<15:28:46, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 0: 42%|████▏ | 5150/12384 [10:55:36<15:28:46, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 42%|████▏ | 5151/12384 [10:55:36<15:25:09, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 42%|████▏ | 5151/12384 [10:55:43<15:25:09, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 42%|████▏ | 5152/12384 [10:55:43<15:22:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 42%|████▏ | 5152/12384 [10:55:51<15:22:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.44s]
Epoch 0: 42%|████▏ | 5153/12384 [10:55:51<15:20:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.44s]
Epoch 0: 42%|████▏ | 5153/12384 [10:55:58<15:20:49, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=10.39s]
Epoch 0: 42%|████▏ | 5154/12384 [10:55:58<15:19:34, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=10.39s]
Epoch 0: 42%|████▏ | 5154/12384 [10:56:06<15:19:34, 7.63s/it, loss=0.0001, acc=0.9992, iter_time=7.59s]
Epoch 0: 42%|████▏ | 5155/12384 [10:56:06<15:18:22, 7.62s/it, loss=0.0001, acc=0.9992, iter_time=7.59s]
Epoch 0: 42%|████▏ | 5155/12384 [10:56:14<15:18:22, 7.62s/it, loss=0.0003, acc=0.9995, iter_time=7.65s]
Epoch 0: 42%|████▏ | 5156/12384 [10:56:14<15:19:07, 7.63s/it, loss=0.0003, acc=0.9995, iter_time=7.65s]
Epoch 0: 42%|████▏ | 5156/12384 [10:56:21<15:19:07, 7.63s/it, loss=0.0002, acc=0.9981, iter_time=7.63s]
Epoch 0: 42%|████▏ | 5157/12384 [10:56:21<15:18:38, 7.63s/it, loss=0.0002, acc=0.9981, iter_time=7.63s]
Epoch 0: 42%|████▏ | 5157/12384 [10:56:29<15:18:38, 7.63s/it, loss=0.0009, acc=0.9973, iter_time=5.01s]
Epoch 0: 42%|████▏ | 5158/12384 [10:56:29<15:18:17, 7.62s/it, loss=0.0009, acc=0.9973, iter_time=5.01s]
Epoch 0: 42%|████▏ | 5158/12384 [10:56:37<15:18:17, 7.62s/it, loss=0.0002, acc=0.9989, iter_time=10.22s]
Epoch 0: 42%|████▏ | 5159/12384 [10:56:37<15:21:31, 7.65s/it, loss=0.0002, acc=0.9989, iter_time=10.22s]
Epoch 0: 42%|████▏ | 5159/12384 [10:56:44<15:21:31, 7.65s/it, loss=0.0002, acc=0.9998, iter_time=7.68s]
Epoch 0: 42%|████▏ | 5160/12384 [10:56:44<15:20:25, 7.64s/it, loss=0.0002, acc=0.9998, iter_time=7.68s]
Epoch 0: 42%|████▏ | 5160/12384 [10:56:52<15:20:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 42%|████▏ | 5161/12384 [10:56:52<15:32:33, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 42%|████▏ | 5161/12384 [10:57:00<15:32:33, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 42%|████▏ | 5162/12384 [10:57:00<15:27:11, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 42%|████▏ | 5162/12384 [10:57:07<15:27:11, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.55s]
Epoch 0: 42%|████▏ | 5163/12384 [10:57:07<15:22:46, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.55s]
Epoch 0: 42%|████▏ | 5163/12384 [10:57:15<15:22:46, 7.67s/it, loss=0.0009, acc=0.9977, iter_time=7.51s]
Epoch 0: 42%|████▏ | 5164/12384 [10:57:15<15:21:08, 7.65s/it, loss=0.0009, acc=0.9977, iter_time=7.51s]
Epoch 0: 42%|████▏ | 5164/12384 [10:57:23<15:21:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.77s]
Epoch 0: 42%|████▏ | 5165/12384 [10:57:23<15:19:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.77s]
Epoch 0: 42%|████▏ | 5165/12384 [10:57:30<15:19:23, 7.64s/it, loss=0.0001, acc=0.9992, iter_time=7.61s]
Epoch 0: 42%|████▏ | 5166/12384 [10:57:30<15:17:47, 7.63s/it, loss=0.0001, acc=0.9992, iter_time=7.61s]
Epoch 0: 42%|████▏ | 5166/12384 [10:57:38<15:17:47, 7.63s/it, loss=0.0008, acc=0.9973, iter_time=7.61s]
Epoch 0: 42%|████▏ | 5167/12384 [10:57:38<15:16:46, 7.62s/it, loss=0.0008, acc=0.9973, iter_time=7.61s]
Epoch 0: 42%|████▏ | 5167/12384 [10:57:45<15:16:46, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=8.00s]
Epoch 0: 42%|████▏ | 5168/12384 [10:57:45<15:16:53, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=8.00s]
Epoch 0: 42%|████▏ | 5168/12384 [10:57:53<15:16:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.28s]
Epoch 0: 42%|████▏ | 5169/12384 [10:57:53<15:16:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.28s]
Epoch 0: 42%|████▏ | 5169/12384 [10:58:01<15:16:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 0: 42%|████▏ | 5170/12384 [10:58:01<15:17:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 0: 42%|████▏ | 5170/12384 [10:58:08<15:17:21, 7.63s/it, loss=0.0003, acc=0.9999, iter_time=7.66s]
Epoch 0: 42%|████▏ | 5171/12384 [10:58:08<15:16:28, 7.62s/it, loss=0.0003, acc=0.9999, iter_time=7.66s]
Epoch 0: 42%|████▏ | 5171/12384 [10:58:16<15:16:28, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=7.61s]
Epoch 0: 42%|████▏ | 5172/12384 [10:58:16<15:20:04, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=7.61s]
Epoch 0: 42%|████▏ | 5172/12384 [10:58:24<15:20:04, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.73s]
Epoch 0: 42%|████▏ | 5173/12384 [10:58:24<15:20:42, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.73s]
Epoch 0: 42%|████▏ | 5173/12384 [10:58:31<15:20:42, 7.66s/it, loss=0.0049, acc=0.9899, iter_time=7.67s]
Epoch 0: 42%|████▏ | 5174/12384 [10:58:31<15:22:22, 7.68s/it, loss=0.0049, acc=0.9899, iter_time=7.67s]
Epoch 0: 42%|████▏ | 5174/12384 [10:58:39<15:22:22, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 42%|████▏ | 5175/12384 [10:58:39<15:19:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 42%|████▏ | 5175/12384 [10:58:47<15:19:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 42%|████▏ | 5176/12384 [10:58:47<15:18:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 42%|████▏ | 5176/12384 [10:58:55<15:18:09, 7.64s/it, loss=0.0001, acc=0.9999, iter_time=7.53s]
Epoch 0: 42%|████▏ | 5177/12384 [10:58:55<15:27:12, 7.72s/it, loss=0.0001, acc=0.9999, iter_time=7.53s]
Epoch 0: 42%|████▏ | 5177/12384 [10:59:02<15:27:12, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 42%|████▏ | 5178/12384 [10:59:02<15:23:21, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 42%|████▏ | 5178/12384 [10:59:10<15:23:21, 7.69s/it, loss=0.0001, acc=0.9993, iter_time=7.00s]
Epoch 0: 42%|████▏ | 5179/12384 [10:59:10<15:20:20, 7.66s/it, loss=0.0001, acc=0.9993, iter_time=7.00s]
Epoch 0: 42%|████▏ | 5179/12384 [10:59:17<15:20:20, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.70s]
Epoch 0: 42%|████▏ | 5180/12384 [10:59:17<15:18:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.70s]
Epoch 0: 42%|████▏ | 5180/12384 [10:59:25<15:18:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.15s]
Epoch 0: 42%|████▏ | 5181/12384 [10:59:25<15:16:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.15s]
Epoch 0: 42%|████▏ | 5181/12384 [10:59:33<15:16:42, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 42%|████▏ | 5182/12384 [10:59:33<15:16:48, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 42%|████▏ | 5182/12384 [10:59:40<15:16:48, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.73s]
Epoch 0: 42%|████▏ | 5183/12384 [10:59:40<15:19:00, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.73s]
Epoch 0: 42%|████▏ | 5183/12384 [10:59:48<15:19:00, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 0: 42%|████▏ | 5184/12384 [10:59:48<15:16:35, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 0: 42%|████▏ | 5184/12384 [10:59:56<15:16:35, 7.64s/it, loss=0.0008, acc=0.9977, iter_time=7.21s]
Epoch 0: 42%|████▏ | 5185/12384 [10:59:56<15:15:43, 7.63s/it, loss=0.0008, acc=0.9977, iter_time=7.21s]
Epoch 0: 42%|████▏ | 5185/12384 [11:00:03<15:15:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 42%|████▏ | 5186/12384 [11:00:03<15:15:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 42%|████▏ | 5186/12384 [11:00:11<15:15:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 42%|████▏ | 5187/12384 [11:00:11<15:29:23, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 42%|████▏ | 5187/12384 [11:00:19<15:29:23, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 42%|████▏ | 5188/12384 [11:00:19<15:24:17, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 42%|████▏ | 5188/12384 [11:00:26<15:24:17, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 42%|████▏ | 5189/12384 [11:00:26<15:20:43, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 42%|████▏ | 5189/12384 [11:00:34<15:20:43, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 42%|████▏ | 5190/12384 [11:00:34<15:22:03, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 42%|████▏ | 5190/12384 [11:00:42<15:22:03, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 0: 42%|████▏ | 5191/12384 [11:00:42<15:19:03, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 0: 42%|████▏ | 5191/12384 [11:00:49<15:19:03, 7.67s/it, loss=0.0005, acc=0.9997, iter_time=8.96s]
Epoch 0: 42%|████▏ | 5192/12384 [11:00:49<15:17:39, 7.66s/it, loss=0.0005, acc=0.9997, iter_time=8.96s]
Epoch 0: 42%|████▏ | 5192/12384 [11:00:57<15:17:39, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=3.69s]
Epoch 0: 42%|████▏ | 5193/12384 [11:00:57<15:16:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=3.69s]
Epoch 0: 42%|████▏ | 5193/12384 [11:01:05<15:16:32, 7.65s/it, loss=0.0001, acc=0.9994, iter_time=11.17s]
Epoch 0: 42%|████▏ | 5194/12384 [11:01:05<15:17:16, 7.65s/it, loss=0.0001, acc=0.9994, iter_time=11.17s]
Epoch 0: 42%|████▏ | 5194/12384 [11:01:12<15:17:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 42%|████▏ | 5195/12384 [11:01:12<15:14:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 42%|████▏ | 5195/12384 [11:01:20<15:14:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 42%|████▏ | 5196/12384 [11:01:20<15:12:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 42%|████▏ | 5196/12384 [11:01:27<15:12:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 42%|████▏ | 5197/12384 [11:01:27<15:11:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 42%|████▏ | 5197/12384 [11:01:35<15:11:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.49s]
Epoch 0: 42%|████▏ | 5198/12384 [11:01:35<15:11:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.49s]
Epoch 0: 42%|████▏ | 5198/12384 [11:01:43<15:11:36, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.71s]
Epoch 0: 42%|████▏ | 5199/12384 [11:01:43<15:10:51, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.71s]
Epoch 0: 42%|████▏ | 5199/12384 [11:01:49<15:10:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 0: 42%|████▏ | 5200/12384 [11:01:49<14:37:09, 7.33s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 0: 42%|████▏ | 5200/12384 [11:01:57<14:37:09, 7.33s/it, loss=0.0001, acc=1.0000, iter_time=4.88s]
Epoch 0: 42%|████▏ | 5201/12384 [11:01:57<14:47:49, 7.42s/it, loss=0.0001, acc=1.0000, iter_time=4.88s]
Epoch 0: 42%|████▏ | 5201/12384 [11:02:05<14:47:49, 7.42s/it, loss=0.0003, acc=0.9986, iter_time=9.95s]
Epoch 0: 42%|████▏ | 5202/12384 [11:02:05<14:54:38, 7.47s/it, loss=0.0003, acc=0.9986, iter_time=9.95s]
Epoch 0: 42%|████▏ | 5202/12384 [11:02:12<14:54:38, 7.47s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 42%|████▏ | 5203/12384 [11:02:12<15:00:00, 7.52s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 42%|████▏ | 5203/12384 [11:02:20<15:00:00, 7.52s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 0: 42%|████▏ | 5204/12384 [11:02:20<15:03:35, 7.55s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 0: 42%|████▏ | 5204/12384 [11:02:27<15:03:35, 7.55s/it, loss=0.0001, acc=1.0000, iter_time=9.91s]
Epoch 0: 42%|████▏ | 5205/12384 [11:02:27<15:05:15, 7.57s/it, loss=0.0001, acc=1.0000, iter_time=9.91s]
Epoch 0: 42%|████▏ | 5205/12384 [11:02:35<15:05:15, 7.57s/it, loss=0.0002, acc=0.9986, iter_time=5.83s]
Epoch 0: 42%|████▏ | 5206/12384 [11:02:35<15:07:07, 7.58s/it, loss=0.0002, acc=0.9986, iter_time=5.83s]
Epoch 0: 42%|████▏ | 5206/12384 [11:02:43<15:07:07, 7.58s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 0: 42%|████▏ | 5207/12384 [11:02:43<15:07:34, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 0: 42%|████▏ | 5207/12384 [11:02:50<15:07:34, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 0: 42%|████▏ | 5208/12384 [11:02:50<15:07:45, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 0: 42%|████▏ | 5208/12384 [11:02:58<15:07:45, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 0: 42%|████▏ | 5209/12384 [11:02:58<15:06:55, 7.58s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 0: 42%|████▏ | 5209/12384 [11:03:05<15:06:55, 7.58s/it, loss=0.0005, acc=0.9971, iter_time=8.13s]
Epoch 0: 42%|████▏ | 5210/12384 [11:03:05<15:07:48, 7.59s/it, loss=0.0005, acc=0.9971, iter_time=8.13s]
Epoch 0: 42%|████▏ | 5210/12384 [11:03:13<15:07:48, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 0: 42%|████▏ | 5211/12384 [11:03:13<15:08:46, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 0: 42%|████▏ | 5211/12384 [11:03:21<15:08:46, 7.60s/it, loss=0.0008, acc=0.9985, iter_time=7.01s]
Epoch 0: 42%|████▏ | 5212/12384 [11:03:21<15:08:56, 7.60s/it, loss=0.0008, acc=0.9985, iter_time=7.01s]
Epoch 0: 42%|████▏ | 5212/12384 [11:03:29<15:08:56, 7.60s/it, loss=0.0002, acc=0.9987, iter_time=9.13s]
Epoch 0: 42%|████▏ | 5213/12384 [11:03:29<15:21:06, 7.71s/it, loss=0.0002, acc=0.9987, iter_time=9.13s]
Epoch 0: 42%|████▏ | 5213/12384 [11:03:36<15:21:06, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 42%|████▏ | 5214/12384 [11:03:36<15:20:41, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 42%|████▏ | 5214/12384 [11:03:44<15:20:41, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 42%|████▏ | 5215/12384 [11:03:44<15:17:15, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 42%|████▏ | 5215/12384 [11:03:51<15:17:15, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 42%|████▏ | 5216/12384 [11:03:51<15:14:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 42%|████▏ | 5216/12384 [11:03:59<15:14:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.02s]
Epoch 0: 42%|████▏ | 5217/12384 [11:03:59<15:12:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.02s]
Epoch 0: 42%|████▏ | 5217/12384 [11:04:07<15:12:19, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.79s]
Epoch 0: 42%|████▏ | 5218/12384 [11:04:07<15:10:47, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.79s]
Epoch 0: 42%|████▏ | 5218/12384 [11:04:14<15:10:47, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.58s]
Epoch 0: 42%|████▏ | 5219/12384 [11:04:14<15:09:26, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.58s]
Epoch 0: 42%|████▏ | 5219/12384 [11:04:22<15:09:26, 7.62s/it, loss=0.0002, acc=0.9991, iter_time=4.00s]
Epoch 0: 42%|████▏ | 5220/12384 [11:04:22<15:08:49, 7.61s/it, loss=0.0002, acc=0.9991, iter_time=4.00s]
Epoch 0: 42%|████▏ | 5220/12384 [11:04:29<15:08:49, 7.61s/it, loss=0.0007, acc=0.9980, iter_time=11.21s]
Epoch 0: 42%|████▏ | 5221/12384 [11:04:29<15:08:29, 7.61s/it, loss=0.0007, acc=0.9980, iter_time=11.21s]
Epoch 0: 42%|████▏ | 5221/12384 [11:04:37<15:08:29, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=7.60s]
Epoch 0: 42%|████▏ | 5222/12384 [11:04:37<15:07:29, 7.60s/it, loss=0.0003, acc=1.0000, iter_time=7.60s]
Epoch 0: 42%|████▏ | 5222/12384 [11:04:45<15:07:29, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 42%|████▏ | 5223/12384 [11:04:45<15:08:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 42%|████▏ | 5223/12384 [11:04:52<15:08:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 42%|████▏ | 5224/12384 [11:04:52<15:08:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 42%|████▏ | 5224/12384 [11:05:00<15:08:39, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.23s]
Epoch 0: 42%|████▏ | 5225/12384 [11:05:00<15:08:58, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.23s]
Epoch 0: 42%|████▏ | 5225/12384 [11:05:08<15:08:58, 7.62s/it, loss=0.0039, acc=0.9977, iter_time=7.08s]
Epoch 0: 42%|████▏ | 5226/12384 [11:05:08<15:08:02, 7.61s/it, loss=0.0039, acc=0.9977, iter_time=7.08s]
Epoch 0: 42%|████▏ | 5226/12384 [11:05:15<15:08:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 0: 42%|████▏ | 5227/12384 [11:05:15<15:07:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 0: 42%|████▏ | 5227/12384 [11:05:23<15:07:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 42%|████▏ | 5228/12384 [11:05:23<15:07:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 42%|████▏ | 5228/12384 [11:05:31<15:07:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 42%|████▏ | 5229/12384 [11:05:31<15:16:55, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 42%|████▏ | 5229/12384 [11:05:38<15:16:55, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 0: 42%|████▏ | 5230/12384 [11:05:38<15:14:11, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 0: 42%|████▏ | 5230/12384 [11:05:46<15:14:11, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.46s]
Epoch 0: 42%|████▏ | 5231/12384 [11:05:46<15:11:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.46s]
Epoch 0: 42%|████▏ | 5231/12384 [11:05:53<15:11:19, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.57s]
Epoch 0: 42%|████▏ | 5232/12384 [11:05:53<15:10:30, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.57s]
Epoch 0: 42%|████▏ | 5232/12384 [11:06:01<15:10:30, 7.64s/it, loss=0.0002, acc=0.9993, iter_time=7.65s]
Epoch 0: 42%|████▏ | 5233/12384 [11:06:01<15:08:31, 7.62s/it, loss=0.0002, acc=0.9993, iter_time=7.65s]
Epoch 0: 42%|████▏ | 5233/12384 [11:06:09<15:08:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 42%|████▏ | 5234/12384 [11:06:09<15:08:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 42%|████▏ | 5234/12384 [11:06:16<15:08:08, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 42%|████▏ | 5235/12384 [11:06:16<15:10:32, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 42%|████▏ | 5235/12384 [11:06:24<15:10:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.39s]
Epoch 0: 42%|████▏ | 5236/12384 [11:06:24<15:09:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.39s]
Epoch 0: 42%|████▏ | 5236/12384 [11:06:32<15:09:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.43s]
Epoch 0: 42%|████▏ | 5237/12384 [11:06:32<15:07:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.43s]
Epoch 0: 42%|████▏ | 5237/12384 [11:06:39<15:07:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 0: 42%|████▏ | 5238/12384 [11:06:39<15:07:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 0: 42%|████▏ | 5238/12384 [11:06:47<15:07:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.08s]
Epoch 0: 42%|████▏ | 5239/12384 [11:06:47<15:06:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.08s]
Epoch 0: 42%|████▏ | 5239/12384 [11:06:55<15:06:58, 7.62s/it, loss=0.0039, acc=0.9963, iter_time=8.63s]
Epoch 0: 42%|████▏ | 5240/12384 [11:06:55<15:19:40, 7.72s/it, loss=0.0039, acc=0.9963, iter_time=8.63s]
Epoch 0: 42%|████▏ | 5240/12384 [11:07:02<15:19:40, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 0: 42%|████▏ | 5241/12384 [11:07:02<15:15:37, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 0: 42%|████▏ | 5241/12384 [11:07:10<15:15:37, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 42%|████▏ | 5242/12384 [11:07:10<15:12:34, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 42%|████▏ | 5242/12384 [11:07:18<15:12:34, 7.67s/it, loss=0.0003, acc=0.9998, iter_time=5.61s]
Epoch 0: 42%|████▏ | 5243/12384 [11:07:18<15:10:00, 7.65s/it, loss=0.0003, acc=0.9998, iter_time=5.61s]
Epoch 0: 42%|████▏ | 5243/12384 [11:07:25<15:10:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.57s]
Epoch 0: 42%|████▏ | 5244/12384 [11:07:25<15:11:10, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.57s]
Epoch 0: 42%|████▏ | 5244/12384 [11:07:33<15:11:10, 7.66s/it, loss=0.0001, acc=0.9998, iter_time=4.69s]
Epoch 0: 42%|████▏ | 5245/12384 [11:07:33<15:09:01, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=4.69s]
Epoch 0: 42%|████▏ | 5245/12384 [11:07:40<15:09:01, 7.64s/it, loss=0.0002, acc=0.9998, iter_time=7.48s]
Epoch 0: 42%|████▏ | 5246/12384 [11:07:40<15:07:47, 7.63s/it, loss=0.0002, acc=0.9998, iter_time=7.48s]
Epoch 0: 42%|████▏ | 5246/12384 [11:07:48<15:07:47, 7.63s/it, loss=0.0010, acc=0.9968, iter_time=8.21s]
Epoch 0: 42%|████▏ | 5247/12384 [11:07:48<15:10:53, 7.66s/it, loss=0.0010, acc=0.9968, iter_time=8.21s]
Epoch 0: 42%|████▏ | 5247/12384 [11:07:56<15:10:53, 7.66s/it, loss=0.0021, acc=0.9966, iter_time=10.64s]
Epoch 0: 42%|████▏ | 5248/12384 [11:07:56<15:09:07, 7.64s/it, loss=0.0021, acc=0.9966, iter_time=10.64s]
Epoch 0: 42%|████▏ | 5248/12384 [11:08:03<15:09:07, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.21s]
Epoch 0: 42%|████▏ | 5249/12384 [11:08:03<15:06:35, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.21s]
Epoch 0: 42%|████▏ | 5249/12384 [11:08:11<15:06:35, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.00s]
Epoch 0: 42%|████▏ | 5250/12384 [11:08:11<15:05:44, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.00s]
Epoch 0: 42%|████▏ | 5250/12384 [11:08:19<15:05:44, 7.62s/it, loss=0.0003, acc=0.9998, iter_time=7.20s]
Epoch 0: 42%|████▏ | 5251/12384 [11:08:19<15:05:13, 7.61s/it, loss=0.0003, acc=0.9998, iter_time=7.20s]
Epoch 0: 42%|████▏ | 5251/12384 [11:08:26<15:05:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 42%|████▏ | 5252/12384 [11:08:26<15:05:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 42%|████▏ | 5252/12384 [11:08:34<15:05:02, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.07s]
Epoch 0: 42%|████▏ | 5253/12384 [11:08:34<15:04:22, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.07s]
Epoch 0: 42%|████▏ | 5253/12384 [11:08:41<15:04:22, 7.61s/it, loss=0.0001, acc=0.9989, iter_time=10.14s]
Epoch 0: 42%|████▏ | 5254/12384 [11:08:41<15:04:18, 7.61s/it, loss=0.0001, acc=0.9989, iter_time=10.14s]
Epoch 0: 42%|████▏ | 5254/12384 [11:08:49<15:04:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 0: 42%|████▏ | 5255/12384 [11:08:49<15:03:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 0: 42%|████▏ | 5255/12384 [11:08:57<15:03:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.90s]
Epoch 0: 42%|████▏ | 5256/12384 [11:08:57<15:03:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.90s]
Epoch 0: 42%|████▏ | 5256/12384 [11:09:04<15:03:53, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.25s]
Epoch 0: 42%|████▏ | 5257/12384 [11:09:04<15:03:47, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.25s]
Epoch 0: 42%|████▏ | 5257/12384 [11:09:12<15:03:47, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=7.61s]
Epoch 0: 42%|████▏ | 5258/12384 [11:09:12<15:04:05, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=7.61s]
Epoch 0: 42%|████▏ | 5258/12384 [11:09:19<15:04:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 42%|████▏ | 5259/12384 [11:09:19<15:03:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 42%|████▏ | 5259/12384 [11:09:27<15:03:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 42%|████▏ | 5260/12384 [11:09:27<15:03:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 42%|████▏ | 5260/12384 [11:09:35<15:03:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 0: 42%|████▏ | 5261/12384 [11:09:35<15:03:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 0: 42%|████▏ | 5261/12384 [11:09:42<15:03:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 0: 42%|████▏ | 5262/12384 [11:09:42<15:03:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 0: 42%|████▏ | 5262/12384 [11:09:50<15:03:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 0: 42%|████▏ | 5263/12384 [11:09:50<15:04:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 0: 42%|████▏ | 5263/12384 [11:09:58<15:04:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.82s]
Epoch 0: 43%|████▎ | 5264/12384 [11:09:58<15:02:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.82s]
Epoch 0: 43%|████▎ | 5264/12384 [11:10:05<15:02:27, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=6.71s]
Epoch 0: 43%|████▎ | 5265/12384 [11:10:05<15:01:45, 7.60s/it, loss=0.0001, acc=0.9998, iter_time=6.71s]
Epoch 0: 43%|████▎ | 5265/12384 [11:10:13<15:01:45, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.67s]
Epoch 0: 43%|████▎ | 5266/12384 [11:10:13<15:13:33, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.67s]
Epoch 0: 43%|████▎ | 5266/12384 [11:10:21<15:13:33, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.80s]
Epoch 0: 43%|████▎ | 5267/12384 [11:10:21<15:10:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.80s]
Epoch 0: 43%|████▎ | 5267/12384 [11:10:28<15:10:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 0: 43%|████▎ | 5268/12384 [11:10:28<15:07:25, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 0: 43%|████▎ | 5268/12384 [11:10:36<15:07:25, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 0: 43%|████▎ | 5269/12384 [11:10:36<15:05:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 0: 43%|████▎ | 5269/12384 [11:10:43<15:05:53, 7.64s/it, loss=0.0004, acc=0.9980, iter_time=7.62s]
Epoch 0: 43%|████▎ | 5270/12384 [11:10:43<15:05:04, 7.63s/it, loss=0.0004, acc=0.9980, iter_time=7.62s]
Epoch 0: 43%|████▎ | 5270/12384 [11:10:51<15:05:04, 7.63s/it, loss=0.0021, acc=0.9948, iter_time=7.62s]
Epoch 0: 43%|████▎ | 5271/12384 [11:10:51<15:03:44, 7.62s/it, loss=0.0021, acc=0.9948, iter_time=7.62s]
Epoch 0: 43%|████▎ | 5271/12384 [11:10:59<15:03:44, 7.62s/it, loss=0.0008, acc=0.9960, iter_time=7.99s]
Epoch 0: 43%|████▎ | 5272/12384 [11:10:59<15:03:45, 7.62s/it, loss=0.0008, acc=0.9960, iter_time=7.99s]
Epoch 0: 43%|████▎ | 5272/12384 [11:11:06<15:03:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 43%|████▎ | 5273/12384 [11:11:06<15:03:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 43%|████▎ | 5273/12384 [11:11:14<15:03:18, 7.62s/it, loss=0.0004, acc=1.0000, iter_time=4.31s]
Epoch 0: 43%|████▎ | 5274/12384 [11:11:14<15:03:09, 7.62s/it, loss=0.0004, acc=1.0000, iter_time=4.31s]
Epoch 0: 43%|████▎ | 5274/12384 [11:11:22<15:03:09, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.92s]
Epoch 0: 43%|████▎ | 5275/12384 [11:11:22<15:01:48, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.92s]
Epoch 0: 43%|████▎ | 5275/12384 [11:11:29<15:01:48, 7.61s/it, loss=0.0005, acc=0.9998, iter_time=7.59s]
Epoch 0: 43%|████▎ | 5276/12384 [11:11:29<15:00:40, 7.60s/it, loss=0.0005, acc=0.9998, iter_time=7.59s]
Epoch 0: 43%|████▎ | 5276/12384 [11:11:37<15:00:40, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 43%|████▎ | 5277/12384 [11:11:37<15:03:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 43%|████▎ | 5277/12384 [11:11:44<15:03:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.40s]
Epoch 0: 43%|████▎ | 5278/12384 [11:11:44<15:02:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.40s]
Epoch 0: 43%|████▎ | 5278/12384 [11:11:52<15:02:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 0: 43%|████▎ | 5279/12384 [11:11:52<15:02:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 0: 43%|████▎ | 5279/12384 [11:12:00<15:02:28, 7.62s/it, loss=0.0006, acc=0.9984, iter_time=11.58s]
Epoch 0: 43%|████▎ | 5280/12384 [11:12:00<15:01:20, 7.61s/it, loss=0.0006, acc=0.9984, iter_time=11.58s]
Epoch 0: 43%|████▎ | 5280/12384 [11:12:07<15:01:20, 7.61s/it, loss=0.0007, acc=0.9998, iter_time=5.35s]
Epoch 0: 43%|████▎ | 5281/12384 [11:12:07<15:00:21, 7.61s/it, loss=0.0007, acc=0.9998, iter_time=5.35s]
Epoch 0: 43%|████▎ | 5281/12384 [11:12:15<15:00:21, 7.61s/it, loss=0.0007, acc=0.9968, iter_time=9.46s]
Epoch 0: 43%|████▎ | 5282/12384 [11:12:15<15:00:20, 7.61s/it, loss=0.0007, acc=0.9968, iter_time=9.46s]
Epoch 0: 43%|████▎ | 5282/12384 [11:12:22<15:00:20, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.02s]
Epoch 0: 43%|████▎ | 5283/12384 [11:12:22<15:00:02, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.02s]
Epoch 0: 43%|████▎ | 5283/12384 [11:12:30<15:00:02, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 0: 43%|████▎ | 5284/12384 [11:12:30<15:00:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 0: 43%|████▎ | 5284/12384 [11:12:38<15:00:21, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.40s]
Epoch 0: 43%|████▎ | 5285/12384 [11:12:38<14:59:51, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.40s]
Epoch 0: 43%|████▎ | 5285/12384 [11:12:45<14:59:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.05s]
Epoch 0: 43%|████▎ | 5286/12384 [11:12:45<15:00:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.05s]
Epoch 0: 43%|████▎ | 5286/12384 [11:12:53<15:00:26, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.17s]
Epoch 0: 43%|████▎ | 5287/12384 [11:12:53<15:00:37, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.17s]
Epoch 0: 43%|████▎ | 5287/12384 [11:13:00<15:00:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 43%|████▎ | 5288/12384 [11:13:00<14:59:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 43%|████▎ | 5288/12384 [11:13:08<14:59:41, 7.61s/it, loss=0.0014, acc=0.9978, iter_time=7.65s]
Epoch 0: 43%|████▎ | 5289/12384 [11:13:08<14:59:14, 7.60s/it, loss=0.0014, acc=0.9978, iter_time=7.65s]
Epoch 0: 43%|████▎ | 5289/12384 [11:13:16<14:59:14, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 43%|████▎ | 5290/12384 [11:13:16<14:58:58, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 43%|████▎ | 5290/12384 [11:13:23<14:58:58, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 43%|████▎ | 5291/12384 [11:13:23<14:59:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 43%|████▎ | 5291/12384 [11:13:31<14:59:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 43%|████▎ | 5292/12384 [11:13:31<14:59:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 43%|████▎ | 5292/12384 [11:13:39<14:59:57, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=7.65s]
Epoch 0: 43%|████▎ | 5293/12384 [11:13:39<15:11:22, 7.71s/it, loss=0.0003, acc=1.0000, iter_time=7.65s]
Epoch 0: 43%|████▎ | 5293/12384 [11:13:46<15:11:22, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 43%|████▎ | 5294/12384 [11:13:46<15:07:42, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 43%|████▎ | 5294/12384 [11:13:54<15:07:42, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=5.81s]
Epoch 0: 43%|████▎ | 5295/12384 [11:13:54<15:05:32, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=5.81s]
Epoch 0: 43%|████▎ | 5295/12384 [11:14:02<15:05:32, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.82s]
Epoch 0: 43%|████▎ | 5296/12384 [11:14:02<15:03:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.82s]
Epoch 0: 43%|████▎ | 5296/12384 [11:14:09<15:03:50, 7.65s/it, loss=0.0008, acc=0.9967, iter_time=4.10s]
Epoch 0: 43%|████▎ | 5297/12384 [11:14:09<15:02:43, 7.64s/it, loss=0.0008, acc=0.9967, iter_time=4.10s]
Epoch 0: 43%|████▎ | 5297/12384 [11:14:17<15:02:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 0: 43%|████▎ | 5298/12384 [11:14:17<15:00:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 0: 43%|████▎ | 5298/12384 [11:14:25<15:00:44, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.59s]
Epoch 0: 43%|████▎ | 5299/12384 [11:14:25<15:00:05, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.59s]
Epoch 0: 43%|████▎ | 5299/12384 [11:14:32<15:00:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 0: 43%|████▎ | 5300/12384 [11:14:32<14:59:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 0: 43%|████▎ | 5300/12384 [11:14:40<14:59:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 43%|████▎ | 5301/12384 [11:14:40<14:58:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 43%|████▎ | 5301/12384 [11:14:47<14:58:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 0: 43%|████▎ | 5302/12384 [11:14:47<14:58:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 0: 43%|████▎ | 5302/12384 [11:14:55<14:58:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 0: 43%|████▎ | 5303/12384 [11:14:55<14:57:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 0: 43%|████▎ | 5303/12384 [11:15:03<14:57:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 0: 43%|████▎ | 5304/12384 [11:15:03<14:56:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 0: 43%|████▎ | 5304/12384 [11:15:10<14:56:38, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 43%|████▎ | 5305/12384 [11:15:10<14:58:42, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 43%|████▎ | 5305/12384 [11:15:18<14:58:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.63s]
Epoch 0: 43%|████▎ | 5306/12384 [11:15:18<14:58:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.63s]
Epoch 0: 43%|████▎ | 5306/12384 [11:15:26<14:58:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.98s]
Epoch 0: 43%|████▎ | 5307/12384 [11:15:26<15:08:00, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.98s]
Epoch 0: 43%|████▎ | 5307/12384 [11:15:33<15:08:00, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 43%|████▎ | 5308/12384 [11:15:33<15:04:11, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 43%|████▎ | 5308/12384 [11:15:41<15:04:11, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 43%|████▎ | 5309/12384 [11:15:41<15:02:55, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 43%|████▎ | 5309/12384 [11:15:49<15:02:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 43%|████▎ | 5310/12384 [11:15:49<15:01:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 43%|████▎ | 5310/12384 [11:15:56<15:01:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 0: 43%|████▎ | 5311/12384 [11:15:56<14:58:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 0: 43%|████▎ | 5311/12384 [11:16:04<14:58:45, 7.62s/it, loss=0.0039, acc=0.9954, iter_time=8.85s]
Epoch 0: 43%|████▎ | 5312/12384 [11:16:04<14:58:35, 7.62s/it, loss=0.0039, acc=0.9954, iter_time=8.85s]
Epoch 0: 43%|████▎ | 5312/12384 [11:16:11<14:58:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 0: 43%|████▎ | 5313/12384 [11:16:11<14:57:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 0: 43%|████▎ | 5313/12384 [11:16:19<14:57:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 0: 43%|████▎ | 5314/12384 [11:16:19<14:56:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 0: 43%|████▎ | 5314/12384 [11:16:27<14:56:44, 7.61s/it, loss=0.0001, acc=0.9996, iter_time=11.14s]
Epoch 0: 43%|████▎ | 5315/12384 [11:16:27<14:57:09, 7.61s/it, loss=0.0001, acc=0.9996, iter_time=11.14s]
Epoch 0: 43%|████▎ | 5315/12384 [11:16:34<14:57:09, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 43%|████▎ | 5316/12384 [11:16:34<14:56:50, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 43%|████▎ | 5316/12384 [11:16:42<14:56:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 0: 43%|████▎ | 5317/12384 [11:16:42<14:55:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 0: 43%|████▎ | 5317/12384 [11:16:49<14:55:57, 7.61s/it, loss=0.0011, acc=0.9971, iter_time=10.75s]
Epoch 0: 43%|████▎ | 5318/12384 [11:16:49<14:56:24, 7.61s/it, loss=0.0011, acc=0.9971, iter_time=10.75s]
Epoch 0: 43%|████▎ | 5318/12384 [11:16:57<14:56:24, 7.61s/it, loss=0.0006, acc=0.9974, iter_time=7.64s]
Epoch 0: 43%|████▎ | 5319/12384 [11:16:57<15:07:48, 7.71s/it, loss=0.0006, acc=0.9974, iter_time=7.64s]
Epoch 0: 43%|████▎ | 5319/12384 [11:17:05<15:07:48, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 0: 43%|████▎ | 5320/12384 [11:17:05<15:04:14, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 0: 43%|████▎ | 5320/12384 [11:17:13<15:04:14, 7.68s/it, loss=0.0003, acc=0.9980, iter_time=7.21s]
Epoch 0: 43%|████▎ | 5321/12384 [11:17:13<15:00:48, 7.65s/it, loss=0.0003, acc=0.9980, iter_time=7.21s]
Epoch 0: 43%|████▎ | 5321/12384 [11:17:20<15:00:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 43%|████▎ | 5322/12384 [11:17:20<14:59:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 43%|████▎ | 5322/12384 [11:17:28<14:59:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 43%|████▎ | 5323/12384 [11:17:28<14:58:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 43%|████▎ | 5323/12384 [11:17:35<14:58:07, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 43%|████▎ | 5324/12384 [11:17:35<14:57:21, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 43%|████▎ | 5324/12384 [11:17:43<14:57:21, 7.63s/it, loss=0.0001, acc=0.9999, iter_time=7.61s]
Epoch 0: 43%|████▎ | 5325/12384 [11:17:43<14:56:58, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=7.61s]
Epoch 0: 43%|████▎ | 5325/12384 [11:17:51<14:56:58, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 43%|████▎ | 5326/12384 [11:17:51<14:55:57, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 43%|████▎ | 5326/12384 [11:17:58<14:55:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 43%|████▎ | 5327/12384 [11:17:58<14:55:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 43%|████▎ | 5327/12384 [11:18:06<14:55:31, 7.61s/it, loss=0.0003, acc=0.9985, iter_time=7.58s]
Epoch 0: 43%|████▎ | 5328/12384 [11:18:06<14:55:26, 7.61s/it, loss=0.0003, acc=0.9985, iter_time=7.58s]
Epoch 0: 43%|████▎ | 5328/12384 [11:18:13<14:55:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 43%|████▎ | 5329/12384 [11:18:13<14:55:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 43%|████▎ | 5329/12384 [11:18:21<14:55:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 43%|████▎ | 5330/12384 [11:18:21<14:57:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 43%|████▎ | 5330/12384 [11:18:29<14:57:27, 7.63s/it, loss=0.0007, acc=0.9972, iter_time=7.66s]
Epoch 0: 43%|████▎ | 5331/12384 [11:18:29<14:56:15, 7.62s/it, loss=0.0007, acc=0.9972, iter_time=7.66s]
Epoch 0: 43%|████▎ | 5331/12384 [11:18:36<14:56:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 43%|████▎ | 5332/12384 [11:18:36<14:55:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 43%|████▎ | 5332/12384 [11:18:44<14:55:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 43%|████▎ | 5333/12384 [11:18:44<14:55:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 43%|████▎ | 5333/12384 [11:18:52<14:55:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 43%|████▎ | 5334/12384 [11:18:52<15:05:35, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 43%|████▎ | 5334/12384 [11:18:59<15:05:35, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 0: 43%|████▎ | 5335/12384 [11:18:59<15:01:36, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 0: 43%|████▎ | 5335/12384 [11:19:07<15:01:36, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.14s]
Epoch 0: 43%|████▎ | 5336/12384 [11:19:07<14:59:34, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.14s]
Epoch 0: 43%|████▎ | 5336/12384 [11:19:15<14:59:34, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 43%|████▎ | 5337/12384 [11:19:15<14:58:01, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 43%|████▎ | 5337/12384 [11:19:22<14:58:01, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.58s]
Epoch 0: 43%|████▎ | 5338/12384 [11:19:22<14:56:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.58s]
Epoch 0: 43%|████▎ | 5338/12384 [11:19:30<14:56:57, 7.64s/it, loss=0.0004, acc=0.9979, iter_time=8.45s]
Epoch 0: 43%|████▎ | 5339/12384 [11:19:30<14:54:50, 7.62s/it, loss=0.0004, acc=0.9979, iter_time=8.45s]
Epoch 0: 43%|████▎ | 5339/12384 [11:19:37<14:54:50, 7.62s/it, loss=0.0005, acc=0.9982, iter_time=6.50s]
Epoch 0: 43%|████▎ | 5340/12384 [11:19:37<14:54:19, 7.62s/it, loss=0.0005, acc=0.9982, iter_time=6.50s]
Epoch 0: 43%|████▎ | 5340/12384 [11:19:45<14:54:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 0: 43%|████▎ | 5341/12384 [11:19:45<14:53:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 0: 43%|████▎ | 5341/12384 [11:19:53<14:53:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 0: 43%|████▎ | 5342/12384 [11:19:53<14:53:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 0: 43%|████▎ | 5342/12384 [11:20:00<14:53:20, 7.61s/it, loss=0.0003, acc=0.9970, iter_time=7.60s]
Epoch 0: 43%|████▎ | 5343/12384 [11:20:00<14:52:45, 7.61s/it, loss=0.0003, acc=0.9970, iter_time=7.60s]
Epoch 0: 43%|████▎ | 5343/12384 [11:20:08<14:52:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 43%|████▎ | 5344/12384 [11:20:08<14:53:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 43%|████▎ | 5344/12384 [11:20:16<14:53:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.66s]
Epoch 0: 43%|████▎ | 5345/12384 [11:20:16<15:03:26, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.66s]
Epoch 0: 43%|████▎ | 5345/12384 [11:20:23<15:03:26, 7.70s/it, loss=0.0004, acc=0.9983, iter_time=10.91s]
Epoch 0: 43%|████▎ | 5346/12384 [11:20:23<14:59:48, 7.67s/it, loss=0.0004, acc=0.9983, iter_time=10.91s]
Epoch 0: 43%|████▎ | 5346/12384 [11:20:31<14:59:48, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.36s]
Epoch 0: 43%|████▎ | 5347/12384 [11:20:31<14:57:49, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.36s]
Epoch 0: 43%|████▎ | 5347/12384 [11:20:39<14:57:49, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.86s]
Epoch 0: 43%|████▎ | 5348/12384 [11:20:39<14:57:00, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.86s]
Epoch 0: 43%|████▎ | 5348/12384 [11:20:46<14:57:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 0: 43%|████▎ | 5349/12384 [11:20:46<14:55:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 0: 43%|████▎ | 5349/12384 [11:20:54<14:55:24, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=9.11s]
Epoch 0: 43%|████▎ | 5350/12384 [11:20:54<14:53:53, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.11s]
Epoch 0: 43%|████▎ | 5350/12384 [11:21:02<14:53:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 43%|████▎ | 5351/12384 [11:21:02<14:54:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 43%|████▎ | 5351/12384 [11:21:09<14:54:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 43%|████▎ | 5352/12384 [11:21:09<14:52:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 43%|████▎ | 5352/12384 [11:21:17<14:52:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.87s]
Epoch 0: 43%|████▎ | 5353/12384 [11:21:17<14:52:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.87s]
Epoch 0: 43%|████▎ | 5353/12384 [11:21:24<14:52:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.22s]
Epoch 0: 43%|████▎ | 5354/12384 [11:21:24<14:52:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.22s]
Epoch 0: 43%|████▎ | 5354/12384 [11:21:32<14:52:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 0: 43%|████▎ | 5355/12384 [11:21:32<14:52:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 0: 43%|████▎ | 5355/12384 [11:21:40<14:52:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 0: 43%|████▎ | 5356/12384 [11:21:40<14:51:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 0: 43%|████▎ | 5356/12384 [11:21:47<14:51:59, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 43%|████▎ | 5357/12384 [11:21:47<14:51:24, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 43%|████▎ | 5357/12384 [11:21:55<14:51:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 0: 43%|████▎ | 5358/12384 [11:21:55<14:51:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 0: 43%|████▎ | 5358/12384 [11:22:02<14:51:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 0: 43%|████▎ | 5359/12384 [11:22:02<14:51:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 0: 43%|████▎ | 5359/12384 [11:22:10<14:51:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 43%|████▎ | 5360/12384 [11:22:10<14:51:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 43%|████▎ | 5360/12384 [11:22:18<14:51:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 0: 43%|████▎ | 5361/12384 [11:22:18<15:00:20, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 0: 43%|████▎ | 5361/12384 [11:22:26<15:00:20, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 43%|████▎ | 5362/12384 [11:22:26<15:00:06, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 43%|████▎ | 5362/12384 [11:22:33<15:00:06, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 43%|████▎ | 5363/12384 [11:22:33<14:56:49, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 43%|████▎ | 5363/12384 [11:22:41<14:56:49, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 43%|████▎ | 5364/12384 [11:22:41<14:57:25, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 43%|████▎ | 5364/12384 [11:22:48<14:57:25, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.63s]
Epoch 0: 43%|████▎ | 5365/12384 [11:22:48<14:55:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.63s]
Epoch 0: 43%|████▎ | 5365/12384 [11:22:56<14:55:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.61s]
Epoch 0: 43%|████▎ | 5366/12384 [11:22:56<14:53:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.61s]
Epoch 0: 43%|████▎ | 5366/12384 [11:23:04<14:53:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 43%|████▎ | 5367/12384 [11:23:04<14:52:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 43%|████▎ | 5367/12384 [11:23:11<14:52:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 43%|████▎ | 5368/12384 [11:23:11<14:51:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 43%|████▎ | 5368/12384 [11:23:19<14:51:28, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.61s]
Epoch 0: 43%|████▎ | 5369/12384 [11:23:19<14:51:10, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.61s]
Epoch 0: 43%|████▎ | 5369/12384 [11:23:27<14:51:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 43%|████▎ | 5370/12384 [11:23:27<14:52:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 43%|████▎ | 5370/12384 [11:23:35<14:52:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.70s]
Epoch 0: 43%|████▎ | 5371/12384 [11:23:35<15:04:20, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=5.70s]
Epoch 0: 43%|████▎ | 5371/12384 [11:23:42<15:04:20, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=10.30s]
Epoch 0: 43%|████▎ | 5372/12384 [11:23:42<15:02:30, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.30s]
Epoch 0: 43%|████▎ | 5372/12384 [11:23:50<15:02:30, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 43%|████▎ | 5373/12384 [11:23:50<14:58:25, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 43%|████▎ | 5373/12384 [11:23:57<14:58:25, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 43%|████▎ | 5374/12384 [11:23:57<14:54:53, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 43%|████▎ | 5374/12384 [11:24:05<14:54:53, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 0: 43%|████▎ | 5375/12384 [11:24:05<14:53:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 0: 43%|████▎ | 5375/12384 [11:24:13<14:53:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.88s]
Epoch 0: 43%|████▎ | 5376/12384 [11:24:13<14:52:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.88s]
Epoch 0: 43%|████▎ | 5376/12384 [11:24:20<14:52:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 43%|████▎ | 5377/12384 [11:24:20<14:50:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 43%|████▎ | 5377/12384 [11:24:28<14:50:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 43%|████▎ | 5378/12384 [11:24:28<14:50:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 43%|████▎ | 5378/12384 [11:24:36<14:50:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 0: 43%|████▎ | 5379/12384 [11:24:36<14:48:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 0: 43%|████▎ | 5379/12384 [11:24:43<14:48:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.19s]
Epoch 0: 43%|████▎ | 5380/12384 [11:24:43<14:48:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.19s]
Epoch 0: 43%|████▎ | 5380/12384 [11:24:51<14:48:56, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=11.21s]
Epoch 0: 43%|████▎ | 5381/12384 [11:24:51<14:50:05, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=11.21s]
Epoch 0: 43%|████▎ | 5381/12384 [11:24:58<14:50:05, 7.63s/it, loss=0.0021, acc=0.9968, iter_time=4.05s]
Epoch 0: 43%|████▎ | 5382/12384 [11:24:58<14:48:43, 7.62s/it, loss=0.0021, acc=0.9968, iter_time=4.05s]
Epoch 0: 43%|████▎ | 5382/12384 [11:25:06<14:48:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 0: 43%|████▎ | 5383/12384 [11:25:06<14:51:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 0: 43%|████▎ | 5383/12384 [11:25:14<14:51:05, 7.64s/it, loss=0.0022, acc=0.9919, iter_time=9.61s]
Epoch 0: 43%|████▎ | 5384/12384 [11:25:14<14:49:51, 7.63s/it, loss=0.0022, acc=0.9919, iter_time=9.61s]
Epoch 0: 43%|████▎ | 5384/12384 [11:25:21<14:49:51, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 0: 43%|████▎ | 5385/12384 [11:25:21<14:48:37, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 0: 43%|████▎ | 5385/12384 [11:25:29<14:48:37, 7.62s/it, loss=0.0011, acc=0.9974, iter_time=4.75s]
Epoch 0: 43%|████▎ | 5386/12384 [11:25:29<14:48:39, 7.62s/it, loss=0.0011, acc=0.9974, iter_time=4.75s]
Epoch 0: 43%|████▎ | 5386/12384 [11:25:37<14:48:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.80s]
Epoch 0: 43%|████▎ | 5387/12384 [11:25:37<14:58:53, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.80s]
Epoch 0: 43%|████▎ | 5387/12384 [11:25:44<14:58:53, 7.71s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 44%|████▎ | 5388/12384 [11:25:44<14:56:29, 7.69s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 44%|████▎ | 5388/12384 [11:25:52<14:56:29, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=6.53s]
Epoch 0: 44%|████▎ | 5389/12384 [11:25:52<14:53:59, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=6.53s]
Epoch 0: 44%|████▎ | 5389/12384 [11:26:00<14:53:59, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=8.72s]
Epoch 0: 44%|████▎ | 5390/12384 [11:26:00<14:51:02, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.72s]
Epoch 0: 44%|████▎ | 5390/12384 [11:26:07<14:51:02, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 44%|████▎ | 5391/12384 [11:26:07<14:49:48, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 44%|████▎ | 5391/12384 [11:26:15<14:49:48, 7.63s/it, loss=0.0007, acc=0.9972, iter_time=7.55s]
Epoch 0: 44%|████▎ | 5392/12384 [11:26:15<14:48:58, 7.63s/it, loss=0.0007, acc=0.9972, iter_time=7.55s]
Epoch 0: 44%|████▎ | 5392/12384 [11:26:22<14:48:58, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 44%|████▎ | 5393/12384 [11:26:22<14:47:39, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 44%|████▎ | 5393/12384 [11:26:30<14:47:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 44%|████▎ | 5394/12384 [11:26:30<14:47:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 44%|████▎ | 5394/12384 [11:26:38<14:47:13, 7.62s/it, loss=0.0002, acc=0.9992, iter_time=5.02s]
Epoch 0: 44%|████▎ | 5395/12384 [11:26:38<14:46:57, 7.61s/it, loss=0.0002, acc=0.9992, iter_time=5.02s]
Epoch 0: 44%|████▎ | 5395/12384 [11:26:45<14:46:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 0: 44%|████▎ | 5396/12384 [11:26:45<14:46:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 0: 44%|████▎ | 5396/12384 [11:26:53<14:46:37, 7.61s/it, loss=0.0004, acc=0.9992, iter_time=9.65s]
Epoch 0: 44%|████▎ | 5397/12384 [11:26:53<14:58:44, 7.72s/it, loss=0.0004, acc=0.9992, iter_time=9.65s]
Epoch 0: 44%|████▎ | 5397/12384 [11:27:01<14:58:44, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=3.98s]
Epoch 0: 44%|████▎ | 5398/12384 [11:27:01<14:55:08, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=3.98s]
Epoch 0: 44%|████▎ | 5398/12384 [11:27:09<14:55:08, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=11.56s]
Epoch 0: 44%|████▎ | 5399/12384 [11:27:09<14:52:35, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=11.56s]
Epoch 0: 44%|████▎ | 5399/12384 [11:27:16<14:52:35, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 44%|████▎ | 5400/12384 [11:27:16<14:50:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 44%|████▎ | 5400/12384 [11:27:24<14:50:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 44%|████▎ | 5401/12384 [11:27:24<14:48:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 44%|████▎ | 5401/12384 [11:27:31<14:48:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 0: 44%|████▎ | 5402/12384 [11:27:31<14:46:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 0: 44%|████▎ | 5402/12384 [11:27:39<14:46:17, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.62s]
Epoch 0: 44%|████▎ | 5403/12384 [11:27:39<14:46:26, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.62s]
Epoch 0: 44%|████▎ | 5403/12384 [11:27:47<14:46:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.89s]
Epoch 0: 44%|████▎ | 5404/12384 [11:27:47<14:45:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.89s]
Epoch 0: 44%|████▎ | 5404/12384 [11:27:54<14:45:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 0: 44%|████▎ | 5405/12384 [11:27:54<14:44:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 0: 44%|████▎ | 5405/12384 [11:28:02<14:44:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.99s]
Epoch 0: 44%|████▎ | 5406/12384 [11:28:02<14:44:08, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=3.99s]
Epoch 0: 44%|████▎ | 5406/12384 [11:28:09<14:44:08, 7.60s/it, loss=0.0005, acc=1.0000, iter_time=8.35s]
Epoch 0: 44%|████▎ | 5407/12384 [11:28:09<14:44:58, 7.61s/it, loss=0.0005, acc=1.0000, iter_time=8.35s]
Epoch 0: 44%|████▎ | 5407/12384 [11:28:17<14:44:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.85s]
Epoch 0: 44%|████▎ | 5408/12384 [11:28:17<14:44:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.85s]
Epoch 0: 44%|████▎ | 5408/12384 [11:28:25<14:44:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.78s]
Epoch 0: 44%|████▎ | 5409/12384 [11:28:25<14:44:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.78s]
Epoch 0: 44%|████▎ | 5409/12384 [11:28:32<14:44:45, 7.61s/it, loss=0.0003, acc=0.9998, iter_time=9.06s]
Epoch 0: 44%|████▎ | 5410/12384 [11:28:32<14:44:59, 7.61s/it, loss=0.0003, acc=0.9998, iter_time=9.06s]
Epoch 0: 44%|████▎ | 5410/12384 [11:28:40<14:44:59, 7.61s/it, loss=0.0007, acc=0.9963, iter_time=7.35s]
Epoch 0: 44%|████▎ | 5411/12384 [11:28:40<14:46:06, 7.62s/it, loss=0.0007, acc=0.9963, iter_time=7.35s]
Epoch 0: 44%|████▎ | 5411/12384 [11:28:47<14:46:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 0: 44%|████▎ | 5412/12384 [11:28:47<14:45:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 0: 44%|████▎ | 5412/12384 [11:28:55<14:45:02, 7.62s/it, loss=0.0002, acc=0.9992, iter_time=6.06s]
Epoch 0: 44%|████▎ | 5413/12384 [11:28:55<14:44:44, 7.62s/it, loss=0.0002, acc=0.9992, iter_time=6.06s]
Epoch 0: 44%|████▎ | 5413/12384 [11:29:03<14:44:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 44%|████▎ | 5414/12384 [11:29:03<14:44:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 44%|████▎ | 5414/12384 [11:29:10<14:44:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 0: 44%|████▎ | 5415/12384 [11:29:10<14:43:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 0: 44%|████▎ | 5415/12384 [11:29:18<14:43:42, 7.61s/it, loss=0.0003, acc=0.9985, iter_time=7.99s]
Epoch 0: 44%|████▎ | 5416/12384 [11:29:18<14:43:32, 7.61s/it, loss=0.0003, acc=0.9985, iter_time=7.99s]
Epoch 0: 44%|████▎ | 5416/12384 [11:29:25<14:43:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.86s]
Epoch 0: 44%|████▎ | 5417/12384 [11:29:25<14:43:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.86s]
Epoch 0: 44%|████▎ | 5417/12384 [11:29:33<14:43:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.97s]
Epoch 0: 44%|████▍ | 5418/12384 [11:29:33<14:44:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.97s]
Epoch 0: 44%|████▍ | 5418/12384 [11:29:41<14:44:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 44%|████▍ | 5419/12384 [11:29:41<14:43:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 44%|████▍ | 5419/12384 [11:29:48<14:43:02, 7.61s/it, loss=0.0005, acc=0.9998, iter_time=7.60s]
Epoch 0: 44%|████▍ | 5420/12384 [11:29:48<14:42:57, 7.61s/it, loss=0.0005, acc=0.9998, iter_time=7.60s]
Epoch 0: 44%|████▍ | 5420/12384 [11:29:56<14:42:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 0: 44%|████▍ | 5421/12384 [11:29:56<14:42:05, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 0: 44%|████▍ | 5421/12384 [11:30:03<14:42:05, 7.60s/it, loss=0.0001, acc=0.9999, iter_time=8.44s]
Epoch 0: 44%|████▍ | 5422/12384 [11:30:03<14:42:01, 7.60s/it, loss=0.0001, acc=0.9999, iter_time=8.44s]
Epoch 0: 44%|████▍ | 5422/12384 [11:30:11<14:42:01, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=5.82s]
Epoch 0: 44%|████▍ | 5423/12384 [11:30:11<14:42:30, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.82s]
Epoch 0: 44%|████▍ | 5423/12384 [11:30:19<14:42:30, 7.61s/it, loss=0.0005, acc=0.9978, iter_time=9.84s]
Epoch 0: 44%|████▍ | 5424/12384 [11:30:19<14:54:26, 7.71s/it, loss=0.0005, acc=0.9978, iter_time=9.84s]
Epoch 0: 44%|████▍ | 5424/12384 [11:30:27<14:54:26, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.51s]
Epoch 0: 44%|████▍ | 5425/12384 [11:30:27<14:51:28, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.51s]
Epoch 0: 44%|████▍ | 5425/12384 [11:30:34<14:51:28, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 44%|████▍ | 5426/12384 [11:30:34<14:48:04, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 44%|████▍ | 5426/12384 [11:30:42<14:48:04, 7.66s/it, loss=0.0003, acc=0.9981, iter_time=5.31s]
Epoch 0: 44%|████▍ | 5427/12384 [11:30:42<14:45:42, 7.64s/it, loss=0.0003, acc=0.9981, iter_time=5.31s]
Epoch 0: 44%|████▍ | 5427/12384 [11:30:49<14:45:42, 7.64s/it, loss=0.0007, acc=0.9975, iter_time=9.89s]
Epoch 0: 44%|████▍ | 5428/12384 [11:30:49<14:44:12, 7.63s/it, loss=0.0007, acc=0.9975, iter_time=9.89s]
Epoch 0: 44%|████▍ | 5428/12384 [11:30:57<14:44:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 44%|████▍ | 5429/12384 [11:30:57<14:43:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 44%|████▍ | 5429/12384 [11:31:05<14:43:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 0: 44%|████▍ | 5430/12384 [11:31:05<14:42:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 0: 44%|████▍ | 5430/12384 [11:31:12<14:42:56, 7.62s/it, loss=0.0007, acc=0.9975, iter_time=7.88s]
Epoch 0: 44%|████▍ | 5431/12384 [11:31:12<14:42:37, 7.62s/it, loss=0.0007, acc=0.9975, iter_time=7.88s]
Epoch 0: 44%|████▍ | 5431/12384 [11:31:20<14:42:37, 7.62s/it, loss=0.0003, acc=0.9998, iter_time=9.07s]
Epoch 0: 44%|████▍ | 5432/12384 [11:31:20<14:42:20, 7.62s/it, loss=0.0003, acc=0.9998, iter_time=9.07s]
Epoch 0: 44%|████▍ | 5432/12384 [11:31:27<14:42:20, 7.62s/it, loss=0.0007, acc=0.9997, iter_time=6.43s]
Epoch 0: 44%|████▍ | 5433/12384 [11:31:27<14:41:05, 7.61s/it, loss=0.0007, acc=0.9997, iter_time=6.43s]
Epoch 0: 44%|████▍ | 5433/12384 [11:31:35<14:41:05, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.81s]
Epoch 0: 44%|████▍ | 5434/12384 [11:31:35<14:41:33, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.81s]
Epoch 0: 44%|████▍ | 5434/12384 [11:31:43<14:41:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 0: 44%|████▍ | 5435/12384 [11:31:43<14:41:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 0: 44%|████▍ | 5435/12384 [11:31:50<14:41:25, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.10s]
Epoch 0: 44%|████▍ | 5436/12384 [11:31:50<14:41:19, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.10s]
Epoch 0: 44%|████▍ | 5436/12384 [11:31:58<14:41:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 44%|████▍ | 5437/12384 [11:31:58<14:41:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 44%|████▍ | 5437/12384 [11:32:06<14:41:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 44%|████▍ | 5438/12384 [11:32:06<14:44:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 44%|████▍ | 5438/12384 [11:32:14<14:44:46, 7.64s/it, loss=0.0006, acc=0.9977, iter_time=8.02s]
Epoch 0: 44%|████▍ | 5439/12384 [11:32:14<14:53:53, 7.72s/it, loss=0.0006, acc=0.9977, iter_time=8.02s]
Epoch 0: 44%|████▍ | 5439/12384 [11:32:21<14:53:53, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 44%|████▍ | 5440/12384 [11:32:21<14:50:25, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 44%|████▍ | 5440/12384 [11:32:29<14:50:25, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.55s]
Epoch 0: 44%|████▍ | 5441/12384 [11:32:29<14:47:42, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.55s]
Epoch 0: 44%|████▍ | 5441/12384 [11:32:36<14:47:42, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 0: 44%|████▍ | 5442/12384 [11:32:36<14:45:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 0: 44%|████▍ | 5442/12384 [11:32:44<14:45:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.20s]
Epoch 0: 44%|████▍ | 5443/12384 [11:32:44<14:43:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.20s]
Epoch 0: 44%|████▍ | 5443/12384 [11:32:52<14:43:50, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=11.00s]
Epoch 0: 44%|████▍ | 5444/12384 [11:32:52<14:43:04, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=11.00s]
Epoch 0: 44%|████▍ | 5444/12384 [11:32:59<14:43:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 44%|████▍ | 5445/12384 [11:32:59<14:43:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 44%|████▍ | 5445/12384 [11:33:07<14:43:53, 7.64s/it, loss=0.0039, acc=1.0000, iter_time=4.31s]
Epoch 0: 44%|████▍ | 5446/12384 [11:33:07<14:46:18, 7.66s/it, loss=0.0039, acc=1.0000, iter_time=4.31s]
Epoch 0: 44%|████▍ | 5446/12384 [11:33:15<14:46:18, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 0: 44%|████▍ | 5447/12384 [11:33:15<14:47:02, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 0: 44%|████▍ | 5447/12384 [11:33:22<14:47:02, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 44%|████▍ | 5448/12384 [11:33:22<14:43:57, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 44%|████▍ | 5448/12384 [11:33:30<14:43:57, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.08s]
Epoch 0: 44%|████▍ | 5449/12384 [11:33:30<14:42:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.08s]
Epoch 0: 44%|████▍ | 5449/12384 [11:33:38<14:42:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.95s]
Epoch 0: 44%|████▍ | 5450/12384 [11:33:38<14:53:32, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.95s]
Epoch 0: 44%|████▍ | 5450/12384 [11:33:45<14:53:32, 7.73s/it, loss=0.0001, acc=1.0000, iter_time=4.14s]
Epoch 0: 44%|████▍ | 5451/12384 [11:33:45<14:49:25, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=4.14s]
Epoch 0: 44%|████▍ | 5451/12384 [11:33:53<14:49:25, 7.70s/it, loss=0.0004, acc=0.9983, iter_time=10.68s]
Epoch 0: 44%|████▍ | 5452/12384 [11:33:53<14:50:39, 7.71s/it, loss=0.0004, acc=0.9983, iter_time=10.68s]
Epoch 0: 44%|████▍ | 5452/12384 [11:34:01<14:50:39, 7.71s/it, loss=0.0017, acc=0.9977, iter_time=7.74s]
Epoch 0: 44%|████▍ | 5453/12384 [11:34:01<14:46:25, 7.67s/it, loss=0.0017, acc=0.9977, iter_time=7.74s]
Epoch 0: 44%|████▍ | 5453/12384 [11:34:08<14:46:25, 7.67s/it, loss=0.0033, acc=0.9869, iter_time=5.27s]
Epoch 0: 44%|████▍ | 5454/12384 [11:34:08<14:44:09, 7.66s/it, loss=0.0033, acc=0.9869, iter_time=5.27s]
Epoch 0: 44%|████▍ | 5454/12384 [11:34:16<14:44:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 0: 44%|████▍ | 5455/12384 [11:34:16<14:42:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 0: 44%|████▍ | 5455/12384 [11:34:24<14:42:43, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.56s]
Epoch 0: 44%|████▍ | 5456/12384 [11:34:24<14:40:56, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.56s]
Epoch 0: 44%|████▍ | 5456/12384 [11:34:31<14:40:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 44%|████▍ | 5457/12384 [11:34:31<14:39:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 44%|████▍ | 5457/12384 [11:34:39<14:39:16, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 44%|████▍ | 5458/12384 [11:34:39<14:39:21, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 44%|████▍ | 5458/12384 [11:34:46<14:39:21, 7.62s/it, loss=0.0003, acc=0.9983, iter_time=7.09s]
Epoch 0: 44%|████▍ | 5459/12384 [11:34:46<14:39:16, 7.62s/it, loss=0.0003, acc=0.9983, iter_time=7.09s]
Epoch 0: 44%|████▍ | 5459/12384 [11:34:54<14:39:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 0: 44%|████▍ | 5460/12384 [11:34:54<14:39:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 0: 44%|████▍ | 5460/12384 [11:35:02<14:39:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 44%|████▍ | 5461/12384 [11:35:02<14:38:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 44%|████▍ | 5461/12384 [11:35:09<14:38:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 44%|████▍ | 5462/12384 [11:35:09<14:37:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 44%|████▍ | 5462/12384 [11:35:17<14:37:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 44%|████▍ | 5463/12384 [11:35:17<14:37:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 44%|████▍ | 5463/12384 [11:35:25<14:37:24, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.40s]
Epoch 0: 44%|████▍ | 5464/12384 [11:35:25<14:51:39, 7.73s/it, loss=0.0001, acc=1.0000, iter_time=8.40s]
Epoch 0: 44%|████▍ | 5464/12384 [11:35:33<14:51:39, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 0: 44%|████▍ | 5465/12384 [11:35:33<14:57:18, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 0: 44%|████▍ | 5465/12384 [11:35:41<14:57:18, 7.78s/it, loss=0.0001, acc=1.0000, iter_time=8.50s]
Epoch 0: 44%|████▍ | 5466/12384 [11:35:41<15:21:43, 7.99s/it, loss=0.0001, acc=1.0000, iter_time=8.50s]
Epoch 0: 44%|████▍ | 5466/12384 [11:35:49<15:21:43, 7.99s/it, loss=0.0003, acc=1.0000, iter_time=7.60s]
Epoch 0: 44%|████▍ | 5467/12384 [11:35:49<15:10:11, 7.90s/it, loss=0.0003, acc=1.0000, iter_time=7.60s]
Epoch 0: 44%|████▍ | 5467/12384 [11:35:57<15:10:11, 7.90s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 44%|████▍ | 5468/12384 [11:35:57<15:00:37, 7.81s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 44%|████▍ | 5468/12384 [11:36:04<15:00:37, 7.81s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 44%|████▍ | 5469/12384 [11:36:04<14:53:48, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 44%|████▍ | 5469/12384 [11:36:12<14:53:48, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 44%|████▍ | 5470/12384 [11:36:12<14:48:34, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 44%|████▍ | 5470/12384 [11:36:19<14:48:34, 7.71s/it, loss=0.0001, acc=0.9996, iter_time=7.63s]
Epoch 0: 44%|████▍ | 5471/12384 [11:36:19<14:45:07, 7.68s/it, loss=0.0001, acc=0.9996, iter_time=7.63s]
Epoch 0: 44%|████▍ | 5471/12384 [11:36:27<14:45:07, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 44%|████▍ | 5472/12384 [11:36:27<14:42:48, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 44%|████▍ | 5472/12384 [11:36:35<14:42:48, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 44%|████▍ | 5473/12384 [11:36:35<14:40:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 44%|████▍ | 5473/12384 [11:36:42<14:40:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 0: 44%|████▍ | 5474/12384 [11:36:42<14:38:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 0: 44%|████▍ | 5474/12384 [11:36:50<14:38:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 0: 44%|████▍ | 5475/12384 [11:36:50<14:37:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 0: 44%|████▍ | 5475/12384 [11:36:57<14:37:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.14s]
Epoch 0: 44%|████▍ | 5476/12384 [11:36:57<14:36:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.14s]
Epoch 0: 44%|████▍ | 5476/12384 [11:37:05<14:36:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 44%|████▍ | 5477/12384 [11:37:05<14:47:27, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 44%|████▍ | 5477/12384 [11:37:13<14:47:27, 7.71s/it, loss=0.0008, acc=0.9970, iter_time=6.74s]
Epoch 0: 44%|████▍ | 5478/12384 [11:37:13<14:44:12, 7.68s/it, loss=0.0008, acc=0.9970, iter_time=6.74s]
Epoch 0: 44%|████▍ | 5478/12384 [11:37:21<14:44:12, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 0: 44%|████▍ | 5479/12384 [11:37:21<14:41:59, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 0: 44%|████▍ | 5479/12384 [11:37:28<14:41:59, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.50s]
Epoch 0: 44%|████▍ | 5480/12384 [11:37:28<14:40:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.50s]
Epoch 0: 44%|████▍ | 5480/12384 [11:37:36<14:40:08, 7.65s/it, loss=0.0003, acc=0.9994, iter_time=6.59s]
Epoch 0: 44%|████▍ | 5481/12384 [11:37:36<14:39:09, 7.64s/it, loss=0.0003, acc=0.9994, iter_time=6.59s]
Epoch 0: 44%|████▍ | 5481/12384 [11:37:43<14:39:09, 7.64s/it, loss=0.0006, acc=0.9994, iter_time=8.54s]
Epoch 0: 44%|████▍ | 5482/12384 [11:37:43<14:37:53, 7.63s/it, loss=0.0006, acc=0.9994, iter_time=8.54s]
Epoch 0: 44%|████▍ | 5482/12384 [11:37:51<14:37:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 0: 44%|████▍ | 5483/12384 [11:37:51<14:40:42, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 0: 44%|████▍ | 5483/12384 [11:37:59<14:40:42, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 44%|████▍ | 5484/12384 [11:37:59<14:38:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 44%|████▍ | 5484/12384 [11:38:06<14:38:47, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.38s]
Epoch 0: 44%|████▍ | 5485/12384 [11:38:06<14:38:24, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.38s]
Epoch 0: 44%|████▍ | 5485/12384 [11:38:14<14:38:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 0: 44%|████▍ | 5486/12384 [11:38:14<14:36:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 0: 44%|████▍ | 5486/12384 [11:38:22<14:36:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 0: 44%|████▍ | 5487/12384 [11:38:22<14:35:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 0: 44%|████▍ | 5487/12384 [11:38:29<14:35:43, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.79s]
Epoch 0: 44%|████▍ | 5488/12384 [11:38:29<14:35:54, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.79s]
Epoch 0: 44%|████▍ | 5488/12384 [11:38:37<14:35:54, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.62s]
Epoch 0: 44%|████▍ | 5489/12384 [11:38:37<14:35:08, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.62s]
Epoch 0: 44%|████▍ | 5489/12384 [11:38:44<14:35:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 0: 44%|████▍ | 5490/12384 [11:38:44<14:34:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 0: 44%|████▍ | 5490/12384 [11:38:52<14:34:48, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.92s]
Epoch 0: 44%|████▍ | 5491/12384 [11:38:52<14:44:48, 7.70s/it, loss=0.0002, acc=1.0000, iter_time=7.92s]
Epoch 0: 44%|████▍ | 5491/12384 [11:39:00<14:44:48, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 44%|████▍ | 5492/12384 [11:39:00<14:41:08, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 44%|████▍ | 5492/12384 [11:39:08<14:41:08, 7.67s/it, loss=0.0001, acc=0.9999, iter_time=7.61s]
Epoch 0: 44%|████▍ | 5493/12384 [11:39:08<14:38:50, 7.65s/it, loss=0.0001, acc=0.9999, iter_time=7.61s]
Epoch 0: 44%|████▍ | 5493/12384 [11:39:15<14:38:50, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.64s]
Epoch 0: 44%|████▍ | 5494/12384 [11:39:15<14:38:35, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.64s]
Epoch 0: 44%|████▍ | 5494/12384 [11:39:23<14:38:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 44%|████▍ | 5495/12384 [11:39:23<14:37:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 44%|████▍ | 5495/12384 [11:39:30<14:37:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 44%|████▍ | 5496/12384 [11:39:30<14:36:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 44%|████▍ | 5496/12384 [11:39:38<14:36:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.73s]
Epoch 0: 44%|████▍ | 5497/12384 [11:39:38<14:35:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.73s]
Epoch 0: 44%|████▍ | 5497/12384 [11:39:46<14:35:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 0: 44%|████▍ | 5498/12384 [11:39:46<14:35:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 0: 44%|████▍ | 5498/12384 [11:39:53<14:35:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 0: 44%|████▍ | 5499/12384 [11:39:53<14:35:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 0: 44%|████▍ | 5499/12384 [11:40:01<14:35:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.31s]
Epoch 0: 44%|████▍ | 5500/12384 [11:40:01<14:41:27, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.31s]
Epoch 0: 44%|████▍ | 5500/12384 [11:40:09<14:41:27, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 0: 44%|████▍ | 5501/12384 [11:40:09<14:38:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 0: 44%|████▍ | 5501/12384 [11:40:16<14:38:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 44%|████▍ | 5502/12384 [11:40:16<14:36:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 44%|████▍ | 5502/12384 [11:40:24<14:36:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 44%|████▍ | 5503/12384 [11:40:24<14:46:26, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 44%|████▍ | 5503/12384 [11:40:32<14:46:26, 7.73s/it, loss=0.0001, acc=0.9999, iter_time=8.30s]
Epoch 0: 44%|████▍ | 5504/12384 [11:40:32<14:42:20, 7.69s/it, loss=0.0001, acc=0.9999, iter_time=8.30s]
Epoch 0: 44%|████▍ | 5504/12384 [11:40:40<14:42:20, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 44%|████▍ | 5505/12384 [11:40:40<14:39:32, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 44%|████▍ | 5505/12384 [11:40:47<14:39:32, 7.67s/it, loss=0.0007, acc=0.9980, iter_time=7.60s]
Epoch 0: 44%|████▍ | 5506/12384 [11:40:47<14:36:31, 7.65s/it, loss=0.0007, acc=0.9980, iter_time=7.60s]
Epoch 0: 44%|████▍ | 5506/12384 [11:40:55<14:36:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 44%|████▍ | 5507/12384 [11:40:55<14:35:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 44%|████▍ | 5507/12384 [11:41:02<14:35:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 44%|████▍ | 5508/12384 [11:41:02<14:34:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 44%|████▍ | 5508/12384 [11:41:10<14:34:10, 7.63s/it, loss=0.0017, acc=0.9939, iter_time=7.59s]
Epoch 0: 44%|████▍ | 5509/12384 [11:41:10<14:32:59, 7.62s/it, loss=0.0017, acc=0.9939, iter_time=7.59s]
Epoch 0: 44%|████▍ | 5509/12384 [11:41:18<14:32:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 44%|████▍ | 5510/12384 [11:41:18<14:32:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 44%|████▍ | 5510/12384 [11:41:25<14:32:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 45%|████▍ | 5511/12384 [11:41:25<14:32:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 45%|████▍ | 5511/12384 [11:41:33<14:32:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 45%|████▍ | 5512/12384 [11:41:33<14:32:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 45%|████▍ | 5512/12384 [11:41:40<14:32:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.93s]
Epoch 0: 45%|████▍ | 5513/12384 [11:41:40<14:33:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.93s]
Epoch 0: 45%|████▍ | 5513/12384 [11:41:48<14:33:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 0: 45%|████▍ | 5514/12384 [11:41:48<14:34:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 0: 45%|████▍ | 5514/12384 [11:41:56<14:34:05, 7.63s/it, loss=0.0005, acc=0.9987, iter_time=10.27s]
Epoch 0: 45%|████▍ | 5515/12384 [11:41:56<14:33:39, 7.63s/it, loss=0.0005, acc=0.9987, iter_time=10.27s]
Epoch 0: 45%|████▍ | 5515/12384 [11:42:03<14:33:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 45%|████▍ | 5516/12384 [11:42:03<14:34:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 45%|████▍ | 5516/12384 [11:42:11<14:34:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 45%|████▍ | 5517/12384 [11:42:11<14:33:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 45%|████▍ | 5517/12384 [11:42:19<14:33:33, 7.63s/it, loss=0.0008, acc=0.9962, iter_time=5.36s]
Epoch 0: 45%|████▍ | 5518/12384 [11:42:19<14:33:07, 7.63s/it, loss=0.0008, acc=0.9962, iter_time=5.36s]
Epoch 0: 45%|████▍ | 5518/12384 [11:42:26<14:33:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 0: 45%|████▍ | 5519/12384 [11:42:26<14:32:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 0: 45%|████▍ | 5519/12384 [11:42:34<14:32:43, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.00s]
Epoch 0: 45%|████▍ | 5520/12384 [11:42:34<14:32:18, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.00s]
Epoch 0: 45%|████▍ | 5520/12384 [11:42:41<14:32:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 45%|████▍ | 5521/12384 [11:42:41<14:31:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 45%|████▍ | 5521/12384 [11:42:49<14:31:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 45%|████▍ | 5522/12384 [11:42:49<14:31:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 45%|████▍ | 5522/12384 [11:42:57<14:31:09, 7.62s/it, loss=0.0013, acc=0.9944, iter_time=6.12s]
Epoch 0: 45%|████▍ | 5523/12384 [11:42:57<14:58:27, 7.86s/it, loss=0.0013, acc=0.9944, iter_time=6.12s]
Epoch 0: 45%|████▍ | 5523/12384 [11:43:05<14:58:27, 7.86s/it, loss=0.0001, acc=1.0000, iter_time=9.88s]
Epoch 0: 45%|████▍ | 5524/12384 [11:43:05<14:50:14, 7.79s/it, loss=0.0001, acc=1.0000, iter_time=9.88s]
Epoch 0: 45%|████▍ | 5524/12384 [11:43:13<14:50:14, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 45%|████▍ | 5525/12384 [11:43:13<14:44:18, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 45%|████▍ | 5525/12384 [11:43:20<14:44:18, 7.74s/it, loss=0.0005, acc=0.9991, iter_time=6.71s]
Epoch 0: 45%|████▍ | 5526/12384 [11:43:20<14:41:40, 7.71s/it, loss=0.0005, acc=0.9991, iter_time=6.71s]
Epoch 0: 45%|████▍ | 5526/12384 [11:43:28<14:41:40, 7.71s/it, loss=0.0003, acc=0.9984, iter_time=8.58s]
Epoch 0: 45%|████▍ | 5527/12384 [11:43:28<14:38:22, 7.69s/it, loss=0.0003, acc=0.9984, iter_time=8.58s]
Epoch 0: 45%|████▍ | 5527/12384 [11:43:36<14:38:22, 7.69s/it, loss=0.0006, acc=0.9980, iter_time=7.58s]
Epoch 0: 45%|████▍ | 5528/12384 [11:43:36<14:36:17, 7.67s/it, loss=0.0006, acc=0.9980, iter_time=7.58s]
Epoch 0: 45%|████▍ | 5528/12384 [11:43:44<14:36:17, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 45%|████▍ | 5529/12384 [11:43:44<14:45:20, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 45%|████▍ | 5529/12384 [11:43:51<14:45:20, 7.75s/it, loss=0.0001, acc=1.0000, iter_time=7.89s]
Epoch 0: 45%|████▍ | 5530/12384 [11:43:51<14:41:33, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=7.89s]
Epoch 0: 45%|████▍ | 5530/12384 [11:43:59<14:41:33, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 45%|████▍ | 5531/12384 [11:43:59<14:37:48, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 45%|████▍ | 5531/12384 [11:44:06<14:37:48, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 0: 45%|████▍ | 5532/12384 [11:44:06<14:34:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 0: 45%|████▍ | 5532/12384 [11:44:14<14:34:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 0: 45%|████▍ | 5533/12384 [11:44:14<14:32:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 0: 45%|████▍ | 5533/12384 [11:44:22<14:32:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.57s]
Epoch 0: 45%|████▍ | 5534/12384 [11:44:22<14:31:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.57s]
Epoch 0: 45%|████▍ | 5534/12384 [11:44:29<14:31:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 0: 45%|████▍ | 5535/12384 [11:44:29<14:30:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 0: 45%|████▍ | 5535/12384 [11:44:37<14:30:41, 7.63s/it, loss=0.0005, acc=0.9985, iter_time=7.56s]
Epoch 0: 45%|████▍ | 5536/12384 [11:44:37<14:29:19, 7.62s/it, loss=0.0005, acc=0.9985, iter_time=7.56s]
Epoch 0: 45%|████▍ | 5536/12384 [11:44:44<14:29:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 0: 45%|████▍ | 5537/12384 [11:44:44<14:29:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 0: 45%|████▍ | 5537/12384 [11:44:52<14:29:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 0: 45%|████▍ | 5538/12384 [11:44:52<14:29:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 0: 45%|████▍ | 5538/12384 [11:45:00<14:29:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 45%|████▍ | 5539/12384 [11:45:00<14:28:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 45%|████▍ | 5539/12384 [11:45:07<14:28:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 45%|████▍ | 5540/12384 [11:45:07<14:28:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 45%|████▍ | 5540/12384 [11:45:15<14:28:11, 7.61s/it, loss=0.0002, acc=0.9999, iter_time=7.62s]
Epoch 0: 45%|████▍ | 5541/12384 [11:45:15<14:28:04, 7.61s/it, loss=0.0002, acc=0.9999, iter_time=7.62s]
Epoch 0: 45%|████▍ | 5541/12384 [11:45:23<14:28:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 0: 45%|████▍ | 5542/12384 [11:45:23<14:28:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 0: 45%|████▍ | 5542/12384 [11:45:30<14:28:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 0: 45%|████▍ | 5543/12384 [11:45:30<14:27:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 0: 45%|████▍ | 5543/12384 [11:45:38<14:27:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 0: 45%|████▍ | 5544/12384 [11:45:38<14:31:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 0: 45%|████▍ | 5544/12384 [11:45:45<14:31:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 0: 45%|████▍ | 5545/12384 [11:45:45<14:30:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 0: 45%|████▍ | 5545/12384 [11:45:53<14:30:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 0: 45%|████▍ | 5546/12384 [11:45:53<14:28:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 0: 45%|████▍ | 5546/12384 [11:46:01<14:28:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 45%|████▍ | 5547/12384 [11:46:01<14:28:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 45%|████▍ | 5547/12384 [11:46:08<14:28:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 45%|████▍ | 5548/12384 [11:46:08<14:28:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 45%|████▍ | 5548/12384 [11:46:16<14:28:08, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.56s]
Epoch 0: 45%|████▍ | 5549/12384 [11:46:16<14:27:56, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.56s]
Epoch 0: 45%|████▍ | 5549/12384 [11:46:24<14:27:56, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.10s]
Epoch 0: 45%|████▍ | 5550/12384 [11:46:24<14:28:43, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=10.10s]
Epoch 0: 45%|████▍ | 5550/12384 [11:46:31<14:28:43, 7.63s/it, loss=0.0003, acc=0.9986, iter_time=7.23s]
Epoch 0: 45%|████▍ | 5551/12384 [11:46:31<14:28:14, 7.62s/it, loss=0.0003, acc=0.9986, iter_time=7.23s]
Epoch 0: 45%|████▍ | 5551/12384 [11:46:39<14:28:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 0: 45%|████▍ | 5552/12384 [11:46:39<14:31:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 0: 45%|████▍ | 5552/12384 [11:46:46<14:31:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 45%|████▍ | 5553/12384 [11:46:46<14:30:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 45%|████▍ | 5553/12384 [11:46:54<14:30:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 0: 45%|████▍ | 5554/12384 [11:46:54<14:29:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 0: 45%|████▍ | 5554/12384 [11:47:02<14:29:15, 7.64s/it, loss=0.0002, acc=0.9976, iter_time=9.76s]
Epoch 0: 45%|████▍ | 5555/12384 [11:47:02<14:39:31, 7.73s/it, loss=0.0002, acc=0.9976, iter_time=9.76s]
Epoch 0: 45%|████▍ | 5555/12384 [11:47:10<14:39:31, 7.73s/it, loss=0.0001, acc=1.0000, iter_time=5.04s]
Epoch 0: 45%|████▍ | 5556/12384 [11:47:10<14:35:49, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=5.04s]
Epoch 0: 45%|████▍ | 5556/12384 [11:47:17<14:35:49, 7.70s/it, loss=0.0005, acc=0.9980, iter_time=9.52s]
Epoch 0: 45%|████▍ | 5557/12384 [11:47:17<14:32:11, 7.67s/it, loss=0.0005, acc=0.9980, iter_time=9.52s]
Epoch 0: 45%|████▍ | 5557/12384 [11:47:25<14:32:11, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 45%|████▍ | 5558/12384 [11:47:25<14:30:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 45%|████▍ | 5558/12384 [11:47:32<14:30:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 0: 45%|████▍ | 5559/12384 [11:47:32<14:28:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 0: 45%|████▍ | 5559/12384 [11:47:40<14:28:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 0: 45%|████▍ | 5560/12384 [11:47:40<14:27:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 0: 45%|████▍ | 5560/12384 [11:47:48<14:27:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 45%|████▍ | 5561/12384 [11:47:48<14:26:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 45%|████▍ | 5561/12384 [11:47:55<14:26:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 45%|████▍ | 5562/12384 [11:47:55<14:25:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 45%|████▍ | 5562/12384 [11:48:03<14:25:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 0: 45%|████▍ | 5563/12384 [11:48:03<14:24:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 0: 45%|████▍ | 5563/12384 [11:48:11<14:24:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 0: 45%|████▍ | 5564/12384 [11:48:11<14:25:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 0: 45%|████▍ | 5564/12384 [11:48:18<14:25:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 45%|████▍ | 5565/12384 [11:48:18<14:25:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 45%|████▍ | 5565/12384 [11:48:26<14:25:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 45%|████▍ | 5566/12384 [11:48:26<14:26:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 45%|████▍ | 5566/12384 [11:48:33<14:26:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 45%|████▍ | 5567/12384 [11:48:33<14:25:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 45%|████▍ | 5567/12384 [11:48:41<14:25:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 45%|████▍ | 5568/12384 [11:48:41<14:24:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 45%|████▍ | 5568/12384 [11:48:49<14:24:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 45%|████▍ | 5569/12384 [11:48:49<14:23:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 45%|████▍ | 5569/12384 [11:48:56<14:23:56, 7.61s/it, loss=0.0008, acc=0.9972, iter_time=4.29s]
Epoch 0: 45%|████▍ | 5570/12384 [11:48:56<14:23:39, 7.60s/it, loss=0.0008, acc=0.9972, iter_time=4.29s]
Epoch 0: 45%|████▍ | 5570/12384 [11:49:04<14:23:39, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.91s]
Epoch 0: 45%|████▍ | 5571/12384 [11:49:04<14:24:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.91s]
Epoch 0: 45%|████▍ | 5571/12384 [11:49:12<14:24:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 45%|████▍ | 5572/12384 [11:49:12<14:32:44, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 45%|████▍ | 5572/12384 [11:49:19<14:32:44, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.30s]
Epoch 0: 45%|████▌ | 5573/12384 [11:49:19<14:29:54, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.30s]
Epoch 0: 45%|████▌ | 5573/12384 [11:49:27<14:29:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 45%|████▌ | 5574/12384 [11:49:27<14:28:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 45%|████▌ | 5574/12384 [11:49:34<14:28:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 45%|████▌ | 5575/12384 [11:49:34<14:26:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 45%|████▌ | 5575/12384 [11:49:42<14:26:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 0: 45%|████▌ | 5576/12384 [11:49:42<14:28:52, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 0: 45%|████▌ | 5576/12384 [11:49:50<14:28:52, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.34s]
Epoch 0: 45%|████▌ | 5577/12384 [11:49:50<14:26:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.34s]
Epoch 0: 45%|████▌ | 5577/12384 [11:49:57<14:26:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 0: 45%|████▌ | 5578/12384 [11:49:57<14:25:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 0: 45%|████▌ | 5578/12384 [11:50:05<14:25:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 45%|████▌ | 5579/12384 [11:50:05<14:24:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 45%|████▌ | 5579/12384 [11:50:13<14:24:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 45%|████▌ | 5580/12384 [11:50:13<14:23:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 45%|████▌ | 5580/12384 [11:50:21<14:23:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 45%|████▌ | 5581/12384 [11:50:21<14:35:07, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 45%|████▌ | 5581/12384 [11:50:28<14:35:07, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 45%|████▌ | 5582/12384 [11:50:28<14:32:08, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 45%|████▌ | 5582/12384 [11:50:36<14:32:08, 7.69s/it, loss=0.0007, acc=0.9996, iter_time=7.35s]
Epoch 0: 45%|████▌ | 5583/12384 [11:50:36<14:28:39, 7.66s/it, loss=0.0007, acc=0.9996, iter_time=7.35s]
Epoch 0: 45%|████▌ | 5583/12384 [11:50:43<14:28:39, 7.66s/it, loss=0.0002, acc=0.9998, iter_time=8.27s]
Epoch 0: 45%|████▌ | 5584/12384 [11:50:43<14:26:55, 7.65s/it, loss=0.0002, acc=0.9998, iter_time=8.27s]
Epoch 0: 45%|████▌ | 5584/12384 [11:50:51<14:26:55, 7.65s/it, loss=0.0001, acc=0.9995, iter_time=7.23s]
Epoch 0: 45%|████▌ | 5585/12384 [11:50:51<14:25:21, 7.64s/it, loss=0.0001, acc=0.9995, iter_time=7.23s]
Epoch 0: 45%|████▌ | 5585/12384 [11:50:59<14:25:21, 7.64s/it, loss=0.0075, acc=0.9865, iter_time=6.70s]
Epoch 0: 45%|████▌ | 5586/12384 [11:50:59<14:25:03, 7.64s/it, loss=0.0075, acc=0.9865, iter_time=6.70s]
Epoch 0: 45%|████▌ | 5586/12384 [11:51:06<14:25:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 0: 45%|████▌ | 5587/12384 [11:51:06<14:23:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 0: 45%|████▌ | 5587/12384 [11:51:14<14:23:59, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 45%|████▌ | 5588/12384 [11:51:14<14:22:40, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 45%|████▌ | 5588/12384 [11:51:21<14:22:40, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=7.61s]
Epoch 0: 45%|████▌ | 5589/12384 [11:51:21<14:22:14, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=7.61s]
Epoch 0: 45%|████▌ | 5589/12384 [11:51:29<14:22:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 45%|████▌ | 5590/12384 [11:51:29<14:25:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 45%|████▌ | 5590/12384 [11:51:37<14:25:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 45%|████▌ | 5591/12384 [11:51:37<14:24:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 45%|████▌ | 5591/12384 [11:51:44<14:24:09, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.57s]
Epoch 0: 45%|████▌ | 5592/12384 [11:51:44<14:23:29, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.57s]
Epoch 0: 45%|████▌ | 5592/12384 [11:51:52<14:23:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 45%|████▌ | 5593/12384 [11:51:52<14:22:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 45%|████▌ | 5593/12384 [11:52:00<14:22:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 45%|████▌ | 5594/12384 [11:52:00<14:22:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 45%|████▌ | 5594/12384 [11:52:07<14:22:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 45%|████▌ | 5595/12384 [11:52:07<14:22:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 45%|████▌ | 5595/12384 [11:52:15<14:22:04, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 45%|████▌ | 5596/12384 [11:52:15<14:21:36, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 45%|████▌ | 5596/12384 [11:52:22<14:21:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 45%|████▌ | 5597/12384 [11:52:22<14:21:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 45%|████▌ | 5597/12384 [11:52:30<14:21:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 45%|████▌ | 5598/12384 [11:52:30<14:30:51, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 45%|████▌ | 5598/12384 [11:52:38<14:30:51, 7.70s/it, loss=0.0005, acc=0.9978, iter_time=5.04s]
Epoch 0: 45%|████▌ | 5599/12384 [11:52:38<14:27:23, 7.67s/it, loss=0.0005, acc=0.9978, iter_time=5.04s]
Epoch 0: 45%|████▌ | 5599/12384 [11:52:46<14:27:23, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 0: 45%|████▌ | 5600/12384 [11:52:46<14:27:41, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 0: 45%|████▌ | 5600/12384 [11:52:53<14:27:41, 7.67s/it, loss=0.0001, acc=0.9989, iter_time=7.20s]
Epoch 0: 45%|████▌ | 5601/12384 [11:52:53<14:25:32, 7.66s/it, loss=0.0001, acc=0.9989, iter_time=7.20s]
Epoch 0: 45%|████▌ | 5601/12384 [11:53:01<14:25:32, 7.66s/it, loss=0.0001, acc=0.9986, iter_time=6.49s]
Epoch 0: 45%|████▌ | 5602/12384 [11:53:01<14:23:36, 7.64s/it, loss=0.0001, acc=0.9986, iter_time=6.49s]
Epoch 0: 45%|████▌ | 5602/12384 [11:53:08<14:23:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 0: 45%|████▌ | 5603/12384 [11:53:08<14:22:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 0: 45%|████▌ | 5603/12384 [11:53:16<14:22:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 0: 45%|████▌ | 5604/12384 [11:53:16<14:22:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 0: 45%|████▌ | 5604/12384 [11:53:24<14:22:08, 7.63s/it, loss=0.0004, acc=0.9985, iter_time=7.85s]
Epoch 0: 45%|████▌ | 5605/12384 [11:53:24<14:21:24, 7.62s/it, loss=0.0004, acc=0.9985, iter_time=7.85s]
Epoch 0: 45%|████▌ | 5605/12384 [11:53:31<14:21:24, 7.62s/it, loss=0.0013, acc=0.9959, iter_time=7.61s]
Epoch 0: 45%|████▌ | 5606/12384 [11:53:31<14:21:25, 7.63s/it, loss=0.0013, acc=0.9959, iter_time=7.61s]
Epoch 0: 45%|████▌ | 5606/12384 [11:53:39<14:21:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 45%|████▌ | 5607/12384 [11:53:39<14:20:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 45%|████▌ | 5607/12384 [11:53:47<14:20:32, 7.62s/it, loss=0.0001, acc=0.9989, iter_time=8.05s]
Epoch 0: 45%|████▌ | 5608/12384 [11:53:47<14:30:24, 7.71s/it, loss=0.0001, acc=0.9989, iter_time=8.05s]
Epoch 0: 45%|████▌ | 5608/12384 [11:53:54<14:30:24, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.45s]
Epoch 0: 45%|████▌ | 5609/12384 [11:53:54<14:27:04, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.45s]
Epoch 0: 45%|████▌ | 5609/12384 [11:54:02<14:27:04, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 45%|████▌ | 5610/12384 [11:54:02<14:24:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 45%|████▌ | 5610/12384 [11:54:10<14:24:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 0: 45%|████▌ | 5611/12384 [11:54:10<14:22:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 0: 45%|████▌ | 5611/12384 [11:54:17<14:22:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 45%|████▌ | 5612/12384 [11:54:17<14:20:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 45%|████▌ | 5612/12384 [11:54:25<14:20:56, 7.63s/it, loss=0.0004, acc=1.0000, iter_time=4.55s]
Epoch 0: 45%|████▌ | 5613/12384 [11:54:25<14:19:12, 7.61s/it, loss=0.0004, acc=1.0000, iter_time=4.55s]
Epoch 0: 45%|████▌ | 5613/12384 [11:54:32<14:19:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 0: 45%|████▌ | 5614/12384 [11:54:32<14:19:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 0: 45%|████▌ | 5614/12384 [11:54:40<14:19:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 0: 45%|████▌ | 5615/12384 [11:54:40<14:18:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 0: 45%|████▌ | 5615/12384 [11:54:48<14:18:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 45%|████▌ | 5616/12384 [11:54:48<14:18:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 45%|████▌ | 5616/12384 [11:54:55<14:18:38, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=7.66s]
Epoch 0: 45%|████▌ | 5617/12384 [11:54:55<14:18:33, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=7.66s]
Epoch 0: 45%|████▌ | 5617/12384 [11:55:03<14:18:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 45%|████▌ | 5618/12384 [11:55:03<14:19:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 45%|████▌ | 5618/12384 [11:55:11<14:19:06, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 45%|████▌ | 5619/12384 [11:55:11<14:18:00, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 45%|████▌ | 5619/12384 [11:55:18<14:18:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 45%|████▌ | 5620/12384 [11:55:18<14:17:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 45%|████▌ | 5620/12384 [11:55:26<14:17:46, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.10s]
Epoch 0: 45%|████▌ | 5621/12384 [11:55:26<14:17:28, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.10s]
Epoch 0: 45%|████▌ | 5621/12384 [11:55:33<14:17:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 0: 45%|████▌ | 5622/12384 [11:55:33<14:17:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 0: 45%|████▌ | 5622/12384 [11:55:41<14:17:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 0: 45%|████▌ | 5623/12384 [11:55:41<14:18:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 0: 45%|████▌ | 5623/12384 [11:55:49<14:18:03, 7.61s/it, loss=0.0006, acc=1.0000, iter_time=9.89s]
Epoch 0: 45%|████▌ | 5624/12384 [11:55:49<14:17:44, 7.61s/it, loss=0.0006, acc=1.0000, iter_time=9.89s]
Epoch 0: 45%|████▌ | 5624/12384 [11:55:56<14:17:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 45%|████▌ | 5625/12384 [11:55:56<14:17:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 45%|████▌ | 5625/12384 [11:56:04<14:17:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 45%|████▌ | 5626/12384 [11:56:04<14:17:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 45%|████▌ | 5626/12384 [11:56:11<14:17:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 45%|████▌ | 5627/12384 [11:56:11<14:17:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 45%|████▌ | 5627/12384 [11:56:19<14:17:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 45%|████▌ | 5628/12384 [11:56:19<14:18:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 45%|████▌ | 5628/12384 [11:56:27<14:18:29, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=5.51s]
Epoch 0: 45%|████▌ | 5629/12384 [11:56:27<14:18:32, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=5.51s]
Epoch 0: 45%|████▌ | 5629/12384 [11:56:34<14:18:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.75s]
Epoch 0: 45%|████▌ | 5630/12384 [11:56:34<14:18:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.75s]
Epoch 0: 45%|████▌ | 5630/12384 [11:56:42<14:18:07, 7.62s/it, loss=0.0016, acc=0.9946, iter_time=6.65s]
Epoch 0: 45%|████▌ | 5631/12384 [11:56:42<14:17:58, 7.62s/it, loss=0.0016, acc=0.9946, iter_time=6.65s]
Epoch 0: 45%|████▌ | 5631/12384 [11:56:50<14:17:58, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.66s]
Epoch 0: 45%|████▌ | 5632/12384 [11:56:50<14:16:40, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.66s]
Epoch 0: 45%|████▌ | 5632/12384 [11:56:57<14:16:40, 7.61s/it, loss=0.0032, acc=0.9972, iter_time=7.49s]
Epoch 0: 45%|████▌ | 5633/12384 [11:56:57<14:17:16, 7.62s/it, loss=0.0032, acc=0.9972, iter_time=7.49s]
Epoch 0: 45%|████▌ | 5633/12384 [11:57:05<14:17:16, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.70s]
Epoch 0: 45%|████▌ | 5634/12384 [11:57:05<14:28:28, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=7.70s]
Epoch 0: 45%|████▌ | 5634/12384 [11:57:13<14:28:28, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 46%|████▌ | 5635/12384 [11:57:13<14:24:10, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 46%|████▌ | 5635/12384 [11:57:20<14:24:10, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 46%|████▌ | 5636/12384 [11:57:20<14:21:45, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 46%|████▌ | 5636/12384 [11:57:28<14:21:45, 7.66s/it, loss=0.0003, acc=0.9998, iter_time=4.79s]
Epoch 0: 46%|████▌ | 5637/12384 [11:57:28<14:19:11, 7.64s/it, loss=0.0003, acc=0.9998, iter_time=4.79s]
Epoch 0: 46%|████▌ | 5637/12384 [11:57:36<14:19:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 0: 46%|████▌ | 5638/12384 [11:57:36<14:20:40, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 0: 46%|████▌ | 5638/12384 [11:57:43<14:20:40, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 46%|████▌ | 5639/12384 [11:57:43<14:18:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 46%|████▌ | 5639/12384 [11:57:51<14:18:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 46%|████▌ | 5640/12384 [11:57:51<14:17:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 46%|████▌ | 5640/12384 [11:57:58<14:17:53, 7.63s/it, loss=0.0008, acc=0.9961, iter_time=6.70s]
Epoch 0: 46%|████▌ | 5641/12384 [11:57:58<14:17:16, 7.63s/it, loss=0.0008, acc=0.9961, iter_time=6.70s]
Epoch 0: 46%|████▌ | 5641/12384 [11:58:06<14:17:16, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.58s]
Epoch 0: 46%|████▌ | 5642/12384 [11:58:06<14:16:19, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.58s]
Epoch 0: 46%|████▌ | 5642/12384 [11:58:14<14:16:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 46%|████▌ | 5643/12384 [11:58:14<14:17:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 46%|████▌ | 5643/12384 [11:58:21<14:17:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 0: 46%|████▌ | 5644/12384 [11:58:21<14:16:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 0: 46%|████▌ | 5644/12384 [11:58:29<14:16:04, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.55s]
Epoch 0: 46%|████▌ | 5645/12384 [11:58:29<14:18:24, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.55s]
Epoch 0: 46%|████▌ | 5645/12384 [11:58:37<14:18:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 46%|████▌ | 5646/12384 [11:58:37<14:16:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 46%|████▌ | 5646/12384 [11:58:44<14:16:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 46%|████▌ | 5647/12384 [11:58:44<14:16:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 46%|████▌ | 5647/12384 [11:58:52<14:16:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 46%|████▌ | 5648/12384 [11:58:52<14:15:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 46%|████▌ | 5648/12384 [11:59:00<14:15:42, 7.62s/it, loss=0.0003, acc=0.9981, iter_time=7.53s]
Epoch 0: 46%|████▌ | 5649/12384 [11:59:00<14:25:25, 7.71s/it, loss=0.0003, acc=0.9981, iter_time=7.53s]
Epoch 0: 46%|████▌ | 5649/12384 [11:59:07<14:25:25, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 46%|████▌ | 5650/12384 [11:59:07<14:22:02, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 46%|████▌ | 5650/12384 [11:59:15<14:22:02, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 46%|████▌ | 5651/12384 [11:59:15<14:19:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 46%|████▌ | 5651/12384 [11:59:23<14:19:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=3.37s]
Epoch 0: 46%|████▌ | 5652/12384 [11:59:23<14:17:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=3.37s]
Epoch 0: 46%|████▌ | 5652/12384 [11:59:30<14:17:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.04s]
Epoch 0: 46%|████▌ | 5653/12384 [11:59:30<14:16:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.04s]
Epoch 0: 46%|████▌ | 5653/12384 [11:59:38<14:16:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 0: 46%|████▌ | 5654/12384 [11:59:38<14:15:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 0: 46%|████▌ | 5654/12384 [11:59:45<14:15:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 46%|████▌ | 5655/12384 [11:59:45<14:14:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 46%|████▌ | 5655/12384 [11:59:53<14:14:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 46%|████▌ | 5656/12384 [11:59:53<14:13:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 46%|████▌ | 5656/12384 [12:00:01<14:13:37, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.19s]
Epoch 0: 46%|████▌ | 5657/12384 [12:00:01<14:12:29, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.19s]
Epoch 0: 46%|████▌ | 5657/12384 [12:00:08<14:12:29, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 46%|████▌ | 5658/12384 [12:00:08<14:13:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 46%|████▌ | 5658/12384 [12:00:16<14:13:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 46%|████▌ | 5659/12384 [12:00:16<14:12:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 46%|████▌ | 5659/12384 [12:00:23<14:12:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.95s]
Epoch 0: 46%|████▌ | 5660/12384 [12:00:23<14:12:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.95s]
Epoch 0: 46%|████▌ | 5660/12384 [12:00:31<14:12:29, 7.61s/it, loss=0.0002, acc=0.9991, iter_time=5.45s]
Epoch 0: 46%|████▌ | 5661/12384 [12:00:31<14:23:43, 7.71s/it, loss=0.0002, acc=0.9991, iter_time=5.45s]
Epoch 0: 46%|████▌ | 5661/12384 [12:00:39<14:23:43, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=10.72s]
Epoch 0: 46%|████▌ | 5662/12384 [12:00:39<14:22:06, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=10.72s]
Epoch 0: 46%|████▌ | 5662/12384 [12:00:47<14:22:06, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 46%|████▌ | 5663/12384 [12:00:47<14:19:41, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 46%|████▌ | 5663/12384 [12:00:54<14:19:41, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 46%|████▌ | 5664/12384 [12:00:54<14:17:43, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 46%|████▌ | 5664/12384 [12:01:02<14:17:43, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=3.73s]
Epoch 0: 46%|████▌ | 5665/12384 [12:01:02<14:17:52, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=3.73s]
Epoch 0: 46%|████▌ | 5665/12384 [12:01:10<14:17:52, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=11.18s]
Epoch 0: 46%|████▌ | 5666/12384 [12:01:10<14:16:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.18s]
Epoch 0: 46%|████▌ | 5666/12384 [12:01:17<14:16:09, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 46%|████▌ | 5667/12384 [12:01:17<14:14:22, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 46%|████▌ | 5667/12384 [12:01:25<14:14:22, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.49s]
Epoch 0: 46%|████▌ | 5668/12384 [12:01:25<14:12:53, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.49s]
Epoch 0: 46%|████▌ | 5668/12384 [12:01:32<14:12:53, 7.62s/it, loss=0.0016, acc=0.9964, iter_time=9.69s]
Epoch 0: 46%|████▌ | 5669/12384 [12:01:32<14:13:09, 7.62s/it, loss=0.0016, acc=0.9964, iter_time=9.69s]
Epoch 0: 46%|████▌ | 5669/12384 [12:01:40<14:13:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 46%|████▌ | 5670/12384 [12:01:40<14:12:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 46%|████▌ | 5670/12384 [12:01:48<14:12:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.57s]
Epoch 0: 46%|████▌ | 5671/12384 [12:01:48<14:11:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.57s]
Epoch 0: 46%|████▌ | 5671/12384 [12:01:55<14:11:27, 7.61s/it, loss=0.0006, acc=0.9997, iter_time=11.00s]
Epoch 0: 46%|████▌ | 5672/12384 [12:01:55<14:10:49, 7.61s/it, loss=0.0006, acc=0.9997, iter_time=11.00s]
Epoch 0: 46%|████▌ | 5672/12384 [12:02:03<14:10:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 46%|████▌ | 5673/12384 [12:02:03<14:10:16, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 46%|████▌ | 5673/12384 [12:02:11<14:10:16, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.88s]
Epoch 0: 46%|████▌ | 5674/12384 [12:02:11<14:19:18, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.88s]
Epoch 0: 46%|████▌ | 5674/12384 [12:02:18<14:19:18, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 46%|████▌ | 5675/12384 [12:02:18<14:16:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 46%|████▌ | 5675/12384 [12:02:26<14:16:35, 7.66s/it, loss=0.0005, acc=0.9997, iter_time=7.62s]
Epoch 0: 46%|████▌ | 5676/12384 [12:02:26<14:15:08, 7.65s/it, loss=0.0005, acc=0.9997, iter_time=7.62s]
Epoch 0: 46%|████▌ | 5676/12384 [12:02:33<14:15:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 46%|████▌ | 5677/12384 [12:02:33<14:14:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 46%|████▌ | 5677/12384 [12:02:41<14:14:16, 7.64s/it, loss=0.0003, acc=0.9997, iter_time=7.65s]
Epoch 0: 46%|████▌ | 5678/12384 [12:02:41<14:15:39, 7.66s/it, loss=0.0003, acc=0.9997, iter_time=7.65s]
Epoch 0: 46%|████▌ | 5678/12384 [12:02:49<14:15:39, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.68s]
Epoch 0: 46%|████▌ | 5679/12384 [12:02:49<14:14:10, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.68s]
Epoch 0: 46%|████▌ | 5679/12384 [12:02:56<14:14:10, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.57s]
Epoch 0: 46%|████▌ | 5680/12384 [12:02:56<14:14:04, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.57s]
Epoch 0: 46%|████▌ | 5680/12384 [12:03:04<14:14:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 46%|████▌ | 5681/12384 [12:03:04<14:12:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 46%|████▌ | 5681/12384 [12:03:12<14:12:44, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=4.76s]
Epoch 0: 46%|████▌ | 5682/12384 [12:03:12<14:12:30, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=4.76s]
Epoch 0: 46%|████▌ | 5682/12384 [12:03:19<14:12:30, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=7.18s]
Epoch 0: 46%|████▌ | 5683/12384 [12:03:19<14:12:01, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=7.18s]
Epoch 0: 46%|████▌ | 5683/12384 [12:03:27<14:12:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.93s]
Epoch 0: 46%|████▌ | 5684/12384 [12:03:27<14:11:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.93s]
Epoch 0: 46%|████▌ | 5684/12384 [12:03:35<14:11:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 0: 46%|████▌ | 5685/12384 [12:03:35<14:11:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 0: 46%|████▌ | 5685/12384 [12:03:42<14:11:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 0: 46%|████▌ | 5686/12384 [12:03:42<14:10:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 0: 46%|████▌ | 5686/12384 [12:03:50<14:10:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 46%|████▌ | 5687/12384 [12:03:50<14:21:35, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 46%|████▌ | 5687/12384 [12:03:58<14:21:35, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 0: 46%|████▌ | 5688/12384 [12:03:58<14:17:26, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 0: 46%|████▌ | 5688/12384 [12:04:05<14:17:26, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 0: 46%|████▌ | 5689/12384 [12:04:05<14:15:04, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 0: 46%|████▌ | 5689/12384 [12:04:13<14:15:04, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 0: 46%|████▌ | 5690/12384 [12:04:13<14:12:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 0: 46%|████▌ | 5690/12384 [12:04:20<14:12:44, 7.64s/it, loss=0.0009, acc=0.9977, iter_time=5.51s]
Epoch 0: 46%|████▌ | 5691/12384 [12:04:20<14:11:26, 7.63s/it, loss=0.0009, acc=0.9977, iter_time=5.51s]
Epoch 0: 46%|████▌ | 5691/12384 [12:04:28<14:11:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.14s]
Epoch 0: 46%|████▌ | 5692/12384 [12:04:28<14:10:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.14s]
Epoch 0: 46%|████▌ | 5692/12384 [12:04:36<14:10:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.36s]
Epoch 0: 46%|████▌ | 5693/12384 [12:04:36<14:10:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.36s]
Epoch 0: 46%|████▌ | 5693/12384 [12:04:43<14:10:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 0: 46%|████▌ | 5694/12384 [12:04:43<14:08:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 0: 46%|████▌ | 5694/12384 [12:04:51<14:08:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 46%|████▌ | 5695/12384 [12:04:51<14:08:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 46%|████▌ | 5695/12384 [12:04:59<14:08:15, 7.61s/it, loss=0.0001, acc=0.9995, iter_time=7.99s]
Epoch 0: 46%|████▌ | 5696/12384 [12:04:59<14:08:41, 7.61s/it, loss=0.0001, acc=0.9995, iter_time=7.99s]
Epoch 0: 46%|████▌ | 5696/12384 [12:05:06<14:08:41, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.73s]
Epoch 0: 46%|████▌ | 5697/12384 [12:05:06<14:08:41, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.73s]
Epoch 0: 46%|████▌ | 5697/12384 [12:05:14<14:08:41, 7.62s/it, loss=0.0067, acc=0.9841, iter_time=9.13s]
Epoch 0: 46%|████▌ | 5698/12384 [12:05:14<14:12:41, 7.65s/it, loss=0.0067, acc=0.9841, iter_time=9.13s]
Epoch 0: 46%|████▌ | 5698/12384 [12:05:21<14:12:41, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.74s]
Epoch 0: 46%|████▌ | 5699/12384 [12:05:21<14:10:50, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.74s]
Epoch 0: 46%|████▌ | 5699/12384 [12:05:29<14:10:50, 7.64s/it, loss=0.0005, acc=0.9979, iter_time=8.29s]
Epoch 0: 46%|████▌ | 5700/12384 [12:05:29<14:19:24, 7.71s/it, loss=0.0005, acc=0.9979, iter_time=8.29s]
Epoch 0: 46%|████▌ | 5700/12384 [12:05:37<14:19:24, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 46%|████▌ | 5701/12384 [12:05:37<14:16:20, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 46%|████▌ | 5701/12384 [12:05:45<14:16:20, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 0: 46%|████▌ | 5702/12384 [12:05:45<14:16:06, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 0: 46%|████▌ | 5702/12384 [12:05:52<14:16:06, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.22s]
Epoch 0: 46%|████▌ | 5703/12384 [12:05:52<14:13:30, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.22s]
Epoch 0: 46%|████▌ | 5703/12384 [12:06:00<14:13:30, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=8.00s]
Epoch 0: 46%|████▌ | 5704/12384 [12:06:00<14:14:20, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=8.00s]
Epoch 0: 46%|████▌ | 5704/12384 [12:06:08<14:14:20, 7.67s/it, loss=0.0011, acc=0.9977, iter_time=5.81s]
Epoch 0: 46%|████▌ | 5705/12384 [12:06:08<14:12:37, 7.66s/it, loss=0.0011, acc=0.9977, iter_time=5.81s]
Epoch 0: 46%|████▌ | 5705/12384 [12:06:15<14:12:37, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 0: 46%|████▌ | 5706/12384 [12:06:15<14:10:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 0: 46%|████▌ | 5706/12384 [12:06:23<14:10:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 46%|████▌ | 5707/12384 [12:06:23<14:08:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 46%|████▌ | 5707/12384 [12:06:30<14:08:42, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 46%|████▌ | 5708/12384 [12:06:30<14:08:31, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 46%|████▌ | 5708/12384 [12:06:38<14:08:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 46%|████▌ | 5709/12384 [12:06:38<14:08:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 46%|████▌ | 5709/12384 [12:06:46<14:08:11, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.03s]
Epoch 0: 46%|████▌ | 5710/12384 [12:06:46<14:07:11, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.03s]
Epoch 0: 46%|████▌ | 5710/12384 [12:06:53<14:07:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.19s]
Epoch 0: 46%|████▌ | 5711/12384 [12:06:53<14:06:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.19s]
Epoch 0: 46%|████▌ | 5711/12384 [12:07:01<14:06:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 46%|████▌ | 5712/12384 [12:07:01<14:06:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 46%|████▌ | 5712/12384 [12:07:09<14:06:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 0: 46%|████▌ | 5713/12384 [12:07:09<14:21:23, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 0: 46%|████▌ | 5713/12384 [12:07:17<14:21:23, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 0: 46%|████▌ | 5714/12384 [12:07:17<14:17:05, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 0: 46%|████▌ | 5714/12384 [12:07:24<14:17:05, 7.71s/it, loss=0.0011, acc=0.9989, iter_time=10.69s]
Epoch 0: 46%|████▌ | 5715/12384 [12:07:24<14:13:50, 7.68s/it, loss=0.0011, acc=0.9989, iter_time=10.69s]
Epoch 0: 46%|████▌ | 5715/12384 [12:07:32<14:13:50, 7.68s/it, loss=0.0014, acc=1.0000, iter_time=7.63s]
Epoch 0: 46%|████▌ | 5716/12384 [12:07:32<14:11:47, 7.66s/it, loss=0.0014, acc=1.0000, iter_time=7.63s]
Epoch 0: 46%|████▌ | 5716/12384 [12:07:39<14:11:47, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 46%|████▌ | 5717/12384 [12:07:39<14:10:07, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 46%|████▌ | 5717/12384 [12:07:47<14:10:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 0: 46%|████▌ | 5718/12384 [12:07:47<14:09:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 0: 46%|████▌ | 5718/12384 [12:07:55<14:09:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 0: 46%|████▌ | 5719/12384 [12:07:55<14:07:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 0: 46%|████▌ | 5719/12384 [12:08:02<14:07:32, 7.63s/it, loss=0.0001, acc=0.9997, iter_time=8.00s]
Epoch 0: 46%|████▌ | 5720/12384 [12:08:02<14:06:48, 7.62s/it, loss=0.0001, acc=0.9997, iter_time=8.00s]
Epoch 0: 46%|████▌ | 5720/12384 [12:08:10<14:06:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 46%|████▌ | 5721/12384 [12:08:10<14:06:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 46%|████▌ | 5721/12384 [12:08:17<14:06:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 46%|████▌ | 5722/12384 [12:08:17<14:05:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 46%|████▌ | 5722/12384 [12:08:25<14:05:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 46%|████▌ | 5723/12384 [12:08:25<14:06:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 46%|████▌ | 5723/12384 [12:08:33<14:06:34, 7.63s/it, loss=0.0003, acc=0.9987, iter_time=7.61s]
Epoch 0: 46%|████▌ | 5724/12384 [12:08:33<14:05:50, 7.62s/it, loss=0.0003, acc=0.9987, iter_time=7.61s]
Epoch 0: 46%|████▌ | 5724/12384 [12:08:40<14:05:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 46%|████▌ | 5725/12384 [12:08:40<14:05:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 46%|████▌ | 5725/12384 [12:08:48<14:05:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.93s]
Epoch 0: 46%|████▌ | 5726/12384 [12:08:48<14:04:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.93s]
Epoch 0: 46%|████▌ | 5726/12384 [12:08:56<14:04:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 0: 46%|████▌ | 5727/12384 [12:08:56<14:04:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 0: 46%|████▌ | 5727/12384 [12:09:03<14:04:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 0: 46%|████▋ | 5728/12384 [12:09:03<14:04:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 0: 46%|████▋ | 5728/12384 [12:09:11<14:04:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 46%|████▋ | 5729/12384 [12:09:11<14:04:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 46%|████▋ | 5729/12384 [12:09:18<14:04:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 0: 46%|████▋ | 5730/12384 [12:09:18<14:04:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 0: 46%|████▋ | 5730/12384 [12:09:26<14:04:45, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.26s]
Epoch 0: 46%|████▋ | 5731/12384 [12:09:26<14:03:59, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.26s]
Epoch 0: 46%|████▋ | 5731/12384 [12:09:34<14:03:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 46%|████▋ | 5732/12384 [12:09:34<14:03:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 46%|████▋ | 5732/12384 [12:09:41<14:03:43, 7.61s/it, loss=0.0003, acc=0.9999, iter_time=6.67s]
Epoch 0: 46%|████▋ | 5733/12384 [12:09:41<14:03:16, 7.61s/it, loss=0.0003, acc=0.9999, iter_time=6.67s]
Epoch 0: 46%|████▋ | 5733/12384 [12:09:49<14:03:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.20s]
Epoch 0: 46%|████▋ | 5734/12384 [12:09:49<14:03:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.20s]
Epoch 0: 46%|████▋ | 5734/12384 [12:09:56<14:03:17, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.10s]
Epoch 0: 46%|████▋ | 5735/12384 [12:09:56<14:03:37, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.10s]
Epoch 0: 46%|████▋ | 5735/12384 [12:10:04<14:03:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 0: 46%|████▋ | 5736/12384 [12:10:04<14:03:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 0: 46%|████▋ | 5736/12384 [12:10:12<14:03:50, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 46%|████▋ | 5737/12384 [12:10:12<14:03:18, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 46%|████▋ | 5737/12384 [12:10:19<14:03:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 0: 46%|████▋ | 5738/12384 [12:10:19<14:03:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 0: 46%|████▋ | 5738/12384 [12:10:27<14:03:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.26s]
Epoch 0: 46%|████▋ | 5739/12384 [12:10:27<14:13:54, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.26s]
Epoch 0: 46%|████▋ | 5739/12384 [12:10:35<14:13:54, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 0: 46%|████▋ | 5740/12384 [12:10:35<14:10:05, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 0: 46%|████▋ | 5740/12384 [12:10:42<14:10:05, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 46%|████▋ | 5741/12384 [12:10:42<14:08:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 46%|████▋ | 5741/12384 [12:10:50<14:08:11, 7.66s/it, loss=0.0002, acc=0.9998, iter_time=7.61s]
Epoch 0: 46%|████▋ | 5742/12384 [12:10:50<14:06:26, 7.65s/it, loss=0.0002, acc=0.9998, iter_time=7.61s]
Epoch 0: 46%|████▋ | 5742/12384 [12:10:58<14:06:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 46%|████▋ | 5743/12384 [12:10:58<14:05:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 46%|████▋ | 5743/12384 [12:11:05<14:05:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 46%|████▋ | 5744/12384 [12:11:05<14:04:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 46%|████▋ | 5744/12384 [12:11:13<14:04:12, 7.63s/it, loss=0.0003, acc=0.9984, iter_time=7.21s]
Epoch 0: 46%|████▋ | 5745/12384 [12:11:13<14:03:13, 7.62s/it, loss=0.0003, acc=0.9984, iter_time=7.21s]
Epoch 0: 46%|████▋ | 5745/12384 [12:11:21<14:03:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 46%|████▋ | 5746/12384 [12:11:21<14:02:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 46%|████▋ | 5746/12384 [12:11:28<14:02:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 46%|████▋ | 5747/12384 [12:11:28<14:02:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 46%|████▋ | 5747/12384 [12:11:36<14:02:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 46%|████▋ | 5748/12384 [12:11:36<14:01:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 46%|████▋ | 5748/12384 [12:11:43<14:01:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 46%|████▋ | 5749/12384 [12:11:43<14:01:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 46%|████▋ | 5749/12384 [12:11:51<14:01:42, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.04s]
Epoch 0: 46%|████▋ | 5750/12384 [12:11:51<14:01:52, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.04s]
Epoch 0: 46%|████▋ | 5750/12384 [12:11:59<14:01:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 46%|████▋ | 5751/12384 [12:11:59<14:02:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 46%|████▋ | 5751/12384 [12:12:06<14:02:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 46%|████▋ | 5752/12384 [12:12:06<14:02:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 46%|████▋ | 5752/12384 [12:12:14<14:02:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 0: 46%|████▋ | 5753/12384 [12:12:14<14:10:59, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 0: 46%|████▋ | 5753/12384 [12:12:22<14:10:59, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 46%|████▋ | 5754/12384 [12:12:22<14:08:12, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 46%|████▋ | 5754/12384 [12:12:29<14:08:12, 7.68s/it, loss=0.0012, acc=0.9926, iter_time=5.83s]
Epoch 0: 46%|████▋ | 5755/12384 [12:12:29<14:06:06, 7.66s/it, loss=0.0012, acc=0.9926, iter_time=5.83s]
Epoch 0: 46%|████▋ | 5755/12384 [12:12:37<14:06:06, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=5.65s]
Epoch 0: 46%|████▋ | 5756/12384 [12:12:37<14:03:44, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=5.65s]
Epoch 0: 46%|████▋ | 5756/12384 [12:12:45<14:03:44, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=10.47s]
Epoch 0: 46%|████▋ | 5757/12384 [12:12:45<14:02:17, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=10.47s]
Epoch 0: 46%|████▋ | 5757/12384 [12:12:52<14:02:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.15s]
Epoch 0: 46%|████▋ | 5758/12384 [12:12:52<14:01:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.15s]
Epoch 0: 46%|████▋ | 5758/12384 [12:13:00<14:01:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.44s]
Epoch 0: 47%|████▋ | 5759/12384 [12:13:00<14:01:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.44s]
Epoch 0: 47%|████▋ | 5759/12384 [12:13:07<14:01:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 0: 47%|████▋ | 5760/12384 [12:13:07<14:01:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 0: 47%|████▋ | 5760/12384 [12:13:15<14:01:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 47%|████▋ | 5761/12384 [12:13:15<14:00:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 47%|████▋ | 5761/12384 [12:13:23<14:00:25, 7.61s/it, loss=0.0004, acc=0.9968, iter_time=8.17s]
Epoch 0: 47%|████▋ | 5762/12384 [12:13:23<14:00:20, 7.61s/it, loss=0.0004, acc=0.9968, iter_time=8.17s]
Epoch 0: 47%|████▋ | 5762/12384 [12:13:30<14:00:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 0: 47%|████▋ | 5763/12384 [12:13:30<14:00:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 0: 47%|████▋ | 5763/12384 [12:13:38<14:00:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.75s]
Epoch 0: 47%|████▋ | 5764/12384 [12:13:38<13:59:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.75s]
Epoch 0: 47%|████▋ | 5764/12384 [12:13:46<13:59:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 47%|████▋ | 5765/12384 [12:13:46<14:10:20, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 47%|████▋ | 5765/12384 [12:13:53<14:10:20, 7.71s/it, loss=0.0005, acc=0.9986, iter_time=6.37s]
Epoch 0: 47%|████▋ | 5766/12384 [12:13:53<14:07:22, 7.68s/it, loss=0.0005, acc=0.9986, iter_time=6.37s]
Epoch 0: 47%|████▋ | 5766/12384 [12:14:01<14:07:22, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.39s]
Epoch 0: 47%|████▋ | 5767/12384 [12:14:01<14:04:47, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.39s]
Epoch 0: 47%|████▋ | 5767/12384 [12:14:09<14:04:47, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=11.74s]
Epoch 0: 47%|████▋ | 5768/12384 [12:14:09<14:04:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=11.74s]
Epoch 0: 47%|████▋ | 5768/12384 [12:14:16<14:04:05, 7.66s/it, loss=0.0014, acc=0.9975, iter_time=7.25s]
Epoch 0: 47%|████▋ | 5769/12384 [12:14:16<14:02:07, 7.64s/it, loss=0.0014, acc=0.9975, iter_time=7.25s]
Epoch 0: 47%|████▋ | 5769/12384 [12:14:24<14:02:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 47%|████▋ | 5770/12384 [12:14:24<14:01:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 47%|████▋ | 5770/12384 [12:14:31<14:01:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 47%|████▋ | 5771/12384 [12:14:31<13:59:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 47%|████▋ | 5771/12384 [12:14:39<13:59:45, 7.62s/it, loss=0.0004, acc=0.9965, iter_time=7.60s]
Epoch 0: 47%|████▋ | 5772/12384 [12:14:39<13:59:47, 7.62s/it, loss=0.0004, acc=0.9965, iter_time=7.60s]
Epoch 0: 47%|████▋ | 5772/12384 [12:14:47<13:59:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 47%|████▋ | 5773/12384 [12:14:47<13:59:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 47%|████▋ | 5773/12384 [12:14:54<13:59:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 47%|████▋ | 5774/12384 [12:14:54<13:58:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 47%|████▋ | 5774/12384 [12:15:02<13:58:52, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 47%|████▋ | 5775/12384 [12:15:02<13:58:20, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 47%|████▋ | 5775/12384 [12:15:09<13:58:20, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.98s]
Epoch 0: 47%|████▋ | 5776/12384 [12:15:09<13:58:18, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.98s]
Epoch 0: 47%|████▋ | 5776/12384 [12:15:17<13:58:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.47s]
Epoch 0: 47%|████▋ | 5777/12384 [12:15:17<13:58:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.47s]
Epoch 0: 47%|████▋ | 5777/12384 [12:15:25<13:58:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 47%|████▋ | 5778/12384 [12:15:25<14:01:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 47%|████▋ | 5778/12384 [12:15:33<14:01:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.81s]
Epoch 0: 47%|████▋ | 5779/12384 [12:15:33<14:08:55, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.81s]
Epoch 0: 47%|████▋ | 5779/12384 [12:15:40<14:08:55, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.58s]
Epoch 0: 47%|████▋ | 5780/12384 [12:15:40<14:04:43, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.58s]
Epoch 0: 47%|████▋ | 5780/12384 [12:15:48<14:04:43, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 0: 47%|████▋ | 5781/12384 [12:15:48<14:02:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 0: 47%|████▋ | 5781/12384 [12:15:56<14:02:54, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=9.91s]
Epoch 0: 47%|████▋ | 5782/12384 [12:15:56<14:03:17, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=9.91s]
Epoch 0: 47%|████▋ | 5782/12384 [12:16:03<14:03:17, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 47%|████▋ | 5783/12384 [12:16:03<14:01:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 47%|████▋ | 5783/12384 [12:16:11<14:01:55, 7.65s/it, loss=0.0005, acc=0.9983, iter_time=8.00s]
Epoch 0: 47%|████▋ | 5784/12384 [12:16:11<13:59:51, 7.64s/it, loss=0.0005, acc=0.9983, iter_time=8.00s]
Epoch 0: 47%|████▋ | 5784/12384 [12:16:18<13:59:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.73s]
Epoch 0: 47%|████▋ | 5785/12384 [12:16:18<13:59:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.73s]
Epoch 0: 47%|████▋ | 5785/12384 [12:16:26<13:59:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 0: 47%|████▋ | 5786/12384 [12:16:26<13:58:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 0: 47%|████▋ | 5786/12384 [12:16:34<13:58:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 47%|████▋ | 5787/12384 [12:16:34<13:57:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 47%|████▋ | 5787/12384 [12:16:41<13:57:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 47%|████▋ | 5788/12384 [12:16:41<13:57:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 47%|████▋ | 5788/12384 [12:16:49<13:57:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 47%|████▋ | 5789/12384 [12:16:49<13:56:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 47%|████▋ | 5789/12384 [12:16:56<13:56:36, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 47%|████▋ | 5790/12384 [12:16:56<13:56:22, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 47%|████▋ | 5790/12384 [12:17:04<13:56:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 47%|████▋ | 5791/12384 [12:17:04<13:55:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 47%|████▋ | 5791/12384 [12:17:12<13:55:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 0: 47%|████▋ | 5792/12384 [12:17:12<14:06:10, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 0: 47%|████▋ | 5792/12384 [12:17:20<14:06:10, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.47s]
Epoch 0: 47%|████▋ | 5793/12384 [12:17:20<14:02:35, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.47s]
Epoch 0: 47%|████▋ | 5793/12384 [12:17:27<14:02:35, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 47%|████▋ | 5794/12384 [12:17:27<14:00:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 47%|████▋ | 5794/12384 [12:17:35<14:00:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 47%|████▋ | 5795/12384 [12:17:35<13:59:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 47%|████▋ | 5795/12384 [12:17:42<13:59:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 47%|████▋ | 5796/12384 [12:17:42<13:58:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 47%|████▋ | 5796/12384 [12:17:50<13:58:41, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 47%|████▋ | 5797/12384 [12:17:50<13:57:33, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 47%|████▋ | 5797/12384 [12:17:58<13:57:33, 7.63s/it, loss=0.0005, acc=0.9976, iter_time=6.40s]
Epoch 0: 47%|████▋ | 5798/12384 [12:17:58<13:55:39, 7.61s/it, loss=0.0005, acc=0.9976, iter_time=6.40s]
Epoch 0: 47%|████▋ | 5798/12384 [12:18:05<13:55:39, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.75s]
Epoch 0: 47%|████▋ | 5799/12384 [12:18:05<13:59:07, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=5.75s]
Epoch 0: 47%|████▋ | 5799/12384 [12:18:13<13:59:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.14s]
Epoch 0: 47%|████▋ | 5800/12384 [12:18:13<13:57:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.14s]
Epoch 0: 47%|████▋ | 5800/12384 [12:18:21<13:57:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 47%|████▋ | 5801/12384 [12:18:21<13:56:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 47%|████▋ | 5801/12384 [12:18:28<13:56:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 47%|████▋ | 5802/12384 [12:18:28<13:55:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 47%|████▋ | 5802/12384 [12:18:36<13:55:56, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 47%|████▋ | 5803/12384 [12:18:36<13:55:45, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 47%|████▋ | 5803/12384 [12:18:43<13:55:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.88s]
Epoch 0: 47%|████▋ | 5804/12384 [12:18:43<13:57:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.88s]
Epoch 0: 47%|████▋ | 5804/12384 [12:18:51<13:57:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.72s]
Epoch 0: 47%|████▋ | 5805/12384 [12:18:51<14:05:43, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=11.72s]
Epoch 0: 47%|████▋ | 5805/12384 [12:18:59<14:05:43, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 47%|████▋ | 5806/12384 [12:18:59<14:02:22, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 47%|████▋ | 5806/12384 [12:19:07<14:02:22, 7.68s/it, loss=0.0001, acc=0.9998, iter_time=5.83s]
Epoch 0: 47%|████▋ | 5807/12384 [12:19:07<13:58:46, 7.65s/it, loss=0.0001, acc=0.9998, iter_time=5.83s]
Epoch 0: 47%|████▋ | 5807/12384 [12:19:14<13:58:46, 7.65s/it, loss=0.0009, acc=0.9983, iter_time=9.75s]
Epoch 0: 47%|████▋ | 5808/12384 [12:19:14<13:57:25, 7.64s/it, loss=0.0009, acc=0.9983, iter_time=9.75s]
Epoch 0: 47%|████▋ | 5808/12384 [12:19:22<13:57:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 47%|████▋ | 5809/12384 [12:19:22<13:56:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 47%|████▋ | 5809/12384 [12:19:29<13:56:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 47%|████▋ | 5810/12384 [12:19:29<13:55:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 47%|████▋ | 5810/12384 [12:19:37<13:55:46, 7.63s/it, loss=0.0008, acc=0.9983, iter_time=4.58s]
Epoch 0: 47%|████▋ | 5811/12384 [12:19:37<13:54:15, 7.62s/it, loss=0.0008, acc=0.9983, iter_time=4.58s]
Epoch 0: 47%|████▋ | 5811/12384 [12:19:45<13:54:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.59s]
Epoch 0: 47%|████▋ | 5812/12384 [12:19:45<13:54:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.59s]
Epoch 0: 47%|████▋ | 5812/12384 [12:19:52<13:54:25, 7.62s/it, loss=0.0002, acc=0.9997, iter_time=7.65s]
Epoch 0: 47%|████▋ | 5813/12384 [12:19:52<13:54:27, 7.62s/it, loss=0.0002, acc=0.9997, iter_time=7.65s]
Epoch 0: 47%|████▋ | 5813/12384 [12:20:00<13:54:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 47%|████▋ | 5814/12384 [12:20:00<13:53:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 47%|████▋ | 5814/12384 [12:20:07<13:53:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 47%|████▋ | 5815/12384 [12:20:07<13:53:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 47%|████▋ | 5815/12384 [12:20:15<13:53:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 47%|████▋ | 5816/12384 [12:20:15<13:55:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 47%|████▋ | 5816/12384 [12:20:23<13:55:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.15s]
Epoch 0: 47%|████▋ | 5817/12384 [12:20:23<13:54:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.15s]
Epoch 0: 47%|████▋ | 5817/12384 [12:20:31<13:54:27, 7.62s/it, loss=0.0002, acc=0.9999, iter_time=10.81s]
Epoch 0: 47%|████▋ | 5818/12384 [12:20:31<14:04:37, 7.72s/it, loss=0.0002, acc=0.9999, iter_time=10.81s]
Epoch 0: 47%|████▋ | 5818/12384 [12:20:38<14:04:37, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.34s]
Epoch 0: 47%|████▋ | 5819/12384 [12:20:38<14:02:24, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.34s]
Epoch 0: 47%|████▋ | 5819/12384 [12:20:46<14:02:24, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.21s]
Epoch 0: 47%|████▋ | 5820/12384 [12:20:46<14:00:11, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.21s]
Epoch 0: 47%|████▋ | 5820/12384 [12:20:53<14:00:11, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 47%|████▋ | 5821/12384 [12:20:53<13:56:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 47%|████▋ | 5821/12384 [12:21:01<13:56:55, 7.65s/it, loss=0.0002, acc=0.9995, iter_time=7.60s]
Epoch 0: 47%|████▋ | 5822/12384 [12:21:01<13:55:43, 7.64s/it, loss=0.0002, acc=0.9995, iter_time=7.60s]
Epoch 0: 47%|████▋ | 5822/12384 [12:21:09<13:55:43, 7.64s/it, loss=0.0003, acc=0.9980, iter_time=7.61s]
Epoch 0: 47%|████▋ | 5823/12384 [12:21:09<13:54:52, 7.63s/it, loss=0.0003, acc=0.9980, iter_time=7.61s]
Epoch 0: 47%|████▋ | 5823/12384 [12:21:16<13:54:52, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.01s]
Epoch 0: 47%|████▋ | 5824/12384 [12:21:16<13:54:20, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.01s]
Epoch 0: 47%|████▋ | 5824/12384 [12:21:24<13:54:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 47%|████▋ | 5825/12384 [12:21:24<13:53:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 47%|████▋ | 5825/12384 [12:21:32<13:53:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 47%|████▋ | 5826/12384 [12:21:32<13:52:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 47%|████▋ | 5826/12384 [12:21:39<13:52:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 47%|████▋ | 5827/12384 [12:21:39<13:52:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 47%|████▋ | 5827/12384 [12:21:47<13:52:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 47%|████▋ | 5828/12384 [12:21:47<13:51:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 47%|████▋ | 5828/12384 [12:21:54<13:51:26, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 47%|████▋ | 5829/12384 [12:21:54<13:51:25, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 47%|████▋ | 5829/12384 [12:22:02<13:51:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 0: 47%|████▋ | 5830/12384 [12:22:02<13:51:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 0: 47%|████▋ | 5830/12384 [12:22:10<13:51:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 0: 47%|████▋ | 5831/12384 [12:22:10<14:00:04, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 0: 47%|████▋ | 5831/12384 [12:22:17<14:00:04, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 47%|████▋ | 5832/12384 [12:22:17<13:57:36, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 47%|████▋ | 5832/12384 [12:22:25<13:57:36, 7.67s/it, loss=0.0003, acc=0.9976, iter_time=7.21s]
Epoch 0: 47%|████▋ | 5833/12384 [12:22:25<13:55:37, 7.65s/it, loss=0.0003, acc=0.9976, iter_time=7.21s]
Epoch 0: 47%|████▋ | 5833/12384 [12:22:33<13:55:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 0: 47%|████▋ | 5834/12384 [12:22:33<13:54:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 0: 47%|████▋ | 5834/12384 [12:22:40<13:54:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.63s]
Epoch 0: 47%|████▋ | 5835/12384 [12:22:40<13:53:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.63s]
Epoch 0: 47%|████▋ | 5835/12384 [12:22:48<13:53:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 0: 47%|████▋ | 5836/12384 [12:22:48<13:52:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 0: 47%|████▋ | 5836/12384 [12:22:56<13:52:07, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 47%|████▋ | 5837/12384 [12:22:56<13:51:21, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 47%|████▋ | 5837/12384 [12:23:03<13:51:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 47%|████▋ | 5838/12384 [12:23:03<13:51:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 47%|████▋ | 5838/12384 [12:23:11<13:51:32, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 0: 47%|████▋ | 5839/12384 [12:23:11<13:50:36, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 0: 47%|████▋ | 5839/12384 [12:23:18<13:50:36, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.95s]
Epoch 0: 47%|████▋ | 5840/12384 [12:23:18<13:50:11, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.95s]
Epoch 0: 47%|████▋ | 5840/12384 [12:23:26<13:50:11, 7.61s/it, loss=0.0002, acc=0.9998, iter_time=7.22s]
Epoch 0: 47%|████▋ | 5841/12384 [12:23:26<13:49:50, 7.61s/it, loss=0.0002, acc=0.9998, iter_time=7.22s]
Epoch 0: 47%|████▋ | 5841/12384 [12:23:34<13:49:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 47%|████▋ | 5842/12384 [12:23:34<13:51:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 47%|████▋ | 5842/12384 [12:23:41<13:51:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 0: 47%|████▋ | 5843/12384 [12:23:41<13:51:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 0: 47%|████▋ | 5843/12384 [12:23:49<13:51:07, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=9.41s]
Epoch 0: 47%|████▋ | 5844/12384 [12:23:49<13:50:58, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=9.41s]
Epoch 0: 47%|████▋ | 5844/12384 [12:23:57<13:50:58, 7.62s/it, loss=0.0001, acc=0.9995, iter_time=7.67s]
Epoch 0: 47%|████▋ | 5845/12384 [12:23:57<14:03:52, 7.74s/it, loss=0.0001, acc=0.9995, iter_time=7.67s]
Epoch 0: 47%|████▋ | 5845/12384 [12:24:05<14:03:52, 7.74s/it, loss=0.0001, acc=1.0000, iter_time=7.98s]
Epoch 0: 47%|████▋ | 5846/12384 [12:24:05<13:59:38, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.98s]
Epoch 0: 47%|████▋ | 5846/12384 [12:24:12<13:59:38, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 0: 47%|████▋ | 5847/12384 [12:24:12<13:59:38, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 0: 47%|████▋ | 5847/12384 [12:24:20<13:59:38, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=8.41s]
Epoch 0: 47%|████▋ | 5848/12384 [12:24:20<13:57:05, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=8.41s]
Epoch 0: 47%|████▋ | 5848/12384 [12:24:27<13:57:05, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 47%|████▋ | 5849/12384 [12:24:27<13:54:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 47%|████▋ | 5849/12384 [12:24:35<13:54:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 47%|████▋ | 5850/12384 [12:24:35<13:52:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 47%|████▋ | 5850/12384 [12:24:43<13:52:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 47%|████▋ | 5851/12384 [12:24:43<13:51:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 47%|████▋ | 5851/12384 [12:24:50<13:51:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 47%|████▋ | 5852/12384 [12:24:50<13:50:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 47%|████▋ | 5852/12384 [12:24:58<13:50:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 0: 47%|████▋ | 5853/12384 [12:24:58<13:49:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 0: 47%|████▋ | 5853/12384 [12:25:06<13:49:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 47%|████▋ | 5854/12384 [12:25:06<13:49:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 47%|████▋ | 5854/12384 [12:25:13<13:49:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 47%|████▋ | 5855/12384 [12:25:13<13:48:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 47%|████▋ | 5855/12384 [12:25:21<13:48:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 0: 47%|████▋ | 5856/12384 [12:25:21<13:48:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 0: 47%|████▋ | 5856/12384 [12:25:29<13:48:02, 7.61s/it, loss=0.0005, acc=0.9978, iter_time=7.95s]
Epoch 0: 47%|████▋ | 5857/12384 [12:25:29<13:57:15, 7.70s/it, loss=0.0005, acc=0.9978, iter_time=7.95s]
Epoch 0: 47%|████▋ | 5857/12384 [12:25:36<13:57:15, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 0: 47%|████▋ | 5858/12384 [12:25:36<13:54:35, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 0: 47%|████▋ | 5858/12384 [12:25:44<13:54:35, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 0: 47%|████▋ | 5859/12384 [12:25:44<13:52:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 0: 47%|████▋ | 5859/12384 [12:25:51<13:52:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.01s]
Epoch 0: 47%|████▋ | 5860/12384 [12:25:51<13:50:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.01s]
Epoch 0: 47%|████▋ | 5860/12384 [12:25:59<13:50:37, 7.64s/it, loss=0.0003, acc=0.9995, iter_time=10.25s]
Epoch 0: 47%|████▋ | 5861/12384 [12:25:59<13:48:46, 7.62s/it, loss=0.0003, acc=0.9995, iter_time=10.25s]
Epoch 0: 47%|████▋ | 5861/12384 [12:26:07<13:48:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.94s]
Epoch 0: 47%|████▋ | 5862/12384 [12:26:07<13:48:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.94s]
Epoch 0: 47%|████▋ | 5862/12384 [12:26:14<13:48:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 0: 47%|████▋ | 5863/12384 [12:26:14<13:48:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 0: 47%|████▋ | 5863/12384 [12:26:22<13:48:06, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.51s]
Epoch 0: 47%|████▋ | 5864/12384 [12:26:22<13:48:51, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.51s]
Epoch 0: 47%|████▋ | 5864/12384 [12:26:30<13:48:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.66s]
Epoch 0: 47%|████▋ | 5865/12384 [12:26:30<13:48:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.66s]
Epoch 0: 47%|████▋ | 5865/12384 [12:26:37<13:48:37, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=11.20s]
Epoch 0: 47%|████▋ | 5866/12384 [12:26:37<13:47:48, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=11.20s]
Epoch 0: 47%|████▋ | 5866/12384 [12:26:45<13:47:48, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 47%|████▋ | 5867/12384 [12:26:45<13:46:53, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 47%|████▋ | 5867/12384 [12:26:52<13:46:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 0: 47%|████▋ | 5868/12384 [12:26:52<13:45:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 0: 47%|████▋ | 5868/12384 [12:27:00<13:45:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 0: 47%|████▋ | 5869/12384 [12:27:00<13:45:08, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 0: 47%|████▋ | 5869/12384 [12:27:08<13:45:08, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=9.69s]
Epoch 0: 47%|████▋ | 5870/12384 [12:27:08<13:46:02, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.69s]
Epoch 0: 47%|████▋ | 5870/12384 [12:27:16<13:46:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 47%|████▋ | 5871/12384 [12:27:16<13:56:50, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 47%|████▋ | 5871/12384 [12:27:23<13:56:50, 7.71s/it, loss=0.0002, acc=1.0000, iter_time=8.30s]
Epoch 0: 47%|████▋ | 5872/12384 [12:27:23<13:54:19, 7.69s/it, loss=0.0002, acc=1.0000, iter_time=8.30s]
Epoch 0: 47%|████▋ | 5872/12384 [12:27:31<13:54:19, 7.69s/it, loss=0.0003, acc=0.9999, iter_time=7.23s]
Epoch 0: 47%|████▋ | 5873/12384 [12:27:31<13:52:18, 7.67s/it, loss=0.0003, acc=0.9999, iter_time=7.23s]
Epoch 0: 47%|████▋ | 5873/12384 [12:27:38<13:52:18, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 47%|████▋ | 5874/12384 [12:27:38<13:50:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 47%|████▋ | 5874/12384 [12:27:46<13:50:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 47%|████▋ | 5875/12384 [12:27:46<13:48:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 47%|████▋ | 5875/12384 [12:27:54<13:48:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 47%|████▋ | 5876/12384 [12:27:54<13:47:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 47%|████▋ | 5876/12384 [12:28:01<13:47:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 47%|████▋ | 5877/12384 [12:28:01<13:46:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 47%|████▋ | 5877/12384 [12:28:09<13:46:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 0: 47%|████▋ | 5878/12384 [12:28:09<13:45:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 0: 47%|████▋ | 5878/12384 [12:28:17<13:45:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 0: 47%|████▋ | 5879/12384 [12:28:17<13:48:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 0: 47%|████▋ | 5879/12384 [12:28:24<13:48:54, 7.65s/it, loss=0.0004, acc=0.9997, iter_time=8.09s]
Epoch 0: 47%|████▋ | 5880/12384 [12:28:24<13:48:11, 7.64s/it, loss=0.0004, acc=0.9997, iter_time=8.09s]
Epoch 0: 47%|████▋ | 5880/12384 [12:28:32<13:48:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.70s]
Epoch 0: 47%|████▋ | 5881/12384 [12:28:32<13:46:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.70s]
Epoch 0: 47%|████▋ | 5881/12384 [12:28:39<13:46:42, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.35s]
Epoch 0: 47%|████▋ | 5882/12384 [12:28:39<13:46:46, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.35s]
Epoch 0: 47%|████▋ | 5882/12384 [12:28:47<13:46:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.75s]
Epoch 0: 48%|████▊ | 5883/12384 [12:28:47<13:55:58, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.75s]
Epoch 0: 48%|████▊ | 5883/12384 [12:28:55<13:55:58, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 48%|████▊ | 5884/12384 [12:28:55<13:52:05, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 48%|████▊ | 5884/12384 [12:29:02<13:52:05, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 0: 48%|████▊ | 5885/12384 [12:29:02<13:48:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 0: 48%|████▊ | 5885/12384 [12:29:10<13:48:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.36s]
Epoch 0: 48%|████▊ | 5886/12384 [12:29:10<13:46:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.36s]
Epoch 0: 48%|████▊ | 5886/12384 [12:29:18<13:46:54, 7.64s/it, loss=0.0004, acc=0.9969, iter_time=4.28s]
Epoch 0: 48%|████▊ | 5887/12384 [12:29:18<13:45:58, 7.63s/it, loss=0.0004, acc=0.9969, iter_time=4.28s]
Epoch 0: 48%|████▊ | 5887/12384 [12:29:25<13:45:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.30s]
Epoch 0: 48%|████▊ | 5888/12384 [12:29:25<13:45:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.30s]
Epoch 0: 48%|████▊ | 5888/12384 [12:29:33<13:45:20, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.24s]
Epoch 0: 48%|████▊ | 5889/12384 [12:29:33<13:44:16, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.24s]
Epoch 0: 48%|████▊ | 5889/12384 [12:29:40<13:44:16, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 48%|████▊ | 5890/12384 [12:29:40<13:44:05, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 48%|████▊ | 5890/12384 [12:29:48<13:44:05, 7.61s/it, loss=0.0013, acc=0.9979, iter_time=4.98s]
Epoch 0: 48%|████▊ | 5891/12384 [12:29:48<13:46:08, 7.63s/it, loss=0.0013, acc=0.9979, iter_time=4.98s]
Epoch 0: 48%|████▊ | 5891/12384 [12:29:56<13:46:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.30s]
Epoch 0: 48%|████▊ | 5892/12384 [12:29:56<13:44:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.30s]
Epoch 0: 48%|████▊ | 5892/12384 [12:30:03<13:44:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 48%|████▊ | 5893/12384 [12:30:03<13:43:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 48%|████▊ | 5893/12384 [12:30:11<13:43:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 0: 48%|████▊ | 5894/12384 [12:30:11<13:43:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 0: 48%|████▊ | 5894/12384 [12:30:19<13:43:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.12s]
Epoch 0: 48%|████▊ | 5895/12384 [12:30:19<13:42:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.12s]
Epoch 0: 48%|████▊ | 5895/12384 [12:30:26<13:42:25, 7.60s/it, loss=0.0009, acc=0.9966, iter_time=7.55s]
Epoch 0: 48%|████▊ | 5896/12384 [12:30:26<13:42:25, 7.61s/it, loss=0.0009, acc=0.9966, iter_time=7.55s]
Epoch 0: 48%|████▊ | 5896/12384 [12:30:34<13:42:25, 7.61s/it, loss=0.0003, acc=0.9983, iter_time=7.69s]
Epoch 0: 48%|████▊ | 5897/12384 [12:30:34<13:53:16, 7.71s/it, loss=0.0003, acc=0.9983, iter_time=7.69s]
Epoch 0: 48%|████▊ | 5897/12384 [12:30:42<13:53:16, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 48%|████▊ | 5898/12384 [12:30:42<13:50:35, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 48%|████▊ | 5898/12384 [12:30:49<13:50:35, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 0: 48%|████▊ | 5899/12384 [12:30:49<13:48:27, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 0: 48%|████▊ | 5899/12384 [12:30:57<13:48:27, 7.67s/it, loss=0.0002, acc=0.9985, iter_time=10.13s]
Epoch 0: 48%|████▊ | 5900/12384 [12:30:57<13:46:50, 7.65s/it, loss=0.0002, acc=0.9985, iter_time=10.13s]
Epoch 0: 48%|████▊ | 5900/12384 [12:31:05<13:46:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.28s]
Epoch 0: 48%|████▊ | 5901/12384 [12:31:05<13:45:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.28s]
Epoch 0: 48%|████▊ | 5901/12384 [12:31:12<13:45:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.55s]
Epoch 0: 48%|████▊ | 5902/12384 [12:31:12<13:43:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.55s]
Epoch 0: 48%|████▊ | 5902/12384 [12:31:20<13:43:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.57s]
Epoch 0: 48%|████▊ | 5903/12384 [12:31:20<13:42:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.57s]
Epoch 0: 48%|████▊ | 5903/12384 [12:31:27<13:42:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 48%|████▊ | 5904/12384 [12:31:27<13:42:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 48%|████▊ | 5904/12384 [12:31:35<13:42:31, 7.62s/it, loss=0.0005, acc=0.9989, iter_time=7.66s]
Epoch 0: 48%|████▊ | 5905/12384 [12:31:35<13:41:59, 7.61s/it, loss=0.0005, acc=0.9989, iter_time=7.66s]
Epoch 0: 48%|████▊ | 5905/12384 [12:31:43<13:41:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 0: 48%|████▊ | 5906/12384 [12:31:43<13:41:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 0: 48%|████▊ | 5906/12384 [12:31:50<13:41:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 48%|████▊ | 5907/12384 [12:31:50<13:42:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 48%|████▊ | 5907/12384 [12:31:58<13:42:23, 7.62s/it, loss=0.0002, acc=0.9991, iter_time=10.20s]
Epoch 0: 48%|████▊ | 5908/12384 [12:31:58<13:41:45, 7.61s/it, loss=0.0002, acc=0.9991, iter_time=10.20s]
Epoch 0: 48%|████▊ | 5908/12384 [12:32:05<13:41:45, 7.61s/it, loss=0.0002, acc=0.9998, iter_time=7.61s]
Epoch 0: 48%|████▊ | 5909/12384 [12:32:05<13:41:20, 7.61s/it, loss=0.0002, acc=0.9998, iter_time=7.61s]
Epoch 0: 48%|████▊ | 5909/12384 [12:32:13<13:41:20, 7.61s/it, loss=0.0003, acc=0.9999, iter_time=7.32s]
Epoch 0: 48%|████▊ | 5910/12384 [12:32:13<13:40:38, 7.61s/it, loss=0.0003, acc=0.9999, iter_time=7.32s]
Epoch 0: 48%|████▊ | 5910/12384 [12:32:21<13:40:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 0: 48%|████▊ | 5911/12384 [12:32:21<13:41:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 0: 48%|████▊ | 5911/12384 [12:32:28<13:41:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 0: 48%|████▊ | 5912/12384 [12:32:28<13:41:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 0: 48%|████▊ | 5912/12384 [12:32:36<13:41:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 48%|████▊ | 5913/12384 [12:32:36<13:40:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 48%|████▊ | 5913/12384 [12:32:43<13:40:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 48%|████▊ | 5914/12384 [12:32:43<13:39:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 48%|████▊ | 5914/12384 [12:32:51<13:39:49, 7.60s/it, loss=0.0004, acc=0.9986, iter_time=5.06s]
Epoch 0: 48%|████▊ | 5915/12384 [12:32:51<13:40:26, 7.61s/it, loss=0.0004, acc=0.9986, iter_time=5.06s]
Epoch 0: 48%|████▊ | 5915/12384 [12:32:59<13:40:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 0: 48%|████▊ | 5916/12384 [12:32:59<13:40:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 0: 48%|████▊ | 5916/12384 [12:33:06<13:40:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 48%|████▊ | 5917/12384 [12:33:06<13:41:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 48%|████▊ | 5917/12384 [12:33:14<13:41:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 48%|████▊ | 5918/12384 [12:33:14<13:40:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 48%|████▊ | 5918/12384 [12:33:22<13:40:34, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 48%|████▊ | 5919/12384 [12:33:22<13:42:21, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 48%|████▊ | 5919/12384 [12:33:29<13:42:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 0: 48%|████▊ | 5920/12384 [12:33:29<13:42:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 0: 48%|████▊ | 5920/12384 [12:33:37<13:42:03, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=3.72s]
Epoch 0: 48%|████▊ | 5921/12384 [12:33:37<13:41:06, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=3.72s]
Epoch 0: 48%|████▊ | 5921/12384 [12:33:44<13:41:06, 7.62s/it, loss=0.0010, acc=1.0000, iter_time=11.13s]
Epoch 0: 48%|████▊ | 5922/12384 [12:33:44<13:41:07, 7.62s/it, loss=0.0010, acc=1.0000, iter_time=11.13s]
Epoch 0: 48%|████▊ | 5922/12384 [12:33:52<13:41:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 0: 48%|████▊ | 5923/12384 [12:33:52<13:50:53, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 0: 48%|████▊ | 5923/12384 [12:34:00<13:50:53, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 0: 48%|████▊ | 5924/12384 [12:34:00<13:48:02, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 0: 48%|████▊ | 5924/12384 [12:34:08<13:48:02, 7.69s/it, loss=0.0002, acc=1.0000, iter_time=6.69s]
Epoch 0: 48%|████▊ | 5925/12384 [12:34:08<13:45:18, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=6.69s]
Epoch 0: 48%|████▊ | 5925/12384 [12:34:15<13:45:18, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=8.53s]
Epoch 0: 48%|████▊ | 5926/12384 [12:34:15<13:43:15, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.53s]
Epoch 0: 48%|████▊ | 5926/12384 [12:34:23<13:43:15, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 48%|████▊ | 5927/12384 [12:34:23<13:42:56, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 48%|████▊ | 5927/12384 [12:34:31<13:42:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 48%|████▊ | 5928/12384 [12:34:31<13:42:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 48%|████▊ | 5928/12384 [12:34:38<13:42:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 48%|████▊ | 5929/12384 [12:34:38<13:40:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 48%|████▊ | 5929/12384 [12:34:46<13:40:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 0: 48%|████▊ | 5930/12384 [12:34:46<13:39:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 0: 48%|████▊ | 5930/12384 [12:34:53<13:39:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 0: 48%|████▊ | 5931/12384 [12:34:53<13:39:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 0: 48%|████▊ | 5931/12384 [12:35:01<13:39:24, 7.62s/it, loss=0.0002, acc=0.9997, iter_time=4.10s]
Epoch 0: 48%|████▊ | 5932/12384 [12:35:01<13:39:35, 7.62s/it, loss=0.0002, acc=0.9997, iter_time=4.10s]
Epoch 0: 48%|████▊ | 5932/12384 [12:35:09<13:39:35, 7.62s/it, loss=0.0016, acc=0.9978, iter_time=11.17s]
Epoch 0: 48%|████▊ | 5933/12384 [12:35:09<13:39:44, 7.62s/it, loss=0.0016, acc=0.9978, iter_time=11.17s]
Epoch 0: 48%|████▊ | 5933/12384 [12:35:16<13:39:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 48%|████▊ | 5934/12384 [12:35:16<13:39:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 48%|████▊ | 5934/12384 [12:35:24<13:39:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 0: 48%|████▊ | 5935/12384 [12:35:24<13:39:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 0: 48%|████▊ | 5935/12384 [12:35:31<13:39:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.66s]
Epoch 0: 48%|████▊ | 5936/12384 [12:35:31<13:39:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.66s]
Epoch 0: 48%|████▊ | 5936/12384 [12:35:39<13:39:27, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.52s]
Epoch 0: 48%|████▊ | 5937/12384 [12:35:39<13:47:43, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.52s]
Epoch 0: 48%|████▊ | 5937/12384 [12:35:47<13:47:43, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.70s]
Epoch 0: 48%|████▊ | 5938/12384 [12:35:47<13:47:28, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.70s]
Epoch 0: 48%|████▊ | 5938/12384 [12:35:55<13:47:28, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 48%|████▊ | 5939/12384 [12:35:55<13:44:09, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 48%|████▊ | 5939/12384 [12:36:02<13:44:09, 7.67s/it, loss=0.0002, acc=0.9982, iter_time=5.81s]
Epoch 0: 48%|████▊ | 5940/12384 [12:36:02<13:41:29, 7.65s/it, loss=0.0002, acc=0.9982, iter_time=5.81s]
Epoch 0: 48%|████▊ | 5940/12384 [12:36:10<13:41:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 0: 48%|████▊ | 5941/12384 [12:36:10<13:40:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 0: 48%|████▊ | 5941/12384 [12:36:17<13:40:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.60s]
Epoch 0: 48%|████▊ | 5942/12384 [12:36:17<13:39:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.60s]
Epoch 0: 48%|████▊ | 5942/12384 [12:36:25<13:39:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 0: 48%|████▊ | 5943/12384 [12:36:25<13:38:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 0: 48%|████▊ | 5943/12384 [12:36:33<13:38:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 0: 48%|████▊ | 5944/12384 [12:36:33<13:37:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 0: 48%|████▊ | 5944/12384 [12:36:40<13:37:23, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 48%|████▊ | 5945/12384 [12:36:40<13:36:40, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 48%|████▊ | 5945/12384 [12:36:48<13:36:40, 7.61s/it, loss=0.0004, acc=0.9998, iter_time=7.62s]
Epoch 0: 48%|████▊ | 5946/12384 [12:36:48<13:36:19, 7.61s/it, loss=0.0004, acc=0.9998, iter_time=7.62s]
Epoch 0: 48%|████▊ | 5946/12384 [12:36:56<13:36:19, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 48%|████▊ | 5947/12384 [12:36:56<13:36:22, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 48%|████▊ | 5947/12384 [12:37:03<13:36:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 48%|████▊ | 5948/12384 [12:37:03<13:36:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 48%|████▊ | 5948/12384 [12:37:11<13:36:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 48%|████▊ | 5949/12384 [12:37:11<13:47:27, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 48%|████▊ | 5949/12384 [12:37:19<13:47:27, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.38s]
Epoch 0: 48%|████▊ | 5950/12384 [12:37:19<13:46:34, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.38s]
Epoch 0: 48%|████▊ | 5950/12384 [12:37:26<13:46:34, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 48%|████▊ | 5951/12384 [12:37:26<13:42:58, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 48%|████▊ | 5951/12384 [12:37:34<13:42:58, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 48%|████▊ | 5952/12384 [12:37:34<13:41:04, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 48%|████▊ | 5952/12384 [12:37:42<13:41:04, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 48%|████▊ | 5953/12384 [12:37:42<13:39:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 48%|████▊ | 5953/12384 [12:37:49<13:39:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 48%|████▊ | 5954/12384 [12:37:49<13:37:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 48%|████▊ | 5954/12384 [12:37:57<13:37:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 0: 48%|████▊ | 5955/12384 [12:37:57<13:37:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 0: 48%|████▊ | 5955/12384 [12:38:05<13:37:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.73s]
Epoch 0: 48%|████▊ | 5956/12384 [12:38:05<13:39:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.73s]
Epoch 0: 48%|████▊ | 5956/12384 [12:38:12<13:39:16, 7.65s/it, loss=0.0004, acc=0.9990, iter_time=10.20s]
Epoch 0: 48%|████▊ | 5957/12384 [12:38:12<13:38:13, 7.64s/it, loss=0.0004, acc=0.9990, iter_time=10.20s]
Epoch 0: 48%|████▊ | 5957/12384 [12:38:20<13:38:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.59s]
Epoch 0: 48%|████▊ | 5958/12384 [12:38:20<13:36:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.59s]
Epoch 0: 48%|████▊ | 5958/12384 [12:38:27<13:36:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 0: 48%|████▊ | 5959/12384 [12:38:27<13:36:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 0: 48%|████▊ | 5959/12384 [12:38:35<13:36:47, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.52s]
Epoch 0: 48%|████▊ | 5960/12384 [12:38:35<13:36:32, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.52s]
Epoch 0: 48%|████▊ | 5960/12384 [12:38:43<13:36:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 48%|████▊ | 5961/12384 [12:38:43<13:35:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 48%|████▊ | 5961/12384 [12:38:50<13:35:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 48%|████▊ | 5962/12384 [12:38:50<13:35:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 48%|████▊ | 5962/12384 [12:38:58<13:35:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 48%|████▊ | 5963/12384 [12:38:58<13:44:41, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 48%|████▊ | 5963/12384 [12:39:06<13:44:41, 7.71s/it, loss=0.0036, acc=0.9895, iter_time=7.04s]
Epoch 0: 48%|████▊ | 5964/12384 [12:39:06<13:41:15, 7.68s/it, loss=0.0036, acc=0.9895, iter_time=7.04s]
Epoch 0: 48%|████▊ | 5964/12384 [12:39:13<13:41:15, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 0: 48%|████▊ | 5965/12384 [12:39:13<13:39:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 0: 48%|████▊ | 5965/12384 [12:39:21<13:39:09, 7.66s/it, loss=0.0003, acc=0.9984, iter_time=7.64s]
Epoch 0: 48%|████▊ | 5966/12384 [12:39:21<13:37:58, 7.65s/it, loss=0.0003, acc=0.9984, iter_time=7.64s]
Epoch 0: 48%|████▊ | 5966/12384 [12:39:29<13:37:58, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 48%|████▊ | 5967/12384 [12:39:29<13:36:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 48%|████▊ | 5967/12384 [12:39:36<13:36:50, 7.64s/it, loss=0.0001, acc=0.9996, iter_time=7.97s]
Epoch 0: 48%|████▊ | 5968/12384 [12:39:36<13:39:01, 7.66s/it, loss=0.0001, acc=0.9996, iter_time=7.97s]
Epoch 0: 48%|████▊ | 5968/12384 [12:39:44<13:39:01, 7.66s/it, loss=0.0002, acc=0.9993, iter_time=7.33s]
Epoch 0: 48%|████▊ | 5969/12384 [12:39:44<13:37:54, 7.65s/it, loss=0.0002, acc=0.9993, iter_time=7.33s]
Epoch 0: 48%|████▊ | 5969/12384 [12:39:52<13:37:54, 7.65s/it, loss=0.0002, acc=0.9994, iter_time=7.64s]
Epoch 0: 48%|████▊ | 5970/12384 [12:39:52<13:36:26, 7.64s/it, loss=0.0002, acc=0.9994, iter_time=7.64s]
Epoch 0: 48%|████▊ | 5970/12384 [12:39:59<13:36:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 48%|████▊ | 5971/12384 [12:39:59<13:34:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 48%|████▊ | 5971/12384 [12:40:07<13:34:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 48%|████▊ | 5972/12384 [12:40:07<13:33:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 48%|████▊ | 5972/12384 [12:40:14<13:33:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 48%|████▊ | 5973/12384 [12:40:14<13:33:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 48%|████▊ | 5973/12384 [12:40:22<13:33:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 48%|████▊ | 5974/12384 [12:40:22<13:33:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 48%|████▊ | 5974/12384 [12:40:30<13:33:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 48%|████▊ | 5975/12384 [12:40:30<13:32:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 48%|████▊ | 5975/12384 [12:40:38<13:32:49, 7.61s/it, loss=0.0002, acc=0.9998, iter_time=8.05s]
Epoch 0: 48%|████▊ | 5976/12384 [12:40:38<13:45:01, 7.72s/it, loss=0.0002, acc=0.9998, iter_time=8.05s]
Epoch 0: 48%|████▊ | 5976/12384 [12:40:45<13:45:01, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 48%|████▊ | 5977/12384 [12:40:45<13:41:39, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 48%|████▊ | 5977/12384 [12:40:53<13:41:39, 7.69s/it, loss=0.0002, acc=1.0000, iter_time=4.79s]
Epoch 0: 48%|████▊ | 5978/12384 [12:40:53<13:39:09, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=4.79s]
Epoch 0: 48%|████▊ | 5978/12384 [12:41:00<13:39:09, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.96s]
Epoch 0: 48%|████▊ | 5979/12384 [12:41:00<13:36:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.96s]
Epoch 0: 48%|████▊ | 5979/12384 [12:41:08<13:36:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 0: 48%|████▊ | 5980/12384 [12:41:08<13:34:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 0: 48%|████▊ | 5980/12384 [12:41:16<13:34:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 48%|████▊ | 5981/12384 [12:41:16<13:34:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 48%|████▊ | 5981/12384 [12:41:23<13:34:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 48%|████▊ | 5982/12384 [12:41:23<13:35:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 48%|████▊ | 5982/12384 [12:41:31<13:35:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 48%|████▊ | 5983/12384 [12:41:31<13:36:46, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 48%|████▊ | 5983/12384 [12:41:39<13:36:46, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=8.06s]
Epoch 0: 48%|████▊ | 5984/12384 [12:41:39<13:35:46, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.06s]
Epoch 0: 48%|████▊ | 5984/12384 [12:41:46<13:35:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.02s]
Epoch 0: 48%|████▊ | 5985/12384 [12:41:46<13:34:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.02s]
Epoch 0: 48%|████▊ | 5985/12384 [12:41:54<13:34:13, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.84s]
Epoch 0: 48%|████▊ | 5986/12384 [12:41:54<13:33:33, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.84s]
Epoch 0: 48%|████▊ | 5986/12384 [12:42:01<13:33:33, 7.63s/it, loss=0.0002, acc=0.9981, iter_time=7.60s]
Epoch 0: 48%|████▊ | 5987/12384 [12:42:01<13:32:55, 7.62s/it, loss=0.0002, acc=0.9981, iter_time=7.60s]
Epoch 0: 48%|████▊ | 5987/12384 [12:42:09<13:32:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 48%|████▊ | 5988/12384 [12:42:09<13:32:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 48%|████▊ | 5988/12384 [12:42:17<13:32:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 48%|████▊ | 5989/12384 [12:42:17<13:41:11, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 48%|████▊ | 5989/12384 [12:42:25<13:41:11, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.45s]
Epoch 0: 48%|████▊ | 5990/12384 [12:42:25<13:38:34, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.45s]
Epoch 0: 48%|████▊ | 5990/12384 [12:42:32<13:38:34, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 0: 48%|████▊ | 5991/12384 [12:42:32<13:35:44, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 0: 48%|████▊ | 5991/12384 [12:42:40<13:35:44, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=10.78s]
Epoch 0: 48%|████▊ | 5992/12384 [12:42:40<13:34:14, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=10.78s]
Epoch 0: 48%|████▊ | 5992/12384 [12:42:47<13:34:14, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.23s]
Epoch 0: 48%|████▊ | 5993/12384 [12:42:47<13:32:29, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.23s]
Epoch 0: 48%|████▊ | 5993/12384 [12:42:55<13:32:29, 7.63s/it, loss=0.0007, acc=0.9997, iter_time=5.33s]
Epoch 0: 48%|████▊ | 5994/12384 [12:42:55<13:31:23, 7.62s/it, loss=0.0007, acc=0.9997, iter_time=5.33s]
Epoch 0: 48%|████▊ | 5994/12384 [12:43:03<13:31:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.28s]
Epoch 0: 48%|████▊ | 5995/12384 [12:43:03<13:31:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.28s]
Epoch 0: 48%|████▊ | 5995/12384 [12:43:10<13:31:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.21s]
Epoch 0: 48%|████▊ | 5996/12384 [12:43:10<13:31:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.21s]
Epoch 0: 48%|████▊ | 5996/12384 [12:43:18<13:31:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 48%|████▊ | 5997/12384 [12:43:18<13:30:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 48%|████▊ | 5997/12384 [12:43:25<13:30:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 48%|████▊ | 5998/12384 [12:43:25<13:32:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 48%|████▊ | 5998/12384 [12:43:33<13:32:19, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=4.53s]
Epoch 0: 48%|████▊ | 5999/12384 [12:43:33<13:31:19, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=4.53s]
Epoch 0: 48%|████▊ | 5999/12384 [12:43:41<13:31:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.23s]
Epoch 0: 48%|████▊ | 6000/12384 [12:43:41<13:39:43, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=11.23s]
Epoch 0: 48%|████▊ | 6000/12384 [12:43:49<13:39:43, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 0: 48%|████▊ | 6001/12384 [12:43:49<13:35:46, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 0: 48%|████▊ | 6001/12384 [12:43:57<13:35:46, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.50s]
Epoch 0: 48%|████▊ | 6002/12384 [12:43:57<13:45:09, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=4.50s]
Epoch 0: 48%|████▊ | 6002/12384 [12:44:04<13:45:09, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=11.07s]
Epoch 0: 48%|████▊ | 6003/12384 [12:44:04<13:40:39, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=11.07s]
Epoch 0: 48%|████▊ | 6003/12384 [12:44:12<13:40:39, 7.72s/it, loss=0.0002, acc=0.9990, iter_time=6.42s]
Epoch 0: 48%|████▊ | 6004/12384 [12:44:12<13:36:20, 7.68s/it, loss=0.0002, acc=0.9990, iter_time=6.42s]
Epoch 0: 48%|████▊ | 6004/12384 [12:44:19<13:36:20, 7.68s/it, loss=0.0005, acc=0.9966, iter_time=8.78s]
Epoch 0: 48%|████▊ | 6005/12384 [12:44:19<13:34:09, 7.66s/it, loss=0.0005, acc=0.9966, iter_time=8.78s]
Epoch 0: 48%|████▊ | 6005/12384 [12:44:27<13:34:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 48%|████▊ | 6006/12384 [12:44:27<13:32:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 48%|████▊ | 6006/12384 [12:44:35<13:32:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 49%|████▊ | 6007/12384 [12:44:35<13:31:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 49%|████▊ | 6007/12384 [12:44:42<13:31:12, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 0: 49%|████▊ | 6008/12384 [12:44:42<13:30:55, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 0: 49%|████▊ | 6008/12384 [12:44:50<13:30:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 49%|████▊ | 6009/12384 [12:44:50<13:30:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 49%|████▊ | 6009/12384 [12:44:57<13:30:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 0: 49%|████▊ | 6010/12384 [12:44:57<13:29:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 0: 49%|████▊ | 6010/12384 [12:45:05<13:29:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 0: 49%|████▊ | 6011/12384 [12:45:05<13:28:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 0: 49%|████▊ | 6011/12384 [12:45:13<13:28:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 49%|████▊ | 6012/12384 [12:45:13<13:28:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 49%|████▊ | 6012/12384 [12:45:20<13:28:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 49%|████▊ | 6013/12384 [12:45:20<13:28:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 49%|████▊ | 6013/12384 [12:45:28<13:28:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 49%|████▊ | 6014/12384 [12:45:28<13:37:57, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 49%|████▊ | 6014/12384 [12:45:36<13:37:57, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 49%|████▊ | 6015/12384 [12:45:36<13:34:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 49%|████▊ | 6015/12384 [12:45:43<13:34:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 49%|████▊ | 6016/12384 [12:45:43<13:32:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 49%|████▊ | 6016/12384 [12:45:51<13:32:07, 7.65s/it, loss=0.0003, acc=0.9998, iter_time=5.41s]
Epoch 0: 49%|████▊ | 6017/12384 [12:45:51<13:30:10, 7.63s/it, loss=0.0003, acc=0.9998, iter_time=5.41s]
Epoch 0: 49%|████▊ | 6017/12384 [12:45:59<13:30:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 0: 49%|████▊ | 6018/12384 [12:45:59<13:28:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 0: 49%|████▊ | 6018/12384 [12:46:06<13:28:46, 7.62s/it, loss=0.0001, acc=0.9992, iter_time=7.67s]
Epoch 0: 49%|████▊ | 6019/12384 [12:46:06<13:29:58, 7.64s/it, loss=0.0001, acc=0.9992, iter_time=7.67s]
Epoch 0: 49%|████▊ | 6019/12384 [12:46:14<13:29:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 49%|████▊ | 6020/12384 [12:46:14<13:29:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 49%|████▊ | 6020/12384 [12:46:21<13:29:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 49%|████▊ | 6021/12384 [12:46:21<13:29:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 49%|████▊ | 6021/12384 [12:46:29<13:29:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 49%|████▊ | 6022/12384 [12:46:29<13:27:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 49%|████▊ | 6022/12384 [12:46:37<13:27:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 49%|████▊ | 6023/12384 [12:46:37<13:27:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 49%|████▊ | 6023/12384 [12:46:44<13:27:13, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 49%|████▊ | 6024/12384 [12:46:44<13:29:28, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 49%|████▊ | 6024/12384 [12:46:52<13:29:28, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.06s]
Epoch 0: 49%|████▊ | 6025/12384 [12:46:52<13:27:50, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.06s]
Epoch 0: 49%|████▊ | 6025/12384 [12:46:59<13:27:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 0: 49%|████▊ | 6026/12384 [12:46:59<13:25:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 0: 49%|████▊ | 6026/12384 [12:47:07<13:25:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 0: 49%|████▊ | 6027/12384 [12:47:07<13:25:43, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 0: 49%|████▊ | 6027/12384 [12:47:15<13:25:43, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 0: 49%|████▊ | 6028/12384 [12:47:15<13:25:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 0: 49%|████▊ | 6028/12384 [12:47:23<13:25:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 0: 49%|████▊ | 6029/12384 [12:47:23<13:36:31, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 0: 49%|████▊ | 6029/12384 [12:47:30<13:36:31, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 49%|████▊ | 6030/12384 [12:47:30<13:36:17, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 49%|████▊ | 6030/12384 [12:47:38<13:36:17, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 49%|████▊ | 6031/12384 [12:47:38<13:32:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 49%|████▊ | 6031/12384 [12:47:46<13:32:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 0: 49%|████▊ | 6032/12384 [12:47:46<13:29:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 0: 49%|████▊ | 6032/12384 [12:47:53<13:29:36, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=6.26s]
Epoch 0: 49%|████▊ | 6033/12384 [12:47:53<13:27:31, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.26s]
Epoch 0: 49%|████▊ | 6033/12384 [12:48:01<13:27:31, 7.63s/it, loss=0.0002, acc=0.9990, iter_time=7.43s]
Epoch 0: 49%|████▊ | 6034/12384 [12:48:01<13:26:46, 7.62s/it, loss=0.0002, acc=0.9990, iter_time=7.43s]
Epoch 0: 49%|████▊ | 6034/12384 [12:48:08<13:26:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 0: 49%|████▊ | 6035/12384 [12:48:08<13:26:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 0: 49%|████▊ | 6035/12384 [12:48:16<13:26:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 49%|████▊ | 6036/12384 [12:48:16<13:25:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 49%|████▊ | 6036/12384 [12:48:24<13:25:37, 7.61s/it, loss=0.0006, acc=0.9976, iter_time=7.05s]
Epoch 0: 49%|████▊ | 6037/12384 [12:48:24<13:25:23, 7.61s/it, loss=0.0006, acc=0.9976, iter_time=7.05s]
Epoch 0: 49%|████▊ | 6037/12384 [12:48:31<13:25:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 0: 49%|████▉ | 6038/12384 [12:48:31<13:25:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 0: 49%|████▉ | 6038/12384 [12:48:39<13:25:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 49%|████▉ | 6039/12384 [12:48:39<13:25:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 49%|████▉ | 6039/12384 [12:48:46<13:25:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 49%|████▉ | 6040/12384 [12:48:46<13:24:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 49%|████▉ | 6040/12384 [12:48:54<13:24:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.68s]
Epoch 0: 49%|████▉ | 6041/12384 [12:48:54<13:23:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.68s]
Epoch 0: 49%|████▉ | 6041/12384 [12:49:02<13:23:26, 7.60s/it, loss=0.0001, acc=0.9998, iter_time=10.43s]
Epoch 0: 49%|████▉ | 6042/12384 [12:49:02<13:23:16, 7.60s/it, loss=0.0001, acc=0.9998, iter_time=10.43s]
Epoch 0: 49%|████▉ | 6042/12384 [12:49:09<13:23:16, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 0: 49%|████▉ | 6043/12384 [12:49:09<13:23:17, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 0: 49%|████▉ | 6043/12384 [12:49:17<13:23:17, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 0: 49%|████▉ | 6044/12384 [12:49:17<13:22:54, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 0: 49%|████▉ | 6044/12384 [12:49:24<13:22:54, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 49%|████▉ | 6045/12384 [12:49:24<13:23:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 49%|████▉ | 6045/12384 [12:49:32<13:23:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 49%|████▉ | 6046/12384 [12:49:32<13:22:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 49%|████▉ | 6046/12384 [12:49:40<13:22:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.06s]
Epoch 0: 49%|████▉ | 6047/12384 [12:49:40<13:23:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.06s]
Epoch 0: 49%|████▉ | 6047/12384 [12:49:47<13:23:00, 7.60s/it, loss=0.0004, acc=0.9982, iter_time=9.53s]
Epoch 0: 49%|████▉ | 6048/12384 [12:49:47<13:22:32, 7.60s/it, loss=0.0004, acc=0.9982, iter_time=9.53s]
Epoch 0: 49%|████▉ | 6048/12384 [12:49:55<13:22:32, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 49%|████▉ | 6049/12384 [12:49:55<13:22:33, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 49%|████▉ | 6049/12384 [12:50:02<13:22:33, 7.60s/it, loss=0.0004, acc=0.9975, iter_time=8.03s]
Epoch 0: 49%|████▉ | 6050/12384 [12:50:02<13:23:09, 7.61s/it, loss=0.0004, acc=0.9975, iter_time=8.03s]
Epoch 0: 49%|████▉ | 6050/12384 [12:50:10<13:23:09, 7.61s/it, loss=0.0005, acc=0.9985, iter_time=6.33s]
Epoch 0: 49%|████▉ | 6051/12384 [12:50:10<13:24:33, 7.62s/it, loss=0.0005, acc=0.9985, iter_time=6.33s]
Epoch 0: 49%|████▉ | 6051/12384 [12:50:18<13:24:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.47s]
Epoch 0: 49%|████▉ | 6052/12384 [12:50:18<13:23:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.47s]
Epoch 0: 49%|████▉ | 6052/12384 [12:50:25<13:23:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 49%|████▉ | 6053/12384 [12:50:25<13:23:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 49%|████▉ | 6053/12384 [12:50:33<13:23:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.77s]
Epoch 0: 49%|████▉ | 6054/12384 [12:50:33<13:22:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.77s]
Epoch 0: 49%|████▉ | 6054/12384 [12:50:41<13:22:57, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.87s]
Epoch 0: 49%|████▉ | 6055/12384 [12:50:41<13:33:45, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=8.87s]
Epoch 0: 49%|████▉ | 6055/12384 [12:50:48<13:33:45, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 0: 49%|████▉ | 6056/12384 [12:50:48<13:29:44, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 0: 49%|████▉ | 6056/12384 [12:50:56<13:29:44, 7.68s/it, loss=0.0116, acc=0.9756, iter_time=7.64s]
Epoch 0: 49%|████▉ | 6057/12384 [12:50:56<13:29:17, 7.67s/it, loss=0.0116, acc=0.9756, iter_time=7.64s]
Epoch 0: 49%|████▉ | 6057/12384 [12:51:04<13:29:17, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 49%|████▉ | 6058/12384 [12:51:04<13:26:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 49%|████▉ | 6058/12384 [12:51:11<13:26:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 0: 49%|████▉ | 6059/12384 [12:51:11<13:25:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 0: 49%|████▉ | 6059/12384 [12:51:19<13:25:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 0: 49%|████▉ | 6060/12384 [12:51:19<13:25:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 0: 49%|████▉ | 6060/12384 [12:51:27<13:25:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.42s]
Epoch 0: 49%|████▉ | 6061/12384 [12:51:27<13:24:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.42s]
Epoch 0: 49%|████▉ | 6061/12384 [12:51:34<13:24:38, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.71s]
Epoch 0: 49%|████▉ | 6062/12384 [12:51:34<13:23:55, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.71s]
Epoch 0: 49%|████▉ | 6062/12384 [12:51:42<13:23:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.29s]
Epoch 0: 49%|████▉ | 6063/12384 [12:51:42<13:23:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.29s]
Epoch 0: 49%|████▉ | 6063/12384 [12:51:49<13:23:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.45s]
Epoch 0: 49%|████▉ | 6064/12384 [12:51:49<13:22:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.45s]
Epoch 0: 49%|████▉ | 6064/12384 [12:51:57<13:22:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.88s]
Epoch 0: 49%|████▉ | 6065/12384 [12:51:57<13:22:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.88s]
Epoch 0: 49%|████▉ | 6065/12384 [12:52:05<13:22:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.32s]
Epoch 0: 49%|████▉ | 6066/12384 [12:52:05<13:33:05, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=11.32s]
Epoch 0: 49%|████▉ | 6066/12384 [12:52:13<13:33:05, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=3.99s]
Epoch 0: 49%|████▉ | 6067/12384 [12:52:13<13:29:27, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=3.99s]
Epoch 0: 49%|████▉ | 6067/12384 [12:52:20<13:29:27, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=11.22s]
Epoch 0: 49%|████▉ | 6068/12384 [12:52:20<13:26:53, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=11.22s]
Epoch 0: 49%|████▉ | 6068/12384 [12:52:28<13:26:53, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 49%|████▉ | 6069/12384 [12:52:28<13:25:47, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 49%|████▉ | 6069/12384 [12:52:35<13:25:47, 7.66s/it, loss=0.0001, acc=0.9998, iter_time=7.63s]
Epoch 0: 49%|████▉ | 6070/12384 [12:52:35<13:24:42, 7.65s/it, loss=0.0001, acc=0.9998, iter_time=7.63s]
Epoch 0: 49%|████▉ | 6070/12384 [12:52:43<13:24:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 49%|████▉ | 6071/12384 [12:52:43<13:23:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 49%|████▉ | 6071/12384 [12:52:51<13:23:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 49%|████▉ | 6072/12384 [12:52:51<13:22:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 49%|████▉ | 6072/12384 [12:52:58<13:22:44, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 49%|████▉ | 6073/12384 [12:52:58<13:21:30, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 49%|████▉ | 6073/12384 [12:53:06<13:21:30, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 49%|████▉ | 6074/12384 [12:53:06<13:21:18, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 49%|████▉ | 6074/12384 [12:53:14<13:21:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 0: 49%|████▉ | 6075/12384 [12:53:14<13:20:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 0: 49%|████▉ | 6075/12384 [12:53:21<13:20:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 0: 49%|████▉ | 6076/12384 [12:53:21<13:20:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 0: 49%|████▉ | 6076/12384 [12:53:29<13:20:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.86s]
Epoch 0: 49%|████▉ | 6077/12384 [12:53:29<13:20:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.86s]
Epoch 0: 49%|████▉ | 6077/12384 [12:53:36<13:20:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.35s]
Epoch 0: 49%|████▉ | 6078/12384 [12:53:36<13:19:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.35s]
Epoch 0: 49%|████▉ | 6078/12384 [12:53:44<13:19:27, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.52s]
Epoch 0: 49%|████▉ | 6079/12384 [12:53:44<13:19:41, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.52s]
Epoch 0: 49%|████▉ | 6079/12384 [12:53:52<13:19:41, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.09s]
Epoch 0: 49%|████▉ | 6080/12384 [12:53:52<13:19:11, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.09s]
Epoch 0: 49%|████▉ | 6080/12384 [12:53:59<13:19:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.20s]
Epoch 0: 49%|████▉ | 6081/12384 [12:53:59<13:30:12, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=3.20s]
Epoch 0: 49%|████▉ | 6081/12384 [12:54:07<13:30:12, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=11.96s]
Epoch 0: 49%|████▉ | 6082/12384 [12:54:07<13:27:50, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=11.96s]
Epoch 0: 49%|████▉ | 6082/12384 [12:54:15<13:27:50, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 49%|████▉ | 6083/12384 [12:54:15<13:25:08, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 49%|████▉ | 6083/12384 [12:54:22<13:25:08, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 49%|████▉ | 6084/12384 [12:54:22<13:22:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 49%|████▉ | 6084/12384 [12:54:30<13:22:20, 7.64s/it, loss=0.0004, acc=0.9992, iter_time=4.74s]
Epoch 0: 49%|████▉ | 6085/12384 [12:54:30<13:21:26, 7.63s/it, loss=0.0004, acc=0.9992, iter_time=4.74s]
Epoch 0: 49%|████▉ | 6085/12384 [12:54:38<13:21:26, 7.63s/it, loss=0.0020, acc=0.9964, iter_time=10.22s]
Epoch 0: 49%|████▉ | 6086/12384 [12:54:38<13:21:14, 7.63s/it, loss=0.0020, acc=0.9964, iter_time=10.22s]
Epoch 0: 49%|████▉ | 6086/12384 [12:54:45<13:21:14, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=6.14s]
Epoch 0: 49%|████▉ | 6087/12384 [12:54:45<13:20:13, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=6.14s]
Epoch 0: 49%|████▉ | 6087/12384 [12:54:53<13:20:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.27s]
Epoch 0: 49%|████▉ | 6088/12384 [12:54:53<13:19:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.27s]
Epoch 0: 49%|████▉ | 6088/12384 [12:55:00<13:19:03, 7.61s/it, loss=0.0003, acc=0.9973, iter_time=7.41s]
Epoch 0: 49%|████▉ | 6089/12384 [12:55:00<13:19:12, 7.62s/it, loss=0.0003, acc=0.9973, iter_time=7.41s]
Epoch 0: 49%|████▉ | 6089/12384 [12:55:08<13:19:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 0: 49%|████▉ | 6090/12384 [12:55:08<13:18:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 0: 49%|████▉ | 6090/12384 [12:55:16<13:18:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 0: 49%|████▉ | 6091/12384 [12:55:16<13:18:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 0: 49%|████▉ | 6091/12384 [12:55:24<13:18:33, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.89s]
Epoch 0: 49%|████▉ | 6092/12384 [12:55:24<13:26:49, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.89s]
Epoch 0: 49%|████▉ | 6092/12384 [12:55:31<13:26:49, 7.69s/it, loss=0.0002, acc=1.0000, iter_time=7.29s]
Epoch 0: 49%|████▉ | 6093/12384 [12:55:31<13:23:20, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.29s]
Epoch 0: 49%|████▉ | 6093/12384 [12:55:39<13:23:20, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 0: 49%|████▉ | 6094/12384 [12:55:39<13:21:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 0: 49%|████▉ | 6094/12384 [12:55:46<13:21:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 0: 49%|████▉ | 6095/12384 [12:55:46<13:19:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 0: 49%|████▉ | 6095/12384 [12:55:54<13:19:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 49%|████▉ | 6096/12384 [12:55:54<13:18:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 49%|████▉ | 6096/12384 [12:56:01<13:18:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 0: 49%|████▉ | 6097/12384 [12:56:01<13:16:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 0: 49%|████▉ | 6097/12384 [12:56:09<13:16:58, 7.61s/it, loss=0.0001, acc=0.9997, iter_time=7.01s]
Epoch 0: 49%|████▉ | 6098/12384 [12:56:09<13:17:18, 7.61s/it, loss=0.0001, acc=0.9997, iter_time=7.01s]
Epoch 0: 49%|████▉ | 6098/12384 [12:56:17<13:17:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 0: 49%|████▉ | 6099/12384 [12:56:17<13:16:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 0: 49%|████▉ | 6099/12384 [12:56:24<13:16:51, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.61s]
Epoch 0: 49%|████▉ | 6100/12384 [12:56:24<13:17:03, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.61s]
Epoch 0: 49%|████▉ | 6100/12384 [12:56:32<13:17:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.59s]
Epoch 0: 49%|████▉ | 6101/12384 [12:56:32<13:17:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.59s]
Epoch 0: 49%|████▉ | 6101/12384 [12:56:40<13:17:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 0: 49%|████▉ | 6102/12384 [12:56:40<13:16:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 0: 49%|████▉ | 6102/12384 [12:56:47<13:16:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 49%|████▉ | 6103/12384 [12:56:47<13:16:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 49%|████▉ | 6103/12384 [12:56:55<13:16:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 0: 49%|████▉ | 6104/12384 [12:56:55<13:15:34, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 0: 49%|████▉ | 6104/12384 [12:57:02<13:15:34, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 49%|████▉ | 6105/12384 [12:57:02<13:17:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 49%|████▉ | 6105/12384 [12:57:10<13:17:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 0: 49%|████▉ | 6106/12384 [12:57:10<13:17:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 0: 49%|████▉ | 6106/12384 [12:57:18<13:17:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.29s]
Epoch 0: 49%|████▉ | 6107/12384 [12:57:18<13:27:25, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=11.29s]
Epoch 0: 49%|████▉ | 6107/12384 [12:57:26<13:27:25, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 49%|████▉ | 6108/12384 [12:57:26<13:23:55, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 49%|████▉ | 6108/12384 [12:57:33<13:23:55, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 0: 49%|████▉ | 6109/12384 [12:57:33<13:21:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 0: 49%|████▉ | 6109/12384 [12:57:41<13:21:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 0: 49%|████▉ | 6110/12384 [12:57:41<13:19:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 0: 49%|████▉ | 6110/12384 [12:57:48<13:19:54, 7.65s/it, loss=0.0004, acc=0.9984, iter_time=5.89s]
Epoch 0: 49%|████▉ | 6111/12384 [12:57:48<13:18:47, 7.64s/it, loss=0.0004, acc=0.9984, iter_time=5.89s]
Epoch 0: 49%|████▉ | 6111/12384 [12:57:56<13:18:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.30s]
Epoch 0: 49%|████▉ | 6112/12384 [12:57:56<13:17:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.30s]
Epoch 0: 49%|████▉ | 6112/12384 [12:58:04<13:17:51, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=4.34s]
Epoch 0: 49%|████▉ | 6113/12384 [12:58:04<13:16:57, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=4.34s]
Epoch 0: 49%|████▉ | 6113/12384 [12:58:11<13:16:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 49%|████▉ | 6114/12384 [12:58:11<13:16:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 49%|████▉ | 6114/12384 [12:58:19<13:16:50, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=10.89s]
Epoch 0: 49%|████▉ | 6115/12384 [12:58:19<13:15:36, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.89s]
Epoch 0: 49%|████▉ | 6115/12384 [12:58:26<13:15:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 49%|████▉ | 6116/12384 [12:58:26<13:15:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 49%|████▉ | 6116/12384 [12:58:34<13:15:04, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.76s]
Epoch 0: 49%|████▉ | 6117/12384 [12:58:34<13:14:22, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.76s]
Epoch 0: 49%|████▉ | 6117/12384 [12:58:42<13:14:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.75s]
Epoch 0: 49%|████▉ | 6118/12384 [12:58:42<13:23:10, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.75s]
Epoch 0: 49%|████▉ | 6118/12384 [12:58:50<13:23:10, 7.69s/it, loss=0.0018, acc=0.9968, iter_time=6.40s]
Epoch 0: 49%|████▉ | 6119/12384 [12:58:50<13:20:54, 7.67s/it, loss=0.0018, acc=0.9968, iter_time=6.40s]
Epoch 0: 49%|████▉ | 6119/12384 [12:58:57<13:20:54, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.19s]
Epoch 0: 49%|████▉ | 6120/12384 [12:58:57<13:18:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.19s]
Epoch 0: 49%|████▉ | 6120/12384 [12:59:05<13:18:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.90s]
Epoch 0: 49%|████▉ | 6121/12384 [12:59:05<13:17:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.90s]
Epoch 0: 49%|████▉ | 6121/12384 [12:59:12<13:17:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 0: 49%|████▉ | 6122/12384 [12:59:12<13:16:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 0: 49%|████▉ | 6122/12384 [12:59:20<13:16:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.95s]
Epoch 0: 49%|████▉ | 6123/12384 [12:59:20<13:15:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.95s]
Epoch 0: 49%|████▉ | 6123/12384 [12:59:28<13:15:44, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 49%|████▉ | 6124/12384 [12:59:28<13:15:14, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 49%|████▉ | 6124/12384 [12:59:35<13:15:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 49%|████▉ | 6125/12384 [12:59:35<13:15:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 49%|████▉ | 6125/12384 [12:59:43<13:15:00, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 49%|████▉ | 6126/12384 [12:59:43<13:14:06, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 49%|████▉ | 6126/12384 [12:59:50<13:14:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 49%|████▉ | 6127/12384 [12:59:50<13:13:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 49%|████▉ | 6127/12384 [12:59:58<13:13:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 0: 49%|████▉ | 6128/12384 [12:59:58<13:13:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 0: 49%|████▉ | 6128/12384 [13:00:06<13:13:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.41s]
Epoch 0: 49%|████▉ | 6129/12384 [13:00:06<13:12:36, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.41s]
Epoch 0: 49%|████▉ | 6129/12384 [13:00:13<13:12:36, 7.60s/it, loss=0.0003, acc=0.9982, iter_time=7.85s]
Epoch 0: 49%|████▉ | 6130/12384 [13:00:13<13:13:42, 7.61s/it, loss=0.0003, acc=0.9982, iter_time=7.85s]
Epoch 0: 49%|████▉ | 6130/12384 [13:00:21<13:13:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.78s]
Epoch 0: 50%|████▉ | 6131/12384 [13:00:21<13:14:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.78s]
Epoch 0: 50%|████▉ | 6131/12384 [13:00:28<13:14:05, 7.62s/it, loss=0.0003, acc=0.9981, iter_time=8.49s]
Epoch 0: 50%|████▉ | 6132/12384 [13:00:28<13:13:26, 7.61s/it, loss=0.0003, acc=0.9981, iter_time=8.49s]
Epoch 0: 50%|████▉ | 6132/12384 [13:00:36<13:13:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 50%|████▉ | 6133/12384 [13:00:36<13:23:13, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 50%|████▉ | 6133/12384 [13:00:44<13:23:13, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.51s]
Epoch 0: 50%|████▉ | 6134/12384 [13:00:44<13:20:20, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.51s]
Epoch 0: 50%|████▉ | 6134/12384 [13:00:52<13:20:20, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.98s]
Epoch 0: 50%|████▉ | 6135/12384 [13:00:52<13:18:15, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.98s]
Epoch 0: 50%|████▉ | 6135/12384 [13:00:59<13:18:15, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 50%|████▉ | 6136/12384 [13:00:59<13:19:47, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 50%|████▉ | 6136/12384 [13:01:07<13:19:47, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 50%|████▉ | 6137/12384 [13:01:07<13:17:12, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 50%|████▉ | 6137/12384 [13:01:15<13:17:12, 7.66s/it, loss=0.0004, acc=0.9993, iter_time=7.63s]
Epoch 0: 50%|████▉ | 6138/12384 [13:01:15<13:15:48, 7.64s/it, loss=0.0004, acc=0.9993, iter_time=7.63s]
Epoch 0: 50%|████▉ | 6138/12384 [13:01:22<13:15:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 0: 50%|████▉ | 6139/12384 [13:01:22<13:15:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 0: 50%|████▉ | 6139/12384 [13:01:30<13:15:03, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=8.26s]
Epoch 0: 50%|████▉ | 6140/12384 [13:01:30<13:14:16, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=8.26s]
Epoch 0: 50%|████▉ | 6140/12384 [13:01:37<13:14:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 0: 50%|████▉ | 6141/12384 [13:01:37<13:13:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 0: 50%|████▉ | 6141/12384 [13:01:45<13:13:29, 7.63s/it, loss=0.0007, acc=1.0000, iter_time=8.72s]
Epoch 0: 50%|████▉ | 6142/12384 [13:01:45<13:12:11, 7.61s/it, loss=0.0007, acc=1.0000, iter_time=8.72s]
Epoch 0: 50%|████▉ | 6142/12384 [13:01:53<13:12:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.24s]
Epoch 0: 50%|████▉ | 6143/12384 [13:01:53<13:12:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.24s]
Epoch 0: 50%|████▉ | 6143/12384 [13:02:00<13:12:20, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=10.95s]
Epoch 0: 50%|████▉ | 6144/12384 [13:02:00<13:12:27, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=10.95s]
Epoch 0: 50%|████▉ | 6144/12384 [13:02:08<13:12:27, 7.62s/it, loss=0.0007, acc=0.9988, iter_time=6.18s]
Epoch 0: 50%|████▉ | 6145/12384 [13:02:08<13:12:53, 7.63s/it, loss=0.0007, acc=0.9988, iter_time=6.18s]
Epoch 0: 50%|████▉ | 6145/12384 [13:02:16<13:12:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 0: 50%|████▉ | 6146/12384 [13:02:16<13:11:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 0: 50%|████▉ | 6146/12384 [13:02:23<13:11:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 50%|████▉ | 6147/12384 [13:02:23<13:11:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 50%|████▉ | 6147/12384 [13:02:31<13:11:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 50%|████▉ | 6148/12384 [13:02:31<13:11:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 50%|████▉ | 6148/12384 [13:02:38<13:11:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 50%|████▉ | 6149/12384 [13:02:38<13:10:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 50%|████▉ | 6149/12384 [13:02:46<13:10:57, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.00s]
Epoch 0: 50%|████▉ | 6150/12384 [13:02:46<13:10:30, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.00s]
Epoch 0: 50%|████▉ | 6150/12384 [13:02:54<13:10:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 50%|████▉ | 6151/12384 [13:02:54<13:11:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 50%|████▉ | 6151/12384 [13:03:01<13:11:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 50%|████▉ | 6152/12384 [13:03:01<13:10:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 50%|████▉ | 6152/12384 [13:03:09<13:10:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 50%|████▉ | 6153/12384 [13:03:09<13:11:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 50%|████▉ | 6153/12384 [13:03:16<13:11:16, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.00s]
Epoch 0: 50%|████▉ | 6154/12384 [13:03:16<13:09:52, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.00s]
Epoch 0: 50%|████▉ | 6154/12384 [13:03:24<13:09:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 0: 50%|████▉ | 6155/12384 [13:03:24<13:09:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 0: 50%|████▉ | 6155/12384 [13:03:32<13:09:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 50%|████▉ | 6156/12384 [13:03:32<13:09:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 50%|████▉ | 6156/12384 [13:03:39<13:09:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 50%|████▉ | 6157/12384 [13:03:39<13:09:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 50%|████▉ | 6157/12384 [13:03:47<13:09:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 0: 50%|████▉ | 6158/12384 [13:03:47<13:09:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 0: 50%|████▉ | 6158/12384 [13:03:54<13:09:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 0: 50%|████▉ | 6159/12384 [13:03:54<13:09:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 0: 50%|████▉ | 6159/12384 [13:04:02<13:09:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 50%|████▉ | 6160/12384 [13:04:02<13:20:18, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 50%|████▉ | 6160/12384 [13:04:10<13:20:18, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 0: 50%|████▉ | 6161/12384 [13:04:10<13:16:57, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 0: 50%|████▉ | 6161/12384 [13:04:18<13:16:57, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 0: 50%|████▉ | 6162/12384 [13:04:18<13:14:47, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 0: 50%|████▉ | 6162/12384 [13:04:25<13:14:47, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 50%|████▉ | 6163/12384 [13:04:25<13:12:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 50%|████▉ | 6163/12384 [13:04:33<13:12:34, 7.64s/it, loss=0.0003, acc=0.9980, iter_time=5.26s]
Epoch 0: 50%|████▉ | 6164/12384 [13:04:33<13:11:55, 7.64s/it, loss=0.0003, acc=0.9980, iter_time=5.26s]
Epoch 0: 50%|████▉ | 6164/12384 [13:04:41<13:11:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 0: 50%|████▉ | 6165/12384 [13:04:41<13:12:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 0: 50%|████▉ | 6165/12384 [13:04:48<13:12:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 0: 50%|████▉ | 6166/12384 [13:04:48<13:10:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 0: 50%|████▉ | 6166/12384 [13:04:56<13:10:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 0: 50%|████▉ | 6167/12384 [13:04:56<13:09:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 0: 50%|████▉ | 6167/12384 [13:05:03<13:09:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 50%|████▉ | 6168/12384 [13:05:03<13:09:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 50%|████▉ | 6168/12384 [13:05:11<13:09:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.12s]
Epoch 0: 50%|████▉ | 6169/12384 [13:05:11<13:07:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.12s]
Epoch 0: 50%|████▉ | 6169/12384 [13:05:19<13:07:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 0: 50%|████▉ | 6170/12384 [13:05:19<13:07:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 0: 50%|████▉ | 6170/12384 [13:05:26<13:07:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 0: 50%|████▉ | 6171/12384 [13:05:26<13:07:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 0: 50%|████▉ | 6171/12384 [13:05:34<13:07:47, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.46s]
Epoch 0: 50%|████▉ | 6172/12384 [13:05:34<13:08:57, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.46s]
Epoch 0: 50%|████▉ | 6172/12384 [13:05:41<13:08:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 0: 50%|████▉ | 6173/12384 [13:05:41<13:07:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 0: 50%|████▉ | 6173/12384 [13:05:49<13:07:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 0: 50%|████▉ | 6174/12384 [13:05:49<13:07:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 0: 50%|████▉ | 6174/12384 [13:05:57<13:07:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.03s]
Epoch 0: 50%|████▉ | 6175/12384 [13:05:57<13:06:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.03s]
Epoch 0: 50%|████▉ | 6175/12384 [13:06:04<13:06:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.29s]
Epoch 0: 50%|████▉ | 6176/12384 [13:06:04<13:06:31, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.29s]
Epoch 0: 50%|████▉ | 6176/12384 [13:06:12<13:06:31, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.00s]
Epoch 0: 50%|████▉ | 6177/12384 [13:06:12<13:06:39, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.00s]
Epoch 0: 50%|████▉ | 6177/12384 [13:06:19<13:06:39, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 0: 50%|████▉ | 6178/12384 [13:06:19<13:06:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 0: 50%|████▉ | 6178/12384 [13:06:27<13:06:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 0: 50%|████▉ | 6179/12384 [13:06:27<13:09:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 0: 50%|████▉ | 6179/12384 [13:06:35<13:09:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 50%|████▉ | 6180/12384 [13:06:35<13:08:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 50%|████▉ | 6180/12384 [13:06:42<13:08:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 50%|████▉ | 6181/12384 [13:06:42<13:08:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 50%|████▉ | 6181/12384 [13:06:50<13:08:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 50%|████▉ | 6182/12384 [13:06:50<13:07:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 50%|████▉ | 6182/12384 [13:06:57<13:07:03, 7.61s/it, loss=0.0003, acc=0.9985, iter_time=6.39s]
Epoch 0: 50%|████▉ | 6183/12384 [13:06:57<13:06:03, 7.61s/it, loss=0.0003, acc=0.9985, iter_time=6.39s]
Epoch 0: 50%|████▉ | 6183/12384 [13:07:05<13:06:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.16s]
Epoch 0: 50%|████▉ | 6184/12384 [13:07:05<13:06:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.16s]
Epoch 0: 50%|████▉ | 6184/12384 [13:07:13<13:06:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 0: 50%|████▉ | 6185/12384 [13:07:13<13:07:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 0: 50%|████▉ | 6185/12384 [13:07:21<13:07:26, 7.62s/it, loss=0.0004, acc=0.9980, iter_time=7.38s]
Epoch 0: 50%|████▉ | 6186/12384 [13:07:21<13:17:16, 7.72s/it, loss=0.0004, acc=0.9980, iter_time=7.38s]
Epoch 0: 50%|████▉ | 6186/12384 [13:07:28<13:17:16, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 0: 50%|████▉ | 6187/12384 [13:07:28<13:13:26, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 0: 50%|████▉ | 6187/12384 [13:07:36<13:13:26, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 0: 50%|████▉ | 6188/12384 [13:07:36<13:10:38, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 0: 50%|████▉ | 6188/12384 [13:07:43<13:10:38, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 50%|████▉ | 6189/12384 [13:07:43<13:08:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 50%|████▉ | 6189/12384 [13:07:51<13:08:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 50%|████▉ | 6190/12384 [13:07:51<13:07:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 50%|████▉ | 6190/12384 [13:07:59<13:07:32, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=4.22s]
Epoch 0: 50%|████▉ | 6191/12384 [13:07:59<13:06:30, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=4.22s]
Epoch 0: 50%|████▉ | 6191/12384 [13:08:06<13:06:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.37s]
Epoch 0: 50%|█████ | 6192/12384 [13:08:06<13:06:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.37s]
Epoch 0: 50%|█████ | 6192/12384 [13:08:14<13:06:52, 7.62s/it, loss=0.0007, acc=0.9981, iter_time=7.24s]
Epoch 0: 50%|█████ | 6193/12384 [13:08:14<13:06:05, 7.62s/it, loss=0.0007, acc=0.9981, iter_time=7.24s]
Epoch 0: 50%|█████ | 6193/12384 [13:08:22<13:06:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 50%|█████ | 6194/12384 [13:08:22<13:05:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 50%|█████ | 6194/12384 [13:08:29<13:05:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 50%|█████ | 6195/12384 [13:08:29<13:04:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 50%|█████ | 6195/12384 [13:08:37<13:04:47, 7.61s/it, loss=0.0001, acc=0.9992, iter_time=7.61s]
Epoch 0: 50%|█████ | 6196/12384 [13:08:37<13:04:26, 7.61s/it, loss=0.0001, acc=0.9992, iter_time=7.61s]
Epoch 0: 50%|█████ | 6196/12384 [13:08:45<13:04:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 0: 50%|█████ | 6197/12384 [13:08:45<13:12:48, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 0: 50%|█████ | 6197/12384 [13:08:52<13:12:48, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 50%|█████ | 6198/12384 [13:08:52<13:09:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 50%|█████ | 6198/12384 [13:09:00<13:09:57, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 50%|█████ | 6199/12384 [13:09:00<13:07:55, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 50%|█████ | 6199/12384 [13:09:07<13:07:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 50%|█████ | 6200/12384 [13:09:07<13:06:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 50%|█████ | 6200/12384 [13:09:15<13:06:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.46s]
Epoch 0: 50%|█████ | 6201/12384 [13:09:15<13:04:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.46s]
Epoch 0: 50%|█████ | 6201/12384 [13:09:23<13:04:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.31s]
Epoch 0: 50%|█████ | 6202/12384 [13:09:23<13:05:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.31s]
Epoch 0: 50%|█████ | 6202/12384 [13:09:30<13:05:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 50%|█████ | 6203/12384 [13:09:30<13:04:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 50%|█████ | 6203/12384 [13:09:38<13:04:10, 7.61s/it, loss=0.0008, acc=0.9974, iter_time=4.82s]
Epoch 0: 50%|█████ | 6204/12384 [13:09:38<13:03:37, 7.61s/it, loss=0.0008, acc=0.9974, iter_time=4.82s]
Epoch 0: 50%|█████ | 6204/12384 [13:09:45<13:03:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.36s]
Epoch 0: 50%|█████ | 6205/12384 [13:09:45<13:03:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.36s]
Epoch 0: 50%|█████ | 6205/12384 [13:09:53<13:03:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 0: 50%|█████ | 6206/12384 [13:09:53<13:03:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 0: 50%|█████ | 6206/12384 [13:10:01<13:03:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 0: 50%|█████ | 6207/12384 [13:10:01<13:03:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 0: 50%|█████ | 6207/12384 [13:10:08<13:03:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 50%|█████ | 6208/12384 [13:10:08<13:03:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 50%|█████ | 6208/12384 [13:10:16<13:03:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 50%|█████ | 6209/12384 [13:10:16<13:03:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 50%|█████ | 6209/12384 [13:10:23<13:03:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 50%|█████ | 6210/12384 [13:10:23<13:02:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 50%|█████ | 6210/12384 [13:10:31<13:02:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 50%|█████ | 6211/12384 [13:10:31<13:03:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 50%|█████ | 6211/12384 [13:10:39<13:03:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 0: 50%|█████ | 6212/12384 [13:10:39<13:03:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 0: 50%|█████ | 6212/12384 [13:10:47<13:03:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 0: 50%|█████ | 6213/12384 [13:10:47<13:12:37, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 0: 50%|█████ | 6213/12384 [13:10:54<13:12:37, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=8.47s]
Epoch 0: 50%|█████ | 6214/12384 [13:10:54<13:09:17, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=8.47s]
Epoch 0: 50%|█████ | 6214/12384 [13:11:02<13:09:17, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 50%|█████ | 6215/12384 [13:11:02<13:06:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 50%|█████ | 6215/12384 [13:11:09<13:06:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 50%|█████ | 6216/12384 [13:11:09<13:05:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 50%|█████ | 6216/12384 [13:11:17<13:05:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 50%|█████ | 6217/12384 [13:11:17<13:04:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 50%|█████ | 6217/12384 [13:11:25<13:04:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 50%|█████ | 6218/12384 [13:11:25<13:03:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 50%|█████ | 6218/12384 [13:11:32<13:03:28, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=7.59s]
Epoch 0: 50%|█████ | 6219/12384 [13:11:32<13:03:41, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=7.59s]
Epoch 0: 50%|█████ | 6219/12384 [13:11:40<13:03:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 0: 50%|█████ | 6220/12384 [13:11:40<13:03:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 0: 50%|█████ | 6220/12384 [13:11:48<13:03:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 0: 50%|█████ | 6221/12384 [13:11:48<13:02:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 0: 50%|█████ | 6221/12384 [13:11:55<13:02:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 0: 50%|█████ | 6222/12384 [13:11:55<13:02:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 0: 50%|█████ | 6222/12384 [13:12:03<13:02:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.36s]
Epoch 0: 50%|█████ | 6223/12384 [13:12:03<13:01:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.36s]
Epoch 0: 50%|█████ | 6223/12384 [13:12:10<13:01:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.24s]
Epoch 0: 50%|█████ | 6224/12384 [13:12:10<13:01:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.24s]
Epoch 0: 50%|█████ | 6224/12384 [13:12:18<13:01:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=2.81s]
Epoch 0: 50%|█████ | 6225/12384 [13:12:18<13:01:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=2.81s]
Epoch 0: 50%|█████ | 6225/12384 [13:12:26<13:01:30, 7.61s/it, loss=0.0003, acc=0.9989, iter_time=12.03s]
Epoch 0: 50%|█████ | 6226/12384 [13:12:26<13:01:10, 7.61s/it, loss=0.0003, acc=0.9989, iter_time=12.03s]
Epoch 0: 50%|█████ | 6226/12384 [13:12:33<13:01:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 50%|█████ | 6227/12384 [13:12:33<13:01:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 50%|█████ | 6227/12384 [13:12:41<13:01:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 50%|█████ | 6228/12384 [13:12:41<13:00:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 50%|█████ | 6228/12384 [13:12:48<13:00:13, 7.60s/it, loss=0.0006, acc=0.9960, iter_time=5.54s]
Epoch 0: 50%|█████ | 6229/12384 [13:12:48<12:59:37, 7.60s/it, loss=0.0006, acc=0.9960, iter_time=5.54s]
Epoch 0: 50%|█████ | 6229/12384 [13:12:56<12:59:37, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.63s]
Epoch 0: 50%|█████ | 6230/12384 [13:12:56<12:59:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.63s]
Epoch 0: 50%|█████ | 6230/12384 [13:13:04<12:59:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 0: 50%|█████ | 6231/12384 [13:13:04<13:00:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 0: 50%|█████ | 6231/12384 [13:13:11<13:00:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 0: 50%|█████ | 6232/12384 [13:13:11<13:00:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 0: 50%|█████ | 6232/12384 [13:13:19<13:00:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 0: 50%|█████ | 6233/12384 [13:13:19<12:59:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 0: 50%|█████ | 6233/12384 [13:13:26<12:59:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 0: 50%|█████ | 6234/12384 [13:13:26<13:00:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 0: 50%|█████ | 6234/12384 [13:13:34<13:00:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 50%|█████ | 6235/12384 [13:13:34<12:59:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 50%|█████ | 6235/12384 [13:13:42<12:59:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 50%|█████ | 6236/12384 [13:13:42<12:59:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 50%|█████ | 6236/12384 [13:13:49<12:59:36, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=6.50s]
Epoch 0: 50%|█████ | 6237/12384 [13:13:49<12:59:27, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=6.50s]
Epoch 0: 50%|█████ | 6237/12384 [13:13:57<12:59:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.59s]
Epoch 0: 50%|█████ | 6238/12384 [13:13:57<12:59:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.59s]
Epoch 0: 50%|█████ | 6238/12384 [13:14:05<12:59:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.81s]
Epoch 0: 50%|█████ | 6239/12384 [13:14:05<13:08:54, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.81s]
Epoch 0: 50%|█████ | 6239/12384 [13:14:12<13:08:54, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 0: 50%|█████ | 6240/12384 [13:14:12<13:05:54, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 0: 50%|█████ | 6240/12384 [13:14:20<13:05:54, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 50%|█████ | 6241/12384 [13:14:20<13:04:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 50%|█████ | 6241/12384 [13:14:28<13:04:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 50%|█████ | 6242/12384 [13:14:28<13:02:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 50%|█████ | 6242/12384 [13:14:35<13:02:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 50%|█████ | 6243/12384 [13:14:35<13:01:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 50%|█████ | 6243/12384 [13:14:43<13:01:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 50%|█████ | 6244/12384 [13:14:43<13:00:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 50%|█████ | 6244/12384 [13:14:50<13:00:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 50%|█████ | 6245/12384 [13:14:50<12:59:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 50%|█████ | 6245/12384 [13:14:58<12:59:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 50%|█████ | 6246/12384 [13:14:58<13:02:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 50%|█████ | 6246/12384 [13:15:06<13:02:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 50%|█████ | 6247/12384 [13:15:06<13:01:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 50%|█████ | 6247/12384 [13:15:13<13:01:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 50%|█████ | 6248/12384 [13:15:13<13:00:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 50%|█████ | 6248/12384 [13:15:21<13:00:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.02s]
Epoch 0: 50%|█████ | 6249/12384 [13:15:21<13:02:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.02s]
Epoch 0: 50%|█████ | 6249/12384 [13:15:29<13:02:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.28s]
Epoch 0: 50%|█████ | 6250/12384 [13:15:29<13:00:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.28s]
Epoch 0: 50%|█████ | 6250/12384 [13:15:36<13:00:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 50%|█████ | 6251/12384 [13:15:36<13:01:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 50%|█████ | 6251/12384 [13:15:44<13:01:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 50%|█████ | 6252/12384 [13:15:44<13:00:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 50%|█████ | 6252/12384 [13:15:52<13:00:09, 7.63s/it, loss=0.0009, acc=0.9970, iter_time=7.58s]
Epoch 0: 50%|█████ | 6253/12384 [13:15:52<12:59:22, 7.63s/it, loss=0.0009, acc=0.9970, iter_time=7.58s]
Epoch 0: 50%|█████ | 6253/12384 [13:15:59<12:59:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.56s]
Epoch 0: 51%|█████ | 6254/12384 [13:15:59<12:58:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.56s]
Epoch 0: 51%|█████ | 6254/12384 [13:16:07<12:58:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 0: 51%|█████ | 6255/12384 [13:16:07<12:58:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 0: 51%|█████ | 6255/12384 [13:16:14<12:58:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 51%|█████ | 6256/12384 [13:16:14<12:57:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 51%|█████ | 6256/12384 [13:16:22<12:57:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 0: 51%|█████ | 6257/12384 [13:16:22<12:56:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 0: 51%|█████ | 6257/12384 [13:16:30<12:56:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.14s]
Epoch 0: 51%|█████ | 6258/12384 [13:16:30<12:57:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.14s]
Epoch 0: 51%|█████ | 6258/12384 [13:16:37<12:57:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.05s]
Epoch 0: 51%|█████ | 6259/12384 [13:16:37<12:58:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.05s]
Epoch 0: 51%|█████ | 6259/12384 [13:16:45<12:58:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 51%|█████ | 6260/12384 [13:16:45<12:57:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 51%|█████ | 6260/12384 [13:16:53<12:57:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 0: 51%|█████ | 6261/12384 [13:16:53<12:57:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 0: 51%|█████ | 6261/12384 [13:17:00<12:57:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.46s]
Epoch 0: 51%|█████ | 6262/12384 [13:17:00<12:56:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.46s]
Epoch 0: 51%|█████ | 6262/12384 [13:17:08<12:56:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.25s]
Epoch 0: 51%|█████ | 6263/12384 [13:17:08<12:56:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.25s]
Epoch 0: 51%|█████ | 6263/12384 [13:17:15<12:56:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.32s]
Epoch 0: 51%|█████ | 6264/12384 [13:17:15<12:55:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.32s]
Epoch 0: 51%|█████ | 6264/12384 [13:17:23<12:55:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.06s]
Epoch 0: 51%|█████ | 6265/12384 [13:17:23<13:05:34, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.06s]
Epoch 0: 51%|█████ | 6265/12384 [13:17:31<13:05:34, 7.70s/it, loss=0.0006, acc=0.9998, iter_time=9.08s]
Epoch 0: 51%|█████ | 6266/12384 [13:17:31<13:03:02, 7.68s/it, loss=0.0006, acc=0.9998, iter_time=9.08s]
Epoch 0: 51%|█████ | 6266/12384 [13:17:38<13:03:02, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 51%|█████ | 6267/12384 [13:17:38<13:01:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 51%|█████ | 6267/12384 [13:17:46<13:01:24, 7.66s/it, loss=0.0004, acc=0.9998, iter_time=5.10s]
Epoch 0: 51%|█████ | 6268/12384 [13:17:46<13:00:17, 7.65s/it, loss=0.0004, acc=0.9998, iter_time=5.10s]
Epoch 0: 51%|█████ | 6268/12384 [13:17:54<13:00:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 51%|█████ | 6269/12384 [13:17:54<12:59:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 51%|█████ | 6269/12384 [13:18:01<12:59:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 0: 51%|█████ | 6270/12384 [13:18:01<12:58:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 0: 51%|█████ | 6270/12384 [13:18:09<12:58:58, 7.64s/it, loss=0.0013, acc=0.9978, iter_time=5.56s]
Epoch 0: 51%|█████ | 6271/12384 [13:18:09<12:57:48, 7.63s/it, loss=0.0013, acc=0.9978, iter_time=5.56s]
Epoch 0: 51%|█████ | 6271/12384 [13:18:17<12:57:48, 7.63s/it, loss=0.0003, acc=0.9981, iter_time=10.03s]
Epoch 0: 51%|█████ | 6272/12384 [13:18:17<12:56:29, 7.62s/it, loss=0.0003, acc=0.9981, iter_time=10.03s]
Epoch 0: 51%|█████ | 6272/12384 [13:18:24<12:56:29, 7.62s/it, loss=0.0002, acc=0.9981, iter_time=7.22s]
Epoch 0: 51%|█████ | 6273/12384 [13:18:24<12:56:24, 7.62s/it, loss=0.0002, acc=0.9981, iter_time=7.22s]
Epoch 0: 51%|█████ | 6273/12384 [13:18:32<12:56:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 51%|█████ | 6274/12384 [13:18:32<12:56:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 51%|█████ | 6274/12384 [13:18:40<12:56:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 51%|█████ | 6275/12384 [13:18:40<13:04:41, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 51%|█████ | 6275/12384 [13:18:47<13:04:41, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 51%|█████ | 6276/12384 [13:18:47<13:01:58, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 51%|█████ | 6276/12384 [13:18:55<13:01:58, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 51%|█████ | 6277/12384 [13:18:55<12:59:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 51%|█████ | 6277/12384 [13:19:03<12:59:57, 7.66s/it, loss=0.0008, acc=0.9982, iter_time=7.30s]
Epoch 0: 51%|█████ | 6278/12384 [13:19:03<12:58:30, 7.65s/it, loss=0.0008, acc=0.9982, iter_time=7.30s]
Epoch 0: 51%|█████ | 6278/12384 [13:19:10<12:58:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 0: 51%|█████ | 6279/12384 [13:19:10<12:56:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 0: 51%|█████ | 6279/12384 [13:19:18<12:56:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.56s]
Epoch 0: 51%|█████ | 6280/12384 [13:19:18<12:56:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.56s]
Epoch 0: 51%|█████ | 6280/12384 [13:19:25<12:56:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 0: 51%|█████ | 6281/12384 [13:19:25<12:55:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 0: 51%|█████ | 6281/12384 [13:19:33<12:55:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 0: 51%|█████ | 6282/12384 [13:19:33<12:54:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 0: 51%|█████ | 6282/12384 [13:19:41<12:54:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 51%|█████ | 6283/12384 [13:19:41<12:54:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 51%|█████ | 6283/12384 [13:19:48<12:54:06, 7.61s/it, loss=0.0020, acc=0.9979, iter_time=7.59s]
Epoch 0: 51%|█████ | 6284/12384 [13:19:48<12:53:37, 7.61s/it, loss=0.0020, acc=0.9979, iter_time=7.59s]
Epoch 0: 51%|█████ | 6284/12384 [13:19:56<12:53:37, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.53s]
Epoch 0: 51%|█████ | 6285/12384 [13:19:56<12:53:18, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.53s]
Epoch 0: 51%|█████ | 6285/12384 [13:20:03<12:53:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 0: 51%|█████ | 6286/12384 [13:20:03<12:53:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 0: 51%|█████ | 6286/12384 [13:20:11<12:53:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 0: 51%|█████ | 6287/12384 [13:20:11<12:53:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 0: 51%|█████ | 6287/12384 [13:20:19<12:53:33, 7.61s/it, loss=0.0001, acc=0.9997, iter_time=9.23s]
Epoch 0: 51%|█████ | 6288/12384 [13:20:19<12:53:29, 7.61s/it, loss=0.0001, acc=0.9997, iter_time=9.23s]
Epoch 0: 51%|█████ | 6288/12384 [13:20:26<12:53:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 0: 51%|█████ | 6289/12384 [13:20:26<12:53:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 0: 51%|█████ | 6289/12384 [13:20:34<12:53:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 0: 51%|█████ | 6290/12384 [13:20:34<12:53:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 0: 51%|█████ | 6290/12384 [13:20:42<12:53:36, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.69s]
Epoch 0: 51%|█████ | 6291/12384 [13:20:42<13:04:09, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=7.69s]
Epoch 0: 51%|█████ | 6291/12384 [13:20:49<13:04:09, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 51%|█████ | 6292/12384 [13:20:49<13:00:20, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 51%|█████ | 6292/12384 [13:20:57<13:00:20, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 0: 51%|█████ | 6293/12384 [13:20:57<12:57:58, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 0: 51%|█████ | 6293/12384 [13:21:05<12:57:58, 7.66s/it, loss=0.0006, acc=0.9987, iter_time=10.16s]
Epoch 0: 51%|█████ | 6294/12384 [13:21:05<12:56:30, 7.65s/it, loss=0.0006, acc=0.9987, iter_time=10.16s]
Epoch 0: 51%|█████ | 6294/12384 [13:21:12<12:56:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 51%|█████ | 6295/12384 [13:21:12<12:55:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 51%|█████ | 6295/12384 [13:21:20<12:55:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 51%|█████ | 6296/12384 [13:21:20<12:53:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 51%|█████ | 6296/12384 [13:21:28<12:53:52, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.29s]
Epoch 0: 51%|█████ | 6297/12384 [13:21:28<12:55:32, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.29s]
Epoch 0: 51%|█████ | 6297/12384 [13:21:35<12:55:32, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 51%|█████ | 6298/12384 [13:21:35<12:54:39, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 51%|█████ | 6298/12384 [13:21:43<12:54:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 51%|█████ | 6299/12384 [13:21:43<12:53:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 51%|█████ | 6299/12384 [13:21:50<12:53:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 51%|█████ | 6300/12384 [13:21:50<12:52:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 51%|█████ | 6300/12384 [13:21:58<12:52:48, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.22s]
Epoch 0: 51%|█████ | 6301/12384 [13:21:58<12:52:39, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.22s]
Epoch 0: 51%|█████ | 6301/12384 [13:22:06<12:52:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 51%|█████ | 6302/12384 [13:22:06<13:00:43, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 51%|█████ | 6302/12384 [13:22:14<13:00:43, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 51%|█████ | 6303/12384 [13:22:14<12:58:17, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 51%|█████ | 6303/12384 [13:22:21<12:58:17, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 51%|█████ | 6304/12384 [13:22:21<12:56:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 51%|█████ | 6304/12384 [13:22:29<12:56:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 51%|█████ | 6305/12384 [13:22:29<12:54:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 51%|█████ | 6305/12384 [13:22:36<12:54:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 0: 51%|█████ | 6306/12384 [13:22:36<12:54:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 0: 51%|█████ | 6306/12384 [13:22:44<12:54:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 0: 51%|█████ | 6307/12384 [13:22:44<12:53:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 0: 51%|█████ | 6307/12384 [13:22:52<12:53:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 51%|█████ | 6308/12384 [13:22:52<12:52:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 51%|█████ | 6308/12384 [13:22:59<12:52:47, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=9.08s]
Epoch 0: 51%|█████ | 6309/12384 [13:22:59<12:51:55, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=9.08s]
Epoch 0: 51%|█████ | 6309/12384 [13:23:07<12:51:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 0: 51%|█████ | 6310/12384 [13:23:07<12:51:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 0: 51%|█████ | 6310/12384 [13:23:15<12:51:30, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.85s]
Epoch 0: 51%|█████ | 6311/12384 [13:23:15<12:53:46, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=10.85s]
Epoch 0: 51%|█████ | 6311/12384 [13:23:23<12:53:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 0: 51%|█████ | 6312/12384 [13:23:23<13:14:09, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 0: 51%|█████ | 6312/12384 [13:23:32<13:14:09, 7.85s/it, loss=0.0001, acc=0.9998, iter_time=8.53s]
Epoch 0: 51%|█████ | 6313/12384 [13:23:32<13:36:15, 8.07s/it, loss=0.0001, acc=0.9998, iter_time=8.53s]
Epoch 0: 51%|█████ | 6313/12384 [13:23:40<13:36:15, 8.07s/it, loss=0.0000, acc=1.0000, iter_time=5.67s]
Epoch 0: 51%|█████ | 6314/12384 [13:23:40<13:37:51, 8.08s/it, loss=0.0000, acc=1.0000, iter_time=5.67s]
Epoch 0: 51%|█████ | 6314/12384 [13:23:48<13:37:51, 8.08s/it, loss=0.0000, acc=1.0000, iter_time=10.84s]
Epoch 0: 51%|█████ | 6315/12384 [13:23:48<13:47:15, 8.18s/it, loss=0.0000, acc=1.0000, iter_time=10.84s]
Epoch 0: 51%|█████ | 6315/12384 [13:23:56<13:47:15, 8.18s/it, loss=0.0000, acc=1.0000, iter_time=8.38s]
Epoch 0: 51%|█████ | 6316/12384 [13:23:56<13:50:18, 8.21s/it, loss=0.0000, acc=1.0000, iter_time=8.38s]
Epoch 0: 51%|█████ | 6316/12384 [13:24:04<13:50:18, 8.21s/it, loss=0.0001, acc=0.9998, iter_time=7.66s]
Epoch 0: 51%|█████ | 6317/12384 [13:24:04<13:41:56, 8.13s/it, loss=0.0001, acc=0.9998, iter_time=7.66s]
Epoch 0: 51%|█████ | 6317/12384 [13:24:12<13:41:56, 8.13s/it, loss=0.0001, acc=1.0000, iter_time=7.95s]
Epoch 0: 51%|█████ | 6318/12384 [13:24:12<13:28:14, 7.99s/it, loss=0.0001, acc=1.0000, iter_time=7.95s]
Epoch 0: 51%|█████ | 6318/12384 [13:24:20<13:28:14, 7.99s/it, loss=0.0000, acc=1.0000, iter_time=3.68s]
Epoch 0: 51%|█████ | 6319/12384 [13:24:20<13:18:51, 7.90s/it, loss=0.0000, acc=1.0000, iter_time=3.68s]
Epoch 0: 51%|█████ | 6319/12384 [13:24:27<13:18:51, 7.90s/it, loss=0.0002, acc=0.9999, iter_time=12.04s]
Epoch 0: 51%|█████ | 6320/12384 [13:24:27<13:11:28, 7.83s/it, loss=0.0002, acc=0.9999, iter_time=12.04s]
Epoch 0: 51%|█████ | 6320/12384 [13:24:35<13:11:28, 7.83s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 51%|█████ | 6321/12384 [13:24:35<13:04:10, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 51%|█████ | 6321/12384 [13:24:43<13:04:10, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 0: 51%|█████ | 6322/12384 [13:24:43<13:00:26, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 0: 51%|█████ | 6322/12384 [13:24:50<13:00:26, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 0: 51%|█████ | 6323/12384 [13:24:50<12:59:05, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 0: 51%|█████ | 6323/12384 [13:24:58<12:59:05, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.45s]
Epoch 0: 51%|█████ | 6324/12384 [13:24:58<12:58:39, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.45s]
Epoch 0: 51%|█████ | 6324/12384 [13:25:06<12:58:39, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 51%|█████ | 6325/12384 [13:25:06<13:22:30, 7.95s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 51%|█████ | 6325/12384 [13:25:14<13:22:30, 7.95s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 51%|█████ | 6326/12384 [13:25:14<13:11:37, 7.84s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 51%|█████ | 6326/12384 [13:25:22<13:11:37, 7.84s/it, loss=0.0000, acc=1.0000, iter_time=10.41s]
Epoch 0: 51%|█████ | 6327/12384 [13:25:22<13:04:39, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=10.41s]
Epoch 0: 51%|█████ | 6327/12384 [13:25:29<13:04:39, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 0: 51%|█████ | 6328/12384 [13:25:29<12:59:00, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 0: 51%|█████ | 6328/12384 [13:25:37<12:59:00, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 0: 51%|█████ | 6329/12384 [13:25:37<12:54:59, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 0: 51%|█████ | 6329/12384 [13:25:44<12:54:59, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.02s]
Epoch 0: 51%|█████ | 6330/12384 [13:25:44<12:53:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.02s]
Epoch 0: 51%|█████ | 6330/12384 [13:25:52<12:53:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 0: 51%|█████ | 6331/12384 [13:25:52<12:52:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 0: 51%|█████ | 6331/12384 [13:26:00<12:52:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 0: 51%|█████ | 6332/12384 [13:26:00<12:51:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 0: 51%|█████ | 6332/12384 [13:26:07<12:51:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 51%|█████ | 6333/12384 [13:26:07<12:50:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 51%|█████ | 6333/12384 [13:26:15<12:50:59, 7.64s/it, loss=0.0002, acc=0.9990, iter_time=7.61s]
Epoch 0: 51%|█████ | 6334/12384 [13:26:15<12:50:04, 7.64s/it, loss=0.0002, acc=0.9990, iter_time=7.61s]
Epoch 0: 51%|█████ | 6334/12384 [13:26:23<12:50:04, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.63s]
Epoch 0: 51%|█████ | 6335/12384 [13:26:23<12:49:31, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.63s]
Epoch 0: 51%|█████ | 6335/12384 [13:26:30<12:49:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 51%|█████ | 6336/12384 [13:26:30<12:49:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 51%|█████ | 6336/12384 [13:26:38<12:49:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 51%|█████ | 6337/12384 [13:26:38<12:48:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 51%|█████ | 6337/12384 [13:26:45<12:48:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 51%|█████ | 6338/12384 [13:26:45<12:47:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 51%|█████ | 6338/12384 [13:26:53<12:47:56, 7.62s/it, loss=0.0002, acc=0.9993, iter_time=7.62s]
Epoch 0: 51%|█████ | 6339/12384 [13:26:53<12:48:55, 7.63s/it, loss=0.0002, acc=0.9993, iter_time=7.62s]
Epoch 0: 51%|█████ | 6339/12384 [13:27:01<12:48:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.80s]
Epoch 0: 51%|█████ | 6340/12384 [13:27:01<12:49:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.80s]
Epoch 0: 51%|█████ | 6340/12384 [13:27:08<12:49:11, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.40s]
Epoch 0: 51%|█████ | 6341/12384 [13:27:08<12:49:26, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.40s]
Epoch 0: 51%|█████ | 6341/12384 [13:27:16<12:49:26, 7.64s/it, loss=0.0003, acc=0.9991, iter_time=6.87s]
Epoch 0: 51%|█████ | 6342/12384 [13:27:16<12:49:02, 7.64s/it, loss=0.0003, acc=0.9991, iter_time=6.87s]
Epoch 0: 51%|█████ | 6342/12384 [13:27:24<12:49:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.50s]
Epoch 0: 51%|█████ | 6343/12384 [13:27:24<12:49:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.50s]
Epoch 0: 51%|█████ | 6343/12384 [13:27:32<12:49:28, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=8.11s]
Epoch 0: 51%|█████ | 6344/12384 [13:27:32<12:58:31, 7.73s/it, loss=0.0002, acc=1.0000, iter_time=8.11s]
Epoch 0: 51%|█████ | 6344/12384 [13:27:39<12:58:31, 7.73s/it, loss=0.0001, acc=1.0000, iter_time=7.18s]
Epoch 0: 51%|█████ | 6345/12384 [13:27:39<12:54:31, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.18s]
Epoch 0: 51%|█████ | 6345/12384 [13:27:47<12:54:31, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 51%|█████ | 6346/12384 [13:27:47<12:52:49, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 51%|█████ | 6346/12384 [13:27:55<12:52:49, 7.68s/it, loss=0.0002, acc=0.9988, iter_time=7.73s]
Epoch 0: 51%|█████▏ | 6347/12384 [13:27:55<12:52:42, 7.68s/it, loss=0.0002, acc=0.9988, iter_time=7.73s]
Epoch 0: 51%|█████▏ | 6347/12384 [13:28:02<12:52:42, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 51%|█████▏ | 6348/12384 [13:28:02<12:52:06, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 51%|█████▏ | 6348/12384 [13:28:10<12:52:06, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.88s]
Epoch 0: 51%|█████▏ | 6349/12384 [13:28:10<12:49:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.88s]
Epoch 0: 51%|█████▏ | 6349/12384 [13:28:17<12:49:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.78s]
Epoch 0: 51%|█████▏ | 6350/12384 [13:28:17<12:48:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.78s]
Epoch 0: 51%|█████▏ | 6350/12384 [13:28:25<12:48:41, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.20s]
Epoch 0: 51%|█████▏ | 6351/12384 [13:28:25<12:46:50, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.20s]
Epoch 0: 51%|█████▏ | 6351/12384 [13:28:33<12:46:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 51%|█████▏ | 6352/12384 [13:28:33<12:46:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 51%|█████▏ | 6352/12384 [13:28:40<12:46:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.62s]
Epoch 0: 51%|█████▏ | 6353/12384 [13:28:40<12:45:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.62s]
Epoch 0: 51%|█████▏ | 6353/12384 [13:28:48<12:45:22, 7.61s/it, loss=0.0004, acc=0.9989, iter_time=7.07s]
Epoch 0: 51%|█████▏ | 6354/12384 [13:28:48<12:45:28, 7.62s/it, loss=0.0004, acc=0.9989, iter_time=7.07s]
Epoch 0: 51%|█████▏ | 6354/12384 [13:28:56<12:45:28, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.05s]
Epoch 0: 51%|█████▏ | 6355/12384 [13:28:56<12:53:28, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=9.05s]
Epoch 0: 51%|█████▏ | 6355/12384 [13:29:03<12:53:28, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 51%|█████▏ | 6356/12384 [13:29:03<12:50:47, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 51%|█████▏ | 6356/12384 [13:29:11<12:50:47, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 0: 51%|█████▏ | 6357/12384 [13:29:11<12:48:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 0: 51%|█████▏ | 6357/12384 [13:29:19<12:48:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 0: 51%|█████▏ | 6358/12384 [13:29:19<12:46:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 0: 51%|█████▏ | 6358/12384 [13:29:26<12:46:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 0: 51%|█████▏ | 6359/12384 [13:29:26<12:45:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 0: 51%|█████▏ | 6359/12384 [13:29:34<12:45:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 0: 51%|█████▏ | 6360/12384 [13:29:34<12:44:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 0: 51%|█████▏ | 6360/12384 [13:29:41<12:44:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 51%|█████▏ | 6361/12384 [13:29:41<12:43:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 51%|█████▏ | 6361/12384 [13:29:49<12:43:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 51%|█████▏ | 6362/12384 [13:29:49<12:43:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 51%|█████▏ | 6362/12384 [13:29:57<12:43:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 51%|█████▏ | 6363/12384 [13:29:57<12:45:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 51%|█████▏ | 6363/12384 [13:30:04<12:45:58, 7.63s/it, loss=0.0004, acc=0.9991, iter_time=4.54s]
Epoch 0: 51%|█████▏ | 6364/12384 [13:30:04<12:45:36, 7.63s/it, loss=0.0004, acc=0.9991, iter_time=4.54s]
Epoch 0: 51%|█████▏ | 6364/12384 [13:30:12<12:45:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 0: 51%|█████▏ | 6365/12384 [13:30:12<12:45:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 0: 51%|█████▏ | 6365/12384 [13:30:19<12:45:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 0: 51%|█████▏ | 6366/12384 [13:30:19<12:44:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 0: 51%|█████▏ | 6366/12384 [13:30:27<12:44:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 0: 51%|█████▏ | 6367/12384 [13:30:27<12:44:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 0: 51%|█████▏ | 6367/12384 [13:30:35<12:44:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.00s]
Epoch 0: 51%|█████▏ | 6368/12384 [13:30:35<12:47:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.00s]
Epoch 0: 51%|█████▏ | 6368/12384 [13:30:42<12:47:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 51%|█████▏ | 6369/12384 [13:30:42<12:45:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 51%|█████▏ | 6369/12384 [13:30:50<12:45:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 0: 51%|█████▏ | 6370/12384 [13:30:50<12:54:30, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 0: 51%|█████▏ | 6370/12384 [13:30:58<12:54:30, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 0: 51%|█████▏ | 6371/12384 [13:30:58<12:50:53, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 0: 51%|█████▏ | 6371/12384 [13:31:06<12:50:53, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 51%|█████▏ | 6372/12384 [13:31:06<12:48:24, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 51%|█████▏ | 6372/12384 [13:31:13<12:48:24, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 51%|█████▏ | 6373/12384 [13:31:13<12:46:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 51%|█████▏ | 6373/12384 [13:31:21<12:46:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 51%|█████▏ | 6374/12384 [13:31:21<12:45:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 51%|█████▏ | 6374/12384 [13:31:28<12:45:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 51%|█████▏ | 6375/12384 [13:31:28<12:44:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 51%|█████▏ | 6375/12384 [13:31:36<12:44:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 0: 51%|█████▏ | 6376/12384 [13:31:36<12:44:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 0: 51%|█████▏ | 6376/12384 [13:31:44<12:44:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 51%|█████▏ | 6377/12384 [13:31:44<12:43:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 51%|█████▏ | 6377/12384 [13:31:51<12:43:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 52%|█████▏ | 6378/12384 [13:31:51<12:42:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 52%|█████▏ | 6378/12384 [13:31:59<12:42:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 52%|█████▏ | 6379/12384 [13:31:59<12:41:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 52%|█████▏ | 6379/12384 [13:32:06<12:41:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 52%|█████▏ | 6380/12384 [13:32:06<12:40:40, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 52%|█████▏ | 6380/12384 [13:32:14<12:40:40, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 0: 52%|█████▏ | 6381/12384 [13:32:14<12:48:43, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 0: 52%|█████▏ | 6381/12384 [13:32:22<12:48:43, 7.68s/it, loss=0.0001, acc=0.9999, iter_time=7.59s]
Epoch 0: 52%|█████▏ | 6382/12384 [13:32:22<12:46:34, 7.66s/it, loss=0.0001, acc=0.9999, iter_time=7.59s]
Epoch 0: 52%|█████▏ | 6382/12384 [13:32:30<12:46:34, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 0: 52%|█████▏ | 6383/12384 [13:32:30<12:45:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 0: 52%|█████▏ | 6383/12384 [13:32:37<12:45:30, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.67s]
Epoch 0: 52%|█████▏ | 6384/12384 [13:32:37<12:43:56, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.67s]
Epoch 0: 52%|█████▏ | 6384/12384 [13:32:45<12:43:56, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=4.88s]
Epoch 0: 52%|█████▏ | 6385/12384 [13:32:45<12:43:01, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=4.88s]
Epoch 0: 52%|█████▏ | 6385/12384 [13:32:52<12:43:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 0: 52%|█████▏ | 6386/12384 [13:32:52<12:42:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 0: 52%|█████▏ | 6386/12384 [13:33:00<12:42:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 0: 52%|█████▏ | 6387/12384 [13:33:00<12:41:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 0: 52%|█████▏ | 6387/12384 [13:33:08<12:41:50, 7.62s/it, loss=0.0000, acc=0.9998, iter_time=9.70s]
Epoch 0: 52%|█████▏ | 6388/12384 [13:33:08<12:41:12, 7.62s/it, loss=0.0000, acc=0.9998, iter_time=9.70s]
Epoch 0: 52%|█████▏ | 6388/12384 [13:33:15<12:41:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.55s]
Epoch 0: 52%|█████▏ | 6389/12384 [13:33:15<12:41:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.55s]
Epoch 0: 52%|█████▏ | 6389/12384 [13:33:23<12:41:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.89s]
Epoch 0: 52%|█████▏ | 6390/12384 [13:33:23<12:41:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.89s]
Epoch 0: 52%|█████▏ | 6390/12384 [13:33:30<12:41:03, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.43s]
Epoch 0: 52%|█████▏ | 6391/12384 [13:33:30<12:41:38, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.43s]
Epoch 0: 52%|█████▏ | 6391/12384 [13:33:38<12:41:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 52%|█████▏ | 6392/12384 [13:33:38<12:40:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 52%|█████▏ | 6392/12384 [13:33:46<12:40:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 52%|█████▏ | 6393/12384 [13:33:46<12:40:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 52%|█████▏ | 6393/12384 [13:33:53<12:40:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 0: 52%|█████▏ | 6394/12384 [13:33:53<12:40:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 0: 52%|█████▏ | 6394/12384 [13:34:01<12:40:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 0: 52%|█████▏ | 6395/12384 [13:34:01<12:40:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 0: 52%|█████▏ | 6395/12384 [13:34:09<12:40:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 52%|█████▏ | 6396/12384 [13:34:09<12:39:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 52%|█████▏ | 6396/12384 [13:34:16<12:39:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 0: 52%|█████▏ | 6397/12384 [13:34:16<12:48:51, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 0: 52%|█████▏ | 6397/12384 [13:34:24<12:48:51, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 0: 52%|█████▏ | 6398/12384 [13:34:24<12:46:02, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 0: 52%|█████▏ | 6398/12384 [13:34:32<12:46:02, 7.68s/it, loss=0.0003, acc=1.0000, iter_time=9.14s]
Epoch 0: 52%|█████▏ | 6399/12384 [13:34:32<12:43:16, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=9.14s]
Epoch 0: 52%|█████▏ | 6399/12384 [13:34:39<12:43:16, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.97s]
Epoch 0: 52%|█████▏ | 6400/12384 [13:34:39<12:41:07, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.97s]
Epoch 0: 52%|█████▏ | 6400/12384 [13:34:47<12:41:07, 7.63s/it, loss=0.0001, acc=0.9999, iter_time=7.21s]
Epoch 0: 52%|█████▏ | 6401/12384 [13:34:47<12:41:08, 7.63s/it, loss=0.0001, acc=0.9999, iter_time=7.21s]
Epoch 0: 52%|█████▏ | 6401/12384 [13:34:54<12:41:08, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 0: 52%|█████▏ | 6402/12384 [13:34:54<12:40:26, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 0: 52%|█████▏ | 6402/12384 [13:35:02<12:40:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 52%|█████▏ | 6403/12384 [13:35:02<12:39:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 52%|█████▏ | 6403/12384 [13:35:10<12:39:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 52%|█████▏ | 6404/12384 [13:35:10<12:38:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 52%|█████▏ | 6404/12384 [13:35:17<12:38:27, 7.61s/it, loss=0.0003, acc=0.9977, iter_time=4.79s]
Epoch 0: 52%|█████▏ | 6405/12384 [13:35:17<12:38:21, 7.61s/it, loss=0.0003, acc=0.9977, iter_time=4.79s]
Epoch 0: 52%|█████▏ | 6405/12384 [13:35:25<12:38:21, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.41s]
Epoch 0: 52%|█████▏ | 6406/12384 [13:35:25<12:37:51, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.41s]
Epoch 0: 52%|█████▏ | 6406/12384 [13:35:33<12:37:51, 7.61s/it, loss=0.0004, acc=0.9975, iter_time=7.89s]
Epoch 0: 52%|█████▏ | 6407/12384 [13:35:33<12:45:56, 7.69s/it, loss=0.0004, acc=0.9975, iter_time=7.89s]
Epoch 0: 52%|█████▏ | 6407/12384 [13:35:40<12:45:56, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 52%|█████▏ | 6408/12384 [13:35:40<12:43:13, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 52%|█████▏ | 6408/12384 [13:35:48<12:43:13, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=3.36s]
Epoch 0: 52%|█████▏ | 6409/12384 [13:35:48<12:41:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=3.36s]
Epoch 0: 52%|█████▏ | 6409/12384 [13:35:56<12:41:21, 7.65s/it, loss=0.0002, acc=0.9994, iter_time=11.45s]
Epoch 0: 52%|█████▏ | 6410/12384 [13:35:56<12:40:37, 7.64s/it, loss=0.0002, acc=0.9994, iter_time=11.45s]
Epoch 0: 52%|█████▏ | 6410/12384 [13:36:03<12:40:37, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 52%|█████▏ | 6411/12384 [13:36:03<12:39:33, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 52%|█████▏ | 6411/12384 [13:36:11<12:39:33, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 52%|█████▏ | 6412/12384 [13:36:11<12:38:46, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 52%|█████▏ | 6412/12384 [13:36:18<12:38:46, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 52%|█████▏ | 6413/12384 [13:36:18<12:38:14, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 52%|█████▏ | 6413/12384 [13:36:26<12:38:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 52%|█████▏ | 6414/12384 [13:36:26<12:38:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 52%|█████▏ | 6414/12384 [13:36:34<12:38:08, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=7.00s]
Epoch 0: 52%|█████▏ | 6415/12384 [13:36:34<12:37:50, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=7.00s]
Epoch 0: 52%|█████▏ | 6415/12384 [13:36:41<12:37:50, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.64s]
Epoch 0: 52%|█████▏ | 6416/12384 [13:36:41<12:37:32, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.64s]
Epoch 0: 52%|█████▏ | 6416/12384 [13:36:49<12:37:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.89s]
Epoch 0: 52%|█████▏ | 6417/12384 [13:36:49<12:37:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.89s]
Epoch 0: 52%|█████▏ | 6417/12384 [13:36:57<12:37:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 0: 52%|█████▏ | 6418/12384 [13:36:57<12:37:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 0: 52%|█████▏ | 6418/12384 [13:37:04<12:37:23, 7.62s/it, loss=0.0007, acc=0.9976, iter_time=7.62s]
Epoch 0: 52%|█████▏ | 6419/12384 [13:37:04<12:36:42, 7.61s/it, loss=0.0007, acc=0.9976, iter_time=7.62s]
Epoch 0: 52%|█████▏ | 6419/12384 [13:37:12<12:36:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 52%|█████▏ | 6420/12384 [13:37:12<12:36:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 52%|█████▏ | 6420/12384 [13:37:19<12:36:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 52%|█████▏ | 6421/12384 [13:37:19<12:35:36, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 52%|█████▏ | 6421/12384 [13:37:27<12:35:36, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 52%|█████▏ | 6422/12384 [13:37:27<12:35:39, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 52%|█████▏ | 6422/12384 [13:37:35<12:35:39, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 52%|█████▏ | 6423/12384 [13:37:35<12:45:33, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 52%|█████▏ | 6423/12384 [13:37:43<12:45:33, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 0: 52%|█████▏ | 6424/12384 [13:37:43<12:45:57, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 0: 52%|█████▏ | 6424/12384 [13:37:50<12:45:57, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.32s]
Epoch 0: 52%|█████▏ | 6425/12384 [13:37:50<12:42:19, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.32s]
Epoch 0: 52%|█████▏ | 6425/12384 [13:37:58<12:42:19, 7.68s/it, loss=0.0002, acc=0.9997, iter_time=7.66s]
Epoch 0: 52%|█████▏ | 6426/12384 [13:37:58<12:41:51, 7.67s/it, loss=0.0002, acc=0.9997, iter_time=7.66s]
Epoch 0: 52%|█████▏ | 6426/12384 [13:38:05<12:41:51, 7.67s/it, loss=0.0003, acc=0.9984, iter_time=5.49s]
Epoch 0: 52%|█████▏ | 6427/12384 [13:38:05<12:40:14, 7.66s/it, loss=0.0003, acc=0.9984, iter_time=5.49s]
Epoch 0: 52%|█████▏ | 6427/12384 [13:38:13<12:40:14, 7.66s/it, loss=0.0005, acc=1.0000, iter_time=9.74s]
Epoch 0: 52%|█████▏ | 6428/12384 [13:38:13<12:38:20, 7.64s/it, loss=0.0005, acc=1.0000, iter_time=9.74s]
Epoch 0: 52%|█████▏ | 6428/12384 [13:38:21<12:38:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 52%|█████▏ | 6429/12384 [13:38:21<12:37:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 52%|█████▏ | 6429/12384 [13:38:28<12:37:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 0: 52%|█████▏ | 6430/12384 [13:38:28<12:36:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 0: 52%|█████▏ | 6430/12384 [13:38:36<12:36:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 0: 52%|█████▏ | 6431/12384 [13:38:36<12:36:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 0: 52%|█████▏ | 6431/12384 [13:38:44<12:36:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 52%|█████▏ | 6432/12384 [13:38:44<12:35:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 52%|█████▏ | 6432/12384 [13:38:51<12:35:59, 7.62s/it, loss=0.0002, acc=0.9999, iter_time=7.51s]
Epoch 0: 52%|█████▏ | 6433/12384 [13:38:51<12:43:24, 7.70s/it, loss=0.0002, acc=0.9999, iter_time=7.51s]
Epoch 0: 52%|█████▏ | 6433/12384 [13:38:59<12:43:24, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 52%|█████▏ | 6434/12384 [13:38:59<12:41:15, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 52%|█████▏ | 6434/12384 [13:39:07<12:41:15, 7.68s/it, loss=0.0001, acc=0.9998, iter_time=7.61s]
Epoch 0: 52%|█████▏ | 6435/12384 [13:39:07<12:38:35, 7.65s/it, loss=0.0001, acc=0.9998, iter_time=7.61s]
Epoch 0: 52%|█████▏ | 6435/12384 [13:39:14<12:38:35, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 52%|█████▏ | 6436/12384 [13:39:14<12:37:46, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 52%|█████▏ | 6436/12384 [13:39:22<12:37:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 52%|█████▏ | 6437/12384 [13:39:22<12:36:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 52%|█████▏ | 6437/12384 [13:39:29<12:36:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.31s]
Epoch 0: 52%|█████▏ | 6438/12384 [13:39:29<12:36:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.31s]
Epoch 0: 52%|█████▏ | 6438/12384 [13:39:37<12:36:02, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.79s]
Epoch 0: 52%|█████▏ | 6439/12384 [13:39:37<12:35:28, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.79s]
Epoch 0: 52%|█████▏ | 6439/12384 [13:39:45<12:35:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.85s]
Epoch 0: 52%|█████▏ | 6440/12384 [13:39:45<12:34:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.85s]
Epoch 0: 52%|█████▏ | 6440/12384 [13:39:52<12:34:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.48s]
Epoch 0: 52%|█████▏ | 6441/12384 [13:39:52<12:33:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.48s]
Epoch 0: 52%|█████▏ | 6441/12384 [13:40:00<12:33:44, 7.61s/it, loss=0.0002, acc=0.9977, iter_time=5.32s]
Epoch 0: 52%|█████▏ | 6442/12384 [13:40:00<12:34:07, 7.61s/it, loss=0.0002, acc=0.9977, iter_time=5.32s]
Epoch 0: 52%|█████▏ | 6442/12384 [13:40:08<12:34:07, 7.61s/it, loss=0.0003, acc=0.9985, iter_time=7.13s]
Epoch 0: 52%|█████▏ | 6443/12384 [13:40:08<12:34:11, 7.62s/it, loss=0.0003, acc=0.9985, iter_time=7.13s]
Epoch 0: 52%|█████▏ | 6443/12384 [13:40:15<12:34:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.38s]
Epoch 0: 52%|█████▏ | 6444/12384 [13:40:15<12:33:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.38s]
Epoch 0: 52%|█████▏ | 6444/12384 [13:40:23<12:33:40, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 52%|█████▏ | 6445/12384 [13:40:23<12:33:33, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 52%|█████▏ | 6445/12384 [13:40:30<12:33:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 52%|█████▏ | 6446/12384 [13:40:30<12:33:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 52%|█████▏ | 6446/12384 [13:40:38<12:33:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 52%|█████▏ | 6447/12384 [13:40:38<12:33:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 52%|█████▏ | 6447/12384 [13:40:46<12:33:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 52%|█████▏ | 6448/12384 [13:40:46<12:33:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 52%|█████▏ | 6448/12384 [13:40:54<12:33:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 52%|█████▏ | 6449/12384 [13:40:54<12:43:42, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 52%|█████▏ | 6449/12384 [13:41:01<12:43:42, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.33s]
Epoch 0: 52%|█████▏ | 6450/12384 [13:41:01<12:40:06, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.33s]
Epoch 0: 52%|█████▏ | 6450/12384 [13:41:09<12:40:06, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.95s]
Epoch 0: 52%|█████▏ | 6451/12384 [13:41:09<12:38:04, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.95s]
Epoch 0: 52%|█████▏ | 6451/12384 [13:41:16<12:38:04, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 0: 52%|█████▏ | 6452/12384 [13:41:16<12:35:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 0: 52%|█████▏ | 6452/12384 [13:41:24<12:35:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 0: 52%|█████▏ | 6453/12384 [13:41:24<12:35:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 0: 52%|█████▏ | 6453/12384 [13:41:32<12:35:12, 7.64s/it, loss=0.0005, acc=0.9977, iter_time=6.85s]
Epoch 0: 52%|█████▏ | 6454/12384 [13:41:32<12:34:23, 7.63s/it, loss=0.0005, acc=0.9977, iter_time=6.85s]
Epoch 0: 52%|█████▏ | 6454/12384 [13:41:39<12:34:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.71s]
Epoch 0: 52%|█████▏ | 6455/12384 [13:41:39<12:33:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.71s]
Epoch 0: 52%|█████▏ | 6455/12384 [13:41:47<12:33:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 52%|█████▏ | 6456/12384 [13:41:47<12:32:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 52%|█████▏ | 6456/12384 [13:41:55<12:32:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 0: 52%|█████▏ | 6457/12384 [13:41:55<12:35:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 0: 52%|█████▏ | 6457/12384 [13:42:02<12:35:10, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 52%|█████▏ | 6458/12384 [13:42:02<12:33:58, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 52%|█████▏ | 6458/12384 [13:42:10<12:33:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 52%|█████▏ | 6459/12384 [13:42:10<12:41:39, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 52%|█████▏ | 6459/12384 [13:42:18<12:41:39, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 52%|█████▏ | 6460/12384 [13:42:18<12:38:49, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 52%|█████▏ | 6460/12384 [13:42:25<12:38:49, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 52%|█████▏ | 6461/12384 [13:42:25<12:36:25, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 52%|█████▏ | 6461/12384 [13:42:33<12:36:25, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 52%|█████▏ | 6462/12384 [13:42:33<12:35:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 52%|█████▏ | 6462/12384 [13:42:41<12:35:03, 7.65s/it, loss=0.0003, acc=0.9984, iter_time=5.36s]
Epoch 0: 52%|█████▏ | 6463/12384 [13:42:41<12:34:03, 7.64s/it, loss=0.0003, acc=0.9984, iter_time=5.36s]
Epoch 0: 52%|█████▏ | 6463/12384 [13:42:48<12:34:03, 7.64s/it, loss=0.0001, acc=0.9999, iter_time=10.28s]
Epoch 0: 52%|█████▏ | 6464/12384 [13:42:48<12:33:22, 7.64s/it, loss=0.0001, acc=0.9999, iter_time=10.28s]
Epoch 0: 52%|█████▏ | 6464/12384 [13:42:56<12:33:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.03s]
Epoch 0: 52%|█████▏ | 6465/12384 [13:42:56<12:32:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.03s]
Epoch 0: 52%|█████▏ | 6465/12384 [13:43:03<12:32:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 0: 52%|█████▏ | 6466/12384 [13:43:03<12:33:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 0: 52%|█████▏ | 6466/12384 [13:43:11<12:33:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 0: 52%|█████▏ | 6467/12384 [13:43:11<12:33:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 0: 52%|█████▏ | 6467/12384 [13:43:19<12:33:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 52%|█████▏ | 6468/12384 [13:43:19<12:32:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 52%|█████▏ | 6468/12384 [13:43:26<12:32:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 52%|█████▏ | 6469/12384 [13:43:26<12:31:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 52%|█████▏ | 6469/12384 [13:43:34<12:31:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 0: 52%|█████▏ | 6470/12384 [13:43:34<12:43:56, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 0: 52%|█████▏ | 6470/12384 [13:43:42<12:43:56, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=4.64s]
Epoch 0: 52%|█████▏ | 6471/12384 [13:43:42<12:39:37, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.64s]
Epoch 0: 52%|█████▏ | 6471/12384 [13:43:50<12:39:37, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 0: 52%|█████▏ | 6472/12384 [13:43:50<12:37:00, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 0: 52%|█████▏ | 6472/12384 [13:43:57<12:37:00, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 0: 52%|█████▏ | 6473/12384 [13:43:57<12:34:17, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 0: 52%|█████▏ | 6473/12384 [13:44:05<12:34:17, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 52%|█████▏ | 6474/12384 [13:44:05<12:32:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 52%|█████▏ | 6474/12384 [13:44:13<12:32:26, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=10.92s]
Epoch 0: 52%|█████▏ | 6475/12384 [13:44:13<12:41:43, 7.73s/it, loss=0.0001, acc=1.0000, iter_time=10.92s]
Epoch 0: 52%|█████▏ | 6475/12384 [13:44:20<12:41:43, 7.73s/it, loss=0.0001, acc=1.0000, iter_time=5.88s]
Epoch 0: 52%|█████▏ | 6476/12384 [13:44:20<12:37:10, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=5.88s]
Epoch 0: 52%|█████▏ | 6476/12384 [13:44:28<12:37:10, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.62s]
Epoch 0: 52%|█████▏ | 6477/12384 [13:44:28<12:35:00, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.62s]
Epoch 0: 52%|█████▏ | 6477/12384 [13:44:36<12:35:00, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 52%|█████▏ | 6478/12384 [13:44:36<12:33:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 52%|█████▏ | 6478/12384 [13:44:43<12:33:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 0: 52%|█████▏ | 6479/12384 [13:44:43<12:32:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 0: 52%|█████▏ | 6479/12384 [13:44:51<12:32:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 0: 52%|█████▏ | 6480/12384 [13:44:51<12:31:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 0: 52%|█████▏ | 6480/12384 [13:44:58<12:31:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 52%|█████▏ | 6481/12384 [13:44:58<12:30:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 52%|█████▏ | 6481/12384 [13:45:06<12:30:49, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 52%|█████▏ | 6482/12384 [13:45:06<12:30:00, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 52%|█████▏ | 6482/12384 [13:45:14<12:30:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 0: 52%|█████▏ | 6483/12384 [13:45:14<12:27:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 0: 52%|█████▏ | 6483/12384 [13:45:21<12:27:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.42s]
Epoch 0: 52%|█████▏ | 6484/12384 [13:45:21<12:28:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.42s]
Epoch 0: 52%|█████▏ | 6484/12384 [13:45:29<12:28:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 52%|█████▏ | 6485/12384 [13:45:29<12:29:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 52%|█████▏ | 6485/12384 [13:45:36<12:29:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 0: 52%|█████▏ | 6486/12384 [13:45:36<12:28:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 0: 52%|█████▏ | 6486/12384 [13:45:44<12:28:40, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.64s]
Epoch 0: 52%|█████▏ | 6487/12384 [13:45:44<12:28:44, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.64s]
Epoch 0: 52%|█████▏ | 6487/12384 [13:45:52<12:28:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 0: 52%|█████▏ | 6488/12384 [13:45:52<12:28:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 0: 52%|█████▏ | 6488/12384 [13:45:59<12:28:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 52%|█████▏ | 6489/12384 [13:45:59<12:28:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 52%|█████▏ | 6489/12384 [13:46:07<12:28:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 52%|█████▏ | 6490/12384 [13:46:07<12:27:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 52%|█████▏ | 6490/12384 [13:46:14<12:27:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 52%|█████▏ | 6491/12384 [13:46:14<12:27:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 52%|█████▏ | 6491/12384 [13:46:22<12:27:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 0: 52%|█████▏ | 6492/12384 [13:46:22<12:27:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 0: 52%|█████▏ | 6492/12384 [13:46:30<12:27:25, 7.61s/it, loss=0.0002, acc=0.9999, iter_time=7.91s]
Epoch 0: 52%|█████▏ | 6493/12384 [13:46:30<12:27:05, 7.61s/it, loss=0.0002, acc=0.9999, iter_time=7.91s]
Epoch 0: 52%|█████▏ | 6493/12384 [13:46:37<12:27:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 52%|█████▏ | 6494/12384 [13:46:37<12:27:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 52%|█████▏ | 6494/12384 [13:46:45<12:27:01, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 52%|█████▏ | 6495/12384 [13:46:45<12:29:13, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 52%|█████▏ | 6495/12384 [13:46:53<12:29:13, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.07s]
Epoch 0: 52%|█████▏ | 6496/12384 [13:46:53<12:28:11, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.07s]
Epoch 0: 52%|█████▏ | 6496/12384 [13:47:00<12:28:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 52%|█████▏ | 6497/12384 [13:47:00<12:29:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 52%|█████▏ | 6497/12384 [13:47:08<12:29:19, 7.64s/it, loss=0.0001, acc=0.9999, iter_time=7.69s]
Epoch 0: 52%|█████▏ | 6498/12384 [13:47:08<12:28:36, 7.63s/it, loss=0.0001, acc=0.9999, iter_time=7.69s]
Epoch 0: 52%|█████▏ | 6498/12384 [13:47:16<12:28:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 52%|█████▏ | 6499/12384 [13:47:16<12:27:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 52%|█████▏ | 6499/12384 [13:47:23<12:27:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 52%|█████▏ | 6500/12384 [13:47:23<12:33:07, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 52%|█████▏ | 6500/12384 [13:47:31<12:33:07, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.15s]
Epoch 0: 52%|█████▏ | 6501/12384 [13:47:31<12:41:09, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.15s]
Epoch 0: 52%|█████▏ | 6501/12384 [13:47:39<12:41:09, 7.76s/it, loss=0.0002, acc=1.0000, iter_time=8.20s]
Epoch 0: 53%|█████▎ | 6502/12384 [13:47:39<12:36:02, 7.71s/it, loss=0.0002, acc=1.0000, iter_time=8.20s]
Epoch 0: 53%|█████▎ | 6502/12384 [13:47:47<12:36:02, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 53%|█████▎ | 6503/12384 [13:47:47<12:34:22, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 53%|█████▎ | 6503/12384 [13:47:54<12:34:22, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 0: 53%|█████▎ | 6504/12384 [13:47:54<12:34:04, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 0: 53%|█████▎ | 6504/12384 [13:48:02<12:34:04, 7.69s/it, loss=0.0002, acc=1.0000, iter_time=6.12s]
Epoch 0: 53%|█████▎ | 6505/12384 [13:48:02<12:31:18, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=6.12s]
Epoch 0: 53%|█████▎ | 6505/12384 [13:48:09<12:31:18, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 0: 53%|█████▎ | 6506/12384 [13:48:09<12:29:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 0: 53%|█████▎ | 6506/12384 [13:48:17<12:29:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.86s]
Epoch 0: 53%|█████▎ | 6507/12384 [13:48:17<12:28:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.86s]
Epoch 0: 53%|█████▎ | 6507/12384 [13:48:25<12:28:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 0: 53%|█████▎ | 6508/12384 [13:48:25<12:27:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 0: 53%|█████▎ | 6508/12384 [13:48:32<12:27:36, 7.63s/it, loss=0.0001, acc=0.9996, iter_time=9.05s]
Epoch 0: 53%|█████▎ | 6509/12384 [13:48:32<12:26:24, 7.62s/it, loss=0.0001, acc=0.9996, iter_time=9.05s]
Epoch 0: 53%|█████▎ | 6509/12384 [13:48:40<12:26:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.55s]
Epoch 0: 53%|█████▎ | 6510/12384 [13:48:40<12:26:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.55s]
Epoch 0: 53%|█████▎ | 6510/12384 [13:48:48<12:26:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.86s]
Epoch 0: 53%|█████▎ | 6511/12384 [13:48:48<12:28:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.86s]
Epoch 0: 53%|█████▎ | 6511/12384 [13:48:55<12:28:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.47s]
Epoch 0: 53%|█████▎ | 6512/12384 [13:48:55<12:27:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.47s]
Epoch 0: 53%|█████▎ | 6512/12384 [13:49:03<12:27:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 53%|█████▎ | 6513/12384 [13:49:03<12:26:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 53%|█████▎ | 6513/12384 [13:49:11<12:26:19, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.40s]
Epoch 0: 53%|█████▎ | 6514/12384 [13:49:11<12:28:48, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=6.40s]
Epoch 0: 53%|█████▎ | 6514/12384 [13:49:18<12:28:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.95s]
Epoch 0: 53%|█████▎ | 6515/12384 [13:49:18<12:27:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.95s]
Epoch 0: 53%|█████▎ | 6515/12384 [13:49:26<12:27:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 0: 53%|█████▎ | 6516/12384 [13:49:26<12:27:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 0: 53%|█████▎ | 6516/12384 [13:49:33<12:27:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 0: 53%|█████▎ | 6517/12384 [13:49:33<12:26:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 0: 53%|█████▎ | 6517/12384 [13:49:41<12:26:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 0: 53%|█████▎ | 6518/12384 [13:49:41<12:25:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 0: 53%|█████▎ | 6518/12384 [13:49:49<12:25:49, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.89s]
Epoch 0: 53%|█████▎ | 6519/12384 [13:49:49<12:24:57, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.89s]
Epoch 0: 53%|█████▎ | 6519/12384 [13:49:56<12:24:57, 7.62s/it, loss=0.0002, acc=0.9988, iter_time=7.71s]
Epoch 0: 53%|█████▎ | 6520/12384 [13:49:56<12:25:46, 7.63s/it, loss=0.0002, acc=0.9988, iter_time=7.71s]
Epoch 0: 53%|█████▎ | 6520/12384 [13:50:04<12:25:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 0: 53%|█████▎ | 6521/12384 [13:50:04<12:24:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 0: 53%|█████▎ | 6521/12384 [13:50:12<12:24:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 0: 53%|█████▎ | 6522/12384 [13:50:12<12:25:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 0: 53%|█████▎ | 6522/12384 [13:50:19<12:25:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 0: 53%|█████▎ | 6523/12384 [13:50:19<12:25:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 0: 53%|█████▎ | 6523/12384 [13:50:27<12:25:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 0: 53%|█████▎ | 6524/12384 [13:50:27<12:24:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 0: 53%|█████▎ | 6524/12384 [13:50:34<12:24:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.63s]
Epoch 0: 53%|█████▎ | 6525/12384 [13:50:34<12:24:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.63s]
Epoch 0: 53%|█████▎ | 6525/12384 [13:50:42<12:24:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.62s]
Epoch 0: 53%|█████▎ | 6526/12384 [13:50:42<12:24:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.62s]
Epoch 0: 53%|█████▎ | 6526/12384 [13:50:50<12:24:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 0: 53%|█████▎ | 6527/12384 [13:50:50<12:24:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 0: 53%|█████▎ | 6527/12384 [13:50:58<12:24:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.87s]
Epoch 0: 53%|█████▎ | 6528/12384 [13:50:58<12:35:02, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.87s]
Epoch 0: 53%|█████▎ | 6528/12384 [13:51:05<12:35:02, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=6.52s]
Epoch 0: 53%|█████▎ | 6529/12384 [13:51:05<12:30:26, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.52s]
Epoch 0: 53%|█████▎ | 6529/12384 [13:51:13<12:30:26, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.72s]
Epoch 0: 53%|█████▎ | 6530/12384 [13:51:13<12:27:07, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.72s]
Epoch 0: 53%|█████▎ | 6530/12384 [13:51:20<12:27:07, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 53%|█████▎ | 6531/12384 [13:51:20<12:25:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 53%|█████▎ | 6531/12384 [13:51:28<12:25:17, 7.64s/it, loss=0.0002, acc=0.9995, iter_time=7.60s]
Epoch 0: 53%|█████▎ | 6532/12384 [13:51:28<12:24:45, 7.64s/it, loss=0.0002, acc=0.9995, iter_time=7.60s]
Epoch 0: 53%|█████▎ | 6532/12384 [13:51:36<12:24:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 0: 53%|█████▎ | 6533/12384 [13:51:36<12:24:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 0: 53%|█████▎ | 6533/12384 [13:51:43<12:24:04, 7.63s/it, loss=0.0007, acc=0.9960, iter_time=8.21s]
Epoch 0: 53%|█████▎ | 6534/12384 [13:51:43<12:24:12, 7.63s/it, loss=0.0007, acc=0.9960, iter_time=8.21s]
Epoch 0: 53%|█████▎ | 6534/12384 [13:51:51<12:24:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 0: 53%|█████▎ | 6535/12384 [13:51:51<12:23:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 0: 53%|█████▎ | 6535/12384 [13:51:58<12:23:02, 7.62s/it, loss=0.0014, acc=0.9990, iter_time=8.54s]
Epoch 0: 53%|█████▎ | 6536/12384 [13:51:58<12:22:44, 7.62s/it, loss=0.0014, acc=0.9990, iter_time=8.54s]
Epoch 0: 53%|█████▎ | 6536/12384 [13:52:06<12:22:44, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.98s]
Epoch 0: 53%|█████▎ | 6537/12384 [13:52:06<12:24:53, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.98s]
Epoch 0: 53%|█████▎ | 6537/12384 [13:52:14<12:24:53, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.26s]
Epoch 0: 53%|█████▎ | 6538/12384 [13:52:14<12:32:46, 7.73s/it, loss=0.0001, acc=1.0000, iter_time=8.26s]
Epoch 0: 53%|█████▎ | 6538/12384 [13:52:22<12:32:46, 7.73s/it, loss=0.0002, acc=0.9989, iter_time=7.59s]
Epoch 0: 53%|█████▎ | 6539/12384 [13:52:22<12:29:09, 7.69s/it, loss=0.0002, acc=0.9989, iter_time=7.59s]
Epoch 0: 53%|█████▎ | 6539/12384 [13:52:29<12:29:09, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 53%|█████▎ | 6540/12384 [13:52:29<12:28:45, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 53%|█████▎ | 6540/12384 [13:52:37<12:28:45, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 53%|█████▎ | 6541/12384 [13:52:37<12:26:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 53%|█████▎ | 6541/12384 [13:52:45<12:26:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 53%|█████▎ | 6542/12384 [13:52:45<12:24:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 53%|█████▎ | 6542/12384 [13:52:52<12:24:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 53%|█████▎ | 6543/12384 [13:52:52<12:23:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 53%|█████▎ | 6543/12384 [13:53:00<12:23:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 53%|█████▎ | 6544/12384 [13:53:00<12:22:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 53%|█████▎ | 6544/12384 [13:53:07<12:22:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.83s]
Epoch 0: 53%|█████▎ | 6545/12384 [13:53:07<12:22:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.83s]
Epoch 0: 53%|█████▎ | 6545/12384 [13:53:15<12:22:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.27s]
Epoch 0: 53%|█████▎ | 6546/12384 [13:53:15<12:21:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.27s]
Epoch 0: 53%|█████▎ | 6546/12384 [13:53:23<12:21:46, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.34s]
Epoch 0: 53%|█████▎ | 6547/12384 [13:53:23<12:23:03, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=9.34s]
Epoch 0: 53%|█████▎ | 6547/12384 [13:53:30<12:23:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.95s]
Epoch 0: 53%|█████▎ | 6548/12384 [13:53:30<12:22:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.95s]
Epoch 0: 53%|█████▎ | 6548/12384 [13:53:38<12:22:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 0: 53%|█████▎ | 6549/12384 [13:53:38<12:22:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 0: 53%|█████▎ | 6549/12384 [13:53:46<12:22:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 0: 53%|█████▎ | 6550/12384 [13:53:46<12:22:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 0: 53%|█████▎ | 6550/12384 [13:53:53<12:22:00, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 0: 53%|█████▎ | 6551/12384 [13:53:53<12:21:36, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 0: 53%|█████▎ | 6551/12384 [13:54:01<12:21:36, 7.63s/it, loss=0.0003, acc=0.9989, iter_time=8.00s]
Epoch 0: 53%|█████▎ | 6552/12384 [13:54:01<12:21:03, 7.62s/it, loss=0.0003, acc=0.9989, iter_time=8.00s]
Epoch 0: 53%|█████▎ | 6552/12384 [13:54:08<12:21:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 53%|█████▎ | 6553/12384 [13:54:08<12:20:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 53%|█████▎ | 6553/12384 [13:54:17<12:20:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 53%|█████▎ | 6554/12384 [13:54:17<12:32:34, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 53%|█████▎ | 6554/12384 [13:54:24<12:32:34, 7.75s/it, loss=0.0001, acc=1.0000, iter_time=7.98s]
Epoch 0: 53%|█████▎ | 6555/12384 [13:54:24<12:29:26, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.98s]
Epoch 0: 53%|█████▎ | 6555/12384 [13:54:32<12:29:26, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 0: 53%|█████▎ | 6556/12384 [13:54:32<12:26:58, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 0: 53%|█████▎ | 6556/12384 [13:54:39<12:26:58, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 0: 53%|█████▎ | 6557/12384 [13:54:39<12:24:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 0: 53%|█████▎ | 6557/12384 [13:54:47<12:24:37, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=8.84s]
Epoch 0: 53%|█████▎ | 6558/12384 [13:54:47<12:22:51, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.84s]
Epoch 0: 53%|█████▎ | 6558/12384 [13:54:55<12:22:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 53%|█████▎ | 6559/12384 [13:54:55<12:21:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 53%|█████▎ | 6559/12384 [13:55:02<12:21:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 53%|█████▎ | 6560/12384 [13:55:02<12:20:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 53%|█████▎ | 6560/12384 [13:55:10<12:20:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 0: 53%|█████▎ | 6561/12384 [13:55:10<12:22:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 0: 53%|█████▎ | 6561/12384 [13:55:18<12:22:05, 7.65s/it, loss=0.0004, acc=0.9997, iter_time=7.62s]
Epoch 0: 53%|█████▎ | 6562/12384 [13:55:18<12:21:01, 7.64s/it, loss=0.0004, acc=0.9997, iter_time=7.62s]
Epoch 0: 53%|█████▎ | 6562/12384 [13:55:25<12:21:01, 7.64s/it, loss=0.0002, acc=0.9997, iter_time=5.51s]
Epoch 0: 53%|█████▎ | 6563/12384 [13:55:25<12:20:26, 7.63s/it, loss=0.0002, acc=0.9997, iter_time=5.51s]
Epoch 0: 53%|█████▎ | 6563/12384 [13:55:33<12:20:26, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=9.99s]
Epoch 0: 53%|█████▎ | 6564/12384 [13:55:33<12:27:37, 7.71s/it, loss=0.0001, acc=0.9998, iter_time=9.99s]
Epoch 0: 53%|█████▎ | 6564/12384 [13:55:41<12:27:37, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.01s]
Epoch 0: 53%|█████▎ | 6565/12384 [13:55:41<12:24:10, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.01s]
Epoch 0: 53%|█████▎ | 6565/12384 [13:55:48<12:24:10, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 53%|█████▎ | 6566/12384 [13:55:48<12:21:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 53%|█████▎ | 6566/12384 [13:55:56<12:21:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 0: 53%|█████▎ | 6567/12384 [13:55:56<12:20:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 0: 53%|█████▎ | 6567/12384 [13:56:03<12:20:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.30s]
Epoch 0: 53%|█████▎ | 6568/12384 [13:56:03<12:20:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.30s]
Epoch 0: 53%|█████▎ | 6568/12384 [13:56:11<12:20:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 0: 53%|█████▎ | 6569/12384 [13:56:11<12:19:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 0: 53%|█████▎ | 6569/12384 [13:56:19<12:19:30, 7.63s/it, loss=0.0002, acc=0.9992, iter_time=6.43s]
Epoch 0: 53%|█████▎ | 6570/12384 [13:56:19<12:18:27, 7.62s/it, loss=0.0002, acc=0.9992, iter_time=6.43s]
Epoch 0: 53%|█████▎ | 6570/12384 [13:56:27<12:18:27, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=5.54s]
Epoch 0: 53%|█████▎ | 6571/12384 [13:56:27<12:36:15, 7.81s/it, loss=0.0002, acc=1.0000, iter_time=5.54s]
Epoch 0: 53%|█████▎ | 6571/12384 [13:56:35<12:36:15, 7.81s/it, loss=0.0000, acc=1.0000, iter_time=11.48s]
Epoch 0: 53%|█████▎ | 6572/12384 [13:56:35<12:30:52, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=11.48s]
Epoch 0: 53%|█████▎ | 6572/12384 [13:56:42<12:30:52, 7.75s/it, loss=0.0004, acc=0.9997, iter_time=4.02s]
Epoch 0: 53%|█████▎ | 6573/12384 [13:56:42<12:27:05, 7.71s/it, loss=0.0004, acc=0.9997, iter_time=4.02s]
Epoch 0: 53%|█████▎ | 6573/12384 [13:56:50<12:27:05, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=11.23s]
Epoch 0: 53%|█████▎ | 6574/12384 [13:56:50<12:23:22, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=11.23s]
Epoch 0: 53%|█████▎ | 6574/12384 [13:56:57<12:23:22, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 0: 53%|█████▎ | 6575/12384 [13:56:57<12:21:48, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 0: 53%|█████▎ | 6575/12384 [13:57:05<12:21:48, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 0: 53%|█████▎ | 6576/12384 [13:57:05<12:20:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 0: 53%|█████▎ | 6576/12384 [13:57:13<12:20:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 53%|█████▎ | 6577/12384 [13:57:13<12:19:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 53%|█████▎ | 6577/12384 [13:57:20<12:19:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.61s]
Epoch 0: 53%|█████▎ | 6578/12384 [13:57:20<12:20:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=3.61s]
Epoch 0: 53%|█████▎ | 6578/12384 [13:57:28<12:20:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 0: 53%|█████▎ | 6579/12384 [13:57:28<12:20:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 0: 53%|█████▎ | 6579/12384 [13:57:36<12:20:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.72s]
Epoch 0: 53%|█████▎ | 6580/12384 [13:57:36<12:19:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.72s]
Epoch 0: 53%|█████▎ | 6580/12384 [13:57:44<12:19:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 53%|█████▎ | 6581/12384 [13:57:44<12:27:13, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 53%|█████▎ | 6581/12384 [13:57:51<12:27:13, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 0: 53%|█████▎ | 6582/12384 [13:57:51<12:23:59, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 0: 53%|█████▎ | 6582/12384 [13:57:59<12:23:59, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 53%|█████▎ | 6583/12384 [13:57:59<12:21:28, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 53%|█████▎ | 6583/12384 [13:58:06<12:21:28, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 0: 53%|█████▎ | 6584/12384 [13:58:06<12:21:39, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 0: 53%|█████▎ | 6584/12384 [13:58:14<12:21:39, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 0: 53%|█████▎ | 6585/12384 [13:58:14<12:19:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 0: 53%|█████▎ | 6585/12384 [13:58:22<12:19:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.48s]
Epoch 0: 53%|█████▎ | 6586/12384 [13:58:22<12:18:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.48s]
Epoch 0: 53%|█████▎ | 6586/12384 [13:58:29<12:18:35, 7.64s/it, loss=0.0003, acc=0.9992, iter_time=7.62s]
Epoch 0: 53%|█████▎ | 6587/12384 [13:58:29<12:17:44, 7.64s/it, loss=0.0003, acc=0.9992, iter_time=7.62s]
Epoch 0: 53%|█████▎ | 6587/12384 [13:58:37<12:17:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 53%|█████▎ | 6588/12384 [13:58:37<12:17:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 53%|█████▎ | 6588/12384 [13:58:44<12:17:15, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.63s]
Epoch 0: 53%|█████▎ | 6589/12384 [13:58:44<12:16:22, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.63s]
Epoch 0: 53%|█████▎ | 6589/12384 [13:58:52<12:16:22, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.92s]
Epoch 0: 53%|█████▎ | 6590/12384 [13:58:52<12:24:25, 7.71s/it, loss=0.0002, acc=1.0000, iter_time=7.92s]
Epoch 0: 53%|█████▎ | 6590/12384 [13:59:00<12:24:25, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 53%|█████▎ | 6591/12384 [13:59:00<12:21:56, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 53%|█████▎ | 6591/12384 [13:59:08<12:21:56, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 53%|█████▎ | 6592/12384 [13:59:08<12:19:59, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 53%|█████▎ | 6592/12384 [13:59:15<12:19:59, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.87s]
Epoch 0: 53%|█████▎ | 6593/12384 [13:59:15<12:17:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.87s]
Epoch 0: 53%|█████▎ | 6593/12384 [13:59:23<12:17:41, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.54s]
Epoch 0: 53%|█████▎ | 6594/12384 [13:59:23<12:17:04, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.54s]
Epoch 0: 53%|█████▎ | 6594/12384 [13:59:31<12:17:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.17s]
Epoch 0: 53%|█████▎ | 6595/12384 [13:59:31<12:19:12, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.17s]
Epoch 0: 53%|█████▎ | 6595/12384 [13:59:38<12:19:12, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=11.01s]
Epoch 0: 53%|█████▎ | 6596/12384 [13:59:38<12:17:05, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=11.01s]
Epoch 0: 53%|█████▎ | 6596/12384 [13:59:46<12:17:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 53%|█████▎ | 6597/12384 [13:59:46<12:17:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 53%|█████▎ | 6597/12384 [13:59:53<12:17:10, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 53%|█████▎ | 6598/12384 [13:59:53<12:16:26, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 53%|█████▎ | 6598/12384 [14:00:01<12:16:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 53%|█████▎ | 6599/12384 [14:00:01<12:16:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 53%|█████▎ | 6599/12384 [14:00:09<12:16:57, 7.64s/it, loss=0.0002, acc=0.9989, iter_time=8.00s]
Epoch 0: 53%|█████▎ | 6600/12384 [14:00:09<12:15:39, 7.63s/it, loss=0.0002, acc=0.9989, iter_time=8.00s]
Epoch 0: 53%|█████▎ | 6600/12384 [14:00:16<12:15:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 53%|█████▎ | 6601/12384 [14:00:16<12:15:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 53%|█████▎ | 6601/12384 [14:00:24<12:15:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 53%|█████▎ | 6602/12384 [14:00:24<12:14:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 53%|█████▎ | 6602/12384 [14:00:32<12:14:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 53%|█████▎ | 6603/12384 [14:00:32<12:13:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 53%|█████▎ | 6603/12384 [14:00:39<12:13:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 53%|█████▎ | 6604/12384 [14:00:39<12:14:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 53%|█████▎ | 6604/12384 [14:00:47<12:14:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 0: 53%|█████▎ | 6605/12384 [14:00:47<12:15:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 0: 53%|█████▎ | 6605/12384 [14:00:54<12:15:15, 7.63s/it, loss=0.0002, acc=0.9985, iter_time=9.46s]
Epoch 0: 53%|█████▎ | 6606/12384 [14:00:54<12:14:45, 7.63s/it, loss=0.0002, acc=0.9985, iter_time=9.46s]
Epoch 0: 53%|█████▎ | 6606/12384 [14:01:04<12:14:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.69s]
Epoch 0: 53%|█████▎ | 6607/12384 [14:01:04<13:00:42, 8.11s/it, loss=0.0000, acc=1.0000, iter_time=8.69s]
Epoch 0: 53%|█████▎ | 6607/12384 [14:01:11<13:00:42, 8.11s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 0: 53%|█████▎ | 6608/12384 [14:01:11<12:46:42, 7.96s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 0: 53%|█████▎ | 6608/12384 [14:01:19<12:46:42, 7.96s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 53%|█████▎ | 6609/12384 [14:01:19<12:36:29, 7.86s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 53%|█████▎ | 6609/12384 [14:01:27<12:36:29, 7.86s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 53%|█████▎ | 6610/12384 [14:01:27<12:28:47, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 53%|█████▎ | 6610/12384 [14:01:34<12:28:47, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 0: 53%|█████▎ | 6611/12384 [14:01:34<12:23:53, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 0: 53%|█████▎ | 6611/12384 [14:01:42<12:23:53, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 0: 53%|█████▎ | 6612/12384 [14:01:42<12:20:48, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 0: 53%|█████▎ | 6612/12384 [14:01:49<12:20:48, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 53%|█████▎ | 6613/12384 [14:01:49<12:18:39, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 53%|█████▎ | 6613/12384 [14:01:57<12:18:39, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.89s]
Epoch 0: 53%|█████▎ | 6614/12384 [14:01:57<12:16:27, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.89s]
Epoch 0: 53%|█████▎ | 6614/12384 [14:02:05<12:16:27, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 0: 53%|█████▎ | 6615/12384 [14:02:05<12:14:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 0: 53%|█████▎ | 6615/12384 [14:02:13<12:14:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 0: 53%|█████▎ | 6616/12384 [14:02:13<12:22:25, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 0: 53%|█████▎ | 6616/12384 [14:02:20<12:22:25, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 53%|█████▎ | 6617/12384 [14:02:20<12:18:44, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 53%|█████▎ | 6617/12384 [14:02:28<12:18:44, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 53%|█████▎ | 6618/12384 [14:02:28<12:16:47, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 53%|█████▎ | 6618/12384 [14:02:35<12:16:47, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 0: 53%|█████▎ | 6619/12384 [14:02:35<12:15:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 0: 53%|█████▎ | 6619/12384 [14:02:43<12:15:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 0: 53%|█████▎ | 6620/12384 [14:02:43<12:13:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 0: 53%|█████▎ | 6620/12384 [14:02:51<12:13:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 53%|█████▎ | 6621/12384 [14:02:51<12:13:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 53%|█████▎ | 6621/12384 [14:02:58<12:13:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 53%|█████▎ | 6622/12384 [14:02:58<12:11:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 53%|█████▎ | 6622/12384 [14:03:06<12:11:33, 7.62s/it, loss=0.0008, acc=0.9973, iter_time=8.51s]
Epoch 0: 53%|█████▎ | 6623/12384 [14:03:06<12:11:18, 7.62s/it, loss=0.0008, acc=0.9973, iter_time=8.51s]
Epoch 0: 53%|█████▎ | 6623/12384 [14:03:13<12:11:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 53%|█████▎ | 6624/12384 [14:03:13<12:11:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 53%|█████▎ | 6624/12384 [14:03:21<12:11:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 53%|█████▎ | 6625/12384 [14:03:21<12:10:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 53%|█████▎ | 6625/12384 [14:03:29<12:10:43, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=7.62s]
Epoch 0: 54%|█████▎ | 6626/12384 [14:03:29<12:10:30, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=7.62s]
Epoch 0: 54%|█████▎ | 6626/12384 [14:03:36<12:10:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 54%|█████▎ | 6627/12384 [14:03:36<12:10:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 54%|█████▎ | 6627/12384 [14:03:44<12:10:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 0: 54%|█████▎ | 6628/12384 [14:03:44<12:10:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 0: 54%|█████▎ | 6628/12384 [14:03:51<12:10:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 0: 54%|█████▎ | 6629/12384 [14:03:51<12:11:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 0: 54%|█████▎ | 6629/12384 [14:03:59<12:11:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 54%|█████▎ | 6630/12384 [14:03:59<12:11:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 54%|█████▎ | 6630/12384 [14:04:07<12:11:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 54%|█████▎ | 6631/12384 [14:04:07<12:10:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 54%|█████▎ | 6631/12384 [14:04:14<12:10:21, 7.62s/it, loss=0.0002, acc=0.9993, iter_time=7.99s]
Epoch 0: 54%|█████▎ | 6632/12384 [14:04:14<12:10:23, 7.62s/it, loss=0.0002, acc=0.9993, iter_time=7.99s]
Epoch 0: 54%|█████▎ | 6632/12384 [14:04:22<12:10:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 54%|█████▎ | 6633/12384 [14:04:22<12:20:28, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 54%|█████▎ | 6633/12384 [14:04:30<12:20:28, 7.73s/it, loss=0.0005, acc=0.9985, iter_time=7.59s]
Epoch 0: 54%|█████▎ | 6634/12384 [14:04:30<12:17:20, 7.69s/it, loss=0.0005, acc=0.9985, iter_time=7.59s]
Epoch 0: 54%|█████▎ | 6634/12384 [14:04:38<12:17:20, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 0: 54%|█████▎ | 6635/12384 [14:04:38<12:14:33, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 0: 54%|█████▎ | 6635/12384 [14:04:45<12:14:33, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 54%|█████▎ | 6636/12384 [14:04:45<12:12:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 54%|█████▎ | 6636/12384 [14:04:53<12:12:35, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=5.61s]
Epoch 0: 54%|█████▎ | 6637/12384 [14:04:53<12:11:34, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=5.61s]
Epoch 0: 54%|█████▎ | 6637/12384 [14:05:00<12:11:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.60s]
Epoch 0: 54%|█████▎ | 6638/12384 [14:05:00<12:10:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.60s]
Epoch 0: 54%|█████▎ | 6638/12384 [14:05:08<12:10:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 0: 54%|█████▎ | 6639/12384 [14:05:08<12:09:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 0: 54%|█████▎ | 6639/12384 [14:05:16<12:09:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 0: 54%|█████▎ | 6640/12384 [14:05:16<12:10:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 0: 54%|█████▎ | 6640/12384 [14:05:23<12:10:30, 7.63s/it, loss=0.0011, acc=0.9973, iter_time=7.25s]
Epoch 0: 54%|█████▎ | 6641/12384 [14:05:23<12:09:56, 7.63s/it, loss=0.0011, acc=0.9973, iter_time=7.25s]
Epoch 0: 54%|█████▎ | 6641/12384 [14:05:31<12:09:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 54%|█████▎ | 6642/12384 [14:05:31<12:17:04, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 54%|█████▎ | 6642/12384 [14:05:39<12:17:04, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=4.73s]
Epoch 0: 54%|█████▎ | 6643/12384 [14:05:39<12:14:55, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=4.73s]
Epoch 0: 54%|█████▎ | 6643/12384 [14:05:46<12:14:55, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.52s]
Epoch 0: 54%|█████▎ | 6644/12384 [14:05:46<12:12:51, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.52s]
Epoch 0: 54%|█████▎ | 6644/12384 [14:05:54<12:12:51, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 54%|█████▎ | 6645/12384 [14:05:54<12:10:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 54%|█████▎ | 6645/12384 [14:06:02<12:10:53, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 54%|█████▎ | 6646/12384 [14:06:02<12:09:17, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 54%|█████▎ | 6646/12384 [14:06:09<12:09:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 54%|█████▎ | 6647/12384 [14:06:09<12:08:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 54%|█████▎ | 6647/12384 [14:06:17<12:08:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 54%|█████▎ | 6648/12384 [14:06:17<12:08:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 54%|█████▎ | 6648/12384 [14:06:24<12:08:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 54%|█████▎ | 6649/12384 [14:06:24<12:08:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 54%|█████▎ | 6649/12384 [14:06:32<12:08:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 0: 54%|█████▎ | 6650/12384 [14:06:32<12:10:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 0: 54%|█████▎ | 6650/12384 [14:06:40<12:10:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.14s]
Epoch 0: 54%|█████▎ | 6651/12384 [14:06:40<12:09:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.14s]
Epoch 0: 54%|█████▎ | 6651/12384 [14:06:47<12:09:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.49s]
Epoch 0: 54%|█████▎ | 6652/12384 [14:06:47<12:08:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.49s]
Epoch 0: 54%|█████▎ | 6652/12384 [14:06:55<12:08:30, 7.63s/it, loss=0.0002, acc=0.9983, iter_time=8.48s]
Epoch 0: 54%|█████▎ | 6653/12384 [14:06:55<12:08:13, 7.62s/it, loss=0.0002, acc=0.9983, iter_time=8.48s]
Epoch 0: 54%|█████▎ | 6653/12384 [14:07:03<12:08:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 54%|█████▎ | 6654/12384 [14:07:03<12:06:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 54%|█████▎ | 6654/12384 [14:07:10<12:06:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 0: 54%|█████▎ | 6655/12384 [14:07:10<12:06:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 0: 54%|█████▎ | 6655/12384 [14:07:18<12:06:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.10s]
Epoch 0: 54%|█████▎ | 6656/12384 [14:07:18<12:06:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.10s]
Epoch 0: 54%|█████▎ | 6656/12384 [14:07:25<12:06:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.28s]
Epoch 0: 54%|█████▍ | 6657/12384 [14:07:25<12:06:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.28s]
Epoch 0: 54%|█████▍ | 6657/12384 [14:07:33<12:06:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 0: 54%|█████▍ | 6658/12384 [14:07:33<12:05:43, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 0: 54%|█████▍ | 6658/12384 [14:07:41<12:05:43, 7.60s/it, loss=0.0011, acc=0.9969, iter_time=8.89s]
Epoch 0: 54%|█████▍ | 6659/12384 [14:07:41<12:14:51, 7.70s/it, loss=0.0011, acc=0.9969, iter_time=8.89s]
Epoch 0: 54%|█████▍ | 6659/12384 [14:07:48<12:14:51, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 0: 54%|█████▍ | 6660/12384 [14:07:48<12:11:52, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 0: 54%|█████▍ | 6660/12384 [14:07:56<12:11:52, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 54%|█████▍ | 6661/12384 [14:07:56<12:09:25, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 54%|█████▍ | 6661/12384 [14:08:04<12:09:25, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 54%|█████▍ | 6662/12384 [14:08:04<12:08:20, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 54%|█████▍ | 6662/12384 [14:08:11<12:08:20, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 54%|█████▍ | 6663/12384 [14:08:11<12:07:04, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 54%|█████▍ | 6663/12384 [14:08:19<12:07:04, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.54s]
Epoch 0: 54%|█████▍ | 6664/12384 [14:08:19<12:06:19, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.54s]
Epoch 0: 54%|█████▍ | 6664/12384 [14:08:26<12:06:19, 7.62s/it, loss=0.0010, acc=0.9978, iter_time=7.65s]
Epoch 0: 54%|█████▍ | 6665/12384 [14:08:26<12:05:42, 7.61s/it, loss=0.0010, acc=0.9978, iter_time=7.65s]
Epoch 0: 54%|█████▍ | 6665/12384 [14:08:34<12:05:42, 7.61s/it, loss=0.0002, acc=0.9983, iter_time=7.62s]
Epoch 0: 54%|█████▍ | 6666/12384 [14:08:34<12:05:43, 7.62s/it, loss=0.0002, acc=0.9983, iter_time=7.62s]
Epoch 0: 54%|█████▍ | 6666/12384 [14:08:42<12:05:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 0: 54%|█████▍ | 6667/12384 [14:08:42<12:05:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 0: 54%|█████▍ | 6667/12384 [14:08:50<12:05:50, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=10.81s]
Epoch 0: 54%|█████▍ | 6668/12384 [14:08:50<12:14:32, 7.71s/it, loss=0.0002, acc=0.9998, iter_time=10.81s]
Epoch 0: 54%|█████▍ | 6668/12384 [14:08:57<12:14:32, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 54%|█████▍ | 6669/12384 [14:08:57<12:11:03, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 54%|█████▍ | 6669/12384 [14:09:05<12:11:03, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 54%|█████▍ | 6670/12384 [14:09:05<12:09:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 54%|█████▍ | 6670/12384 [14:09:12<12:09:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 0: 54%|█████▍ | 6671/12384 [14:09:12<12:07:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 0: 54%|█████▍ | 6671/12384 [14:09:20<12:07:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 0: 54%|█████▍ | 6672/12384 [14:09:20<12:07:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 0: 54%|█████▍ | 6672/12384 [14:09:28<12:07:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.47s]
Epoch 0: 54%|█████▍ | 6673/12384 [14:09:28<12:06:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.47s]
Epoch 0: 54%|█████▍ | 6673/12384 [14:09:35<12:06:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 0: 54%|█████▍ | 6674/12384 [14:09:35<12:05:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 0: 54%|█████▍ | 6674/12384 [14:09:43<12:05:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 54%|█████▍ | 6675/12384 [14:09:43<12:05:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 54%|█████▍ | 6675/12384 [14:09:51<12:05:04, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=4.09s]
Epoch 0: 54%|█████▍ | 6676/12384 [14:09:51<12:04:00, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=4.09s]
Epoch 0: 54%|█████▍ | 6676/12384 [14:09:58<12:04:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.42s]
Epoch 0: 54%|█████▍ | 6677/12384 [14:09:58<12:04:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.42s]
Epoch 0: 54%|█████▍ | 6677/12384 [14:10:06<12:04:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 0: 54%|█████▍ | 6678/12384 [14:10:06<12:04:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 0: 54%|█████▍ | 6678/12384 [14:10:13<12:04:24, 7.62s/it, loss=0.0002, acc=0.9999, iter_time=10.15s]
Epoch 0: 54%|█████▍ | 6679/12384 [14:10:13<12:04:17, 7.62s/it, loss=0.0002, acc=0.9999, iter_time=10.15s]
Epoch 0: 54%|█████▍ | 6679/12384 [14:10:21<12:04:17, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.01s]
Epoch 0: 54%|█████▍ | 6680/12384 [14:10:21<12:04:25, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.01s]
Epoch 0: 54%|█████▍ | 6680/12384 [14:10:29<12:04:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.94s]
Epoch 0: 54%|█████▍ | 6681/12384 [14:10:29<12:03:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.94s]
Epoch 0: 54%|█████▍ | 6681/12384 [14:10:36<12:03:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 0: 54%|█████▍ | 6682/12384 [14:10:36<12:05:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 0: 54%|█████▍ | 6682/12384 [14:10:44<12:05:16, 7.63s/it, loss=0.0028, acc=0.9951, iter_time=6.08s]
Epoch 0: 54%|█████▍ | 6683/12384 [14:10:44<12:06:21, 7.64s/it, loss=0.0028, acc=0.9951, iter_time=6.08s]
Epoch 0: 54%|█████▍ | 6683/12384 [14:10:52<12:06:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.19s]
Epoch 0: 54%|█████▍ | 6684/12384 [14:10:52<12:05:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.19s]
Epoch 0: 54%|█████▍ | 6684/12384 [14:11:00<12:05:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 54%|█████▍ | 6685/12384 [14:11:00<12:14:23, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 54%|█████▍ | 6685/12384 [14:11:07<12:14:23, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 0: 54%|█████▍ | 6686/12384 [14:11:07<12:10:44, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 0: 54%|█████▍ | 6686/12384 [14:11:15<12:10:44, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 0: 54%|█████▍ | 6687/12384 [14:11:15<12:08:41, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 0: 54%|█████▍ | 6687/12384 [14:11:22<12:08:41, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 54%|█████▍ | 6688/12384 [14:11:22<12:06:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 54%|█████▍ | 6688/12384 [14:11:30<12:06:20, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 0: 54%|█████▍ | 6689/12384 [14:11:30<12:04:54, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 0: 54%|█████▍ | 6689/12384 [14:11:38<12:04:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 54%|█████▍ | 6690/12384 [14:11:38<12:03:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 54%|█████▍ | 6690/12384 [14:11:45<12:03:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 0: 54%|█████▍ | 6691/12384 [14:11:45<12:03:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 0: 54%|█████▍ | 6691/12384 [14:11:53<12:03:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.97s]
Epoch 0: 54%|█████▍ | 6692/12384 [14:11:53<12:02:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.97s]
Epoch 0: 54%|█████▍ | 6692/12384 [14:12:00<12:02:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 0: 54%|█████▍ | 6693/12384 [14:12:00<12:02:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 0: 54%|█████▍ | 6693/12384 [14:12:08<12:02:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.46s]
Epoch 0: 54%|█████▍ | 6694/12384 [14:12:08<12:03:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.46s]
Epoch 0: 54%|█████▍ | 6694/12384 [14:12:16<12:03:01, 7.62s/it, loss=0.0001, acc=0.9995, iter_time=8.83s]
Epoch 0: 54%|█████▍ | 6695/12384 [14:12:16<12:04:15, 7.64s/it, loss=0.0001, acc=0.9995, iter_time=8.83s]
Epoch 0: 54%|█████▍ | 6695/12384 [14:12:23<12:04:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 0: 54%|█████▍ | 6696/12384 [14:12:23<12:03:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 0: 54%|█████▍ | 6696/12384 [14:12:31<12:03:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 0: 54%|█████▍ | 6697/12384 [14:12:31<12:03:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 0: 54%|█████▍ | 6697/12384 [14:12:39<12:03:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 0: 54%|█████▍ | 6698/12384 [14:12:39<12:04:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 0: 54%|█████▍ | 6698/12384 [14:12:46<12:04:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 0: 54%|█████▍ | 6699/12384 [14:12:46<12:03:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 0: 54%|█████▍ | 6699/12384 [14:12:54<12:03:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 54%|█████▍ | 6700/12384 [14:12:54<12:02:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 54%|█████▍ | 6700/12384 [14:13:01<12:02:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 54%|█████▍ | 6701/12384 [14:13:01<12:02:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 54%|█████▍ | 6701/12384 [14:13:09<12:02:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 54%|█████▍ | 6702/12384 [14:13:09<12:02:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 54%|█████▍ | 6702/12384 [14:13:17<12:02:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 54%|█████▍ | 6703/12384 [14:13:17<12:01:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 54%|█████▍ | 6703/12384 [14:13:24<12:01:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 54%|█████▍ | 6704/12384 [14:13:24<12:01:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 54%|█████▍ | 6704/12384 [14:13:32<12:01:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.71s]
Epoch 0: 54%|█████▍ | 6705/12384 [14:13:32<12:00:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.71s]
Epoch 0: 54%|█████▍ | 6705/12384 [14:13:40<12:00:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.12s]
Epoch 0: 54%|█████▍ | 6706/12384 [14:13:40<12:00:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.12s]
Epoch 0: 54%|█████▍ | 6706/12384 [14:13:47<12:00:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 54%|█████▍ | 6707/12384 [14:13:47<12:00:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 54%|█████▍ | 6707/12384 [14:13:55<12:00:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.63s]
Epoch 0: 54%|█████▍ | 6708/12384 [14:13:55<12:00:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.63s]
Epoch 0: 54%|█████▍ | 6708/12384 [14:14:02<12:00:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.63s]
Epoch 0: 54%|█████▍ | 6709/12384 [14:14:02<12:00:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.63s]
Epoch 0: 54%|█████▍ | 6709/12384 [14:14:10<12:00:15, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 54%|█████▍ | 6710/12384 [14:14:10<11:59:44, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 54%|█████▍ | 6710/12384 [14:14:18<11:59:44, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.80s]
Epoch 0: 54%|█████▍ | 6711/12384 [14:14:18<11:59:44, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.80s]
Epoch 0: 54%|█████▍ | 6711/12384 [14:14:26<11:59:44, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=9.87s]
Epoch 0: 54%|█████▍ | 6712/12384 [14:14:26<12:09:37, 7.72s/it, loss=0.0002, acc=1.0000, iter_time=9.87s]
Epoch 0: 54%|█████▍ | 6712/12384 [14:14:33<12:09:37, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 0: 54%|█████▍ | 6713/12384 [14:14:33<12:06:37, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 0: 54%|█████▍ | 6713/12384 [14:14:41<12:06:37, 7.69s/it, loss=0.0012, acc=0.9974, iter_time=7.63s]
Epoch 0: 54%|█████▍ | 6714/12384 [14:14:41<12:04:16, 7.66s/it, loss=0.0012, acc=0.9974, iter_time=7.63s]
Epoch 0: 54%|█████▍ | 6714/12384 [14:14:48<12:04:16, 7.66s/it, loss=0.0002, acc=0.9998, iter_time=5.34s]
Epoch 0: 54%|█████▍ | 6715/12384 [14:14:48<12:01:48, 7.64s/it, loss=0.0002, acc=0.9998, iter_time=5.34s]
Epoch 0: 54%|█████▍ | 6715/12384 [14:14:56<12:01:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.83s]
Epoch 0: 54%|█████▍ | 6716/12384 [14:14:56<12:00:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.83s]
Epoch 0: 54%|█████▍ | 6716/12384 [14:15:04<12:00:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 54%|█████▍ | 6717/12384 [14:15:04<12:01:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 54%|█████▍ | 6717/12384 [14:15:11<12:01:34, 7.64s/it, loss=0.0000, acc=0.9999, iter_time=7.67s]
Epoch 0: 54%|█████▍ | 6718/12384 [14:15:11<12:00:44, 7.63s/it, loss=0.0000, acc=0.9999, iter_time=7.67s]
Epoch 0: 54%|█████▍ | 6718/12384 [14:15:19<12:00:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 0: 54%|█████▍ | 6719/12384 [14:15:19<12:00:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 0: 54%|█████▍ | 6719/12384 [14:15:26<12:00:14, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 0: 54%|█████▍ | 6720/12384 [14:15:26<11:59:57, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 0: 54%|█████▍ | 6720/12384 [14:15:34<11:59:57, 7.63s/it, loss=0.0002, acc=0.9999, iter_time=7.83s]
Epoch 0: 54%|█████▍ | 6721/12384 [14:15:34<12:07:07, 7.70s/it, loss=0.0002, acc=0.9999, iter_time=7.83s]
Epoch 0: 54%|█████▍ | 6721/12384 [14:15:42<12:07:07, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 0: 54%|█████▍ | 6722/12384 [14:15:42<12:04:40, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 0: 54%|█████▍ | 6722/12384 [14:15:50<12:04:40, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 0: 54%|█████▍ | 6723/12384 [14:15:50<12:03:16, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 0: 54%|█████▍ | 6723/12384 [14:15:57<12:03:16, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=6.41s]
Epoch 0: 54%|█████▍ | 6724/12384 [14:15:57<12:01:42, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=6.41s]
Epoch 0: 54%|█████▍ | 6724/12384 [14:16:05<12:01:42, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.47s]
Epoch 0: 54%|█████▍ | 6725/12384 [14:16:05<12:00:46, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.47s]
Epoch 0: 54%|█████▍ | 6725/12384 [14:16:12<12:00:46, 7.64s/it, loss=0.0004, acc=0.9991, iter_time=7.32s]
Epoch 0: 54%|█████▍ | 6726/12384 [14:16:12<12:00:03, 7.64s/it, loss=0.0004, acc=0.9991, iter_time=7.32s]
Epoch 0: 54%|█████▍ | 6726/12384 [14:16:20<12:00:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 0: 54%|█████▍ | 6727/12384 [14:16:20<11:59:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 0: 54%|█████▍ | 6727/12384 [14:16:28<11:59:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 0: 54%|█████▍ | 6728/12384 [14:16:28<12:01:46, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 0: 54%|█████▍ | 6728/12384 [14:16:35<12:01:46, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.90s]
Epoch 0: 54%|█████▍ | 6729/12384 [14:16:35<12:00:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.90s]
Epoch 0: 54%|█████▍ | 6729/12384 [14:16:43<12:00:42, 7.65s/it, loss=0.0011, acc=1.0000, iter_time=7.63s]
Epoch 0: 54%|█████▍ | 6730/12384 [14:16:43<11:58:38, 7.63s/it, loss=0.0011, acc=1.0000, iter_time=7.63s]
Epoch 0: 54%|█████▍ | 6730/12384 [14:16:51<11:58:38, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.90s]
Epoch 0: 54%|█████▍ | 6731/12384 [14:16:51<11:58:17, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.90s]
Epoch 0: 54%|█████▍ | 6731/12384 [14:16:58<11:58:17, 7.62s/it, loss=0.0007, acc=0.9986, iter_time=4.02s]
Epoch 0: 54%|█████▍ | 6732/12384 [14:16:58<11:58:02, 7.62s/it, loss=0.0007, acc=0.9986, iter_time=4.02s]
Epoch 0: 54%|█████▍ | 6732/12384 [14:17:06<11:58:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.19s]
Epoch 0: 54%|█████▍ | 6733/12384 [14:17:06<11:56:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.19s]
Epoch 0: 54%|█████▍ | 6733/12384 [14:17:13<11:56:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 54%|█████▍ | 6734/12384 [14:17:13<11:57:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 54%|█████▍ | 6734/12384 [14:17:21<11:57:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 54%|█████▍ | 6735/12384 [14:17:21<11:56:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 54%|█████▍ | 6735/12384 [14:17:29<11:56:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 54%|█████▍ | 6736/12384 [14:17:29<11:57:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 54%|█████▍ | 6736/12384 [14:17:36<11:57:00, 7.62s/it, loss=0.0178, acc=0.9747, iter_time=7.24s]
Epoch 0: 54%|█████▍ | 6737/12384 [14:17:36<11:56:46, 7.62s/it, loss=0.0178, acc=0.9747, iter_time=7.24s]
Epoch 0: 54%|█████▍ | 6737/12384 [14:17:44<11:56:46, 7.62s/it, loss=0.0001, acc=0.9993, iter_time=7.69s]
Epoch 0: 54%|█████▍ | 6738/12384 [14:17:44<12:05:57, 7.71s/it, loss=0.0001, acc=0.9993, iter_time=7.69s]
Epoch 0: 54%|█████▍ | 6738/12384 [14:17:52<12:05:57, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 0: 54%|█████▍ | 6739/12384 [14:17:52<12:02:04, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 0: 54%|█████▍ | 6739/12384 [14:17:59<12:02:04, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 0: 54%|█████▍ | 6740/12384 [14:17:59<12:00:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 0: 54%|█████▍ | 6740/12384 [14:18:07<12:00:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 54%|█████▍ | 6741/12384 [14:18:07<11:58:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 54%|█████▍ | 6741/12384 [14:18:15<11:58:32, 7.64s/it, loss=0.0004, acc=1.0000, iter_time=7.59s]
Epoch 0: 54%|█████▍ | 6742/12384 [14:18:15<11:56:54, 7.62s/it, loss=0.0004, acc=1.0000, iter_time=7.59s]
Epoch 0: 54%|█████▍ | 6742/12384 [14:18:22<11:56:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 0: 54%|█████▍ | 6743/12384 [14:18:22<11:56:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 0: 54%|█████▍ | 6743/12384 [14:18:30<11:56:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.09s]
Epoch 0: 54%|█████▍ | 6744/12384 [14:18:30<11:55:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.09s]
Epoch 0: 54%|█████▍ | 6744/12384 [14:18:37<11:55:40, 7.61s/it, loss=0.0005, acc=0.9989, iter_time=7.21s]
Epoch 0: 54%|█████▍ | 6745/12384 [14:18:37<11:55:11, 7.61s/it, loss=0.0005, acc=0.9989, iter_time=7.21s]
Epoch 0: 54%|█████▍ | 6745/12384 [14:18:45<11:55:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 0: 54%|█████▍ | 6746/12384 [14:18:45<11:55:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 0: 54%|█████▍ | 6746/12384 [14:18:53<11:55:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.20s]
Epoch 0: 54%|█████▍ | 6747/12384 [14:18:53<12:03:05, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=11.20s]
Epoch 0: 54%|█████▍ | 6747/12384 [14:19:01<12:03:05, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 54%|█████▍ | 6748/12384 [14:19:01<12:00:10, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 54%|█████▍ | 6748/12384 [14:19:08<12:00:10, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 0: 54%|█████▍ | 6749/12384 [14:19:08<11:59:06, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 0: 54%|█████▍ | 6749/12384 [14:19:16<11:59:06, 7.66s/it, loss=0.0003, acc=1.0000, iter_time=10.34s]
Epoch 0: 55%|█████▍ | 6750/12384 [14:19:16<11:57:59, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=10.34s]
Epoch 0: 55%|█████▍ | 6750/12384 [14:19:23<11:57:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.67s]
Epoch 0: 55%|█████▍ | 6751/12384 [14:19:23<11:56:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.67s]
Epoch 0: 55%|█████▍ | 6751/12384 [14:19:31<11:56:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.54s]
Epoch 0: 55%|█████▍ | 6752/12384 [14:19:31<11:55:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.54s]
Epoch 0: 55%|█████▍ | 6752/12384 [14:19:39<11:55:39, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.20s]
Epoch 0: 55%|█████▍ | 6753/12384 [14:19:39<11:54:33, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.20s]
Epoch 0: 55%|█████▍ | 6753/12384 [14:19:46<11:54:33, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 55%|█████▍ | 6754/12384 [14:19:46<11:54:17, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 55%|█████▍ | 6754/12384 [14:19:54<11:54:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 55%|█████▍ | 6755/12384 [14:19:54<11:54:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 55%|█████▍ | 6755/12384 [14:20:01<11:54:05, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 0: 55%|█████▍ | 6756/12384 [14:20:01<11:55:08, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 0: 55%|█████▍ | 6756/12384 [14:20:09<11:55:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 55%|█████▍ | 6757/12384 [14:20:09<11:54:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 55%|█████▍ | 6757/12384 [14:20:17<11:54:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.00s]
Epoch 0: 55%|█████▍ | 6758/12384 [14:20:17<11:54:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.00s]
Epoch 0: 55%|█████▍ | 6758/12384 [14:20:24<11:54:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 0: 55%|█████▍ | 6759/12384 [14:20:24<11:54:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 0: 55%|█████▍ | 6759/12384 [14:20:32<11:54:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.07s]
Epoch 0: 55%|█████▍ | 6760/12384 [14:20:32<11:53:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.07s]
Epoch 0: 55%|█████▍ | 6760/12384 [14:20:40<11:53:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 55%|█████▍ | 6761/12384 [14:20:40<11:52:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 55%|█████▍ | 6761/12384 [14:20:47<11:52:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 55%|█████▍ | 6762/12384 [14:20:47<11:52:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 55%|█████▍ | 6762/12384 [14:20:55<11:52:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 55%|█████▍ | 6763/12384 [14:20:55<11:52:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 55%|█████▍ | 6763/12384 [14:21:02<11:52:31, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 55%|█████▍ | 6764/12384 [14:21:02<11:54:19, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 55%|█████▍ | 6764/12384 [14:21:10<11:54:19, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.69s]
Epoch 0: 55%|█████▍ | 6765/12384 [14:21:10<12:02:55, 7.72s/it, loss=0.0002, acc=1.0000, iter_time=7.69s]
Epoch 0: 55%|█████▍ | 6765/12384 [14:21:18<12:02:55, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 55%|█████▍ | 6766/12384 [14:21:18<12:00:15, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 55%|█████▍ | 6766/12384 [14:21:26<12:00:15, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 55%|█████▍ | 6767/12384 [14:21:26<11:59:28, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 55%|█████▍ | 6767/12384 [14:21:33<11:59:28, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 0: 55%|█████▍ | 6768/12384 [14:21:33<11:57:35, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 0: 55%|█████▍ | 6768/12384 [14:21:41<11:57:35, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 55%|█████▍ | 6769/12384 [14:21:41<11:55:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 55%|█████▍ | 6769/12384 [14:21:48<11:55:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 0: 55%|█████▍ | 6770/12384 [14:21:48<11:54:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 0: 55%|█████▍ | 6770/12384 [14:21:56<11:54:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.14s]
Epoch 0: 55%|█████▍ | 6771/12384 [14:21:56<11:53:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.14s]
Epoch 0: 55%|█████▍ | 6771/12384 [14:22:04<11:53:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.29s]
Epoch 0: 55%|█████▍ | 6772/12384 [14:22:04<11:52:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.29s]
Epoch 0: 55%|█████▍ | 6772/12384 [14:22:11<11:52:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.06s]
Epoch 0: 55%|█████▍ | 6773/12384 [14:22:11<11:52:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.06s]
Epoch 0: 55%|█████▍ | 6773/12384 [14:22:19<11:52:23, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.48s]
Epoch 0: 55%|█████▍ | 6774/12384 [14:22:19<11:51:44, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.48s]
Epoch 0: 55%|█████▍ | 6774/12384 [14:22:27<11:51:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 55%|█████▍ | 6775/12384 [14:22:27<11:51:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 55%|█████▍ | 6775/12384 [14:22:34<11:51:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 55%|█████▍ | 6776/12384 [14:22:34<11:51:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 55%|█████▍ | 6776/12384 [14:22:42<11:51:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 0: 55%|█████▍ | 6777/12384 [14:22:42<11:51:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 0: 55%|█████▍ | 6777/12384 [14:22:49<11:51:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.79s]
Epoch 0: 55%|█████▍ | 6778/12384 [14:22:49<11:51:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.79s]
Epoch 0: 55%|█████▍ | 6778/12384 [14:22:57<11:51:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.41s]
Epoch 0: 55%|█████▍ | 6779/12384 [14:22:57<11:52:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.41s]
Epoch 0: 55%|█████▍ | 6779/12384 [14:23:05<11:52:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 55%|█████▍ | 6780/12384 [14:23:05<11:51:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 55%|█████▍ | 6780/12384 [14:23:12<11:51:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 0: 55%|█████▍ | 6781/12384 [14:23:12<11:52:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 0: 55%|█████▍ | 6781/12384 [14:23:20<11:52:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.50s]
Epoch 0: 55%|█████▍ | 6782/12384 [14:23:20<11:52:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.50s]
Epoch 0: 55%|█████▍ | 6782/12384 [14:23:28<11:52:47, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.74s]
Epoch 0: 55%|█████▍ | 6783/12384 [14:23:28<11:52:03, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.74s]
Epoch 0: 55%|█████▍ | 6783/12384 [14:23:35<11:52:03, 7.63s/it, loss=0.0002, acc=0.9994, iter_time=8.50s]
Epoch 0: 55%|█████▍ | 6784/12384 [14:23:35<11:51:40, 7.63s/it, loss=0.0002, acc=0.9994, iter_time=8.50s]
Epoch 0: 55%|█████▍ | 6784/12384 [14:23:43<11:51:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 0: 55%|█████▍ | 6785/12384 [14:23:43<11:53:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 0: 55%|█████▍ | 6785/12384 [14:23:50<11:53:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 0: 55%|█████▍ | 6786/12384 [14:23:50<11:52:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 0: 55%|█████▍ | 6786/12384 [14:23:58<11:52:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 55%|█████▍ | 6787/12384 [14:23:58<11:51:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 55%|█████▍ | 6787/12384 [14:24:06<11:51:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 55%|█████▍ | 6788/12384 [14:24:06<11:51:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 55%|█████▍ | 6788/12384 [14:24:13<11:51:59, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.64s]
Epoch 0: 55%|█████▍ | 6789/12384 [14:24:13<11:51:33, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.64s]
Epoch 0: 55%|█████▍ | 6789/12384 [14:24:21<11:51:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 55%|█████▍ | 6790/12384 [14:24:21<11:51:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 55%|█████▍ | 6790/12384 [14:24:29<11:51:10, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.67s]
Epoch 0: 55%|█████▍ | 6791/12384 [14:24:29<11:59:51, 7.72s/it, loss=0.0003, acc=1.0000, iter_time=7.67s]
Epoch 0: 55%|█████▍ | 6791/12384 [14:24:37<11:59:51, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 0: 55%|█████▍ | 6792/12384 [14:24:37<11:56:11, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 0: 55%|█████▍ | 6792/12384 [14:24:44<11:56:11, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=3.84s]
Epoch 0: 55%|█████▍ | 6793/12384 [14:24:44<11:54:30, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=3.84s]
Epoch 0: 55%|█████▍ | 6793/12384 [14:24:52<11:54:30, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=10.40s]
Epoch 0: 55%|█████▍ | 6794/12384 [14:24:52<11:53:20, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=10.40s]
Epoch 0: 55%|█████▍ | 6794/12384 [14:24:59<11:53:20, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 0: 55%|█████▍ | 6795/12384 [14:24:59<11:52:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 0: 55%|█████▍ | 6795/12384 [14:25:07<11:52:12, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=6.12s]
Epoch 0: 55%|█████▍ | 6796/12384 [14:25:07<11:51:26, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.12s]
Epoch 0: 55%|█████▍ | 6796/12384 [14:25:15<11:51:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 0: 55%|█████▍ | 6797/12384 [14:25:15<11:50:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 0: 55%|█████▍ | 6797/12384 [14:25:22<11:50:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 55%|█████▍ | 6798/12384 [14:25:22<11:50:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 55%|█████▍ | 6798/12384 [14:25:30<11:50:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 0: 55%|█████▍ | 6799/12384 [14:25:30<11:50:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 0: 55%|█████▍ | 6799/12384 [14:25:37<11:50:09, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=10.32s]
Epoch 0: 55%|█████▍ | 6800/12384 [14:25:37<11:49:52, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=10.32s]
Epoch 0: 55%|█████▍ | 6800/12384 [14:25:45<11:49:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.00s]
Epoch 0: 55%|█████▍ | 6801/12384 [14:25:45<11:49:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.00s]
Epoch 0: 55%|█████▍ | 6801/12384 [14:25:53<11:49:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 0: 55%|█████▍ | 6802/12384 [14:25:53<11:48:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 0: 55%|█████▍ | 6802/12384 [14:26:00<11:48:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 55%|█████▍ | 6803/12384 [14:26:00<11:47:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 55%|█████▍ | 6803/12384 [14:26:08<11:47:51, 7.61s/it, loss=0.0005, acc=0.9993, iter_time=7.59s]
Epoch 0: 55%|█████▍ | 6804/12384 [14:26:08<11:47:55, 7.61s/it, loss=0.0005, acc=0.9993, iter_time=7.59s]
Epoch 0: 55%|█████▍ | 6804/12384 [14:26:16<11:47:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 55%|█████▍ | 6805/12384 [14:26:16<11:47:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 55%|█████▍ | 6805/12384 [14:26:23<11:47:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 55%|█████▍ | 6806/12384 [14:26:23<11:47:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 55%|█████▍ | 6806/12384 [14:26:31<11:47:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 55%|█████▍ | 6807/12384 [14:26:31<11:46:45, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 55%|█████▍ | 6807/12384 [14:26:38<11:46:45, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 55%|█████▍ | 6808/12384 [14:26:38<11:47:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 55%|█████▍ | 6808/12384 [14:26:46<11:47:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 55%|█████▍ | 6809/12384 [14:26:46<11:48:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 55%|█████▍ | 6809/12384 [14:26:54<11:48:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 0: 55%|█████▍ | 6810/12384 [14:26:54<11:47:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 0: 55%|█████▍ | 6810/12384 [14:27:01<11:47:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 0: 55%|█████▍ | 6811/12384 [14:27:01<11:47:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 0: 55%|█████▍ | 6811/12384 [14:27:09<11:47:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 55%|█████▌ | 6812/12384 [14:27:09<11:46:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 55%|█████▌ | 6812/12384 [14:27:16<11:46:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 0: 55%|█████▌ | 6813/12384 [14:27:16<11:46:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 0: 55%|█████▌ | 6813/12384 [14:27:24<11:46:54, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.24s]
Epoch 0: 55%|█████▌ | 6814/12384 [14:27:24<11:46:40, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.24s]
Epoch 0: 55%|█████▌ | 6814/12384 [14:27:32<11:46:40, 7.61s/it, loss=0.0027, acc=0.9956, iter_time=7.60s]
Epoch 0: 55%|█████▌ | 6815/12384 [14:27:32<11:46:12, 7.61s/it, loss=0.0027, acc=0.9956, iter_time=7.60s]
Epoch 0: 55%|█████▌ | 6815/12384 [14:27:39<11:46:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 0: 55%|█████▌ | 6816/12384 [14:27:39<11:45:40, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 0: 55%|█████▌ | 6816/12384 [14:27:47<11:45:40, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 55%|█████▌ | 6817/12384 [14:27:47<11:57:00, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 55%|█████▌ | 6817/12384 [14:27:55<11:57:00, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 0: 55%|█████▌ | 6818/12384 [14:27:55<11:53:16, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 0: 55%|█████▌ | 6818/12384 [14:28:02<11:53:16, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 55%|█████▌ | 6819/12384 [14:28:02<11:50:57, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 55%|█████▌ | 6819/12384 [14:28:10<11:50:57, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 55%|█████▌ | 6820/12384 [14:28:10<11:49:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 55%|█████▌ | 6820/12384 [14:28:18<11:49:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.26s]
Epoch 0: 55%|█████▌ | 6821/12384 [14:28:18<11:48:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.26s]
Epoch 0: 55%|█████▌ | 6821/12384 [14:28:25<11:48:23, 7.64s/it, loss=0.0005, acc=0.9980, iter_time=10.99s]
Epoch 0: 55%|█████▌ | 6822/12384 [14:28:25<11:47:19, 7.63s/it, loss=0.0005, acc=0.9980, iter_time=10.99s]
Epoch 0: 55%|█████▌ | 6822/12384 [14:28:33<11:47:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 0: 55%|█████▌ | 6823/12384 [14:28:33<11:46:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 0: 55%|█████▌ | 6823/12384 [14:28:41<11:46:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.61s]
Epoch 0: 55%|█████▌ | 6824/12384 [14:28:41<11:46:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.61s]
Epoch 0: 55%|█████▌ | 6824/12384 [14:28:48<11:46:12, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=5.36s]
Epoch 0: 55%|█████▌ | 6825/12384 [14:28:48<11:45:34, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=5.36s]
Epoch 0: 55%|█████▌ | 6825/12384 [14:28:56<11:45:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 0: 55%|█████▌ | 6826/12384 [14:28:56<11:45:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 0: 55%|█████▌ | 6826/12384 [14:29:03<11:45:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 0: 55%|█████▌ | 6827/12384 [14:29:03<11:45:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 0: 55%|█████▌ | 6827/12384 [14:29:11<11:45:44, 7.62s/it, loss=0.0004, acc=0.9991, iter_time=9.13s]
Epoch 0: 55%|█████▌ | 6828/12384 [14:29:11<11:45:12, 7.62s/it, loss=0.0004, acc=0.9991, iter_time=9.13s]
Epoch 0: 55%|█████▌ | 6828/12384 [14:29:19<11:45:12, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 55%|█████▌ | 6829/12384 [14:29:19<11:45:40, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 55%|█████▌ | 6829/12384 [14:29:26<11:45:40, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.67s]
Epoch 0: 55%|█████▌ | 6830/12384 [14:29:26<11:48:26, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.67s]
Epoch 0: 55%|█████▌ | 6830/12384 [14:29:34<11:48:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 0: 55%|█████▌ | 6831/12384 [14:29:34<11:46:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 0: 55%|█████▌ | 6831/12384 [14:29:42<11:46:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.92s]
Epoch 0: 55%|█████▌ | 6832/12384 [14:29:42<11:45:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.92s]
Epoch 0: 55%|█████▌ | 6832/12384 [14:29:49<11:45:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.26s]
Epoch 0: 55%|█████▌ | 6833/12384 [14:29:49<11:44:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.26s]
Epoch 0: 55%|█████▌ | 6833/12384 [14:29:57<11:44:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 0: 55%|█████▌ | 6834/12384 [14:29:57<11:44:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 0: 55%|█████▌ | 6834/12384 [14:30:04<11:44:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 0: 55%|█████▌ | 6835/12384 [14:30:04<11:47:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 0: 55%|█████▌ | 6835/12384 [14:30:12<11:47:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 55%|█████▌ | 6836/12384 [14:30:12<11:45:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 55%|█████▌ | 6836/12384 [14:30:20<11:45:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 55%|█████▌ | 6837/12384 [14:30:20<11:44:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 55%|█████▌ | 6837/12384 [14:30:27<11:44:35, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.98s]
Epoch 0: 55%|█████▌ | 6838/12384 [14:30:27<11:44:10, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.98s]
Epoch 0: 55%|█████▌ | 6838/12384 [14:30:35<11:44:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 0: 55%|█████▌ | 6839/12384 [14:30:35<11:43:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 0: 55%|█████▌ | 6839/12384 [14:30:43<11:43:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 55%|█████▌ | 6840/12384 [14:30:43<11:43:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 55%|█████▌ | 6840/12384 [14:30:50<11:43:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 0: 55%|█████▌ | 6841/12384 [14:30:50<11:43:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 0: 55%|█████▌ | 6841/12384 [14:30:58<11:43:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 0: 55%|█████▌ | 6842/12384 [14:30:58<11:43:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 0: 55%|█████▌ | 6842/12384 [14:31:06<11:43:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 55%|█████▌ | 6843/12384 [14:31:06<11:51:17, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 55%|█████▌ | 6843/12384 [14:31:13<11:51:17, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 0: 55%|█████▌ | 6844/12384 [14:31:13<11:48:21, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 0: 55%|█████▌ | 6844/12384 [14:31:21<11:48:21, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.72s]
Epoch 0: 55%|█████▌ | 6845/12384 [14:31:21<11:46:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.72s]
Epoch 0: 55%|█████▌ | 6845/12384 [14:31:28<11:46:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 0: 55%|█████▌ | 6846/12384 [14:31:28<11:45:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 0: 55%|█████▌ | 6846/12384 [14:31:36<11:45:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 55%|█████▌ | 6847/12384 [14:31:36<11:45:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 55%|█████▌ | 6847/12384 [14:31:44<11:45:41, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.05s]
Epoch 0: 55%|█████▌ | 6848/12384 [14:31:44<11:44:36, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.05s]
Epoch 0: 55%|█████▌ | 6848/12384 [14:31:51<11:44:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 55%|█████▌ | 6849/12384 [14:31:51<11:43:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 55%|█████▌ | 6849/12384 [14:31:59<11:43:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 0: 55%|█████▌ | 6850/12384 [14:31:59<11:43:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 0: 55%|█████▌ | 6850/12384 [14:32:07<11:43:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 0: 55%|█████▌ | 6851/12384 [14:32:07<11:51:21, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 0: 55%|█████▌ | 6851/12384 [14:32:14<11:51:21, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 0: 55%|█████▌ | 6852/12384 [14:32:14<11:47:25, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 0: 55%|█████▌ | 6852/12384 [14:32:22<11:47:25, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 0: 55%|█████▌ | 6853/12384 [14:32:22<11:45:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 0: 55%|█████▌ | 6853/12384 [14:32:30<11:45:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 55%|█████▌ | 6854/12384 [14:32:30<11:44:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 55%|█████▌ | 6854/12384 [14:32:37<11:44:19, 7.64s/it, loss=0.0002, acc=0.9995, iter_time=7.62s]
Epoch 0: 55%|█████▌ | 6855/12384 [14:32:37<11:43:16, 7.63s/it, loss=0.0002, acc=0.9995, iter_time=7.62s]
Epoch 0: 55%|█████▌ | 6855/12384 [14:32:45<11:43:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 55%|█████▌ | 6856/12384 [14:32:45<11:44:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 55%|█████▌ | 6856/12384 [14:32:53<11:44:10, 7.64s/it, loss=0.0004, acc=0.9991, iter_time=7.66s]
Epoch 0: 55%|█████▌ | 6857/12384 [14:32:53<11:42:47, 7.63s/it, loss=0.0004, acc=0.9991, iter_time=7.66s]
Epoch 0: 55%|█████▌ | 6857/12384 [14:33:00<11:42:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 55%|█████▌ | 6858/12384 [14:33:00<11:42:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 55%|█████▌ | 6858/12384 [14:33:08<11:42:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 55%|█████▌ | 6859/12384 [14:33:08<11:42:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 55%|█████▌ | 6859/12384 [14:33:15<11:42:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 55%|█████▌ | 6860/12384 [14:33:15<11:42:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 55%|█████▌ | 6860/12384 [14:33:23<11:42:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 55%|█████▌ | 6861/12384 [14:33:23<11:42:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 55%|█████▌ | 6861/12384 [14:33:31<11:42:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 55%|█████▌ | 6862/12384 [14:33:31<11:41:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 55%|█████▌ | 6862/12384 [14:33:38<11:41:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 0: 55%|█████▌ | 6863/12384 [14:33:38<11:41:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 0: 55%|█████▌ | 6863/12384 [14:33:46<11:41:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 0: 55%|█████▌ | 6864/12384 [14:33:46<11:41:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 0: 55%|█████▌ | 6864/12384 [14:33:54<11:41:05, 7.62s/it, loss=0.0002, acc=0.9989, iter_time=7.64s]
Epoch 0: 55%|█████▌ | 6865/12384 [14:33:54<11:40:22, 7.61s/it, loss=0.0002, acc=0.9989, iter_time=7.64s]
Epoch 0: 55%|█████▌ | 6865/12384 [14:34:01<11:40:22, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.66s]
Epoch 0: 55%|█████▌ | 6866/12384 [14:34:01<11:41:17, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.66s]
Epoch 0: 55%|█████▌ | 6866/12384 [14:34:09<11:41:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 55%|█████▌ | 6867/12384 [14:34:09<11:41:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 55%|█████▌ | 6867/12384 [14:34:16<11:41:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 55%|█████▌ | 6868/12384 [14:34:16<11:40:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 55%|█████▌ | 6868/12384 [14:34:24<11:40:29, 7.62s/it, loss=0.0009, acc=0.9967, iter_time=5.32s]
Epoch 0: 55%|█████▌ | 6869/12384 [14:34:24<11:48:15, 7.71s/it, loss=0.0009, acc=0.9967, iter_time=5.32s]
Epoch 0: 55%|█████▌ | 6869/12384 [14:34:32<11:48:15, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.97s]
Epoch 0: 55%|█████▌ | 6870/12384 [14:34:32<11:45:12, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.97s]
Epoch 0: 55%|█████▌ | 6870/12384 [14:34:40<11:45:12, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 0: 55%|█████▌ | 6871/12384 [14:34:40<11:43:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 0: 55%|█████▌ | 6871/12384 [14:34:47<11:43:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.51s]
Epoch 0: 55%|█████▌ | 6872/12384 [14:34:47<11:42:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.51s]
Epoch 0: 55%|█████▌ | 6872/12384 [14:34:55<11:42:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.64s]
Epoch 0: 55%|█████▌ | 6873/12384 [14:34:55<11:40:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.64s]
Epoch 0: 55%|█████▌ | 6873/12384 [14:35:02<11:40:50, 7.63s/it, loss=0.0006, acc=0.9974, iter_time=10.19s]
Epoch 0: 56%|█████▌ | 6874/12384 [14:35:02<11:40:09, 7.62s/it, loss=0.0006, acc=0.9974, iter_time=10.19s]
Epoch 0: 56%|█████▌ | 6874/12384 [14:35:10<11:40:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 56%|█████▌ | 6875/12384 [14:35:10<11:39:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 56%|█████▌ | 6875/12384 [14:35:18<11:39:20, 7.62s/it, loss=0.0001, acc=0.9988, iter_time=7.60s]
Epoch 0: 56%|█████▌ | 6876/12384 [14:35:18<11:38:34, 7.61s/it, loss=0.0001, acc=0.9988, iter_time=7.60s]
Epoch 0: 56%|█████▌ | 6876/12384 [14:35:25<11:38:34, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 56%|█████▌ | 6877/12384 [14:35:25<11:38:19, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 56%|█████▌ | 6877/12384 [14:35:33<11:38:19, 7.61s/it, loss=0.0000, acc=0.9999, iter_time=7.91s]
Epoch 0: 56%|█████▌ | 6878/12384 [14:35:33<11:45:52, 7.69s/it, loss=0.0000, acc=0.9999, iter_time=7.91s]
Epoch 0: 56%|█████▌ | 6878/12384 [14:35:41<11:45:52, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 0: 56%|█████▌ | 6879/12384 [14:35:41<11:42:48, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 0: 56%|█████▌ | 6879/12384 [14:35:48<11:42:48, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 0: 56%|█████▌ | 6880/12384 [14:35:48<11:41:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 0: 56%|█████▌ | 6880/12384 [14:35:56<11:41:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 56%|█████▌ | 6881/12384 [14:35:56<11:39:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 56%|█████▌ | 6881/12384 [14:36:03<11:39:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 56%|█████▌ | 6882/12384 [14:36:03<11:39:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 56%|█████▌ | 6882/12384 [14:36:11<11:39:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.99s]
Epoch 0: 56%|█████▌ | 6883/12384 [14:36:11<11:39:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.99s]
Epoch 0: 56%|█████▌ | 6883/12384 [14:36:19<11:39:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.26s]
Epoch 0: 56%|█████▌ | 6884/12384 [14:36:19<11:38:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.26s]
Epoch 0: 56%|█████▌ | 6884/12384 [14:36:26<11:38:44, 7.62s/it, loss=0.0003, acc=0.9990, iter_time=7.31s]
Epoch 0: 56%|█████▌ | 6885/12384 [14:36:26<11:38:27, 7.62s/it, loss=0.0003, acc=0.9990, iter_time=7.31s]
Epoch 0: 56%|█████▌ | 6885/12384 [14:36:34<11:38:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 56%|█████▌ | 6886/12384 [14:36:34<11:38:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 56%|█████▌ | 6886/12384 [14:36:41<11:38:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.80s]
Epoch 0: 56%|█████▌ | 6887/12384 [14:36:41<11:36:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.80s]
Epoch 0: 56%|█████▌ | 6887/12384 [14:36:49<11:36:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.77s]
Epoch 0: 56%|█████▌ | 6888/12384 [14:36:49<11:37:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.77s]
Epoch 0: 56%|█████▌ | 6888/12384 [14:36:57<11:37:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.42s]
Epoch 0: 56%|█████▌ | 6889/12384 [14:36:57<11:37:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.42s]
Epoch 0: 56%|█████▌ | 6889/12384 [14:37:04<11:37:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.46s]
Epoch 0: 56%|█████▌ | 6890/12384 [14:37:04<11:37:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.46s]
Epoch 0: 56%|█████▌ | 6890/12384 [14:37:12<11:37:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 56%|█████▌ | 6891/12384 [14:37:12<11:37:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 56%|█████▌ | 6891/12384 [14:37:20<11:37:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 56%|█████▌ | 6892/12384 [14:37:20<11:36:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 56%|█████▌ | 6892/12384 [14:37:27<11:36:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 56%|█████▌ | 6893/12384 [14:37:27<11:36:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 56%|█████▌ | 6893/12384 [14:37:35<11:36:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 56%|█████▌ | 6894/12384 [14:37:35<11:36:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 56%|█████▌ | 6894/12384 [14:37:42<11:36:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 56%|█████▌ | 6895/12384 [14:37:42<11:36:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 56%|█████▌ | 6895/12384 [14:37:50<11:36:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 0: 56%|█████▌ | 6896/12384 [14:37:50<11:44:53, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 0: 56%|█████▌ | 6896/12384 [14:37:58<11:44:53, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.47s]
Epoch 0: 56%|█████▌ | 6897/12384 [14:37:58<11:42:10, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.47s]
Epoch 0: 56%|█████▌ | 6897/12384 [14:38:06<11:42:10, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 0: 56%|█████▌ | 6898/12384 [14:38:06<11:42:29, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 0: 56%|█████▌ | 6898/12384 [14:38:13<11:42:29, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 0: 56%|█████▌ | 6899/12384 [14:38:13<11:40:45, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 0: 56%|█████▌ | 6899/12384 [14:38:21<11:40:45, 7.67s/it, loss=0.0002, acc=0.9997, iter_time=9.15s]
Epoch 0: 56%|█████▌ | 6900/12384 [14:38:21<11:39:24, 7.65s/it, loss=0.0002, acc=0.9997, iter_time=9.15s]
Epoch 0: 56%|█████▌ | 6900/12384 [14:38:28<11:39:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 56%|█████▌ | 6901/12384 [14:38:28<11:38:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 56%|█████▌ | 6901/12384 [14:38:36<11:38:21, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 56%|█████▌ | 6902/12384 [14:38:36<11:37:20, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 56%|█████▌ | 6902/12384 [14:38:44<11:37:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 0: 56%|█████▌ | 6903/12384 [14:38:44<11:38:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 0: 56%|█████▌ | 6903/12384 [14:38:51<11:38:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.57s]
Epoch 0: 56%|█████▌ | 6904/12384 [14:38:51<11:37:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.57s]
Epoch 0: 56%|█████▌ | 6904/12384 [14:38:59<11:37:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.51s]
Epoch 0: 56%|█████▌ | 6905/12384 [14:38:59<11:36:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.51s]
Epoch 0: 56%|█████▌ | 6905/12384 [14:39:07<11:36:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.35s]
Epoch 0: 56%|█████▌ | 6906/12384 [14:39:07<11:36:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.35s]
Epoch 0: 56%|█████▌ | 6906/12384 [14:39:14<11:36:15, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=6.11s]
Epoch 0: 56%|█████▌ | 6907/12384 [14:39:14<11:35:49, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=6.11s]
Epoch 0: 56%|█████▌ | 6907/12384 [14:39:22<11:35:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 0: 56%|█████▌ | 6908/12384 [14:39:22<11:35:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 0: 56%|█████▌ | 6908/12384 [14:39:29<11:35:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.33s]
Epoch 0: 56%|█████▌ | 6909/12384 [14:39:29<11:34:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.33s]
Epoch 0: 56%|█████▌ | 6909/12384 [14:39:37<11:34:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.88s]
Epoch 0: 56%|█████▌ | 6910/12384 [14:39:37<11:33:34, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.88s]
Epoch 0: 56%|█████▌ | 6910/12384 [14:39:45<11:33:34, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 56%|█████▌ | 6911/12384 [14:39:45<11:35:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 56%|█████▌ | 6911/12384 [14:39:52<11:35:49, 7.63s/it, loss=0.0001, acc=0.9997, iter_time=7.99s]
Epoch 0: 56%|█████▌ | 6912/12384 [14:39:52<11:35:18, 7.62s/it, loss=0.0001, acc=0.9997, iter_time=7.99s]
Epoch 0: 56%|█████▌ | 6912/12384 [14:40:00<11:35:18, 7.62s/it, loss=0.0013, acc=0.9972, iter_time=4.67s]
Epoch 0: 56%|█████▌ | 6913/12384 [14:40:00<11:35:16, 7.62s/it, loss=0.0013, acc=0.9972, iter_time=4.67s]
Epoch 0: 56%|█████▌ | 6913/12384 [14:40:08<11:35:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 0: 56%|█████▌ | 6914/12384 [14:40:08<11:35:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 0: 56%|█████▌ | 6914/12384 [14:40:15<11:35:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 0: 56%|█████▌ | 6915/12384 [14:40:15<11:33:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 0: 56%|█████▌ | 6915/12384 [14:40:23<11:33:51, 7.61s/it, loss=0.0008, acc=1.0000, iter_time=8.18s]
Epoch 0: 56%|█████▌ | 6916/12384 [14:40:23<11:33:12, 7.61s/it, loss=0.0008, acc=1.0000, iter_time=8.18s]
Epoch 0: 56%|█████▌ | 6916/12384 [14:40:30<11:33:12, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.20s]
Epoch 0: 56%|█████▌ | 6917/12384 [14:40:30<11:33:27, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.20s]
Epoch 0: 56%|█████▌ | 6917/12384 [14:40:38<11:33:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 56%|█████▌ | 6918/12384 [14:40:38<11:33:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 56%|█████▌ | 6918/12384 [14:40:46<11:33:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 56%|█████▌ | 6919/12384 [14:40:46<11:33:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 56%|█████▌ | 6919/12384 [14:40:53<11:33:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 0: 56%|█████▌ | 6920/12384 [14:40:53<11:33:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 0: 56%|█████▌ | 6920/12384 [14:41:01<11:33:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.29s]
Epoch 0: 56%|█████▌ | 6921/12384 [14:41:01<11:33:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.29s]
Epoch 0: 56%|█████▌ | 6921/12384 [14:41:09<11:33:16, 7.61s/it, loss=0.0042, acc=0.9876, iter_time=8.61s]
Epoch 0: 56%|█████▌ | 6922/12384 [14:41:09<11:41:26, 7.71s/it, loss=0.0042, acc=0.9876, iter_time=8.61s]
Epoch 0: 56%|█████▌ | 6922/12384 [14:41:16<11:41:26, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.87s]
Epoch 0: 56%|█████▌ | 6923/12384 [14:41:16<11:38:30, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.87s]
Epoch 0: 56%|█████▌ | 6923/12384 [14:41:24<11:38:30, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 56%|█████▌ | 6924/12384 [14:41:24<11:36:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 56%|█████▌ | 6924/12384 [14:41:32<11:36:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 0: 56%|█████▌ | 6925/12384 [14:41:32<11:34:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 0: 56%|█████▌ | 6925/12384 [14:41:39<11:34:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 56%|█████▌ | 6926/12384 [14:41:39<11:33:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 56%|█████▌ | 6926/12384 [14:41:47<11:33:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 56%|█████▌ | 6927/12384 [14:41:47<11:33:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 56%|█████▌ | 6927/12384 [14:41:54<11:33:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 56%|█████▌ | 6928/12384 [14:41:54<11:32:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 56%|█████▌ | 6928/12384 [14:42:02<11:32:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 56%|█████▌ | 6929/12384 [14:42:02<11:32:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 56%|█████▌ | 6929/12384 [14:42:10<11:32:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.26s]
Epoch 0: 56%|█████▌ | 6930/12384 [14:42:10<11:31:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.26s]
Epoch 0: 56%|█████▌ | 6930/12384 [14:42:17<11:31:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.98s]
Epoch 0: 56%|█████▌ | 6931/12384 [14:42:17<11:31:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.98s]
Epoch 0: 56%|█████▌ | 6931/12384 [14:42:25<11:31:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 0: 56%|█████▌ | 6932/12384 [14:42:25<11:32:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 0: 56%|█████▌ | 6932/12384 [14:42:32<11:32:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.57s]
Epoch 0: 56%|█████▌ | 6933/12384 [14:42:32<11:31:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.57s]
Epoch 0: 56%|█████▌ | 6933/12384 [14:42:40<11:31:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 56%|█████▌ | 6934/12384 [14:42:40<11:31:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 56%|█████▌ | 6934/12384 [14:42:48<11:31:16, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.81s]
Epoch 0: 56%|█████▌ | 6935/12384 [14:42:48<11:31:30, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.81s]
Epoch 0: 56%|█████▌ | 6935/12384 [14:42:55<11:31:30, 7.61s/it, loss=0.0003, acc=0.9977, iter_time=10.39s]
Epoch 0: 56%|█████▌ | 6936/12384 [14:42:55<11:31:18, 7.61s/it, loss=0.0003, acc=0.9977, iter_time=10.39s]
Epoch 0: 56%|█████▌ | 6936/12384 [14:43:03<11:31:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 56%|█████▌ | 6937/12384 [14:43:03<11:30:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 56%|█████▌ | 6937/12384 [14:43:11<11:30:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 0: 56%|█████▌ | 6938/12384 [14:43:11<11:31:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 0: 56%|█████▌ | 6938/12384 [14:43:18<11:31:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 56%|█████▌ | 6939/12384 [14:43:18<11:30:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 56%|█████▌ | 6939/12384 [14:43:26<11:30:39, 7.61s/it, loss=0.0002, acc=0.9990, iter_time=8.09s]
Epoch 0: 56%|█████▌ | 6940/12384 [14:43:26<11:30:46, 7.61s/it, loss=0.0002, acc=0.9990, iter_time=8.09s]
Epoch 0: 56%|█████▌ | 6940/12384 [14:43:33<11:30:46, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.31s]
Epoch 0: 56%|█████▌ | 6941/12384 [14:43:33<11:30:09, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.31s]
Epoch 0: 56%|█████▌ | 6941/12384 [14:43:41<11:30:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 0: 56%|█████▌ | 6942/12384 [14:43:41<11:29:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 0: 56%|█████▌ | 6942/12384 [14:43:49<11:29:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.93s]
Epoch 0: 56%|█████▌ | 6943/12384 [14:43:49<11:29:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.93s]
Epoch 0: 56%|█████▌ | 6943/12384 [14:43:56<11:29:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.28s]
Epoch 0: 56%|█████▌ | 6944/12384 [14:43:56<11:29:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.28s]
Epoch 0: 56%|█████▌ | 6944/12384 [14:44:04<11:29:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 56%|█████▌ | 6945/12384 [14:44:04<11:29:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 56%|█████▌ | 6945/12384 [14:44:11<11:29:24, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.79s]
Epoch 0: 56%|█████▌ | 6946/12384 [14:44:11<11:29:38, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.79s]
Epoch 0: 56%|█████▌ | 6946/12384 [14:44:19<11:29:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.44s]
Epoch 0: 56%|█████▌ | 6947/12384 [14:44:19<11:29:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.44s]
Epoch 0: 56%|█████▌ | 6947/12384 [14:44:27<11:29:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 0: 56%|█████▌ | 6948/12384 [14:44:27<11:30:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 0: 56%|█████▌ | 6948/12384 [14:44:35<11:30:03, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.98s]
Epoch 0: 56%|█████▌ | 6949/12384 [14:44:35<11:37:34, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=9.98s]
Epoch 0: 56%|█████▌ | 6949/12384 [14:44:42<11:37:34, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 0: 56%|█████▌ | 6950/12384 [14:44:42<11:35:00, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 0: 56%|█████▌ | 6950/12384 [14:44:50<11:35:00, 7.67s/it, loss=0.0010, acc=0.9985, iter_time=5.97s]
Epoch 0: 56%|█████▌ | 6951/12384 [14:44:50<11:32:59, 7.65s/it, loss=0.0010, acc=0.9985, iter_time=5.97s]
Epoch 0: 56%|█████▌ | 6951/12384 [14:44:57<11:32:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 0: 56%|█████▌ | 6952/12384 [14:44:57<11:32:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 0: 56%|█████▌ | 6952/12384 [14:45:05<11:32:12, 7.65s/it, loss=0.0003, acc=0.9998, iter_time=5.13s]
Epoch 0: 56%|█████▌ | 6953/12384 [14:45:05<11:31:16, 7.64s/it, loss=0.0003, acc=0.9998, iter_time=5.13s]
Epoch 0: 56%|█████▌ | 6953/12384 [14:45:13<11:31:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 0: 56%|█████▌ | 6954/12384 [14:45:13<11:30:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 0: 56%|█████▌ | 6954/12384 [14:45:20<11:30:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 56%|█████▌ | 6955/12384 [14:45:20<11:29:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 56%|█████▌ | 6955/12384 [14:45:28<11:29:58, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.74s]
Epoch 0: 56%|█████▌ | 6956/12384 [14:45:28<11:29:16, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.74s]
Epoch 0: 56%|█████▌ | 6956/12384 [14:45:35<11:29:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.22s]
Epoch 0: 56%|█████▌ | 6957/12384 [14:45:35<11:28:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.22s]
Epoch 0: 56%|█████▌ | 6957/12384 [14:45:43<11:28:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 0: 56%|█████▌ | 6958/12384 [14:45:43<11:28:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 0: 56%|█████▌ | 6958/12384 [14:45:51<11:28:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 0: 56%|█████▌ | 6959/12384 [14:45:51<11:28:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 0: 56%|█████▌ | 6959/12384 [14:45:58<11:28:17, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.98s]
Epoch 0: 56%|█████▌ | 6960/12384 [14:45:58<11:27:25, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.98s]
Epoch 0: 56%|█████▌ | 6960/12384 [14:46:06<11:27:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.37s]
Epoch 0: 56%|█████▌ | 6961/12384 [14:46:06<11:27:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.37s]
Epoch 0: 56%|█████▌ | 6961/12384 [14:46:13<11:27:20, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=9.25s]
Epoch 0: 56%|█████▌ | 6962/12384 [14:46:13<11:28:00, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.25s]
Epoch 0: 56%|█████▌ | 6962/12384 [14:46:21<11:28:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 0: 56%|█████▌ | 6963/12384 [14:46:21<11:27:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 0: 56%|█████▌ | 6963/12384 [14:46:29<11:27:57, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 56%|█████▌ | 6964/12384 [14:46:29<11:27:41, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 56%|█████▌ | 6964/12384 [14:46:36<11:27:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.80s]
Epoch 0: 56%|█████▌ | 6965/12384 [14:46:36<11:27:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.80s]
Epoch 0: 56%|█████▌ | 6965/12384 [14:46:44<11:27:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 0: 56%|█████▋ | 6966/12384 [14:46:44<11:27:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 0: 56%|█████▋ | 6966/12384 [14:46:51<11:27:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 56%|█████▋ | 6967/12384 [14:46:51<11:26:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 56%|█████▋ | 6967/12384 [14:46:59<11:26:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 56%|█████▋ | 6968/12384 [14:46:59<11:26:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 56%|█████▋ | 6968/12384 [14:47:07<11:26:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 0: 56%|█████▋ | 6969/12384 [14:47:07<11:26:07, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 0: 56%|█████▋ | 6969/12384 [14:47:14<11:26:07, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 0: 56%|█████▋ | 6970/12384 [14:47:14<11:26:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 0: 56%|█████▋ | 6970/12384 [14:47:22<11:26:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 56%|█████▋ | 6971/12384 [14:47:22<11:26:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 56%|█████▋ | 6971/12384 [14:47:30<11:26:25, 7.61s/it, loss=0.0005, acc=0.9971, iter_time=5.81s]
Epoch 0: 56%|█████▋ | 6972/12384 [14:47:30<11:26:21, 7.61s/it, loss=0.0005, acc=0.9971, iter_time=5.81s]
Epoch 0: 56%|█████▋ | 6972/12384 [14:47:37<11:26:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 0: 56%|█████▋ | 6973/12384 [14:47:37<11:27:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 0: 56%|█████▋ | 6973/12384 [14:47:45<11:27:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.66s]
Epoch 0: 56%|█████▋ | 6974/12384 [14:47:45<11:26:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.66s]
Epoch 0: 56%|█████▋ | 6974/12384 [14:47:53<11:26:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 0: 56%|█████▋ | 6975/12384 [14:47:53<11:34:32, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 0: 56%|█████▋ | 6975/12384 [14:48:00<11:34:32, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 0: 56%|█████▋ | 6976/12384 [14:48:00<11:32:12, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 0: 56%|█████▋ | 6976/12384 [14:48:08<11:32:12, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 0: 56%|█████▋ | 6977/12384 [14:48:08<11:29:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 0: 56%|█████▋ | 6977/12384 [14:48:16<11:29:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 0: 56%|█████▋ | 6978/12384 [14:48:16<11:28:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 0: 56%|█████▋ | 6978/12384 [14:48:23<11:28:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 56%|█████▋ | 6979/12384 [14:48:23<11:27:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 56%|█████▋ | 6979/12384 [14:48:31<11:27:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 56%|█████▋ | 6980/12384 [14:48:31<11:26:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 56%|█████▋ | 6980/12384 [14:48:38<11:26:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 0: 56%|█████▋ | 6981/12384 [14:48:38<11:29:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 0: 56%|█████▋ | 6981/12384 [14:48:46<11:29:10, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=10.00s]
Epoch 0: 56%|█████▋ | 6982/12384 [14:48:46<11:27:55, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=10.00s]
Epoch 0: 56%|█████▋ | 6982/12384 [14:48:54<11:27:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 56%|█████▋ | 6983/12384 [14:48:54<11:34:40, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 56%|█████▋ | 6983/12384 [14:49:02<11:34:40, 7.72s/it, loss=0.0002, acc=0.9998, iter_time=7.54s]
Epoch 0: 56%|█████▋ | 6984/12384 [14:49:02<11:31:19, 7.68s/it, loss=0.0002, acc=0.9998, iter_time=7.54s]
Epoch 0: 56%|█████▋ | 6984/12384 [14:49:09<11:31:19, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.13s]
Epoch 0: 56%|█████▋ | 6985/12384 [14:49:09<11:29:53, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.13s]
Epoch 0: 56%|█████▋ | 6985/12384 [14:49:17<11:29:53, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=10.14s]
Epoch 0: 56%|█████▋ | 6986/12384 [14:49:17<11:27:50, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=10.14s]
Epoch 0: 56%|█████▋ | 6986/12384 [14:49:24<11:27:50, 7.65s/it, loss=0.0003, acc=0.9981, iter_time=7.61s]
Epoch 0: 56%|█████▋ | 6987/12384 [14:49:24<11:26:45, 7.63s/it, loss=0.0003, acc=0.9981, iter_time=7.61s]
Epoch 0: 56%|█████▋ | 6987/12384 [14:49:32<11:26:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 56%|█████▋ | 6988/12384 [14:49:32<11:25:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 56%|█████▋ | 6988/12384 [14:49:40<11:25:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 0: 56%|█████▋ | 6989/12384 [14:49:40<11:25:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 0: 56%|█████▋ | 6989/12384 [14:49:47<11:25:09, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.05s]
Epoch 0: 56%|█████▋ | 6990/12384 [14:49:47<11:24:31, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.05s]
Epoch 0: 56%|█████▋ | 6990/12384 [14:49:55<11:24:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 0: 56%|█████▋ | 6991/12384 [14:49:55<11:24:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 0: 56%|█████▋ | 6991/12384 [14:50:02<11:24:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 56%|█████▋ | 6992/12384 [14:50:02<11:24:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 56%|█████▋ | 6992/12384 [14:50:10<11:24:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 56%|█████▋ | 6993/12384 [14:50:10<11:24:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 56%|█████▋ | 6993/12384 [14:50:18<11:24:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 56%|█████▋ | 6994/12384 [14:50:18<11:24:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 56%|█████▋ | 6994/12384 [14:50:25<11:24:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 56%|█████▋ | 6995/12384 [14:50:25<11:24:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 56%|█████▋ | 6995/12384 [14:50:33<11:24:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 0: 56%|█████▋ | 6996/12384 [14:50:33<11:23:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 0: 56%|█████▋ | 6996/12384 [14:50:41<11:23:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.83s]
Epoch 0: 57%|█████▋ | 6997/12384 [14:50:41<11:23:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.83s]
Epoch 0: 57%|█████▋ | 6997/12384 [14:50:48<11:23:15, 7.61s/it, loss=0.0002, acc=0.9998, iter_time=10.16s]
Epoch 0: 57%|█████▋ | 6998/12384 [14:50:48<11:22:39, 7.60s/it, loss=0.0002, acc=0.9998, iter_time=10.16s]
Epoch 0: 57%|█████▋ | 6998/12384 [14:50:56<11:22:39, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 57%|█████▋ | 6999/12384 [14:50:56<11:22:23, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 57%|█████▋ | 6999/12384 [14:51:03<11:22:23, 7.60s/it, loss=0.0002, acc=1.0000, iter_time=7.99s]
Epoch 0: 57%|█████▋ | 7000/12384 [14:51:03<11:27:25, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.99s]
Epoch 0: 57%|█████▋ | 7000/12384 [14:51:11<11:27:25, 7.66s/it, loss=0.0006, acc=0.9989, iter_time=7.46s]
Epoch 0: 57%|█████▋ | 7001/12384 [14:51:11<11:34:42, 7.74s/it, loss=0.0006, acc=0.9989, iter_time=7.46s]
Epoch 0: 57%|█████▋ | 7001/12384 [14:51:19<11:34:42, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 0: 57%|█████▋ | 7002/12384 [14:51:19<11:30:38, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 0: 57%|█████▋ | 7002/12384 [14:51:27<11:30:38, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 0: 57%|█████▋ | 7003/12384 [14:51:27<11:27:10, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 0: 57%|█████▋ | 7003/12384 [14:51:34<11:27:10, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 57%|█████▋ | 7004/12384 [14:51:34<11:25:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 57%|█████▋ | 7004/12384 [14:51:42<11:25:28, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.21s]
Epoch 0: 57%|█████▋ | 7005/12384 [14:51:42<11:24:26, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.21s]
Epoch 0: 57%|█████▋ | 7005/12384 [14:51:49<11:24:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 0: 57%|█████▋ | 7006/12384 [14:51:49<11:23:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 0: 57%|█████▋ | 7006/12384 [14:51:57<11:23:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 0: 57%|█████▋ | 7007/12384 [14:51:57<11:23:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 0: 57%|█████▋ | 7007/12384 [14:52:05<11:23:19, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=8.12s]
Epoch 0: 57%|█████▋ | 7008/12384 [14:52:05<11:25:22, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=8.12s]
Epoch 0: 57%|█████▋ | 7008/12384 [14:52:12<11:25:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 57%|█████▋ | 7009/12384 [14:52:12<11:24:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 57%|█████▋ | 7009/12384 [14:52:20<11:24:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 0: 57%|█████▋ | 7010/12384 [14:52:20<11:31:28, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 0: 57%|█████▋ | 7010/12384 [14:52:28<11:31:28, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 57%|█████▋ | 7011/12384 [14:52:28<11:28:19, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 57%|█████▋ | 7011/12384 [14:52:35<11:28:19, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 57%|█████▋ | 7012/12384 [14:52:35<11:26:07, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 57%|█████▋ | 7012/12384 [14:52:43<11:26:07, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 0: 57%|█████▋ | 7013/12384 [14:52:43<11:25:17, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 0: 57%|█████▋ | 7013/12384 [14:52:51<11:25:17, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 0: 57%|█████▋ | 7014/12384 [14:52:51<11:24:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 0: 57%|█████▋ | 7014/12384 [14:52:58<11:24:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 57%|█████▋ | 7015/12384 [14:52:58<11:24:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 57%|█████▋ | 7015/12384 [14:53:06<11:24:26, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.04s]
Epoch 0: 57%|█████▋ | 7016/12384 [14:53:06<11:23:03, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.04s]
Epoch 0: 57%|█████▋ | 7016/12384 [14:53:14<11:23:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 57%|█████▋ | 7017/12384 [14:53:14<11:23:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 57%|█████▋ | 7017/12384 [14:53:21<11:23:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.82s]
Epoch 0: 57%|█████▋ | 7018/12384 [14:53:21<11:23:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.82s]
Epoch 0: 57%|█████▋ | 7018/12384 [14:53:29<11:23:20, 7.64s/it, loss=0.0004, acc=0.9989, iter_time=9.37s]
Epoch 0: 57%|█████▋ | 7019/12384 [14:53:29<11:22:18, 7.63s/it, loss=0.0004, acc=0.9989, iter_time=9.37s]
Epoch 0: 57%|█████▋ | 7019/12384 [14:53:37<11:22:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.72s]
Epoch 0: 57%|█████▋ | 7020/12384 [14:53:37<11:21:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.72s]
Epoch 0: 57%|█████▋ | 7020/12384 [14:53:44<11:21:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 57%|█████▋ | 7021/12384 [14:53:44<11:20:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 57%|█████▋ | 7021/12384 [14:53:52<11:20:53, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=7.60s]
Epoch 0: 57%|█████▋ | 7022/12384 [14:53:52<11:20:38, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=7.60s]
Epoch 0: 57%|█████▋ | 7022/12384 [14:53:59<11:20:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 57%|█████▋ | 7023/12384 [14:53:59<11:20:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 57%|█████▋ | 7023/12384 [14:54:07<11:20:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 57%|█████▋ | 7024/12384 [14:54:07<11:20:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 57%|█████▋ | 7024/12384 [14:54:15<11:20:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 57%|█████▋ | 7025/12384 [14:54:15<11:19:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 57%|█████▋ | 7025/12384 [14:54:22<11:19:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 57%|█████▋ | 7026/12384 [14:54:22<11:19:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 57%|█████▋ | 7026/12384 [14:54:30<11:19:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 57%|█████▋ | 7027/12384 [14:54:30<11:28:19, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 57%|█████▋ | 7027/12384 [14:54:38<11:28:19, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 57%|█████▋ | 7028/12384 [14:54:38<11:25:33, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 57%|█████▋ | 7028/12384 [14:54:45<11:25:33, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 57%|█████▋ | 7029/12384 [14:54:45<11:23:37, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 57%|█████▋ | 7029/12384 [14:54:53<11:23:37, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 57%|█████▋ | 7030/12384 [14:54:53<11:22:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 57%|█████▋ | 7030/12384 [14:55:01<11:22:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 57%|█████▋ | 7031/12384 [14:55:01<11:20:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 57%|█████▋ | 7031/12384 [14:55:08<11:20:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 57%|█████▋ | 7032/12384 [14:55:08<11:20:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 57%|█████▋ | 7032/12384 [14:55:16<11:20:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 0: 57%|█████▋ | 7033/12384 [14:55:16<11:20:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 0: 57%|█████▋ | 7033/12384 [14:55:23<11:20:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 0: 57%|█████▋ | 7034/12384 [14:55:23<11:19:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 0: 57%|█████▋ | 7034/12384 [14:55:31<11:19:11, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.60s]
Epoch 0: 57%|█████▋ | 7035/12384 [14:55:31<11:19:24, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.60s]
Epoch 0: 57%|█████▋ | 7035/12384 [14:55:39<11:19:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 57%|█████▋ | 7036/12384 [14:55:39<11:18:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 57%|█████▋ | 7036/12384 [14:55:46<11:18:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 0: 57%|█████▋ | 7037/12384 [14:55:46<11:19:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 0: 57%|█████▋ | 7037/12384 [14:55:54<11:19:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 0: 57%|█████▋ | 7038/12384 [14:55:54<11:18:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 0: 57%|█████▋ | 7038/12384 [14:56:01<11:18:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 0: 57%|█████▋ | 7039/12384 [14:56:01<11:18:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 0: 57%|█████▋ | 7039/12384 [14:56:09<11:18:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 0: 57%|█████▋ | 7040/12384 [14:56:09<11:18:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 0: 57%|█████▋ | 7040/12384 [14:56:17<11:18:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.37s]
Epoch 0: 57%|█████▋ | 7041/12384 [14:56:17<11:18:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.37s]
Epoch 0: 57%|█████▋ | 7041/12384 [14:56:24<11:18:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.95s]
Epoch 0: 57%|█████▋ | 7042/12384 [14:56:24<11:18:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.95s]
Epoch 0: 57%|█████▋ | 7042/12384 [14:56:32<11:18:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 0: 57%|█████▋ | 7043/12384 [14:56:32<11:18:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 0: 57%|█████▋ | 7043/12384 [14:56:40<11:18:11, 7.62s/it, loss=0.0004, acc=0.9984, iter_time=7.64s]
Epoch 0: 57%|█████▋ | 7044/12384 [14:56:40<11:17:49, 7.62s/it, loss=0.0004, acc=0.9984, iter_time=7.64s]
Epoch 0: 57%|█████▋ | 7044/12384 [14:56:47<11:17:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 0: 57%|█████▋ | 7045/12384 [14:56:47<11:18:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 0: 57%|█████▋ | 7045/12384 [14:56:55<11:18:06, 7.62s/it, loss=0.0001, acc=0.9995, iter_time=8.24s]
Epoch 0: 57%|█████▋ | 7046/12384 [14:56:55<11:17:22, 7.61s/it, loss=0.0001, acc=0.9995, iter_time=8.24s]
Epoch 0: 57%|█████▋ | 7046/12384 [14:57:02<11:17:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 57%|█████▋ | 7047/12384 [14:57:02<11:16:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 57%|█████▋ | 7047/12384 [14:57:10<11:16:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 57%|█████▋ | 7048/12384 [14:57:10<11:17:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 57%|█████▋ | 7048/12384 [14:57:18<11:17:08, 7.61s/it, loss=0.0010, acc=0.9988, iter_time=6.04s]
Epoch 0: 57%|█████▋ | 7049/12384 [14:57:18<11:16:29, 7.61s/it, loss=0.0010, acc=0.9988, iter_time=6.04s]
Epoch 0: 57%|█████▋ | 7049/12384 [14:57:25<11:16:29, 7.61s/it, loss=0.0006, acc=0.9969, iter_time=9.22s]
Epoch 0: 57%|█████▋ | 7050/12384 [14:57:25<11:16:51, 7.61s/it, loss=0.0006, acc=0.9969, iter_time=9.22s]
Epoch 0: 57%|█████▋ | 7050/12384 [14:57:33<11:16:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 57%|█████▋ | 7051/12384 [14:57:33<11:16:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 57%|█████▋ | 7051/12384 [14:57:40<11:16:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 57%|█████▋ | 7052/12384 [14:57:40<11:16:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 57%|█████▋ | 7052/12384 [14:57:48<11:16:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 57%|█████▋ | 7053/12384 [14:57:48<11:25:55, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 57%|█████▋ | 7053/12384 [14:57:56<11:25:55, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 57%|█████▋ | 7054/12384 [14:57:56<11:23:07, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 57%|█████▋ | 7054/12384 [14:58:04<11:23:07, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 57%|█████▋ | 7055/12384 [14:58:04<11:19:59, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 57%|█████▋ | 7055/12384 [14:58:11<11:19:59, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 57%|█████▋ | 7056/12384 [14:58:11<11:20:18, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 57%|█████▋ | 7056/12384 [14:58:19<11:20:18, 7.66s/it, loss=0.0003, acc=1.0000, iter_time=7.28s]
Epoch 0: 57%|█████▋ | 7057/12384 [14:58:19<11:18:48, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=7.28s]
Epoch 0: 57%|█████▋ | 7057/12384 [14:58:27<11:18:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.89s]
Epoch 0: 57%|█████▋ | 7058/12384 [14:58:27<11:18:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.89s]
Epoch 0: 57%|█████▋ | 7058/12384 [14:58:34<11:18:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 0: 57%|█████▋ | 7059/12384 [14:58:34<11:17:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 0: 57%|█████▋ | 7059/12384 [14:58:42<11:17:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 57%|█████▋ | 7060/12384 [14:58:42<11:16:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 57%|█████▋ | 7060/12384 [14:58:49<11:16:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 0: 57%|█████▋ | 7061/12384 [14:58:49<11:15:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 0: 57%|█████▋ | 7061/12384 [14:58:57<11:15:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 0: 57%|█████▋ | 7062/12384 [14:58:57<11:15:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 0: 57%|█████▋ | 7062/12384 [14:59:05<11:15:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 57%|█████▋ | 7063/12384 [14:59:05<11:14:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 57%|█████▋ | 7063/12384 [14:59:12<11:14:51, 7.61s/it, loss=0.0008, acc=0.9986, iter_time=8.28s]
Epoch 0: 57%|█████▋ | 7064/12384 [14:59:12<11:22:13, 7.69s/it, loss=0.0008, acc=0.9986, iter_time=8.28s]
Epoch 0: 57%|█████▋ | 7064/12384 [14:59:20<11:22:13, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=5.39s]
Epoch 0: 57%|█████▋ | 7065/12384 [14:59:20<11:20:04, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=5.39s]
Epoch 0: 57%|█████▋ | 7065/12384 [14:59:28<11:20:04, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=9.43s]
Epoch 0: 57%|█████▋ | 7066/12384 [14:59:28<11:18:58, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=9.43s]
Epoch 0: 57%|█████▋ | 7066/12384 [14:59:35<11:18:58, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 0: 57%|█████▋ | 7067/12384 [14:59:35<11:17:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 0: 57%|█████▋ | 7067/12384 [14:59:43<11:17:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 0: 57%|█████▋ | 7068/12384 [14:59:43<11:16:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 0: 57%|█████▋ | 7068/12384 [14:59:51<11:16:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 0: 57%|█████▋ | 7069/12384 [14:59:51<11:15:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 0: 57%|█████▋ | 7069/12384 [14:59:58<11:15:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.33s]
Epoch 0: 57%|█████▋ | 7070/12384 [14:59:58<11:14:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.33s]
Epoch 0: 57%|█████▋ | 7070/12384 [15:00:06<11:14:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 0: 57%|█████▋ | 7071/12384 [15:00:06<11:13:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 0: 57%|█████▋ | 7071/12384 [15:00:13<11:13:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 0: 57%|█████▋ | 7072/12384 [15:00:13<11:15:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 0: 57%|█████▋ | 7072/12384 [15:00:21<11:15:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 0: 57%|█████▋ | 7073/12384 [15:00:21<11:14:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 0: 57%|█████▋ | 7073/12384 [15:00:29<11:14:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 0: 57%|█████▋ | 7074/12384 [15:00:29<11:13:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 0: 57%|█████▋ | 7074/12384 [15:00:36<11:13:23, 7.61s/it, loss=0.0005, acc=0.9988, iter_time=10.18s]
Epoch 0: 57%|█████▋ | 7075/12384 [15:00:36<11:13:00, 7.61s/it, loss=0.0005, acc=0.9988, iter_time=10.18s]
Epoch 0: 57%|█████▋ | 7075/12384 [15:00:44<11:13:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 57%|█████▋ | 7076/12384 [15:00:44<11:12:32, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 57%|█████▋ | 7076/12384 [15:00:51<11:12:32, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 57%|█████▋ | 7077/12384 [15:00:51<11:12:35, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 57%|█████▋ | 7077/12384 [15:00:59<11:12:35, 7.60s/it, loss=0.0003, acc=1.0000, iter_time=7.60s]
Epoch 0: 57%|█████▋ | 7078/12384 [15:00:59<11:12:36, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=7.60s]
Epoch 0: 57%|█████▋ | 7078/12384 [15:01:07<11:12:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 57%|█████▋ | 7079/12384 [15:01:07<11:12:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 57%|█████▋ | 7079/12384 [15:01:15<11:12:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 0: 57%|█████▋ | 7080/12384 [15:01:15<11:22:56, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 0: 57%|█████▋ | 7080/12384 [15:01:22<11:22:56, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 0: 57%|█████▋ | 7081/12384 [15:01:22<11:19:23, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 0: 57%|█████▋ | 7081/12384 [15:01:30<11:19:23, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 57%|█████▋ | 7082/12384 [15:01:30<11:16:58, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 57%|█████▋ | 7082/12384 [15:01:37<11:16:58, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 57%|█████▋ | 7083/12384 [15:01:37<11:14:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 57%|█████▋ | 7083/12384 [15:01:45<11:14:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 0: 57%|█████▋ | 7084/12384 [15:01:45<11:13:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 0: 57%|█████▋ | 7084/12384 [15:01:53<11:13:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.83s]
Epoch 0: 57%|█████▋ | 7085/12384 [15:01:53<11:12:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.83s]
Epoch 0: 57%|█████▋ | 7085/12384 [15:02:00<11:12:46, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.13s]
Epoch 0: 57%|█████▋ | 7086/12384 [15:02:00<11:12:03, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.13s]
Epoch 0: 57%|█████▋ | 7086/12384 [15:02:08<11:12:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 57%|█████▋ | 7087/12384 [15:02:08<11:13:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 57%|█████▋ | 7087/12384 [15:02:15<11:13:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 0: 57%|█████▋ | 7088/12384 [15:02:15<11:13:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 0: 57%|█████▋ | 7088/12384 [15:02:23<11:13:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 0: 57%|█████▋ | 7089/12384 [15:02:23<11:12:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 0: 57%|█████▋ | 7089/12384 [15:02:31<11:12:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 0: 57%|█████▋ | 7090/12384 [15:02:31<11:20:10, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 0: 57%|█████▋ | 7090/12384 [15:02:39<11:20:10, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=3.99s]
Epoch 0: 57%|█████▋ | 7091/12384 [15:02:39<11:17:32, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=3.99s]
Epoch 0: 57%|█████▋ | 7091/12384 [15:02:46<11:17:32, 7.68s/it, loss=0.0003, acc=0.9987, iter_time=11.20s]
Epoch 0: 57%|█████▋ | 7092/12384 [15:02:46<11:15:52, 7.66s/it, loss=0.0003, acc=0.9987, iter_time=11.20s]
Epoch 0: 57%|█████▋ | 7092/12384 [15:02:54<11:15:52, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 57%|█████▋ | 7093/12384 [15:02:54<11:13:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 57%|█████▋ | 7093/12384 [15:03:01<11:13:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 0: 57%|█████▋ | 7094/12384 [15:03:01<11:12:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 0: 57%|█████▋ | 7094/12384 [15:03:09<11:12:32, 7.63s/it, loss=0.0007, acc=0.9978, iter_time=8.25s]
Epoch 0: 57%|█████▋ | 7095/12384 [15:03:09<11:14:09, 7.65s/it, loss=0.0007, acc=0.9978, iter_time=8.25s]
Epoch 0: 57%|█████▋ | 7095/12384 [15:03:17<11:14:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 0: 57%|█████▋ | 7096/12384 [15:03:17<11:13:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 0: 57%|█████▋ | 7096/12384 [15:03:24<11:13:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 57%|█████▋ | 7097/12384 [15:03:24<11:12:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 57%|█████▋ | 7097/12384 [15:03:32<11:12:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 57%|█████▋ | 7098/12384 [15:03:32<11:12:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 57%|█████▋ | 7098/12384 [15:03:40<11:12:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 57%|█████▋ | 7099/12384 [15:03:40<11:11:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 57%|█████▋ | 7099/12384 [15:03:47<11:11:48, 7.63s/it, loss=0.0004, acc=0.9981, iter_time=8.01s]
Epoch 0: 57%|█████▋ | 7100/12384 [15:03:47<11:10:43, 7.62s/it, loss=0.0004, acc=0.9981, iter_time=8.01s]
Epoch 0: 57%|█████▋ | 7100/12384 [15:03:55<11:10:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.18s]
Epoch 0: 57%|█████▋ | 7101/12384 [15:03:55<11:09:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.18s]
Epoch 0: 57%|█████▋ | 7101/12384 [15:04:02<11:09:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.60s]
Epoch 0: 57%|█████▋ | 7102/12384 [15:04:02<11:10:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.60s]
Epoch 0: 57%|█████▋ | 7102/12384 [15:04:10<11:10:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 57%|█████▋ | 7103/12384 [15:04:10<11:09:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 57%|█████▋ | 7103/12384 [15:04:18<11:09:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 57%|█████▋ | 7104/12384 [15:04:18<11:09:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 57%|█████▋ | 7104/12384 [15:04:25<11:09:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 57%|█████▋ | 7105/12384 [15:04:25<11:10:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 57%|█████▋ | 7105/12384 [15:04:33<11:10:54, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.07s]
Epoch 0: 57%|█████▋ | 7106/12384 [15:04:33<11:19:20, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=7.07s]
Epoch 0: 57%|█████▋ | 7106/12384 [15:04:41<11:19:20, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 0: 57%|█████▋ | 7107/12384 [15:04:41<11:16:49, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 0: 57%|█████▋ | 7107/12384 [15:04:48<11:16:49, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 57%|█████▋ | 7108/12384 [15:04:48<11:14:09, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 57%|█████▋ | 7108/12384 [15:04:56<11:14:09, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 57%|█████▋ | 7109/12384 [15:04:56<11:12:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 57%|█████▋ | 7109/12384 [15:05:04<11:12:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 57%|█████▋ | 7110/12384 [15:05:04<11:11:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 57%|█████▋ | 7110/12384 [15:05:11<11:11:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 57%|█████▋ | 7111/12384 [15:05:11<11:10:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 57%|█████▋ | 7111/12384 [15:05:19<11:10:06, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.55s]
Epoch 0: 57%|█████▋ | 7112/12384 [15:05:19<11:09:48, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.55s]
Epoch 0: 57%|█████▋ | 7112/12384 [15:05:27<11:09:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 0: 57%|█████▋ | 7113/12384 [15:05:27<11:09:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 0: 57%|█████▋ | 7113/12384 [15:05:34<11:09:25, 7.62s/it, loss=0.0002, acc=0.9995, iter_time=11.21s]
Epoch 0: 57%|█████▋ | 7114/12384 [15:05:34<11:08:47, 7.61s/it, loss=0.0002, acc=0.9995, iter_time=11.21s]
Epoch 0: 57%|█████▋ | 7114/12384 [15:05:42<11:08:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.00s]
Epoch 0: 57%|█████▋ | 7115/12384 [15:05:42<11:09:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.00s]
Epoch 0: 57%|█████▋ | 7115/12384 [15:05:49<11:09:00, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=11.21s]
Epoch 0: 57%|█████▋ | 7116/12384 [15:05:49<11:08:42, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=11.21s]
Epoch 0: 57%|█████▋ | 7116/12384 [15:05:57<11:08:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 57%|█████▋ | 7117/12384 [15:05:57<11:08:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 57%|█████▋ | 7117/12384 [15:06:05<11:08:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 57%|█████▋ | 7118/12384 [15:06:05<11:08:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 57%|█████▋ | 7118/12384 [15:06:12<11:08:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 57%|█████▋ | 7119/12384 [15:06:12<11:07:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 57%|█████▋ | 7119/12384 [15:06:20<11:07:59, 7.61s/it, loss=0.0003, acc=0.9982, iter_time=8.02s]
Epoch 0: 57%|█████▋ | 7120/12384 [15:06:20<11:08:10, 7.62s/it, loss=0.0003, acc=0.9982, iter_time=8.02s]
Epoch 0: 57%|█████▋ | 7120/12384 [15:06:27<11:08:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 58%|█████▊ | 7121/12384 [15:06:27<11:07:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 58%|█████▊ | 7121/12384 [15:06:35<11:07:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.43s]
Epoch 0: 58%|█████▊ | 7122/12384 [15:06:35<11:07:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.43s]
Epoch 0: 58%|█████▊ | 7122/12384 [15:06:43<11:07:52, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=11.81s]
Epoch 0: 58%|█████▊ | 7123/12384 [15:06:43<11:08:13, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=11.81s]
Epoch 0: 58%|█████▊ | 7123/12384 [15:06:50<11:08:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 58%|█████▊ | 7124/12384 [15:06:50<11:10:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 58%|█████▊ | 7124/12384 [15:06:58<11:10:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.49s]
Epoch 0: 58%|█████▊ | 7125/12384 [15:06:58<11:10:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.49s]
Epoch 0: 58%|█████▊ | 7125/12384 [15:07:06<11:10:06, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.86s]
Epoch 0: 58%|█████▊ | 7126/12384 [15:07:06<11:08:48, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.86s]
Epoch 0: 58%|█████▊ | 7126/12384 [15:07:13<11:08:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 58%|█████▊ | 7127/12384 [15:07:13<11:08:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 58%|█████▊ | 7127/12384 [15:07:21<11:08:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 58%|█████▊ | 7128/12384 [15:07:21<11:07:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 58%|█████▊ | 7128/12384 [15:07:28<11:07:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 58%|█████▊ | 7129/12384 [15:07:28<11:06:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 58%|█████▊ | 7129/12384 [15:07:36<11:06:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 0: 58%|█████▊ | 7130/12384 [15:07:36<11:07:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 0: 58%|█████▊ | 7130/12384 [15:07:44<11:07:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 0: 58%|█████▊ | 7131/12384 [15:07:44<11:07:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 0: 58%|█████▊ | 7131/12384 [15:07:51<11:07:06, 7.62s/it, loss=0.0010, acc=0.9986, iter_time=7.61s]
Epoch 0: 58%|█████▊ | 7132/12384 [15:07:51<11:06:08, 7.61s/it, loss=0.0010, acc=0.9986, iter_time=7.61s]
Epoch 0: 58%|█████▊ | 7132/12384 [15:07:59<11:06:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 58%|█████▊ | 7133/12384 [15:07:59<11:14:33, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 58%|█████▊ | 7133/12384 [15:08:07<11:14:33, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 0: 58%|█████▊ | 7134/12384 [15:08:07<11:11:50, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 0: 58%|█████▊ | 7134/12384 [15:08:14<11:11:50, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 0: 58%|█████▊ | 7135/12384 [15:08:14<11:10:59, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 0: 58%|█████▊ | 7135/12384 [15:08:22<11:10:59, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 58%|█████▊ | 7136/12384 [15:08:22<11:09:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 58%|█████▊ | 7136/12384 [15:08:30<11:09:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 58%|█████▊ | 7137/12384 [15:08:30<11:08:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 58%|█████▊ | 7137/12384 [15:08:37<11:08:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 0: 58%|█████▊ | 7138/12384 [15:08:37<11:09:28, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 0: 58%|█████▊ | 7138/12384 [15:08:45<11:09:28, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.00s]
Epoch 0: 58%|█████▊ | 7139/12384 [15:08:45<11:10:57, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.00s]
Epoch 0: 58%|█████▊ | 7139/12384 [15:08:53<11:10:57, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 58%|█████▊ | 7140/12384 [15:08:53<11:08:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 58%|█████▊ | 7140/12384 [15:09:00<11:08:44, 7.65s/it, loss=0.0012, acc=0.9987, iter_time=7.59s]
Epoch 0: 58%|█████▊ | 7141/12384 [15:09:00<11:07:04, 7.63s/it, loss=0.0012, acc=0.9987, iter_time=7.59s]
Epoch 0: 58%|█████▊ | 7141/12384 [15:09:08<11:07:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 58%|█████▊ | 7142/12384 [15:09:08<11:06:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 58%|█████▊ | 7142/12384 [15:09:16<11:06:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.94s]
Epoch 0: 58%|█████▊ | 7143/12384 [15:09:16<11:05:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.94s]
Epoch 0: 58%|█████▊ | 7143/12384 [15:09:23<11:05:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.64s]
Epoch 0: 58%|█████▊ | 7144/12384 [15:09:23<11:04:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.64s]
Epoch 0: 58%|█████▊ | 7144/12384 [15:09:31<11:04:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.47s]
Epoch 0: 58%|█████▊ | 7145/12384 [15:09:31<11:04:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.47s]
Epoch 0: 58%|█████▊ | 7145/12384 [15:09:38<11:04:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 0: 58%|█████▊ | 7146/12384 [15:09:38<11:07:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 0: 58%|█████▊ | 7146/12384 [15:09:46<11:07:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 0: 58%|█████▊ | 7147/12384 [15:09:46<11:06:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 0: 58%|█████▊ | 7147/12384 [15:09:54<11:06:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=2.47s]
Epoch 0: 58%|█████▊ | 7148/12384 [15:09:54<11:05:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=2.47s]
Epoch 0: 58%|█████▊ | 7148/12384 [15:10:01<11:05:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.29s]
Epoch 0: 58%|█████▊ | 7149/12384 [15:10:01<11:05:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.29s]
Epoch 0: 58%|█████▊ | 7149/12384 [15:10:09<11:05:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.45s]
Epoch 0: 58%|█████▊ | 7150/12384 [15:10:09<11:04:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.45s]
Epoch 0: 58%|█████▊ | 7150/12384 [15:10:17<11:04:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 0: 58%|█████▊ | 7151/12384 [15:10:17<11:28:49, 7.90s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 0: 58%|█████▊ | 7151/12384 [15:10:25<11:28:49, 7.90s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 58%|█████▊ | 7152/12384 [15:10:25<11:22:30, 7.83s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 58%|█████▊ | 7152/12384 [15:10:33<11:22:30, 7.83s/it, loss=0.0001, acc=0.9999, iter_time=7.67s]
Epoch 0: 58%|█████▊ | 7153/12384 [15:10:33<11:17:45, 7.77s/it, loss=0.0001, acc=0.9999, iter_time=7.67s]
Epoch 0: 58%|█████▊ | 7153/12384 [15:10:40<11:17:45, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=6.78s]
Epoch 0: 58%|█████▊ | 7154/12384 [15:10:40<11:13:19, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.78s]
Epoch 0: 58%|█████▊ | 7154/12384 [15:10:48<11:13:19, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=7.38s]
Epoch 0: 58%|█████▊ | 7155/12384 [15:10:48<11:09:55, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.38s]
Epoch 0: 58%|█████▊ | 7155/12384 [15:10:56<11:09:55, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 0: 58%|█████▊ | 7156/12384 [15:10:56<11:09:51, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 0: 58%|█████▊ | 7156/12384 [15:11:03<11:09:51, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.56s]
Epoch 0: 58%|█████▊ | 7157/12384 [15:11:03<11:08:05, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.56s]
Epoch 0: 58%|█████▊ | 7157/12384 [15:11:11<11:08:05, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 0: 58%|█████▊ | 7158/12384 [15:11:11<11:06:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 0: 58%|█████▊ | 7158/12384 [15:11:19<11:06:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 0: 58%|█████▊ | 7159/12384 [15:11:19<11:13:58, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 0: 58%|█████▊ | 7159/12384 [15:11:26<11:13:58, 7.74s/it, loss=0.0001, acc=1.0000, iter_time=7.86s]
Epoch 0: 58%|█████▊ | 7160/12384 [15:11:26<11:10:48, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.86s]
Epoch 0: 58%|█████▊ | 7160/12384 [15:11:34<11:10:48, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 0: 58%|█████▊ | 7161/12384 [15:11:34<11:08:30, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 0: 58%|█████▊ | 7161/12384 [15:11:42<11:08:30, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=8.16s]
Epoch 0: 58%|█████▊ | 7162/12384 [15:11:42<11:06:40, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=8.16s]
Epoch 0: 58%|█████▊ | 7162/12384 [15:11:49<11:06:40, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.29s]
Epoch 0: 58%|█████▊ | 7163/12384 [15:11:49<11:04:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.29s]
Epoch 0: 58%|█████▊ | 7163/12384 [15:11:57<11:04:47, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.64s]
Epoch 0: 58%|█████▊ | 7164/12384 [15:11:57<11:06:24, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=8.64s]
Epoch 0: 58%|█████▊ | 7164/12384 [15:12:05<11:06:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.19s]
Epoch 0: 58%|█████▊ | 7165/12384 [15:12:05<11:04:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.19s]
Epoch 0: 58%|█████▊ | 7165/12384 [15:12:12<11:04:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 0: 58%|█████▊ | 7166/12384 [15:12:12<11:04:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 0: 58%|█████▊ | 7166/12384 [15:12:20<11:04:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.47s]
Epoch 0: 58%|█████▊ | 7167/12384 [15:12:20<11:04:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.47s]
Epoch 0: 58%|█████▊ | 7167/12384 [15:12:28<11:04:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 0: 58%|█████▊ | 7168/12384 [15:12:28<11:04:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 0: 58%|█████▊ | 7168/12384 [15:12:35<11:04:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 0: 58%|█████▊ | 7169/12384 [15:12:35<11:03:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 0: 58%|█████▊ | 7169/12384 [15:12:43<11:03:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.16s]
Epoch 0: 58%|█████▊ | 7170/12384 [15:12:43<11:03:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.16s]
Epoch 0: 58%|█████▊ | 7170/12384 [15:12:50<11:03:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.67s]
Epoch 0: 58%|█████▊ | 7171/12384 [15:12:50<11:02:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.67s]
Epoch 0: 58%|█████▊ | 7171/12384 [15:12:58<11:02:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 0: 58%|█████▊ | 7172/12384 [15:12:58<11:01:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 0: 58%|█████▊ | 7172/12384 [15:13:06<11:01:35, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.92s]
Epoch 0: 58%|█████▊ | 7173/12384 [15:13:06<11:01:06, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.92s]
Epoch 0: 58%|█████▊ | 7173/12384 [15:13:13<11:01:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 0: 58%|█████▊ | 7174/12384 [15:13:13<11:00:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 0: 58%|█████▊ | 7174/12384 [15:13:21<11:00:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 0: 58%|█████▊ | 7175/12384 [15:13:21<11:00:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 0: 58%|█████▊ | 7175/12384 [15:13:28<11:00:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 58%|█████▊ | 7176/12384 [15:13:28<11:01:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 58%|█████▊ | 7176/12384 [15:13:36<11:01:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 0: 58%|█████▊ | 7177/12384 [15:13:36<11:01:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 0: 58%|█████▊ | 7177/12384 [15:13:44<11:01:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 58%|█████▊ | 7178/12384 [15:13:44<11:00:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 58%|█████▊ | 7178/12384 [15:13:51<11:00:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 58%|█████▊ | 7179/12384 [15:13:51<10:59:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 58%|█████▊ | 7179/12384 [15:13:59<10:59:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 0: 58%|█████▊ | 7180/12384 [15:13:59<10:59:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 0: 58%|█████▊ | 7180/12384 [15:14:06<10:59:18, 7.60s/it, loss=0.0005, acc=0.9985, iter_time=7.90s]
Epoch 0: 58%|█████▊ | 7181/12384 [15:14:06<10:59:00, 7.60s/it, loss=0.0005, acc=0.9985, iter_time=7.90s]
Epoch 0: 58%|█████▊ | 7181/12384 [15:14:14<10:59:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 58%|█████▊ | 7182/12384 [15:14:14<10:58:57, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 58%|█████▊ | 7182/12384 [15:14:22<10:58:57, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 58%|█████▊ | 7183/12384 [15:14:22<10:59:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 58%|█████▊ | 7183/12384 [15:14:29<10:59:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 58%|█████▊ | 7184/12384 [15:14:29<10:59:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 58%|█████▊ | 7184/12384 [15:14:37<10:59:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.14s]
Epoch 0: 58%|█████▊ | 7185/12384 [15:14:37<11:08:59, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=4.14s]
Epoch 0: 58%|█████▊ | 7185/12384 [15:14:45<11:08:59, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=11.06s]
Epoch 0: 58%|█████▊ | 7186/12384 [15:14:45<11:06:14, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=11.06s]
Epoch 0: 58%|█████▊ | 7186/12384 [15:14:52<11:06:14, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 0: 58%|█████▊ | 7187/12384 [15:14:52<11:04:14, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 0: 58%|█████▊ | 7187/12384 [15:15:00<11:04:14, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 0: 58%|█████▊ | 7188/12384 [15:15:00<11:02:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 0: 58%|█████▊ | 7188/12384 [15:15:08<11:02:57, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=4.10s]
Epoch 0: 58%|█████▊ | 7189/12384 [15:15:08<11:02:05, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=4.10s]
Epoch 0: 58%|█████▊ | 7189/12384 [15:15:15<11:02:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 0: 58%|█████▊ | 7190/12384 [15:15:15<11:00:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 0: 58%|█████▊ | 7190/12384 [15:15:23<11:00:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 0: 58%|█████▊ | 7191/12384 [15:15:23<11:04:40, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 0: 58%|█████▊ | 7191/12384 [15:15:31<11:04:40, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 0: 58%|█████▊ | 7192/12384 [15:15:31<11:02:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 0: 58%|█████▊ | 7192/12384 [15:15:38<11:02:29, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.20s]
Epoch 0: 58%|█████▊ | 7193/12384 [15:15:38<11:00:34, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.20s]
Epoch 0: 58%|█████▊ | 7193/12384 [15:15:46<11:00:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 58%|█████▊ | 7194/12384 [15:15:46<10:59:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 58%|█████▊ | 7194/12384 [15:15:54<10:59:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 58%|█████▊ | 7195/12384 [15:15:54<10:58:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 58%|█████▊ | 7195/12384 [15:16:01<10:58:52, 7.62s/it, loss=0.0038, acc=0.9945, iter_time=7.96s]
Epoch 0: 58%|█████▊ | 7196/12384 [15:16:01<10:58:23, 7.61s/it, loss=0.0038, acc=0.9945, iter_time=7.96s]
Epoch 0: 58%|█████▊ | 7196/12384 [15:16:09<10:58:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 0: 58%|█████▊ | 7197/12384 [15:16:09<10:58:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 0: 58%|█████▊ | 7197/12384 [15:16:16<10:58:33, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.51s]
Epoch 0: 58%|█████▊ | 7198/12384 [15:16:16<10:58:27, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.51s]
Epoch 0: 58%|█████▊ | 7198/12384 [15:16:24<10:58:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 0: 58%|█████▊ | 7199/12384 [15:16:24<10:58:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 0: 58%|█████▊ | 7199/12384 [15:16:32<10:58:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 58%|█████▊ | 7200/12384 [15:16:32<10:57:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 58%|█████▊ | 7200/12384 [15:16:39<10:57:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.15s]
Epoch 0: 58%|█████▊ | 7201/12384 [15:16:39<10:57:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.15s]
Epoch 0: 58%|█████▊ | 7201/12384 [15:16:47<10:57:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 0: 58%|█████▊ | 7202/12384 [15:16:47<10:58:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 0: 58%|█████▊ | 7202/12384 [15:16:54<10:58:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 0: 58%|█████▊ | 7203/12384 [15:16:54<10:57:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 0: 58%|█████▊ | 7203/12384 [15:17:02<10:57:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 0: 58%|█████▊ | 7204/12384 [15:17:02<10:56:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 0: 58%|█████▊ | 7204/12384 [15:17:10<10:56:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 0: 58%|█████▊ | 7205/12384 [15:17:10<10:56:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 0: 58%|█████▊ | 7205/12384 [15:17:17<10:56:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 58%|█████▊ | 7206/12384 [15:17:17<10:56:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 58%|█████▊ | 7206/12384 [15:17:25<10:56:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 58%|█████▊ | 7207/12384 [15:17:25<10:56:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 58%|█████▊ | 7207/12384 [15:17:32<10:56:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 58%|█████▊ | 7208/12384 [15:17:32<10:55:59, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 58%|█████▊ | 7208/12384 [15:17:40<10:55:59, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 58%|█████▊ | 7209/12384 [15:17:40<10:56:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 58%|█████▊ | 7209/12384 [15:17:48<10:56:01, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 58%|█████▊ | 7210/12384 [15:17:48<10:55:28, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 58%|█████▊ | 7210/12384 [15:17:56<10:55:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 58%|█████▊ | 7211/12384 [15:17:56<11:03:56, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 58%|█████▊ | 7211/12384 [15:18:03<11:03:56, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 0: 58%|█████▊ | 7212/12384 [15:18:03<11:03:38, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 0: 58%|█████▊ | 7212/12384 [15:18:11<11:03:38, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 58%|█████▊ | 7213/12384 [15:18:11<11:01:38, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 58%|█████▊ | 7213/12384 [15:18:19<11:01:38, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 58%|█████▊ | 7214/12384 [15:18:19<11:02:59, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 58%|█████▊ | 7214/12384 [15:18:26<11:02:59, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.79s]
Epoch 0: 58%|█████▊ | 7215/12384 [15:18:26<11:03:10, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.79s]
Epoch 0: 58%|█████▊ | 7215/12384 [15:18:34<11:03:10, 7.70s/it, loss=0.0001, acc=0.9998, iter_time=8.01s]
Epoch 0: 58%|█████▊ | 7216/12384 [15:18:34<11:01:33, 7.68s/it, loss=0.0001, acc=0.9998, iter_time=8.01s]
Epoch 0: 58%|█████▊ | 7216/12384 [15:18:42<11:01:33, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 0: 58%|█████▊ | 7217/12384 [15:18:42<10:59:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 0: 58%|█████▊ | 7217/12384 [15:18:49<10:59:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.26s]
Epoch 0: 58%|█████▊ | 7218/12384 [15:18:49<10:58:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.26s]
Epoch 0: 58%|█████▊ | 7218/12384 [15:18:57<10:58:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.95s]
Epoch 0: 58%|█████▊ | 7219/12384 [15:18:57<10:57:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.95s]
Epoch 0: 58%|█████▊ | 7219/12384 [15:19:04<10:57:52, 7.64s/it, loss=0.0004, acc=0.9966, iter_time=4.76s]
Epoch 0: 58%|█████▊ | 7220/12384 [15:19:04<10:57:05, 7.63s/it, loss=0.0004, acc=0.9966, iter_time=4.76s]
Epoch 0: 58%|█████▊ | 7220/12384 [15:19:12<10:57:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.31s]
Epoch 0: 58%|█████▊ | 7221/12384 [15:19:12<10:56:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.31s]
Epoch 0: 58%|█████▊ | 7221/12384 [15:19:20<10:56:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 0: 58%|█████▊ | 7222/12384 [15:19:20<10:56:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 0: 58%|█████▊ | 7222/12384 [15:19:27<10:56:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 58%|█████▊ | 7223/12384 [15:19:27<10:58:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 58%|█████▊ | 7223/12384 [15:19:35<10:58:09, 7.65s/it, loss=0.0001, acc=0.9998, iter_time=7.65s]
Epoch 0: 58%|█████▊ | 7224/12384 [15:19:35<10:57:06, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=7.65s]
Epoch 0: 58%|█████▊ | 7224/12384 [15:19:43<10:57:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 58%|█████▊ | 7225/12384 [15:19:43<10:56:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 58%|█████▊ | 7225/12384 [15:19:50<10:56:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 58%|█████▊ | 7226/12384 [15:19:50<10:56:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 58%|█████▊ | 7226/12384 [15:19:58<10:56:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 58%|█████▊ | 7227/12384 [15:19:58<10:55:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 58%|█████▊ | 7227/12384 [15:20:05<10:55:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 0: 58%|█████▊ | 7228/12384 [15:20:05<10:54:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 0: 58%|█████▊ | 7228/12384 [15:20:13<10:54:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.14s]
Epoch 0: 58%|█████▊ | 7229/12384 [15:20:13<10:54:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.14s]
Epoch 0: 58%|█████▊ | 7229/12384 [15:20:21<10:54:03, 7.61s/it, loss=0.0001, acc=0.9990, iter_time=8.25s]
Epoch 0: 58%|█████▊ | 7230/12384 [15:20:21<10:53:41, 7.61s/it, loss=0.0001, acc=0.9990, iter_time=8.25s]
Epoch 0: 58%|█████▊ | 7230/12384 [15:20:28<10:53:41, 7.61s/it, loss=0.0003, acc=0.9987, iter_time=7.60s]
Epoch 0: 58%|█████▊ | 7231/12384 [15:20:28<10:54:21, 7.62s/it, loss=0.0003, acc=0.9987, iter_time=7.60s]
Epoch 0: 58%|█████▊ | 7231/12384 [15:20:36<10:54:21, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.02s]
Epoch 0: 58%|█████▊ | 7232/12384 [15:20:36<10:54:31, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.02s]
Epoch 0: 58%|█████▊ | 7232/12384 [15:20:44<10:54:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 0: 58%|█████▊ | 7233/12384 [15:20:44<10:54:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 0: 58%|█████▊ | 7233/12384 [15:20:51<10:54:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 0: 58%|█████▊ | 7234/12384 [15:20:51<10:53:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 0: 58%|█████▊ | 7234/12384 [15:20:59<10:53:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 0: 58%|█████▊ | 7235/12384 [15:20:59<10:53:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 0: 58%|█████▊ | 7235/12384 [15:21:06<10:53:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 0: 58%|█████▊ | 7236/12384 [15:21:06<10:53:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 0: 58%|█████▊ | 7236/12384 [15:21:14<10:53:18, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.52s]
Epoch 0: 58%|█████▊ | 7237/12384 [15:21:14<11:01:19, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=4.52s]
Epoch 0: 58%|█████▊ | 7237/12384 [15:21:22<11:01:19, 7.71s/it, loss=0.0001, acc=0.9986, iter_time=11.00s]
Epoch 0: 58%|█████▊ | 7238/12384 [15:21:22<10:58:36, 7.68s/it, loss=0.0001, acc=0.9986, iter_time=11.00s]
Epoch 0: 58%|█████▊ | 7238/12384 [15:21:30<10:58:36, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.61s]
Epoch 0: 58%|█████▊ | 7239/12384 [15:21:30<10:56:46, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.61s]
Epoch 0: 58%|█████▊ | 7239/12384 [15:21:37<10:56:46, 7.66s/it, loss=0.0002, acc=0.9985, iter_time=11.01s]
Epoch 0: 58%|█████▊ | 7240/12384 [15:21:37<10:56:11, 7.65s/it, loss=0.0002, acc=0.9985, iter_time=11.01s]
Epoch 0: 58%|█████▊ | 7240/12384 [15:21:45<10:56:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 0: 58%|█████▊ | 7241/12384 [15:21:45<10:55:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 0: 58%|█████▊ | 7241/12384 [15:21:52<10:55:03, 7.64s/it, loss=0.0004, acc=0.9988, iter_time=7.61s]
Epoch 0: 58%|█████▊ | 7242/12384 [15:21:52<10:53:44, 7.63s/it, loss=0.0004, acc=0.9988, iter_time=7.61s]
Epoch 0: 58%|█████▊ | 7242/12384 [15:22:00<10:53:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 58%|█████▊ | 7243/12384 [15:22:00<10:53:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 58%|█████▊ | 7243/12384 [15:22:08<10:53:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 0: 58%|█████▊ | 7244/12384 [15:22:08<10:52:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 0: 58%|█████▊ | 7244/12384 [15:22:15<10:52:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 0: 59%|█████▊ | 7245/12384 [15:22:15<10:53:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 0: 59%|█████▊ | 7245/12384 [15:22:23<10:53:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 59%|█████▊ | 7246/12384 [15:22:23<10:52:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 59%|█████▊ | 7246/12384 [15:22:30<10:52:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 59%|█████▊ | 7247/12384 [15:22:30<10:51:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 59%|█████▊ | 7247/12384 [15:22:38<10:51:58, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.46s]
Epoch 0: 59%|█████▊ | 7248/12384 [15:22:38<10:51:21, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.46s]
Epoch 0: 59%|█████▊ | 7248/12384 [15:22:46<10:51:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 59%|█████▊ | 7249/12384 [15:22:46<10:50:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 59%|█████▊ | 7249/12384 [15:22:53<10:50:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 59%|█████▊ | 7250/12384 [15:22:53<10:51:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 59%|█████▊ | 7250/12384 [15:23:01<10:51:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 59%|█████▊ | 7251/12384 [15:23:01<10:50:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 59%|█████▊ | 7251/12384 [15:23:09<10:50:50, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=5.05s]
Epoch 0: 59%|█████▊ | 7252/12384 [15:23:09<10:50:56, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=5.05s]
Epoch 0: 59%|█████▊ | 7252/12384 [15:23:16<10:50:56, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.13s]
Epoch 0: 59%|█████▊ | 7253/12384 [15:23:16<10:51:03, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.13s]
Epoch 0: 59%|█████▊ | 7253/12384 [15:23:24<10:51:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 0: 59%|█████▊ | 7254/12384 [15:23:24<10:50:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 0: 59%|█████▊ | 7254/12384 [15:23:31<10:50:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 59%|█████▊ | 7255/12384 [15:23:31<10:52:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 59%|█████▊ | 7255/12384 [15:23:39<10:52:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 0: 59%|█████▊ | 7256/12384 [15:23:39<10:52:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 0: 59%|█████▊ | 7256/12384 [15:23:47<10:52:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.17s]
Epoch 0: 59%|█████▊ | 7257/12384 [15:23:47<10:52:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.17s]
Epoch 0: 59%|█████▊ | 7257/12384 [15:23:54<10:52:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 0: 59%|█████▊ | 7258/12384 [15:23:54<10:53:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 0: 59%|█████▊ | 7258/12384 [15:24:02<10:53:46, 7.65s/it, loss=0.0028, acc=0.9977, iter_time=5.63s]
Epoch 0: 59%|█████▊ | 7259/12384 [15:24:02<10:52:31, 7.64s/it, loss=0.0028, acc=0.9977, iter_time=5.63s]
Epoch 0: 59%|█████▊ | 7259/12384 [15:24:10<10:52:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 0: 59%|█████▊ | 7260/12384 [15:24:10<10:51:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 0: 59%|█████▊ | 7260/12384 [15:24:17<10:51:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 59%|█████▊ | 7261/12384 [15:24:17<10:50:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 59%|█████▊ | 7261/12384 [15:24:25<10:50:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 59%|█████▊ | 7262/12384 [15:24:25<10:50:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 59%|█████▊ | 7262/12384 [15:24:32<10:50:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 59%|█████▊ | 7263/12384 [15:24:32<10:49:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 59%|█████▊ | 7263/12384 [15:24:40<10:49:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 0: 59%|█████▊ | 7264/12384 [15:24:40<10:59:57, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 0: 59%|█████▊ | 7264/12384 [15:24:48<10:59:57, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 0: 59%|█████▊ | 7265/12384 [15:24:48<10:58:06, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 0: 59%|█████▊ | 7265/12384 [15:24:56<10:58:06, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 0: 59%|█████▊ | 7266/12384 [15:24:56<10:55:25, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 0: 59%|█████▊ | 7266/12384 [15:25:03<10:55:25, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 59%|█████▊ | 7267/12384 [15:25:03<10:53:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 59%|█████▊ | 7267/12384 [15:25:11<10:53:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 0: 59%|█████▊ | 7268/12384 [15:25:11<10:52:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 0: 59%|█████▊ | 7268/12384 [15:25:19<10:52:04, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=6.12s]
Epoch 0: 59%|█████▊ | 7269/12384 [15:25:19<10:50:54, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.12s]
Epoch 0: 59%|█████▊ | 7269/12384 [15:25:26<10:50:54, 7.64s/it, loss=0.0026, acc=0.9961, iter_time=5.51s]
Epoch 0: 59%|█████▊ | 7270/12384 [15:25:26<10:50:38, 7.63s/it, loss=0.0026, acc=0.9961, iter_time=5.51s]
Epoch 0: 59%|█████▊ | 7270/12384 [15:25:34<10:50:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.80s]
Epoch 0: 59%|█████▊ | 7271/12384 [15:25:34<10:49:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.80s]
Epoch 0: 59%|█████▊ | 7271/12384 [15:25:41<10:49:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 59%|█████▊ | 7272/12384 [15:25:41<10:49:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 59%|█████▊ | 7272/12384 [15:25:49<10:49:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 59%|█████▊ | 7273/12384 [15:25:49<10:48:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 59%|█████▊ | 7273/12384 [15:25:57<10:48:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 0: 59%|█████▊ | 7274/12384 [15:25:57<10:48:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 0: 59%|█████▊ | 7274/12384 [15:26:04<10:48:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 0: 59%|█████▊ | 7275/12384 [15:26:04<10:48:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 0: 59%|█████▊ | 7275/12384 [15:26:12<10:48:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 59%|█████▉ | 7276/12384 [15:26:12<10:47:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 59%|█████▉ | 7276/12384 [15:26:19<10:47:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 0: 59%|█████▉ | 7277/12384 [15:26:19<10:48:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 0: 59%|█████▉ | 7277/12384 [15:26:27<10:48:08, 7.61s/it, loss=0.0002, acc=0.9997, iter_time=9.43s]
Epoch 0: 59%|█████▉ | 7278/12384 [15:26:27<10:47:55, 7.61s/it, loss=0.0002, acc=0.9997, iter_time=9.43s]
Epoch 0: 59%|█████▉ | 7278/12384 [15:26:35<10:47:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 0: 59%|█████▉ | 7279/12384 [15:26:35<10:47:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 0: 59%|█████▉ | 7279/12384 [15:26:42<10:47:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 59%|█████▉ | 7280/12384 [15:26:42<10:47:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 59%|█████▉ | 7280/12384 [15:26:50<10:47:41, 7.61s/it, loss=0.0030, acc=0.9978, iter_time=6.67s]
Epoch 0: 59%|█████▉ | 7281/12384 [15:26:50<10:47:24, 7.61s/it, loss=0.0030, acc=0.9978, iter_time=6.67s]
Epoch 0: 59%|█████▉ | 7281/12384 [15:26:58<10:47:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.69s]
Epoch 0: 59%|█████▉ | 7282/12384 [15:26:58<10:47:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.69s]
Epoch 0: 59%|█████▉ | 7282/12384 [15:27:05<10:47:25, 7.61s/it, loss=0.0008, acc=0.9960, iter_time=8.48s]
Epoch 0: 59%|█████▉ | 7283/12384 [15:27:05<10:47:33, 7.62s/it, loss=0.0008, acc=0.9960, iter_time=8.48s]
Epoch 0: 59%|█████▉ | 7283/12384 [15:27:13<10:47:33, 7.62s/it, loss=0.0001, acc=0.9994, iter_time=8.90s]
Epoch 0: 59%|█████▉ | 7284/12384 [15:27:13<10:47:12, 7.61s/it, loss=0.0001, acc=0.9994, iter_time=8.90s]
Epoch 0: 59%|█████▉ | 7284/12384 [15:27:20<10:47:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 0: 59%|█████▉ | 7285/12384 [15:27:20<10:47:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 0: 59%|█████▉ | 7285/12384 [15:27:28<10:47:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 59%|█████▉ | 7286/12384 [15:27:28<10:49:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 59%|█████▉ | 7286/12384 [15:27:36<10:49:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.43s]
Epoch 0: 59%|█████▉ | 7287/12384 [15:27:36<10:48:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.43s]
Epoch 0: 59%|█████▉ | 7287/12384 [15:27:43<10:48:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.87s]
Epoch 0: 59%|█████▉ | 7288/12384 [15:27:43<10:48:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.87s]
Epoch 0: 59%|█████▉ | 7288/12384 [15:27:51<10:48:19, 7.63s/it, loss=0.0006, acc=0.9971, iter_time=7.65s]
Epoch 0: 59%|█████▉ | 7289/12384 [15:27:51<10:47:11, 7.62s/it, loss=0.0006, acc=0.9971, iter_time=7.65s]
Epoch 0: 59%|█████▉ | 7289/12384 [15:27:59<10:47:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 59%|█████▉ | 7290/12384 [15:27:59<10:56:32, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 59%|█████▉ | 7290/12384 [15:28:07<10:56:32, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 0: 59%|█████▉ | 7291/12384 [15:28:07<10:53:26, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 0: 59%|█████▉ | 7291/12384 [15:28:14<10:53:26, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 0: 59%|█████▉ | 7292/12384 [15:28:14<10:51:12, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 0: 59%|█████▉ | 7292/12384 [15:28:22<10:51:12, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.66s]
Epoch 0: 59%|█████▉ | 7293/12384 [15:28:22<10:49:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.66s]
Epoch 0: 59%|█████▉ | 7293/12384 [15:28:29<10:49:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 0: 59%|█████▉ | 7294/12384 [15:28:29<10:48:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 0: 59%|█████▉ | 7294/12384 [15:28:37<10:48:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=3.59s]
Epoch 0: 59%|█████▉ | 7295/12384 [15:28:37<10:47:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.59s]
Epoch 0: 59%|█████▉ | 7295/12384 [15:28:45<10:47:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=12.04s]
Epoch 0: 59%|█████▉ | 7296/12384 [15:28:45<10:46:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=12.04s]
Epoch 0: 59%|█████▉ | 7296/12384 [15:28:52<10:46:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.94s]
Epoch 0: 59%|█████▉ | 7297/12384 [15:28:52<10:44:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.94s]
Epoch 0: 59%|█████▉ | 7297/12384 [15:29:00<10:44:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.83s]
Epoch 0: 59%|█████▉ | 7298/12384 [15:29:00<10:45:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.83s]
Epoch 0: 59%|█████▉ | 7298/12384 [15:29:07<10:45:12, 7.61s/it, loss=0.0003, acc=0.9971, iter_time=5.53s]
Epoch 0: 59%|█████▉ | 7299/12384 [15:29:07<10:47:01, 7.63s/it, loss=0.0003, acc=0.9971, iter_time=5.53s]
Epoch 0: 59%|█████▉ | 7299/12384 [15:29:15<10:47:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 0: 59%|█████▉ | 7300/12384 [15:29:15<10:45:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 0: 59%|█████▉ | 7300/12384 [15:29:23<10:45:55, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=7.62s]
Epoch 0: 59%|█████▉ | 7301/12384 [15:29:23<10:55:32, 7.74s/it, loss=0.0001, acc=0.9999, iter_time=7.62s]
Epoch 0: 59%|█████▉ | 7301/12384 [15:29:31<10:55:32, 7.74s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 59%|█████▉ | 7302/12384 [15:29:31<10:52:43, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 59%|█████▉ | 7302/12384 [15:29:38<10:52:43, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 59%|█████▉ | 7303/12384 [15:29:38<10:49:51, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 59%|█████▉ | 7303/12384 [15:29:46<10:49:51, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 0: 59%|█████▉ | 7304/12384 [15:29:46<10:48:16, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 0: 59%|█████▉ | 7304/12384 [15:29:54<10:48:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=3.69s]
Epoch 0: 59%|█████▉ | 7305/12384 [15:29:54<10:47:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=3.69s]
Epoch 0: 59%|█████▉ | 7305/12384 [15:30:01<10:47:17, 7.65s/it, loss=0.0013, acc=0.9962, iter_time=7.64s]
Epoch 0: 59%|█████▉ | 7306/12384 [15:30:01<10:48:12, 7.66s/it, loss=0.0013, acc=0.9962, iter_time=7.64s]
Epoch 0: 59%|█████▉ | 7306/12384 [15:30:09<10:48:12, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=11.19s]
Epoch 0: 59%|█████▉ | 7307/12384 [15:30:09<10:46:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.19s]
Epoch 0: 59%|█████▉ | 7307/12384 [15:30:16<10:46:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 0: 59%|█████▉ | 7308/12384 [15:30:16<10:45:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 0: 59%|█████▉ | 7308/12384 [15:30:24<10:45:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 0: 59%|█████▉ | 7309/12384 [15:30:24<10:44:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 0: 59%|█████▉ | 7309/12384 [15:30:32<10:44:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 0: 59%|█████▉ | 7310/12384 [15:30:32<10:43:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 0: 59%|█████▉ | 7310/12384 [15:30:39<10:43:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 0: 59%|█████▉ | 7311/12384 [15:30:39<10:44:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 0: 59%|█████▉ | 7311/12384 [15:30:47<10:44:06, 7.62s/it, loss=0.0001, acc=0.9996, iter_time=8.02s]
Epoch 0: 59%|█████▉ | 7312/12384 [15:30:47<10:43:48, 7.62s/it, loss=0.0001, acc=0.9996, iter_time=8.02s]
Epoch 0: 59%|█████▉ | 7312/12384 [15:30:54<10:43:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.92s]
Epoch 0: 59%|█████▉ | 7313/12384 [15:30:54<10:43:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.92s]
Epoch 0: 59%|█████▉ | 7313/12384 [15:31:02<10:43:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.88s]
Epoch 0: 59%|█████▉ | 7314/12384 [15:31:02<10:43:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.88s]
Epoch 0: 59%|█████▉ | 7314/12384 [15:31:10<10:43:29, 7.62s/it, loss=0.0007, acc=0.9971, iter_time=5.90s]
Epoch 0: 59%|█████▉ | 7315/12384 [15:31:10<10:42:52, 7.61s/it, loss=0.0007, acc=0.9971, iter_time=5.90s]
Epoch 0: 59%|█████▉ | 7315/12384 [15:31:17<10:42:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 0: 59%|█████▉ | 7316/12384 [15:31:17<10:43:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 0: 59%|█████▉ | 7316/12384 [15:31:25<10:43:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 0: 59%|█████▉ | 7317/12384 [15:31:25<10:51:28, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 0: 59%|█████▉ | 7317/12384 [15:31:33<10:51:28, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 0: 59%|█████▉ | 7318/12384 [15:31:33<10:48:06, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 0: 59%|█████▉ | 7318/12384 [15:31:40<10:48:06, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 59%|█████▉ | 7319/12384 [15:31:40<10:46:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 59%|█████▉ | 7319/12384 [15:31:48<10:46:08, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.58s]
Epoch 0: 59%|█████▉ | 7320/12384 [15:31:48<10:45:17, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.58s]
Epoch 0: 59%|█████▉ | 7320/12384 [15:31:56<10:45:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 59%|█████▉ | 7321/12384 [15:31:56<10:45:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 59%|█████▉ | 7321/12384 [15:32:03<10:45:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 0: 59%|█████▉ | 7322/12384 [15:32:03<10:46:20, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 0: 59%|█████▉ | 7322/12384 [15:32:11<10:46:20, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.24s]
Epoch 0: 59%|█████▉ | 7323/12384 [15:32:11<10:46:43, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.24s]
Epoch 0: 59%|█████▉ | 7323/12384 [15:32:19<10:46:43, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.69s]
Epoch 0: 59%|█████▉ | 7324/12384 [15:32:19<10:45:50, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.69s]
Epoch 0: 59%|█████▉ | 7324/12384 [15:32:26<10:45:50, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 0: 59%|█████▉ | 7325/12384 [15:32:26<10:44:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 0: 59%|█████▉ | 7325/12384 [15:32:34<10:44:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 0: 59%|█████▉ | 7326/12384 [15:32:34<10:43:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 0: 59%|█████▉ | 7326/12384 [15:32:42<10:43:18, 7.63s/it, loss=0.0003, acc=0.9984, iter_time=5.83s]
Epoch 0: 59%|█████▉ | 7327/12384 [15:32:42<10:43:00, 7.63s/it, loss=0.0003, acc=0.9984, iter_time=5.83s]
Epoch 0: 59%|█████▉ | 7327/12384 [15:32:49<10:43:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.79s]
Epoch 0: 59%|█████▉ | 7328/12384 [15:32:49<10:43:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.79s]
Epoch 0: 59%|█████▉ | 7328/12384 [15:32:57<10:43:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 0: 59%|█████▉ | 7329/12384 [15:32:57<10:42:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 0: 59%|█████▉ | 7329/12384 [15:33:04<10:42:21, 7.62s/it, loss=0.0005, acc=0.9993, iter_time=7.60s]
Epoch 0: 59%|█████▉ | 7330/12384 [15:33:04<10:41:32, 7.62s/it, loss=0.0005, acc=0.9993, iter_time=7.60s]
Epoch 0: 59%|█████▉ | 7330/12384 [15:33:12<10:41:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 0: 59%|█████▉ | 7331/12384 [15:33:12<10:41:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 0: 59%|█████▉ | 7331/12384 [15:33:20<10:41:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 0: 59%|█████▉ | 7332/12384 [15:33:20<10:41:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 0: 59%|█████▉ | 7332/12384 [15:33:27<10:41:28, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 59%|█████▉ | 7333/12384 [15:33:27<10:41:56, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 59%|█████▉ | 7333/12384 [15:33:35<10:41:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 0: 59%|█████▉ | 7334/12384 [15:33:35<10:41:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 0: 59%|█████▉ | 7334/12384 [15:33:43<10:41:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 0: 59%|█████▉ | 7335/12384 [15:33:43<10:41:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 0: 59%|█████▉ | 7335/12384 [15:33:50<10:41:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 59%|█████▉ | 7336/12384 [15:33:50<10:41:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 59%|█████▉ | 7336/12384 [15:33:58<10:41:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.97s]
Epoch 0: 59%|█████▉ | 7337/12384 [15:33:58<10:49:58, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=3.97s]
Epoch 0: 59%|█████▉ | 7337/12384 [15:34:06<10:49:58, 7.73s/it, loss=0.0001, acc=0.9995, iter_time=8.70s]
Epoch 0: 59%|█████▉ | 7338/12384 [15:34:06<10:53:47, 7.77s/it, loss=0.0001, acc=0.9995, iter_time=8.70s]
Epoch 0: 59%|█████▉ | 7338/12384 [15:34:14<10:53:47, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=10.72s]
Epoch 0: 59%|█████▉ | 7339/12384 [15:34:14<10:57:15, 7.82s/it, loss=0.0000, acc=1.0000, iter_time=10.72s]
Epoch 0: 59%|█████▉ | 7339/12384 [15:34:22<10:57:15, 7.82s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 0: 59%|█████▉ | 7340/12384 [15:34:22<11:04:28, 7.90s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 0: 59%|█████▉ | 7340/12384 [15:34:30<11:04:28, 7.90s/it, loss=0.0013, acc=0.9982, iter_time=7.93s]
Epoch 0: 59%|█████▉ | 7341/12384 [15:34:30<11:04:15, 7.90s/it, loss=0.0013, acc=0.9982, iter_time=7.93s]
Epoch 0: 59%|█████▉ | 7341/12384 [15:34:38<11:04:15, 7.90s/it, loss=0.0001, acc=1.0000, iter_time=7.93s]
Epoch 0: 59%|█████▉ | 7342/12384 [15:34:38<11:05:59, 7.93s/it, loss=0.0001, acc=1.0000, iter_time=7.93s]
Epoch 0: 59%|█████▉ | 7342/12384 [15:34:46<11:05:59, 7.93s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 0: 59%|█████▉ | 7343/12384 [15:34:46<11:17:44, 8.07s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 0: 59%|█████▉ | 7343/12384 [15:34:54<11:17:44, 8.07s/it, loss=0.0001, acc=0.9991, iter_time=8.75s]
Epoch 0: 59%|█████▉ | 7344/12384 [15:34:54<11:16:21, 8.05s/it, loss=0.0001, acc=0.9991, iter_time=8.75s]
Epoch 0: 59%|█████▉ | 7344/12384 [15:35:02<11:16:21, 8.05s/it, loss=0.0006, acc=0.9995, iter_time=6.55s]
Epoch 0: 59%|█████▉ | 7345/12384 [15:35:02<11:16:51, 8.06s/it, loss=0.0006, acc=0.9995, iter_time=6.55s]
Epoch 0: 59%|█████▉ | 7345/12384 [15:35:10<11:16:51, 8.06s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 0: 59%|█████▉ | 7346/12384 [15:35:10<11:15:13, 8.04s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 0: 59%|█████▉ | 7346/12384 [15:35:18<11:15:13, 8.04s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 59%|█████▉ | 7347/12384 [15:35:18<11:14:44, 8.04s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 59%|█████▉ | 7347/12384 [15:35:26<11:14:44, 8.04s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 59%|█████▉ | 7348/12384 [15:35:26<11:11:22, 8.00s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 59%|█████▉ | 7348/12384 [15:35:34<11:11:22, 8.00s/it, loss=0.0003, acc=0.9975, iter_time=8.00s]
Epoch 0: 59%|█████▉ | 7349/12384 [15:35:34<11:12:51, 8.02s/it, loss=0.0003, acc=0.9975, iter_time=8.00s]
Epoch 0: 59%|█████▉ | 7349/12384 [15:35:43<11:12:51, 8.02s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 0: 59%|█████▉ | 7350/12384 [15:35:43<11:15:02, 8.05s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 0: 59%|█████▉ | 7350/12384 [15:35:50<11:15:02, 8.05s/it, loss=0.0000, acc=1.0000, iter_time=5.71s]
Epoch 0: 59%|█████▉ | 7351/12384 [15:35:50<11:11:40, 8.01s/it, loss=0.0000, acc=1.0000, iter_time=5.71s]
Epoch 0: 59%|█████▉ | 7351/12384 [15:35:59<11:11:40, 8.01s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 0: 59%|█████▉ | 7352/12384 [15:35:59<11:15:41, 8.06s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 0: 59%|█████▉ | 7352/12384 [15:36:06<11:15:41, 8.06s/it, loss=0.0002, acc=0.9998, iter_time=5.66s]
Epoch 0: 59%|█████▉ | 7353/12384 [15:36:06<11:08:13, 7.97s/it, loss=0.0002, acc=0.9998, iter_time=5.66s]
Epoch 0: 59%|█████▉ | 7353/12384 [15:36:14<11:08:13, 7.97s/it, loss=0.0000, acc=1.0000, iter_time=9.84s]
Epoch 0: 59%|█████▉ | 7354/12384 [15:36:14<11:00:57, 7.88s/it, loss=0.0000, acc=1.0000, iter_time=9.84s]
Epoch 0: 59%|█████▉ | 7354/12384 [15:36:22<11:00:57, 7.88s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 59%|█████▉ | 7355/12384 [15:36:22<10:54:08, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 59%|█████▉ | 7355/12384 [15:36:29<10:54:08, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 0: 59%|█████▉ | 7356/12384 [15:36:29<10:48:36, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 0: 59%|█████▉ | 7356/12384 [15:36:37<10:48:36, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 0: 59%|█████▉ | 7357/12384 [15:36:37<10:45:13, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 0: 59%|█████▉ | 7357/12384 [15:36:45<10:45:13, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 59%|█████▉ | 7358/12384 [15:36:45<10:43:10, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 59%|█████▉ | 7358/12384 [15:36:52<10:43:10, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 59%|█████▉ | 7359/12384 [15:36:52<10:41:09, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 59%|█████▉ | 7359/12384 [15:37:00<10:41:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 59%|█████▉ | 7360/12384 [15:37:00<10:39:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 59%|█████▉ | 7360/12384 [15:37:07<10:39:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 59%|█████▉ | 7361/12384 [15:37:07<10:39:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 59%|█████▉ | 7361/12384 [15:37:15<10:39:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 59%|█████▉ | 7362/12384 [15:37:15<10:38:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 59%|█████▉ | 7362/12384 [15:37:23<10:38:05, 7.62s/it, loss=0.0020, acc=0.9941, iter_time=5.30s]
Epoch 0: 59%|█████▉ | 7363/12384 [15:37:23<10:37:44, 7.62s/it, loss=0.0020, acc=0.9941, iter_time=5.30s]
Epoch 0: 59%|█████▉ | 7363/12384 [15:37:30<10:37:44, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.85s]
Epoch 0: 59%|█████▉ | 7364/12384 [15:37:30<10:37:32, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.85s]
Epoch 0: 59%|█████▉ | 7364/12384 [15:37:38<10:37:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 0: 59%|█████▉ | 7365/12384 [15:37:38<10:37:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 0: 59%|█████▉ | 7365/12384 [15:37:45<10:37:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 59%|█████▉ | 7366/12384 [15:37:45<10:36:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 59%|█████▉ | 7366/12384 [15:37:53<10:36:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 59%|█████▉ | 7367/12384 [15:37:53<10:35:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 59%|█████▉ | 7367/12384 [15:38:01<10:35:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 0: 59%|█████▉ | 7368/12384 [15:38:01<10:35:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 0: 59%|█████▉ | 7368/12384 [15:38:08<10:35:38, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.36s]
Epoch 0: 60%|█████▉ | 7369/12384 [15:38:08<10:43:31, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.36s]
Epoch 0: 60%|█████▉ | 7369/12384 [15:38:16<10:43:31, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 0: 60%|█████▉ | 7370/12384 [15:38:16<10:41:52, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 0: 60%|█████▉ | 7370/12384 [15:38:24<10:41:52, 7.68s/it, loss=0.0039, acc=0.9970, iter_time=9.11s]
Epoch 0: 60%|█████▉ | 7371/12384 [15:38:24<10:39:56, 7.66s/it, loss=0.0039, acc=0.9970, iter_time=9.11s]
Epoch 0: 60%|█████▉ | 7371/12384 [15:38:31<10:39:56, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 60%|█████▉ | 7372/12384 [15:38:31<10:40:57, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 60%|█████▉ | 7372/12384 [15:38:39<10:40:57, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 60%|█████▉ | 7373/12384 [15:38:39<10:40:36, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 60%|█████▉ | 7373/12384 [15:38:47<10:40:36, 7.67s/it, loss=0.0002, acc=0.9997, iter_time=7.66s]
Epoch 0: 60%|█████▉ | 7374/12384 [15:38:47<10:39:14, 7.66s/it, loss=0.0002, acc=0.9997, iter_time=7.66s]
Epoch 0: 60%|█████▉ | 7374/12384 [15:38:54<10:39:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 0: 60%|█████▉ | 7375/12384 [15:38:54<10:38:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 0: 60%|█████▉ | 7375/12384 [15:39:02<10:38:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.53s]
Epoch 0: 60%|█████▉ | 7376/12384 [15:39:02<10:37:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.53s]
Epoch 0: 60%|█████▉ | 7376/12384 [15:39:10<10:37:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 0: 60%|█████▉ | 7377/12384 [15:39:10<10:37:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 0: 60%|█████▉ | 7377/12384 [15:39:18<10:37:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 0: 60%|█████▉ | 7378/12384 [15:39:18<11:00:47, 7.92s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 0: 60%|█████▉ | 7378/12384 [15:39:27<11:00:47, 7.92s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 0: 60%|█████▉ | 7379/12384 [15:39:27<11:10:53, 8.04s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 0: 60%|█████▉ | 7379/12384 [15:39:35<11:10:53, 8.04s/it, loss=0.0001, acc=1.0000, iter_time=8.42s]
Epoch 0: 60%|█████▉ | 7380/12384 [15:39:35<11:22:45, 8.19s/it, loss=0.0001, acc=1.0000, iter_time=8.42s]
Epoch 0: 60%|█████▉ | 7380/12384 [15:39:43<11:22:45, 8.19s/it, loss=0.0000, acc=1.0000, iter_time=8.37s]
Epoch 0: 60%|█████▉ | 7381/12384 [15:39:43<11:25:35, 8.22s/it, loss=0.0000, acc=1.0000, iter_time=8.37s]
Epoch 0: 60%|█████▉ | 7381/12384 [15:39:51<11:25:35, 8.22s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 60%|█████▉ | 7382/12384 [15:39:51<11:10:29, 8.04s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 60%|█████▉ | 7382/12384 [15:39:59<11:10:29, 8.04s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 0: 60%|█████▉ | 7383/12384 [15:39:59<10:59:19, 7.91s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 0: 60%|█████▉ | 7383/12384 [15:40:06<10:59:19, 7.91s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 0: 60%|█████▉ | 7384/12384 [15:40:06<10:51:13, 7.81s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 0: 60%|█████▉ | 7384/12384 [15:40:14<10:51:13, 7.81s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 60%|█████▉ | 7385/12384 [15:40:14<10:45:38, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 60%|█████▉ | 7385/12384 [15:40:21<10:45:38, 7.75s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 60%|█████▉ | 7386/12384 [15:40:21<10:42:29, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 60%|█████▉ | 7386/12384 [15:40:29<10:42:29, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 60%|█████▉ | 7387/12384 [15:40:29<10:39:59, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 60%|█████▉ | 7387/12384 [15:40:37<10:39:59, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 60%|█████▉ | 7388/12384 [15:40:37<10:39:24, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 60%|█████▉ | 7388/12384 [15:40:44<10:39:24, 7.68s/it, loss=0.0001, acc=0.9998, iter_time=6.71s]
Epoch 0: 60%|█████▉ | 7389/12384 [15:40:44<10:37:23, 7.66s/it, loss=0.0001, acc=0.9998, iter_time=6.71s]
Epoch 0: 60%|█████▉ | 7389/12384 [15:40:52<10:37:23, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 0: 60%|█████▉ | 7390/12384 [15:40:52<10:36:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 0: 60%|█████▉ | 7390/12384 [15:41:00<10:36:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 60%|█████▉ | 7391/12384 [15:41:00<10:37:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 60%|█████▉ | 7391/12384 [15:41:07<10:37:03, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 0: 60%|█████▉ | 7392/12384 [15:41:07<10:35:50, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 0: 60%|█████▉ | 7392/12384 [15:41:15<10:35:50, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=5.78s]
Epoch 0: 60%|█████▉ | 7393/12384 [15:41:15<10:34:25, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.78s]
Epoch 0: 60%|█████▉ | 7393/12384 [15:41:22<10:34:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 0: 60%|█████▉ | 7394/12384 [15:41:22<10:33:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 0: 60%|█████▉ | 7394/12384 [15:41:30<10:33:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 0: 60%|█████▉ | 7395/12384 [15:41:30<10:42:25, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 0: 60%|█████▉ | 7395/12384 [15:41:38<10:42:25, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.95s]
Epoch 0: 60%|█████▉ | 7396/12384 [15:41:38<10:43:14, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.95s]
Epoch 0: 60%|█████▉ | 7396/12384 [15:41:46<10:43:14, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 0: 60%|█████▉ | 7397/12384 [15:41:46<10:40:29, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 0: 60%|█████▉ | 7397/12384 [15:41:53<10:40:29, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 0: 60%|█████▉ | 7398/12384 [15:41:53<10:40:50, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 0: 60%|█████▉ | 7398/12384 [15:42:01<10:40:50, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.66s]
Epoch 0: 60%|█████▉ | 7399/12384 [15:42:01<10:41:28, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.66s]
Epoch 0: 60%|█████▉ | 7399/12384 [15:42:09<10:41:28, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 0: 60%|█████▉ | 7400/12384 [15:42:09<10:39:18, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 0: 60%|█████▉ | 7400/12384 [15:42:16<10:39:18, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.00s]
Epoch 0: 60%|█████▉ | 7401/12384 [15:42:16<10:36:49, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.00s]
Epoch 0: 60%|█████▉ | 7401/12384 [15:42:24<10:36:49, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 0: 60%|█████▉ | 7402/12384 [15:42:24<10:35:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 0: 60%|█████▉ | 7402/12384 [15:42:32<10:35:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 0: 60%|█████▉ | 7403/12384 [15:42:32<10:34:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 0: 60%|█████▉ | 7403/12384 [15:42:39<10:34:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 0: 60%|█████▉ | 7404/12384 [15:42:39<10:33:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 0: 60%|█████▉ | 7404/12384 [15:42:47<10:33:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 0: 60%|█████▉ | 7405/12384 [15:42:47<10:39:48, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 0: 60%|█████▉ | 7405/12384 [15:42:55<10:39:48, 7.71s/it, loss=0.0004, acc=0.9981, iter_time=7.59s]
Epoch 0: 60%|█████▉ | 7406/12384 [15:42:55<10:37:20, 7.68s/it, loss=0.0004, acc=0.9981, iter_time=7.59s]
Epoch 0: 60%|█████▉ | 7406/12384 [15:43:02<10:37:20, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.31s]
Epoch 0: 60%|█████▉ | 7407/12384 [15:43:02<10:35:43, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.31s]
Epoch 0: 60%|█████▉ | 7407/12384 [15:43:10<10:35:43, 7.66s/it, loss=0.0001, acc=0.9998, iter_time=10.98s]
Epoch 0: 60%|█████▉ | 7408/12384 [15:43:10<10:37:12, 7.68s/it, loss=0.0001, acc=0.9998, iter_time=10.98s]
Epoch 0: 60%|█████▉ | 7408/12384 [15:43:18<10:37:12, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.42s]
Epoch 0: 60%|█████▉ | 7409/12384 [15:43:18<10:37:46, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.42s]
Epoch 0: 60%|█████▉ | 7409/12384 [15:43:25<10:37:46, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.84s]
Epoch 0: 60%|█████▉ | 7410/12384 [15:43:25<10:35:48, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.84s]
Epoch 0: 60%|█████▉ | 7410/12384 [15:43:33<10:35:48, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 0: 60%|█████▉ | 7411/12384 [15:43:33<10:34:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 0: 60%|█████▉ | 7411/12384 [15:43:41<10:34:00, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 60%|█████▉ | 7412/12384 [15:43:41<10:33:21, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 60%|█████▉ | 7412/12384 [15:43:48<10:33:21, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 60%|█████▉ | 7413/12384 [15:43:48<10:33:19, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 60%|█████▉ | 7413/12384 [15:43:56<10:33:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 60%|█████▉ | 7414/12384 [15:43:56<10:32:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 60%|█████▉ | 7414/12384 [15:44:04<10:32:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 60%|█████▉ | 7415/12384 [15:44:04<10:33:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 60%|█████▉ | 7415/12384 [15:44:11<10:33:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 60%|█████▉ | 7416/12384 [15:44:11<10:32:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 60%|█████▉ | 7416/12384 [15:44:19<10:32:49, 7.64s/it, loss=0.0023, acc=0.9947, iter_time=7.72s]
Epoch 0: 60%|█████▉ | 7417/12384 [15:44:19<10:33:28, 7.65s/it, loss=0.0023, acc=0.9947, iter_time=7.72s]
Epoch 0: 60%|█████▉ | 7417/12384 [15:44:27<10:33:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 0: 60%|█████▉ | 7418/12384 [15:44:27<10:32:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 0: 60%|█████▉ | 7418/12384 [15:44:34<10:32:22, 7.64s/it, loss=0.0001, acc=0.9990, iter_time=10.62s]
Epoch 0: 60%|█████▉ | 7419/12384 [15:44:34<10:31:15, 7.63s/it, loss=0.0001, acc=0.9990, iter_time=10.62s]
Epoch 0: 60%|█████▉ | 7419/12384 [15:44:42<10:31:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 60%|█████▉ | 7420/12384 [15:44:42<10:30:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 60%|█████▉ | 7420/12384 [15:44:50<10:30:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 60%|█████▉ | 7421/12384 [15:44:50<10:38:48, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 60%|█████▉ | 7421/12384 [15:44:57<10:38:48, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 60%|█████▉ | 7422/12384 [15:44:57<10:37:40, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 60%|█████▉ | 7422/12384 [15:45:05<10:37:40, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 60%|█████▉ | 7423/12384 [15:45:05<10:35:43, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 60%|█████▉ | 7423/12384 [15:45:13<10:35:43, 7.69s/it, loss=0.0002, acc=0.9998, iter_time=7.62s]
Epoch 0: 60%|█████▉ | 7424/12384 [15:45:13<10:35:01, 7.68s/it, loss=0.0002, acc=0.9998, iter_time=7.62s]
Epoch 0: 60%|█████▉ | 7424/12384 [15:45:20<10:35:01, 7.68s/it, loss=0.0003, acc=0.9984, iter_time=7.66s]
Epoch 0: 60%|█████▉ | 7425/12384 [15:45:20<10:32:57, 7.66s/it, loss=0.0003, acc=0.9984, iter_time=7.66s]
Epoch 0: 60%|█████▉ | 7425/12384 [15:45:28<10:32:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.42s]
Epoch 0: 60%|█████▉ | 7426/12384 [15:45:28<10:34:55, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.42s]
Epoch 0: 60%|█████▉ | 7426/12384 [15:45:36<10:34:55, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 60%|█████▉ | 7427/12384 [15:45:36<10:32:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 60%|█████▉ | 7427/12384 [15:45:43<10:32:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 60%|█████▉ | 7428/12384 [15:45:43<10:31:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 60%|█████▉ | 7428/12384 [15:45:51<10:31:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 60%|█████▉ | 7429/12384 [15:45:51<10:30:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 60%|█████▉ | 7429/12384 [15:45:59<10:30:06, 7.63s/it, loss=0.0004, acc=0.9989, iter_time=7.60s]
Epoch 0: 60%|█████▉ | 7430/12384 [15:45:59<10:29:51, 7.63s/it, loss=0.0004, acc=0.9989, iter_time=7.60s]
Epoch 0: 60%|█████▉ | 7430/12384 [15:46:06<10:29:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 0: 60%|██████ | 7431/12384 [15:46:06<10:31:56, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 0: 60%|██████ | 7431/12384 [15:46:14<10:31:56, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 60%|██████ | 7432/12384 [15:46:14<10:31:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 60%|██████ | 7432/12384 [15:46:22<10:31:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 60%|██████ | 7433/12384 [15:46:22<10:31:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 60%|██████ | 7433/12384 [15:46:29<10:31:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 60%|██████ | 7434/12384 [15:46:29<10:30:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 60%|██████ | 7434/12384 [15:46:37<10:30:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 60%|██████ | 7435/12384 [15:46:37<10:29:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 60%|██████ | 7435/12384 [15:46:44<10:29:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.23s]
Epoch 0: 60%|██████ | 7436/12384 [15:46:44<10:29:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.23s]
Epoch 0: 60%|██████ | 7436/12384 [15:46:52<10:29:04, 7.63s/it, loss=0.0025, acc=0.9974, iter_time=8.45s]
Epoch 0: 60%|██████ | 7437/12384 [15:46:52<10:28:58, 7.63s/it, loss=0.0025, acc=0.9974, iter_time=8.45s]
Epoch 0: 60%|██████ | 7437/12384 [15:47:00<10:28:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 0: 60%|██████ | 7438/12384 [15:47:00<10:28:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 0: 60%|██████ | 7438/12384 [15:47:07<10:28:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 0: 60%|██████ | 7439/12384 [15:47:07<10:28:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 0: 60%|██████ | 7439/12384 [15:47:15<10:28:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.88s]
Epoch 0: 60%|██████ | 7440/12384 [15:47:15<10:28:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.88s]
Epoch 0: 60%|██████ | 7440/12384 [15:47:22<10:28:16, 7.62s/it, loss=0.0002, acc=0.9984, iter_time=7.23s]
Epoch 0: 60%|██████ | 7441/12384 [15:47:22<10:27:29, 7.62s/it, loss=0.0002, acc=0.9984, iter_time=7.23s]
Epoch 0: 60%|██████ | 7441/12384 [15:47:30<10:27:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 60%|██████ | 7442/12384 [15:47:30<10:26:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 60%|██████ | 7442/12384 [15:47:38<10:26:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 60%|██████ | 7443/12384 [15:47:38<10:27:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 60%|██████ | 7443/12384 [15:47:45<10:27:15, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 60%|██████ | 7444/12384 [15:47:45<10:27:07, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 60%|██████ | 7444/12384 [15:47:53<10:27:07, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=7.59s]
Epoch 0: 60%|██████ | 7445/12384 [15:47:53<10:26:47, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=7.59s]
Epoch 0: 60%|██████ | 7445/12384 [15:48:01<10:26:47, 7.61s/it, loss=0.0016, acc=0.9966, iter_time=4.81s]
Epoch 0: 60%|██████ | 7446/12384 [15:48:01<10:26:21, 7.61s/it, loss=0.0016, acc=0.9966, iter_time=4.81s]
Epoch 0: 60%|██████ | 7446/12384 [15:48:08<10:26:21, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.80s]
Epoch 0: 60%|██████ | 7447/12384 [15:48:08<10:28:06, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.80s]
Epoch 0: 60%|██████ | 7447/12384 [15:48:16<10:28:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.58s]
Epoch 0: 60%|██████ | 7448/12384 [15:48:16<10:35:27, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.58s]
Epoch 0: 60%|██████ | 7448/12384 [15:48:24<10:35:27, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.54s]
Epoch 0: 60%|██████ | 7449/12384 [15:48:24<10:40:38, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=6.54s]
Epoch 0: 60%|██████ | 7449/12384 [15:48:32<10:40:38, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=9.83s]
Epoch 0: 60%|██████ | 7450/12384 [15:48:32<10:45:02, 7.84s/it, loss=0.0000, acc=1.0000, iter_time=9.83s]
Epoch 0: 60%|██████ | 7450/12384 [15:48:40<10:45:02, 7.84s/it, loss=0.0000, acc=1.0000, iter_time=3.84s]
Epoch 0: 60%|██████ | 7451/12384 [15:48:40<10:48:22, 7.89s/it, loss=0.0000, acc=1.0000, iter_time=3.84s]
Epoch 0: 60%|██████ | 7451/12384 [15:48:48<10:48:22, 7.89s/it, loss=0.0002, acc=1.0000, iter_time=10.55s]
Epoch 0: 60%|██████ | 7452/12384 [15:48:48<10:48:35, 7.89s/it, loss=0.0002, acc=1.0000, iter_time=10.55s]
Epoch 0: 60%|██████ | 7452/12384 [15:48:56<10:48:35, 7.89s/it, loss=0.0000, acc=1.0000, iter_time=9.01s]
Epoch 0: 60%|██████ | 7453/12384 [15:48:56<10:50:56, 7.92s/it, loss=0.0000, acc=1.0000, iter_time=9.01s]
Epoch 0: 60%|██████ | 7453/12384 [15:49:04<10:50:56, 7.92s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 0: 60%|██████ | 7454/12384 [15:49:04<10:53:17, 7.95s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 0: 60%|██████ | 7454/12384 [15:49:12<10:53:17, 7.95s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 60%|██████ | 7455/12384 [15:49:12<10:52:47, 7.95s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 60%|██████ | 7455/12384 [15:49:20<10:52:47, 7.95s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 0: 60%|██████ | 7456/12384 [15:49:20<10:50:08, 7.92s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 0: 60%|██████ | 7456/12384 [15:49:28<10:50:08, 7.92s/it, loss=0.0002, acc=0.9993, iter_time=7.97s]
Epoch 0: 60%|██████ | 7457/12384 [15:49:28<10:52:04, 7.94s/it, loss=0.0002, acc=0.9993, iter_time=7.97s]
Epoch 0: 60%|██████ | 7457/12384 [15:49:36<10:52:04, 7.94s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 0: 60%|██████ | 7458/12384 [15:49:36<10:58:24, 8.02s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 0: 60%|██████ | 7458/12384 [15:49:44<10:58:24, 8.02s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 60%|██████ | 7459/12384 [15:49:44<10:48:31, 7.90s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 60%|██████ | 7459/12384 [15:49:51<10:48:31, 7.90s/it, loss=0.0000, acc=1.0000, iter_time=4.22s]
Epoch 0: 60%|██████ | 7460/12384 [15:49:51<10:41:03, 7.81s/it, loss=0.0000, acc=1.0000, iter_time=4.22s]
Epoch 0: 60%|██████ | 7460/12384 [15:49:59<10:41:03, 7.81s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 0: 60%|██████ | 7461/12384 [15:49:59<10:36:30, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 0: 60%|██████ | 7461/12384 [15:50:06<10:36:30, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 0: 60%|██████ | 7462/12384 [15:50:06<10:34:33, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 0: 60%|██████ | 7462/12384 [15:50:14<10:34:33, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 0: 60%|██████ | 7463/12384 [15:50:14<10:31:39, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 0: 60%|██████ | 7463/12384 [15:50:22<10:31:39, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 0: 60%|██████ | 7464/12384 [15:50:22<10:29:41, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 0: 60%|██████ | 7464/12384 [15:50:29<10:29:41, 7.68s/it, loss=0.0004, acc=0.9971, iter_time=5.60s]
Epoch 0: 60%|██████ | 7465/12384 [15:50:29<10:28:02, 7.66s/it, loss=0.0004, acc=0.9971, iter_time=5.60s]
Epoch 0: 60%|██████ | 7465/12384 [15:50:37<10:28:02, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 0: 60%|██████ | 7466/12384 [15:50:37<10:26:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 0: 60%|██████ | 7466/12384 [15:50:45<10:26:22, 7.64s/it, loss=0.0002, acc=0.9997, iter_time=7.30s]
Epoch 0: 60%|██████ | 7467/12384 [15:50:45<10:25:39, 7.63s/it, loss=0.0002, acc=0.9997, iter_time=7.30s]
Epoch 0: 60%|██████ | 7467/12384 [15:50:52<10:25:39, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.94s]
Epoch 0: 60%|██████ | 7468/12384 [15:50:52<10:25:10, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.94s]
Epoch 0: 60%|██████ | 7468/12384 [15:51:00<10:25:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 60%|██████ | 7469/12384 [15:51:00<10:24:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 60%|██████ | 7469/12384 [15:51:07<10:24:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 60%|██████ | 7470/12384 [15:51:07<10:24:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 60%|██████ | 7470/12384 [15:51:15<10:24:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 60%|██████ | 7471/12384 [15:51:15<10:23:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 60%|██████ | 7471/12384 [15:51:23<10:23:03, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.97s]
Epoch 0: 60%|██████ | 7472/12384 [15:51:23<10:22:56, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.97s]
Epoch 0: 60%|██████ | 7472/12384 [15:51:30<10:22:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 60%|██████ | 7473/12384 [15:51:30<10:23:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 60%|██████ | 7473/12384 [15:51:38<10:23:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 60%|██████ | 7474/12384 [15:51:38<10:30:27, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 60%|██████ | 7474/12384 [15:51:46<10:30:27, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.87s]
Epoch 0: 60%|██████ | 7475/12384 [15:51:46<10:28:02, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.87s]
Epoch 0: 60%|██████ | 7475/12384 [15:51:53<10:28:02, 7.68s/it, loss=0.0002, acc=0.9998, iter_time=4.22s]
Epoch 0: 60%|██████ | 7476/12384 [15:51:53<10:26:26, 7.66s/it, loss=0.0002, acc=0.9998, iter_time=4.22s]
Epoch 0: 60%|██████ | 7476/12384 [15:52:01<10:26:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=11.00s]
Epoch 0: 60%|██████ | 7477/12384 [15:52:01<10:24:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.00s]
Epoch 0: 60%|██████ | 7477/12384 [15:52:09<10:24:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 60%|██████ | 7478/12384 [15:52:09<10:24:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 60%|██████ | 7478/12384 [15:52:16<10:24:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 60%|██████ | 7479/12384 [15:52:16<10:26:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 60%|██████ | 7479/12384 [15:52:24<10:26:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 60%|██████ | 7480/12384 [15:52:24<10:25:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 60%|██████ | 7480/12384 [15:52:32<10:25:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 60%|██████ | 7481/12384 [15:52:32<10:25:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 60%|██████ | 7481/12384 [15:52:39<10:25:18, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 60%|██████ | 7482/12384 [15:52:39<10:23:55, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 60%|██████ | 7482/12384 [15:52:47<10:23:55, 7.64s/it, loss=0.0003, acc=0.9999, iter_time=6.96s]
Epoch 0: 60%|██████ | 7483/12384 [15:52:47<10:22:39, 7.62s/it, loss=0.0003, acc=0.9999, iter_time=6.96s]
Epoch 0: 60%|██████ | 7483/12384 [15:52:54<10:22:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.96s]
Epoch 0: 60%|██████ | 7484/12384 [15:52:54<10:21:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.96s]
Epoch 0: 60%|██████ | 7484/12384 [15:53:02<10:21:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 0: 60%|██████ | 7485/12384 [15:53:02<10:28:57, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 0: 60%|██████ | 7485/12384 [15:53:10<10:28:57, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 60%|██████ | 7486/12384 [15:53:10<10:27:49, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 60%|██████ | 7486/12384 [15:53:18<10:27:49, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.53s]
Epoch 0: 60%|██████ | 7487/12384 [15:53:18<10:25:38, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.53s]
Epoch 0: 60%|██████ | 7487/12384 [15:53:25<10:25:38, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 0: 60%|██████ | 7488/12384 [15:53:25<10:23:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 0: 60%|██████ | 7488/12384 [15:53:33<10:23:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 0: 60%|██████ | 7489/12384 [15:53:33<10:24:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 0: 60%|██████ | 7489/12384 [15:53:40<10:24:22, 7.65s/it, loss=0.0063, acc=0.9881, iter_time=7.59s]
Epoch 0: 60%|██████ | 7490/12384 [15:53:40<10:22:45, 7.63s/it, loss=0.0063, acc=0.9881, iter_time=7.59s]
Epoch 0: 60%|██████ | 7490/12384 [15:53:48<10:22:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 0: 60%|██████ | 7491/12384 [15:53:48<10:21:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 0: 60%|██████ | 7491/12384 [15:53:56<10:21:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 0: 60%|██████ | 7492/12384 [15:53:56<10:21:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 0: 60%|██████ | 7492/12384 [15:54:03<10:21:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 61%|██████ | 7493/12384 [15:54:03<10:20:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 61%|██████ | 7493/12384 [15:54:11<10:20:39, 7.61s/it, loss=0.0004, acc=0.9980, iter_time=7.60s]
Epoch 0: 61%|██████ | 7494/12384 [15:54:11<10:20:28, 7.61s/it, loss=0.0004, acc=0.9980, iter_time=7.60s]
Epoch 0: 61%|██████ | 7494/12384 [15:54:18<10:20:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.49s]
Epoch 0: 61%|██████ | 7495/12384 [15:54:18<10:20:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.49s]
Epoch 0: 61%|██████ | 7495/12384 [15:54:26<10:20:35, 7.62s/it, loss=0.0004, acc=0.9983, iter_time=10.15s]
Epoch 0: 61%|██████ | 7496/12384 [15:54:26<10:23:13, 7.65s/it, loss=0.0004, acc=0.9983, iter_time=10.15s]
Epoch 0: 61%|██████ | 7496/12384 [15:54:34<10:23:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 0: 61%|██████ | 7497/12384 [15:54:34<10:22:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 0: 61%|██████ | 7497/12384 [15:54:41<10:22:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 61%|██████ | 7498/12384 [15:54:41<10:21:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 61%|██████ | 7498/12384 [15:54:49<10:21:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 61%|██████ | 7499/12384 [15:54:49<10:20:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 61%|██████ | 7499/12384 [15:54:57<10:20:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 61%|██████ | 7500/12384 [15:54:57<10:24:47, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 61%|██████ | 7500/12384 [15:55:05<10:24:47, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.44s]
Epoch 0: 61%|██████ | 7501/12384 [15:55:05<10:31:24, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.44s]
Epoch 0: 61%|██████ | 7501/12384 [15:55:12<10:31:24, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 61%|██████ | 7502/12384 [15:55:12<10:27:36, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 61%|██████ | 7502/12384 [15:55:20<10:27:36, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 0: 61%|██████ | 7503/12384 [15:55:20<10:25:33, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 0: 61%|██████ | 7503/12384 [15:55:28<10:25:33, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.60s]
Epoch 0: 61%|██████ | 7504/12384 [15:55:28<10:23:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.60s]
Epoch 0: 61%|██████ | 7504/12384 [15:55:35<10:23:22, 7.66s/it, loss=0.0058, acc=0.9980, iter_time=7.21s]
Epoch 0: 61%|██████ | 7505/12384 [15:55:35<10:21:32, 7.64s/it, loss=0.0058, acc=0.9980, iter_time=7.21s]
Epoch 0: 61%|██████ | 7505/12384 [15:55:43<10:21:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 61%|██████ | 7506/12384 [15:55:43<10:22:51, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 61%|██████ | 7506/12384 [15:55:51<10:22:51, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 61%|██████ | 7507/12384 [15:55:51<10:21:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 61%|██████ | 7507/12384 [15:55:58<10:21:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 61%|██████ | 7508/12384 [15:55:58<10:20:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 61%|██████ | 7508/12384 [15:56:06<10:20:27, 7.63s/it, loss=0.0006, acc=0.9982, iter_time=7.59s]
Epoch 0: 61%|██████ | 7509/12384 [15:56:06<10:19:16, 7.62s/it, loss=0.0006, acc=0.9982, iter_time=7.59s]
Epoch 0: 61%|██████ | 7509/12384 [15:56:13<10:19:16, 7.62s/it, loss=0.0001, acc=0.9996, iter_time=4.47s]
Epoch 0: 61%|██████ | 7510/12384 [15:56:13<10:19:07, 7.62s/it, loss=0.0001, acc=0.9996, iter_time=4.47s]
Epoch 0: 61%|██████ | 7510/12384 [15:56:21<10:19:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.06s]
Epoch 0: 61%|██████ | 7511/12384 [15:56:21<10:25:54, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=11.06s]
Epoch 0: 61%|██████ | 7511/12384 [15:56:29<10:25:54, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 61%|██████ | 7512/12384 [15:56:29<10:23:24, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 61%|██████ | 7512/12384 [15:56:36<10:23:24, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 61%|██████ | 7513/12384 [15:56:36<10:21:47, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 61%|██████ | 7513/12384 [15:56:44<10:21:47, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 61%|██████ | 7514/12384 [15:56:44<10:20:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 61%|██████ | 7514/12384 [15:56:52<10:20:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 0: 61%|██████ | 7515/12384 [15:56:52<10:18:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 0: 61%|██████ | 7515/12384 [15:56:59<10:18:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.34s]
Epoch 0: 61%|██████ | 7516/12384 [15:56:59<10:17:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.34s]
Epoch 0: 61%|██████ | 7516/12384 [15:57:07<10:17:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.19s]
Epoch 0: 61%|██████ | 7517/12384 [15:57:07<10:20:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.19s]
Epoch 0: 61%|██████ | 7517/12384 [15:57:15<10:20:04, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 61%|██████ | 7518/12384 [15:57:15<10:18:31, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 61%|██████ | 7518/12384 [15:57:22<10:18:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 0: 61%|██████ | 7519/12384 [15:57:22<10:17:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 0: 61%|██████ | 7519/12384 [15:57:30<10:17:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.78s]
Epoch 0: 61%|██████ | 7520/12384 [15:57:30<10:18:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.78s]
Epoch 0: 61%|██████ | 7520/12384 [15:57:37<10:18:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 61%|██████ | 7521/12384 [15:57:37<10:17:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 61%|██████ | 7521/12384 [15:57:45<10:17:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 61%|██████ | 7522/12384 [15:57:45<10:17:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 61%|██████ | 7522/12384 [15:57:53<10:17:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 61%|██████ | 7523/12384 [15:57:53<10:17:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 61%|██████ | 7523/12384 [15:58:00<10:17:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 61%|██████ | 7524/12384 [15:58:00<10:17:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 61%|██████ | 7524/12384 [15:58:08<10:17:11, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.56s]
Epoch 0: 61%|██████ | 7525/12384 [15:58:08<10:17:11, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.56s]
Epoch 0: 61%|██████ | 7525/12384 [15:58:16<10:17:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 0: 61%|██████ | 7526/12384 [15:58:16<10:17:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 0: 61%|██████ | 7526/12384 [15:58:23<10:17:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 61%|██████ | 7527/12384 [15:58:23<10:24:34, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 61%|██████ | 7527/12384 [15:58:31<10:24:34, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 0: 61%|██████ | 7528/12384 [15:58:31<10:22:09, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 0: 61%|██████ | 7528/12384 [15:58:39<10:22:09, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.42s]
Epoch 0: 61%|██████ | 7529/12384 [15:58:39<10:20:06, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.42s]
Epoch 0: 61%|██████ | 7529/12384 [15:58:46<10:20:06, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 0: 61%|██████ | 7530/12384 [15:58:46<10:19:34, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 0: 61%|██████ | 7530/12384 [15:58:54<10:19:34, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 61%|██████ | 7531/12384 [15:58:54<10:18:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 61%|██████ | 7531/12384 [15:59:02<10:18:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 0: 61%|██████ | 7532/12384 [15:59:02<10:19:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 0: 61%|██████ | 7532/12384 [15:59:09<10:19:03, 7.66s/it, loss=0.0005, acc=0.9981, iter_time=8.01s]
Epoch 0: 61%|██████ | 7533/12384 [15:59:09<10:18:00, 7.64s/it, loss=0.0005, acc=0.9981, iter_time=8.01s]
Epoch 0: 61%|██████ | 7533/12384 [15:59:17<10:18:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 61%|██████ | 7534/12384 [15:59:17<10:17:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 61%|██████ | 7534/12384 [15:59:25<10:17:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 0: 61%|██████ | 7535/12384 [15:59:25<10:23:46, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 0: 61%|██████ | 7535/12384 [15:59:32<10:23:46, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=8.00s]
Epoch 0: 61%|██████ | 7536/12384 [15:59:32<10:21:35, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=8.00s]
Epoch 0: 61%|██████ | 7536/12384 [15:59:40<10:21:35, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.62s]
Epoch 0: 61%|██████ | 7537/12384 [15:59:40<10:19:20, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.62s]
Epoch 0: 61%|██████ | 7537/12384 [15:59:48<10:19:20, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 0: 61%|██████ | 7538/12384 [15:59:48<10:17:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 0: 61%|██████ | 7538/12384 [15:59:55<10:17:54, 7.65s/it, loss=0.0007, acc=0.9993, iter_time=7.60s]
Epoch 0: 61%|██████ | 7539/12384 [15:59:55<10:16:55, 7.64s/it, loss=0.0007, acc=0.9993, iter_time=7.60s]
Epoch 0: 61%|██████ | 7539/12384 [16:00:03<10:16:55, 7.64s/it, loss=0.0002, acc=0.9994, iter_time=7.61s]
Epoch 0: 61%|██████ | 7540/12384 [16:00:03<10:16:21, 7.63s/it, loss=0.0002, acc=0.9994, iter_time=7.61s]
Epoch 0: 61%|██████ | 7540/12384 [16:00:10<10:16:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 61%|██████ | 7541/12384 [16:00:10<10:15:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 61%|██████ | 7541/12384 [16:00:18<10:15:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 0: 61%|██████ | 7542/12384 [16:00:18<10:15:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 0: 61%|██████ | 7542/12384 [16:00:26<10:15:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 0: 61%|██████ | 7543/12384 [16:00:26<10:15:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 0: 61%|██████ | 7543/12384 [16:00:33<10:15:21, 7.63s/it, loss=0.0016, acc=0.9969, iter_time=8.03s]
Epoch 0: 61%|██████ | 7544/12384 [16:00:33<10:15:36, 7.63s/it, loss=0.0016, acc=0.9969, iter_time=8.03s]
Epoch 0: 61%|██████ | 7544/12384 [16:00:41<10:15:36, 7.63s/it, loss=0.0002, acc=0.9993, iter_time=7.25s]
Epoch 0: 61%|██████ | 7545/12384 [16:00:41<10:15:03, 7.63s/it, loss=0.0002, acc=0.9993, iter_time=7.25s]
Epoch 0: 61%|██████ | 7545/12384 [16:00:49<10:15:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 61%|██████ | 7546/12384 [16:00:49<10:14:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 61%|██████ | 7546/12384 [16:00:56<10:14:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 61%|██████ | 7547/12384 [16:00:56<10:13:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 61%|██████ | 7547/12384 [16:01:04<10:13:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 61%|██████ | 7548/12384 [16:01:04<10:13:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 61%|██████ | 7548/12384 [16:01:11<10:13:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 61%|██████ | 7549/12384 [16:01:11<10:13:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 61%|██████ | 7549/12384 [16:01:19<10:13:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 61%|██████ | 7550/12384 [16:01:19<10:13:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 61%|██████ | 7550/12384 [16:01:27<10:13:14, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.01s]
Epoch 0: 61%|██████ | 7551/12384 [16:01:27<10:15:10, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=5.01s]
Epoch 0: 61%|██████ | 7551/12384 [16:01:34<10:15:10, 7.64s/it, loss=0.0001, acc=0.9992, iter_time=10.34s]
Epoch 0: 61%|██████ | 7552/12384 [16:01:34<10:15:34, 7.64s/it, loss=0.0001, acc=0.9992, iter_time=10.34s]
Epoch 0: 61%|██████ | 7552/12384 [16:01:42<10:15:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.00s]
Epoch 0: 61%|██████ | 7553/12384 [16:01:42<10:24:20, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=5.00s]
Epoch 0: 61%|██████ | 7553/12384 [16:01:50<10:24:20, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 0: 61%|██████ | 7554/12384 [16:01:50<10:20:39, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 0: 61%|██████ | 7554/12384 [16:01:58<10:20:39, 7.71s/it, loss=0.0003, acc=1.0000, iter_time=4.48s]
Epoch 0: 61%|██████ | 7555/12384 [16:01:58<10:17:41, 7.67s/it, loss=0.0003, acc=1.0000, iter_time=4.48s]
Epoch 0: 61%|██████ | 7555/12384 [16:02:05<10:17:41, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.72s]
Epoch 0: 61%|██████ | 7556/12384 [16:02:05<10:15:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.72s]
Epoch 0: 61%|██████ | 7556/12384 [16:02:13<10:15:30, 7.65s/it, loss=0.0006, acc=0.9985, iter_time=4.24s]
Epoch 0: 61%|██████ | 7557/12384 [16:02:13<10:15:16, 7.65s/it, loss=0.0006, acc=0.9985, iter_time=4.24s]
Epoch 0: 61%|██████ | 7557/12384 [16:02:20<10:15:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.90s]
Epoch 0: 61%|██████ | 7558/12384 [16:02:20<10:14:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.90s]
Epoch 0: 61%|██████ | 7558/12384 [16:02:28<10:14:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 61%|██████ | 7559/12384 [16:02:28<10:14:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 61%|██████ | 7559/12384 [16:02:36<10:14:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 0: 61%|██████ | 7560/12384 [16:02:36<10:12:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 0: 61%|██████ | 7560/12384 [16:02:43<10:12:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.55s]
Epoch 0: 61%|██████ | 7561/12384 [16:02:43<10:12:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.55s]
Epoch 0: 61%|██████ | 7561/12384 [16:02:51<10:12:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.26s]
Epoch 0: 61%|██████ | 7562/12384 [16:02:51<10:12:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.26s]
Epoch 0: 61%|██████ | 7562/12384 [16:02:58<10:12:05, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=9.08s]
Epoch 0: 61%|██████ | 7563/12384 [16:02:58<10:11:39, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=9.08s]
Epoch 0: 61%|██████ | 7563/12384 [16:03:06<10:11:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 0: 61%|██████ | 7564/12384 [16:03:06<10:11:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 0: 61%|██████ | 7564/12384 [16:03:14<10:11:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 0: 61%|██████ | 7565/12384 [16:03:14<10:10:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 0: 61%|██████ | 7565/12384 [16:03:21<10:10:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 0: 61%|██████ | 7566/12384 [16:03:21<10:11:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 0: 61%|██████ | 7566/12384 [16:03:29<10:11:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.80s]
Epoch 0: 61%|██████ | 7567/12384 [16:03:29<10:11:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.80s]
Epoch 0: 61%|██████ | 7567/12384 [16:03:37<10:11:19, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.96s]
Epoch 0: 61%|██████ | 7568/12384 [16:03:37<10:10:57, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.96s]
Epoch 0: 61%|██████ | 7568/12384 [16:03:44<10:10:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 61%|██████ | 7569/12384 [16:03:44<10:10:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 61%|██████ | 7569/12384 [16:03:52<10:10:41, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=7.63s]
Epoch 0: 61%|██████ | 7570/12384 [16:03:52<10:10:18, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=7.63s]
Epoch 0: 61%|██████ | 7570/12384 [16:03:59<10:10:18, 7.61s/it, loss=0.0011, acc=0.9978, iter_time=6.67s]
Epoch 0: 61%|██████ | 7571/12384 [16:03:59<10:10:45, 7.61s/it, loss=0.0011, acc=0.9978, iter_time=6.67s]
Epoch 0: 61%|██████ | 7571/12384 [16:04:07<10:10:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 0: 61%|██████ | 7572/12384 [16:04:07<10:10:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 0: 61%|██████ | 7572/12384 [16:04:15<10:10:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 0: 61%|██████ | 7573/12384 [16:04:15<10:10:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 0: 61%|██████ | 7573/12384 [16:04:22<10:10:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 0: 61%|██████ | 7574/12384 [16:04:22<10:09:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 0: 61%|██████ | 7574/12384 [16:04:30<10:09:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.01s]
Epoch 0: 61%|██████ | 7575/12384 [16:04:30<10:10:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.01s]
Epoch 0: 61%|██████ | 7575/12384 [16:04:37<10:10:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.08s]
Epoch 0: 61%|██████ | 7576/12384 [16:04:37<10:09:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.08s]
Epoch 0: 61%|██████ | 7576/12384 [16:04:45<10:09:46, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.26s]
Epoch 0: 61%|██████ | 7577/12384 [16:04:45<10:10:52, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.26s]
Epoch 0: 61%|██████ | 7577/12384 [16:04:52<10:10:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 0: 61%|██████ | 7578/12384 [16:04:52<10:02:18, 7.52s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 0: 61%|██████ | 7578/12384 [16:05:00<10:02:18, 7.52s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 0: 61%|██████ | 7579/12384 [16:05:00<10:11:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 0: 61%|██████ | 7579/12384 [16:05:08<10:11:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 0: 61%|██████ | 7580/12384 [16:05:08<10:10:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 0: 61%|██████ | 7580/12384 [16:05:16<10:10:31, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=7.59s]
Epoch 0: 61%|██████ | 7581/12384 [16:05:16<10:12:46, 7.65s/it, loss=0.0001, acc=0.9998, iter_time=7.59s]
Epoch 0: 61%|██████ | 7581/12384 [16:05:23<10:12:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 0: 61%|██████ | 7582/12384 [16:05:23<10:11:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 0: 61%|██████ | 7582/12384 [16:05:31<10:11:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 0: 61%|██████ | 7583/12384 [16:05:31<10:11:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 0: 61%|██████ | 7583/12384 [16:05:38<10:11:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 61%|██████ | 7584/12384 [16:05:38<10:10:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 61%|██████ | 7584/12384 [16:05:46<10:10:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 61%|██████ | 7585/12384 [16:05:46<10:10:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 61%|██████ | 7585/12384 [16:05:54<10:10:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.31s]
Epoch 0: 61%|██████▏ | 7586/12384 [16:05:54<10:09:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.31s]
Epoch 0: 61%|██████▏ | 7586/12384 [16:06:02<10:09:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.18s]
Epoch 0: 61%|██████▏ | 7587/12384 [16:06:02<10:15:25, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=11.18s]
Epoch 0: 61%|██████▏ | 7587/12384 [16:06:09<10:15:25, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 61%|██████▏ | 7588/12384 [16:06:09<10:12:52, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 61%|██████▏ | 7588/12384 [16:06:17<10:12:52, 7.67s/it, loss=0.0003, acc=0.9985, iter_time=5.29s]
Epoch 0: 61%|██████▏ | 7589/12384 [16:06:17<10:11:37, 7.65s/it, loss=0.0003, acc=0.9985, iter_time=5.29s]
Epoch 0: 61%|██████▏ | 7589/12384 [16:06:24<10:11:37, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.96s]
Epoch 0: 61%|██████▏ | 7590/12384 [16:06:24<10:10:41, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.96s]
Epoch 0: 61%|██████▏ | 7590/12384 [16:06:32<10:10:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.59s]
Epoch 0: 61%|██████▏ | 7591/12384 [16:06:32<10:10:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.59s]
Epoch 0: 61%|██████▏ | 7591/12384 [16:06:40<10:10:19, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.57s]
Epoch 0: 61%|██████▏ | 7592/12384 [16:06:40<10:09:01, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.57s]
Epoch 0: 61%|██████▏ | 7592/12384 [16:06:47<10:09:01, 7.63s/it, loss=0.0000, acc=0.9999, iter_time=7.66s]
Epoch 0: 61%|██████▏ | 7593/12384 [16:06:47<10:08:15, 7.62s/it, loss=0.0000, acc=0.9999, iter_time=7.66s]
Epoch 0: 61%|██████▏ | 7593/12384 [16:06:55<10:08:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 0: 61%|██████▏ | 7594/12384 [16:06:55<10:09:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 0: 61%|██████▏ | 7594/12384 [16:07:02<10:09:42, 7.64s/it, loss=0.0006, acc=0.9988, iter_time=8.02s]
Epoch 0: 61%|██████▏ | 7595/12384 [16:07:02<10:09:16, 7.63s/it, loss=0.0006, acc=0.9988, iter_time=8.02s]
Epoch 0: 61%|██████▏ | 7595/12384 [16:07:10<10:09:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 0: 61%|██████▏ | 7596/12384 [16:07:10<10:08:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 0: 61%|██████▏ | 7596/12384 [16:07:18<10:08:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 0: 61%|██████▏ | 7597/12384 [16:07:18<10:08:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 0: 61%|██████▏ | 7597/12384 [16:07:25<10:08:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 61%|██████▏ | 7598/12384 [16:07:25<10:07:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 61%|██████▏ | 7598/12384 [16:07:33<10:07:46, 7.62s/it, loss=0.0007, acc=0.9972, iter_time=7.61s]
Epoch 0: 61%|██████▏ | 7599/12384 [16:07:33<10:07:41, 7.62s/it, loss=0.0007, acc=0.9972, iter_time=7.61s]
Epoch 0: 61%|██████▏ | 7599/12384 [16:07:41<10:07:41, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=8.03s]
Epoch 0: 61%|██████▏ | 7600/12384 [16:07:41<10:07:38, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=8.03s]
Epoch 0: 61%|██████▏ | 7600/12384 [16:07:48<10:07:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 61%|██████▏ | 7601/12384 [16:07:48<10:09:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 61%|██████▏ | 7601/12384 [16:07:56<10:09:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 61%|██████▏ | 7602/12384 [16:07:56<10:10:38, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 61%|██████▏ | 7602/12384 [16:08:04<10:10:38, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.76s]
Epoch 0: 61%|██████▏ | 7603/12384 [16:08:04<10:10:59, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.76s]
Epoch 0: 61%|██████▏ | 7603/12384 [16:08:11<10:10:59, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 0: 61%|██████▏ | 7604/12384 [16:08:11<10:12:37, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 0: 61%|██████▏ | 7604/12384 [16:08:19<10:12:37, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 61%|██████▏ | 7605/12384 [16:08:19<10:18:00, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 61%|██████▏ | 7605/12384 [16:08:27<10:18:00, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 61%|██████▏ | 7606/12384 [16:08:27<10:16:40, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 61%|██████▏ | 7606/12384 [16:08:35<10:16:40, 7.74s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 61%|██████▏ | 7607/12384 [16:08:35<10:13:38, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 61%|██████▏ | 7607/12384 [16:08:42<10:13:38, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 61%|██████▏ | 7608/12384 [16:08:42<10:11:32, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 61%|██████▏ | 7608/12384 [16:08:50<10:11:32, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.46s]
Epoch 0: 61%|██████▏ | 7609/12384 [16:08:50<10:10:01, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.46s]
Epoch 0: 61%|██████▏ | 7609/12384 [16:08:58<10:10:01, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 0: 61%|██████▏ | 7610/12384 [16:08:58<10:10:21, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 0: 61%|██████▏ | 7610/12384 [16:09:05<10:10:21, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 0: 61%|██████▏ | 7611/12384 [16:09:05<10:08:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 0: 61%|██████▏ | 7611/12384 [16:09:13<10:08:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 61%|██████▏ | 7612/12384 [16:09:13<10:07:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 61%|██████▏ | 7612/12384 [16:09:21<10:07:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 61%|██████▏ | 7613/12384 [16:09:21<10:13:44, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 61%|██████▏ | 7613/12384 [16:09:28<10:13:44, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 61%|██████▏ | 7614/12384 [16:09:28<10:11:38, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 61%|██████▏ | 7614/12384 [16:09:36<10:11:38, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 61%|██████▏ | 7615/12384 [16:09:36<10:11:51, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 61%|██████▏ | 7615/12384 [16:09:44<10:11:51, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.58s]
Epoch 0: 61%|██████▏ | 7616/12384 [16:09:44<10:09:58, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.58s]
Epoch 0: 61%|██████▏ | 7616/12384 [16:09:51<10:09:58, 7.68s/it, loss=0.0003, acc=0.9988, iter_time=5.40s]
Epoch 0: 62%|██████▏ | 7617/12384 [16:09:51<10:09:18, 7.67s/it, loss=0.0003, acc=0.9988, iter_time=5.40s]
Epoch 0: 62%|██████▏ | 7617/12384 [16:09:59<10:09:18, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 0: 62%|██████▏ | 7618/12384 [16:09:59<10:08:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 0: 62%|██████▏ | 7618/12384 [16:10:07<10:08:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 0: 62%|██████▏ | 7619/12384 [16:10:07<10:07:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 0: 62%|██████▏ | 7619/12384 [16:10:14<10:07:22, 7.65s/it, loss=0.0003, acc=0.9980, iter_time=9.44s]
Epoch 0: 62%|██████▏ | 7620/12384 [16:10:14<10:06:47, 7.64s/it, loss=0.0003, acc=0.9980, iter_time=9.44s]
Epoch 0: 62%|██████▏ | 7620/12384 [16:10:22<10:06:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 0: 62%|██████▏ | 7621/12384 [16:10:22<10:06:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 0: 62%|██████▏ | 7621/12384 [16:10:29<10:06:26, 7.64s/it, loss=0.0003, acc=0.9989, iter_time=9.91s]
Epoch 0: 62%|██████▏ | 7622/12384 [16:10:29<10:04:59, 7.62s/it, loss=0.0003, acc=0.9989, iter_time=9.91s]
Epoch 0: 62%|██████▏ | 7622/12384 [16:10:37<10:04:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 62%|██████▏ | 7623/12384 [16:10:37<10:05:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 62%|██████▏ | 7623/12384 [16:10:45<10:05:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 62%|██████▏ | 7624/12384 [16:10:45<10:04:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 62%|██████▏ | 7624/12384 [16:10:52<10:04:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 62%|██████▏ | 7625/12384 [16:10:52<10:04:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 62%|██████▏ | 7625/12384 [16:11:00<10:04:36, 7.62s/it, loss=0.0004, acc=0.9986, iter_time=6.71s]
Epoch 0: 62%|██████▏ | 7626/12384 [16:11:00<10:04:20, 7.62s/it, loss=0.0004, acc=0.9986, iter_time=6.71s]
Epoch 0: 62%|██████▏ | 7626/12384 [16:11:08<10:04:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 0: 62%|██████▏ | 7627/12384 [16:11:08<10:03:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 0: 62%|██████▏ | 7627/12384 [16:11:15<10:03:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 62%|██████▏ | 7628/12384 [16:11:15<10:03:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 62%|██████▏ | 7628/12384 [16:11:23<10:03:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.56s]
Epoch 0: 62%|██████▏ | 7629/12384 [16:11:23<10:02:34, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.56s]
Epoch 0: 62%|██████▏ | 7629/12384 [16:11:30<10:02:34, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 0: 62%|██████▏ | 7630/12384 [16:11:30<10:02:29, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 0: 62%|██████▏ | 7630/12384 [16:11:38<10:02:29, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.89s]
Epoch 0: 62%|██████▏ | 7631/12384 [16:11:38<10:03:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.89s]
Epoch 0: 62%|██████▏ | 7631/12384 [16:11:46<10:03:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.39s]
Epoch 0: 62%|██████▏ | 7632/12384 [16:11:46<10:09:31, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=11.39s]
Epoch 0: 62%|██████▏ | 7632/12384 [16:11:53<10:09:31, 7.70s/it, loss=0.0002, acc=1.0000, iter_time=7.65s]
Epoch 0: 62%|██████▏ | 7633/12384 [16:11:53<10:07:15, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=7.65s]
Epoch 0: 62%|██████▏ | 7633/12384 [16:12:01<10:07:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 0: 62%|██████▏ | 7634/12384 [16:12:01<10:05:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 0: 62%|██████▏ | 7634/12384 [16:12:09<10:05:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.34s]
Epoch 0: 62%|██████▏ | 7635/12384 [16:12:09<10:04:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.34s]
Epoch 0: 62%|██████▏ | 7635/12384 [16:12:16<10:04:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.39s]
Epoch 0: 62%|██████▏ | 7636/12384 [16:12:16<10:04:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.39s]
Epoch 0: 62%|██████▏ | 7636/12384 [16:12:24<10:04:14, 7.64s/it, loss=0.0010, acc=0.9983, iter_time=7.63s]
Epoch 0: 62%|██████▏ | 7637/12384 [16:12:24<10:03:09, 7.62s/it, loss=0.0010, acc=0.9983, iter_time=7.63s]
Epoch 0: 62%|██████▏ | 7637/12384 [16:12:31<10:03:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 62%|██████▏ | 7638/12384 [16:12:31<10:02:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 62%|██████▏ | 7638/12384 [16:12:39<10:02:29, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.67s]
Epoch 0: 62%|██████▏ | 7639/12384 [16:12:39<10:02:30, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.67s]
Epoch 0: 62%|██████▏ | 7639/12384 [16:12:47<10:02:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 0: 62%|██████▏ | 7640/12384 [16:12:47<10:02:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 0: 62%|██████▏ | 7640/12384 [16:12:54<10:02:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 62%|██████▏ | 7641/12384 [16:12:54<10:01:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 62%|██████▏ | 7641/12384 [16:13:02<10:01:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 62%|██████▏ | 7642/12384 [16:13:02<10:01:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 62%|██████▏ | 7642/12384 [16:13:10<10:01:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 0: 62%|██████▏ | 7643/12384 [16:13:10<10:00:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 0: 62%|██████▏ | 7643/12384 [16:13:17<10:00:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.52s]
Epoch 0: 62%|██████▏ | 7644/12384 [16:13:17<10:01:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.52s]
Epoch 0: 62%|██████▏ | 7644/12384 [16:13:25<10:01:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 0: 62%|██████▏ | 7645/12384 [16:13:25<10:01:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 0: 62%|██████▏ | 7645/12384 [16:13:32<10:01:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.25s]
Epoch 0: 62%|██████▏ | 7646/12384 [16:13:32<10:01:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.25s]
Epoch 0: 62%|██████▏ | 7646/12384 [16:13:40<10:01:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.43s]
Epoch 0: 62%|██████▏ | 7647/12384 [16:13:40<10:00:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.43s]
Epoch 0: 62%|██████▏ | 7647/12384 [16:13:48<10:00:58, 7.61s/it, loss=0.0008, acc=0.9967, iter_time=8.00s]
Epoch 0: 62%|██████▏ | 7648/12384 [16:13:48<10:02:46, 7.64s/it, loss=0.0008, acc=0.9967, iter_time=8.00s]
Epoch 0: 62%|██████▏ | 7648/12384 [16:13:55<10:02:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.50s]
Epoch 0: 62%|██████▏ | 7649/12384 [16:13:55<10:03:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.50s]
Epoch 0: 62%|██████▏ | 7649/12384 [16:14:03<10:03:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 0: 62%|██████▏ | 7650/12384 [16:14:03<10:02:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 0: 62%|██████▏ | 7650/12384 [16:14:11<10:02:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.86s]
Epoch 0: 62%|██████▏ | 7651/12384 [16:14:11<10:02:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.86s]
Epoch 0: 62%|██████▏ | 7651/12384 [16:14:18<10:02:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.99s]
Epoch 0: 62%|██████▏ | 7652/12384 [16:14:18<10:03:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.99s]
Epoch 0: 62%|██████▏ | 7652/12384 [16:14:26<10:03:00, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=5.08s]
Epoch 0: 62%|██████▏ | 7653/12384 [16:14:26<10:01:39, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=5.08s]
Epoch 0: 62%|██████▏ | 7653/12384 [16:14:33<10:01:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 0: 62%|██████▏ | 7654/12384 [16:14:33<10:00:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 0: 62%|██████▏ | 7654/12384 [16:14:41<10:00:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 0: 62%|██████▏ | 7655/12384 [16:14:41<10:00:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 0: 62%|██████▏ | 7655/12384 [16:14:49<10:00:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.68s]
Epoch 0: 62%|██████▏ | 7656/12384 [16:14:49<10:02:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.68s]
Epoch 0: 62%|██████▏ | 7656/12384 [16:14:56<10:02:39, 7.65s/it, loss=0.0003, acc=0.9984, iter_time=7.60s]
Epoch 0: 62%|██████▏ | 7657/12384 [16:14:56<10:01:41, 7.64s/it, loss=0.0003, acc=0.9984, iter_time=7.60s]
Epoch 0: 62%|██████▏ | 7657/12384 [16:15:04<10:01:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 62%|██████▏ | 7658/12384 [16:15:04<10:09:08, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 62%|██████▏ | 7658/12384 [16:15:12<10:09:08, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 62%|██████▏ | 7659/12384 [16:15:12<10:07:31, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 62%|██████▏ | 7659/12384 [16:15:20<10:07:31, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 62%|██████▏ | 7660/12384 [16:15:20<10:04:58, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 62%|██████▏ | 7660/12384 [16:15:27<10:04:58, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 62%|██████▏ | 7661/12384 [16:15:27<10:03:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 62%|██████▏ | 7661/12384 [16:15:35<10:03:16, 7.66s/it, loss=0.0001, acc=0.9997, iter_time=6.98s]
Epoch 0: 62%|██████▏ | 7662/12384 [16:15:35<10:01:17, 7.64s/it, loss=0.0001, acc=0.9997, iter_time=6.98s]
Epoch 0: 62%|██████▏ | 7662/12384 [16:15:42<10:01:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 0: 62%|██████▏ | 7663/12384 [16:15:42<10:00:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 0: 62%|██████▏ | 7663/12384 [16:15:50<10:00:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 62%|██████▏ | 7664/12384 [16:15:50<10:01:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 62%|██████▏ | 7664/12384 [16:15:58<10:01:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 0: 62%|██████▏ | 7665/12384 [16:15:58<10:00:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 0: 62%|██████▏ | 7665/12384 [16:16:05<10:00:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 0: 62%|██████▏ | 7666/12384 [16:16:05<10:00:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 0: 62%|██████▏ | 7666/12384 [16:16:13<10:00:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 0: 62%|██████▏ | 7667/12384 [16:16:13<9:59:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 0: 62%|██████▏ | 7667/12384 [16:16:21<9:59:22, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 62%|██████▏ | 7668/12384 [16:16:21<9:59:00, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 62%|██████▏ | 7668/12384 [16:16:28<9:59:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 62%|██████▏ | 7669/12384 [16:16:28<9:58:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 62%|██████▏ | 7669/12384 [16:16:36<9:58:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 0: 62%|██████▏ | 7670/12384 [16:16:36<9:58:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 0: 62%|██████▏ | 7670/12384 [16:16:43<9:58:55, 7.62s/it, loss=0.0009, acc=0.9968, iter_time=5.61s]
Epoch 0: 62%|██████▏ | 7671/12384 [16:16:43<9:59:28, 7.63s/it, loss=0.0009, acc=0.9968, iter_time=5.61s]
Epoch 0: 62%|██████▏ | 7671/12384 [16:16:51<9:59:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 0: 62%|██████▏ | 7672/12384 [16:16:51<9:59:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 0: 62%|██████▏ | 7672/12384 [16:16:59<9:59:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 62%|██████▏ | 7673/12384 [16:16:59<9:58:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 62%|██████▏ | 7673/12384 [16:17:06<9:58:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.04s]
Epoch 0: 62%|██████▏ | 7674/12384 [16:17:06<9:58:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.04s]
Epoch 0: 62%|██████▏ | 7674/12384 [16:17:14<9:58:20, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=10.64s]
Epoch 0: 62%|██████▏ | 7675/12384 [16:17:14<9:57:40, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=10.64s]
Epoch 0: 62%|██████▏ | 7675/12384 [16:17:22<9:57:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 0: 62%|██████▏ | 7676/12384 [16:17:22<9:57:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 0: 62%|██████▏ | 7676/12384 [16:17:29<9:57:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 62%|██████▏ | 7677/12384 [16:17:29<9:57:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 62%|██████▏ | 7677/12384 [16:17:37<9:57:29, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 62%|██████▏ | 7678/12384 [16:17:37<9:57:17, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 62%|██████▏ | 7678/12384 [16:17:44<9:57:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 62%|██████▏ | 7679/12384 [16:17:44<9:56:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 62%|██████▏ | 7679/12384 [16:17:52<9:56:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 62%|██████▏ | 7680/12384 [16:17:52<9:56:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 62%|██████▏ | 7680/12384 [16:18:00<9:56:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 62%|██████▏ | 7681/12384 [16:18:00<9:56:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 62%|██████▏ | 7681/12384 [16:18:07<9:56:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 62%|██████▏ | 7682/12384 [16:18:07<9:57:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 62%|██████▏ | 7682/12384 [16:18:15<9:57:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 62%|██████▏ | 7683/12384 [16:18:15<9:57:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 62%|██████▏ | 7683/12384 [16:18:23<9:57:14, 7.62s/it, loss=0.0003, acc=0.9986, iter_time=6.98s]
Epoch 0: 62%|██████▏ | 7684/12384 [16:18:23<9:57:55, 7.63s/it, loss=0.0003, acc=0.9986, iter_time=6.98s]
Epoch 0: 62%|██████▏ | 7684/12384 [16:18:31<9:57:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.33s]
Epoch 0: 62%|██████▏ | 7685/12384 [16:18:31<10:06:32, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.33s]
Epoch 0: 62%|██████▏ | 7685/12384 [16:18:38<10:06:32, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 0: 62%|██████▏ | 7686/12384 [16:18:38<10:03:17, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 0: 62%|██████▏ | 7686/12384 [16:18:46<10:03:17, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 62%|██████▏ | 7687/12384 [16:18:46<10:00:54, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 62%|██████▏ | 7687/12384 [16:18:53<10:00:54, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 62%|██████▏ | 7688/12384 [16:18:53<9:59:56, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 62%|██████▏ | 7688/12384 [16:19:01<9:59:56, 7.67s/it, loss=0.0006, acc=0.9988, iter_time=7.23s]
Epoch 0: 62%|██████▏ | 7689/12384 [16:19:01<9:58:44, 7.65s/it, loss=0.0006, acc=0.9988, iter_time=7.23s]
Epoch 0: 62%|██████▏ | 7689/12384 [16:19:09<9:58:44, 7.65s/it, loss=0.0007, acc=0.9961, iter_time=7.67s]
Epoch 0: 62%|██████▏ | 7690/12384 [16:19:09<9:58:41, 7.65s/it, loss=0.0007, acc=0.9961, iter_time=7.67s]
Epoch 0: 62%|██████▏ | 7690/12384 [16:19:16<9:58:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 62%|██████▏ | 7691/12384 [16:19:16<9:57:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 62%|██████▏ | 7691/12384 [16:19:24<9:57:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 0: 62%|██████▏ | 7692/12384 [16:19:24<9:56:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 0: 62%|██████▏ | 7692/12384 [16:19:32<9:56:21, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=8.47s]
Epoch 0: 62%|██████▏ | 7693/12384 [16:19:32<10:03:07, 7.71s/it, loss=0.0002, acc=1.0000, iter_time=8.47s]
Epoch 0: 62%|██████▏ | 7693/12384 [16:19:39<10:03:07, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 0: 62%|██████▏ | 7694/12384 [16:19:39<10:00:42, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 0: 62%|██████▏ | 7694/12384 [16:19:47<10:00:42, 7.69s/it, loss=0.0001, acc=0.9989, iter_time=6.02s]
Epoch 0: 62%|██████▏ | 7695/12384 [16:19:47<9:58:00, 7.65s/it, loss=0.0001, acc=0.9989, iter_time=6.02s]
Epoch 0: 62%|██████▏ | 7695/12384 [16:19:55<9:58:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 0: 62%|██████▏ | 7696/12384 [16:19:55<9:56:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 0: 62%|██████▏ | 7696/12384 [16:20:02<9:56:35, 7.64s/it, loss=0.0003, acc=0.9990, iter_time=6.65s]
Epoch 0: 62%|██████▏ | 7697/12384 [16:20:02<9:56:29, 7.64s/it, loss=0.0003, acc=0.9990, iter_time=6.65s]
Epoch 0: 62%|██████▏ | 7697/12384 [16:20:10<9:56:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 0: 62%|██████▏ | 7698/12384 [16:20:10<9:57:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 0: 62%|██████▏ | 7698/12384 [16:20:18<9:57:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 0: 62%|██████▏ | 7699/12384 [16:20:18<9:57:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 0: 62%|██████▏ | 7699/12384 [16:20:25<9:57:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.65s]
Epoch 0: 62%|██████▏ | 7700/12384 [16:20:25<9:56:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.65s]
Epoch 0: 62%|██████▏ | 7700/12384 [16:20:33<9:56:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 62%|██████▏ | 7701/12384 [16:20:33<9:55:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 62%|██████▏ | 7701/12384 [16:20:40<9:55:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 62%|██████▏ | 7702/12384 [16:20:40<9:54:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 62%|██████▏ | 7702/12384 [16:20:48<9:54:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 0: 62%|██████▏ | 7703/12384 [16:20:48<9:54:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 0: 62%|██████▏ | 7703/12384 [16:20:56<9:54:29, 7.62s/it, loss=0.0001, acc=0.9988, iter_time=9.49s]
Epoch 0: 62%|██████▏ | 7704/12384 [16:20:56<9:54:13, 7.62s/it, loss=0.0001, acc=0.9988, iter_time=9.49s]
Epoch 0: 62%|██████▏ | 7704/12384 [16:21:03<9:54:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.62s]
Epoch 0: 62%|██████▏ | 7705/12384 [16:21:03<9:54:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.62s]
Epoch 0: 62%|██████▏ | 7705/12384 [16:21:11<9:54:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.24s]
Epoch 0: 62%|██████▏ | 7706/12384 [16:21:11<9:53:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.24s]
Epoch 0: 62%|██████▏ | 7706/12384 [16:21:18<9:53:33, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.52s]
Epoch 0: 62%|██████▏ | 7707/12384 [16:21:18<9:53:26, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.52s]
Epoch 0: 62%|██████▏ | 7707/12384 [16:21:26<9:53:26, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=9.74s]
Epoch 0: 62%|██████▏ | 7708/12384 [16:21:26<9:54:11, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=9.74s]
Epoch 0: 62%|██████▏ | 7708/12384 [16:21:34<9:54:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 62%|██████▏ | 7709/12384 [16:21:34<9:55:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 62%|██████▏ | 7709/12384 [16:21:41<9:55:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 62%|██████▏ | 7710/12384 [16:21:41<9:54:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 62%|██████▏ | 7710/12384 [16:21:49<9:54:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 0: 62%|██████▏ | 7711/12384 [16:21:49<10:02:00, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 0: 62%|██████▏ | 7711/12384 [16:21:57<10:02:00, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 0: 62%|██████▏ | 7712/12384 [16:21:57<9:58:54, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 0: 62%|██████▏ | 7712/12384 [16:22:05<9:58:54, 7.69s/it, loss=0.0002, acc=0.9998, iter_time=7.34s]
Epoch 0: 62%|██████▏ | 7713/12384 [16:22:05<9:56:33, 7.66s/it, loss=0.0002, acc=0.9998, iter_time=7.34s]
Epoch 0: 62%|██████▏ | 7713/12384 [16:22:12<9:56:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 62%|██████▏ | 7714/12384 [16:22:12<9:55:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 62%|██████▏ | 7714/12384 [16:22:20<9:55:34, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 62%|██████▏ | 7715/12384 [16:22:20<9:54:35, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 62%|██████▏ | 7715/12384 [16:22:27<9:54:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 62%|██████▏ | 7716/12384 [16:22:27<9:53:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 62%|██████▏ | 7716/12384 [16:22:35<9:53:21, 7.63s/it, loss=0.0009, acc=1.0000, iter_time=6.95s]
Epoch 0: 62%|██████▏ | 7717/12384 [16:22:35<9:52:32, 7.62s/it, loss=0.0009, acc=1.0000, iter_time=6.95s]
Epoch 0: 62%|██████▏ | 7717/12384 [16:22:43<9:52:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 0: 62%|██████▏ | 7718/12384 [16:22:43<9:52:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 0: 62%|██████▏ | 7718/12384 [16:22:50<9:52:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 62%|██████▏ | 7719/12384 [16:22:50<9:58:54, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 62%|██████▏ | 7719/12384 [16:22:58<9:58:54, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 62%|██████▏ | 7720/12384 [16:22:58<9:56:31, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 62%|██████▏ | 7720/12384 [16:23:06<9:56:31, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.13s]
Epoch 0: 62%|██████▏ | 7721/12384 [16:23:06<9:54:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.13s]
Epoch 0: 62%|██████▏ | 7721/12384 [16:23:13<9:54:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 0: 62%|██████▏ | 7722/12384 [16:23:13<9:53:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 0: 62%|██████▏ | 7722/12384 [16:23:21<9:53:29, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 62%|██████▏ | 7723/12384 [16:23:21<9:52:48, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 62%|██████▏ | 7723/12384 [16:23:29<9:52:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 62%|██████▏ | 7724/12384 [16:23:29<9:52:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 62%|██████▏ | 7724/12384 [16:23:36<9:52:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 62%|██████▏ | 7725/12384 [16:23:36<9:51:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 62%|██████▏ | 7725/12384 [16:23:44<9:51:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 0: 62%|██████▏ | 7726/12384 [16:23:44<9:51:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 0: 62%|██████▏ | 7726/12384 [16:23:51<9:51:07, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=8.73s]
Epoch 0: 62%|██████▏ | 7727/12384 [16:23:51<9:51:14, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=8.73s]
Epoch 0: 62%|██████▏ | 7727/12384 [16:23:59<9:51:14, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.57s]
Epoch 0: 62%|██████▏ | 7728/12384 [16:23:59<9:51:03, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.57s]
Epoch 0: 62%|██████▏ | 7728/12384 [16:24:07<9:51:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 62%|██████▏ | 7729/12384 [16:24:07<9:50:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 62%|██████▏ | 7729/12384 [16:24:14<9:50:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 62%|██████▏ | 7730/12384 [16:24:14<9:50:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 62%|██████▏ | 7730/12384 [16:24:22<9:50:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 0: 62%|██████▏ | 7731/12384 [16:24:22<9:50:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 0: 62%|██████▏ | 7731/12384 [16:24:29<9:50:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 0: 62%|██████▏ | 7732/12384 [16:24:29<9:51:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 0: 62%|██████▏ | 7732/12384 [16:24:37<9:51:22, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=6.17s]
Epoch 0: 62%|██████▏ | 7733/12384 [16:24:37<9:50:50, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=6.17s]
Epoch 0: 62%|██████▏ | 7733/12384 [16:24:45<9:50:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 0: 62%|██████▏ | 7734/12384 [16:24:45<9:52:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 0: 62%|██████▏ | 7734/12384 [16:24:52<9:52:54, 7.65s/it, loss=0.0006, acc=0.9981, iter_time=10.05s]
Epoch 0: 62%|██████▏ | 7735/12384 [16:24:52<9:51:54, 7.64s/it, loss=0.0006, acc=0.9981, iter_time=10.05s]
Epoch 0: 62%|██████▏ | 7735/12384 [16:25:00<9:51:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 62%|██████▏ | 7736/12384 [16:25:00<9:52:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 62%|██████▏ | 7736/12384 [16:25:08<9:52:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 0: 62%|██████▏ | 7737/12384 [16:25:08<9:59:12, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 0: 62%|██████▏ | 7737/12384 [16:25:16<9:59:12, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 0: 62%|██████▏ | 7738/12384 [16:25:16<9:56:06, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 0: 62%|██████▏ | 7738/12384 [16:25:23<9:56:06, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 0: 62%|██████▏ | 7739/12384 [16:25:23<9:54:28, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 0: 62%|██████▏ | 7739/12384 [16:25:31<9:54:28, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 62%|██████▎ | 7740/12384 [16:25:31<9:53:07, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 62%|██████▎ | 7740/12384 [16:25:38<9:53:07, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=9.06s]
Epoch 0: 63%|██████▎ | 7741/12384 [16:25:38<9:51:01, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=9.06s]
Epoch 0: 63%|██████▎ | 7741/12384 [16:25:46<9:51:01, 7.64s/it, loss=0.0002, acc=0.9991, iter_time=7.28s]
Epoch 0: 63%|██████▎ | 7742/12384 [16:25:46<9:49:52, 7.62s/it, loss=0.0002, acc=0.9991, iter_time=7.28s]
Epoch 0: 63%|██████▎ | 7742/12384 [16:25:54<9:49:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 63%|██████▎ | 7743/12384 [16:25:54<9:49:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 63%|██████▎ | 7743/12384 [16:26:01<9:49:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 0: 63%|██████▎ | 7744/12384 [16:26:01<9:49:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 0: 63%|██████▎ | 7744/12384 [16:26:09<9:49:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 0: 63%|██████▎ | 7745/12384 [16:26:09<9:55:47, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 0: 63%|██████▎ | 7745/12384 [16:26:17<9:55:47, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 63%|██████▎ | 7746/12384 [16:26:17<9:53:41, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 63%|██████▎ | 7746/12384 [16:26:24<9:53:41, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 63%|██████▎ | 7747/12384 [16:26:24<9:52:07, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 63%|██████▎ | 7747/12384 [16:26:32<9:52:07, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 63%|██████▎ | 7748/12384 [16:26:32<9:50:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 63%|██████▎ | 7748/12384 [16:26:40<9:50:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 63%|██████▎ | 7749/12384 [16:26:40<9:49:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 63%|██████▎ | 7749/12384 [16:26:47<9:49:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 63%|██████▎ | 7750/12384 [16:26:47<9:48:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 63%|██████▎ | 7750/12384 [16:26:55<9:48:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 63%|██████▎ | 7751/12384 [16:26:55<9:48:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 63%|██████▎ | 7751/12384 [16:27:02<9:48:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 63%|██████▎ | 7752/12384 [16:27:02<9:48:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 63%|██████▎ | 7752/12384 [16:27:10<9:48:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 63%|██████▎ | 7753/12384 [16:27:10<9:48:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 63%|██████▎ | 7753/12384 [16:27:18<9:48:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 0: 63%|██████▎ | 7754/12384 [16:27:18<9:48:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 0: 63%|██████▎ | 7754/12384 [16:27:25<9:48:03, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.06s]
Epoch 0: 63%|██████▎ | 7755/12384 [16:27:25<9:48:01, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.06s]
Epoch 0: 63%|██████▎ | 7755/12384 [16:27:33<9:48:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 63%|██████▎ | 7756/12384 [16:27:33<9:47:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 63%|██████▎ | 7756/12384 [16:27:41<9:47:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 0: 63%|██████▎ | 7757/12384 [16:27:41<9:46:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 0: 63%|██████▎ | 7757/12384 [16:27:48<9:46:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 0: 63%|██████▎ | 7758/12384 [16:27:48<9:46:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 0: 63%|██████▎ | 7758/12384 [16:27:56<9:46:37, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 63%|██████▎ | 7759/12384 [16:27:56<9:46:24, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 63%|██████▎ | 7759/12384 [16:28:03<9:46:24, 7.61s/it, loss=0.0004, acc=0.9987, iter_time=8.00s]
Epoch 0: 63%|██████▎ | 7760/12384 [16:28:03<9:46:24, 7.61s/it, loss=0.0004, acc=0.9987, iter_time=8.00s]
Epoch 0: 63%|██████▎ | 7760/12384 [16:28:11<9:46:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 63%|██████▎ | 7761/12384 [16:28:11<9:46:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 63%|██████▎ | 7761/12384 [16:28:19<9:46:24, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 63%|██████▎ | 7762/12384 [16:28:19<9:46:13, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 63%|██████▎ | 7762/12384 [16:28:27<9:46:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 63%|██████▎ | 7763/12384 [16:28:27<9:53:36, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 63%|██████▎ | 7763/12384 [16:28:34<9:53:36, 7.71s/it, loss=0.0008, acc=0.9980, iter_time=7.89s]
Epoch 0: 63%|██████▎ | 7764/12384 [16:28:34<9:51:05, 7.68s/it, loss=0.0008, acc=0.9980, iter_time=7.89s]
Epoch 0: 63%|██████▎ | 7764/12384 [16:28:42<9:51:05, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 63%|██████▎ | 7765/12384 [16:28:42<9:49:44, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 63%|██████▎ | 7765/12384 [16:28:49<9:49:44, 7.66s/it, loss=0.0002, acc=0.9982, iter_time=7.62s]
Epoch 0: 63%|██████▎ | 7766/12384 [16:28:49<9:48:35, 7.65s/it, loss=0.0002, acc=0.9982, iter_time=7.62s]
Epoch 0: 63%|██████▎ | 7766/12384 [16:28:57<9:48:35, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 63%|██████▎ | 7767/12384 [16:28:57<9:47:55, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 63%|██████▎ | 7767/12384 [16:29:05<9:47:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 63%|██████▎ | 7768/12384 [16:29:05<9:47:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 63%|██████▎ | 7768/12384 [16:29:12<9:47:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 63%|██████▎ | 7769/12384 [16:29:12<9:46:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 63%|██████▎ | 7769/12384 [16:29:20<9:46:19, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 63%|██████▎ | 7770/12384 [16:29:20<9:45:32, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 63%|██████▎ | 7770/12384 [16:29:28<9:45:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 63%|██████▎ | 7771/12384 [16:29:28<9:52:17, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 63%|██████▎ | 7771/12384 [16:29:35<9:52:17, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=6.48s]
Epoch 0: 63%|██████▎ | 7772/12384 [16:29:35<9:49:47, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=6.48s]
Epoch 0: 63%|██████▎ | 7772/12384 [16:29:43<9:49:47, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 0: 63%|██████▎ | 7773/12384 [16:29:43<9:48:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 0: 63%|██████▎ | 7773/12384 [16:29:51<9:48:26, 7.66s/it, loss=0.0004, acc=1.0000, iter_time=6.17s]
Epoch 0: 63%|██████▎ | 7774/12384 [16:29:51<9:47:27, 7.65s/it, loss=0.0004, acc=1.0000, iter_time=6.17s]
Epoch 0: 63%|██████▎ | 7774/12384 [16:29:58<9:47:27, 7.65s/it, loss=0.0036, acc=0.9944, iter_time=5.93s]
Epoch 0: 63%|██████▎ | 7775/12384 [16:29:58<9:46:14, 7.63s/it, loss=0.0036, acc=0.9944, iter_time=5.93s]
Epoch 0: 63%|██████▎ | 7775/12384 [16:30:06<9:46:14, 7.63s/it, loss=0.0004, acc=0.9984, iter_time=11.11s]
Epoch 0: 63%|██████▎ | 7776/12384 [16:30:06<9:45:56, 7.63s/it, loss=0.0004, acc=0.9984, iter_time=11.11s]
Epoch 0: 63%|██████▎ | 7776/12384 [16:30:13<9:45:56, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.25s]
Epoch 0: 63%|██████▎ | 7777/12384 [16:30:13<9:45:28, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.25s]
Epoch 0: 63%|██████▎ | 7777/12384 [16:30:21<9:45:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 63%|██████▎ | 7778/12384 [16:30:21<9:45:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 63%|██████▎ | 7778/12384 [16:30:29<9:45:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 63%|██████▎ | 7779/12384 [16:30:29<9:45:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 63%|██████▎ | 7779/12384 [16:30:36<9:45:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 63%|██████▎ | 7780/12384 [16:30:36<9:45:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 63%|██████▎ | 7780/12384 [16:30:44<9:45:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 63%|██████▎ | 7781/12384 [16:30:44<9:45:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 63%|██████▎ | 7781/12384 [16:30:52<9:45:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 63%|██████▎ | 7782/12384 [16:30:52<9:45:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 63%|██████▎ | 7782/12384 [16:30:59<9:45:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 63%|██████▎ | 7783/12384 [16:30:59<9:45:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 63%|██████▎ | 7783/12384 [16:31:07<9:45:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 63%|██████▎ | 7784/12384 [16:31:07<9:44:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 63%|██████▎ | 7784/12384 [16:31:14<9:44:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.71s]
Epoch 0: 63%|██████▎ | 7785/12384 [16:31:14<9:43:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.71s]
Epoch 0: 63%|██████▎ | 7785/12384 [16:31:22<9:43:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 0: 63%|██████▎ | 7786/12384 [16:31:22<9:43:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 0: 63%|██████▎ | 7786/12384 [16:31:30<9:43:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 0: 63%|██████▎ | 7787/12384 [16:31:30<9:42:29, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 0: 63%|██████▎ | 7787/12384 [16:31:37<9:42:29, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=5.79s]
Epoch 0: 63%|██████▎ | 7788/12384 [16:31:37<9:42:26, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=5.79s]
Epoch 0: 63%|██████▎ | 7788/12384 [16:31:45<9:42:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.46s]
Epoch 0: 63%|██████▎ | 7789/12384 [16:31:45<9:50:03, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.46s]
Epoch 0: 63%|██████▎ | 7789/12384 [16:31:53<9:50:03, 7.70s/it, loss=0.0002, acc=0.9999, iter_time=7.89s]
Epoch 0: 63%|██████▎ | 7790/12384 [16:31:53<9:47:28, 7.67s/it, loss=0.0002, acc=0.9999, iter_time=7.89s]
Epoch 0: 63%|██████▎ | 7790/12384 [16:32:00<9:47:28, 7.67s/it, loss=0.0003, acc=1.0000, iter_time=4.22s]
Epoch 0: 63%|██████▎ | 7791/12384 [16:32:00<9:45:31, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=4.22s]
Epoch 0: 63%|██████▎ | 7791/12384 [16:32:08<9:45:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.35s]
Epoch 0: 63%|██████▎ | 7792/12384 [16:32:08<9:44:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.35s]
Epoch 0: 63%|██████▎ | 7792/12384 [16:32:15<9:44:18, 7.63s/it, loss=0.0006, acc=0.9979, iter_time=7.22s]
Epoch 0: 63%|██████▎ | 7793/12384 [16:32:15<9:43:20, 7.62s/it, loss=0.0006, acc=0.9979, iter_time=7.22s]
Epoch 0: 63%|██████▎ | 7793/12384 [16:32:23<9:43:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 0: 63%|██████▎ | 7794/12384 [16:32:23<9:43:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 0: 63%|██████▎ | 7794/12384 [16:32:31<9:43:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 0: 63%|██████▎ | 7795/12384 [16:32:31<9:42:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 0: 63%|██████▎ | 7795/12384 [16:32:38<9:42:19, 7.61s/it, loss=0.0012, acc=0.9970, iter_time=6.67s]
Epoch 0: 63%|██████▎ | 7796/12384 [16:32:38<9:42:03, 7.61s/it, loss=0.0012, acc=0.9970, iter_time=6.67s]
Epoch 0: 63%|██████▎ | 7796/12384 [16:32:46<9:42:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 0: 63%|██████▎ | 7797/12384 [16:32:46<9:48:34, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 0: 63%|██████▎ | 7797/12384 [16:32:54<9:48:34, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=5.28s]
Epoch 0: 63%|██████▎ | 7798/12384 [16:32:54<9:46:36, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=5.28s]
Epoch 0: 63%|██████▎ | 7798/12384 [16:33:01<9:46:36, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 0: 63%|██████▎ | 7799/12384 [16:33:01<9:44:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 0: 63%|██████▎ | 7799/12384 [16:33:09<9:44:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 63%|██████▎ | 7800/12384 [16:33:09<9:44:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 63%|██████▎ | 7800/12384 [16:33:17<9:44:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 63%|██████▎ | 7801/12384 [16:33:17<9:43:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 63%|██████▎ | 7801/12384 [16:33:24<9:43:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 0: 63%|██████▎ | 7802/12384 [16:33:24<9:42:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 0: 63%|██████▎ | 7802/12384 [16:33:32<9:42:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 0: 63%|██████▎ | 7803/12384 [16:33:32<9:41:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 0: 63%|██████▎ | 7803/12384 [16:33:39<9:41:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 0: 63%|██████▎ | 7804/12384 [16:33:39<9:41:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 0: 63%|██████▎ | 7804/12384 [16:33:47<9:41:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 0: 63%|██████▎ | 7805/12384 [16:33:47<9:41:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 0: 63%|██████▎ | 7805/12384 [16:33:55<9:41:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 63%|██████▎ | 7806/12384 [16:33:55<9:40:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 63%|██████▎ | 7806/12384 [16:34:02<9:40:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=2.93s]
Epoch 0: 63%|██████▎ | 7807/12384 [16:34:02<9:40:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=2.93s]
Epoch 0: 63%|██████▎ | 7807/12384 [16:34:10<9:40:56, 7.62s/it, loss=0.0005, acc=0.9980, iter_time=12.70s]
Epoch 0: 63%|██████▎ | 7808/12384 [16:34:10<9:42:05, 7.63s/it, loss=0.0005, acc=0.9980, iter_time=12.70s]
Epoch 0: 63%|██████▎ | 7808/12384 [16:34:18<9:42:05, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.27s]
Epoch 0: 63%|██████▎ | 7809/12384 [16:34:18<9:40:53, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.27s]
Epoch 0: 63%|██████▎ | 7809/12384 [16:34:25<9:40:53, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.58s]
Epoch 0: 63%|██████▎ | 7810/12384 [16:34:25<9:40:12, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.58s]
Epoch 0: 63%|██████▎ | 7810/12384 [16:34:33<9:40:12, 7.61s/it, loss=0.0001, acc=0.9991, iter_time=6.12s]
Epoch 0: 63%|██████▎ | 7811/12384 [16:34:33<9:40:07, 7.61s/it, loss=0.0001, acc=0.9991, iter_time=6.12s]
Epoch 0: 63%|██████▎ | 7811/12384 [16:34:40<9:40:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 0: 63%|██████▎ | 7812/12384 [16:34:40<9:39:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 0: 63%|██████▎ | 7812/12384 [16:34:48<9:39:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 0: 63%|██████▎ | 7813/12384 [16:34:48<9:39:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 0: 63%|██████▎ | 7813/12384 [16:34:56<9:39:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.33s]
Epoch 0: 63%|██████▎ | 7814/12384 [16:34:56<9:39:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.33s]
Epoch 0: 63%|██████▎ | 7814/12384 [16:35:03<9:39:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 63%|██████▎ | 7815/12384 [16:35:03<9:39:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 63%|██████▎ | 7815/12384 [16:35:11<9:39:24, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.91s]
Epoch 0: 63%|██████▎ | 7816/12384 [16:35:11<9:47:02, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.91s]
Epoch 0: 63%|██████▎ | 7816/12384 [16:35:19<9:47:02, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 63%|██████▎ | 7817/12384 [16:35:19<9:44:59, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 63%|██████▎ | 7817/12384 [16:35:26<9:44:59, 7.69s/it, loss=0.0003, acc=0.9982, iter_time=7.64s]
Epoch 0: 63%|██████▎ | 7818/12384 [16:35:26<9:42:59, 7.66s/it, loss=0.0003, acc=0.9982, iter_time=7.64s]
Epoch 0: 63%|██████▎ | 7818/12384 [16:35:34<9:42:59, 7.66s/it, loss=0.0001, acc=0.9996, iter_time=6.74s]
Epoch 0: 63%|██████▎ | 7819/12384 [16:35:34<9:41:22, 7.64s/it, loss=0.0001, acc=0.9996, iter_time=6.74s]
Epoch 0: 63%|██████▎ | 7819/12384 [16:35:42<9:41:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 0: 63%|██████▎ | 7820/12384 [16:35:42<9:40:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 0: 63%|██████▎ | 7820/12384 [16:35:49<9:40:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 63%|██████▎ | 7821/12384 [16:35:49<9:40:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 63%|██████▎ | 7821/12384 [16:35:57<9:40:47, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=4.58s]
Epoch 0: 63%|██████▎ | 7822/12384 [16:35:57<9:40:37, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=4.58s]
Epoch 0: 63%|██████▎ | 7822/12384 [16:36:04<9:40:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.67s]
Epoch 0: 63%|██████▎ | 7823/12384 [16:36:04<9:39:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.67s]
Epoch 0: 63%|██████▎ | 7823/12384 [16:36:12<9:39:44, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.32s]
Epoch 0: 63%|██████▎ | 7824/12384 [16:36:12<9:46:00, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=8.32s]
Epoch 0: 63%|██████▎ | 7824/12384 [16:36:20<9:46:00, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=3.90s]
Epoch 0: 63%|██████▎ | 7825/12384 [16:36:20<9:43:40, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=3.90s]
Epoch 0: 63%|██████▎ | 7825/12384 [16:36:28<9:43:40, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=8.83s]
Epoch 0: 63%|██████▎ | 7826/12384 [16:36:28<9:42:06, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=8.83s]
Epoch 0: 63%|██████▎ | 7826/12384 [16:36:35<9:42:06, 7.66s/it, loss=0.0028, acc=0.9944, iter_time=7.71s]
Epoch 0: 63%|██████▎ | 7827/12384 [16:36:35<9:42:11, 7.67s/it, loss=0.0028, acc=0.9944, iter_time=7.71s]
Epoch 0: 63%|██████▎ | 7827/12384 [16:36:43<9:42:11, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 0: 63%|██████▎ | 7828/12384 [16:36:43<9:40:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 0: 63%|██████▎ | 7828/12384 [16:36:50<9:40:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.40s]
Epoch 0: 63%|██████▎ | 7829/12384 [16:36:50<9:39:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.40s]
Epoch 0: 63%|██████▎ | 7829/12384 [16:36:58<9:39:33, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=11.79s]
Epoch 0: 63%|██████▎ | 7830/12384 [16:36:58<9:39:30, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=11.79s]
Epoch 0: 63%|██████▎ | 7830/12384 [16:37:06<9:39:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 63%|██████▎ | 7831/12384 [16:37:06<9:39:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 63%|██████▎ | 7831/12384 [16:37:13<9:39:16, 7.63s/it, loss=0.0005, acc=0.9983, iter_time=8.03s]
Epoch 0: 63%|██████▎ | 7832/12384 [16:37:13<9:38:32, 7.63s/it, loss=0.0005, acc=0.9983, iter_time=8.03s]
Epoch 0: 63%|██████▎ | 7832/12384 [16:37:21<9:38:32, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 0: 63%|██████▎ | 7833/12384 [16:37:21<9:37:52, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 0: 63%|██████▎ | 7833/12384 [16:37:29<9:37:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 0: 63%|██████▎ | 7834/12384 [16:37:29<9:38:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 0: 63%|██████▎ | 7834/12384 [16:37:36<9:38:01, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.71s]
Epoch 0: 63%|██████▎ | 7835/12384 [16:37:36<9:37:05, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.71s]
Epoch 0: 63%|██████▎ | 7835/12384 [16:37:44<9:37:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 63%|██████▎ | 7836/12384 [16:37:44<9:38:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 63%|██████▎ | 7836/12384 [16:37:52<9:38:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 63%|██████▎ | 7837/12384 [16:37:52<9:38:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 63%|██████▎ | 7837/12384 [16:37:59<9:38:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 63%|██████▎ | 7838/12384 [16:37:59<9:37:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 63%|██████▎ | 7838/12384 [16:38:07<9:37:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 63%|██████▎ | 7839/12384 [16:38:07<9:37:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 63%|██████▎ | 7839/12384 [16:38:14<9:37:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 63%|██████▎ | 7840/12384 [16:38:14<9:37:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 63%|██████▎ | 7840/12384 [16:38:22<9:37:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 63%|██████▎ | 7841/12384 [16:38:22<9:38:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 63%|██████▎ | 7841/12384 [16:38:30<9:38:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.77s]
Epoch 0: 63%|██████▎ | 7842/12384 [16:38:30<9:45:41, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.77s]
Epoch 0: 63%|██████▎ | 7842/12384 [16:38:38<9:45:41, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 63%|██████▎ | 7843/12384 [16:38:38<9:43:37, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 63%|██████▎ | 7843/12384 [16:38:45<9:43:37, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 63%|██████▎ | 7844/12384 [16:38:45<9:41:23, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 63%|██████▎ | 7844/12384 [16:38:53<9:41:23, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 0: 63%|██████▎ | 7845/12384 [16:38:53<9:39:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 0: 63%|██████▎ | 7845/12384 [16:39:00<9:39:33, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=6.79s]
Epoch 0: 63%|██████▎ | 7846/12384 [16:39:00<9:38:01, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.79s]
Epoch 0: 63%|██████▎ | 7846/12384 [16:39:08<9:38:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 0: 63%|██████▎ | 7847/12384 [16:39:08<9:37:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 0: 63%|██████▎ | 7847/12384 [16:39:16<9:37:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 63%|██████▎ | 7848/12384 [16:39:16<9:36:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 63%|██████▎ | 7848/12384 [16:39:23<9:36:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 63%|██████▎ | 7849/12384 [16:39:23<9:36:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 63%|██████▎ | 7849/12384 [16:39:31<9:36:27, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.00s]
Epoch 0: 63%|██████▎ | 7850/12384 [16:39:31<9:35:13, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.00s]
Epoch 0: 63%|██████▎ | 7850/12384 [16:39:39<9:35:13, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.71s]
Epoch 0: 63%|██████▎ | 7851/12384 [16:39:39<9:35:18, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.71s]
Epoch 0: 63%|██████▎ | 7851/12384 [16:39:46<9:35:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 0: 63%|██████▎ | 7852/12384 [16:39:46<9:35:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 0: 63%|██████▎ | 7852/12384 [16:39:54<9:35:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 63%|██████▎ | 7853/12384 [16:39:54<9:35:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 63%|██████▎ | 7853/12384 [16:40:01<9:35:22, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 63%|██████▎ | 7854/12384 [16:40:01<9:34:47, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 63%|██████▎ | 7854/12384 [16:40:09<9:34:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 63%|██████▎ | 7855/12384 [16:40:09<9:34:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 63%|██████▎ | 7855/12384 [16:40:17<9:34:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 63%|██████▎ | 7856/12384 [16:40:17<9:34:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 63%|██████▎ | 7856/12384 [16:40:24<9:34:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 63%|██████▎ | 7857/12384 [16:40:24<9:34:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 63%|██████▎ | 7857/12384 [16:40:32<9:34:54, 7.62s/it, loss=0.0001, acc=0.9997, iter_time=6.15s]
Epoch 0: 63%|██████▎ | 7858/12384 [16:40:32<9:34:54, 7.62s/it, loss=0.0001, acc=0.9997, iter_time=6.15s]
Epoch 0: 63%|██████▎ | 7858/12384 [16:40:40<9:34:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 0: 63%|██████▎ | 7859/12384 [16:40:40<9:35:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 0: 63%|██████▎ | 7859/12384 [16:40:47<9:35:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 0: 63%|██████▎ | 7860/12384 [16:40:47<9:35:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 0: 63%|██████▎ | 7860/12384 [16:40:55<9:35:06, 7.63s/it, loss=0.0001, acc=0.9989, iter_time=9.55s]
Epoch 0: 63%|██████▎ | 7861/12384 [16:40:55<9:34:19, 7.62s/it, loss=0.0001, acc=0.9989, iter_time=9.55s]
Epoch 0: 63%|██████▎ | 7861/12384 [16:41:02<9:34:19, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.67s]
Epoch 0: 63%|██████▎ | 7862/12384 [16:41:02<9:33:52, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.67s]
Epoch 0: 63%|██████▎ | 7862/12384 [16:41:10<9:33:52, 7.61s/it, loss=0.0002, acc=0.9998, iter_time=10.71s]
Epoch 0: 63%|██████▎ | 7863/12384 [16:41:10<9:33:16, 7.61s/it, loss=0.0002, acc=0.9998, iter_time=10.71s]
Epoch 0: 63%|██████▎ | 7863/12384 [16:41:18<9:33:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 64%|██████▎ | 7864/12384 [16:41:18<9:34:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 64%|██████▎ | 7864/12384 [16:41:25<9:34:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 64%|██████▎ | 7865/12384 [16:41:25<9:34:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 64%|██████▎ | 7865/12384 [16:41:33<9:34:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 0: 64%|██████▎ | 7866/12384 [16:41:33<9:34:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 0: 64%|██████▎ | 7866/12384 [16:41:40<9:34:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 0: 64%|██████▎ | 7867/12384 [16:41:40<9:33:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 0: 64%|██████▎ | 7867/12384 [16:41:48<9:33:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 64%|██████▎ | 7868/12384 [16:41:48<9:32:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 64%|██████▎ | 7868/12384 [16:41:56<9:32:46, 7.61s/it, loss=0.0008, acc=0.9966, iter_time=7.65s]
Epoch 0: 64%|██████▎ | 7869/12384 [16:41:56<9:40:33, 7.72s/it, loss=0.0008, acc=0.9966, iter_time=7.65s]
Epoch 0: 64%|██████▎ | 7869/12384 [16:42:04<9:40:33, 7.72s/it, loss=0.0001, acc=0.9990, iter_time=7.90s]
Epoch 0: 64%|██████▎ | 7870/12384 [16:42:04<9:37:45, 7.68s/it, loss=0.0001, acc=0.9990, iter_time=7.90s]
Epoch 0: 64%|██████▎ | 7870/12384 [16:42:11<9:37:45, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 0: 64%|██████▎ | 7871/12384 [16:42:11<9:36:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 0: 64%|██████▎ | 7871/12384 [16:42:19<9:36:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 0: 64%|██████▎ | 7872/12384 [16:42:19<9:35:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 0: 64%|██████▎ | 7872/12384 [16:42:26<9:35:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.51s]
Epoch 0: 64%|██████▎ | 7873/12384 [16:42:26<9:35:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.51s]
Epoch 0: 64%|██████▎ | 7873/12384 [16:42:34<9:35:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 0: 64%|██████▎ | 7874/12384 [16:42:34<9:33:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 0: 64%|██████▎ | 7874/12384 [16:42:42<9:33:57, 7.64s/it, loss=0.0004, acc=1.0000, iter_time=8.23s]
Epoch 0: 64%|██████▎ | 7875/12384 [16:42:42<9:33:37, 7.63s/it, loss=0.0004, acc=1.0000, iter_time=8.23s]
Epoch 0: 64%|██████▎ | 7875/12384 [16:42:49<9:33:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 0: 64%|██████▎ | 7876/12384 [16:42:49<9:34:58, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 0: 64%|██████▎ | 7876/12384 [16:42:57<9:34:58, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 64%|██████▎ | 7877/12384 [16:42:57<9:40:28, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 64%|██████▎ | 7877/12384 [16:43:05<9:40:28, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 0: 64%|██████▎ | 7878/12384 [16:43:05<9:40:27, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 0: 64%|██████▎ | 7878/12384 [16:43:13<9:40:27, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 64%|██████▎ | 7879/12384 [16:43:13<9:37:32, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 64%|██████▎ | 7879/12384 [16:43:20<9:37:32, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 0: 64%|██████▎ | 7880/12384 [16:43:20<9:34:56, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 0: 64%|██████▎ | 7880/12384 [16:43:28<9:34:56, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 0: 64%|██████▎ | 7881/12384 [16:43:28<9:33:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 0: 64%|██████▎ | 7881/12384 [16:43:35<9:33:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 0: 64%|██████▎ | 7882/12384 [16:43:35<9:32:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 0: 64%|██████▎ | 7882/12384 [16:43:43<9:32:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 64%|██████▎ | 7883/12384 [16:43:43<9:33:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 64%|██████▎ | 7883/12384 [16:43:51<9:33:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 0: 64%|██████▎ | 7884/12384 [16:43:51<9:32:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 0: 64%|██████▎ | 7884/12384 [16:43:58<9:32:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 0: 64%|██████▎ | 7885/12384 [16:43:58<9:32:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 0: 64%|██████▎ | 7885/12384 [16:44:06<9:32:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 0: 64%|██████▎ | 7886/12384 [16:44:06<9:31:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 0: 64%|██████▎ | 7886/12384 [16:44:14<9:31:08, 7.62s/it, loss=0.0010, acc=0.9977, iter_time=7.01s]
Epoch 0: 64%|██████▎ | 7887/12384 [16:44:14<9:30:32, 7.61s/it, loss=0.0010, acc=0.9977, iter_time=7.01s]
Epoch 0: 64%|██████▎ | 7887/12384 [16:44:21<9:30:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.06s]
Epoch 0: 64%|██████▎ | 7888/12384 [16:44:21<9:30:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.06s]
Epoch 0: 64%|██████▎ | 7888/12384 [16:44:29<9:30:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 64%|██████▎ | 7889/12384 [16:44:29<9:31:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 64%|██████▎ | 7889/12384 [16:44:36<9:31:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 64%|██████▎ | 7890/12384 [16:44:36<9:30:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 64%|██████▎ | 7890/12384 [16:44:44<9:30:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 0: 64%|██████▎ | 7891/12384 [16:44:44<9:30:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 0: 64%|██████▎ | 7891/12384 [16:44:52<9:30:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.48s]
Epoch 0: 64%|██████▎ | 7892/12384 [16:44:52<9:30:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.48s]
Epoch 0: 64%|██████▎ | 7892/12384 [16:44:59<9:30:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 64%|██████▎ | 7893/12384 [16:44:59<9:30:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 64%|██████▎ | 7893/12384 [16:45:07<9:30:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 64%|██████▎ | 7894/12384 [16:45:07<9:30:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 64%|██████▎ | 7894/12384 [16:45:15<9:30:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 64%|██████▍ | 7895/12384 [16:45:15<9:37:14, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 64%|██████▍ | 7895/12384 [16:45:22<9:37:14, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 0: 64%|██████▍ | 7896/12384 [16:45:22<9:34:20, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 0: 64%|██████▍ | 7896/12384 [16:45:30<9:34:20, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.12s]
Epoch 0: 64%|██████▍ | 7897/12384 [16:45:30<9:32:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.12s]
Epoch 0: 64%|██████▍ | 7897/12384 [16:45:38<9:32:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 0: 64%|██████▍ | 7898/12384 [16:45:38<9:31:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 0: 64%|██████▍ | 7898/12384 [16:45:45<9:31:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 0: 64%|██████▍ | 7899/12384 [16:45:45<9:31:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 0: 64%|██████▍ | 7899/12384 [16:45:53<9:31:01, 7.64s/it, loss=0.0003, acc=0.9994, iter_time=8.07s]
Epoch 0: 64%|██████▍ | 7900/12384 [16:45:53<9:30:41, 7.64s/it, loss=0.0003, acc=0.9994, iter_time=8.07s]
Epoch 0: 64%|██████▍ | 7900/12384 [16:46:01<9:30:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 64%|██████▍ | 7901/12384 [16:46:01<9:29:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 64%|██████▍ | 7901/12384 [16:46:08<9:29:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 0: 64%|██████▍ | 7902/12384 [16:46:08<9:29:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 0: 64%|██████▍ | 7902/12384 [16:46:16<9:29:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.45s]
Epoch 0: 64%|██████▍ | 7903/12384 [16:46:16<9:35:41, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.45s]
Epoch 0: 64%|██████▍ | 7903/12384 [16:46:24<9:35:41, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 0: 64%|██████▍ | 7904/12384 [16:46:24<9:33:15, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 0: 64%|██████▍ | 7904/12384 [16:46:31<9:33:15, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 64%|██████▍ | 7905/12384 [16:46:31<9:31:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 64%|██████▍ | 7905/12384 [16:46:39<9:31:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 64%|██████▍ | 7906/12384 [16:46:39<9:30:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 64%|██████▍ | 7906/12384 [16:46:46<9:30:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 64%|██████▍ | 7907/12384 [16:46:46<9:29:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 64%|██████▍ | 7907/12384 [16:46:54<9:29:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 64%|██████▍ | 7908/12384 [16:46:54<9:29:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 64%|██████▍ | 7908/12384 [16:47:02<9:29:22, 7.63s/it, loss=0.0005, acc=0.9988, iter_time=7.64s]
Epoch 0: 64%|██████▍ | 7909/12384 [16:47:02<9:29:07, 7.63s/it, loss=0.0005, acc=0.9988, iter_time=7.64s]
Epoch 0: 64%|██████▍ | 7909/12384 [16:47:09<9:29:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 64%|██████▍ | 7910/12384 [16:47:09<9:28:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 64%|██████▍ | 7910/12384 [16:47:17<9:28:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 0: 64%|██████▍ | 7911/12384 [16:47:17<9:28:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 0: 64%|██████▍ | 7911/12384 [16:47:25<9:28:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.33s]
Epoch 0: 64%|██████▍ | 7912/12384 [16:47:25<9:27:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.33s]
Epoch 0: 64%|██████▍ | 7912/12384 [16:47:32<9:27:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 64%|██████▍ | 7913/12384 [16:47:32<9:27:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 64%|██████▍ | 7913/12384 [16:47:40<9:27:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 64%|██████▍ | 7914/12384 [16:47:40<9:27:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 64%|██████▍ | 7914/12384 [16:47:47<9:27:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 64%|██████▍ | 7915/12384 [16:47:47<9:27:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 64%|██████▍ | 7915/12384 [16:47:55<9:27:32, 7.62s/it, loss=0.0007, acc=0.9983, iter_time=7.63s]
Epoch 0: 64%|██████▍ | 7916/12384 [16:47:55<9:28:43, 7.64s/it, loss=0.0007, acc=0.9983, iter_time=7.63s]
Epoch 0: 64%|██████▍ | 7916/12384 [16:48:03<9:28:43, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=5.86s]
Epoch 0: 64%|██████▍ | 7917/12384 [16:48:03<9:28:15, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=5.86s]
Epoch 0: 64%|██████▍ | 7917/12384 [16:48:10<9:28:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 0: 64%|██████▍ | 7918/12384 [16:48:10<9:27:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 0: 64%|██████▍ | 7918/12384 [16:48:18<9:27:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 0: 64%|██████▍ | 7919/12384 [16:48:18<9:26:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 0: 64%|██████▍ | 7919/12384 [16:48:26<9:26:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 64%|██████▍ | 7920/12384 [16:48:26<9:26:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 64%|██████▍ | 7920/12384 [16:48:34<9:26:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 64%|██████▍ | 7921/12384 [16:48:34<9:34:12, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 64%|██████▍ | 7921/12384 [16:48:41<9:34:12, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 64%|██████▍ | 7922/12384 [16:48:41<9:31:09, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 64%|██████▍ | 7922/12384 [16:48:49<9:31:09, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=3.58s]
Epoch 0: 64%|██████▍ | 7923/12384 [16:48:49<9:29:31, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=3.58s]
Epoch 0: 64%|██████▍ | 7923/12384 [16:48:56<9:29:31, 7.66s/it, loss=0.0015, acc=0.9970, iter_time=11.62s]
Epoch 0: 64%|██████▍ | 7924/12384 [16:48:56<9:27:48, 7.64s/it, loss=0.0015, acc=0.9970, iter_time=11.62s]
Epoch 0: 64%|██████▍ | 7924/12384 [16:49:04<9:27:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 0: 64%|██████▍ | 7925/12384 [16:49:04<9:27:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 0: 64%|██████▍ | 7925/12384 [16:49:12<9:27:05, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=8.56s]
Epoch 0: 64%|██████▍ | 7926/12384 [16:49:12<9:26:13, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=8.56s]
Epoch 0: 64%|██████▍ | 7926/12384 [16:49:19<9:26:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.98s]
Epoch 0: 64%|██████▍ | 7927/12384 [16:49:19<9:26:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.98s]
Epoch 0: 64%|██████▍ | 7927/12384 [16:49:27<9:26:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 0: 64%|██████▍ | 7928/12384 [16:49:27<9:27:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 0: 64%|██████▍ | 7928/12384 [16:49:35<9:27:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 0: 64%|██████▍ | 7929/12384 [16:49:35<9:33:10, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 0: 64%|██████▍ | 7929/12384 [16:49:42<9:33:10, 7.72s/it, loss=0.0017, acc=0.9938, iter_time=7.60s]
Epoch 0: 64%|██████▍ | 7930/12384 [16:49:42<9:30:19, 7.68s/it, loss=0.0017, acc=0.9938, iter_time=7.60s]
Epoch 0: 64%|██████▍ | 7930/12384 [16:49:50<9:30:19, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 64%|██████▍ | 7931/12384 [16:49:50<9:28:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 64%|██████▍ | 7931/12384 [16:49:58<9:28:16, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 64%|██████▍ | 7932/12384 [16:49:58<9:27:04, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 64%|██████▍ | 7932/12384 [16:50:05<9:27:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 64%|██████▍ | 7933/12384 [16:50:05<9:26:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 64%|██████▍ | 7933/12384 [16:50:13<9:26:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 64%|██████▍ | 7934/12384 [16:50:13<9:25:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 64%|██████▍ | 7934/12384 [16:50:20<9:25:30, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.69s]
Epoch 0: 64%|██████▍ | 7935/12384 [16:50:20<9:24:34, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.69s]
Epoch 0: 64%|██████▍ | 7935/12384 [16:50:28<9:24:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.90s]
Epoch 0: 64%|██████▍ | 7936/12384 [16:50:28<9:24:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.90s]
Epoch 0: 64%|██████▍ | 7936/12384 [16:50:36<9:24:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.66s]
Epoch 0: 64%|██████▍ | 7937/12384 [16:50:36<9:24:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.66s]
Epoch 0: 64%|██████▍ | 7937/12384 [16:50:43<9:24:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 0: 64%|██████▍ | 7938/12384 [16:50:43<9:24:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 0: 64%|██████▍ | 7938/12384 [16:50:51<9:24:26, 7.62s/it, loss=0.0006, acc=0.9979, iter_time=7.20s]
Epoch 0: 64%|██████▍ | 7939/12384 [16:50:51<9:23:30, 7.61s/it, loss=0.0006, acc=0.9979, iter_time=7.20s]
Epoch 0: 64%|██████▍ | 7939/12384 [16:50:58<9:23:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.59s]
Epoch 0: 64%|██████▍ | 7940/12384 [16:50:58<9:23:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.59s]
Epoch 0: 64%|██████▍ | 7940/12384 [16:51:06<9:23:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 0: 64%|██████▍ | 7941/12384 [16:51:06<9:22:53, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 0: 64%|██████▍ | 7941/12384 [16:51:14<9:22:53, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=5.75s]
Epoch 0: 64%|██████▍ | 7942/12384 [16:51:14<9:22:23, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=5.75s]
Epoch 0: 64%|██████▍ | 7942/12384 [16:51:21<9:22:23, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.35s]
Epoch 0: 64%|██████▍ | 7943/12384 [16:51:21<9:22:35, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.35s]
Epoch 0: 64%|██████▍ | 7943/12384 [16:51:29<9:22:35, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 64%|██████▍ | 7944/12384 [16:51:29<9:22:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 64%|██████▍ | 7944/12384 [16:51:36<9:22:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 64%|██████▍ | 7945/12384 [16:51:36<9:22:29, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 64%|██████▍ | 7945/12384 [16:51:44<9:22:29, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 0: 64%|██████▍ | 7946/12384 [16:51:44<9:23:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 0: 64%|██████▍ | 7946/12384 [16:51:52<9:23:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.68s]
Epoch 0: 64%|██████▍ | 7947/12384 [16:51:52<9:30:35, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.68s]
Epoch 0: 64%|██████▍ | 7947/12384 [16:52:00<9:30:35, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=9.68s]
Epoch 0: 64%|██████▍ | 7948/12384 [16:52:00<9:28:05, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=9.68s]
Epoch 0: 64%|██████▍ | 7948/12384 [16:52:07<9:28:05, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 0: 64%|██████▍ | 7949/12384 [16:52:07<9:26:20, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 0: 64%|██████▍ | 7949/12384 [16:52:15<9:26:20, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=9.82s]
Epoch 0: 64%|██████▍ | 7950/12384 [16:52:15<9:25:05, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=9.82s]
Epoch 0: 64%|██████▍ | 7950/12384 [16:52:22<9:25:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 64%|██████▍ | 7951/12384 [16:52:22<9:23:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 64%|██████▍ | 7951/12384 [16:52:30<9:23:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 64%|██████▍ | 7952/12384 [16:52:30<9:23:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 64%|██████▍ | 7952/12384 [16:52:38<9:23:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 64%|██████▍ | 7953/12384 [16:52:38<9:22:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 64%|██████▍ | 7953/12384 [16:52:45<9:22:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 64%|██████▍ | 7954/12384 [16:52:45<9:22:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 64%|██████▍ | 7954/12384 [16:52:53<9:22:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 0: 64%|██████▍ | 7955/12384 [16:52:53<9:29:54, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 0: 64%|██████▍ | 7955/12384 [16:53:01<9:29:54, 7.72s/it, loss=0.0005, acc=0.9976, iter_time=7.59s]
Epoch 0: 64%|██████▍ | 7956/12384 [16:53:01<9:27:00, 7.68s/it, loss=0.0005, acc=0.9976, iter_time=7.59s]
Epoch 0: 64%|██████▍ | 7956/12384 [16:53:08<9:27:00, 7.68s/it, loss=0.0010, acc=0.9974, iter_time=7.62s]
Epoch 0: 64%|██████▍ | 7957/12384 [16:53:08<9:25:12, 7.66s/it, loss=0.0010, acc=0.9974, iter_time=7.62s]
Epoch 0: 64%|██████▍ | 7957/12384 [16:53:16<9:25:12, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 64%|██████▍ | 7958/12384 [16:53:16<9:23:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 64%|██████▍ | 7958/12384 [16:53:24<9:23:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.98s]
Epoch 0: 64%|██████▍ | 7959/12384 [16:53:24<9:22:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.98s]
Epoch 0: 64%|██████▍ | 7959/12384 [16:53:31<9:22:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.60s]
Epoch 0: 64%|██████▍ | 7960/12384 [16:53:31<9:21:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.60s]
Epoch 0: 64%|██████▍ | 7960/12384 [16:53:39<9:21:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 64%|██████▍ | 7961/12384 [16:53:39<9:21:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 64%|██████▍ | 7961/12384 [16:53:46<9:21:09, 7.61s/it, loss=0.0000, acc=0.9999, iter_time=7.60s]
Epoch 0: 64%|██████▍ | 7962/12384 [16:53:46<9:20:55, 7.61s/it, loss=0.0000, acc=0.9999, iter_time=7.60s]
Epoch 0: 64%|██████▍ | 7962/12384 [16:53:54<9:20:55, 7.61s/it, loss=0.0010, acc=0.9963, iter_time=7.60s]
Epoch 0: 64%|██████▍ | 7963/12384 [16:53:54<9:20:56, 7.61s/it, loss=0.0010, acc=0.9963, iter_time=7.60s]
Epoch 0: 64%|██████▍ | 7963/12384 [16:54:02<9:20:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 0: 64%|██████▍ | 7964/12384 [16:54:02<9:20:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 0: 64%|██████▍ | 7964/12384 [16:54:09<9:20:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.41s]
Epoch 0: 64%|██████▍ | 7965/12384 [16:54:09<9:20:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.41s]
Epoch 0: 64%|██████▍ | 7965/12384 [16:54:17<9:20:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.06s]
Epoch 0: 64%|██████▍ | 7966/12384 [16:54:17<9:20:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.06s]
Epoch 0: 64%|██████▍ | 7966/12384 [16:54:24<9:20:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 0: 64%|██████▍ | 7967/12384 [16:54:24<9:20:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 0: 64%|██████▍ | 7967/12384 [16:54:32<9:20:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.09s]
Epoch 0: 64%|██████▍ | 7968/12384 [16:54:32<9:20:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.09s]
Epoch 0: 64%|██████▍ | 7968/12384 [16:54:40<9:20:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 0: 64%|██████▍ | 7969/12384 [16:54:40<9:20:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 0: 64%|██████▍ | 7969/12384 [16:54:47<9:20:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.45s]
Epoch 0: 64%|██████▍ | 7970/12384 [16:54:47<9:20:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.45s]
Epoch 0: 64%|██████▍ | 7970/12384 [16:54:55<9:20:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 0: 64%|██████▍ | 7971/12384 [16:54:55<9:19:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 0: 64%|██████▍ | 7971/12384 [16:55:03<9:19:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 64%|██████▍ | 7972/12384 [16:55:03<9:19:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 64%|██████▍ | 7972/12384 [16:55:10<9:19:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 64%|██████▍ | 7973/12384 [16:55:10<9:27:10, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 64%|██████▍ | 7973/12384 [16:55:18<9:27:10, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 64%|██████▍ | 7974/12384 [16:55:18<9:24:42, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 64%|██████▍ | 7974/12384 [16:55:26<9:24:42, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=4.48s]
Epoch 0: 64%|██████▍ | 7975/12384 [16:55:26<9:22:25, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=4.48s]
Epoch 0: 64%|██████▍ | 7975/12384 [16:55:33<9:22:25, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.33s]
Epoch 0: 64%|██████▍ | 7976/12384 [16:55:33<9:21:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.33s]
Epoch 0: 64%|██████▍ | 7976/12384 [16:55:41<9:21:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 64%|██████▍ | 7977/12384 [16:55:41<9:20:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 64%|██████▍ | 7977/12384 [16:55:48<9:20:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 64%|██████▍ | 7978/12384 [16:55:48<9:20:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 64%|██████▍ | 7978/12384 [16:55:56<9:20:06, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.59s]
Epoch 0: 64%|██████▍ | 7979/12384 [16:55:56<9:19:34, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.59s]
Epoch 0: 64%|██████▍ | 7979/12384 [16:56:04<9:19:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 64%|██████▍ | 7980/12384 [16:56:04<9:19:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 64%|██████▍ | 7980/12384 [16:56:12<9:19:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 64%|██████▍ | 7981/12384 [16:56:12<9:25:17, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 64%|██████▍ | 7981/12384 [16:56:19<9:25:17, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 64%|██████▍ | 7982/12384 [16:56:19<9:23:00, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 64%|██████▍ | 7982/12384 [16:56:27<9:23:00, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 0: 64%|██████▍ | 7983/12384 [16:56:27<9:22:58, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 0: 64%|██████▍ | 7983/12384 [16:56:35<9:22:58, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.57s]
Epoch 0: 64%|██████▍ | 7984/12384 [16:56:35<9:21:47, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.57s]
Epoch 0: 64%|██████▍ | 7984/12384 [16:56:42<9:21:47, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.03s]
Epoch 0: 64%|██████▍ | 7985/12384 [16:56:42<9:20:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.03s]
Epoch 0: 64%|██████▍ | 7985/12384 [16:56:50<9:20:42, 7.65s/it, loss=0.0028, acc=0.9967, iter_time=8.80s]
Epoch 0: 64%|██████▍ | 7986/12384 [16:56:50<9:20:55, 7.65s/it, loss=0.0028, acc=0.9967, iter_time=8.80s]
Epoch 0: 64%|██████▍ | 7986/12384 [16:56:57<9:20:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 64%|██████▍ | 7987/12384 [16:56:57<9:19:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 64%|██████▍ | 7987/12384 [16:57:05<9:19:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.20s]
Epoch 0: 65%|██████▍ | 7988/12384 [16:57:05<9:19:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.20s]
Epoch 0: 65%|██████▍ | 7988/12384 [16:57:13<9:19:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.03s]
Epoch 0: 65%|██████▍ | 7989/12384 [16:57:13<9:18:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.03s]
Epoch 0: 65%|██████▍ | 7989/12384 [16:57:20<9:18:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 0: 65%|██████▍ | 7990/12384 [16:57:20<9:17:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 0: 65%|██████▍ | 7990/12384 [16:57:28<9:17:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.40s]
Epoch 0: 65%|██████▍ | 7991/12384 [16:57:28<9:17:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.40s]
Epoch 0: 65%|██████▍ | 7991/12384 [16:57:35<9:17:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 0: 65%|██████▍ | 7992/12384 [16:57:35<9:17:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 0: 65%|██████▍ | 7992/12384 [16:57:43<9:17:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 65%|██████▍ | 7993/12384 [16:57:43<9:16:14, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 65%|██████▍ | 7993/12384 [16:57:51<9:16:14, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 65%|██████▍ | 7994/12384 [16:57:51<9:16:08, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 65%|██████▍ | 7994/12384 [16:57:58<9:16:08, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 0: 65%|██████▍ | 7995/12384 [16:57:58<9:15:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 0: 65%|██████▍ | 7995/12384 [16:58:06<9:15:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 0: 65%|██████▍ | 7996/12384 [16:58:06<9:15:48, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 0: 65%|██████▍ | 7996/12384 [16:58:13<9:15:48, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 0: 65%|██████▍ | 7997/12384 [16:58:13<9:15:40, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 0: 65%|██████▍ | 7997/12384 [16:58:21<9:15:40, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.73s]
Epoch 0: 65%|██████▍ | 7998/12384 [16:58:21<9:15:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.73s]
Epoch 0: 65%|██████▍ | 7998/12384 [16:58:29<9:15:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.41s]
Epoch 0: 65%|██████▍ | 7999/12384 [16:58:29<9:15:42, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.41s]
Epoch 0: 65%|██████▍ | 7999/12384 [16:58:37<9:15:42, 7.60s/it, loss=0.0003, acc=0.9984, iter_time=8.35s]
Epoch 0: 65%|██████▍ | 8000/12384 [16:58:37<9:27:03, 7.76s/it, loss=0.0003, acc=0.9984, iter_time=8.35s]
Epoch 0: 65%|██████▍ | 8000/12384 [16:58:44<9:27:03, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.41s]
Epoch 0: 65%|██████▍ | 8001/12384 [16:58:44<9:23:35, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.41s]
Epoch 0: 65%|██████▍ | 8001/12384 [16:58:52<9:23:35, 7.72s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 65%|██████▍ | 8002/12384 [16:58:52<9:21:05, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 65%|██████▍ | 8002/12384 [16:59:00<9:21:05, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 0: 65%|██████▍ | 8003/12384 [16:59:00<9:18:56, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 0: 65%|██████▍ | 8003/12384 [16:59:07<9:18:56, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.59s]
Epoch 0: 65%|██████▍ | 8004/12384 [16:59:07<9:19:35, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.59s]
Epoch 0: 65%|██████▍ | 8004/12384 [16:59:15<9:19:35, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 0: 65%|██████▍ | 8005/12384 [16:59:15<9:18:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 0: 65%|██████▍ | 8005/12384 [16:59:23<9:18:02, 7.65s/it, loss=0.0001, acc=0.9991, iter_time=7.88s]
Epoch 0: 65%|██████▍ | 8006/12384 [16:59:23<9:22:35, 7.71s/it, loss=0.0001, acc=0.9991, iter_time=7.88s]
Epoch 0: 65%|██████▍ | 8006/12384 [16:59:30<9:22:35, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=3.58s]
Epoch 0: 65%|██████▍ | 8007/12384 [16:59:30<9:20:32, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=3.58s]
Epoch 0: 65%|██████▍ | 8007/12384 [16:59:38<9:20:32, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=12.03s]
Epoch 0: 65%|██████▍ | 8008/12384 [16:59:38<9:19:06, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=12.03s]
Epoch 0: 65%|██████▍ | 8008/12384 [16:59:46<9:19:06, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.30s]
Epoch 0: 65%|██████▍ | 8009/12384 [16:59:46<9:17:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.30s]
Epoch 0: 65%|██████▍ | 8009/12384 [16:59:53<9:17:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 0: 65%|██████▍ | 8010/12384 [16:59:53<9:16:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 0: 65%|██████▍ | 8010/12384 [17:00:01<9:16:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 0: 65%|██████▍ | 8011/12384 [17:00:01<9:15:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 0: 65%|██████▍ | 8011/12384 [17:00:08<9:15:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 0: 65%|██████▍ | 8012/12384 [17:00:08<9:15:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 0: 65%|██████▍ | 8012/12384 [17:00:16<9:15:20, 7.62s/it, loss=0.0007, acc=0.9986, iter_time=7.61s]
Epoch 0: 65%|██████▍ | 8013/12384 [17:00:16<9:14:34, 7.61s/it, loss=0.0007, acc=0.9986, iter_time=7.61s]
Epoch 0: 65%|██████▍ | 8013/12384 [17:00:24<9:14:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 65%|██████▍ | 8014/12384 [17:00:24<9:14:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 65%|██████▍ | 8014/12384 [17:00:31<9:14:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 65%|██████▍ | 8015/12384 [17:00:31<9:14:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 65%|██████▍ | 8015/12384 [17:00:39<9:14:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 65%|██████▍ | 8016/12384 [17:00:39<9:14:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 65%|██████▍ | 8016/12384 [17:00:46<9:14:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 65%|██████▍ | 8017/12384 [17:00:46<9:14:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 65%|██████▍ | 8017/12384 [17:00:54<9:14:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 65%|██████▍ | 8018/12384 [17:00:54<9:13:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 65%|██████▍ | 8018/12384 [17:01:02<9:13:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 65%|██████▍ | 8019/12384 [17:01:02<9:13:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 65%|██████▍ | 8019/12384 [17:01:09<9:13:36, 7.61s/it, loss=0.0002, acc=0.9998, iter_time=7.61s]
Epoch 0: 65%|██████▍ | 8020/12384 [17:01:09<9:15:23, 7.64s/it, loss=0.0002, acc=0.9998, iter_time=7.61s]
Epoch 0: 65%|██████▍ | 8020/12384 [17:01:17<9:15:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 0: 65%|██████▍ | 8021/12384 [17:01:17<9:14:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 0: 65%|██████▍ | 8021/12384 [17:01:25<9:14:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 65%|██████▍ | 8022/12384 [17:01:25<9:13:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 65%|██████▍ | 8022/12384 [17:01:32<9:13:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 65%|██████▍ | 8023/12384 [17:01:32<9:13:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 65%|██████▍ | 8023/12384 [17:01:40<9:13:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 0: 65%|██████▍ | 8024/12384 [17:01:40<9:14:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 0: 65%|██████▍ | 8024/12384 [17:01:47<9:14:20, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.65s]
Epoch 0: 65%|██████▍ | 8025/12384 [17:01:47<9:14:17, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.65s]
Epoch 0: 65%|██████▍ | 8025/12384 [17:01:55<9:14:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 65%|██████▍ | 8026/12384 [17:01:55<9:19:17, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 65%|██████▍ | 8026/12384 [17:02:03<9:19:17, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 0: 65%|██████▍ | 8027/12384 [17:02:03<9:16:57, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 0: 65%|██████▍ | 8027/12384 [17:02:11<9:16:57, 7.67s/it, loss=0.0001, acc=0.9998, iter_time=7.86s]
Epoch 0: 65%|██████▍ | 8028/12384 [17:02:11<9:16:50, 7.67s/it, loss=0.0001, acc=0.9998, iter_time=7.86s]
Epoch 0: 65%|██████▍ | 8028/12384 [17:02:18<9:16:50, 7.67s/it, loss=0.0006, acc=0.9988, iter_time=9.69s]
Epoch 0: 65%|██████▍ | 8029/12384 [17:02:18<9:15:27, 7.65s/it, loss=0.0006, acc=0.9988, iter_time=9.69s]
Epoch 0: 65%|██████▍ | 8029/12384 [17:02:26<9:15:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 65%|██████▍ | 8030/12384 [17:02:26<9:14:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 65%|██████▍ | 8030/12384 [17:02:33<9:14:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 65%|██████▍ | 8031/12384 [17:02:33<9:13:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 65%|██████▍ | 8031/12384 [17:02:41<9:13:17, 7.63s/it, loss=0.0008, acc=0.9976, iter_time=7.98s]
Epoch 0: 65%|██████▍ | 8032/12384 [17:02:41<9:12:59, 7.62s/it, loss=0.0008, acc=0.9976, iter_time=7.98s]
Epoch 0: 65%|██████▍ | 8032/12384 [17:02:49<9:12:59, 7.62s/it, loss=0.0001, acc=0.9994, iter_time=4.48s]
Epoch 0: 65%|██████▍ | 8033/12384 [17:02:49<9:12:41, 7.62s/it, loss=0.0001, acc=0.9994, iter_time=4.48s]
Epoch 0: 65%|██████▍ | 8033/12384 [17:02:56<9:12:41, 7.62s/it, loss=0.0001, acc=0.9988, iter_time=10.36s]
Epoch 0: 65%|██████▍ | 8034/12384 [17:02:56<9:11:57, 7.61s/it, loss=0.0001, acc=0.9988, iter_time=10.36s]
Epoch 0: 65%|██████▍ | 8034/12384 [17:03:04<9:11:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 0: 65%|██████▍ | 8035/12384 [17:03:04<9:11:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 0: 65%|██████▍ | 8035/12384 [17:03:11<9:11:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 0: 65%|██████▍ | 8036/12384 [17:03:11<9:11:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 0: 65%|██████▍ | 8036/12384 [17:03:19<9:11:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 0: 65%|██████▍ | 8037/12384 [17:03:19<9:11:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 0: 65%|██████▍ | 8037/12384 [17:03:27<9:11:26, 7.61s/it, loss=0.0002, acc=0.9989, iter_time=9.62s]
Epoch 0: 65%|██████▍ | 8038/12384 [17:03:27<9:10:58, 7.61s/it, loss=0.0002, acc=0.9989, iter_time=9.62s]
Epoch 0: 65%|██████▍ | 8038/12384 [17:03:34<9:10:58, 7.61s/it, loss=0.0004, acc=0.9998, iter_time=5.56s]
Epoch 0: 65%|██████▍ | 8039/12384 [17:03:34<9:10:56, 7.61s/it, loss=0.0004, acc=0.9998, iter_time=5.56s]
Epoch 0: 65%|██████▍ | 8039/12384 [17:03:42<9:10:56, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.61s]
Epoch 0: 65%|██████▍ | 8040/12384 [17:03:42<9:10:58, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.61s]
Epoch 0: 65%|██████▍ | 8040/12384 [17:03:49<9:10:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 0: 65%|██████▍ | 8041/12384 [17:03:49<9:10:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 0: 65%|██████▍ | 8041/12384 [17:03:57<9:10:47, 7.61s/it, loss=0.0012, acc=0.9988, iter_time=7.91s]
Epoch 0: 65%|██████▍ | 8042/12384 [17:03:57<9:11:10, 7.62s/it, loss=0.0012, acc=0.9988, iter_time=7.91s]
Epoch 0: 65%|██████▍ | 8042/12384 [17:04:05<9:11:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.66s]
Epoch 0: 65%|██████▍ | 8043/12384 [17:04:05<9:10:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.66s]
Epoch 0: 65%|██████▍ | 8043/12384 [17:04:12<9:10:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 0: 65%|██████▍ | 8044/12384 [17:04:12<9:09:46, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 0: 65%|██████▍ | 8044/12384 [17:04:20<9:09:46, 7.60s/it, loss=0.0003, acc=0.9994, iter_time=11.09s]
Epoch 0: 65%|██████▍ | 8045/12384 [17:04:20<9:09:56, 7.60s/it, loss=0.0003, acc=0.9994, iter_time=11.09s]
Epoch 0: 65%|██████▍ | 8045/12384 [17:04:28<9:09:56, 7.60s/it, loss=0.0013, acc=0.9981, iter_time=7.64s]
Epoch 0: 65%|██████▍ | 8046/12384 [17:04:28<9:09:57, 7.61s/it, loss=0.0013, acc=0.9981, iter_time=7.64s]
Epoch 0: 65%|██████▍ | 8046/12384 [17:04:35<9:09:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 65%|██████▍ | 8047/12384 [17:04:35<9:10:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 65%|██████▍ | 8047/12384 [17:04:43<9:10:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 65%|██████▍ | 8048/12384 [17:04:43<9:10:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 65%|██████▍ | 8048/12384 [17:04:50<9:10:15, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.66s]
Epoch 0: 65%|██████▍ | 8049/12384 [17:04:50<9:09:48, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.66s]
Epoch 0: 65%|██████▍ | 8049/12384 [17:04:58<9:09:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 65%|██████▌ | 8050/12384 [17:04:58<9:10:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 65%|██████▌ | 8050/12384 [17:05:06<9:10:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.59s]
Epoch 0: 65%|██████▌ | 8051/12384 [17:05:06<9:09:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.59s]
Epoch 0: 65%|██████▌ | 8051/12384 [17:05:13<9:09:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.20s]
Epoch 0: 65%|██████▌ | 8052/12384 [17:05:13<9:09:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.20s]
Epoch 0: 65%|██████▌ | 8052/12384 [17:05:21<9:09:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 0: 65%|██████▌ | 8053/12384 [17:05:21<9:17:05, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 0: 65%|██████▌ | 8053/12384 [17:05:29<9:17:05, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 0: 65%|██████▌ | 8054/12384 [17:05:29<9:14:52, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 0: 65%|██████▌ | 8054/12384 [17:05:36<9:14:52, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 65%|██████▌ | 8055/12384 [17:05:36<9:12:56, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 65%|██████▌ | 8055/12384 [17:05:44<9:12:56, 7.66s/it, loss=0.0006, acc=0.9981, iter_time=7.54s]
Epoch 0: 65%|██████▌ | 8056/12384 [17:05:44<9:11:33, 7.65s/it, loss=0.0006, acc=0.9981, iter_time=7.54s]
Epoch 0: 65%|██████▌ | 8056/12384 [17:05:52<9:11:33, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.64s]
Epoch 0: 65%|██████▌ | 8057/12384 [17:05:52<9:10:23, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.64s]
Epoch 0: 65%|██████▌ | 8057/12384 [17:05:59<9:10:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 65%|██████▌ | 8058/12384 [17:05:59<9:09:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 65%|██████▌ | 8058/12384 [17:06:07<9:09:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 65%|██████▌ | 8059/12384 [17:06:07<9:09:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 65%|██████▌ | 8059/12384 [17:06:14<9:09:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.37s]
Epoch 0: 65%|██████▌ | 8060/12384 [17:06:14<9:08:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.37s]
Epoch 0: 65%|██████▌ | 8060/12384 [17:06:22<9:08:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.33s]
Epoch 0: 65%|██████▌ | 8061/12384 [17:06:22<9:08:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.33s]
Epoch 0: 65%|██████▌ | 8061/12384 [17:06:30<9:08:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 0: 65%|██████▌ | 8062/12384 [17:06:30<9:08:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 0: 65%|██████▌ | 8062/12384 [17:06:37<9:08:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 0: 65%|██████▌ | 8063/12384 [17:06:37<9:08:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 0: 65%|██████▌ | 8063/12384 [17:06:45<9:08:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 0: 65%|██████▌ | 8064/12384 [17:06:45<9:07:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 0: 65%|██████▌ | 8064/12384 [17:06:52<9:07:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.66s]
Epoch 0: 65%|██████▌ | 8065/12384 [17:06:52<9:07:10, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.66s]
Epoch 0: 65%|██████▌ | 8065/12384 [17:07:00<9:07:10, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.57s]
Epoch 0: 65%|██████▌ | 8066/12384 [17:07:00<9:07:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.57s]
Epoch 0: 65%|██████▌ | 8066/12384 [17:07:08<9:07:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 0: 65%|██████▌ | 8067/12384 [17:07:08<9:08:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 0: 65%|██████▌ | 8067/12384 [17:07:15<9:08:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.00s]
Epoch 0: 65%|██████▌ | 8068/12384 [17:07:15<9:09:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.00s]
Epoch 0: 65%|██████▌ | 8068/12384 [17:07:23<9:09:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 65%|██████▌ | 8069/12384 [17:07:23<9:08:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 65%|██████▌ | 8069/12384 [17:07:31<9:08:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 65%|██████▌ | 8070/12384 [17:07:31<9:08:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 65%|██████▌ | 8070/12384 [17:07:38<9:08:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 65%|██████▌ | 8071/12384 [17:07:38<9:07:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 65%|██████▌ | 8071/12384 [17:07:46<9:07:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 65%|██████▌ | 8072/12384 [17:07:46<9:07:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 65%|██████▌ | 8072/12384 [17:07:53<9:07:07, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.29s]
Epoch 0: 65%|██████▌ | 8073/12384 [17:07:53<9:07:03, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.29s]
Epoch 0: 65%|██████▌ | 8073/12384 [17:08:01<9:07:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 0: 65%|██████▌ | 8074/12384 [17:08:01<9:06:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 0: 65%|██████▌ | 8074/12384 [17:08:09<9:06:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 0: 65%|██████▌ | 8075/12384 [17:08:09<9:06:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 0: 65%|██████▌ | 8075/12384 [17:08:16<9:06:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.37s]
Epoch 0: 65%|██████▌ | 8076/12384 [17:08:16<9:06:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.37s]
Epoch 0: 65%|██████▌ | 8076/12384 [17:08:24<9:06:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 65%|██████▌ | 8077/12384 [17:08:24<9:06:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 65%|██████▌ | 8077/12384 [17:08:31<9:06:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 0: 65%|██████▌ | 8078/12384 [17:08:31<9:06:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 0: 65%|██████▌ | 8078/12384 [17:08:39<9:06:06, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.45s]
Epoch 0: 65%|██████▌ | 8079/12384 [17:08:39<9:12:51, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=9.45s]
Epoch 0: 65%|██████▌ | 8079/12384 [17:08:47<9:12:51, 7.71s/it, loss=0.0002, acc=1.0000, iter_time=7.86s]
Epoch 0: 65%|██████▌ | 8080/12384 [17:08:47<9:11:01, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=7.86s]
Epoch 0: 65%|██████▌ | 8080/12384 [17:08:55<9:11:01, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 65%|██████▌ | 8081/12384 [17:08:55<9:08:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 65%|██████▌ | 8081/12384 [17:09:02<9:08:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.06s]
Epoch 0: 65%|██████▌ | 8082/12384 [17:09:02<9:08:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.06s]
Epoch 0: 65%|██████▌ | 8082/12384 [17:09:10<9:08:10, 7.65s/it, loss=0.0002, acc=0.9998, iter_time=6.13s]
Epoch 0: 65%|██████▌ | 8083/12384 [17:09:10<9:07:34, 7.64s/it, loss=0.0002, acc=0.9998, iter_time=6.13s]
Epoch 0: 65%|██████▌ | 8083/12384 [17:09:17<9:07:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.14s]
Epoch 0: 65%|██████▌ | 8084/12384 [17:09:17<9:07:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.14s]
Epoch 0: 65%|██████▌ | 8084/12384 [17:09:25<9:07:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 65%|██████▌ | 8085/12384 [17:09:25<9:06:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 65%|██████▌ | 8085/12384 [17:09:33<9:06:21, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=10.75s]
Epoch 0: 65%|██████▌ | 8086/12384 [17:09:33<9:06:22, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=10.75s]
Epoch 0: 65%|██████▌ | 8086/12384 [17:09:40<9:06:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 0: 65%|██████▌ | 8087/12384 [17:09:40<9:06:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 0: 65%|██████▌ | 8087/12384 [17:09:48<9:06:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.55s]
Epoch 0: 65%|██████▌ | 8088/12384 [17:09:48<9:05:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.55s]
Epoch 0: 65%|██████▌ | 8088/12384 [17:09:56<9:05:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 65%|██████▌ | 8089/12384 [17:09:56<9:05:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 65%|██████▌ | 8089/12384 [17:10:03<9:05:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 0: 65%|██████▌ | 8090/12384 [17:10:03<9:05:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 0: 65%|██████▌ | 8090/12384 [17:10:11<9:05:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 0: 65%|██████▌ | 8091/12384 [17:10:11<9:04:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 0: 65%|██████▌ | 8091/12384 [17:10:18<9:04:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 65%|██████▌ | 8092/12384 [17:10:18<9:04:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 65%|██████▌ | 8092/12384 [17:10:26<9:04:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 0: 65%|██████▌ | 8093/12384 [17:10:26<9:03:23, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 0: 65%|██████▌ | 8093/12384 [17:10:34<9:03:23, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=8.73s]
Epoch 0: 65%|██████▌ | 8094/12384 [17:10:34<9:04:48, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.73s]
Epoch 0: 65%|██████▌ | 8094/12384 [17:10:41<9:04:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 65%|██████▌ | 8095/12384 [17:10:41<9:04:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 65%|██████▌ | 8095/12384 [17:10:49<9:04:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 65%|██████▌ | 8096/12384 [17:10:49<9:04:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 65%|██████▌ | 8096/12384 [17:10:56<9:04:44, 7.62s/it, loss=0.0003, acc=0.9998, iter_time=7.23s]
Epoch 0: 65%|██████▌ | 8097/12384 [17:10:56<9:04:57, 7.63s/it, loss=0.0003, acc=0.9998, iter_time=7.23s]
Epoch 0: 65%|██████▌ | 8097/12384 [17:11:04<9:04:57, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 65%|██████▌ | 8098/12384 [17:11:04<9:04:03, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 65%|██████▌ | 8098/12384 [17:11:12<9:04:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 65%|██████▌ | 8099/12384 [17:11:12<9:04:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 65%|██████▌ | 8099/12384 [17:11:19<9:04:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 0: 65%|██████▌ | 8100/12384 [17:11:19<9:04:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 0: 65%|██████▌ | 8100/12384 [17:11:27<9:04:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 65%|██████▌ | 8101/12384 [17:11:27<9:03:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 65%|██████▌ | 8101/12384 [17:11:35<9:03:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 65%|██████▌ | 8102/12384 [17:11:35<9:03:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 65%|██████▌ | 8102/12384 [17:11:42<9:03:28, 7.62s/it, loss=0.0001, acc=0.9983, iter_time=7.62s]
Epoch 0: 65%|██████▌ | 8103/12384 [17:11:42<9:02:58, 7.61s/it, loss=0.0001, acc=0.9983, iter_time=7.62s]
Epoch 0: 65%|██████▌ | 8103/12384 [17:11:50<9:02:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 65%|██████▌ | 8104/12384 [17:11:50<9:03:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 65%|██████▌ | 8104/12384 [17:11:58<9:03:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 65%|██████▌ | 8105/12384 [17:11:58<9:08:52, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 65%|██████▌ | 8105/12384 [17:12:05<9:08:52, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 0: 65%|██████▌ | 8106/12384 [17:12:05<9:06:52, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 0: 65%|██████▌ | 8106/12384 [17:12:13<9:06:52, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 0: 65%|██████▌ | 8107/12384 [17:12:13<9:05:40, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 0: 65%|██████▌ | 8107/12384 [17:12:21<9:05:40, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=9.81s]
Epoch 0: 65%|██████▌ | 8108/12384 [17:12:21<9:06:47, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=9.81s]
Epoch 0: 65%|██████▌ | 8108/12384 [17:12:28<9:06:47, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.34s]
Epoch 0: 65%|██████▌ | 8109/12384 [17:12:28<9:05:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.34s]
Epoch 0: 65%|██████▌ | 8109/12384 [17:12:36<9:05:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 0: 65%|██████▌ | 8110/12384 [17:12:36<9:03:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 0: 65%|██████▌ | 8110/12384 [17:12:43<9:03:38, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.68s]
Epoch 0: 65%|██████▌ | 8111/12384 [17:12:43<9:02:26, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.68s]
Epoch 0: 65%|██████▌ | 8111/12384 [17:12:51<9:02:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 66%|██████▌ | 8112/12384 [17:12:51<9:02:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 66%|██████▌ | 8112/12384 [17:12:59<9:02:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.13s]
Epoch 0: 66%|██████▌ | 8113/12384 [17:12:59<9:01:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.13s]
Epoch 0: 66%|██████▌ | 8113/12384 [17:13:06<9:01:59, 7.61s/it, loss=0.0003, acc=0.9981, iter_time=10.13s]
Epoch 0: 66%|██████▌ | 8114/12384 [17:13:06<9:01:26, 7.61s/it, loss=0.0003, acc=0.9981, iter_time=10.13s]
Epoch 0: 66%|██████▌ | 8114/12384 [17:13:14<9:01:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 66%|██████▌ | 8115/12384 [17:13:14<9:00:52, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 66%|██████▌ | 8115/12384 [17:13:21<9:00:52, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 66%|██████▌ | 8116/12384 [17:13:21<9:01:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 66%|██████▌ | 8116/12384 [17:13:29<9:01:53, 7.62s/it, loss=0.0001, acc=0.9987, iter_time=7.59s]
Epoch 0: 66%|██████▌ | 8117/12384 [17:13:29<9:01:06, 7.61s/it, loss=0.0001, acc=0.9987, iter_time=7.59s]
Epoch 0: 66%|██████▌ | 8117/12384 [17:13:37<9:01:06, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.41s]
Epoch 0: 66%|██████▌ | 8118/12384 [17:13:37<9:01:06, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.41s]
Epoch 0: 66%|██████▌ | 8118/12384 [17:13:44<9:01:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 0: 66%|██████▌ | 8119/12384 [17:13:44<9:00:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 0: 66%|██████▌ | 8119/12384 [17:13:52<9:00:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 66%|██████▌ | 8120/12384 [17:13:52<9:00:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 66%|██████▌ | 8120/12384 [17:13:59<9:00:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.48s]
Epoch 0: 66%|██████▌ | 8121/12384 [17:13:59<9:00:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.48s]
Epoch 0: 66%|██████▌ | 8121/12384 [17:14:07<9:00:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 0: 66%|██████▌ | 8122/12384 [17:14:07<9:01:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 0: 66%|██████▌ | 8122/12384 [17:14:15<9:01:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 66%|██████▌ | 8123/12384 [17:14:15<9:00:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 66%|██████▌ | 8123/12384 [17:14:22<9:00:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 66%|██████▌ | 8124/12384 [17:14:22<9:00:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 66%|██████▌ | 8124/12384 [17:14:30<9:00:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 0: 66%|██████▌ | 8125/12384 [17:14:30<9:00:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 0: 66%|██████▌ | 8125/12384 [17:14:38<9:00:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 0: 66%|██████▌ | 8126/12384 [17:14:38<9:01:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 0: 66%|██████▌ | 8126/12384 [17:14:45<9:01:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.17s]
Epoch 0: 66%|██████▌ | 8127/12384 [17:14:45<9:01:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.17s]
Epoch 0: 66%|██████▌ | 8127/12384 [17:14:53<9:01:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.12s]
Epoch 0: 66%|██████▌ | 8128/12384 [17:14:53<9:01:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.12s]
Epoch 0: 66%|██████▌ | 8128/12384 [17:15:01<9:01:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.52s]
Epoch 0: 66%|██████▌ | 8129/12384 [17:15:01<9:01:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.52s]
Epoch 0: 66%|██████▌ | 8129/12384 [17:15:08<9:01:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.75s]
Epoch 0: 66%|██████▌ | 8130/12384 [17:15:08<9:00:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.75s]
Epoch 0: 66%|██████▌ | 8130/12384 [17:15:16<9:00:39, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.69s]
Epoch 0: 66%|██████▌ | 8131/12384 [17:15:16<9:07:42, 7.73s/it, loss=0.0001, acc=1.0000, iter_time=7.69s]
Epoch 0: 66%|██████▌ | 8131/12384 [17:15:24<9:07:42, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 66%|██████▌ | 8132/12384 [17:15:24<9:05:01, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 66%|██████▌ | 8132/12384 [17:15:31<9:05:01, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 0: 66%|██████▌ | 8133/12384 [17:15:31<9:02:56, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 0: 66%|██████▌ | 8133/12384 [17:15:39<9:02:56, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 0: 66%|██████▌ | 8134/12384 [17:15:39<9:01:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 0: 66%|██████▌ | 8134/12384 [17:15:46<9:01:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 66%|██████▌ | 8135/12384 [17:15:46<9:00:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 66%|██████▌ | 8135/12384 [17:15:54<9:00:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 66%|██████▌ | 8136/12384 [17:15:54<8:59:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 66%|██████▌ | 8136/12384 [17:16:02<8:59:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.49s]
Epoch 0: 66%|██████▌ | 8137/12384 [17:16:02<8:59:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.49s]
Epoch 0: 66%|██████▌ | 8137/12384 [17:16:09<8:59:27, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.60s]
Epoch 0: 66%|██████▌ | 8138/12384 [17:16:09<8:59:13, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.60s]
Epoch 0: 66%|██████▌ | 8138/12384 [17:16:17<8:59:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.37s]
Epoch 0: 66%|██████▌ | 8139/12384 [17:16:17<8:59:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.37s]
Epoch 0: 66%|██████▌ | 8139/12384 [17:16:25<8:59:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 66%|██████▌ | 8140/12384 [17:16:25<8:58:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 66%|██████▌ | 8140/12384 [17:16:32<8:58:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 66%|██████▌ | 8141/12384 [17:16:32<9:00:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 66%|██████▌ | 8141/12384 [17:16:40<9:00:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 66%|██████▌ | 8142/12384 [17:16:40<8:59:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 66%|██████▌ | 8142/12384 [17:16:48<8:59:09, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.83s]
Epoch 0: 66%|██████▌ | 8143/12384 [17:16:48<9:00:03, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=5.83s]
Epoch 0: 66%|██████▌ | 8143/12384 [17:16:55<9:00:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.87s]
Epoch 0: 66%|██████▌ | 8144/12384 [17:16:55<9:01:20, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.87s]
Epoch 0: 66%|██████▌ | 8144/12384 [17:17:03<9:01:20, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 66%|██████▌ | 8145/12384 [17:17:03<9:06:28, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 66%|██████▌ | 8145/12384 [17:17:11<9:06:28, 7.74s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 66%|██████▌ | 8146/12384 [17:17:11<9:03:54, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 66%|██████▌ | 8146/12384 [17:17:18<9:03:54, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.31s]
Epoch 0: 66%|██████▌ | 8147/12384 [17:17:18<9:01:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.31s]
Epoch 0: 66%|██████▌ | 8147/12384 [17:17:26<9:01:37, 7.67s/it, loss=0.0002, acc=0.9990, iter_time=10.90s]
Epoch 0: 66%|██████▌ | 8148/12384 [17:17:26<8:59:45, 7.65s/it, loss=0.0002, acc=0.9990, iter_time=10.90s]
Epoch 0: 66%|██████▌ | 8148/12384 [17:17:34<8:59:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 66%|██████▌ | 8149/12384 [17:17:34<8:59:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 66%|██████▌ | 8149/12384 [17:17:41<8:59:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 0: 66%|██████▌ | 8150/12384 [17:17:41<8:59:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 0: 66%|██████▌ | 8150/12384 [17:17:49<8:59:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.23s]
Epoch 0: 66%|██████▌ | 8151/12384 [17:17:49<8:59:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.23s]
Epoch 0: 66%|██████▌ | 8151/12384 [17:17:56<8:59:04, 7.64s/it, loss=0.0001, acc=0.9986, iter_time=11.00s]
Epoch 0: 66%|██████▌ | 8152/12384 [17:17:56<8:58:17, 7.63s/it, loss=0.0001, acc=0.9986, iter_time=11.00s]
Epoch 0: 66%|██████▌ | 8152/12384 [17:18:04<8:58:17, 7.63s/it, loss=0.0001, acc=0.9999, iter_time=7.20s]
Epoch 0: 66%|██████▌ | 8153/12384 [17:18:04<8:57:37, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=7.20s]
Epoch 0: 66%|██████▌ | 8153/12384 [17:18:12<8:57:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 0: 66%|██████▌ | 8154/12384 [17:18:12<8:56:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 0: 66%|██████▌ | 8154/12384 [17:18:19<8:56:58, 7.62s/it, loss=0.0001, acc=0.9993, iter_time=7.82s]
Epoch 0: 66%|██████▌ | 8155/12384 [17:18:19<8:58:52, 7.65s/it, loss=0.0001, acc=0.9993, iter_time=7.82s]
Epoch 0: 66%|██████▌ | 8155/12384 [17:18:27<8:58:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.12s]
Epoch 0: 66%|██████▌ | 8156/12384 [17:18:27<8:57:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.12s]
Epoch 0: 66%|██████▌ | 8156/12384 [17:18:35<8:57:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 0: 66%|██████▌ | 8157/12384 [17:18:35<9:03:52, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 0: 66%|██████▌ | 8157/12384 [17:18:43<9:03:52, 7.72s/it, loss=0.0003, acc=0.9998, iter_time=9.11s]
Epoch 0: 66%|██████▌ | 8158/12384 [17:18:43<9:02:05, 7.70s/it, loss=0.0003, acc=0.9998, iter_time=9.11s]
Epoch 0: 66%|██████▌ | 8158/12384 [17:18:50<9:02:05, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 66%|██████▌ | 8159/12384 [17:18:50<9:00:31, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 66%|██████▌ | 8159/12384 [17:18:58<9:00:31, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 66%|██████▌ | 8160/12384 [17:18:58<8:59:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 66%|██████▌ | 8160/12384 [17:19:05<8:59:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 0: 66%|██████▌ | 8161/12384 [17:19:05<8:59:33, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 0: 66%|██████▌ | 8161/12384 [17:19:13<8:59:33, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 66%|██████▌ | 8162/12384 [17:19:13<8:58:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 66%|██████▌ | 8162/12384 [17:19:21<8:58:33, 7.65s/it, loss=0.0001, acc=0.9998, iter_time=7.00s]
Epoch 0: 66%|██████▌ | 8163/12384 [17:19:21<8:57:37, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=7.00s]
Epoch 0: 66%|██████▌ | 8163/12384 [17:19:28<8:57:37, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=8.23s]
Epoch 0: 66%|██████▌ | 8164/12384 [17:19:28<8:57:01, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=8.23s]
Epoch 0: 66%|██████▌ | 8164/12384 [17:19:36<8:57:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 66%|██████▌ | 8165/12384 [17:19:36<9:04:15, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 66%|██████▌ | 8165/12384 [17:19:44<9:04:15, 7.74s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 66%|██████▌ | 8166/12384 [17:19:44<9:01:31, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 66%|██████▌ | 8166/12384 [17:19:52<9:01:31, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 0: 66%|██████▌ | 8167/12384 [17:19:52<8:59:09, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 0: 66%|██████▌ | 8167/12384 [17:19:59<8:59:09, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.82s]
Epoch 0: 66%|██████▌ | 8168/12384 [17:19:59<8:57:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.82s]
Epoch 0: 66%|██████▌ | 8168/12384 [17:20:07<8:57:01, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=3.36s]
Epoch 0: 66%|██████▌ | 8169/12384 [17:20:07<8:55:57, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=3.36s]
Epoch 0: 66%|██████▌ | 8169/12384 [17:20:14<8:55:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.28s]
Epoch 0: 66%|██████▌ | 8170/12384 [17:20:14<8:54:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.28s]
Epoch 0: 66%|██████▌ | 8170/12384 [17:20:22<8:54:49, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.38s]
Epoch 0: 66%|██████▌ | 8171/12384 [17:20:22<8:54:40, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.38s]
Epoch 0: 66%|██████▌ | 8171/12384 [17:20:30<8:54:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 0: 66%|██████▌ | 8172/12384 [17:20:30<8:53:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 0: 66%|██████▌ | 8172/12384 [17:20:37<8:53:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 66%|██████▌ | 8173/12384 [17:20:37<8:53:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 66%|██████▌ | 8173/12384 [17:20:45<8:53:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 66%|██████▌ | 8174/12384 [17:20:45<8:53:27, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 66%|██████▌ | 8174/12384 [17:20:52<8:53:27, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 66%|██████▌ | 8175/12384 [17:20:52<8:53:49, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 66%|██████▌ | 8175/12384 [17:21:00<8:53:49, 7.61s/it, loss=0.0005, acc=0.9982, iter_time=8.00s]
Epoch 0: 66%|██████▌ | 8176/12384 [17:21:00<8:53:21, 7.60s/it, loss=0.0005, acc=0.9982, iter_time=8.00s]
Epoch 0: 66%|██████▌ | 8176/12384 [17:21:08<8:53:21, 7.60s/it, loss=0.0002, acc=1.0000, iter_time=7.21s]
Epoch 0: 66%|██████▌ | 8177/12384 [17:21:08<8:53:04, 7.60s/it, loss=0.0002, acc=1.0000, iter_time=7.21s]
Epoch 0: 66%|██████▌ | 8177/12384 [17:21:15<8:53:04, 7.60s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 66%|██████▌ | 8178/12384 [17:21:15<8:55:07, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 66%|██████▌ | 8178/12384 [17:21:23<8:55:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 66%|██████▌ | 8179/12384 [17:21:23<8:54:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 66%|██████▌ | 8179/12384 [17:21:30<8:54:53, 7.63s/it, loss=0.0003, acc=0.9981, iter_time=5.32s]
Epoch 0: 66%|██████▌ | 8180/12384 [17:21:30<8:53:30, 7.61s/it, loss=0.0003, acc=0.9981, iter_time=5.32s]
Epoch 0: 66%|██████▌ | 8180/12384 [17:21:38<8:53:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.87s]
Epoch 0: 66%|██████▌ | 8181/12384 [17:21:38<8:53:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.87s]
Epoch 0: 66%|██████▌ | 8181/12384 [17:21:46<8:53:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 66%|██████▌ | 8182/12384 [17:21:46<8:53:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 66%|██████▌ | 8182/12384 [17:21:53<8:53:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 0: 66%|██████▌ | 8183/12384 [17:21:53<8:52:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 0: 66%|██████▌ | 8183/12384 [17:22:01<8:52:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.55s]
Epoch 0: 66%|██████▌ | 8184/12384 [17:22:01<8:59:40, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.55s]
Epoch 0: 66%|██████▌ | 8184/12384 [17:22:09<8:59:40, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.69s]
Epoch 0: 66%|██████▌ | 8185/12384 [17:22:09<8:57:08, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.69s]
Epoch 0: 66%|██████▌ | 8185/12384 [17:22:16<8:57:08, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 0: 66%|██████▌ | 8186/12384 [17:22:16<8:55:47, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 0: 66%|██████▌ | 8186/12384 [17:22:24<8:55:47, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.10s]
Epoch 0: 66%|██████▌ | 8187/12384 [17:22:24<8:54:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.10s]
Epoch 0: 66%|██████▌ | 8187/12384 [17:22:32<8:54:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 0: 66%|██████▌ | 8188/12384 [17:22:32<8:53:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 0: 66%|██████▌ | 8188/12384 [17:22:39<8:53:46, 7.63s/it, loss=0.0073, acc=0.9837, iter_time=7.60s]
Epoch 0: 66%|██████▌ | 8189/12384 [17:22:39<8:52:49, 7.62s/it, loss=0.0073, acc=0.9837, iter_time=7.60s]
Epoch 0: 66%|██████▌ | 8189/12384 [17:22:47<8:52:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 0: 66%|██████▌ | 8190/12384 [17:22:47<8:58:06, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 0: 66%|██████▌ | 8190/12384 [17:22:55<8:58:06, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 0: 66%|██████▌ | 8191/12384 [17:22:55<8:55:54, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 0: 66%|██████▌ | 8191/12384 [17:23:02<8:55:54, 7.67s/it, loss=0.0007, acc=0.9980, iter_time=8.33s]
Epoch 0: 66%|██████▌ | 8192/12384 [17:23:02<8:54:38, 7.65s/it, loss=0.0007, acc=0.9980, iter_time=8.33s]
Epoch 0: 66%|██████▌ | 8192/12384 [17:23:10<8:54:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 66%|██████▌ | 8193/12384 [17:23:10<8:53:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 66%|██████▌ | 8193/12384 [17:23:18<8:53:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.61s]
Epoch 0: 66%|██████▌ | 8194/12384 [17:23:18<8:53:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.61s]
Epoch 0: 66%|██████▌ | 8194/12384 [17:23:25<8:53:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 0: 66%|██████▌ | 8195/12384 [17:23:25<8:52:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 0: 66%|██████▌ | 8195/12384 [17:23:33<8:52:47, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=7.93s]
Epoch 0: 66%|██████▌ | 8196/12384 [17:23:33<8:52:35, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=7.93s]
Epoch 0: 66%|██████▌ | 8196/12384 [17:23:40<8:52:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 0: 66%|██████▌ | 8197/12384 [17:23:40<8:52:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 0: 66%|██████▌ | 8197/12384 [17:23:48<8:52:15, 7.63s/it, loss=0.0004, acc=0.9975, iter_time=4.61s]
Epoch 0: 66%|██████▌ | 8198/12384 [17:23:48<8:51:45, 7.62s/it, loss=0.0004, acc=0.9975, iter_time=4.61s]
Epoch 0: 66%|██████▌ | 8198/12384 [17:23:56<8:51:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.62s]
Epoch 0: 66%|██████▌ | 8199/12384 [17:23:56<8:51:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.62s]
Epoch 0: 66%|██████▌ | 8199/12384 [17:24:03<8:51:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 66%|██████▌ | 8200/12384 [17:24:03<8:51:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 66%|██████▌ | 8200/12384 [17:24:11<8:51:10, 7.62s/it, loss=0.0010, acc=0.9975, iter_time=7.20s]
Epoch 0: 66%|██████▌ | 8201/12384 [17:24:11<8:51:04, 7.62s/it, loss=0.0010, acc=0.9975, iter_time=7.20s]
Epoch 0: 66%|██████▌ | 8201/12384 [17:24:19<8:51:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.12s]
Epoch 0: 66%|██████▌ | 8202/12384 [17:24:19<8:51:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.12s]
Epoch 0: 66%|██████▌ | 8202/12384 [17:24:26<8:51:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 0: 66%|██████▌ | 8203/12384 [17:24:26<8:50:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 0: 66%|██████▌ | 8203/12384 [17:24:34<8:50:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 0: 66%|██████▌ | 8204/12384 [17:24:34<8:51:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 0: 66%|██████▌ | 8204/12384 [17:24:41<8:51:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 0: 66%|██████▋ | 8205/12384 [17:24:41<8:50:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 0: 66%|██████▋ | 8205/12384 [17:24:49<8:50:56, 7.62s/it, loss=0.0002, acc=0.9999, iter_time=8.18s]
Epoch 0: 66%|██████▋ | 8206/12384 [17:24:49<8:50:57, 7.63s/it, loss=0.0002, acc=0.9999, iter_time=8.18s]
Epoch 0: 66%|██████▋ | 8206/12384 [17:24:57<8:50:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.31s]
Epoch 0: 66%|██████▋ | 8207/12384 [17:24:57<8:51:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.31s]
Epoch 0: 66%|██████▋ | 8207/12384 [17:25:04<8:51:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.34s]
Epoch 0: 66%|██████▋ | 8208/12384 [17:25:04<8:51:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.34s]
Epoch 0: 66%|██████▋ | 8208/12384 [17:25:12<8:51:12, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.01s]
Epoch 0: 66%|██████▋ | 8209/12384 [17:25:12<8:50:20, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.01s]
Epoch 0: 66%|██████▋ | 8209/12384 [17:25:20<8:50:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 0: 66%|██████▋ | 8210/12384 [17:25:20<8:57:17, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 0: 66%|██████▋ | 8210/12384 [17:25:27<8:57:17, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 66%|██████▋ | 8211/12384 [17:25:27<8:54:45, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 66%|██████▋ | 8211/12384 [17:25:35<8:54:45, 7.69s/it, loss=0.0001, acc=0.9984, iter_time=6.66s]
Epoch 0: 66%|██████▋ | 8212/12384 [17:25:35<8:52:48, 7.66s/it, loss=0.0001, acc=0.9984, iter_time=6.66s]
Epoch 0: 66%|██████▋ | 8212/12384 [17:25:43<8:52:48, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.92s]
Epoch 0: 66%|██████▋ | 8213/12384 [17:25:43<8:51:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.92s]
Epoch 0: 66%|██████▋ | 8213/12384 [17:25:50<8:51:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.97s]
Epoch 0: 66%|██████▋ | 8214/12384 [17:25:50<8:52:25, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.97s]
Epoch 0: 66%|██████▋ | 8214/12384 [17:25:58<8:52:25, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.95s]
Epoch 0: 66%|██████▋ | 8215/12384 [17:25:58<8:51:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.95s]
Epoch 0: 66%|██████▋ | 8215/12384 [17:26:06<8:51:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 66%|██████▋ | 8216/12384 [17:26:06<8:50:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 66%|██████▋ | 8216/12384 [17:26:13<8:50:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.63s]
Epoch 0: 66%|██████▋ | 8217/12384 [17:26:13<8:49:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.63s]
Epoch 0: 66%|██████▋ | 8217/12384 [17:26:21<8:49:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 0: 66%|██████▋ | 8218/12384 [17:26:21<8:48:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 0: 66%|██████▋ | 8218/12384 [17:26:28<8:48:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 66%|██████▋ | 8219/12384 [17:26:28<8:49:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 66%|██████▋ | 8219/12384 [17:26:36<8:49:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.03s]
Epoch 0: 66%|██████▋ | 8220/12384 [17:26:36<8:48:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.03s]
Epoch 0: 66%|██████▋ | 8220/12384 [17:26:44<8:48:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 0: 66%|██████▋ | 8221/12384 [17:26:44<8:48:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 0: 66%|██████▋ | 8221/12384 [17:26:51<8:48:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.51s]
Epoch 0: 66%|██████▋ | 8222/12384 [17:26:51<8:48:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.51s]
Epoch 0: 66%|██████▋ | 8222/12384 [17:26:59<8:48:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 0: 66%|██████▋ | 8223/12384 [17:26:59<8:47:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 0: 66%|██████▋ | 8223/12384 [17:27:06<8:47:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 66%|██████▋ | 8224/12384 [17:27:06<8:47:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 66%|██████▋ | 8224/12384 [17:27:14<8:47:43, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 66%|██████▋ | 8225/12384 [17:27:14<8:47:42, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 66%|██████▋ | 8225/12384 [17:27:22<8:47:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.60s]
Epoch 0: 66%|██████▋ | 8226/12384 [17:27:22<8:47:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.60s]
Epoch 0: 66%|██████▋ | 8226/12384 [17:27:29<8:47:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.79s]
Epoch 0: 66%|██████▋ | 8227/12384 [17:27:29<8:47:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.79s]
Epoch 0: 66%|██████▋ | 8227/12384 [17:27:37<8:47:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 0: 66%|██████▋ | 8228/12384 [17:27:37<8:47:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 0: 66%|██████▋ | 8228/12384 [17:27:45<8:47:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.33s]
Epoch 0: 66%|██████▋ | 8229/12384 [17:27:45<8:47:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.33s]
Epoch 0: 66%|██████▋ | 8229/12384 [17:27:52<8:47:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 0: 66%|██████▋ | 8230/12384 [17:27:52<8:47:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 0: 66%|██████▋ | 8230/12384 [17:28:00<8:47:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 0: 66%|██████▋ | 8231/12384 [17:28:00<8:46:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 0: 66%|██████▋ | 8231/12384 [17:28:07<8:46:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.57s]
Epoch 0: 66%|██████▋ | 8232/12384 [17:28:07<8:46:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.57s]
Epoch 0: 66%|██████▋ | 8232/12384 [17:28:15<8:46:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 66%|██████▋ | 8233/12384 [17:28:15<8:46:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 66%|██████▋ | 8233/12384 [17:28:23<8:46:06, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 66%|██████▋ | 8234/12384 [17:28:23<8:45:44, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 66%|██████▋ | 8234/12384 [17:28:30<8:45:44, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 0: 66%|██████▋ | 8235/12384 [17:28:30<8:45:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 0: 66%|██████▋ | 8235/12384 [17:28:38<8:45:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 67%|██████▋ | 8236/12384 [17:28:38<8:45:43, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 67%|██████▋ | 8236/12384 [17:28:46<8:45:43, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 67%|██████▋ | 8237/12384 [17:28:46<8:52:36, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 67%|██████▋ | 8237/12384 [17:28:53<8:52:36, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 67%|██████▋ | 8238/12384 [17:28:53<8:50:38, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 67%|██████▋ | 8238/12384 [17:29:01<8:50:38, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 67%|██████▋ | 8239/12384 [17:29:01<8:49:19, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 67%|██████▋ | 8239/12384 [17:29:09<8:49:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 67%|██████▋ | 8240/12384 [17:29:09<8:48:25, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 67%|██████▋ | 8240/12384 [17:29:16<8:48:25, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.23s]
Epoch 0: 67%|██████▋ | 8241/12384 [17:29:16<8:47:08, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.23s]
Epoch 0: 67%|██████▋ | 8241/12384 [17:29:24<8:47:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 67%|██████▋ | 8242/12384 [17:29:24<8:46:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 67%|██████▋ | 8242/12384 [17:29:31<8:46:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 67%|██████▋ | 8243/12384 [17:29:31<8:45:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 67%|██████▋ | 8243/12384 [17:29:39<8:45:50, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.93s]
Epoch 0: 67%|██████▋ | 8244/12384 [17:29:39<8:52:07, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.93s]
Epoch 0: 67%|██████▋ | 8244/12384 [17:29:47<8:52:07, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 67%|██████▋ | 8245/12384 [17:29:47<8:50:09, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 67%|██████▋ | 8245/12384 [17:29:55<8:50:09, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 67%|██████▋ | 8246/12384 [17:29:55<8:48:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 67%|██████▋ | 8246/12384 [17:30:02<8:48:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.25s]
Epoch 0: 67%|██████▋ | 8247/12384 [17:30:02<8:49:12, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.25s]
Epoch 0: 67%|██████▋ | 8247/12384 [17:30:10<8:49:12, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=11.04s]
Epoch 0: 67%|██████▋ | 8248/12384 [17:30:10<8:48:10, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=11.04s]
Epoch 0: 67%|██████▋ | 8248/12384 [17:30:18<8:48:10, 7.66s/it, loss=0.0001, acc=0.9986, iter_time=7.65s]
Epoch 0: 67%|██████▋ | 8249/12384 [17:30:18<8:46:33, 7.64s/it, loss=0.0001, acc=0.9986, iter_time=7.65s]
Epoch 0: 67%|██████▋ | 8249/12384 [17:30:25<8:46:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 67%|██████▋ | 8250/12384 [17:30:25<8:46:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 67%|██████▋ | 8250/12384 [17:30:33<8:46:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 67%|██████▋ | 8251/12384 [17:30:33<8:45:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 67%|██████▋ | 8251/12384 [17:30:40<8:45:40, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.30s]
Epoch 0: 67%|██████▋ | 8252/12384 [17:30:40<8:45:16, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.30s]
Epoch 0: 67%|██████▋ | 8252/12384 [17:30:48<8:45:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 0: 67%|██████▋ | 8253/12384 [17:30:48<8:44:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 0: 67%|██████▋ | 8253/12384 [17:30:56<8:44:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 67%|██████▋ | 8254/12384 [17:30:56<8:43:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 67%|██████▋ | 8254/12384 [17:31:03<8:43:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 0: 67%|██████▋ | 8255/12384 [17:31:03<8:43:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 0: 67%|██████▋ | 8255/12384 [17:31:11<8:43:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 67%|██████▋ | 8256/12384 [17:31:11<8:43:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 67%|██████▋ | 8256/12384 [17:31:18<8:43:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 67%|██████▋ | 8257/12384 [17:31:18<8:42:46, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 67%|██████▋ | 8257/12384 [17:31:26<8:42:46, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 67%|██████▋ | 8258/12384 [17:31:26<8:44:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 67%|██████▋ | 8258/12384 [17:31:34<8:44:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 0: 67%|██████▋ | 8259/12384 [17:31:34<8:43:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 0: 67%|██████▋ | 8259/12384 [17:31:41<8:43:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 0: 67%|██████▋ | 8260/12384 [17:31:41<8:43:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 0: 67%|██████▋ | 8260/12384 [17:31:49<8:43:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 67%|██████▋ | 8261/12384 [17:31:49<8:44:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 67%|██████▋ | 8261/12384 [17:31:57<8:44:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 67%|██████▋ | 8262/12384 [17:31:57<8:43:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 67%|██████▋ | 8262/12384 [17:32:04<8:43:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 67%|██████▋ | 8263/12384 [17:32:04<8:50:13, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 67%|██████▋ | 8263/12384 [17:32:12<8:50:13, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.82s]
Epoch 0: 67%|██████▋ | 8264/12384 [17:32:12<8:47:32, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.82s]
Epoch 0: 67%|██████▋ | 8264/12384 [17:32:20<8:47:32, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.80s]
Epoch 0: 67%|██████▋ | 8265/12384 [17:32:20<8:46:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.80s]
Epoch 0: 67%|██████▋ | 8265/12384 [17:32:27<8:46:05, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=6.68s]
Epoch 0: 67%|██████▋ | 8266/12384 [17:32:27<8:45:06, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=6.68s]
Epoch 0: 67%|██████▋ | 8266/12384 [17:32:35<8:45:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 0: 67%|██████▋ | 8267/12384 [17:32:35<8:44:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 0: 67%|██████▋ | 8267/12384 [17:32:42<8:44:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 67%|██████▋ | 8268/12384 [17:32:42<8:43:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 67%|██████▋ | 8268/12384 [17:32:50<8:43:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.25s]
Epoch 0: 67%|██████▋ | 8269/12384 [17:32:50<8:42:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.25s]
Epoch 0: 67%|██████▋ | 8269/12384 [17:32:58<8:42:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.11s]
Epoch 0: 67%|██████▋ | 8270/12384 [17:32:58<8:42:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.11s]
Epoch 0: 67%|██████▋ | 8270/12384 [17:33:06<8:42:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 0: 67%|██████▋ | 8271/12384 [17:33:06<8:47:30, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 0: 67%|██████▋ | 8271/12384 [17:33:13<8:47:30, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 67%|██████▋ | 8272/12384 [17:33:13<8:45:27, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 67%|██████▋ | 8272/12384 [17:33:21<8:45:27, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 67%|██████▋ | 8273/12384 [17:33:21<8:44:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 67%|██████▋ | 8273/12384 [17:33:28<8:44:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 67%|██████▋ | 8274/12384 [17:33:28<8:42:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 67%|██████▋ | 8274/12384 [17:33:36<8:42:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 67%|██████▋ | 8275/12384 [17:33:36<8:42:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 67%|██████▋ | 8275/12384 [17:33:44<8:42:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 0: 67%|██████▋ | 8276/12384 [17:33:44<8:42:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 0: 67%|██████▋ | 8276/12384 [17:33:51<8:42:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 67%|██████▋ | 8277/12384 [17:33:51<8:41:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 67%|██████▋ | 8277/12384 [17:33:59<8:41:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.19s]
Epoch 0: 67%|██████▋ | 8278/12384 [17:33:59<8:41:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.19s]
Epoch 0: 67%|██████▋ | 8278/12384 [17:34:07<8:41:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.48s]
Epoch 0: 67%|██████▋ | 8279/12384 [17:34:07<8:41:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.48s]
Epoch 0: 67%|██████▋ | 8279/12384 [17:34:14<8:41:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 67%|██████▋ | 8280/12384 [17:34:14<8:41:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 67%|██████▋ | 8280/12384 [17:34:22<8:41:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 0: 67%|██████▋ | 8281/12384 [17:34:22<8:41:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 0: 67%|██████▋ | 8281/12384 [17:34:29<8:41:06, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.05s]
Epoch 0: 67%|██████▋ | 8282/12384 [17:34:29<8:39:23, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.05s]
Epoch 0: 67%|██████▋ | 8282/12384 [17:34:37<8:39:23, 7.60s/it, loss=0.0001, acc=0.9999, iter_time=7.89s]
Epoch 0: 67%|██████▋ | 8283/12384 [17:34:37<8:39:38, 7.60s/it, loss=0.0001, acc=0.9999, iter_time=7.89s]
Epoch 0: 67%|██████▋ | 8283/12384 [17:34:45<8:39:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.76s]
Epoch 0: 67%|██████▋ | 8284/12384 [17:34:45<8:40:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.76s]
Epoch 0: 67%|██████▋ | 8284/12384 [17:34:52<8:40:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 0: 67%|██████▋ | 8285/12384 [17:34:52<8:40:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 0: 67%|██████▋ | 8285/12384 [17:35:00<8:40:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 67%|██████▋ | 8286/12384 [17:35:00<8:40:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 67%|██████▋ | 8286/12384 [17:35:07<8:40:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 67%|██████▋ | 8287/12384 [17:35:07<8:40:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 67%|██████▋ | 8287/12384 [17:35:15<8:40:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 67%|██████▋ | 8288/12384 [17:35:15<8:41:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 67%|██████▋ | 8288/12384 [17:35:23<8:41:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 0: 67%|██████▋ | 8289/12384 [17:35:23<8:48:27, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 0: 67%|██████▋ | 8289/12384 [17:35:31<8:48:27, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 0: 67%|██████▋ | 8290/12384 [17:35:31<8:45:34, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 0: 67%|██████▋ | 8290/12384 [17:35:38<8:45:34, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=5.07s]
Epoch 0: 67%|██████▋ | 8291/12384 [17:35:38<8:43:51, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=5.07s]
Epoch 0: 67%|██████▋ | 8291/12384 [17:35:46<8:43:51, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=10.14s]
Epoch 0: 67%|██████▋ | 8292/12384 [17:35:46<8:41:58, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=10.14s]
Epoch 0: 67%|██████▋ | 8292/12384 [17:35:54<8:41:58, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 67%|██████▋ | 8293/12384 [17:35:54<8:41:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 67%|██████▋ | 8293/12384 [17:36:01<8:41:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.03s]
Epoch 0: 67%|██████▋ | 8294/12384 [17:36:01<8:41:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.03s]
Epoch 0: 67%|██████▋ | 8294/12384 [17:36:09<8:41:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.95s]
Epoch 0: 67%|██████▋ | 8295/12384 [17:36:09<8:40:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.95s]
Epoch 0: 67%|██████▋ | 8295/12384 [17:36:17<8:40:12, 7.63s/it, loss=0.0004, acc=1.0000, iter_time=8.59s]
Epoch 0: 67%|██████▋ | 8296/12384 [17:36:17<8:45:12, 7.71s/it, loss=0.0004, acc=1.0000, iter_time=8.59s]
Epoch 0: 67%|██████▋ | 8296/12384 [17:36:24<8:45:12, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 67%|██████▋ | 8297/12384 [17:36:24<8:43:15, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 67%|██████▋ | 8297/12384 [17:36:32<8:43:15, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 0: 67%|██████▋ | 8298/12384 [17:36:32<8:41:53, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 0: 67%|██████▋ | 8298/12384 [17:36:40<8:41:53, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 0: 67%|██████▋ | 8299/12384 [17:36:40<8:40:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 0: 67%|██████▋ | 8299/12384 [17:36:47<8:40:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 0: 67%|██████▋ | 8300/12384 [17:36:47<8:40:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 0: 67%|██████▋ | 8300/12384 [17:36:55<8:40:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 0: 67%|██████▋ | 8301/12384 [17:36:55<8:39:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 0: 67%|██████▋ | 8301/12384 [17:37:02<8:39:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 0: 67%|██████▋ | 8302/12384 [17:37:02<8:39:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 0: 67%|██████▋ | 8302/12384 [17:37:10<8:39:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 67%|██████▋ | 8303/12384 [17:37:10<8:38:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 67%|██████▋ | 8303/12384 [17:37:18<8:38:03, 7.62s/it, loss=0.0008, acc=0.9975, iter_time=7.99s]
Epoch 0: 67%|██████▋ | 8304/12384 [17:37:18<8:37:45, 7.61s/it, loss=0.0008, acc=0.9975, iter_time=7.99s]
Epoch 0: 67%|██████▋ | 8304/12384 [17:37:25<8:37:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.83s]
Epoch 0: 67%|██████▋ | 8305/12384 [17:37:25<8:37:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.83s]
Epoch 0: 67%|██████▋ | 8305/12384 [17:37:33<8:37:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 0: 67%|██████▋ | 8306/12384 [17:37:33<8:37:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 0: 67%|██████▋ | 8306/12384 [17:37:40<8:37:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 67%|██████▋ | 8307/12384 [17:37:40<8:37:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 67%|██████▋ | 8307/12384 [17:37:48<8:37:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 0: 67%|██████▋ | 8308/12384 [17:37:48<8:37:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 0: 67%|██████▋ | 8308/12384 [17:37:56<8:37:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.84s]
Epoch 0: 67%|██████▋ | 8309/12384 [17:37:56<8:36:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.84s]
Epoch 0: 67%|██████▋ | 8309/12384 [17:38:03<8:36:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 0: 67%|██████▋ | 8310/12384 [17:38:03<8:36:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 0: 67%|██████▋ | 8310/12384 [17:38:11<8:36:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 0: 67%|██████▋ | 8311/12384 [17:38:11<8:36:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 0: 67%|██████▋ | 8311/12384 [17:38:18<8:36:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.77s]
Epoch 0: 67%|██████▋ | 8312/12384 [17:38:18<8:36:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.77s]
Epoch 0: 67%|██████▋ | 8312/12384 [17:38:26<8:36:36, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.23s]
Epoch 0: 67%|██████▋ | 8313/12384 [17:38:26<8:35:59, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.23s]
Epoch 0: 67%|██████▋ | 8313/12384 [17:38:34<8:35:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 0: 67%|██████▋ | 8314/12384 [17:38:34<8:36:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 0: 67%|██████▋ | 8314/12384 [17:38:42<8:36:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 0: 67%|██████▋ | 8315/12384 [17:38:42<8:43:13, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 0: 67%|██████▋ | 8315/12384 [17:38:49<8:43:13, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 0: 67%|██████▋ | 8316/12384 [17:38:49<8:42:31, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 0: 67%|██████▋ | 8316/12384 [17:38:57<8:42:31, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 67%|██████▋ | 8317/12384 [17:38:57<8:40:31, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 67%|██████▋ | 8317/12384 [17:39:05<8:40:31, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=7.63s]
Epoch 0: 67%|██████▋ | 8318/12384 [17:39:05<8:38:56, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.63s]
Epoch 0: 67%|██████▋ | 8318/12384 [17:39:12<8:38:56, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 67%|██████▋ | 8319/12384 [17:39:12<8:37:58, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 67%|██████▋ | 8319/12384 [17:39:20<8:37:58, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=8.02s]
Epoch 0: 67%|██████▋ | 8320/12384 [17:39:20<8:37:21, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=8.02s]
Epoch 0: 67%|██████▋ | 8320/12384 [17:39:27<8:37:21, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.23s]
Epoch 0: 67%|██████▋ | 8321/12384 [17:39:27<8:37:17, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.23s]
Epoch 0: 67%|██████▋ | 8321/12384 [17:39:35<8:37:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 0: 67%|██████▋ | 8322/12384 [17:39:35<8:42:44, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 0: 67%|██████▋ | 8322/12384 [17:39:43<8:42:44, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 67%|██████▋ | 8323/12384 [17:39:43<8:42:03, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 67%|██████▋ | 8323/12384 [17:39:51<8:42:03, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 67%|██████▋ | 8324/12384 [17:39:51<8:40:02, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 67%|██████▋ | 8324/12384 [17:39:58<8:40:02, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 67%|██████▋ | 8325/12384 [17:39:58<8:38:32, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 67%|██████▋ | 8325/12384 [17:40:06<8:38:32, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 67%|██████▋ | 8326/12384 [17:40:06<8:37:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 67%|██████▋ | 8326/12384 [17:40:14<8:37:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 67%|██████▋ | 8327/12384 [17:40:14<8:37:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 67%|██████▋ | 8327/12384 [17:40:21<8:37:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 67%|██████▋ | 8328/12384 [17:40:21<8:36:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 67%|██████▋ | 8328/12384 [17:40:29<8:36:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 67%|██████▋ | 8329/12384 [17:40:29<8:35:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 67%|██████▋ | 8329/12384 [17:40:36<8:35:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 67%|██████▋ | 8330/12384 [17:40:36<8:34:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 67%|██████▋ | 8330/12384 [17:40:44<8:34:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 67%|██████▋ | 8331/12384 [17:40:44<8:35:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 67%|██████▋ | 8331/12384 [17:40:52<8:35:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 67%|██████▋ | 8332/12384 [17:40:52<8:34:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 67%|██████▋ | 8332/12384 [17:40:59<8:34:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 0: 67%|██████▋ | 8333/12384 [17:40:59<8:34:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 0: 67%|██████▋ | 8333/12384 [17:41:07<8:34:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 0: 67%|██████▋ | 8334/12384 [17:41:07<8:33:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 0: 67%|██████▋ | 8334/12384 [17:41:14<8:33:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 0: 67%|██████▋ | 8335/12384 [17:41:14<8:33:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 0: 67%|██████▋ | 8335/12384 [17:41:22<8:33:21, 7.61s/it, loss=0.0002, acc=0.9998, iter_time=10.51s]
Epoch 0: 67%|██████▋ | 8336/12384 [17:41:22<8:33:14, 7.61s/it, loss=0.0002, acc=0.9998, iter_time=10.51s]
Epoch 0: 67%|██████▋ | 8336/12384 [17:41:30<8:33:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.95s]
Epoch 0: 67%|██████▋ | 8337/12384 [17:41:30<8:32:46, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.95s]
Epoch 0: 67%|██████▋ | 8337/12384 [17:41:37<8:32:46, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.08s]
Epoch 0: 67%|██████▋ | 8338/12384 [17:41:37<8:32:24, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.08s]
Epoch 0: 67%|██████▋ | 8338/12384 [17:41:45<8:32:24, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 0: 67%|██████▋ | 8339/12384 [17:41:45<8:32:31, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 0: 67%|██████▋ | 8339/12384 [17:41:52<8:32:31, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 0: 67%|██████▋ | 8340/12384 [17:41:52<8:32:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 0: 67%|██████▋ | 8340/12384 [17:42:00<8:32:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 67%|██████▋ | 8341/12384 [17:42:00<8:39:08, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 67%|██████▋ | 8341/12384 [17:42:08<8:39:08, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 67%|██████▋ | 8342/12384 [17:42:08<8:37:27, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 67%|██████▋ | 8342/12384 [17:42:16<8:37:27, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 67%|██████▋ | 8343/12384 [17:42:16<8:36:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 67%|██████▋ | 8343/12384 [17:42:23<8:36:05, 7.66s/it, loss=0.0004, acc=0.9984, iter_time=7.99s]
Epoch 0: 67%|██████▋ | 8344/12384 [17:42:23<8:34:37, 7.64s/it, loss=0.0004, acc=0.9984, iter_time=7.99s]
Epoch 0: 67%|██████▋ | 8344/12384 [17:42:31<8:34:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.26s]
Epoch 0: 67%|██████▋ | 8345/12384 [17:42:31<8:33:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.26s]
Epoch 0: 67%|██████▋ | 8345/12384 [17:42:38<8:33:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 0: 67%|██████▋ | 8346/12384 [17:42:38<8:33:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 0: 67%|██████▋ | 8346/12384 [17:42:46<8:33:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 0: 67%|██████▋ | 8347/12384 [17:42:46<8:32:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 0: 67%|██████▋ | 8347/12384 [17:42:54<8:32:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 0: 67%|██████▋ | 8348/12384 [17:42:54<8:32:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 0: 67%|██████▋ | 8348/12384 [17:43:01<8:32:13, 7.61s/it, loss=0.0006, acc=0.9983, iter_time=5.77s]
Epoch 0: 67%|██████▋ | 8349/12384 [17:43:01<8:33:17, 7.63s/it, loss=0.0006, acc=0.9983, iter_time=5.77s]
Epoch 0: 67%|██████▋ | 8349/12384 [17:43:09<8:33:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 0: 67%|██████▋ | 8350/12384 [17:43:09<8:32:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 0: 67%|██████▋ | 8350/12384 [17:43:17<8:32:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.91s]
Epoch 0: 67%|██████▋ | 8351/12384 [17:43:17<8:32:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.91s]
Epoch 0: 67%|██████▋ | 8351/12384 [17:43:24<8:32:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.30s]
Epoch 0: 67%|██████▋ | 8352/12384 [17:43:24<8:31:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.30s]
Epoch 0: 67%|██████▋ | 8352/12384 [17:43:32<8:31:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 67%|██████▋ | 8353/12384 [17:43:32<8:31:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 67%|██████▋ | 8353/12384 [17:43:39<8:31:29, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.30s]
Epoch 0: 67%|██████▋ | 8354/12384 [17:43:39<8:30:53, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.30s]
Epoch 0: 67%|██████▋ | 8354/12384 [17:43:47<8:30:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 67%|██████▋ | 8355/12384 [17:43:47<8:30:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 67%|██████▋ | 8355/12384 [17:43:55<8:30:55, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.34s]
Epoch 0: 67%|██████▋ | 8356/12384 [17:43:55<8:30:44, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.34s]
Epoch 0: 67%|██████▋ | 8356/12384 [17:44:02<8:30:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 0: 67%|██████▋ | 8357/12384 [17:44:02<8:30:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 0: 67%|██████▋ | 8357/12384 [17:44:10<8:30:19, 7.60s/it, loss=0.0000, acc=0.9996, iter_time=7.60s]
Epoch 0: 67%|██████▋ | 8358/12384 [17:44:10<8:30:28, 7.61s/it, loss=0.0000, acc=0.9996, iter_time=7.60s]
Epoch 0: 67%|██████▋ | 8358/12384 [17:44:17<8:30:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 0: 67%|██████▋ | 8359/12384 [17:44:17<8:30:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 0: 67%|██████▋ | 8359/12384 [17:44:25<8:30:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.45s]
Epoch 0: 68%|██████▊ | 8360/12384 [17:44:25<8:29:36, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.45s]
Epoch 0: 68%|██████▊ | 8360/12384 [17:44:33<8:29:36, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 0: 68%|██████▊ | 8361/12384 [17:44:33<8:30:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 0: 68%|██████▊ | 8361/12384 [17:44:40<8:30:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 0: 68%|██████▊ | 8362/12384 [17:44:40<8:30:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 0: 68%|██████▊ | 8362/12384 [17:44:48<8:30:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 0: 68%|██████▊ | 8363/12384 [17:44:48<8:29:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 0: 68%|██████▊ | 8363/12384 [17:44:55<8:29:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 0: 68%|██████▊ | 8364/12384 [17:44:55<8:29:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 0: 68%|██████▊ | 8364/12384 [17:45:03<8:29:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 68%|██████▊ | 8365/12384 [17:45:03<8:29:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 68%|██████▊ | 8365/12384 [17:45:11<8:29:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 68%|██████▊ | 8366/12384 [17:45:11<8:29:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 68%|██████▊ | 8366/12384 [17:45:18<8:29:11, 7.60s/it, loss=0.0002, acc=0.9990, iter_time=7.59s]
Epoch 0: 68%|██████▊ | 8367/12384 [17:45:18<8:28:48, 7.60s/it, loss=0.0002, acc=0.9990, iter_time=7.59s]
Epoch 0: 68%|██████▊ | 8367/12384 [17:45:26<8:28:48, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 0: 68%|██████▊ | 8368/12384 [17:45:26<8:35:20, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 0: 68%|██████▊ | 8368/12384 [17:45:34<8:35:20, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 0: 68%|██████▊ | 8369/12384 [17:45:34<8:33:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 0: 68%|██████▊ | 8369/12384 [17:45:41<8:33:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 68%|██████▊ | 8370/12384 [17:45:41<8:32:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 68%|██████▊ | 8370/12384 [17:45:49<8:32:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 0: 68%|██████▊ | 8371/12384 [17:45:49<8:30:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 0: 68%|██████▊ | 8371/12384 [17:45:57<8:30:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 0: 68%|██████▊ | 8372/12384 [17:45:57<8:30:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 0: 68%|██████▊ | 8372/12384 [17:46:04<8:30:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 68%|██████▊ | 8373/12384 [17:46:04<8:29:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 68%|██████▊ | 8373/12384 [17:46:12<8:29:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 0: 68%|██████▊ | 8374/12384 [17:46:12<8:34:53, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 0: 68%|██████▊ | 8374/12384 [17:46:20<8:34:53, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 68%|██████▊ | 8375/12384 [17:46:20<8:32:45, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 68%|██████▊ | 8375/12384 [17:46:27<8:32:45, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 68%|██████▊ | 8376/12384 [17:46:27<8:32:34, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 68%|██████▊ | 8376/12384 [17:46:35<8:32:34, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 0: 68%|██████▊ | 8377/12384 [17:46:35<8:31:13, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 0: 68%|██████▊ | 8377/12384 [17:46:43<8:31:13, 7.66s/it, loss=0.0004, acc=0.9990, iter_time=7.64s]
Epoch 0: 68%|██████▊ | 8378/12384 [17:46:43<8:30:36, 7.65s/it, loss=0.0004, acc=0.9990, iter_time=7.64s]
Epoch 0: 68%|██████▊ | 8378/12384 [17:46:50<8:30:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.58s]
Epoch 0: 68%|██████▊ | 8379/12384 [17:46:50<8:29:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.58s]
Epoch 0: 68%|██████▊ | 8379/12384 [17:46:58<8:29:53, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=9.65s]
Epoch 0: 68%|██████▊ | 8380/12384 [17:46:58<8:29:22, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.65s]
Epoch 0: 68%|██████▊ | 8380/12384 [17:47:05<8:29:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 68%|██████▊ | 8381/12384 [17:47:05<8:29:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 68%|██████▊ | 8381/12384 [17:47:13<8:29:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 0: 68%|██████▊ | 8382/12384 [17:47:13<8:28:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 0: 68%|██████▊ | 8382/12384 [17:47:21<8:28:25, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.34s]
Epoch 0: 68%|██████▊ | 8383/12384 [17:47:21<8:28:19, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.34s]
Epoch 0: 68%|██████▊ | 8383/12384 [17:47:28<8:28:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 68%|██████▊ | 8384/12384 [17:47:28<8:27:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 68%|██████▊ | 8384/12384 [17:47:36<8:27:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.40s]
Epoch 0: 68%|██████▊ | 8385/12384 [17:47:36<8:27:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.40s]
Epoch 0: 68%|██████▊ | 8385/12384 [17:47:44<8:27:29, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.41s]
Epoch 0: 68%|██████▊ | 8386/12384 [17:47:44<8:27:21, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.41s]
Epoch 0: 68%|██████▊ | 8386/12384 [17:47:51<8:27:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 68%|██████▊ | 8387/12384 [17:47:51<8:27:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 68%|██████▊ | 8387/12384 [17:47:59<8:27:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 68%|██████▊ | 8388/12384 [17:47:59<8:26:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 68%|██████▊ | 8388/12384 [17:48:06<8:26:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 68%|██████▊ | 8389/12384 [17:48:06<8:26:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 68%|██████▊ | 8389/12384 [17:48:14<8:26:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 68%|██████▊ | 8390/12384 [17:48:14<8:26:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 68%|██████▊ | 8390/12384 [17:48:22<8:26:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 0: 68%|██████▊ | 8391/12384 [17:48:22<8:26:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 0: 68%|██████▊ | 8391/12384 [17:48:29<8:26:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.28s]
Epoch 0: 68%|██████▊ | 8392/12384 [17:48:29<8:26:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.28s]
Epoch 0: 68%|██████▊ | 8392/12384 [17:48:37<8:26:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 68%|██████▊ | 8393/12384 [17:48:37<8:25:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 68%|██████▊ | 8393/12384 [17:48:45<8:25:53, 7.61s/it, loss=0.0005, acc=0.9975, iter_time=7.66s]
Epoch 0: 68%|██████▊ | 8394/12384 [17:48:45<8:32:22, 7.70s/it, loss=0.0005, acc=0.9975, iter_time=7.66s]
Epoch 0: 68%|██████▊ | 8394/12384 [17:48:52<8:32:22, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 68%|██████▊ | 8395/12384 [17:48:52<8:30:15, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 68%|██████▊ | 8395/12384 [17:49:00<8:30:15, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 68%|██████▊ | 8396/12384 [17:49:00<8:28:49, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 68%|██████▊ | 8396/12384 [17:49:08<8:28:49, 7.66s/it, loss=0.0000, acc=0.9997, iter_time=7.63s]
Epoch 0: 68%|██████▊ | 8397/12384 [17:49:08<8:27:49, 7.64s/it, loss=0.0000, acc=0.9997, iter_time=7.63s]
Epoch 0: 68%|██████▊ | 8397/12384 [17:49:15<8:27:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 68%|██████▊ | 8398/12384 [17:49:15<8:26:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 68%|██████▊ | 8398/12384 [17:49:23<8:26:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 68%|██████▊ | 8399/12384 [17:49:23<8:26:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 68%|██████▊ | 8399/12384 [17:49:30<8:26:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 68%|██████▊ | 8400/12384 [17:49:30<8:26:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 68%|██████▊ | 8400/12384 [17:49:38<8:26:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.48s]
Epoch 0: 68%|██████▊ | 8401/12384 [17:49:38<8:31:00, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.48s]
Epoch 0: 68%|██████▊ | 8401/12384 [17:49:46<8:31:00, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 0: 68%|██████▊ | 8402/12384 [17:49:46<8:29:04, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 0: 68%|██████▊ | 8402/12384 [17:49:53<8:29:04, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 0: 68%|██████▊ | 8403/12384 [17:49:53<8:27:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 0: 68%|██████▊ | 8403/12384 [17:50:01<8:27:30, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 68%|██████▊ | 8404/12384 [17:50:01<8:26:51, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 68%|██████▊ | 8404/12384 [17:50:09<8:26:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 68%|██████▊ | 8405/12384 [17:50:09<8:26:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 68%|██████▊ | 8405/12384 [17:50:16<8:26:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 68%|██████▊ | 8406/12384 [17:50:16<8:25:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 68%|██████▊ | 8406/12384 [17:50:24<8:25:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 68%|██████▊ | 8407/12384 [17:50:24<8:25:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 68%|██████▊ | 8407/12384 [17:50:32<8:25:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 68%|██████▊ | 8408/12384 [17:50:32<8:25:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 68%|██████▊ | 8408/12384 [17:50:39<8:25:21, 7.63s/it, loss=0.0008, acc=0.9969, iter_time=7.66s]
Epoch 0: 68%|██████▊ | 8409/12384 [17:50:39<8:24:43, 7.62s/it, loss=0.0008, acc=0.9969, iter_time=7.66s]
Epoch 0: 68%|██████▊ | 8409/12384 [17:50:47<8:24:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 68%|██████▊ | 8410/12384 [17:50:47<8:24:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 68%|██████▊ | 8410/12384 [17:50:54<8:24:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 68%|██████▊ | 8411/12384 [17:50:54<8:25:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 68%|██████▊ | 8411/12384 [17:51:02<8:25:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.28s]
Epoch 0: 68%|██████▊ | 8412/12384 [17:51:02<8:24:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.28s]
Epoch 0: 68%|██████▊ | 8412/12384 [17:51:10<8:24:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 0: 68%|██████▊ | 8413/12384 [17:51:10<8:24:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 0: 68%|██████▊ | 8413/12384 [17:51:17<8:24:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 68%|██████▊ | 8414/12384 [17:51:17<8:24:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 68%|██████▊ | 8414/12384 [17:51:25<8:24:05, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 68%|██████▊ | 8415/12384 [17:51:25<8:23:54, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 68%|██████▊ | 8415/12384 [17:51:32<8:23:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 68%|██████▊ | 8416/12384 [17:51:32<8:23:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 68%|██████▊ | 8416/12384 [17:51:40<8:23:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 68%|██████▊ | 8417/12384 [17:51:40<8:22:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 68%|██████▊ | 8417/12384 [17:51:48<8:22:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 0: 68%|██████▊ | 8418/12384 [17:51:48<8:22:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 0: 68%|██████▊ | 8418/12384 [17:51:55<8:22:25, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=8.19s]
Epoch 0: 68%|██████▊ | 8419/12384 [17:51:55<8:22:57, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.19s]
Epoch 0: 68%|██████▊ | 8419/12384 [17:52:03<8:22:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 68%|██████▊ | 8420/12384 [17:52:03<8:22:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 68%|██████▊ | 8420/12384 [17:52:11<8:22:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.50s]
Epoch 0: 68%|██████▊ | 8421/12384 [17:52:11<8:29:20, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.50s]
Epoch 0: 68%|██████▊ | 8421/12384 [17:52:18<8:29:20, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=11.04s]
Epoch 0: 68%|██████▊ | 8422/12384 [17:52:18<8:27:10, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=11.04s]
Epoch 0: 68%|██████▊ | 8422/12384 [17:52:26<8:27:10, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 68%|██████▊ | 8423/12384 [17:52:26<8:25:39, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 68%|██████▊ | 8423/12384 [17:52:34<8:25:39, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 68%|██████▊ | 8424/12384 [17:52:34<8:25:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 68%|██████▊ | 8424/12384 [17:52:41<8:25:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=3.66s]
Epoch 0: 68%|██████▊ | 8425/12384 [17:52:41<8:24:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.66s]
Epoch 0: 68%|██████▊ | 8425/12384 [17:52:49<8:24:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.21s]
Epoch 0: 68%|██████▊ | 8426/12384 [17:52:49<8:23:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.21s]
Epoch 0: 68%|██████▊ | 8426/12384 [17:52:57<8:23:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 0: 68%|██████▊ | 8427/12384 [17:52:57<8:23:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 0: 68%|██████▊ | 8427/12384 [17:53:04<8:23:12, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.83s]
Epoch 0: 68%|██████▊ | 8428/12384 [17:53:04<8:22:54, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.83s]
Epoch 0: 68%|██████▊ | 8428/12384 [17:53:12<8:22:54, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.47s]
Epoch 0: 68%|██████▊ | 8429/12384 [17:53:12<8:22:40, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.47s]
Epoch 0: 68%|██████▊ | 8429/12384 [17:53:19<8:22:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 68%|██████▊ | 8430/12384 [17:53:19<8:22:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 68%|██████▊ | 8430/12384 [17:53:27<8:22:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 68%|██████▊ | 8431/12384 [17:53:27<8:21:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 68%|██████▊ | 8431/12384 [17:53:35<8:21:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 68%|██████▊ | 8432/12384 [17:53:35<8:21:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 68%|██████▊ | 8432/12384 [17:53:42<8:21:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 68%|██████▊ | 8433/12384 [17:53:42<8:21:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 68%|██████▊ | 8433/12384 [17:53:50<8:21:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 68%|██████▊ | 8434/12384 [17:53:50<8:21:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 68%|██████▊ | 8434/12384 [17:53:57<8:21:18, 7.61s/it, loss=0.0024, acc=0.9950, iter_time=6.42s]
Epoch 0: 68%|██████▊ | 8435/12384 [17:53:57<8:20:48, 7.61s/it, loss=0.0024, acc=0.9950, iter_time=6.42s]
Epoch 0: 68%|██████▊ | 8435/12384 [17:54:05<8:20:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 0: 68%|██████▊ | 8436/12384 [17:54:05<8:20:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 0: 68%|██████▊ | 8436/12384 [17:54:13<8:20:35, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=7.61s]
Epoch 0: 68%|██████▊ | 8437/12384 [17:54:13<8:20:17, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=7.61s]
Epoch 0: 68%|██████▊ | 8437/12384 [17:54:20<8:20:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 0: 68%|██████▊ | 8438/12384 [17:54:20<8:20:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 0: 68%|██████▊ | 8438/12384 [17:54:28<8:20:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.60s]
Epoch 0: 68%|██████▊ | 8439/12384 [17:54:28<8:20:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.60s]
Epoch 0: 68%|██████▊ | 8439/12384 [17:54:35<8:20:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 68%|██████▊ | 8440/12384 [17:54:35<8:20:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 68%|██████▊ | 8440/12384 [17:54:43<8:20:20, 7.61s/it, loss=0.0009, acc=0.9961, iter_time=7.20s]
Epoch 0: 68%|██████▊ | 8441/12384 [17:54:43<8:20:15, 7.61s/it, loss=0.0009, acc=0.9961, iter_time=7.20s]
Epoch 0: 68%|██████▊ | 8441/12384 [17:54:51<8:20:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 68%|██████▊ | 8442/12384 [17:54:51<8:19:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 68%|██████▊ | 8442/12384 [17:54:58<8:19:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 0: 68%|██████▊ | 8443/12384 [17:54:58<8:19:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 0: 68%|██████▊ | 8443/12384 [17:55:06<8:19:26, 7.60s/it, loss=0.0039, acc=0.9962, iter_time=5.09s]
Epoch 0: 68%|██████▊ | 8444/12384 [17:55:06<8:19:45, 7.61s/it, loss=0.0039, acc=0.9962, iter_time=5.09s]
Epoch 0: 68%|██████▊ | 8444/12384 [17:55:14<8:19:45, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.22s]
Epoch 0: 68%|██████▊ | 8445/12384 [17:55:14<8:19:09, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=10.22s]
Epoch 0: 68%|██████▊ | 8445/12384 [17:55:21<8:19:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 0: 68%|██████▊ | 8446/12384 [17:55:21<8:20:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 0: 68%|██████▊ | 8446/12384 [17:55:29<8:20:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 68%|██████▊ | 8447/12384 [17:55:29<8:26:21, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 68%|██████▊ | 8447/12384 [17:55:37<8:26:21, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 0: 68%|██████▊ | 8448/12384 [17:55:37<8:24:09, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 0: 68%|██████▊ | 8448/12384 [17:55:44<8:24:09, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 0: 68%|██████▊ | 8449/12384 [17:55:44<8:23:33, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 0: 68%|██████▊ | 8449/12384 [17:55:52<8:23:33, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 68%|██████▊ | 8450/12384 [17:55:52<8:22:17, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 68%|██████▊ | 8450/12384 [17:56:00<8:22:17, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 68%|██████▊ | 8451/12384 [17:56:00<8:20:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 68%|██████▊ | 8451/12384 [17:56:07<8:20:57, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 68%|██████▊ | 8452/12384 [17:56:07<8:19:58, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 68%|██████▊ | 8452/12384 [17:56:15<8:19:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 68%|██████▊ | 8453/12384 [17:56:15<8:19:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 68%|██████▊ | 8453/12384 [17:56:22<8:19:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 68%|██████▊ | 8454/12384 [17:56:22<8:18:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 68%|██████▊ | 8454/12384 [17:56:30<8:18:30, 7.61s/it, loss=0.0004, acc=0.9980, iter_time=6.40s]
Epoch 0: 68%|██████▊ | 8455/12384 [17:56:30<8:17:57, 7.60s/it, loss=0.0004, acc=0.9980, iter_time=6.40s]
Epoch 0: 68%|██████▊ | 8455/12384 [17:56:38<8:17:57, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 0: 68%|██████▊ | 8456/12384 [17:56:38<8:18:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 0: 68%|██████▊ | 8456/12384 [17:56:45<8:18:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 68%|██████▊ | 8457/12384 [17:56:45<8:19:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 68%|██████▊ | 8457/12384 [17:56:53<8:19:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.10s]
Epoch 0: 68%|██████▊ | 8458/12384 [17:56:53<8:18:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.10s]
Epoch 0: 68%|██████▊ | 8458/12384 [17:57:00<8:18:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.12s]
Epoch 0: 68%|██████▊ | 8459/12384 [17:57:00<8:18:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.12s]
Epoch 0: 68%|██████▊ | 8459/12384 [17:57:08<8:18:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.70s]
Epoch 0: 68%|██████▊ | 8460/12384 [17:57:08<8:18:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.70s]
Epoch 0: 68%|██████▊ | 8460/12384 [17:57:16<8:18:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 0: 68%|██████▊ | 8461/12384 [17:57:16<8:18:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 0: 68%|██████▊ | 8461/12384 [17:57:23<8:18:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.88s]
Epoch 0: 68%|██████▊ | 8462/12384 [17:57:23<8:17:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.88s]
Epoch 0: 68%|██████▊ | 8462/12384 [17:57:31<8:17:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 68%|██████▊ | 8463/12384 [17:57:31<8:18:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 68%|██████▊ | 8463/12384 [17:57:39<8:18:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 68%|██████▊ | 8464/12384 [17:57:39<8:18:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 68%|██████▊ | 8464/12384 [17:57:46<8:18:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 0: 68%|██████▊ | 8465/12384 [17:57:46<8:18:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 0: 68%|██████▊ | 8465/12384 [17:57:54<8:18:34, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.18s]
Epoch 0: 68%|██████▊ | 8466/12384 [17:57:54<8:19:16, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=9.18s]
Epoch 0: 68%|██████▊ | 8466/12384 [17:58:02<8:19:16, 7.65s/it, loss=0.0004, acc=1.0000, iter_time=5.58s]
Epoch 0: 68%|██████▊ | 8467/12384 [17:58:02<8:18:05, 7.63s/it, loss=0.0004, acc=1.0000, iter_time=5.58s]
Epoch 0: 68%|██████▊ | 8467/12384 [17:58:09<8:18:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 0: 68%|██████▊ | 8468/12384 [17:58:09<8:17:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 0: 68%|██████▊ | 8468/12384 [17:58:17<8:17:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 68%|██████▊ | 8469/12384 [17:58:17<8:17:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 68%|██████▊ | 8469/12384 [17:58:24<8:17:26, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=7.63s]
Epoch 0: 68%|██████▊ | 8470/12384 [17:58:24<8:17:13, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=7.63s]
Epoch 0: 68%|██████▊ | 8470/12384 [17:58:32<8:17:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 68%|██████▊ | 8471/12384 [17:58:32<8:17:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 68%|██████▊ | 8471/12384 [17:58:40<8:17:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 68%|██████▊ | 8472/12384 [17:58:40<8:17:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 68%|██████▊ | 8472/12384 [17:58:48<8:17:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 0: 68%|██████▊ | 8473/12384 [17:58:48<8:23:02, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 0: 68%|██████▊ | 8473/12384 [17:58:55<8:23:02, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 0: 68%|██████▊ | 8474/12384 [17:58:55<8:20:13, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 0: 68%|██████▊ | 8474/12384 [17:59:03<8:20:13, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 0: 68%|██████▊ | 8475/12384 [17:59:03<8:18:45, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 0: 68%|██████▊ | 8475/12384 [17:59:10<8:18:45, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 0: 68%|██████▊ | 8476/12384 [17:59:10<8:17:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 0: 68%|██████▊ | 8476/12384 [17:59:18<8:17:28, 7.64s/it, loss=0.0005, acc=0.9993, iter_time=7.59s]
Epoch 0: 68%|██████▊ | 8477/12384 [17:59:18<8:16:50, 7.63s/it, loss=0.0005, acc=0.9993, iter_time=7.59s]
Epoch 0: 68%|██████▊ | 8477/12384 [17:59:26<8:16:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 68%|██████▊ | 8478/12384 [17:59:26<8:17:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 68%|██████▊ | 8478/12384 [17:59:33<8:17:14, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=7.64s]
Epoch 0: 68%|██████▊ | 8479/12384 [17:59:33<8:16:11, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=7.64s]
Epoch 0: 68%|██████▊ | 8479/12384 [17:59:41<8:16:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 0: 68%|██████▊ | 8480/12384 [17:59:41<8:16:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 0: 68%|██████▊ | 8480/12384 [17:59:48<8:16:11, 7.63s/it, loss=0.0001, acc=0.9999, iter_time=7.27s]
Epoch 0: 68%|██████▊ | 8481/12384 [17:59:48<8:15:43, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=7.27s]
Epoch 0: 68%|██████▊ | 8481/12384 [17:59:56<8:15:43, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=7.67s]
Epoch 0: 68%|██████▊ | 8482/12384 [17:59:56<8:16:32, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=7.67s]
Epoch 0: 68%|██████▊ | 8482/12384 [18:00:04<8:16:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 68%|██████▊ | 8483/12384 [18:00:04<8:17:45, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 68%|██████▊ | 8483/12384 [18:00:12<8:17:45, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 69%|██████▊ | 8484/12384 [18:00:12<8:18:48, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 69%|██████▊ | 8484/12384 [18:00:19<8:18:48, 7.67s/it, loss=0.0011, acc=0.9977, iter_time=7.71s]
Epoch 0: 69%|██████▊ | 8485/12384 [18:00:19<8:17:29, 7.66s/it, loss=0.0011, acc=0.9977, iter_time=7.71s]
Epoch 0: 69%|██████▊ | 8485/12384 [18:00:27<8:17:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 0: 69%|██████▊ | 8486/12384 [18:00:27<8:16:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 0: 69%|██████▊ | 8486/12384 [18:00:34<8:16:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 0: 69%|██████▊ | 8487/12384 [18:00:34<8:15:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 0: 69%|██████▊ | 8487/12384 [18:00:42<8:15:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 69%|██████▊ | 8488/12384 [18:00:42<8:15:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 69%|██████▊ | 8488/12384 [18:00:50<8:15:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 69%|██████▊ | 8489/12384 [18:00:50<8:14:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 69%|██████▊ | 8489/12384 [18:00:57<8:14:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 69%|██████▊ | 8490/12384 [18:00:57<8:14:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 69%|██████▊ | 8490/12384 [18:01:05<8:14:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 0: 69%|██████▊ | 8491/12384 [18:01:05<8:14:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 0: 69%|██████▊ | 8491/12384 [18:01:12<8:14:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 0: 69%|██████▊ | 8492/12384 [18:01:12<8:14:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 0: 69%|██████▊ | 8492/12384 [18:01:20<8:14:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 69%|██████▊ | 8493/12384 [18:01:20<8:14:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 69%|██████▊ | 8493/12384 [18:01:28<8:14:06, 7.62s/it, loss=0.0010, acc=1.0000, iter_time=5.39s]
Epoch 0: 69%|██████▊ | 8494/12384 [18:01:28<8:15:50, 7.65s/it, loss=0.0010, acc=1.0000, iter_time=5.39s]
Epoch 0: 69%|██████▊ | 8494/12384 [18:01:35<8:15:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.63s]
Epoch 0: 69%|██████▊ | 8495/12384 [18:01:35<8:16:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.63s]
Epoch 0: 69%|██████▊ | 8495/12384 [18:01:43<8:16:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 0: 69%|██████▊ | 8496/12384 [18:01:43<8:15:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 0: 69%|██████▊ | 8496/12384 [18:01:51<8:15:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.46s]
Epoch 0: 69%|██████▊ | 8497/12384 [18:01:51<8:15:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.46s]
Epoch 0: 69%|██████▊ | 8497/12384 [18:01:58<8:15:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 0: 69%|██████▊ | 8498/12384 [18:01:58<8:14:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 0: 69%|██████▊ | 8498/12384 [18:02:06<8:14:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 69%|██████▊ | 8499/12384 [18:02:06<8:20:22, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 69%|██████▊ | 8499/12384 [18:02:14<8:20:22, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 0: 69%|██████▊ | 8500/12384 [18:02:14<8:21:31, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 0: 69%|██████▊ | 8500/12384 [18:02:22<8:21:31, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 0: 69%|██████▊ | 8501/12384 [18:02:22<8:18:16, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 0: 69%|██████▊ | 8501/12384 [18:02:29<8:18:16, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 69%|██████▊ | 8502/12384 [18:02:29<8:18:18, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 69%|██████▊ | 8502/12384 [18:02:37<8:18:18, 7.70s/it, loss=0.0003, acc=0.9984, iter_time=7.41s]
Epoch 0: 69%|██████▊ | 8503/12384 [18:02:37<8:16:37, 7.68s/it, loss=0.0003, acc=0.9984, iter_time=7.41s]
Epoch 0: 69%|██████▊ | 8503/12384 [18:02:45<8:16:37, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 69%|██████▊ | 8504/12384 [18:02:45<8:17:42, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 69%|██████▊ | 8504/12384 [18:02:52<8:17:42, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 69%|██████▊ | 8505/12384 [18:02:52<8:16:06, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 69%|██████▊ | 8505/12384 [18:03:00<8:16:06, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 0: 69%|██████▊ | 8506/12384 [18:03:00<8:14:59, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 0: 69%|██████▊ | 8506/12384 [18:03:08<8:14:59, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 0: 69%|██████▊ | 8507/12384 [18:03:08<8:19:36, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 0: 69%|██████▊ | 8507/12384 [18:03:16<8:19:36, 7.73s/it, loss=0.0003, acc=0.9998, iter_time=7.60s]
Epoch 0: 69%|██████▊ | 8508/12384 [18:03:16<8:18:49, 7.72s/it, loss=0.0003, acc=0.9998, iter_time=7.60s]
Epoch 0: 69%|██████▊ | 8508/12384 [18:03:23<8:18:49, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.79s]
Epoch 0: 69%|██████▊ | 8509/12384 [18:03:23<8:18:55, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.79s]
Epoch 0: 69%|██████▊ | 8509/12384 [18:03:31<8:18:55, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.63s]
Epoch 0: 69%|██████▊ | 8510/12384 [18:03:31<8:16:46, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.63s]
Epoch 0: 69%|██████▊ | 8510/12384 [18:03:39<8:16:46, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 69%|██████▊ | 8511/12384 [18:03:39<8:15:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 69%|██████▊ | 8511/12384 [18:03:46<8:15:13, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=8.01s]
Epoch 0: 69%|██████▊ | 8512/12384 [18:03:46<8:14:11, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=8.01s]
Epoch 0: 69%|██████▊ | 8512/12384 [18:03:54<8:14:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 0: 69%|██████▊ | 8513/12384 [18:03:54<8:13:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 0: 69%|██████▊ | 8513/12384 [18:04:01<8:13:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 0: 69%|██████▉ | 8514/12384 [18:04:01<8:12:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 0: 69%|██████▉ | 8514/12384 [18:04:09<8:12:26, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=4.75s]
Epoch 0: 69%|██████▉ | 8515/12384 [18:04:09<8:11:53, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=4.75s]
Epoch 0: 69%|██████▉ | 8515/12384 [18:04:17<8:11:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 0: 69%|██████▉ | 8516/12384 [18:04:17<8:11:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 0: 69%|██████▉ | 8516/12384 [18:04:24<8:11:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 69%|██████▉ | 8517/12384 [18:04:24<8:11:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 69%|██████▉ | 8517/12384 [18:04:32<8:11:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 69%|██████▉ | 8518/12384 [18:04:32<8:10:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 69%|██████▉ | 8518/12384 [18:04:39<8:10:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 69%|██████▉ | 8519/12384 [18:04:39<8:10:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 69%|██████▉ | 8519/12384 [18:04:47<8:10:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 69%|██████▉ | 8520/12384 [18:04:47<8:09:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 69%|██████▉ | 8520/12384 [18:04:55<8:09:56, 7.61s/it, loss=0.0005, acc=0.9981, iter_time=7.20s]
Epoch 0: 69%|██████▉ | 8521/12384 [18:04:55<8:09:48, 7.61s/it, loss=0.0005, acc=0.9981, iter_time=7.20s]
Epoch 0: 69%|██████▉ | 8521/12384 [18:05:02<8:09:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 69%|██████▉ | 8522/12384 [18:05:02<8:10:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 69%|██████▉ | 8522/12384 [18:05:10<8:10:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 0: 69%|██████▉ | 8523/12384 [18:05:10<8:09:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 0: 69%|██████▉ | 8523/12384 [18:05:17<8:09:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 0: 69%|██████▉ | 8524/12384 [18:05:17<8:09:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 0: 69%|██████▉ | 8524/12384 [18:05:25<8:09:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 0: 69%|██████▉ | 8525/12384 [18:05:25<8:16:04, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 0: 69%|██████▉ | 8525/12384 [18:05:33<8:16:04, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 0: 69%|██████▉ | 8526/12384 [18:05:33<8:14:11, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 0: 69%|██████▉ | 8526/12384 [18:05:41<8:14:11, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 0: 69%|██████▉ | 8527/12384 [18:05:41<8:13:52, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 0: 69%|██████▉ | 8527/12384 [18:05:48<8:13:52, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 69%|██████▉ | 8528/12384 [18:05:48<8:12:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 69%|██████▉ | 8528/12384 [18:05:56<8:12:03, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=6.71s]
Epoch 0: 69%|██████▉ | 8529/12384 [18:05:56<8:11:22, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=6.71s]
Epoch 0: 69%|██████▉ | 8529/12384 [18:06:04<8:11:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 0: 69%|██████▉ | 8530/12384 [18:06:04<8:10:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 0: 69%|██████▉ | 8530/12384 [18:06:11<8:10:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 0: 69%|██████▉ | 8531/12384 [18:06:11<8:09:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 0: 69%|██████▉ | 8531/12384 [18:06:19<8:09:32, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.72s]
Epoch 0: 69%|██████▉ | 8532/12384 [18:06:19<8:11:14, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.72s]
Epoch 0: 69%|██████▉ | 8532/12384 [18:06:27<8:11:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 0: 69%|██████▉ | 8533/12384 [18:06:27<8:15:13, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 0: 69%|██████▉ | 8533/12384 [18:06:34<8:15:13, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 69%|██████▉ | 8534/12384 [18:06:34<8:13:52, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 69%|██████▉ | 8534/12384 [18:06:42<8:13:52, 7.70s/it, loss=0.0002, acc=1.0000, iter_time=7.67s]
Epoch 0: 69%|██████▉ | 8535/12384 [18:06:42<8:13:09, 7.69s/it, loss=0.0002, acc=1.0000, iter_time=7.67s]
Epoch 0: 69%|██████▉ | 8535/12384 [18:06:50<8:13:09, 7.69s/it, loss=0.0004, acc=0.9988, iter_time=8.06s]
Epoch 0: 69%|██████▉ | 8536/12384 [18:06:50<8:11:46, 7.67s/it, loss=0.0004, acc=0.9988, iter_time=8.06s]
Epoch 0: 69%|██████▉ | 8536/12384 [18:06:57<8:11:46, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.57s]
Epoch 0: 69%|██████▉ | 8537/12384 [18:06:57<8:10:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.57s]
Epoch 0: 69%|██████▉ | 8537/12384 [18:07:05<8:10:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 0: 69%|██████▉ | 8538/12384 [18:07:05<8:10:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 0: 69%|██████▉ | 8538/12384 [18:07:13<8:10:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 0: 69%|██████▉ | 8539/12384 [18:07:13<8:08:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 0: 69%|██████▉ | 8539/12384 [18:07:20<8:08:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.54s]
Epoch 0: 69%|██████▉ | 8540/12384 [18:07:20<8:08:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.54s]
Epoch 0: 69%|██████▉ | 8540/12384 [18:07:28<8:08:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 69%|██████▉ | 8541/12384 [18:07:28<8:08:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 69%|██████▉ | 8541/12384 [18:07:35<8:08:17, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=11.13s]
Epoch 0: 69%|██████▉ | 8542/12384 [18:07:35<8:08:16, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=11.13s]
Epoch 0: 69%|██████▉ | 8542/12384 [18:07:43<8:08:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 0: 69%|██████▉ | 8543/12384 [18:07:43<8:07:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 0: 69%|██████▉ | 8543/12384 [18:07:51<8:07:44, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.55s]
Epoch 0: 69%|██████▉ | 8544/12384 [18:07:51<8:07:12, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.55s]
Epoch 0: 69%|██████▉ | 8544/12384 [18:07:58<8:07:12, 7.61s/it, loss=0.0003, acc=0.9982, iter_time=7.64s]
Epoch 0: 69%|██████▉ | 8545/12384 [18:07:58<8:06:49, 7.61s/it, loss=0.0003, acc=0.9982, iter_time=7.64s]
Epoch 0: 69%|██████▉ | 8545/12384 [18:08:06<8:06:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.77s]
Epoch 0: 69%|██████▉ | 8546/12384 [18:08:06<8:06:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.77s]
Epoch 0: 69%|██████▉ | 8546/12384 [18:08:13<8:06:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.92s]
Epoch 0: 69%|██████▉ | 8547/12384 [18:08:13<8:06:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.92s]
Epoch 0: 69%|██████▉ | 8547/12384 [18:08:21<8:06:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 0: 69%|██████▉ | 8548/12384 [18:08:21<8:06:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 0: 69%|██████▉ | 8548/12384 [18:08:29<8:06:17, 7.61s/it, loss=0.0005, acc=0.9983, iter_time=7.61s]
Epoch 0: 69%|██████▉ | 8549/12384 [18:08:29<8:06:03, 7.60s/it, loss=0.0005, acc=0.9983, iter_time=7.61s]
Epoch 0: 69%|██████▉ | 8549/12384 [18:08:36<8:06:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 69%|██████▉ | 8550/12384 [18:08:36<8:06:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 69%|██████▉ | 8550/12384 [18:08:44<8:06:11, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=7.21s]
Epoch 0: 69%|██████▉ | 8551/12384 [18:08:44<8:07:14, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.21s]
Epoch 0: 69%|██████▉ | 8551/12384 [18:08:52<8:07:14, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.94s]
Epoch 0: 69%|██████▉ | 8552/12384 [18:08:52<8:12:51, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=7.94s]
Epoch 0: 69%|██████▉ | 8552/12384 [18:08:59<8:12:51, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 0: 69%|██████▉ | 8553/12384 [18:08:59<8:10:25, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 0: 69%|██████▉ | 8553/12384 [18:09:07<8:10:25, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 0: 69%|██████▉ | 8554/12384 [18:09:07<8:08:51, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 0: 69%|██████▉ | 8554/12384 [18:09:15<8:08:51, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.17s]
Epoch 0: 69%|██████▉ | 8555/12384 [18:09:15<8:08:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.17s]
Epoch 0: 69%|██████▉ | 8555/12384 [18:09:22<8:08:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.86s]
Epoch 0: 69%|██████▉ | 8556/12384 [18:09:22<8:06:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.86s]
Epoch 0: 69%|██████▉ | 8556/12384 [18:09:30<8:06:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 0: 69%|██████▉ | 8557/12384 [18:09:30<8:07:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 0: 69%|██████▉ | 8557/12384 [18:09:38<8:07:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 69%|██████▉ | 8558/12384 [18:09:38<8:07:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 69%|██████▉ | 8558/12384 [18:09:45<8:07:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 69%|██████▉ | 8559/12384 [18:09:45<8:06:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 69%|██████▉ | 8559/12384 [18:09:53<8:06:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 0: 69%|██████▉ | 8560/12384 [18:09:53<8:11:27, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 0: 69%|██████▉ | 8560/12384 [18:10:01<8:11:27, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 69%|██████▉ | 8561/12384 [18:10:01<8:09:42, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 69%|██████▉ | 8561/12384 [18:10:08<8:09:42, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 69%|██████▉ | 8562/12384 [18:10:08<8:08:25, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 69%|██████▉ | 8562/12384 [18:10:16<8:08:25, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 0: 69%|██████▉ | 8563/12384 [18:10:16<8:07:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 0: 69%|██████▉ | 8563/12384 [18:10:23<8:07:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 69%|██████▉ | 8564/12384 [18:10:23<8:05:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 69%|██████▉ | 8564/12384 [18:10:31<8:05:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 69%|██████▉ | 8565/12384 [18:10:31<8:05:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 69%|██████▉ | 8565/12384 [18:10:39<8:05:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.32s]
Epoch 0: 69%|██████▉ | 8566/12384 [18:10:39<8:04:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.32s]
Epoch 0: 69%|██████▉ | 8566/12384 [18:10:46<8:04:35, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=10.38s]
Epoch 0: 69%|██████▉ | 8567/12384 [18:10:46<8:04:18, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=10.38s]
Epoch 0: 69%|██████▉ | 8567/12384 [18:10:54<8:04:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 69%|██████▉ | 8568/12384 [18:10:54<8:04:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 69%|██████▉ | 8568/12384 [18:11:02<8:04:19, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.11s]
Epoch 0: 69%|██████▉ | 8569/12384 [18:11:02<8:03:45, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.11s]
Epoch 0: 69%|██████▉ | 8569/12384 [18:11:09<8:03:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 0: 69%|██████▉ | 8570/12384 [18:11:09<8:03:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 0: 69%|██████▉ | 8570/12384 [18:11:17<8:03:55, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=9.08s]
Epoch 0: 69%|██████▉ | 8571/12384 [18:11:17<8:03:53, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=9.08s]
Epoch 0: 69%|██████▉ | 8571/12384 [18:11:24<8:03:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 69%|██████▉ | 8572/12384 [18:11:24<8:03:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 69%|██████▉ | 8572/12384 [18:11:32<8:03:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 0: 69%|██████▉ | 8573/12384 [18:11:32<8:03:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 0: 69%|██████▉ | 8573/12384 [18:11:40<8:03:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 69%|██████▉ | 8574/12384 [18:11:40<8:03:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 69%|██████▉ | 8574/12384 [18:11:47<8:03:24, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 69%|██████▉ | 8575/12384 [18:11:47<8:03:35, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 69%|██████▉ | 8575/12384 [18:11:55<8:03:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 69%|██████▉ | 8576/12384 [18:11:55<8:03:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 69%|██████▉ | 8576/12384 [18:12:02<8:03:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 69%|██████▉ | 8577/12384 [18:12:02<8:03:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 69%|██████▉ | 8577/12384 [18:12:10<8:03:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 69%|██████▉ | 8578/12384 [18:12:10<8:09:03, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 69%|██████▉ | 8578/12384 [18:12:18<8:09:03, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 0: 69%|██████▉ | 8579/12384 [18:12:18<8:06:52, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 0: 69%|██████▉ | 8579/12384 [18:12:26<8:06:52, 7.68s/it, loss=0.0013, acc=0.9978, iter_time=7.68s]
Epoch 0: 69%|██████▉ | 8580/12384 [18:12:26<8:06:37, 7.68s/it, loss=0.0013, acc=0.9978, iter_time=7.68s]
Epoch 0: 69%|██████▉ | 8580/12384 [18:12:33<8:06:37, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 69%|██████▉ | 8581/12384 [18:12:33<8:06:48, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 69%|██████▉ | 8581/12384 [18:12:41<8:06:48, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 69%|██████▉ | 8582/12384 [18:12:41<8:05:04, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 69%|██████▉ | 8582/12384 [18:12:49<8:05:04, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 69%|██████▉ | 8583/12384 [18:12:49<8:04:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 69%|██████▉ | 8583/12384 [18:12:56<8:04:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 69%|██████▉ | 8584/12384 [18:12:56<8:04:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 69%|██████▉ | 8584/12384 [18:13:04<8:04:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=3.78s]
Epoch 0: 69%|██████▉ | 8585/12384 [18:13:04<8:03:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.78s]
Epoch 0: 69%|██████▉ | 8585/12384 [18:13:12<8:03:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.42s]
Epoch 0: 69%|██████▉ | 8586/12384 [18:13:12<8:08:25, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=11.42s]
Epoch 0: 69%|██████▉ | 8586/12384 [18:13:19<8:08:25, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 69%|██████▉ | 8587/12384 [18:13:19<8:06:26, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 69%|██████▉ | 8587/12384 [18:13:27<8:06:26, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 0: 69%|██████▉ | 8588/12384 [18:13:27<8:04:47, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 0: 69%|██████▉ | 8588/12384 [18:13:35<8:04:47, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 0: 69%|██████▉ | 8589/12384 [18:13:35<8:03:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 0: 69%|██████▉ | 8589/12384 [18:13:42<8:03:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.13s]
Epoch 0: 69%|██████▉ | 8590/12384 [18:13:42<8:02:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.13s]
Epoch 0: 69%|██████▉ | 8590/12384 [18:13:50<8:02:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.61s]
Epoch 0: 69%|██████▉ | 8591/12384 [18:13:50<8:02:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.61s]
Epoch 0: 69%|██████▉ | 8591/12384 [18:13:57<8:02:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 69%|██████▉ | 8592/12384 [18:13:57<8:02:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 69%|██████▉ | 8592/12384 [18:14:05<8:02:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 0: 69%|██████▉ | 8593/12384 [18:14:05<8:01:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 0: 69%|██████▉ | 8593/12384 [18:14:13<8:01:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 0: 69%|██████▉ | 8594/12384 [18:14:13<8:01:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 0: 69%|██████▉ | 8594/12384 [18:14:20<8:01:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 69%|██████▉ | 8595/12384 [18:14:20<8:01:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 69%|██████▉ | 8595/12384 [18:14:28<8:01:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.33s]
Epoch 0: 69%|██████▉ | 8596/12384 [18:14:28<8:01:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.33s]
Epoch 0: 69%|██████▉ | 8596/12384 [18:14:35<8:01:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.67s]
Epoch 0: 69%|██████▉ | 8597/12384 [18:14:35<8:00:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.67s]
Epoch 0: 69%|██████▉ | 8597/12384 [18:14:43<8:00:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 0: 69%|██████▉ | 8598/12384 [18:14:43<8:00:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 0: 69%|██████▉ | 8598/12384 [18:14:51<8:00:15, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 69%|██████▉ | 8599/12384 [18:14:51<8:00:32, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 69%|██████▉ | 8599/12384 [18:14:58<8:00:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 69%|██████▉ | 8600/12384 [18:14:58<8:00:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 69%|██████▉ | 8600/12384 [18:15:06<8:00:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 69%|██████▉ | 8601/12384 [18:15:06<7:59:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 69%|██████▉ | 8601/12384 [18:15:13<7:59:38, 7.61s/it, loss=0.0008, acc=0.9979, iter_time=7.60s]
Epoch 0: 69%|██████▉ | 8602/12384 [18:15:13<7:59:14, 7.60s/it, loss=0.0008, acc=0.9979, iter_time=7.60s]
Epoch 0: 69%|██████▉ | 8602/12384 [18:15:21<7:59:14, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 69%|██████▉ | 8603/12384 [18:15:21<7:59:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 69%|██████▉ | 8603/12384 [18:15:29<7:59:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 0: 69%|██████▉ | 8604/12384 [18:15:29<7:59:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 0: 69%|██████▉ | 8604/12384 [18:15:37<7:59:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 0: 69%|██████▉ | 8605/12384 [18:15:37<8:06:01, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 0: 69%|██████▉ | 8605/12384 [18:15:44<8:06:01, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.47s]
Epoch 0: 69%|██████▉ | 8606/12384 [18:15:44<8:04:09, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.47s]
Epoch 0: 69%|██████▉ | 8606/12384 [18:15:52<8:04:09, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=10.94s]
Epoch 0: 70%|██████▉ | 8607/12384 [18:15:52<8:02:15, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=10.94s]
Epoch 0: 70%|██████▉ | 8607/12384 [18:16:00<8:02:15, 7.66s/it, loss=0.0001, acc=0.9999, iter_time=8.00s]
Epoch 0: 70%|██████▉ | 8608/12384 [18:16:00<8:01:21, 7.65s/it, loss=0.0001, acc=0.9999, iter_time=8.00s]
Epoch 0: 70%|██████▉ | 8608/12384 [18:16:07<8:01:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 70%|██████▉ | 8609/12384 [18:16:07<7:59:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 70%|██████▉ | 8609/12384 [18:16:15<7:59:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 70%|██████▉ | 8610/12384 [18:16:15<7:59:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 70%|██████▉ | 8610/12384 [18:16:22<7:59:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.31s]
Epoch 0: 70%|██████▉ | 8611/12384 [18:16:22<8:00:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.31s]
Epoch 0: 70%|██████▉ | 8611/12384 [18:16:30<8:00:10, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=9.75s]
Epoch 0: 70%|██████▉ | 8612/12384 [18:16:30<7:59:40, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.75s]
Epoch 0: 70%|██████▉ | 8612/12384 [18:16:38<7:59:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 0: 70%|██████▉ | 8613/12384 [18:16:38<8:04:32, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 0: 70%|██████▉ | 8613/12384 [18:16:46<8:04:32, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 70%|██████▉ | 8614/12384 [18:16:46<8:02:37, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 70%|██████▉ | 8614/12384 [18:16:53<8:02:37, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 0: 70%|██████▉ | 8615/12384 [18:16:53<8:01:04, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 0: 70%|██████▉ | 8615/12384 [18:17:01<8:01:04, 7.66s/it, loss=0.0003, acc=0.9998, iter_time=10.00s]
Epoch 0: 70%|██████▉ | 8616/12384 [18:17:01<8:00:15, 7.65s/it, loss=0.0003, acc=0.9998, iter_time=10.00s]
Epoch 0: 70%|██████▉ | 8616/12384 [18:17:08<8:00:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 70%|██████▉ | 8617/12384 [18:17:08<7:59:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 70%|██████▉ | 8617/12384 [18:17:16<7:59:03, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 70%|██████▉ | 8618/12384 [18:17:16<7:58:51, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 70%|██████▉ | 8618/12384 [18:17:24<7:58:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 70%|██████▉ | 8619/12384 [18:17:24<7:58:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 70%|██████▉ | 8619/12384 [18:17:31<7:58:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 0: 70%|██████▉ | 8620/12384 [18:17:31<7:57:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 0: 70%|██████▉ | 8620/12384 [18:17:39<7:57:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.94s]
Epoch 0: 70%|██████▉ | 8621/12384 [18:17:39<7:57:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.94s]
Epoch 0: 70%|██████▉ | 8621/12384 [18:17:46<7:57:10, 7.61s/it, loss=0.0010, acc=0.9950, iter_time=10.47s]
Epoch 0: 70%|██████▉ | 8622/12384 [18:17:46<7:56:41, 7.60s/it, loss=0.0010, acc=0.9950, iter_time=10.47s]
Epoch 0: 70%|██████▉ | 8622/12384 [18:17:54<7:56:41, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 70%|██████▉ | 8623/12384 [18:17:54<7:56:29, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 70%|██████▉ | 8623/12384 [18:18:02<7:56:29, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 70%|██████▉ | 8624/12384 [18:18:02<7:56:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 70%|██████▉ | 8624/12384 [18:18:09<7:56:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 70%|██████▉ | 8625/12384 [18:18:09<7:57:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 70%|██████▉ | 8625/12384 [18:18:17<7:57:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 0: 70%|██████▉ | 8626/12384 [18:18:17<7:58:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 0: 70%|██████▉ | 8626/12384 [18:18:25<7:58:54, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 70%|██████▉ | 8627/12384 [18:18:25<7:57:31, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 70%|██████▉ | 8627/12384 [18:18:32<7:57:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 70%|██████▉ | 8628/12384 [18:18:32<7:57:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 70%|██████▉ | 8628/12384 [18:18:40<7:57:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 70%|██████▉ | 8629/12384 [18:18:40<7:56:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 70%|██████▉ | 8629/12384 [18:18:47<7:56:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 70%|██████▉ | 8630/12384 [18:18:47<7:56:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 70%|██████▉ | 8630/12384 [18:18:55<7:56:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 70%|██████▉ | 8631/12384 [18:18:55<8:02:45, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 70%|██████▉ | 8631/12384 [18:19:03<8:02:45, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=7.82s]
Epoch 0: 70%|██████▉ | 8632/12384 [18:19:03<8:00:10, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.82s]
Epoch 0: 70%|██████▉ | 8632/12384 [18:19:11<8:00:10, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 0: 70%|██████▉ | 8633/12384 [18:19:11<7:58:59, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 0: 70%|██████▉ | 8633/12384 [18:19:18<7:58:59, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 0: 70%|██████▉ | 8634/12384 [18:19:18<7:58:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 0: 70%|██████▉ | 8634/12384 [18:19:26<7:58:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 70%|██████▉ | 8635/12384 [18:19:26<7:57:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 70%|██████▉ | 8635/12384 [18:19:33<7:57:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 70%|██████▉ | 8636/12384 [18:19:33<7:56:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 70%|██████▉ | 8636/12384 [18:19:41<7:56:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 0: 70%|██████▉ | 8637/12384 [18:19:41<7:55:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 0: 70%|██████▉ | 8637/12384 [18:19:49<7:55:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 0: 70%|██████▉ | 8638/12384 [18:19:49<7:55:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 0: 70%|██████▉ | 8638/12384 [18:19:56<7:55:33, 7.62s/it, loss=0.0001, acc=0.9996, iter_time=7.91s]
Epoch 0: 70%|██████▉ | 8639/12384 [18:19:56<8:00:37, 7.70s/it, loss=0.0001, acc=0.9996, iter_time=7.91s]
Epoch 0: 70%|██████▉ | 8639/12384 [18:20:04<8:00:37, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 70%|██████▉ | 8640/12384 [18:20:04<7:58:48, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 70%|██████▉ | 8640/12384 [18:20:12<7:58:48, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 70%|██████▉ | 8641/12384 [18:20:12<7:57:40, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 70%|██████▉ | 8641/12384 [18:20:19<7:57:40, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 70%|██████▉ | 8642/12384 [18:20:19<7:58:11, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 70%|██████▉ | 8642/12384 [18:20:27<7:58:11, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 70%|██████▉ | 8643/12384 [18:20:27<7:57:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 70%|██████▉ | 8643/12384 [18:20:35<7:57:24, 7.66s/it, loss=0.0001, acc=0.9998, iter_time=5.28s]
Epoch 0: 70%|██████▉ | 8644/12384 [18:20:35<7:56:04, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=5.28s]
Epoch 0: 70%|██████▉ | 8644/12384 [18:20:42<7:56:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.80s]
Epoch 0: 70%|██████▉ | 8645/12384 [18:20:42<7:56:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.80s]
Epoch 0: 70%|██████▉ | 8645/12384 [18:20:50<7:56:18, 7.64s/it, loss=0.0001, acc=0.9999, iter_time=10.79s]
Epoch 0: 70%|██████▉ | 8646/12384 [18:20:50<7:55:29, 7.63s/it, loss=0.0001, acc=0.9999, iter_time=10.79s]
Epoch 0: 70%|██████▉ | 8646/12384 [18:20:57<7:55:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 70%|██████▉ | 8647/12384 [18:20:57<7:54:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 70%|██████▉ | 8647/12384 [18:21:05<7:54:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 70%|██████▉ | 8648/12384 [18:21:05<7:54:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 70%|██████▉ | 8648/12384 [18:21:13<7:54:27, 7.62s/it, loss=0.0005, acc=0.9990, iter_time=4.60s]
Epoch 0: 70%|██████▉ | 8649/12384 [18:21:13<7:54:28, 7.62s/it, loss=0.0005, acc=0.9990, iter_time=4.60s]
Epoch 0: 70%|██████▉ | 8649/12384 [18:21:20<7:54:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 0: 70%|██████▉ | 8650/12384 [18:21:20<7:55:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 0: 70%|██████▉ | 8650/12384 [18:21:28<7:55:00, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.20s]
Epoch 0: 70%|██████▉ | 8651/12384 [18:21:28<7:54:38, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.20s]
Epoch 0: 70%|██████▉ | 8651/12384 [18:21:36<7:54:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 70%|██████▉ | 8652/12384 [18:21:36<7:54:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 70%|██████▉ | 8652/12384 [18:21:43<7:54:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 0: 70%|██████▉ | 8653/12384 [18:21:43<7:54:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 0: 70%|██████▉ | 8653/12384 [18:21:51<7:54:14, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.57s]
Epoch 0: 70%|██████▉ | 8654/12384 [18:21:51<7:53:26, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.57s]
Epoch 0: 70%|██████▉ | 8654/12384 [18:21:58<7:53:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 70%|██████▉ | 8655/12384 [18:21:58<7:53:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 70%|██████▉ | 8655/12384 [18:22:06<7:53:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 70%|██████▉ | 8656/12384 [18:22:06<7:53:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 70%|██████▉ | 8656/12384 [18:22:14<7:53:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 70%|██████▉ | 8657/12384 [18:22:14<7:59:39, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 70%|██████▉ | 8657/12384 [18:22:22<7:59:39, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 70%|██████▉ | 8658/12384 [18:22:22<7:57:10, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 70%|██████▉ | 8658/12384 [18:22:29<7:57:10, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 0: 70%|██████▉ | 8659/12384 [18:22:29<7:55:32, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 0: 70%|██████▉ | 8659/12384 [18:22:37<7:55:32, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 70%|██████▉ | 8660/12384 [18:22:37<7:54:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 70%|██████▉ | 8660/12384 [18:22:44<7:54:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 70%|██████▉ | 8661/12384 [18:22:44<7:53:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 70%|██████▉ | 8661/12384 [18:22:52<7:53:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 0: 70%|██████▉ | 8662/12384 [18:22:52<7:52:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 0: 70%|██████▉ | 8662/12384 [18:23:00<7:52:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 70%|██████▉ | 8663/12384 [18:23:00<7:52:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 70%|██████▉ | 8663/12384 [18:23:07<7:52:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 0: 70%|██████▉ | 8664/12384 [18:23:07<7:54:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 0: 70%|██████▉ | 8664/12384 [18:23:15<7:54:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 0: 70%|██████▉ | 8665/12384 [18:23:15<7:58:14, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 0: 70%|██████▉ | 8665/12384 [18:23:23<7:58:14, 7.72s/it, loss=0.0002, acc=0.9989, iter_time=7.60s]
Epoch 0: 70%|██████▉ | 8666/12384 [18:23:23<7:55:57, 7.68s/it, loss=0.0002, acc=0.9989, iter_time=7.60s]
Epoch 0: 70%|██████▉ | 8666/12384 [18:23:30<7:55:57, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 0: 70%|██████▉ | 8667/12384 [18:23:30<7:54:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 0: 70%|██████▉ | 8667/12384 [18:23:38<7:54:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 70%|██████▉ | 8668/12384 [18:23:38<7:53:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 70%|██████▉ | 8668/12384 [18:23:46<7:53:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.29s]
Epoch 0: 70%|███████ | 8669/12384 [18:23:46<7:52:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.29s]
Epoch 0: 70%|███████ | 8669/12384 [18:23:53<7:52:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 0: 70%|███████ | 8670/12384 [18:23:53<7:51:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 0: 70%|███████ | 8670/12384 [18:24:01<7:51:41, 7.62s/it, loss=0.0005, acc=0.9995, iter_time=9.65s]
Epoch 0: 70%|███████ | 8671/12384 [18:24:01<7:53:19, 7.65s/it, loss=0.0005, acc=0.9995, iter_time=9.65s]
Epoch 0: 70%|███████ | 8671/12384 [18:24:09<7:53:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 0: 70%|███████ | 8672/12384 [18:24:09<7:53:44, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 0: 70%|███████ | 8672/12384 [18:24:16<7:53:44, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 0: 70%|███████ | 8673/12384 [18:24:16<7:52:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 0: 70%|███████ | 8673/12384 [18:24:24<7:52:55, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=9.11s]
Epoch 0: 70%|███████ | 8674/12384 [18:24:24<7:52:03, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.11s]
Epoch 0: 70%|███████ | 8674/12384 [18:24:31<7:52:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 0: 70%|███████ | 8675/12384 [18:24:31<7:51:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 0: 70%|███████ | 8675/12384 [18:24:39<7:51:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 0: 70%|███████ | 8676/12384 [18:24:39<7:50:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 0: 70%|███████ | 8676/12384 [18:24:47<7:50:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 70%|███████ | 8677/12384 [18:24:47<7:50:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 70%|███████ | 8677/12384 [18:24:54<7:50:26, 7.61s/it, loss=0.0003, acc=0.9998, iter_time=7.05s]
Epoch 0: 70%|███████ | 8678/12384 [18:24:54<7:49:54, 7.61s/it, loss=0.0003, acc=0.9998, iter_time=7.05s]
Epoch 0: 70%|███████ | 8678/12384 [18:25:02<7:49:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 0: 70%|███████ | 8679/12384 [18:25:02<7:49:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 0: 70%|███████ | 8679/12384 [18:25:09<7:49:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 70%|███████ | 8680/12384 [18:25:09<7:49:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 70%|███████ | 8680/12384 [18:25:17<7:49:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 0: 70%|███████ | 8681/12384 [18:25:17<7:49:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 0: 70%|███████ | 8681/12384 [18:25:25<7:49:42, 7.61s/it, loss=0.0002, acc=0.9988, iter_time=10.46s]
Epoch 0: 70%|███████ | 8682/12384 [18:25:25<7:50:17, 7.62s/it, loss=0.0002, acc=0.9988, iter_time=10.46s]
Epoch 0: 70%|███████ | 8682/12384 [18:25:33<7:50:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 70%|███████ | 8683/12384 [18:25:33<7:55:43, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 70%|███████ | 8683/12384 [18:25:40<7:55:43, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.91s]
Epoch 0: 70%|███████ | 8684/12384 [18:25:40<7:54:11, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.91s]
Epoch 0: 70%|███████ | 8684/12384 [18:25:48<7:54:11, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 0: 70%|███████ | 8685/12384 [18:25:48<7:52:18, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 0: 70%|███████ | 8685/12384 [18:25:55<7:52:18, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 70%|███████ | 8686/12384 [18:25:55<7:51:06, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 70%|███████ | 8686/12384 [18:26:03<7:51:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 0: 70%|███████ | 8687/12384 [18:26:03<7:50:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 0: 70%|███████ | 8687/12384 [18:26:11<7:50:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.52s]
Epoch 0: 70%|███████ | 8688/12384 [18:26:11<7:50:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.52s]
Epoch 0: 70%|███████ | 8688/12384 [18:26:18<7:50:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 0: 70%|███████ | 8689/12384 [18:26:18<7:49:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 0: 70%|███████ | 8689/12384 [18:26:26<7:49:58, 7.63s/it, loss=0.0018, acc=0.9951, iter_time=7.61s]
Epoch 0: 70%|███████ | 8690/12384 [18:26:26<7:49:44, 7.63s/it, loss=0.0018, acc=0.9951, iter_time=7.61s]
Epoch 0: 70%|███████ | 8690/12384 [18:26:34<7:49:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 70%|███████ | 8691/12384 [18:26:34<7:54:33, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 70%|███████ | 8691/12384 [18:26:41<7:54:33, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 70%|███████ | 8692/12384 [18:26:41<7:52:24, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 70%|███████ | 8692/12384 [18:26:49<7:52:24, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 70%|███████ | 8693/12384 [18:26:49<7:51:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 70%|███████ | 8693/12384 [18:26:57<7:51:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 70%|███████ | 8694/12384 [18:26:57<7:51:52, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 70%|███████ | 8694/12384 [18:27:04<7:51:52, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 70%|███████ | 8695/12384 [18:27:04<7:50:40, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 70%|███████ | 8695/12384 [18:27:12<7:50:40, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=8.02s]
Epoch 0: 70%|███████ | 8696/12384 [18:27:12<7:49:18, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=8.02s]
Epoch 0: 70%|███████ | 8696/12384 [18:27:20<7:49:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 0: 70%|███████ | 8697/12384 [18:27:20<7:48:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 0: 70%|███████ | 8697/12384 [18:27:27<7:48:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 0: 70%|███████ | 8698/12384 [18:27:27<7:49:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 0: 70%|███████ | 8698/12384 [18:27:35<7:49:59, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.72s]
Epoch 0: 70%|███████ | 8699/12384 [18:27:35<7:49:25, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.72s]
Epoch 0: 70%|███████ | 8699/12384 [18:27:43<7:49:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 0: 70%|███████ | 8700/12384 [18:27:43<7:49:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 0: 70%|███████ | 8700/12384 [18:27:50<7:49:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 70%|███████ | 8701/12384 [18:27:50<7:48:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 70%|███████ | 8701/12384 [18:27:58<7:48:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 70%|███████ | 8702/12384 [18:27:58<7:48:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 70%|███████ | 8702/12384 [18:28:05<7:48:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 70%|███████ | 8703/12384 [18:28:05<7:47:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 70%|███████ | 8703/12384 [18:28:13<7:47:21, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=8.04s]
Epoch 0: 70%|███████ | 8704/12384 [18:28:13<7:47:27, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=8.04s]
Epoch 0: 70%|███████ | 8704/12384 [18:28:21<7:47:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 70%|███████ | 8705/12384 [18:28:21<7:47:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 70%|███████ | 8705/12384 [18:28:28<7:47:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.80s]
Epoch 0: 70%|███████ | 8706/12384 [18:28:28<7:46:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.80s]
Epoch 0: 70%|███████ | 8706/12384 [18:28:36<7:46:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.64s]
Epoch 0: 70%|███████ | 8707/12384 [18:28:36<7:46:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.64s]
Epoch 0: 70%|███████ | 8707/12384 [18:28:43<7:46:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 0: 70%|███████ | 8708/12384 [18:28:43<7:46:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 0: 70%|███████ | 8708/12384 [18:28:51<7:46:21, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.34s]
Epoch 0: 70%|███████ | 8709/12384 [18:28:51<7:52:07, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=5.34s]
Epoch 0: 70%|███████ | 8709/12384 [18:28:59<7:52:07, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 0: 70%|███████ | 8710/12384 [18:28:59<7:50:00, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 0: 70%|███████ | 8710/12384 [18:29:07<7:50:00, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 70%|███████ | 8711/12384 [18:29:07<7:49:32, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 70%|███████ | 8711/12384 [18:29:14<7:49:32, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 70%|███████ | 8712/12384 [18:29:14<7:48:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 70%|███████ | 8712/12384 [18:29:22<7:48:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 0: 70%|███████ | 8713/12384 [18:29:22<7:48:25, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 0: 70%|███████ | 8713/12384 [18:29:30<7:48:25, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 70%|███████ | 8714/12384 [18:29:30<7:47:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 70%|███████ | 8714/12384 [18:29:37<7:47:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 70%|███████ | 8715/12384 [18:29:37<7:47:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 70%|███████ | 8715/12384 [18:29:45<7:47:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 70%|███████ | 8716/12384 [18:29:45<7:47:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 70%|███████ | 8716/12384 [18:29:52<7:47:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 70%|███████ | 8717/12384 [18:29:52<7:46:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 70%|███████ | 8717/12384 [18:30:00<7:46:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 70%|███████ | 8718/12384 [18:30:00<7:45:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 70%|███████ | 8718/12384 [18:30:08<7:45:50, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 70%|███████ | 8719/12384 [18:30:08<7:45:35, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 70%|███████ | 8719/12384 [18:30:15<7:45:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 70%|███████ | 8720/12384 [18:30:15<7:45:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 70%|███████ | 8720/12384 [18:30:23<7:45:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.27s]
Epoch 0: 70%|███████ | 8721/12384 [18:30:23<7:45:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.27s]
Epoch 0: 70%|███████ | 8721/12384 [18:30:31<7:45:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.00s]
Epoch 0: 70%|███████ | 8722/12384 [18:30:31<7:44:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.00s]
Epoch 0: 70%|███████ | 8722/12384 [18:30:38<7:44:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 70%|███████ | 8723/12384 [18:30:38<7:44:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 70%|███████ | 8723/12384 [18:30:46<7:44:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 0: 70%|███████ | 8724/12384 [18:30:46<7:44:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 0: 70%|███████ | 8724/12384 [18:30:53<7:44:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 0: 70%|███████ | 8725/12384 [18:30:53<7:44:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 0: 70%|███████ | 8725/12384 [18:31:01<7:44:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 70%|███████ | 8726/12384 [18:31:01<7:45:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 70%|███████ | 8726/12384 [18:31:09<7:45:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 70%|███████ | 8727/12384 [18:31:09<7:45:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 70%|███████ | 8727/12384 [18:31:16<7:45:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 70%|███████ | 8728/12384 [18:31:16<7:44:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 70%|███████ | 8728/12384 [18:31:24<7:44:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 70%|███████ | 8729/12384 [18:31:24<7:44:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 70%|███████ | 8729/12384 [18:31:31<7:44:06, 7.62s/it, loss=0.0003, acc=0.9984, iter_time=5.50s]
Epoch 0: 70%|███████ | 8730/12384 [18:31:31<7:43:15, 7.61s/it, loss=0.0003, acc=0.9984, iter_time=5.50s]
Epoch 0: 70%|███████ | 8730/12384 [18:31:39<7:43:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 0: 71%|███████ | 8731/12384 [18:31:39<7:43:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 0: 71%|███████ | 8731/12384 [18:31:47<7:43:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 0: 71%|███████ | 8732/12384 [18:31:47<7:43:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 0: 71%|███████ | 8732/12384 [18:31:54<7:43:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.82s]
Epoch 0: 71%|███████ | 8733/12384 [18:31:54<7:43:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.82s]
Epoch 0: 71%|███████ | 8733/12384 [18:32:02<7:43:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 0: 71%|███████ | 8734/12384 [18:32:02<7:42:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 0: 71%|███████ | 8734/12384 [18:32:10<7:42:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 71%|███████ | 8735/12384 [18:32:10<7:42:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 71%|███████ | 8735/12384 [18:32:17<7:42:47, 7.61s/it, loss=0.0003, acc=0.9997, iter_time=7.91s]
Epoch 0: 71%|███████ | 8736/12384 [18:32:17<7:49:19, 7.72s/it, loss=0.0003, acc=0.9997, iter_time=7.91s]
Epoch 0: 71%|███████ | 8736/12384 [18:32:25<7:49:19, 7.72s/it, loss=0.0002, acc=1.0000, iter_time=7.65s]
Epoch 0: 71%|███████ | 8737/12384 [18:32:25<7:47:20, 7.69s/it, loss=0.0002, acc=1.0000, iter_time=7.65s]
Epoch 0: 71%|███████ | 8737/12384 [18:32:33<7:47:20, 7.69s/it, loss=0.0003, acc=0.9983, iter_time=7.64s]
Epoch 0: 71%|███████ | 8738/12384 [18:32:33<7:45:50, 7.67s/it, loss=0.0003, acc=0.9983, iter_time=7.64s]
Epoch 0: 71%|███████ | 8738/12384 [18:32:40<7:45:50, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 71%|███████ | 8739/12384 [18:32:40<7:45:49, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 71%|███████ | 8739/12384 [18:32:48<7:45:49, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.89s]
Epoch 0: 71%|███████ | 8740/12384 [18:32:48<7:44:59, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.89s]
Epoch 0: 71%|███████ | 8740/12384 [18:32:56<7:44:59, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 0: 71%|███████ | 8741/12384 [18:32:56<7:44:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 0: 71%|███████ | 8741/12384 [18:33:03<7:44:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 0: 71%|███████ | 8742/12384 [18:33:03<7:44:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 0: 71%|███████ | 8742/12384 [18:33:11<7:44:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 71%|███████ | 8743/12384 [18:33:11<7:43:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 71%|███████ | 8743/12384 [18:33:19<7:43:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 71%|███████ | 8744/12384 [18:33:19<7:42:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 71%|███████ | 8744/12384 [18:33:26<7:42:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 71%|███████ | 8745/12384 [18:33:26<7:43:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 71%|███████ | 8745/12384 [18:33:34<7:43:11, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.10s]
Epoch 0: 71%|███████ | 8746/12384 [18:33:34<7:42:31, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.10s]
Epoch 0: 71%|███████ | 8746/12384 [18:33:41<7:42:31, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.20s]
Epoch 0: 71%|███████ | 8747/12384 [18:33:41<7:43:25, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.20s]
Epoch 0: 71%|███████ | 8747/12384 [18:33:49<7:43:25, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.40s]
Epoch 0: 71%|███████ | 8748/12384 [18:33:49<7:42:29, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.40s]
Epoch 0: 71%|███████ | 8748/12384 [18:33:57<7:42:29, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=7.87s]
Epoch 0: 71%|███████ | 8749/12384 [18:33:57<7:42:34, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=7.87s]
Epoch 0: 71%|███████ | 8749/12384 [18:34:04<7:42:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 0: 71%|███████ | 8750/12384 [18:34:04<7:43:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 0: 71%|███████ | 8750/12384 [18:34:12<7:43:13, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.21s]
Epoch 0: 71%|███████ | 8751/12384 [18:34:12<7:42:40, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.21s]
Epoch 0: 71%|███████ | 8751/12384 [18:34:20<7:42:40, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 71%|███████ | 8752/12384 [18:34:20<7:42:35, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 71%|███████ | 8752/12384 [18:34:27<7:42:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 0: 71%|███████ | 8753/12384 [18:34:27<7:41:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 0: 71%|███████ | 8753/12384 [18:34:35<7:41:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.88s]
Epoch 0: 71%|███████ | 8754/12384 [18:34:35<7:42:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.88s]
Epoch 0: 71%|███████ | 8754/12384 [18:34:43<7:42:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 71%|███████ | 8755/12384 [18:34:43<7:41:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 71%|███████ | 8755/12384 [18:34:50<7:41:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 0: 71%|███████ | 8756/12384 [18:34:50<7:41:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 0: 71%|███████ | 8756/12384 [18:34:58<7:41:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 0: 71%|███████ | 8757/12384 [18:34:58<7:40:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 0: 71%|███████ | 8757/12384 [18:35:05<7:40:34, 7.62s/it, loss=0.0005, acc=0.9979, iter_time=6.12s]
Epoch 0: 71%|███████ | 8758/12384 [18:35:05<7:39:55, 7.61s/it, loss=0.0005, acc=0.9979, iter_time=6.12s]
Epoch 0: 71%|███████ | 8758/12384 [18:35:13<7:39:55, 7.61s/it, loss=0.0001, acc=0.9990, iter_time=9.08s]
Epoch 0: 71%|███████ | 8759/12384 [18:35:13<7:39:52, 7.61s/it, loss=0.0001, acc=0.9990, iter_time=9.08s]
Epoch 0: 71%|███████ | 8759/12384 [18:35:21<7:39:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 71%|███████ | 8760/12384 [18:35:21<7:41:58, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 71%|███████ | 8760/12384 [18:35:28<7:41:58, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 0: 71%|███████ | 8761/12384 [18:35:28<7:40:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 0: 71%|███████ | 8761/12384 [18:35:36<7:40:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 0: 71%|███████ | 8762/12384 [18:35:36<7:46:13, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 0: 71%|███████ | 8762/12384 [18:35:44<7:46:13, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 71%|███████ | 8763/12384 [18:35:44<7:43:43, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 71%|███████ | 8763/12384 [18:35:51<7:43:43, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 71%|███████ | 8764/12384 [18:35:51<7:42:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 71%|███████ | 8764/12384 [18:35:59<7:42:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 0: 71%|███████ | 8765/12384 [18:35:59<7:41:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 0: 71%|███████ | 8765/12384 [18:36:07<7:41:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 0: 71%|███████ | 8766/12384 [18:36:07<7:40:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 0: 71%|███████ | 8766/12384 [18:36:14<7:40:21, 7.63s/it, loss=0.0001, acc=0.9995, iter_time=7.63s]
Epoch 0: 71%|███████ | 8767/12384 [18:36:14<7:39:55, 7.63s/it, loss=0.0001, acc=0.9995, iter_time=7.63s]
Epoch 0: 71%|███████ | 8767/12384 [18:36:22<7:39:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 71%|███████ | 8768/12384 [18:36:22<7:39:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 71%|███████ | 8768/12384 [18:36:29<7:39:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 0: 71%|███████ | 8769/12384 [18:36:29<7:38:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 0: 71%|███████ | 8769/12384 [18:36:37<7:38:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.02s]
Epoch 0: 71%|███████ | 8770/12384 [18:36:37<7:43:34, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.02s]
Epoch 0: 71%|███████ | 8770/12384 [18:36:45<7:43:34, 7.70s/it, loss=0.0013, acc=0.9982, iter_time=7.59s]
Epoch 0: 71%|███████ | 8771/12384 [18:36:45<7:41:42, 7.67s/it, loss=0.0013, acc=0.9982, iter_time=7.59s]
Epoch 0: 71%|███████ | 8771/12384 [18:36:53<7:41:42, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 0: 71%|███████ | 8772/12384 [18:36:53<7:40:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 0: 71%|███████ | 8772/12384 [18:37:00<7:40:08, 7.64s/it, loss=0.0004, acc=0.9997, iter_time=9.32s]
Epoch 0: 71%|███████ | 8773/12384 [18:37:00<7:40:17, 7.65s/it, loss=0.0004, acc=0.9997, iter_time=9.32s]
Epoch 0: 71%|███████ | 8773/12384 [18:37:08<7:40:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.89s]
Epoch 0: 71%|███████ | 8774/12384 [18:37:08<7:39:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.89s]
Epoch 0: 71%|███████ | 8774/12384 [18:37:15<7:39:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.09s]
Epoch 0: 71%|███████ | 8775/12384 [18:37:15<7:38:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.09s]
Epoch 0: 71%|███████ | 8775/12384 [18:37:23<7:38:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.38s]
Epoch 0: 71%|███████ | 8776/12384 [18:37:23<7:39:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.38s]
Epoch 0: 71%|███████ | 8776/12384 [18:37:31<7:39:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 71%|███████ | 8777/12384 [18:37:31<7:38:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 71%|███████ | 8777/12384 [18:37:38<7:38:54, 7.63s/it, loss=0.0006, acc=0.9995, iter_time=7.61s]
Epoch 0: 71%|███████ | 8778/12384 [18:37:38<7:38:08, 7.62s/it, loss=0.0006, acc=0.9995, iter_time=7.61s]
Epoch 0: 71%|███████ | 8778/12384 [18:37:46<7:38:08, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 71%|███████ | 8779/12384 [18:37:46<7:37:39, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 71%|███████ | 8779/12384 [18:37:54<7:37:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 71%|███████ | 8780/12384 [18:37:54<7:37:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 71%|███████ | 8780/12384 [18:38:01<7:37:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 71%|███████ | 8781/12384 [18:38:01<7:36:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 71%|███████ | 8781/12384 [18:38:09<7:36:58, 7.61s/it, loss=0.0012, acc=0.9985, iter_time=7.59s]
Epoch 0: 71%|███████ | 8782/12384 [18:38:09<7:36:51, 7.61s/it, loss=0.0012, acc=0.9985, iter_time=7.59s]
Epoch 0: 71%|███████ | 8782/12384 [18:38:16<7:36:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 71%|███████ | 8783/12384 [18:38:16<7:36:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 71%|███████ | 8783/12384 [18:38:24<7:36:40, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 0: 71%|███████ | 8784/12384 [18:38:24<7:36:41, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 0: 71%|███████ | 8784/12384 [18:38:32<7:36:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 71%|███████ | 8785/12384 [18:38:32<7:37:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 71%|███████ | 8785/12384 [18:38:39<7:37:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 71%|███████ | 8786/12384 [18:38:39<7:36:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 71%|███████ | 8786/12384 [18:38:47<7:36:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 71%|███████ | 8787/12384 [18:38:47<7:35:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 71%|███████ | 8787/12384 [18:38:54<7:35:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 71%|███████ | 8788/12384 [18:38:54<7:35:44, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 71%|███████ | 8788/12384 [18:39:02<7:35:44, 7.60s/it, loss=0.0004, acc=0.9996, iter_time=7.65s]
Epoch 0: 71%|███████ | 8789/12384 [18:39:02<7:42:01, 7.71s/it, loss=0.0004, acc=0.9996, iter_time=7.65s]
Epoch 0: 71%|███████ | 8789/12384 [18:39:10<7:42:01, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.63s]
Epoch 0: 71%|███████ | 8790/12384 [18:39:10<7:39:53, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.63s]
Epoch 0: 71%|███████ | 8790/12384 [18:39:18<7:39:53, 7.68s/it, loss=0.0022, acc=0.9967, iter_time=10.25s]
Epoch 0: 71%|███████ | 8791/12384 [18:39:18<7:38:06, 7.65s/it, loss=0.0022, acc=0.9967, iter_time=10.25s]
Epoch 0: 71%|███████ | 8791/12384 [18:39:25<7:38:06, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.60s]
Epoch 0: 71%|███████ | 8792/12384 [18:39:25<7:36:55, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.60s]
Epoch 0: 71%|███████ | 8792/12384 [18:39:33<7:36:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 71%|███████ | 8793/12384 [18:39:33<7:36:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 71%|███████ | 8793/12384 [18:39:40<7:36:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 71%|███████ | 8794/12384 [18:39:40<7:35:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 71%|███████ | 8794/12384 [18:39:48<7:35:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 71%|███████ | 8795/12384 [18:39:48<7:35:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 71%|███████ | 8795/12384 [18:39:56<7:35:38, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 71%|███████ | 8796/12384 [18:39:56<7:35:09, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 71%|███████ | 8796/12384 [18:40:03<7:35:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 71%|███████ | 8797/12384 [18:40:03<7:40:01, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 71%|███████ | 8797/12384 [18:40:11<7:40:01, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 71%|███████ | 8798/12384 [18:40:11<7:38:27, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 71%|███████ | 8798/12384 [18:40:19<7:38:27, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 71%|███████ | 8799/12384 [18:40:19<7:37:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 71%|███████ | 8799/12384 [18:40:26<7:37:11, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.02s]
Epoch 0: 71%|███████ | 8800/12384 [18:40:26<7:36:11, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.02s]
Epoch 0: 71%|███████ | 8800/12384 [18:40:34<7:36:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 71%|███████ | 8801/12384 [18:40:34<7:37:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 71%|███████ | 8801/12384 [18:40:42<7:37:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 71%|███████ | 8802/12384 [18:40:42<7:36:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 71%|███████ | 8802/12384 [18:40:49<7:36:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 71%|███████ | 8803/12384 [18:40:49<7:35:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 71%|███████ | 8803/12384 [18:40:57<7:35:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 71%|███████ | 8804/12384 [18:40:57<7:34:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 71%|███████ | 8804/12384 [18:41:04<7:34:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 71%|███████ | 8805/12384 [18:41:04<7:34:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 71%|███████ | 8805/12384 [18:41:12<7:34:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 71%|███████ | 8806/12384 [18:41:12<7:34:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 71%|███████ | 8806/12384 [18:41:20<7:34:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 0: 71%|███████ | 8807/12384 [18:41:20<7:34:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 0: 71%|███████ | 8807/12384 [18:41:27<7:34:31, 7.62s/it, loss=0.0005, acc=0.9973, iter_time=8.18s]
Epoch 0: 71%|███████ | 8808/12384 [18:41:27<7:33:44, 7.61s/it, loss=0.0005, acc=0.9973, iter_time=8.18s]
Epoch 0: 71%|███████ | 8808/12384 [18:41:35<7:33:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 0: 71%|███████ | 8809/12384 [18:41:35<7:33:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 0: 71%|███████ | 8809/12384 [18:41:42<7:33:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 0: 71%|███████ | 8810/12384 [18:41:42<7:33:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 0: 71%|███████ | 8810/12384 [18:41:50<7:33:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 71%|███████ | 8811/12384 [18:41:50<7:33:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 71%|███████ | 8811/12384 [18:41:58<7:33:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 71%|███████ | 8812/12384 [18:41:58<7:33:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 71%|███████ | 8812/12384 [18:42:05<7:33:01, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.58s]
Epoch 0: 71%|███████ | 8813/12384 [18:42:05<7:32:23, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.58s]
Epoch 0: 71%|███████ | 8813/12384 [18:42:13<7:32:23, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=3.75s]
Epoch 0: 71%|███████ | 8814/12384 [18:42:13<7:31:56, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=3.75s]
Epoch 0: 71%|███████ | 8814/12384 [18:42:21<7:31:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.26s]
Epoch 0: 71%|███████ | 8815/12384 [18:42:21<7:37:53, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.26s]
Epoch 0: 71%|███████ | 8815/12384 [18:42:28<7:37:53, 7.70s/it, loss=0.0004, acc=0.9980, iter_time=9.05s]
Epoch 0: 71%|███████ | 8816/12384 [18:42:28<7:36:16, 7.67s/it, loss=0.0004, acc=0.9980, iter_time=9.05s]
Epoch 0: 71%|███████ | 8816/12384 [18:42:36<7:36:16, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 71%|███████ | 8817/12384 [18:42:36<7:34:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 71%|███████ | 8817/12384 [18:42:44<7:34:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 0: 71%|███████ | 8818/12384 [18:42:44<7:33:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 0: 71%|███████ | 8818/12384 [18:42:51<7:33:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 71%|███████ | 8819/12384 [18:42:51<7:33:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 71%|███████ | 8819/12384 [18:42:59<7:33:34, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=4.26s]
Epoch 0: 71%|███████ | 8820/12384 [18:42:59<7:32:58, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=4.26s]
Epoch 0: 71%|███████ | 8820/12384 [18:43:06<7:32:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.96s]
Epoch 0: 71%|███████ | 8821/12384 [18:43:06<7:32:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.96s]
Epoch 0: 71%|███████ | 8821/12384 [18:43:14<7:32:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 0: 71%|███████ | 8822/12384 [18:43:14<7:32:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 0: 71%|███████ | 8822/12384 [18:43:22<7:32:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 71%|███████ | 8823/12384 [18:43:22<7:31:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 71%|███████ | 8823/12384 [18:43:29<7:31:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.34s]
Epoch 0: 71%|███████▏ | 8824/12384 [18:43:29<7:31:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.34s]
Epoch 0: 71%|███████▏ | 8824/12384 [18:43:37<7:31:58, 7.62s/it, loss=0.0003, acc=0.9993, iter_time=7.21s]
Epoch 0: 71%|███████▏ | 8825/12384 [18:43:37<7:31:20, 7.61s/it, loss=0.0003, acc=0.9993, iter_time=7.21s]
Epoch 0: 71%|███████▏ | 8825/12384 [18:43:44<7:31:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 0: 71%|███████▏ | 8826/12384 [18:43:44<7:31:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 0: 71%|███████▏ | 8826/12384 [18:43:52<7:31:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 0: 71%|███████▏ | 8827/12384 [18:43:52<7:31:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 0: 71%|███████▏ | 8827/12384 [18:44:00<7:31:03, 7.61s/it, loss=0.0006, acc=0.9981, iter_time=4.28s]
Epoch 0: 71%|███████▏ | 8828/12384 [18:44:00<7:30:52, 7.61s/it, loss=0.0006, acc=0.9981, iter_time=4.28s]
Epoch 0: 71%|███████▏ | 8828/12384 [18:44:07<7:30:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.92s]
Epoch 0: 71%|███████▏ | 8829/12384 [18:44:07<7:30:32, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.92s]
Epoch 0: 71%|███████▏ | 8829/12384 [18:44:15<7:30:32, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 71%|███████▏ | 8830/12384 [18:44:15<7:30:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 71%|███████▏ | 8830/12384 [18:44:23<7:30:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 71%|███████▏ | 8831/12384 [18:44:23<7:30:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 71%|███████▏ | 8831/12384 [18:44:30<7:30:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 71%|███████▏ | 8832/12384 [18:44:30<7:30:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 71%|███████▏ | 8832/12384 [18:44:38<7:30:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 0: 71%|███████▏ | 8833/12384 [18:44:38<7:31:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 0: 71%|███████▏ | 8833/12384 [18:44:45<7:31:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.13s]
Epoch 0: 71%|███████▏ | 8834/12384 [18:44:45<7:31:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.13s]
Epoch 0: 71%|███████▏ | 8834/12384 [18:44:53<7:31:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 0: 71%|███████▏ | 8835/12384 [18:44:53<7:30:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 0: 71%|███████▏ | 8835/12384 [18:45:01<7:30:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 0: 71%|███████▏ | 8836/12384 [18:45:01<7:30:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 0: 71%|███████▏ | 8836/12384 [18:45:08<7:30:32, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.40s]
Epoch 0: 71%|███████▏ | 8837/12384 [18:45:08<7:30:14, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.40s]
Epoch 0: 71%|███████▏ | 8837/12384 [18:45:16<7:30:14, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 71%|███████▏ | 8838/12384 [18:45:16<7:29:58, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 71%|███████▏ | 8838/12384 [18:45:24<7:29:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 71%|███████▏ | 8839/12384 [18:45:24<7:30:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 71%|███████▏ | 8839/12384 [18:45:31<7:30:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.35s]
Epoch 0: 71%|███████▏ | 8840/12384 [18:45:31<7:31:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.35s]
Epoch 0: 71%|███████▏ | 8840/12384 [18:45:39<7:31:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 0: 71%|███████▏ | 8841/12384 [18:45:39<7:35:56, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 0: 71%|███████▏ | 8841/12384 [18:45:47<7:35:56, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 0: 71%|███████▏ | 8842/12384 [18:45:47<7:33:29, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 0: 71%|███████▏ | 8842/12384 [18:45:54<7:33:29, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 0: 71%|███████▏ | 8843/12384 [18:45:54<7:31:59, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 0: 71%|███████▏ | 8843/12384 [18:46:02<7:31:59, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 71%|███████▏ | 8844/12384 [18:46:02<7:30:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 71%|███████▏ | 8844/12384 [18:46:10<7:30:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 0: 71%|███████▏ | 8845/12384 [18:46:10<7:30:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 0: 71%|███████▏ | 8845/12384 [18:46:17<7:30:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 0: 71%|███████▏ | 8846/12384 [18:46:17<7:29:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 0: 71%|███████▏ | 8846/12384 [18:46:25<7:29:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.89s]
Epoch 0: 71%|███████▏ | 8847/12384 [18:46:25<7:29:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.89s]
Epoch 0: 71%|███████▏ | 8847/12384 [18:46:32<7:29:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 0: 71%|███████▏ | 8848/12384 [18:46:32<7:29:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 0: 71%|███████▏ | 8848/12384 [18:46:40<7:29:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.98s]
Epoch 0: 71%|███████▏ | 8849/12384 [18:46:40<7:28:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.98s]
Epoch 0: 71%|███████▏ | 8849/12384 [18:46:48<7:28:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.25s]
Epoch 0: 71%|███████▏ | 8850/12384 [18:46:48<7:28:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.25s]
Epoch 0: 71%|███████▏ | 8850/12384 [18:46:55<7:28:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.06s]
Epoch 0: 71%|███████▏ | 8851/12384 [18:46:55<7:28:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.06s]
Epoch 0: 71%|███████▏ | 8851/12384 [18:47:03<7:28:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.55s]
Epoch 0: 71%|███████▏ | 8852/12384 [18:47:03<7:28:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.55s]
Epoch 0: 71%|███████▏ | 8852/12384 [18:47:10<7:28:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 0: 71%|███████▏ | 8853/12384 [18:47:10<7:28:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 0: 71%|███████▏ | 8853/12384 [18:47:18<7:28:22, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 71%|███████▏ | 8854/12384 [18:47:18<7:28:20, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 71%|███████▏ | 8854/12384 [18:47:26<7:28:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 72%|███████▏ | 8855/12384 [18:47:26<7:27:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 72%|███████▏ | 8855/12384 [18:47:33<7:27:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 0: 72%|███████▏ | 8856/12384 [18:47:33<7:27:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 0: 72%|███████▏ | 8856/12384 [18:47:41<7:27:18, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 72%|███████▏ | 8857/12384 [18:47:41<7:27:10, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 72%|███████▏ | 8857/12384 [18:47:48<7:27:10, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 72%|███████▏ | 8858/12384 [18:47:48<7:27:08, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 72%|███████▏ | 8858/12384 [18:47:56<7:27:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 72%|███████▏ | 8859/12384 [18:47:56<7:27:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 72%|███████▏ | 8859/12384 [18:48:04<7:27:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 72%|███████▏ | 8860/12384 [18:48:04<7:28:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 72%|███████▏ | 8860/12384 [18:48:11<7:28:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 0: 72%|███████▏ | 8861/12384 [18:48:11<7:27:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 0: 72%|███████▏ | 8861/12384 [18:48:19<7:27:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 0: 72%|███████▏ | 8862/12384 [18:48:19<7:28:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 0: 72%|███████▏ | 8862/12384 [18:48:27<7:28:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 0: 72%|███████▏ | 8863/12384 [18:48:27<7:27:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 0: 72%|███████▏ | 8863/12384 [18:48:34<7:27:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 0: 72%|███████▏ | 8864/12384 [18:48:34<7:26:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 0: 72%|███████▏ | 8864/12384 [18:48:42<7:26:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 72%|███████▏ | 8865/12384 [18:48:42<7:26:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 72%|███████▏ | 8865/12384 [18:48:49<7:26:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 0: 72%|███████▏ | 8866/12384 [18:48:49<7:26:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 0: 72%|███████▏ | 8866/12384 [18:48:57<7:26:14, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=5.71s]
Epoch 0: 72%|███████▏ | 8867/12384 [18:48:57<7:33:27, 7.74s/it, loss=0.0002, acc=1.0000, iter_time=5.71s]
Epoch 0: 72%|███████▏ | 8867/12384 [18:49:05<7:33:27, 7.74s/it, loss=0.0001, acc=0.9998, iter_time=11.13s]
Epoch 0: 72%|███████▏ | 8868/12384 [18:49:05<7:31:06, 7.70s/it, loss=0.0001, acc=0.9998, iter_time=11.13s]
Epoch 0: 72%|███████▏ | 8868/12384 [18:49:13<7:31:06, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 0: 72%|███████▏ | 8869/12384 [18:49:13<7:29:38, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 0: 72%|███████▏ | 8869/12384 [18:49:20<7:29:38, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.01s]
Epoch 0: 72%|███████▏ | 8870/12384 [18:49:20<7:28:39, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.01s]
Epoch 0: 72%|███████▏ | 8870/12384 [18:49:28<7:28:39, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 0: 72%|███████▏ | 8871/12384 [18:49:28<7:27:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 0: 72%|███████▏ | 8871/12384 [18:49:36<7:27:39, 7.65s/it, loss=0.0008, acc=0.9980, iter_time=7.56s]
Epoch 0: 72%|███████▏ | 8872/12384 [18:49:36<7:27:09, 7.64s/it, loss=0.0008, acc=0.9980, iter_time=7.56s]
Epoch 0: 72%|███████▏ | 8872/12384 [18:49:43<7:27:09, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 72%|███████▏ | 8873/12384 [18:49:43<7:26:37, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 72%|███████▏ | 8873/12384 [18:49:51<7:26:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.85s]
Epoch 0: 72%|███████▏ | 8874/12384 [18:49:51<7:26:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.85s]
Epoch 0: 72%|███████▏ | 8874/12384 [18:49:58<7:26:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 0: 72%|███████▏ | 8875/12384 [18:49:58<7:26:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 0: 72%|███████▏ | 8875/12384 [18:50:06<7:26:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.44s]
Epoch 0: 72%|███████▏ | 8876/12384 [18:50:06<7:25:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.44s]
Epoch 0: 72%|███████▏ | 8876/12384 [18:50:14<7:25:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 72%|███████▏ | 8877/12384 [18:50:14<7:25:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 72%|███████▏ | 8877/12384 [18:50:21<7:25:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 0: 72%|███████▏ | 8878/12384 [18:50:21<7:25:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 0: 72%|███████▏ | 8878/12384 [18:50:29<7:25:27, 7.62s/it, loss=0.0011, acc=0.9980, iter_time=9.41s]
Epoch 0: 72%|███████▏ | 8879/12384 [18:50:29<7:25:02, 7.62s/it, loss=0.0011, acc=0.9980, iter_time=9.41s]
Epoch 0: 72%|███████▏ | 8879/12384 [18:50:37<7:25:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 72%|███████▏ | 8880/12384 [18:50:37<7:25:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 72%|███████▏ | 8880/12384 [18:50:44<7:25:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 0: 72%|███████▏ | 8881/12384 [18:50:44<7:25:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 0: 72%|███████▏ | 8881/12384 [18:50:52<7:25:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 0: 72%|███████▏ | 8882/12384 [18:50:52<7:24:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 0: 72%|███████▏ | 8882/12384 [18:50:59<7:24:59, 7.62s/it, loss=0.0001, acc=0.9997, iter_time=6.41s]
Epoch 0: 72%|███████▏ | 8883/12384 [18:50:59<7:24:42, 7.62s/it, loss=0.0001, acc=0.9997, iter_time=6.41s]
Epoch 0: 72%|███████▏ | 8883/12384 [18:51:07<7:24:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 0: 72%|███████▏ | 8884/12384 [18:51:07<7:23:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 0: 72%|███████▏ | 8884/12384 [18:51:15<7:23:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 72%|███████▏ | 8885/12384 [18:51:15<7:23:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 72%|███████▏ | 8885/12384 [18:51:22<7:23:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 72%|███████▏ | 8886/12384 [18:51:22<7:23:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 72%|███████▏ | 8886/12384 [18:51:30<7:23:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 72%|███████▏ | 8887/12384 [18:51:30<7:23:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 72%|███████▏ | 8887/12384 [18:51:37<7:23:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 72%|███████▏ | 8888/12384 [18:51:37<7:24:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 72%|███████▏ | 8888/12384 [18:51:45<7:24:54, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.29s]
Epoch 0: 72%|███████▏ | 8889/12384 [18:51:45<7:24:00, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.29s]
Epoch 0: 72%|███████▏ | 8889/12384 [18:51:53<7:24:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 0: 72%|███████▏ | 8890/12384 [18:51:53<7:23:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 0: 72%|███████▏ | 8890/12384 [18:52:00<7:23:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 0: 72%|███████▏ | 8891/12384 [18:52:00<7:23:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 0: 72%|███████▏ | 8891/12384 [18:52:08<7:23:41, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 72%|███████▏ | 8892/12384 [18:52:08<7:23:35, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 72%|███████▏ | 8892/12384 [18:52:16<7:23:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 72%|███████▏ | 8893/12384 [18:52:16<7:30:13, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 72%|███████▏ | 8893/12384 [18:52:24<7:30:13, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 0: 72%|███████▏ | 8894/12384 [18:52:24<7:28:11, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 0: 72%|███████▏ | 8894/12384 [18:52:31<7:28:11, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 0: 72%|███████▏ | 8895/12384 [18:52:31<7:26:33, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 0: 72%|███████▏ | 8895/12384 [18:52:39<7:26:33, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 0: 72%|███████▏ | 8896/12384 [18:52:39<7:25:04, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 0: 72%|███████▏ | 8896/12384 [18:52:46<7:25:04, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 72%|███████▏ | 8897/12384 [18:52:46<7:24:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 72%|███████▏ | 8897/12384 [18:52:54<7:24:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 0: 72%|███████▏ | 8898/12384 [18:52:54<7:23:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 0: 72%|███████▏ | 8898/12384 [18:53:02<7:23:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 0: 72%|███████▏ | 8899/12384 [18:53:02<7:22:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 0: 72%|███████▏ | 8899/12384 [18:53:09<7:22:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 72%|███████▏ | 8900/12384 [18:53:09<7:22:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 72%|███████▏ | 8900/12384 [18:53:17<7:22:24, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.49s]
Epoch 0: 72%|███████▏ | 8901/12384 [18:53:17<7:26:43, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.49s]
Epoch 0: 72%|███████▏ | 8901/12384 [18:53:25<7:26:43, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 0: 72%|███████▏ | 8902/12384 [18:53:25<7:25:08, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 0: 72%|███████▏ | 8902/12384 [18:53:32<7:25:08, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 0: 72%|███████▏ | 8903/12384 [18:53:32<7:23:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 0: 72%|███████▏ | 8903/12384 [18:53:40<7:23:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 0: 72%|███████▏ | 8904/12384 [18:53:40<7:24:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 0: 72%|███████▏ | 8904/12384 [18:53:48<7:24:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 0: 72%|███████▏ | 8905/12384 [18:53:48<7:23:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 0: 72%|███████▏ | 8905/12384 [18:53:55<7:23:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 72%|███████▏ | 8906/12384 [18:53:55<7:22:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 72%|███████▏ | 8906/12384 [18:54:03<7:22:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 72%|███████▏ | 8907/12384 [18:54:03<7:21:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 72%|███████▏ | 8907/12384 [18:54:10<7:21:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 0: 72%|███████▏ | 8908/12384 [18:54:10<7:21:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 0: 72%|███████▏ | 8908/12384 [18:54:18<7:21:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 0: 72%|███████▏ | 8909/12384 [18:54:18<7:21:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 0: 72%|███████▏ | 8909/12384 [18:54:26<7:21:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 72%|███████▏ | 8910/12384 [18:54:26<7:21:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 72%|███████▏ | 8910/12384 [18:54:33<7:21:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 0: 72%|███████▏ | 8911/12384 [18:54:33<7:21:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 0: 72%|███████▏ | 8911/12384 [18:54:41<7:21:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 0: 72%|███████▏ | 8912/12384 [18:54:41<7:22:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 0: 72%|███████▏ | 8912/12384 [18:54:49<7:22:18, 7.64s/it, loss=0.0001, acc=0.9989, iter_time=7.66s]
Epoch 0: 72%|███████▏ | 8913/12384 [18:54:49<7:21:26, 7.63s/it, loss=0.0001, acc=0.9989, iter_time=7.66s]
Epoch 0: 72%|███████▏ | 8913/12384 [18:54:56<7:21:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 0: 72%|███████▏ | 8914/12384 [18:54:56<7:20:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 0: 72%|███████▏ | 8914/12384 [18:55:04<7:20:59, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.92s]
Epoch 0: 72%|███████▏ | 8915/12384 [18:55:04<7:20:33, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.92s]
Epoch 0: 72%|███████▏ | 8915/12384 [18:55:11<7:20:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 72%|███████▏ | 8916/12384 [18:55:11<7:20:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 72%|███████▏ | 8916/12384 [18:55:19<7:20:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 72%|███████▏ | 8917/12384 [18:55:19<7:20:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 72%|███████▏ | 8917/12384 [18:55:27<7:20:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 72%|███████▏ | 8918/12384 [18:55:27<7:20:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 72%|███████▏ | 8918/12384 [18:55:34<7:20:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.99s]
Epoch 0: 72%|███████▏ | 8919/12384 [18:55:34<7:19:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.99s]
Epoch 0: 72%|███████▏ | 8919/12384 [18:55:42<7:19:56, 7.62s/it, loss=0.0001, acc=0.9993, iter_time=11.51s]
Epoch 0: 72%|███████▏ | 8920/12384 [18:55:42<7:25:27, 7.72s/it, loss=0.0001, acc=0.9993, iter_time=11.51s]
Epoch 0: 72%|███████▏ | 8920/12384 [18:55:50<7:25:27, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 72%|███████▏ | 8921/12384 [18:55:50<7:23:25, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 72%|███████▏ | 8921/12384 [18:55:57<7:23:25, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 72%|███████▏ | 8922/12384 [18:55:57<7:21:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 72%|███████▏ | 8922/12384 [18:56:05<7:21:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 0: 72%|███████▏ | 8923/12384 [18:56:05<7:22:38, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 0: 72%|███████▏ | 8923/12384 [18:56:13<7:22:38, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 72%|███████▏ | 8924/12384 [18:56:13<7:21:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 72%|███████▏ | 8924/12384 [18:56:20<7:21:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 0: 72%|███████▏ | 8925/12384 [18:56:20<7:20:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 0: 72%|███████▏ | 8925/12384 [18:56:28<7:20:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 72%|███████▏ | 8926/12384 [18:56:28<7:20:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 72%|███████▏ | 8926/12384 [18:56:36<7:20:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 0: 72%|███████▏ | 8927/12384 [18:56:36<7:19:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 0: 72%|███████▏ | 8927/12384 [18:56:44<7:19:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.04s]
Epoch 0: 72%|███████▏ | 8928/12384 [18:56:44<7:24:18, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.04s]
Epoch 0: 72%|███████▏ | 8928/12384 [18:56:51<7:24:18, 7.71s/it, loss=0.0003, acc=0.9995, iter_time=7.20s]
Epoch 0: 72%|███████▏ | 8929/12384 [18:56:51<7:22:16, 7.68s/it, loss=0.0003, acc=0.9995, iter_time=7.20s]
Epoch 0: 72%|███████▏ | 8929/12384 [18:56:59<7:22:16, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 72%|███████▏ | 8930/12384 [18:56:59<7:21:10, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 72%|███████▏ | 8930/12384 [18:57:06<7:21:10, 7.66s/it, loss=0.0003, acc=0.9985, iter_time=7.61s]
Epoch 0: 72%|███████▏ | 8931/12384 [18:57:06<7:19:50, 7.64s/it, loss=0.0003, acc=0.9985, iter_time=7.61s]
Epoch 0: 72%|███████▏ | 8931/12384 [18:57:14<7:19:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 72%|███████▏ | 8932/12384 [18:57:14<7:19:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 72%|███████▏ | 8932/12384 [18:57:22<7:19:11, 7.63s/it, loss=0.0004, acc=0.9981, iter_time=7.60s]
Epoch 0: 72%|███████▏ | 8933/12384 [18:57:22<7:18:38, 7.63s/it, loss=0.0004, acc=0.9981, iter_time=7.60s]
Epoch 0: 72%|███████▏ | 8933/12384 [18:57:29<7:18:38, 7.63s/it, loss=0.0002, acc=0.9997, iter_time=5.52s]
Epoch 0: 72%|███████▏ | 8934/12384 [18:57:29<7:20:05, 7.65s/it, loss=0.0002, acc=0.9997, iter_time=5.52s]
Epoch 0: 72%|███████▏ | 8934/12384 [18:57:37<7:20:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 0: 72%|███████▏ | 8935/12384 [18:57:37<7:19:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 0: 72%|███████▏ | 8935/12384 [18:57:45<7:19:16, 7.64s/it, loss=0.0004, acc=0.9998, iter_time=10.97s]
Epoch 0: 72%|███████▏ | 8936/12384 [18:57:45<7:18:50, 7.64s/it, loss=0.0004, acc=0.9998, iter_time=10.97s]
Epoch 0: 72%|███████▏ | 8936/12384 [18:57:52<7:18:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 72%|███████▏ | 8937/12384 [18:57:52<7:18:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 72%|███████▏ | 8937/12384 [18:58:00<7:18:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 72%|███████▏ | 8938/12384 [18:58:00<7:18:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 72%|███████▏ | 8938/12384 [18:58:07<7:18:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 72%|███████▏ | 8939/12384 [18:58:07<7:17:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 72%|███████▏ | 8939/12384 [18:58:15<7:17:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 0: 72%|███████▏ | 8940/12384 [18:58:15<7:16:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 0: 72%|███████▏ | 8940/12384 [18:58:23<7:16:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 0: 72%|███████▏ | 8941/12384 [18:58:23<7:16:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 0: 72%|███████▏ | 8941/12384 [18:58:30<7:16:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 72%|███████▏ | 8942/12384 [18:58:30<7:16:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 72%|███████▏ | 8942/12384 [18:58:38<7:16:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 72%|███████▏ | 8943/12384 [18:58:38<7:17:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 72%|███████▏ | 8943/12384 [18:58:45<7:17:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 72%|███████▏ | 8944/12384 [18:58:45<7:16:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 72%|███████▏ | 8944/12384 [18:58:53<7:16:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.67s]
Epoch 0: 72%|███████▏ | 8945/12384 [18:58:53<7:16:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.67s]
Epoch 0: 72%|███████▏ | 8945/12384 [18:59:01<7:16:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.24s]
Epoch 0: 72%|███████▏ | 8946/12384 [18:59:01<7:21:05, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.24s]
Epoch 0: 72%|███████▏ | 8946/12384 [18:59:09<7:21:05, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 0: 72%|███████▏ | 8947/12384 [18:59:09<7:19:17, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 0: 72%|███████▏ | 8947/12384 [18:59:16<7:19:17, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 72%|███████▏ | 8948/12384 [18:59:16<7:18:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 72%|███████▏ | 8948/12384 [18:59:24<7:18:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 0: 72%|███████▏ | 8949/12384 [18:59:24<7:17:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 0: 72%|███████▏ | 8949/12384 [18:59:31<7:17:19, 7.64s/it, loss=0.0004, acc=0.9988, iter_time=9.20s]
Epoch 0: 72%|███████▏ | 8950/12384 [18:59:31<7:16:27, 7.63s/it, loss=0.0004, acc=0.9988, iter_time=9.20s]
Epoch 0: 72%|███████▏ | 8950/12384 [18:59:39<7:16:27, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=4.43s]
Epoch 0: 72%|███████▏ | 8951/12384 [18:59:39<7:15:56, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.43s]
Epoch 0: 72%|███████▏ | 8951/12384 [18:59:47<7:15:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.33s]
Epoch 0: 72%|███████▏ | 8952/12384 [18:59:47<7:15:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.33s]
Epoch 0: 72%|███████▏ | 8952/12384 [18:59:54<7:15:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 72%|███████▏ | 8953/12384 [18:59:54<7:15:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 72%|███████▏ | 8953/12384 [19:00:02<7:15:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.54s]
Epoch 0: 72%|███████▏ | 8954/12384 [19:00:02<7:15:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.54s]
Epoch 0: 72%|███████▏ | 8954/12384 [19:00:09<7:15:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.38s]
Epoch 0: 72%|███████▏ | 8955/12384 [19:00:09<7:15:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.38s]
Epoch 0: 72%|███████▏ | 8955/12384 [19:00:17<7:15:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 0: 72%|███████▏ | 8956/12384 [19:00:17<7:15:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 0: 72%|███████▏ | 8956/12384 [19:00:25<7:15:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 72%|███████▏ | 8957/12384 [19:00:25<7:15:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 72%|███████▏ | 8957/12384 [19:00:32<7:15:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 72%|███████▏ | 8958/12384 [19:00:32<7:15:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 72%|███████▏ | 8958/12384 [19:00:40<7:15:49, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.68s]
Epoch 0: 72%|███████▏ | 8959/12384 [19:00:40<7:15:29, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.68s]
Epoch 0: 72%|███████▏ | 8959/12384 [19:00:48<7:15:29, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.58s]
Epoch 0: 72%|███████▏ | 8960/12384 [19:00:48<7:15:10, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.58s]
Epoch 0: 72%|███████▏ | 8960/12384 [19:00:55<7:15:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 72%|███████▏ | 8961/12384 [19:00:55<7:16:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 72%|███████▏ | 8961/12384 [19:01:03<7:16:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 72%|███████▏ | 8962/12384 [19:01:03<7:16:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 72%|███████▏ | 8962/12384 [19:01:10<7:16:05, 7.65s/it, loss=0.0001, acc=0.9998, iter_time=5.86s]
Epoch 0: 72%|███████▏ | 8963/12384 [19:01:10<7:15:30, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=5.86s]
Epoch 0: 72%|███████▏ | 8963/12384 [19:01:18<7:15:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 0: 72%|███████▏ | 8964/12384 [19:01:18<7:15:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 0: 72%|███████▏ | 8964/12384 [19:01:26<7:15:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 72%|███████▏ | 8965/12384 [19:01:26<7:14:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 72%|███████▏ | 8965/12384 [19:01:33<7:14:14, 7.62s/it, loss=0.0012, acc=0.9954, iter_time=7.59s]
Epoch 0: 72%|███████▏ | 8966/12384 [19:01:33<7:13:47, 7.61s/it, loss=0.0012, acc=0.9954, iter_time=7.59s]
Epoch 0: 72%|███████▏ | 8966/12384 [19:01:41<7:13:47, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 72%|███████▏ | 8967/12384 [19:01:41<7:13:38, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 72%|███████▏ | 8967/12384 [19:01:49<7:13:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 72%|███████▏ | 8968/12384 [19:01:49<7:13:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 72%|███████▏ | 8968/12384 [19:01:56<7:13:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 72%|███████▏ | 8969/12384 [19:01:56<7:13:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 72%|███████▏ | 8969/12384 [19:02:04<7:13:33, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 72%|███████▏ | 8970/12384 [19:02:04<7:13:13, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 72%|███████▏ | 8970/12384 [19:02:11<7:13:13, 7.61s/it, loss=0.0004, acc=0.9998, iter_time=7.29s]
Epoch 0: 72%|███████▏ | 8971/12384 [19:02:11<7:12:53, 7.61s/it, loss=0.0004, acc=0.9998, iter_time=7.29s]
Epoch 0: 72%|███████▏ | 8971/12384 [19:02:19<7:12:53, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=7.92s]
Epoch 0: 72%|███████▏ | 8972/12384 [19:02:19<7:12:27, 7.60s/it, loss=0.0003, acc=1.0000, iter_time=7.92s]
Epoch 0: 72%|███████▏ | 8972/12384 [19:02:27<7:12:27, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 72%|███████▏ | 8973/12384 [19:02:27<7:17:55, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 72%|███████▏ | 8973/12384 [19:02:35<7:17:55, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 0: 72%|███████▏ | 8974/12384 [19:02:35<7:16:19, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 0: 72%|███████▏ | 8974/12384 [19:02:42<7:16:19, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 0: 72%|███████▏ | 8975/12384 [19:02:42<7:16:58, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 0: 72%|███████▏ | 8975/12384 [19:02:50<7:16:58, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 0: 72%|███████▏ | 8976/12384 [19:02:50<7:15:27, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 0: 72%|███████▏ | 8976/12384 [19:02:57<7:15:27, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 72%|███████▏ | 8977/12384 [19:02:57<7:14:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 72%|███████▏ | 8977/12384 [19:03:05<7:14:23, 7.65s/it, loss=0.0001, acc=0.9997, iter_time=5.11s]
Epoch 0: 72%|███████▏ | 8978/12384 [19:03:05<7:13:30, 7.64s/it, loss=0.0001, acc=0.9997, iter_time=5.11s]
Epoch 0: 72%|███████▏ | 8978/12384 [19:03:13<7:13:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 0: 73%|███████▎ | 8979/12384 [19:03:13<7:12:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 0: 73%|███████▎ | 8979/12384 [19:03:20<7:12:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 0: 73%|███████▎ | 8980/12384 [19:03:20<7:11:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 0: 73%|███████▎ | 8980/12384 [19:03:28<7:11:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 73%|███████▎ | 8981/12384 [19:03:28<7:16:20, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 73%|███████▎ | 8981/12384 [19:03:36<7:16:20, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.36s]
Epoch 0: 73%|███████▎ | 8982/12384 [19:03:36<7:14:47, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.36s]
Epoch 0: 73%|███████▎ | 8982/12384 [19:03:43<7:14:47, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 0: 73%|███████▎ | 8983/12384 [19:03:43<7:13:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 0: 73%|███████▎ | 8983/12384 [19:03:51<7:13:29, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.52s]
Epoch 0: 73%|███████▎ | 8984/12384 [19:03:51<7:12:05, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.52s]
Epoch 0: 73%|███████▎ | 8984/12384 [19:03:59<7:12:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.52s]
Epoch 0: 73%|███████▎ | 8985/12384 [19:03:59<7:12:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.52s]
Epoch 0: 73%|███████▎ | 8985/12384 [19:04:06<7:12:21, 7.63s/it, loss=0.0006, acc=0.9989, iter_time=10.78s]
Epoch 0: 73%|███████▎ | 8986/12384 [19:04:06<7:11:41, 7.62s/it, loss=0.0006, acc=0.9989, iter_time=10.78s]
Epoch 0: 73%|███████▎ | 8986/12384 [19:04:14<7:11:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 73%|███████▎ | 8987/12384 [19:04:14<7:12:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 73%|███████▎ | 8987/12384 [19:04:21<7:12:13, 7.63s/it, loss=0.0004, acc=0.9989, iter_time=6.56s]
Epoch 0: 73%|███████▎ | 8988/12384 [19:04:21<7:11:25, 7.62s/it, loss=0.0004, acc=0.9989, iter_time=6.56s]
Epoch 0: 73%|███████▎ | 8988/12384 [19:04:29<7:11:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.70s]
Epoch 0: 73%|███████▎ | 8989/12384 [19:04:29<7:11:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.70s]
Epoch 0: 73%|███████▎ | 8989/12384 [19:04:37<7:11:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 73%|███████▎ | 8990/12384 [19:04:37<7:12:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 73%|███████▎ | 8990/12384 [19:04:44<7:12:24, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.70s]
Epoch 0: 73%|███████▎ | 8991/12384 [19:04:44<7:11:52, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.70s]
Epoch 0: 73%|███████▎ | 8991/12384 [19:04:52<7:11:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 73%|███████▎ | 8992/12384 [19:04:52<7:11:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 73%|███████▎ | 8992/12384 [19:05:00<7:11:22, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.20s]
Epoch 0: 73%|███████▎ | 8993/12384 [19:05:00<7:11:23, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.20s]
Epoch 0: 73%|███████▎ | 8993/12384 [19:05:07<7:11:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 0: 73%|███████▎ | 8994/12384 [19:05:07<7:10:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 0: 73%|███████▎ | 8994/12384 [19:05:15<7:10:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 73%|███████▎ | 8995/12384 [19:05:15<7:10:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 73%|███████▎ | 8995/12384 [19:05:22<7:10:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 0: 73%|███████▎ | 8996/12384 [19:05:22<7:10:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 0: 73%|███████▎ | 8996/12384 [19:05:30<7:10:17, 7.62s/it, loss=0.0003, acc=0.9979, iter_time=7.64s]
Epoch 0: 73%|███████▎ | 8997/12384 [19:05:30<7:09:49, 7.61s/it, loss=0.0003, acc=0.9979, iter_time=7.64s]
Epoch 0: 73%|███████▎ | 8997/12384 [19:05:38<7:09:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 0: 73%|███████▎ | 8998/12384 [19:05:38<7:09:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 0: 73%|███████▎ | 8998/12384 [19:05:46<7:09:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 0: 73%|███████▎ | 8999/12384 [19:05:46<7:14:15, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 0: 73%|███████▎ | 8999/12384 [19:05:53<7:14:15, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.03s]
Epoch 0: 73%|███████▎ | 9000/12384 [19:05:53<7:16:09, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=10.03s]
Epoch 0: 73%|███████▎ | 9000/12384 [19:06:01<7:16:09, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 0: 73%|███████▎ | 9001/12384 [19:06:01<7:14:01, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 0: 73%|███████▎ | 9001/12384 [19:06:09<7:14:01, 7.70s/it, loss=0.0002, acc=1.0000, iter_time=5.54s]
Epoch 0: 73%|███████▎ | 9002/12384 [19:06:09<7:12:35, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=5.54s]
Epoch 0: 73%|███████▎ | 9002/12384 [19:06:16<7:12:35, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 0: 73%|███████▎ | 9003/12384 [19:06:16<7:11:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 0: 73%|███████▎ | 9003/12384 [19:06:24<7:11:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 73%|███████▎ | 9004/12384 [19:06:24<7:10:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 73%|███████▎ | 9004/12384 [19:06:31<7:10:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 73%|███████▎ | 9005/12384 [19:06:31<7:09:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 73%|███████▎ | 9005/12384 [19:06:39<7:09:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 0: 73%|███████▎ | 9006/12384 [19:06:39<7:13:38, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 0: 73%|███████▎ | 9006/12384 [19:06:47<7:13:38, 7.70s/it, loss=0.0031, acc=0.9944, iter_time=7.61s]
Epoch 0: 73%|███████▎ | 9007/12384 [19:06:47<7:12:49, 7.69s/it, loss=0.0031, acc=0.9944, iter_time=7.61s]
Epoch 0: 73%|███████▎ | 9007/12384 [19:06:55<7:12:49, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 73%|███████▎ | 9008/12384 [19:06:55<7:11:31, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 73%|███████▎ | 9008/12384 [19:07:02<7:11:31, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.66s]
Epoch 0: 73%|███████▎ | 9009/12384 [19:07:02<7:10:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.66s]
Epoch 0: 73%|███████▎ | 9009/12384 [19:07:10<7:10:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.60s]
Epoch 0: 73%|███████▎ | 9010/12384 [19:07:10<7:11:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.60s]
Epoch 0: 73%|███████▎ | 9010/12384 [19:07:17<7:11:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 0: 73%|███████▎ | 9011/12384 [19:07:17<7:10:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 0: 73%|███████▎ | 9011/12384 [19:07:25<7:10:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 0: 73%|███████▎ | 9012/12384 [19:07:25<7:08:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 0: 73%|███████▎ | 9012/12384 [19:07:33<7:08:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.56s]
Epoch 0: 73%|███████▎ | 9013/12384 [19:07:33<7:08:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.56s]
Epoch 0: 73%|███████▎ | 9013/12384 [19:07:40<7:08:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 0: 73%|███████▎ | 9014/12384 [19:07:40<7:07:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 0: 73%|███████▎ | 9014/12384 [19:07:48<7:07:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 0: 73%|███████▎ | 9015/12384 [19:07:48<7:07:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 0: 73%|███████▎ | 9015/12384 [19:07:56<7:07:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 73%|███████▎ | 9016/12384 [19:07:56<7:07:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 73%|███████▎ | 9016/12384 [19:08:03<7:07:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.63s]
Epoch 0: 73%|███████▎ | 9017/12384 [19:08:03<7:07:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.63s]
Epoch 0: 73%|███████▎ | 9017/12384 [19:08:11<7:07:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 0: 73%|███████▎ | 9018/12384 [19:08:11<7:06:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 0: 73%|███████▎ | 9018/12384 [19:08:18<7:06:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 0: 73%|███████▎ | 9019/12384 [19:08:18<7:06:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 0: 73%|███████▎ | 9019/12384 [19:08:26<7:06:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 0: 73%|███████▎ | 9020/12384 [19:08:26<7:05:49, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 0: 73%|███████▎ | 9020/12384 [19:08:33<7:05:49, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 0: 73%|███████▎ | 9021/12384 [19:08:33<7:05:58, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 0: 73%|███████▎ | 9021/12384 [19:08:41<7:05:58, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 73%|███████▎ | 9022/12384 [19:08:41<7:05:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 73%|███████▎ | 9022/12384 [19:08:49<7:05:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 73%|███████▎ | 9023/12384 [19:08:49<7:05:46, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 73%|███████▎ | 9023/12384 [19:08:56<7:05:46, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 73%|███████▎ | 9024/12384 [19:08:56<7:05:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 73%|███████▎ | 9024/12384 [19:09:04<7:05:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 0: 73%|███████▎ | 9025/12384 [19:09:04<7:11:22, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 0: 73%|███████▎ | 9025/12384 [19:09:12<7:11:22, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 0: 73%|███████▎ | 9026/12384 [19:09:12<7:10:58, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 0: 73%|███████▎ | 9026/12384 [19:09:20<7:10:58, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 0: 73%|███████▎ | 9027/12384 [19:09:20<7:08:58, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 0: 73%|███████▎ | 9027/12384 [19:09:27<7:08:58, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.59s]
Epoch 0: 73%|███████▎ | 9028/12384 [19:09:27<7:07:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.59s]
Epoch 0: 73%|███████▎ | 9028/12384 [19:09:35<7:07:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.62s]
Epoch 0: 73%|███████▎ | 9029/12384 [19:09:35<7:08:43, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.62s]
Epoch 0: 73%|███████▎ | 9029/12384 [19:09:42<7:08:43, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 73%|███████▎ | 9030/12384 [19:09:42<7:07:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 73%|███████▎ | 9030/12384 [19:09:50<7:07:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 73%|███████▎ | 9031/12384 [19:09:50<7:06:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 73%|███████▎ | 9031/12384 [19:09:58<7:06:35, 7.63s/it, loss=0.0004, acc=0.9979, iter_time=7.94s]
Epoch 0: 73%|███████▎ | 9032/12384 [19:09:58<7:06:28, 7.63s/it, loss=0.0004, acc=0.9979, iter_time=7.94s]
Epoch 0: 73%|███████▎ | 9032/12384 [19:10:05<7:06:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 0: 73%|███████▎ | 9033/12384 [19:10:05<7:07:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 0: 73%|███████▎ | 9033/12384 [19:10:13<7:07:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 73%|███████▎ | 9034/12384 [19:10:13<7:07:49, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 73%|███████▎ | 9034/12384 [19:10:21<7:07:49, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 73%|███████▎ | 9035/12384 [19:10:21<7:06:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 73%|███████▎ | 9035/12384 [19:10:28<7:06:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 73%|███████▎ | 9036/12384 [19:10:28<7:06:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 73%|███████▎ | 9036/12384 [19:10:36<7:06:14, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.58s]
Epoch 0: 73%|███████▎ | 9037/12384 [19:10:36<7:05:42, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.58s]
Epoch 0: 73%|███████▎ | 9037/12384 [19:10:44<7:05:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 73%|███████▎ | 9038/12384 [19:10:44<7:05:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 73%|███████▎ | 9038/12384 [19:10:51<7:05:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 0: 73%|███████▎ | 9039/12384 [19:10:51<7:06:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 0: 73%|███████▎ | 9039/12384 [19:10:59<7:06:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.63s]
Epoch 0: 73%|███████▎ | 9040/12384 [19:10:59<7:05:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.63s]
Epoch 0: 73%|███████▎ | 9040/12384 [19:11:06<7:05:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 73%|███████▎ | 9041/12384 [19:11:06<7:05:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 73%|███████▎ | 9041/12384 [19:11:14<7:05:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 73%|███████▎ | 9042/12384 [19:11:14<7:04:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 73%|███████▎ | 9042/12384 [19:11:22<7:04:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 73%|███████▎ | 9043/12384 [19:11:22<7:03:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 73%|███████▎ | 9043/12384 [19:11:29<7:03:58, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.05s]
Epoch 0: 73%|███████▎ | 9044/12384 [19:11:29<7:03:44, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.05s]
Epoch 0: 73%|███████▎ | 9044/12384 [19:11:37<7:03:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 0: 73%|███████▎ | 9045/12384 [19:11:37<7:03:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 0: 73%|███████▎ | 9045/12384 [19:11:44<7:03:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 73%|███████▎ | 9046/12384 [19:11:44<7:03:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 73%|███████▎ | 9046/12384 [19:11:52<7:03:15, 7.61s/it, loss=0.0004, acc=0.9986, iter_time=6.99s]
Epoch 0: 73%|███████▎ | 9047/12384 [19:11:52<7:03:10, 7.61s/it, loss=0.0004, acc=0.9986, iter_time=6.99s]
Epoch 0: 73%|███████▎ | 9047/12384 [19:12:00<7:03:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 0: 73%|███████▎ | 9048/12384 [19:12:00<7:04:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 0: 73%|███████▎ | 9048/12384 [19:12:07<7:04:47, 7.64s/it, loss=0.0001, acc=0.9992, iter_time=7.66s]
Epoch 0: 73%|███████▎ | 9049/12384 [19:12:07<7:04:04, 7.63s/it, loss=0.0001, acc=0.9992, iter_time=7.66s]
Epoch 0: 73%|███████▎ | 9049/12384 [19:12:15<7:04:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 0: 73%|███████▎ | 9050/12384 [19:12:15<7:03:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 0: 73%|███████▎ | 9050/12384 [19:12:23<7:03:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 0: 73%|███████▎ | 9051/12384 [19:12:23<7:10:24, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 0: 73%|███████▎ | 9051/12384 [19:12:31<7:10:24, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=5.72s]
Epoch 0: 73%|███████▎ | 9052/12384 [19:12:31<7:07:49, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.72s]
Epoch 0: 73%|███████▎ | 9052/12384 [19:12:38<7:07:49, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 0: 73%|███████▎ | 9053/12384 [19:12:38<7:05:59, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 0: 73%|███████▎ | 9053/12384 [19:12:46<7:05:59, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=10.71s]
Epoch 0: 73%|███████▎ | 9054/12384 [19:12:46<7:04:40, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=10.71s]
Epoch 0: 73%|███████▎ | 9054/12384 [19:12:53<7:04:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 73%|███████▎ | 9055/12384 [19:12:53<7:03:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 73%|███████▎ | 9055/12384 [19:13:01<7:03:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 0: 73%|███████▎ | 9056/12384 [19:13:01<7:03:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 0: 73%|███████▎ | 9056/12384 [19:13:09<7:03:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 73%|███████▎ | 9057/12384 [19:13:09<7:02:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 73%|███████▎ | 9057/12384 [19:13:16<7:02:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 0: 73%|███████▎ | 9058/12384 [19:13:16<7:02:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 0: 73%|███████▎ | 9058/12384 [19:13:24<7:02:33, 7.62s/it, loss=0.0003, acc=0.9985, iter_time=9.73s]
Epoch 0: 73%|███████▎ | 9059/12384 [19:13:24<7:07:10, 7.71s/it, loss=0.0003, acc=0.9985, iter_time=9.73s]
Epoch 0: 73%|███████▎ | 9059/12384 [19:13:32<7:07:10, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 73%|███████▎ | 9060/12384 [19:13:32<7:06:01, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 73%|███████▎ | 9060/12384 [19:13:39<7:06:01, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 0: 73%|███████▎ | 9061/12384 [19:13:39<7:04:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 0: 73%|███████▎ | 9061/12384 [19:13:47<7:04:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 0: 73%|███████▎ | 9062/12384 [19:13:47<7:03:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 0: 73%|███████▎ | 9062/12384 [19:13:55<7:03:31, 7.65s/it, loss=0.0002, acc=0.9993, iter_time=10.08s]
Epoch 0: 73%|███████▎ | 9063/12384 [19:13:55<7:02:58, 7.64s/it, loss=0.0002, acc=0.9993, iter_time=10.08s]
Epoch 0: 73%|███████▎ | 9063/12384 [19:14:02<7:02:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 0: 73%|███████▎ | 9064/12384 [19:14:02<7:02:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 0: 73%|███████▎ | 9064/12384 [19:14:10<7:02:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 73%|███████▎ | 9065/12384 [19:14:10<7:01:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 73%|███████▎ | 9065/12384 [19:14:18<7:01:37, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.76s]
Epoch 0: 73%|███████▎ | 9066/12384 [19:14:18<7:01:26, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.76s]
Epoch 0: 73%|███████▎ | 9066/12384 [19:14:25<7:01:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 0: 73%|███████▎ | 9067/12384 [19:14:25<7:01:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 0: 73%|███████▎ | 9067/12384 [19:14:33<7:01:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.94s]
Epoch 0: 73%|███████▎ | 9068/12384 [19:14:33<7:00:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.94s]
Epoch 0: 73%|███████▎ | 9068/12384 [19:14:40<7:00:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.92s]
Epoch 0: 73%|███████▎ | 9069/12384 [19:14:40<7:01:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.92s]
Epoch 0: 73%|███████▎ | 9069/12384 [19:14:48<7:01:58, 7.64s/it, loss=0.0003, acc=0.9991, iter_time=7.62s]
Epoch 0: 73%|███████▎ | 9070/12384 [19:14:48<7:01:24, 7.63s/it, loss=0.0003, acc=0.9991, iter_time=7.62s]
Epoch 0: 73%|███████▎ | 9070/12384 [19:14:56<7:01:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 73%|███████▎ | 9071/12384 [19:14:56<7:01:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 73%|███████▎ | 9071/12384 [19:15:03<7:01:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 0: 73%|███████▎ | 9072/12384 [19:15:03<7:00:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 0: 73%|███████▎ | 9072/12384 [19:15:11<7:00:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 73%|███████▎ | 9073/12384 [19:15:11<7:00:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 73%|███████▎ | 9073/12384 [19:15:18<7:00:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 73%|███████▎ | 9074/12384 [19:15:18<7:00:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 73%|███████▎ | 9074/12384 [19:15:26<7:00:04, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.61s]
Epoch 0: 73%|███████▎ | 9075/12384 [19:15:26<6:59:23, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=5.61s]
Epoch 0: 73%|███████▎ | 9075/12384 [19:15:34<6:59:23, 7.60s/it, loss=0.0002, acc=0.9994, iter_time=9.57s]
Epoch 0: 73%|███████▎ | 9076/12384 [19:15:34<6:59:20, 7.61s/it, loss=0.0002, acc=0.9994, iter_time=9.57s]
Epoch 0: 73%|███████▎ | 9076/12384 [19:15:42<6:59:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 73%|███████▎ | 9077/12384 [19:15:42<7:05:04, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 73%|███████▎ | 9077/12384 [19:15:49<7:05:04, 7.71s/it, loss=0.0002, acc=0.9997, iter_time=7.35s]
Epoch 0: 73%|███████▎ | 9078/12384 [19:15:49<7:03:14, 7.68s/it, loss=0.0002, acc=0.9997, iter_time=7.35s]
Epoch 0: 73%|███████▎ | 9078/12384 [19:15:57<7:03:14, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 0: 73%|███████▎ | 9079/12384 [19:15:57<7:02:20, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 0: 73%|███████▎ | 9079/12384 [19:16:05<7:02:20, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 0: 73%|███████▎ | 9080/12384 [19:16:05<7:01:38, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 0: 73%|███████▎ | 9080/12384 [19:16:12<7:01:38, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 73%|███████▎ | 9081/12384 [19:16:12<7:00:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 73%|███████▎ | 9081/12384 [19:16:20<7:00:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 73%|███████▎ | 9082/12384 [19:16:20<7:00:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 73%|███████▎ | 9082/12384 [19:16:27<7:00:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 0: 73%|███████▎ | 9083/12384 [19:16:27<7:00:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 0: 73%|███████▎ | 9083/12384 [19:16:35<7:00:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 0: 73%|███████▎ | 9084/12384 [19:16:35<6:59:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 0: 73%|███████▎ | 9084/12384 [19:16:43<6:59:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 73%|███████▎ | 9085/12384 [19:16:43<7:03:38, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 73%|███████▎ | 9085/12384 [19:16:50<7:03:38, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 0: 73%|███████▎ | 9086/12384 [19:16:50<7:02:01, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 0: 73%|███████▎ | 9086/12384 [19:16:58<7:02:01, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 0: 73%|███████▎ | 9087/12384 [19:16:58<7:02:42, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 0: 73%|███████▎ | 9087/12384 [19:17:06<7:02:42, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 73%|███████▎ | 9088/12384 [19:17:06<7:01:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 73%|███████▎ | 9088/12384 [19:17:13<7:01:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 0: 73%|███████▎ | 9089/12384 [19:17:13<6:59:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 0: 73%|███████▎ | 9089/12384 [19:17:21<6:59:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 0: 73%|███████▎ | 9090/12384 [19:17:21<6:59:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 0: 73%|███████▎ | 9090/12384 [19:17:29<6:59:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 0: 73%|███████▎ | 9091/12384 [19:17:29<6:58:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 0: 73%|███████▎ | 9091/12384 [19:17:36<6:58:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 0: 73%|███████▎ | 9092/12384 [19:17:36<6:57:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 0: 73%|███████▎ | 9092/12384 [19:17:44<6:57:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 0: 73%|███████▎ | 9093/12384 [19:17:44<6:57:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 0: 73%|███████▎ | 9093/12384 [19:17:51<6:57:41, 7.62s/it, loss=0.0006, acc=0.9976, iter_time=5.69s]
Epoch 0: 73%|███████▎ | 9094/12384 [19:17:51<6:57:30, 7.61s/it, loss=0.0006, acc=0.9976, iter_time=5.69s]
Epoch 0: 73%|███████▎ | 9094/12384 [19:17:59<6:57:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 0: 73%|███████▎ | 9095/12384 [19:17:59<6:57:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 0: 73%|███████▎ | 9095/12384 [19:18:07<6:57:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 73%|███████▎ | 9096/12384 [19:18:07<6:57:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 73%|███████▎ | 9096/12384 [19:18:14<6:57:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 73%|███████▎ | 9097/12384 [19:18:14<6:57:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 73%|███████▎ | 9097/12384 [19:18:22<6:57:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 73%|███████▎ | 9098/12384 [19:18:22<6:57:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 73%|███████▎ | 9098/12384 [19:18:30<6:57:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 73%|███████▎ | 9099/12384 [19:18:30<6:57:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 73%|███████▎ | 9099/12384 [19:18:37<6:57:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 0: 73%|███████▎ | 9100/12384 [19:18:37<6:57:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 0: 73%|███████▎ | 9100/12384 [19:18:45<6:57:27, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.36s]
Epoch 0: 73%|███████▎ | 9101/12384 [19:18:45<6:59:26, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.36s]
Epoch 0: 73%|███████▎ | 9101/12384 [19:18:53<6:59:26, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 73%|███████▎ | 9102/12384 [19:18:53<6:58:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 73%|███████▎ | 9102/12384 [19:19:00<6:58:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 0: 74%|███████▎ | 9103/12384 [19:19:00<6:59:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 0: 74%|███████▎ | 9103/12384 [19:19:08<6:59:15, 7.67s/it, loss=0.0006, acc=0.9977, iter_time=9.36s]
Epoch 0: 74%|███████▎ | 9104/12384 [19:19:08<7:04:52, 7.77s/it, loss=0.0006, acc=0.9977, iter_time=9.36s]
Epoch 0: 74%|███████▎ | 9104/12384 [19:19:16<7:04:52, 7.77s/it, loss=0.0005, acc=0.9990, iter_time=7.55s]
Epoch 0: 74%|███████▎ | 9105/12384 [19:19:16<7:03:12, 7.74s/it, loss=0.0005, acc=0.9990, iter_time=7.55s]
Epoch 0: 74%|███████▎ | 9105/12384 [19:19:24<7:03:12, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 0: 74%|███████▎ | 9106/12384 [19:19:24<7:02:18, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 0: 74%|███████▎ | 9106/12384 [19:19:31<7:02:18, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 0: 74%|███████▎ | 9107/12384 [19:19:31<7:01:05, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 0: 74%|███████▎ | 9107/12384 [19:19:39<7:01:05, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 74%|███████▎ | 9108/12384 [19:19:39<6:59:24, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 74%|███████▎ | 9108/12384 [19:19:47<6:59:24, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 74%|███████▎ | 9109/12384 [19:19:47<6:58:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 74%|███████▎ | 9109/12384 [19:19:54<6:58:11, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.61s]
Epoch 0: 74%|███████▎ | 9110/12384 [19:19:54<6:57:28, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.61s]
Epoch 0: 74%|███████▎ | 9110/12384 [19:20:02<6:57:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 0: 74%|███████▎ | 9111/12384 [19:20:02<6:56:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 0: 74%|███████▎ | 9111/12384 [19:20:09<6:56:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 0: 74%|███████▎ | 9112/12384 [19:20:09<6:56:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 0: 74%|███████▎ | 9112/12384 [19:20:17<6:56:03, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.06s]
Epoch 0: 74%|███████▎ | 9113/12384 [19:20:17<6:55:29, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.06s]
Epoch 0: 74%|███████▎ | 9113/12384 [19:20:25<6:55:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.25s]
Epoch 0: 74%|███████▎ | 9114/12384 [19:20:25<6:55:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.25s]
Epoch 0: 74%|███████▎ | 9114/12384 [19:20:32<6:55:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 0: 74%|███████▎ | 9115/12384 [19:20:32<6:54:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 0: 74%|███████▎ | 9115/12384 [19:20:40<6:54:38, 7.61s/it, loss=0.0006, acc=0.9989, iter_time=4.81s]
Epoch 0: 74%|███████▎ | 9116/12384 [19:20:40<6:54:37, 7.61s/it, loss=0.0006, acc=0.9989, iter_time=4.81s]
Epoch 0: 74%|███████▎ | 9116/12384 [19:20:47<6:54:37, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=10.40s]
Epoch 0: 74%|███████▎ | 9117/12384 [19:20:47<6:54:24, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=10.40s]
Epoch 0: 74%|███████▎ | 9117/12384 [19:20:55<6:54:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 0: 74%|███████▎ | 9118/12384 [19:20:55<6:54:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 0: 74%|███████▎ | 9118/12384 [19:21:03<6:54:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 0: 74%|███████▎ | 9119/12384 [19:21:03<6:54:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 0: 74%|███████▎ | 9119/12384 [19:21:10<6:54:09, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.02s]
Epoch 0: 74%|███████▎ | 9120/12384 [19:21:10<6:54:37, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.02s]
Epoch 0: 74%|███████▎ | 9120/12384 [19:21:18<6:54:37, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.24s]
Epoch 0: 74%|███████▎ | 9121/12384 [19:21:18<6:54:14, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.24s]
Epoch 0: 74%|███████▎ | 9121/12384 [19:21:26<6:54:14, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 74%|███████▎ | 9122/12384 [19:21:26<6:54:02, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 74%|███████▎ | 9122/12384 [19:21:33<6:54:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 74%|███████▎ | 9123/12384 [19:21:33<6:53:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 74%|███████▎ | 9123/12384 [19:21:41<6:53:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 74%|███████▎ | 9124/12384 [19:21:41<6:53:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 74%|███████▎ | 9124/12384 [19:21:48<6:53:37, 7.61s/it, loss=0.0001, acc=0.9993, iter_time=7.60s]
Epoch 0: 74%|███████▎ | 9125/12384 [19:21:48<6:53:27, 7.61s/it, loss=0.0001, acc=0.9993, iter_time=7.60s]
Epoch 0: 74%|███████▎ | 9125/12384 [19:21:56<6:53:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 74%|███████▎ | 9126/12384 [19:21:56<6:53:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 74%|███████▎ | 9126/12384 [19:22:04<6:53:29, 7.62s/it, loss=0.0002, acc=0.9996, iter_time=5.84s]
Epoch 0: 74%|███████▎ | 9127/12384 [19:22:04<6:53:17, 7.61s/it, loss=0.0002, acc=0.9996, iter_time=5.84s]
Epoch 0: 74%|███████▎ | 9127/12384 [19:22:11<6:53:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.78s]
Epoch 0: 74%|███████▎ | 9128/12384 [19:22:11<6:53:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.78s]
Epoch 0: 74%|███████▎ | 9128/12384 [19:22:19<6:53:19, 7.62s/it, loss=0.0001, acc=0.9988, iter_time=7.23s]
Epoch 0: 74%|███████▎ | 9129/12384 [19:22:19<6:53:07, 7.62s/it, loss=0.0001, acc=0.9988, iter_time=7.23s]
Epoch 0: 74%|███████▎ | 9129/12384 [19:22:27<6:53:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.35s]
Epoch 0: 74%|███████▎ | 9130/12384 [19:22:27<6:58:16, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.35s]
Epoch 0: 74%|███████▎ | 9130/12384 [19:22:34<6:58:16, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=11.22s]
Epoch 0: 74%|███████▎ | 9131/12384 [19:22:34<6:57:02, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=11.22s]
Epoch 0: 74%|███████▎ | 9131/12384 [19:22:42<6:57:02, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 74%|███████▎ | 9132/12384 [19:22:42<6:55:34, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 74%|███████▎ | 9132/12384 [19:22:50<6:55:34, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 74%|███████▎ | 9133/12384 [19:22:50<6:54:18, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 74%|███████▎ | 9133/12384 [19:22:57<6:54:18, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=5.87s]
Epoch 0: 74%|███████▍ | 9134/12384 [19:22:57<6:53:40, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=5.87s]
Epoch 0: 74%|███████▍ | 9134/12384 [19:23:05<6:53:40, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=7.82s]
Epoch 0: 74%|███████▍ | 9135/12384 [19:23:05<6:53:17, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=7.82s]
Epoch 0: 74%|███████▍ | 9135/12384 [19:23:13<6:53:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.54s]
Epoch 0: 74%|███████▍ | 9136/12384 [19:23:13<6:53:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.54s]
Epoch 0: 74%|███████▍ | 9136/12384 [19:23:20<6:53:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 0: 74%|███████▍ | 9137/12384 [19:23:20<6:52:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 0: 74%|███████▍ | 9137/12384 [19:23:28<6:52:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 74%|███████▍ | 9138/12384 [19:23:28<6:57:08, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 74%|███████▍ | 9138/12384 [19:23:36<6:57:08, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 74%|███████▍ | 9139/12384 [19:23:36<6:56:29, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 74%|███████▍ | 9139/12384 [19:23:43<6:56:29, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 74%|███████▍ | 9140/12384 [19:23:43<6:55:05, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 74%|███████▍ | 9140/12384 [19:23:51<6:55:05, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 0: 74%|███████▍ | 9141/12384 [19:23:51<6:54:10, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 0: 74%|███████▍ | 9141/12384 [19:23:59<6:54:10, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 0: 74%|███████▍ | 9142/12384 [19:23:59<6:53:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 0: 74%|███████▍ | 9142/12384 [19:24:06<6:53:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 0: 74%|███████▍ | 9143/12384 [19:24:06<6:53:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 0: 74%|███████▍ | 9143/12384 [19:24:14<6:53:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.35s]
Epoch 0: 74%|███████▍ | 9144/12384 [19:24:14<6:53:59, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.35s]
Epoch 0: 74%|███████▍ | 9144/12384 [19:24:22<6:53:59, 7.67s/it, loss=0.0001, acc=0.9999, iter_time=7.32s]
Epoch 0: 74%|███████▍ | 9145/12384 [19:24:22<6:52:48, 7.65s/it, loss=0.0001, acc=0.9999, iter_time=7.32s]
Epoch 0: 74%|███████▍ | 9145/12384 [19:24:29<6:52:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 0: 74%|███████▍ | 9146/12384 [19:24:29<6:52:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 0: 74%|███████▍ | 9146/12384 [19:24:37<6:52:10, 7.64s/it, loss=0.0001, acc=0.9999, iter_time=10.16s]
Epoch 0: 74%|███████▍ | 9147/12384 [19:24:37<6:51:22, 7.63s/it, loss=0.0001, acc=0.9999, iter_time=10.16s]
Epoch 0: 74%|███████▍ | 9147/12384 [19:24:44<6:51:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 74%|███████▍ | 9148/12384 [19:24:44<6:51:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 74%|███████▍ | 9148/12384 [19:24:52<6:51:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 74%|███████▍ | 9149/12384 [19:24:52<6:50:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 74%|███████▍ | 9149/12384 [19:25:00<6:50:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 74%|███████▍ | 9150/12384 [19:25:00<6:50:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 74%|███████▍ | 9150/12384 [19:25:07<6:50:14, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 0: 74%|███████▍ | 9151/12384 [19:25:07<6:50:05, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 0: 74%|███████▍ | 9151/12384 [19:25:15<6:50:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 74%|███████▍ | 9152/12384 [19:25:15<6:49:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 74%|███████▍ | 9152/12384 [19:25:22<6:49:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 74%|███████▍ | 9153/12384 [19:25:22<6:50:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 74%|███████▍ | 9153/12384 [19:25:30<6:50:57, 7.63s/it, loss=0.0006, acc=0.9991, iter_time=5.55s]
Epoch 0: 74%|███████▍ | 9154/12384 [19:25:30<6:50:22, 7.62s/it, loss=0.0006, acc=0.9991, iter_time=5.55s]
Epoch 0: 74%|███████▍ | 9154/12384 [19:25:38<6:50:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 0: 74%|███████▍ | 9155/12384 [19:25:38<6:50:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 0: 74%|███████▍ | 9155/12384 [19:25:45<6:50:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 0: 74%|███████▍ | 9156/12384 [19:25:45<6:50:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 0: 74%|███████▍ | 9156/12384 [19:25:53<6:50:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.64s]
Epoch 0: 74%|███████▍ | 9157/12384 [19:25:53<6:55:03, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.64s]
Epoch 0: 74%|███████▍ | 9157/12384 [19:26:01<6:55:03, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.25s]
Epoch 0: 74%|███████▍ | 9158/12384 [19:26:01<6:52:50, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.25s]
Epoch 0: 74%|███████▍ | 9158/12384 [19:26:09<6:52:50, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 0: 74%|███████▍ | 9159/12384 [19:26:09<6:52:51, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 0: 74%|███████▍ | 9159/12384 [19:26:16<6:52:51, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 0: 74%|███████▍ | 9160/12384 [19:26:16<6:51:51, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 0: 74%|███████▍ | 9160/12384 [19:26:24<6:51:51, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 74%|███████▍ | 9161/12384 [19:26:24<6:50:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 74%|███████▍ | 9161/12384 [19:26:31<6:50:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 74%|███████▍ | 9162/12384 [19:26:31<6:50:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 74%|███████▍ | 9162/12384 [19:26:39<6:50:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 74%|███████▍ | 9163/12384 [19:26:39<6:54:26, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 74%|███████▍ | 9163/12384 [19:26:47<6:54:26, 7.72s/it, loss=0.0001, acc=0.9998, iter_time=7.62s]
Epoch 0: 74%|███████▍ | 9164/12384 [19:26:47<6:52:47, 7.69s/it, loss=0.0001, acc=0.9998, iter_time=7.62s]
Epoch 0: 74%|███████▍ | 9164/12384 [19:26:55<6:52:47, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 0: 74%|███████▍ | 9165/12384 [19:26:55<6:51:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 0: 74%|███████▍ | 9165/12384 [19:27:02<6:51:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 0: 74%|███████▍ | 9166/12384 [19:27:02<6:50:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 0: 74%|███████▍ | 9166/12384 [19:27:10<6:50:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=3.65s]
Epoch 0: 74%|███████▍ | 9167/12384 [19:27:10<6:49:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.65s]
Epoch 0: 74%|███████▍ | 9167/12384 [19:27:17<6:49:33, 7.64s/it, loss=0.0006, acc=0.9981, iter_time=11.93s]
Epoch 0: 74%|███████▍ | 9168/12384 [19:27:17<6:49:07, 7.63s/it, loss=0.0006, acc=0.9981, iter_time=11.93s]
Epoch 0: 74%|███████▍ | 9168/12384 [19:27:25<6:49:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 0: 74%|███████▍ | 9169/12384 [19:27:25<6:48:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 0: 74%|███████▍ | 9169/12384 [19:27:33<6:48:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 74%|███████▍ | 9170/12384 [19:27:33<6:48:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 74%|███████▍ | 9170/12384 [19:27:40<6:48:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 74%|███████▍ | 9171/12384 [19:27:40<6:48:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 74%|███████▍ | 9171/12384 [19:27:48<6:48:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 0: 74%|███████▍ | 9172/12384 [19:27:48<6:47:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 0: 74%|███████▍ | 9172/12384 [19:27:55<6:47:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 0: 74%|███████▍ | 9173/12384 [19:27:55<6:47:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 0: 74%|███████▍ | 9173/12384 [19:28:03<6:47:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 74%|███████▍ | 9174/12384 [19:28:03<6:47:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 74%|███████▍ | 9174/12384 [19:28:11<6:47:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 0: 74%|███████▍ | 9175/12384 [19:28:11<6:47:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 0: 74%|███████▍ | 9175/12384 [19:28:18<6:47:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 0: 74%|███████▍ | 9176/12384 [19:28:18<6:46:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 0: 74%|███████▍ | 9176/12384 [19:28:26<6:46:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 74%|███████▍ | 9177/12384 [19:28:26<6:46:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 74%|███████▍ | 9177/12384 [19:28:33<6:46:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 74%|███████▍ | 9178/12384 [19:28:33<6:46:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 74%|███████▍ | 9178/12384 [19:28:41<6:46:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 74%|███████▍ | 9179/12384 [19:28:41<6:46:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 74%|███████▍ | 9179/12384 [19:28:49<6:46:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.99s]
Epoch 0: 74%|███████▍ | 9180/12384 [19:28:49<6:46:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.99s]
Epoch 0: 74%|███████▍ | 9180/12384 [19:28:56<6:46:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 0: 74%|███████▍ | 9181/12384 [19:28:56<6:45:50, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 0: 74%|███████▍ | 9181/12384 [19:29:04<6:45:50, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 0: 74%|███████▍ | 9182/12384 [19:29:04<6:45:45, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 0: 74%|███████▍ | 9182/12384 [19:29:12<6:45:45, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 74%|███████▍ | 9183/12384 [19:29:12<6:51:31, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 74%|███████▍ | 9183/12384 [19:29:19<6:51:31, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 0: 74%|███████▍ | 9184/12384 [19:29:19<6:49:53, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 0: 74%|███████▍ | 9184/12384 [19:29:27<6:49:53, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 74%|███████▍ | 9185/12384 [19:29:27<6:48:32, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 74%|███████▍ | 9185/12384 [19:29:35<6:48:32, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 74%|███████▍ | 9186/12384 [19:29:35<6:47:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 74%|███████▍ | 9186/12384 [19:29:42<6:47:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 74%|███████▍ | 9187/12384 [19:29:42<6:46:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 74%|███████▍ | 9187/12384 [19:29:50<6:46:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 74%|███████▍ | 9188/12384 [19:29:50<6:46:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 74%|███████▍ | 9188/12384 [19:29:58<6:46:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 74%|███████▍ | 9189/12384 [19:29:58<6:46:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 74%|███████▍ | 9189/12384 [19:30:05<6:46:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 0: 74%|███████▍ | 9190/12384 [19:30:05<6:50:35, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 0: 74%|███████▍ | 9190/12384 [19:30:13<6:50:35, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 74%|███████▍ | 9191/12384 [19:30:13<6:48:39, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 74%|███████▍ | 9191/12384 [19:30:21<6:48:39, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 74%|███████▍ | 9192/12384 [19:30:21<6:47:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 74%|███████▍ | 9192/12384 [19:30:28<6:47:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 0: 74%|███████▍ | 9193/12384 [19:30:28<6:47:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 0: 74%|███████▍ | 9193/12384 [19:30:36<6:47:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 0: 74%|███████▍ | 9194/12384 [19:30:36<6:46:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 0: 74%|███████▍ | 9194/12384 [19:30:44<6:46:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 74%|███████▍ | 9195/12384 [19:30:44<6:45:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 74%|███████▍ | 9195/12384 [19:30:51<6:45:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 74%|███████▍ | 9196/12384 [19:30:51<6:45:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 74%|███████▍ | 9196/12384 [19:30:59<6:45:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 74%|███████▍ | 9197/12384 [19:30:59<6:44:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 74%|███████▍ | 9197/12384 [19:31:06<6:44:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 74%|███████▍ | 9198/12384 [19:31:06<6:44:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 74%|███████▍ | 9198/12384 [19:31:14<6:44:47, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=7.63s]
Epoch 0: 74%|███████▍ | 9199/12384 [19:31:14<6:44:32, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=7.63s]
Epoch 0: 74%|███████▍ | 9199/12384 [19:31:22<6:44:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.12s]
Epoch 0: 74%|███████▍ | 9200/12384 [19:31:22<6:45:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.12s]
Epoch 0: 74%|███████▍ | 9200/12384 [19:31:29<6:45:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 74%|███████▍ | 9201/12384 [19:31:29<6:44:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 74%|███████▍ | 9201/12384 [19:31:37<6:44:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 74%|███████▍ | 9202/12384 [19:31:37<6:44:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 74%|███████▍ | 9202/12384 [19:31:44<6:44:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 74%|███████▍ | 9203/12384 [19:31:44<6:43:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 74%|███████▍ | 9203/12384 [19:31:52<6:43:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 74%|███████▍ | 9204/12384 [19:31:52<6:43:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 74%|███████▍ | 9204/12384 [19:32:00<6:43:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 0: 74%|███████▍ | 9205/12384 [19:32:00<6:43:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 0: 74%|███████▍ | 9205/12384 [19:32:07<6:43:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 0: 74%|███████▍ | 9206/12384 [19:32:07<6:43:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 0: 74%|███████▍ | 9206/12384 [19:32:15<6:43:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 74%|███████▍ | 9207/12384 [19:32:15<6:43:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 74%|███████▍ | 9207/12384 [19:32:23<6:43:14, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 74%|███████▍ | 9208/12384 [19:32:23<6:43:06, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 74%|███████▍ | 9208/12384 [19:32:31<6:43:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 74%|███████▍ | 9209/12384 [19:32:31<6:48:32, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 74%|███████▍ | 9209/12384 [19:32:38<6:48:32, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.82s]
Epoch 0: 74%|███████▍ | 9210/12384 [19:32:38<6:46:50, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.82s]
Epoch 0: 74%|███████▍ | 9210/12384 [19:32:46<6:46:50, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 0: 74%|███████▍ | 9211/12384 [19:32:46<6:45:34, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 0: 74%|███████▍ | 9211/12384 [19:32:53<6:45:34, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 0: 74%|███████▍ | 9212/12384 [19:32:53<6:44:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 0: 74%|███████▍ | 9212/12384 [19:33:01<6:44:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 74%|███████▍ | 9213/12384 [19:33:01<6:43:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 74%|███████▍ | 9213/12384 [19:33:09<6:43:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.27s]
Epoch 0: 74%|███████▍ | 9214/12384 [19:33:09<6:43:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.27s]
Epoch 0: 74%|███████▍ | 9214/12384 [19:33:16<6:43:09, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=11.27s]
Epoch 0: 74%|███████▍ | 9215/12384 [19:33:16<6:47:13, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=11.27s]
Epoch 0: 74%|███████▍ | 9215/12384 [19:33:24<6:47:13, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 74%|███████▍ | 9216/12384 [19:33:24<6:45:27, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 74%|███████▍ | 9216/12384 [19:33:32<6:45:27, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.23s]
Epoch 0: 74%|███████▍ | 9217/12384 [19:33:32<6:44:29, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.23s]
Epoch 0: 74%|███████▍ | 9217/12384 [19:33:39<6:44:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 0: 74%|███████▍ | 9218/12384 [19:33:39<6:43:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 0: 74%|███████▍ | 9218/12384 [19:33:47<6:43:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.23s]
Epoch 0: 74%|███████▍ | 9219/12384 [19:33:47<6:43:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.23s]
Epoch 0: 74%|███████▍ | 9219/12384 [19:33:55<6:43:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 74%|███████▍ | 9220/12384 [19:33:55<6:42:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 74%|███████▍ | 9220/12384 [19:34:02<6:42:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 74%|███████▍ | 9221/12384 [19:34:02<6:42:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 74%|███████▍ | 9221/12384 [19:34:10<6:42:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 74%|███████▍ | 9222/12384 [19:34:10<6:42:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 74%|███████▍ | 9222/12384 [19:34:17<6:42:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 74%|███████▍ | 9223/12384 [19:34:17<6:41:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 74%|███████▍ | 9223/12384 [19:34:25<6:41:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 0: 74%|███████▍ | 9224/12384 [19:34:25<6:41:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 0: 74%|███████▍ | 9224/12384 [19:34:33<6:41:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 0: 74%|███████▍ | 9225/12384 [19:34:33<6:40:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 0: 74%|███████▍ | 9225/12384 [19:34:40<6:40:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 0: 74%|███████▍ | 9226/12384 [19:34:40<6:41:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 0: 74%|███████▍ | 9226/12384 [19:34:48<6:41:00, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.05s]
Epoch 0: 75%|███████▍ | 9227/12384 [19:34:48<6:41:04, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.05s]
Epoch 0: 75%|███████▍ | 9227/12384 [19:34:56<6:41:04, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.40s]
Epoch 0: 75%|███████▍ | 9228/12384 [19:34:56<6:40:41, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.40s]
Epoch 0: 75%|███████▍ | 9228/12384 [19:35:03<6:40:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 0: 75%|███████▍ | 9229/12384 [19:35:03<6:40:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 0: 75%|███████▍ | 9229/12384 [19:35:11<6:40:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 0: 75%|███████▍ | 9230/12384 [19:35:11<6:39:45, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 0: 75%|███████▍ | 9230/12384 [19:35:18<6:39:45, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 75%|███████▍ | 9231/12384 [19:35:18<6:39:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 75%|███████▍ | 9231/12384 [19:35:26<6:39:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 75%|███████▍ | 9232/12384 [19:35:26<6:39:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 75%|███████▍ | 9232/12384 [19:35:34<6:39:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.20s]
Epoch 0: 75%|███████▍ | 9233/12384 [19:35:34<6:39:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.20s]
Epoch 0: 75%|███████▍ | 9233/12384 [19:35:41<6:39:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.61s]
Epoch 0: 75%|███████▍ | 9234/12384 [19:35:41<6:39:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.61s]
Epoch 0: 75%|███████▍ | 9234/12384 [19:35:49<6:39:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 0: 75%|███████▍ | 9235/12384 [19:35:49<6:44:33, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 0: 75%|███████▍ | 9235/12384 [19:35:57<6:44:33, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.31s]
Epoch 0: 75%|███████▍ | 9236/12384 [19:35:57<6:43:00, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.31s]
Epoch 0: 75%|███████▍ | 9236/12384 [19:36:04<6:43:00, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 0: 75%|███████▍ | 9237/12384 [19:36:04<6:41:43, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 0: 75%|███████▍ | 9237/12384 [19:36:12<6:41:43, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 0: 75%|███████▍ | 9238/12384 [19:36:12<6:40:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 0: 75%|███████▍ | 9238/12384 [19:36:20<6:40:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 75%|███████▍ | 9239/12384 [19:36:20<6:40:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 75%|███████▍ | 9239/12384 [19:36:27<6:40:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 0: 75%|███████▍ | 9240/12384 [19:36:27<6:40:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 0: 75%|███████▍ | 9240/12384 [19:36:35<6:40:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 75%|███████▍ | 9241/12384 [19:36:35<6:43:05, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 75%|███████▍ | 9241/12384 [19:36:43<6:43:05, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 75%|███████▍ | 9242/12384 [19:36:43<6:42:45, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 75%|███████▍ | 9242/12384 [19:36:50<6:42:45, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 75%|███████▍ | 9243/12384 [19:36:50<6:41:21, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 75%|███████▍ | 9243/12384 [19:36:58<6:41:21, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 0: 75%|███████▍ | 9244/12384 [19:36:58<6:40:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 0: 75%|███████▍ | 9244/12384 [19:37:06<6:40:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 0: 75%|███████▍ | 9245/12384 [19:37:06<6:39:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 0: 75%|███████▍ | 9245/12384 [19:37:13<6:39:50, 7.64s/it, loss=0.0002, acc=0.9984, iter_time=5.33s]
Epoch 0: 75%|███████▍ | 9246/12384 [19:37:13<6:39:00, 7.63s/it, loss=0.0002, acc=0.9984, iter_time=5.33s]
Epoch 0: 75%|███████▍ | 9246/12384 [19:37:21<6:39:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.84s]
Epoch 0: 75%|███████▍ | 9247/12384 [19:37:21<6:38:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.84s]
Epoch 0: 75%|███████▍ | 9247/12384 [19:37:28<6:38:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.04s]
Epoch 0: 75%|███████▍ | 9248/12384 [19:37:28<6:37:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.04s]
Epoch 0: 75%|███████▍ | 9248/12384 [19:37:36<6:37:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 75%|███████▍ | 9249/12384 [19:37:36<6:37:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 75%|███████▍ | 9249/12384 [19:37:44<6:37:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 0: 75%|███████▍ | 9250/12384 [19:37:44<6:38:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 0: 75%|███████▍ | 9250/12384 [19:37:51<6:38:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 0: 75%|███████▍ | 9251/12384 [19:37:51<6:37:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 0: 75%|███████▍ | 9251/12384 [19:37:59<6:37:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.48s]
Epoch 0: 75%|███████▍ | 9252/12384 [19:37:59<6:37:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.48s]
Epoch 0: 75%|███████▍ | 9252/12384 [19:38:06<6:37:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 75%|███████▍ | 9253/12384 [19:38:06<6:37:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 75%|███████▍ | 9253/12384 [19:38:14<6:37:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 75%|███████▍ | 9254/12384 [19:38:14<6:37:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 75%|███████▍ | 9254/12384 [19:38:22<6:37:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 75%|███████▍ | 9255/12384 [19:38:22<6:37:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 75%|███████▍ | 9255/12384 [19:38:29<6:37:16, 7.62s/it, loss=0.0002, acc=0.9999, iter_time=8.00s]
Epoch 0: 75%|███████▍ | 9256/12384 [19:38:29<6:36:59, 7.61s/it, loss=0.0002, acc=0.9999, iter_time=8.00s]
Epoch 0: 75%|███████▍ | 9256/12384 [19:38:37<6:36:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 0: 75%|███████▍ | 9257/12384 [19:38:37<6:36:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 0: 75%|███████▍ | 9257/12384 [19:38:45<6:36:50, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.21s]
Epoch 0: 75%|███████▍ | 9258/12384 [19:38:45<6:36:33, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.21s]
Epoch 0: 75%|███████▍ | 9258/12384 [19:38:52<6:36:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 0: 75%|███████▍ | 9259/12384 [19:38:52<6:36:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 0: 75%|███████▍ | 9259/12384 [19:39:00<6:36:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 75%|███████▍ | 9260/12384 [19:39:00<6:35:50, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 75%|███████▍ | 9260/12384 [19:39:08<6:35:50, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 75%|███████▍ | 9261/12384 [19:39:08<6:41:26, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 75%|███████▍ | 9261/12384 [19:39:15<6:41:26, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 75%|███████▍ | 9262/12384 [19:39:15<6:40:36, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 75%|███████▍ | 9262/12384 [19:39:23<6:40:36, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.12s]
Epoch 0: 75%|███████▍ | 9263/12384 [19:39:23<6:39:07, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.12s]
Epoch 0: 75%|███████▍ | 9263/12384 [19:39:31<6:39:07, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 0: 75%|███████▍ | 9264/12384 [19:39:31<6:38:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 0: 75%|███████▍ | 9264/12384 [19:39:38<6:38:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 0: 75%|███████▍ | 9265/12384 [19:39:38<6:37:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 0: 75%|███████▍ | 9265/12384 [19:39:46<6:37:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 0: 75%|███████▍ | 9266/12384 [19:39:46<6:36:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 0: 75%|███████▍ | 9266/12384 [19:39:54<6:36:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 0: 75%|███████▍ | 9267/12384 [19:39:54<6:40:25, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 0: 75%|███████▍ | 9267/12384 [19:40:01<6:40:25, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 75%|███████▍ | 9268/12384 [19:40:01<6:39:01, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 75%|███████▍ | 9268/12384 [19:40:09<6:39:01, 7.68s/it, loss=0.0003, acc=0.9979, iter_time=6.67s]
Epoch 0: 75%|███████▍ | 9269/12384 [19:40:09<6:37:39, 7.66s/it, loss=0.0003, acc=0.9979, iter_time=6.67s]
Epoch 0: 75%|███████▍ | 9269/12384 [19:40:17<6:37:39, 7.66s/it, loss=0.0017, acc=0.9982, iter_time=8.56s]
Epoch 0: 75%|███████▍ | 9270/12384 [19:40:17<6:36:37, 7.64s/it, loss=0.0017, acc=0.9982, iter_time=8.56s]
Epoch 0: 75%|███████▍ | 9270/12384 [19:40:24<6:36:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 75%|███████▍ | 9271/12384 [19:40:24<6:37:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 75%|███████▍ | 9271/12384 [19:40:32<6:37:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 0: 75%|███████▍ | 9272/12384 [19:40:32<6:36:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 0: 75%|███████▍ | 9272/12384 [19:40:39<6:36:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.93s]
Epoch 0: 75%|███████▍ | 9273/12384 [19:40:39<6:35:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.93s]
Epoch 0: 75%|███████▍ | 9273/12384 [19:40:47<6:35:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 75%|███████▍ | 9274/12384 [19:40:47<6:35:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 75%|███████▍ | 9274/12384 [19:40:55<6:35:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 0: 75%|███████▍ | 9275/12384 [19:40:55<6:34:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 0: 75%|███████▍ | 9275/12384 [19:41:02<6:34:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 0: 75%|███████▍ | 9276/12384 [19:41:02<6:34:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 0: 75%|███████▍ | 9276/12384 [19:41:10<6:34:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 0: 75%|███████▍ | 9277/12384 [19:41:10<6:34:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 0: 75%|███████▍ | 9277/12384 [19:41:17<6:34:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 0: 75%|███████▍ | 9278/12384 [19:41:17<6:34:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 0: 75%|███████▍ | 9278/12384 [19:41:25<6:34:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 0: 75%|███████▍ | 9279/12384 [19:41:25<6:33:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 0: 75%|███████▍ | 9279/12384 [19:41:33<6:33:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.52s]
Epoch 0: 75%|███████▍ | 9280/12384 [19:41:33<6:33:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.52s]
Epoch 0: 75%|███████▍ | 9280/12384 [19:41:40<6:33:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.61s]
Epoch 0: 75%|███████▍ | 9281/12384 [19:41:40<6:33:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.61s]
Epoch 0: 75%|███████▍ | 9281/12384 [19:41:48<6:33:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 0: 75%|███████▍ | 9282/12384 [19:41:48<6:33:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 0: 75%|███████▍ | 9282/12384 [19:41:56<6:33:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.59s]
Epoch 0: 75%|███████▍ | 9283/12384 [19:41:56<6:33:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.59s]
Epoch 0: 75%|███████▍ | 9283/12384 [19:42:03<6:33:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.28s]
Epoch 0: 75%|███████▍ | 9284/12384 [19:42:03<6:33:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.28s]
Epoch 0: 75%|███████▍ | 9284/12384 [19:42:11<6:33:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 0: 75%|███████▍ | 9285/12384 [19:42:11<6:33:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 0: 75%|███████▍ | 9285/12384 [19:42:18<6:33:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 0: 75%|███████▍ | 9286/12384 [19:42:18<6:32:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 0: 75%|███████▍ | 9286/12384 [19:42:26<6:32:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 0: 75%|███████▍ | 9287/12384 [19:42:26<6:32:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 0: 75%|███████▍ | 9287/12384 [19:42:34<6:32:45, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.08s]
Epoch 0: 75%|███████▌ | 9288/12384 [19:42:34<6:37:53, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=8.08s]
Epoch 0: 75%|███████▌ | 9288/12384 [19:42:42<6:37:53, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.46s]
Epoch 0: 75%|███████▌ | 9289/12384 [19:42:42<6:35:58, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.46s]
Epoch 0: 75%|███████▌ | 9289/12384 [19:42:49<6:35:58, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 0: 75%|███████▌ | 9290/12384 [19:42:49<6:34:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 0: 75%|███████▌ | 9290/12384 [19:42:57<6:34:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 0: 75%|███████▌ | 9291/12384 [19:42:57<6:33:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 0: 75%|███████▌ | 9291/12384 [19:43:04<6:33:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 0: 75%|███████▌ | 9292/12384 [19:43:04<6:32:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 0: 75%|███████▌ | 9292/12384 [19:43:12<6:32:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 0: 75%|███████▌ | 9293/12384 [19:43:12<6:36:37, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 0: 75%|███████▌ | 9293/12384 [19:43:20<6:36:37, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 0: 75%|███████▌ | 9294/12384 [19:43:20<6:35:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 0: 75%|███████▌ | 9294/12384 [19:43:27<6:35:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 0: 75%|███████▌ | 9295/12384 [19:43:27<6:33:57, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 0: 75%|███████▌ | 9295/12384 [19:43:35<6:33:57, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 75%|███████▌ | 9296/12384 [19:43:35<6:33:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 75%|███████▌ | 9296/12384 [19:43:43<6:33:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.76s]
Epoch 0: 75%|███████▌ | 9297/12384 [19:43:43<6:32:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.76s]
Epoch 0: 75%|███████▌ | 9297/12384 [19:43:50<6:32:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 0: 75%|███████▌ | 9298/12384 [19:43:50<6:32:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 0: 75%|███████▌ | 9298/12384 [19:43:58<6:32:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.66s]
Epoch 0: 75%|███████▌ | 9299/12384 [19:43:58<6:32:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.66s]
Epoch 0: 75%|███████▌ | 9299/12384 [19:44:05<6:32:00, 7.62s/it, loss=0.0000, acc=0.9998, iter_time=8.03s]
Epoch 0: 75%|███████▌ | 9300/12384 [19:44:05<6:31:50, 7.62s/it, loss=0.0000, acc=0.9998, iter_time=8.03s]
Epoch 0: 75%|███████▌ | 9300/12384 [19:44:13<6:31:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 75%|███████▌ | 9301/12384 [19:44:13<6:31:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 75%|███████▌ | 9301/12384 [19:44:21<6:31:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 75%|███████▌ | 9302/12384 [19:44:21<6:31:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 75%|███████▌ | 9302/12384 [19:44:28<6:31:01, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 75%|███████▌ | 9303/12384 [19:44:28<6:30:43, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 75%|███████▌ | 9303/12384 [19:44:36<6:30:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 75%|███████▌ | 9304/12384 [19:44:36<6:31:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 75%|███████▌ | 9304/12384 [19:44:44<6:31:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 75%|███████▌ | 9305/12384 [19:44:44<6:30:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 75%|███████▌ | 9305/12384 [19:44:51<6:30:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 0: 75%|███████▌ | 9306/12384 [19:44:51<6:30:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 0: 75%|███████▌ | 9306/12384 [19:44:59<6:30:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 0: 75%|███████▌ | 9307/12384 [19:44:59<6:30:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 0: 75%|███████▌ | 9307/12384 [19:45:06<6:30:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 75%|███████▌ | 9308/12384 [19:45:06<6:31:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 75%|███████▌ | 9308/12384 [19:45:14<6:31:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 75%|███████▌ | 9309/12384 [19:45:14<6:31:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 75%|███████▌ | 9309/12384 [19:45:22<6:31:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 75%|███████▌ | 9310/12384 [19:45:22<6:30:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 75%|███████▌ | 9310/12384 [19:45:29<6:30:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 0: 75%|███████▌ | 9311/12384 [19:45:29<6:30:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 0: 75%|███████▌ | 9311/12384 [19:45:37<6:30:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 0: 75%|███████▌ | 9312/12384 [19:45:37<6:30:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 0: 75%|███████▌ | 9312/12384 [19:45:44<6:30:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 75%|███████▌ | 9313/12384 [19:45:44<6:29:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 75%|███████▌ | 9313/12384 [19:45:52<6:29:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.13s]
Epoch 0: 75%|███████▌ | 9314/12384 [19:45:52<6:34:31, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.13s]
Epoch 0: 75%|███████▌ | 9314/12384 [19:46:00<6:34:31, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 0: 75%|███████▌ | 9315/12384 [19:46:00<6:33:09, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 0: 75%|███████▌ | 9315/12384 [19:46:08<6:33:09, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 75%|███████▌ | 9316/12384 [19:46:08<6:31:37, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 75%|███████▌ | 9316/12384 [19:46:15<6:31:37, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.06s]
Epoch 0: 75%|███████▌ | 9317/12384 [19:46:15<6:30:53, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.06s]
Epoch 0: 75%|███████▌ | 9317/12384 [19:46:23<6:30:53, 7.65s/it, loss=0.0038, acc=0.9963, iter_time=4.63s]
Epoch 0: 75%|███████▌ | 9318/12384 [19:46:23<6:30:21, 7.64s/it, loss=0.0038, acc=0.9963, iter_time=4.63s]
Epoch 0: 75%|███████▌ | 9318/12384 [19:46:31<6:30:21, 7.64s/it, loss=0.0002, acc=0.9992, iter_time=11.13s]
Epoch 0: 75%|███████▌ | 9319/12384 [19:46:31<6:29:56, 7.63s/it, loss=0.0002, acc=0.9992, iter_time=11.13s]
Epoch 0: 75%|███████▌ | 9319/12384 [19:46:38<6:29:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 0: 75%|███████▌ | 9320/12384 [19:46:38<6:33:58, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 0: 75%|███████▌ | 9320/12384 [19:46:46<6:33:58, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 75%|███████▌ | 9321/12384 [19:46:46<6:32:21, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 75%|███████▌ | 9321/12384 [19:46:54<6:32:21, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 75%|███████▌ | 9322/12384 [19:46:54<6:31:01, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 75%|███████▌ | 9322/12384 [19:47:01<6:31:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 0: 75%|███████▌ | 9323/12384 [19:47:01<6:30:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 0: 75%|███████▌ | 9323/12384 [19:47:09<6:30:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.85s]
Epoch 0: 75%|███████▌ | 9324/12384 [19:47:09<6:29:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.85s]
Epoch 0: 75%|███████▌ | 9324/12384 [19:47:16<6:29:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 75%|███████▌ | 9325/12384 [19:47:16<6:29:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 75%|███████▌ | 9325/12384 [19:47:24<6:29:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 75%|███████▌ | 9326/12384 [19:47:24<6:28:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 75%|███████▌ | 9326/12384 [19:47:32<6:28:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 75%|███████▌ | 9327/12384 [19:47:32<6:28:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 75%|███████▌ | 9327/12384 [19:47:39<6:28:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 75%|███████▌ | 9328/12384 [19:47:39<6:27:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 75%|███████▌ | 9328/12384 [19:47:47<6:27:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 75%|███████▌ | 9329/12384 [19:47:47<6:27:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 75%|███████▌ | 9329/12384 [19:47:55<6:27:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 0: 75%|███████▌ | 9330/12384 [19:47:55<6:27:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 0: 75%|███████▌ | 9330/12384 [19:48:02<6:27:55, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.45s]
Epoch 0: 75%|███████▌ | 9331/12384 [19:48:02<6:29:16, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.45s]
Epoch 0: 75%|███████▌ | 9331/12384 [19:48:10<6:29:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.44s]
Epoch 0: 75%|███████▌ | 9332/12384 [19:48:10<6:28:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.44s]
Epoch 0: 75%|███████▌ | 9332/12384 [19:48:17<6:28:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 0: 75%|███████▌ | 9333/12384 [19:48:17<6:27:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 0: 75%|███████▌ | 9333/12384 [19:48:25<6:27:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 0: 75%|███████▌ | 9334/12384 [19:48:25<6:27:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 0: 75%|███████▌ | 9334/12384 [19:48:33<6:27:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 75%|███████▌ | 9335/12384 [19:48:33<6:27:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 75%|███████▌ | 9335/12384 [19:48:40<6:27:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 75%|███████▌ | 9336/12384 [19:48:40<6:26:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 75%|███████▌ | 9336/12384 [19:48:48<6:26:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.71s]
Epoch 0: 75%|███████▌ | 9337/12384 [19:48:48<6:26:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.71s]
Epoch 0: 75%|███████▌ | 9337/12384 [19:48:56<6:26:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 0: 75%|███████▌ | 9338/12384 [19:48:56<6:26:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 0: 75%|███████▌ | 9338/12384 [19:49:03<6:26:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 75%|███████▌ | 9339/12384 [19:49:03<6:26:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 75%|███████▌ | 9339/12384 [19:49:11<6:26:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 75%|███████▌ | 9340/12384 [19:49:11<6:26:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 75%|███████▌ | 9340/12384 [19:49:19<6:26:30, 7.62s/it, loss=0.0003, acc=0.9986, iter_time=5.15s]
Epoch 0: 75%|███████▌ | 9341/12384 [19:49:19<6:31:14, 7.71s/it, loss=0.0003, acc=0.9986, iter_time=5.15s]
Epoch 0: 75%|███████▌ | 9341/12384 [19:49:26<6:31:14, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.41s]
Epoch 0: 75%|███████▌ | 9342/12384 [19:49:26<6:29:11, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.41s]
Epoch 0: 75%|███████▌ | 9342/12384 [19:49:34<6:29:11, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 75%|███████▌ | 9343/12384 [19:49:34<6:28:07, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 75%|███████▌ | 9343/12384 [19:49:42<6:28:07, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=8.00s]
Epoch 0: 75%|███████▌ | 9344/12384 [19:49:42<6:27:29, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=8.00s]
Epoch 0: 75%|███████▌ | 9344/12384 [19:49:49<6:27:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 75%|███████▌ | 9345/12384 [19:49:49<6:26:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 75%|███████▌ | 9345/12384 [19:49:57<6:26:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 75%|███████▌ | 9346/12384 [19:49:57<6:30:40, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 75%|███████▌ | 9346/12384 [19:50:05<6:30:40, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 75%|███████▌ | 9347/12384 [19:50:05<6:28:47, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 75%|███████▌ | 9347/12384 [19:50:12<6:28:47, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.20s]
Epoch 0: 75%|███████▌ | 9348/12384 [19:50:12<6:27:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.20s]
Epoch 0: 75%|███████▌ | 9348/12384 [19:50:20<6:27:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.98s]
Epoch 0: 75%|███████▌ | 9349/12384 [19:50:20<6:26:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.98s]
Epoch 0: 75%|███████▌ | 9349/12384 [19:50:27<6:26:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 76%|███████▌ | 9350/12384 [19:50:27<6:25:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 76%|███████▌ | 9350/12384 [19:50:35<6:25:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 76%|███████▌ | 9351/12384 [19:50:35<6:25:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 76%|███████▌ | 9351/12384 [19:50:43<6:25:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 76%|███████▌ | 9352/12384 [19:50:43<6:25:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 76%|███████▌ | 9352/12384 [19:50:49<6:25:16, 7.62s/it, loss=0.0007, acc=0.9994, iter_time=5.05s]
Epoch 0: 76%|███████▌ | 9353/12384 [19:50:49<6:08:42, 7.30s/it, loss=0.0007, acc=0.9994, iter_time=5.05s]
Epoch 0: 76%|███████▌ | 9353/12384 [19:50:57<6:08:42, 7.30s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 0: 76%|███████▌ | 9354/12384 [19:50:57<6:13:23, 7.39s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 0: 76%|███████▌ | 9354/12384 [19:51:04<6:13:23, 7.39s/it, loss=0.0001, acc=0.9998, iter_time=9.38s]
Epoch 0: 76%|███████▌ | 9355/12384 [19:51:04<6:16:40, 7.46s/it, loss=0.0001, acc=0.9998, iter_time=9.38s]
Epoch 0: 76%|███████▌ | 9355/12384 [19:51:12<6:16:40, 7.46s/it, loss=0.0001, acc=1.0000, iter_time=4.76s]
Epoch 0: 76%|███████▌ | 9356/12384 [19:51:12<6:18:56, 7.51s/it, loss=0.0001, acc=1.0000, iter_time=4.76s]
Epoch 0: 76%|███████▌ | 9356/12384 [19:51:20<6:18:56, 7.51s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 0: 76%|███████▌ | 9357/12384 [19:51:20<6:20:23, 7.54s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 0: 76%|███████▌ | 9357/12384 [19:51:27<6:20:23, 7.54s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 0: 76%|███████▌ | 9358/12384 [19:51:27<6:21:12, 7.56s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 0: 76%|███████▌ | 9358/12384 [19:51:35<6:21:12, 7.56s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 0: 76%|███████▌ | 9359/12384 [19:51:35<6:21:50, 7.57s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 0: 76%|███████▌ | 9359/12384 [19:51:43<6:21:50, 7.57s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 0: 76%|███████▌ | 9360/12384 [19:51:43<6:22:16, 7.58s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 0: 76%|███████▌ | 9360/12384 [19:51:50<6:22:16, 7.58s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 76%|███████▌ | 9361/12384 [19:51:50<6:22:28, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 76%|███████▌ | 9361/12384 [19:51:58<6:22:28, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 76%|███████▌ | 9362/12384 [19:51:58<6:22:46, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 76%|███████▌ | 9362/12384 [19:52:05<6:22:46, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 0: 76%|███████▌ | 9363/12384 [19:52:05<6:22:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 0: 76%|███████▌ | 9363/12384 [19:52:13<6:22:57, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.06s]
Epoch 0: 76%|███████▌ | 9364/12384 [19:52:13<6:22:30, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.06s]
Epoch 0: 76%|███████▌ | 9364/12384 [19:52:21<6:22:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 0: 76%|███████▌ | 9365/12384 [19:52:21<6:22:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 0: 76%|███████▌ | 9365/12384 [19:52:28<6:22:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.31s]
Epoch 0: 76%|███████▌ | 9366/12384 [19:52:28<6:22:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.31s]
Epoch 0: 76%|███████▌ | 9366/12384 [19:52:36<6:22:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.36s]
Epoch 0: 76%|███████▌ | 9367/12384 [19:52:36<6:27:27, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.36s]
Epoch 0: 76%|███████▌ | 9367/12384 [19:52:44<6:27:27, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.44s]
Epoch 0: 76%|███████▌ | 9368/12384 [19:52:44<6:26:08, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.44s]
Epoch 0: 76%|███████▌ | 9368/12384 [19:52:51<6:26:08, 7.68s/it, loss=0.0031, acc=0.9918, iter_time=7.64s]
Epoch 0: 76%|███████▌ | 9369/12384 [19:52:51<6:24:43, 7.66s/it, loss=0.0031, acc=0.9918, iter_time=7.64s]
Epoch 0: 76%|███████▌ | 9369/12384 [19:52:59<6:24:43, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 0: 76%|███████▌ | 9370/12384 [19:52:59<6:23:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 0: 76%|███████▌ | 9370/12384 [19:53:07<6:23:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 0: 76%|███████▌ | 9371/12384 [19:53:07<6:24:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 0: 76%|███████▌ | 9371/12384 [19:53:14<6:24:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.13s]
Epoch 0: 76%|███████▌ | 9372/12384 [19:53:14<6:23:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.13s]
Epoch 0: 76%|███████▌ | 9372/12384 [19:53:22<6:23:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 0: 76%|███████▌ | 9373/12384 [19:53:22<6:27:12, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 0: 76%|███████▌ | 9373/12384 [19:53:30<6:27:12, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 76%|███████▌ | 9374/12384 [19:53:30<6:25:29, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 76%|███████▌ | 9374/12384 [19:53:37<6:25:29, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 76%|███████▌ | 9375/12384 [19:53:37<6:24:08, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 76%|███████▌ | 9375/12384 [19:53:45<6:24:08, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 76%|███████▌ | 9376/12384 [19:53:45<6:23:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 76%|███████▌ | 9376/12384 [19:53:53<6:23:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=3.87s]
Epoch 0: 76%|███████▌ | 9377/12384 [19:53:53<6:22:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.87s]
Epoch 0: 76%|███████▌ | 9377/12384 [19:54:00<6:22:45, 7.64s/it, loss=0.0003, acc=0.9998, iter_time=10.97s]
Epoch 0: 76%|███████▌ | 9378/12384 [19:54:00<6:22:19, 7.63s/it, loss=0.0003, acc=0.9998, iter_time=10.97s]
Epoch 0: 76%|███████▌ | 9378/12384 [19:54:08<6:22:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.08s]
Epoch 0: 76%|███████▌ | 9379/12384 [19:54:08<6:21:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.08s]
Epoch 0: 76%|███████▌ | 9379/12384 [19:54:15<6:21:51, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.52s]
Epoch 0: 76%|███████▌ | 9380/12384 [19:54:15<6:21:41, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.52s]
Epoch 0: 76%|███████▌ | 9380/12384 [19:54:23<6:21:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 0: 76%|███████▌ | 9381/12384 [19:54:23<6:21:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 0: 76%|███████▌ | 9381/12384 [19:54:31<6:21:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 0: 76%|███████▌ | 9382/12384 [19:54:31<6:20:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 0: 76%|███████▌ | 9382/12384 [19:54:38<6:20:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.59s]
Epoch 0: 76%|███████▌ | 9383/12384 [19:54:38<6:20:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.59s]
Epoch 0: 76%|███████▌ | 9383/12384 [19:54:46<6:20:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.52s]
Epoch 0: 76%|███████▌ | 9384/12384 [19:54:46<6:20:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.52s]
Epoch 0: 76%|███████▌ | 9384/12384 [19:54:53<6:20:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 76%|███████▌ | 9385/12384 [19:54:53<6:20:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 76%|███████▌ | 9385/12384 [19:55:01<6:20:03, 7.60s/it, loss=0.0002, acc=0.9976, iter_time=6.08s]
Epoch 0: 76%|███████▌ | 9386/12384 [19:55:01<6:19:54, 7.60s/it, loss=0.0002, acc=0.9976, iter_time=6.08s]
Epoch 0: 76%|███████▌ | 9386/12384 [19:55:09<6:19:54, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.01s]
Epoch 0: 76%|███████▌ | 9387/12384 [19:55:09<6:21:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.01s]
Epoch 0: 76%|███████▌ | 9387/12384 [19:55:16<6:21:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.82s]
Epoch 0: 76%|███████▌ | 9388/12384 [19:55:16<6:20:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.82s]
Epoch 0: 76%|███████▌ | 9388/12384 [19:55:24<6:20:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 0: 76%|███████▌ | 9389/12384 [19:55:24<6:20:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 0: 76%|███████▌ | 9389/12384 [19:55:32<6:20:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 0: 76%|███████▌ | 9390/12384 [19:55:32<6:20:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 0: 76%|███████▌ | 9390/12384 [19:55:39<6:20:00, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=6.78s]
Epoch 0: 76%|███████▌ | 9391/12384 [19:55:39<6:19:54, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=6.78s]
Epoch 0: 76%|███████▌ | 9391/12384 [19:55:47<6:19:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.34s]
Epoch 0: 76%|███████▌ | 9392/12384 [19:55:47<6:20:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.34s]
Epoch 0: 76%|███████▌ | 9392/12384 [19:55:55<6:20:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 0: 76%|███████▌ | 9393/12384 [19:55:55<6:24:12, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 0: 76%|███████▌ | 9393/12384 [19:56:02<6:24:12, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 0: 76%|███████▌ | 9394/12384 [19:56:02<6:22:28, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 0: 76%|███████▌ | 9394/12384 [19:56:10<6:22:28, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 0: 76%|███████▌ | 9395/12384 [19:56:10<6:21:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 0: 76%|███████▌ | 9395/12384 [19:56:18<6:21:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 76%|███████▌ | 9396/12384 [19:56:18<6:20:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 76%|███████▌ | 9396/12384 [19:56:25<6:20:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 76%|███████▌ | 9397/12384 [19:56:25<6:19:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 76%|███████▌ | 9397/12384 [19:56:33<6:19:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 76%|███████▌ | 9398/12384 [19:56:33<6:19:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 76%|███████▌ | 9398/12384 [19:56:41<6:19:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 0: 76%|███████▌ | 9399/12384 [19:56:41<6:23:57, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 0: 76%|███████▌ | 9399/12384 [19:56:48<6:23:57, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 76%|███████▌ | 9400/12384 [19:56:48<6:22:07, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 76%|███████▌ | 9400/12384 [19:56:56<6:22:07, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 76%|███████▌ | 9401/12384 [19:56:56<6:21:02, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 76%|███████▌ | 9401/12384 [19:57:03<6:21:02, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 76%|███████▌ | 9402/12384 [19:57:03<6:20:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 76%|███████▌ | 9402/12384 [19:57:11<6:20:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 76%|███████▌ | 9403/12384 [19:57:11<6:19:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 76%|███████▌ | 9403/12384 [19:57:19<6:19:13, 7.63s/it, loss=0.0004, acc=0.9993, iter_time=7.60s]
Epoch 0: 76%|███████▌ | 9404/12384 [19:57:19<6:18:59, 7.63s/it, loss=0.0004, acc=0.9993, iter_time=7.60s]
Epoch 0: 76%|███████▌ | 9404/12384 [19:57:26<6:18:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 0: 76%|███████▌ | 9405/12384 [19:57:26<6:18:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 0: 76%|███████▌ | 9405/12384 [19:57:34<6:18:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 76%|███████▌ | 9406/12384 [19:57:34<6:18:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 76%|███████▌ | 9406/12384 [19:57:42<6:18:27, 7.63s/it, loss=0.0009, acc=0.9979, iter_time=8.57s]
Epoch 0: 76%|███████▌ | 9407/12384 [19:57:42<6:18:24, 7.63s/it, loss=0.0009, acc=0.9979, iter_time=8.57s]
Epoch 0: 76%|███████▌ | 9407/12384 [19:57:49<6:18:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 76%|███████▌ | 9408/12384 [19:57:49<6:17:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 76%|███████▌ | 9408/12384 [19:57:57<6:17:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.64s]
Epoch 0: 76%|███████▌ | 9409/12384 [19:57:57<6:17:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.64s]
Epoch 0: 76%|███████▌ | 9409/12384 [19:58:04<6:17:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.61s]
Epoch 0: 76%|███████▌ | 9410/12384 [19:58:04<6:17:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.61s]
Epoch 0: 76%|███████▌ | 9410/12384 [19:58:12<6:17:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 76%|███████▌ | 9411/12384 [19:58:12<6:17:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 76%|███████▌ | 9411/12384 [19:58:20<6:17:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 76%|███████▌ | 9412/12384 [19:58:20<6:17:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 76%|███████▌ | 9412/12384 [19:58:27<6:17:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 76%|███████▌ | 9413/12384 [19:58:27<6:17:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 76%|███████▌ | 9413/12384 [19:58:35<6:17:16, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 76%|███████▌ | 9414/12384 [19:58:35<6:18:36, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 76%|███████▌ | 9414/12384 [19:58:43<6:18:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 0: 76%|███████▌ | 9415/12384 [19:58:43<6:18:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 0: 76%|███████▌ | 9415/12384 [19:58:50<6:18:05, 7.64s/it, loss=0.0011, acc=0.9981, iter_time=9.82s]
Epoch 0: 76%|███████▌ | 9416/12384 [19:58:50<6:18:34, 7.65s/it, loss=0.0011, acc=0.9981, iter_time=9.82s]
Epoch 0: 76%|███████▌ | 9416/12384 [19:58:58<6:18:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 0: 76%|███████▌ | 9417/12384 [19:58:58<6:17:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 0: 76%|███████▌ | 9417/12384 [19:59:06<6:17:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 0: 76%|███████▌ | 9418/12384 [19:59:06<6:18:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 0: 76%|███████▌ | 9418/12384 [19:59:14<6:18:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 0: 76%|███████▌ | 9419/12384 [19:59:14<6:22:48, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 0: 76%|███████▌ | 9419/12384 [19:59:21<6:22:48, 7.75s/it, loss=0.0004, acc=0.9973, iter_time=10.21s]
Epoch 0: 76%|███████▌ | 9420/12384 [19:59:21<6:20:23, 7.70s/it, loss=0.0004, acc=0.9973, iter_time=10.21s]
Epoch 0: 76%|███████▌ | 9420/12384 [19:59:29<6:20:23, 7.70s/it, loss=0.0008, acc=0.9980, iter_time=6.42s]
Epoch 0: 76%|███████▌ | 9421/12384 [19:59:29<6:19:12, 7.68s/it, loss=0.0008, acc=0.9980, iter_time=6.42s]
Epoch 0: 76%|███████▌ | 9421/12384 [19:59:36<6:19:12, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 0: 76%|███████▌ | 9422/12384 [19:59:36<6:17:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 0: 76%|███████▌ | 9422/12384 [19:59:44<6:17:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 76%|███████▌ | 9423/12384 [19:59:44<6:16:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 76%|███████▌ | 9423/12384 [19:59:52<6:16:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 76%|███████▌ | 9424/12384 [19:59:52<6:16:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 76%|███████▌ | 9424/12384 [19:59:59<6:16:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.48s]
Epoch 0: 76%|███████▌ | 9425/12384 [19:59:59<6:19:40, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.48s]
Epoch 0: 76%|███████▌ | 9425/12384 [20:00:07<6:19:40, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 76%|███████▌ | 9426/12384 [20:00:07<6:18:14, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 76%|███████▌ | 9426/12384 [20:00:15<6:18:14, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 76%|███████▌ | 9427/12384 [20:00:15<6:17:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 76%|███████▌ | 9427/12384 [20:00:22<6:17:02, 7.65s/it, loss=0.0005, acc=0.9972, iter_time=7.60s]
Epoch 0: 76%|███████▌ | 9428/12384 [20:00:22<6:16:03, 7.63s/it, loss=0.0005, acc=0.9972, iter_time=7.60s]
Epoch 0: 76%|███████▌ | 9428/12384 [20:00:30<6:16:03, 7.63s/it, loss=0.0002, acc=0.9999, iter_time=7.63s]
Epoch 0: 76%|███████▌ | 9429/12384 [20:00:30<6:15:40, 7.63s/it, loss=0.0002, acc=0.9999, iter_time=7.63s]
Epoch 0: 76%|███████▌ | 9429/12384 [20:00:37<6:15:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 0: 76%|███████▌ | 9430/12384 [20:00:37<6:15:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 0: 76%|███████▌ | 9430/12384 [20:00:45<6:15:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.94s]
Epoch 0: 76%|███████▌ | 9431/12384 [20:00:45<6:14:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.94s]
Epoch 0: 76%|███████▌ | 9431/12384 [20:00:53<6:14:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.92s]
Epoch 0: 76%|███████▌ | 9432/12384 [20:00:53<6:14:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.92s]
Epoch 0: 76%|███████▌ | 9432/12384 [20:01:00<6:14:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 76%|███████▌ | 9433/12384 [20:01:00<6:14:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 76%|███████▌ | 9433/12384 [20:01:08<6:14:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 76%|███████▌ | 9434/12384 [20:01:08<6:14:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 76%|███████▌ | 9434/12384 [20:01:16<6:14:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 76%|███████▌ | 9435/12384 [20:01:16<6:14:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 76%|███████▌ | 9435/12384 [20:01:23<6:14:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.46s]
Epoch 0: 76%|███████▌ | 9436/12384 [20:01:23<6:13:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.46s]
Epoch 0: 76%|███████▌ | 9436/12384 [20:01:31<6:13:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 0: 76%|███████▌ | 9437/12384 [20:01:31<6:14:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 0: 76%|███████▌ | 9437/12384 [20:01:38<6:14:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 76%|███████▌ | 9438/12384 [20:01:38<6:13:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 76%|███████▌ | 9438/12384 [20:01:46<6:13:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 76%|███████▌ | 9439/12384 [20:01:46<6:13:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 76%|███████▌ | 9439/12384 [20:01:54<6:13:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 76%|███████▌ | 9440/12384 [20:01:54<6:13:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 76%|███████▌ | 9440/12384 [20:02:01<6:13:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 76%|███████▌ | 9441/12384 [20:02:01<6:13:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 76%|███████▌ | 9441/12384 [20:02:09<6:13:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.63s]
Epoch 0: 76%|███████▌ | 9442/12384 [20:02:09<6:13:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.63s]
Epoch 0: 76%|███████▌ | 9442/12384 [20:02:16<6:13:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.61s]
Epoch 0: 76%|███████▋ | 9443/12384 [20:02:16<6:13:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.61s]
Epoch 0: 76%|███████▋ | 9443/12384 [20:02:24<6:13:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 0: 76%|███████▋ | 9444/12384 [20:02:24<6:13:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 0: 76%|███████▋ | 9444/12384 [20:02:32<6:13:10, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.46s]
Epoch 0: 76%|███████▋ | 9445/12384 [20:02:32<6:18:00, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=8.46s]
Epoch 0: 76%|███████▋ | 9445/12384 [20:02:40<6:18:00, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 0: 76%|███████▋ | 9446/12384 [20:02:40<6:16:02, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 0: 76%|███████▋ | 9446/12384 [20:02:47<6:16:02, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 0: 76%|███████▋ | 9447/12384 [20:02:47<6:14:52, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 0: 76%|███████▋ | 9447/12384 [20:02:55<6:14:52, 7.66s/it, loss=0.0001, acc=0.9993, iter_time=7.57s]
Epoch 0: 76%|███████▋ | 9448/12384 [20:02:55<6:14:06, 7.65s/it, loss=0.0001, acc=0.9993, iter_time=7.57s]
Epoch 0: 76%|███████▋ | 9448/12384 [20:03:02<6:14:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 76%|███████▋ | 9449/12384 [20:03:02<6:13:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 76%|███████▋ | 9449/12384 [20:03:10<6:13:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 76%|███████▋ | 9450/12384 [20:03:10<6:12:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 76%|███████▋ | 9450/12384 [20:03:18<6:12:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.49s]
Epoch 0: 76%|███████▋ | 9451/12384 [20:03:18<6:16:21, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.49s]
Epoch 0: 76%|███████▋ | 9451/12384 [20:03:26<6:16:21, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.70s]
Epoch 0: 76%|███████▋ | 9452/12384 [20:03:26<6:16:14, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.70s]
Epoch 0: 76%|███████▋ | 9452/12384 [20:03:33<6:16:14, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 0: 76%|███████▋ | 9453/12384 [20:03:33<6:14:47, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 0: 76%|███████▋ | 9453/12384 [20:03:41<6:14:47, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 0: 76%|███████▋ | 9454/12384 [20:03:41<6:13:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 0: 76%|███████▋ | 9454/12384 [20:03:48<6:13:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 0: 76%|███████▋ | 9455/12384 [20:03:48<6:12:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 0: 76%|███████▋ | 9455/12384 [20:03:56<6:12:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 0: 76%|███████▋ | 9456/12384 [20:03:56<6:12:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 0: 76%|███████▋ | 9456/12384 [20:04:04<6:12:04, 7.62s/it, loss=0.0003, acc=0.9979, iter_time=6.63s]
Epoch 0: 76%|███████▋ | 9457/12384 [20:04:04<6:11:51, 7.62s/it, loss=0.0003, acc=0.9979, iter_time=6.63s]
Epoch 0: 76%|███████▋ | 9457/12384 [20:04:11<6:11:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 0: 76%|███████▋ | 9458/12384 [20:04:11<6:11:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 0: 76%|███████▋ | 9458/12384 [20:04:19<6:11:15, 7.61s/it, loss=0.0002, acc=0.9990, iter_time=9.90s]
Epoch 0: 76%|███████▋ | 9459/12384 [20:04:19<6:11:21, 7.62s/it, loss=0.0002, acc=0.9990, iter_time=9.90s]
Epoch 0: 76%|███████▋ | 9459/12384 [20:04:26<6:11:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 0: 76%|███████▋ | 9460/12384 [20:04:26<6:11:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 0: 76%|███████▋ | 9460/12384 [20:04:34<6:11:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 76%|███████▋ | 9461/12384 [20:04:34<6:10:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 76%|███████▋ | 9461/12384 [20:04:42<6:10:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 76%|███████▋ | 9462/12384 [20:04:42<6:10:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 76%|███████▋ | 9462/12384 [20:04:49<6:10:53, 7.62s/it, loss=0.0005, acc=0.9977, iter_time=7.63s]
Epoch 0: 76%|███████▋ | 9463/12384 [20:04:49<6:12:11, 7.65s/it, loss=0.0005, acc=0.9977, iter_time=7.63s]
Epoch 0: 76%|███████▋ | 9463/12384 [20:04:57<6:12:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 76%|███████▋ | 9464/12384 [20:04:57<6:11:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 76%|███████▋ | 9464/12384 [20:05:05<6:11:37, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 0: 76%|███████▋ | 9465/12384 [20:05:05<6:11:07, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 0: 76%|███████▋ | 9465/12384 [20:05:12<6:11:07, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.71s]
Epoch 0: 76%|███████▋ | 9466/12384 [20:05:12<6:11:54, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.71s]
Epoch 0: 76%|███████▋ | 9466/12384 [20:05:20<6:11:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 76%|███████▋ | 9467/12384 [20:05:20<6:11:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 76%|███████▋ | 9467/12384 [20:05:28<6:11:31, 7.64s/it, loss=0.0007, acc=0.9982, iter_time=7.63s]
Epoch 0: 76%|███████▋ | 9468/12384 [20:05:28<6:10:39, 7.63s/it, loss=0.0007, acc=0.9982, iter_time=7.63s]
Epoch 0: 76%|███████▋ | 9468/12384 [20:05:35<6:10:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 0: 76%|███████▋ | 9469/12384 [20:05:35<6:10:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 0: 76%|███████▋ | 9469/12384 [20:05:43<6:10:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 0: 76%|███████▋ | 9470/12384 [20:05:43<6:10:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 0: 76%|███████▋ | 9470/12384 [20:05:50<6:10:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 76%|███████▋ | 9471/12384 [20:05:50<6:09:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 76%|███████▋ | 9471/12384 [20:05:58<6:09:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 0: 76%|███████▋ | 9472/12384 [20:05:58<6:14:55, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 0: 76%|███████▋ | 9472/12384 [20:06:06<6:14:55, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 0: 76%|███████▋ | 9473/12384 [20:06:06<6:13:10, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 0: 76%|███████▋ | 9473/12384 [20:06:14<6:13:10, 7.69s/it, loss=0.0001, acc=0.9997, iter_time=8.48s]
Epoch 0: 77%|███████▋ | 9474/12384 [20:06:14<6:11:50, 7.67s/it, loss=0.0001, acc=0.9997, iter_time=8.48s]
Epoch 0: 77%|███████▋ | 9474/12384 [20:06:21<6:11:50, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 77%|███████▋ | 9475/12384 [20:06:21<6:10:37, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 77%|███████▋ | 9475/12384 [20:06:29<6:10:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 0: 77%|███████▋ | 9476/12384 [20:06:29<6:09:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 0: 77%|███████▋ | 9476/12384 [20:06:36<6:09:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 0: 77%|███████▋ | 9477/12384 [20:06:36<6:09:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 0: 77%|███████▋ | 9477/12384 [20:06:44<6:09:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 77%|███████▋ | 9478/12384 [20:06:44<6:09:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 77%|███████▋ | 9478/12384 [20:06:52<6:09:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 77%|███████▋ | 9479/12384 [20:06:52<6:09:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 77%|███████▋ | 9479/12384 [20:06:59<6:09:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 77%|███████▋ | 9480/12384 [20:06:59<6:08:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 77%|███████▋ | 9480/12384 [20:07:07<6:08:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 77%|███████▋ | 9481/12384 [20:07:07<6:08:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 77%|███████▋ | 9481/12384 [20:07:14<6:08:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 77%|███████▋ | 9482/12384 [20:07:14<6:08:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 77%|███████▋ | 9482/12384 [20:07:22<6:08:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 0: 77%|███████▋ | 9483/12384 [20:07:22<6:08:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 0: 77%|███████▋ | 9483/12384 [20:07:30<6:08:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 0: 77%|███████▋ | 9484/12384 [20:07:30<6:07:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 0: 77%|███████▋ | 9484/12384 [20:07:37<6:07:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 0: 77%|███████▋ | 9485/12384 [20:07:37<6:07:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 0: 77%|███████▋ | 9485/12384 [20:07:45<6:07:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.14s]
Epoch 0: 77%|███████▋ | 9486/12384 [20:07:45<6:07:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.14s]
Epoch 0: 77%|███████▋ | 9486/12384 [20:07:53<6:07:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 77%|███████▋ | 9487/12384 [20:07:53<6:07:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 77%|███████▋ | 9487/12384 [20:08:00<6:07:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 77%|███████▋ | 9488/12384 [20:08:00<6:07:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 77%|███████▋ | 9488/12384 [20:08:08<6:07:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.48s]
Epoch 0: 77%|███████▋ | 9489/12384 [20:08:08<6:07:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.48s]
Epoch 0: 77%|███████▋ | 9489/12384 [20:08:15<6:07:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 0: 77%|███████▋ | 9490/12384 [20:08:15<6:06:31, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 0: 77%|███████▋ | 9490/12384 [20:08:23<6:06:31, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 0: 77%|███████▋ | 9491/12384 [20:08:23<6:06:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 0: 77%|███████▋ | 9491/12384 [20:08:31<6:06:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 0: 77%|███████▋ | 9492/12384 [20:08:31<6:06:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 0: 77%|███████▋ | 9492/12384 [20:08:38<6:06:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 77%|███████▋ | 9493/12384 [20:08:38<6:06:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 77%|███████▋ | 9493/12384 [20:08:46<6:06:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 77%|███████▋ | 9494/12384 [20:08:46<6:06:10, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 77%|███████▋ | 9494/12384 [20:08:53<6:06:10, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 77%|███████▋ | 9495/12384 [20:08:53<6:06:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 77%|███████▋ | 9495/12384 [20:09:01<6:06:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 77%|███████▋ | 9496/12384 [20:09:01<6:06:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 77%|███████▋ | 9496/12384 [20:09:09<6:06:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 77%|███████▋ | 9497/12384 [20:09:09<6:06:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 77%|███████▋ | 9497/12384 [20:09:17<6:06:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 77%|███████▋ | 9498/12384 [20:09:17<6:10:51, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 77%|███████▋ | 9498/12384 [20:09:24<6:10:51, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 0: 77%|███████▋ | 9499/12384 [20:09:24<6:09:19, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 0: 77%|███████▋ | 9499/12384 [20:09:32<6:09:19, 7.68s/it, loss=0.0003, acc=0.9998, iter_time=8.61s]
Epoch 0: 77%|███████▋ | 9500/12384 [20:09:32<6:11:47, 7.73s/it, loss=0.0003, acc=0.9998, iter_time=8.61s]
Epoch 0: 77%|███████▋ | 9500/12384 [20:09:40<6:11:47, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.43s]
Epoch 0: 77%|███████▋ | 9501/12384 [20:09:40<6:10:46, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.43s]
Epoch 0: 77%|███████▋ | 9501/12384 [20:09:47<6:10:46, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 77%|███████▋ | 9502/12384 [20:09:47<6:08:49, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 77%|███████▋ | 9502/12384 [20:09:55<6:08:49, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 77%|███████▋ | 9503/12384 [20:09:55<6:07:45, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 77%|███████▋ | 9503/12384 [20:10:03<6:07:45, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.34s]
Epoch 0: 77%|███████▋ | 9504/12384 [20:10:03<6:11:31, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.34s]
Epoch 0: 77%|███████▋ | 9504/12384 [20:10:10<6:11:31, 7.74s/it, loss=0.0001, acc=1.0000, iter_time=5.99s]
Epoch 0: 77%|███████▋ | 9505/12384 [20:10:10<6:09:57, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=5.99s]
Epoch 0: 77%|███████▋ | 9505/12384 [20:10:18<6:09:57, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.30s]
Epoch 0: 77%|███████▋ | 9506/12384 [20:10:18<6:08:15, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.30s]
Epoch 0: 77%|███████▋ | 9506/12384 [20:10:26<6:08:15, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 0: 77%|███████▋ | 9507/12384 [20:10:26<6:07:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 0: 77%|███████▋ | 9507/12384 [20:10:33<6:07:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 77%|███████▋ | 9508/12384 [20:10:33<6:07:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 77%|███████▋ | 9508/12384 [20:10:41<6:07:16, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 77%|███████▋ | 9509/12384 [20:10:41<6:06:25, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 77%|███████▋ | 9509/12384 [20:10:49<6:06:25, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 77%|███████▋ | 9510/12384 [20:10:49<6:05:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 77%|███████▋ | 9510/12384 [20:10:56<6:05:46, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 77%|███████▋ | 9511/12384 [20:10:56<6:05:17, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 77%|███████▋ | 9511/12384 [20:11:04<6:05:17, 7.63s/it, loss=0.0004, acc=0.9999, iter_time=8.00s]
Epoch 0: 77%|███████▋ | 9512/12384 [20:11:04<6:04:48, 7.62s/it, loss=0.0004, acc=0.9999, iter_time=8.00s]
Epoch 0: 77%|███████▋ | 9512/12384 [20:11:11<6:04:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.75s]
Epoch 0: 77%|███████▋ | 9513/12384 [20:11:11<6:04:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.75s]
Epoch 0: 77%|███████▋ | 9513/12384 [20:11:19<6:04:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 0: 77%|███████▋ | 9514/12384 [20:11:19<6:05:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 0: 77%|███████▋ | 9514/12384 [20:11:27<6:05:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 0: 77%|███████▋ | 9515/12384 [20:11:27<6:05:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 0: 77%|███████▋ | 9515/12384 [20:11:34<6:05:11, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=9.11s]
Epoch 0: 77%|███████▋ | 9516/12384 [20:11:34<6:04:36, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.11s]
Epoch 0: 77%|███████▋ | 9516/12384 [20:11:42<6:04:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 77%|███████▋ | 9517/12384 [20:11:42<6:04:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 77%|███████▋ | 9517/12384 [20:11:50<6:04:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 77%|███████▋ | 9518/12384 [20:11:50<6:04:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 77%|███████▋ | 9518/12384 [20:11:57<6:04:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 77%|███████▋ | 9519/12384 [20:11:57<6:03:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 77%|███████▋ | 9519/12384 [20:12:05<6:03:54, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.01s]
Epoch 0: 77%|███████▋ | 9520/12384 [20:12:05<6:03:34, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.01s]
Epoch 0: 77%|███████▋ | 9520/12384 [20:12:12<6:03:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.40s]
Epoch 0: 77%|███████▋ | 9521/12384 [20:12:12<6:03:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.40s]
Epoch 0: 77%|███████▋ | 9521/12384 [20:12:20<6:03:21, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.97s]
Epoch 0: 77%|███████▋ | 9522/12384 [20:12:20<6:03:17, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.97s]
Epoch 0: 77%|███████▋ | 9522/12384 [20:12:28<6:03:17, 7.62s/it, loss=0.0001, acc=0.9985, iter_time=8.51s]
Epoch 0: 77%|███████▋ | 9523/12384 [20:12:28<6:03:14, 7.62s/it, loss=0.0001, acc=0.9985, iter_time=8.51s]
Epoch 0: 77%|███████▋ | 9523/12384 [20:12:35<6:03:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.66s]
Epoch 0: 77%|███████▋ | 9524/12384 [20:12:35<6:02:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.66s]
Epoch 0: 77%|███████▋ | 9524/12384 [20:12:43<6:02:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.39s]
Epoch 0: 77%|███████▋ | 9525/12384 [20:12:43<6:06:36, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.39s]
Epoch 0: 77%|███████▋ | 9525/12384 [20:12:51<6:06:36, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.71s]
Epoch 0: 77%|███████▋ | 9526/12384 [20:12:51<6:06:27, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.71s]
Epoch 0: 77%|███████▋ | 9526/12384 [20:12:58<6:06:27, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 77%|███████▋ | 9527/12384 [20:12:58<6:05:18, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 77%|███████▋ | 9527/12384 [20:13:06<6:05:18, 7.67s/it, loss=0.0009, acc=0.9987, iter_time=8.34s]
Epoch 0: 77%|███████▋ | 9528/12384 [20:13:06<6:04:28, 7.66s/it, loss=0.0009, acc=0.9987, iter_time=8.34s]
Epoch 0: 77%|███████▋ | 9528/12384 [20:13:14<6:04:28, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.89s]
Epoch 0: 77%|███████▋ | 9529/12384 [20:13:14<6:03:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.89s]
Epoch 0: 77%|███████▋ | 9529/12384 [20:13:22<6:03:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.26s]
Epoch 0: 77%|███████▋ | 9530/12384 [20:13:22<6:07:22, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.26s]
Epoch 0: 77%|███████▋ | 9530/12384 [20:13:29<6:07:22, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 77%|███████▋ | 9531/12384 [20:13:29<6:05:27, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 77%|███████▋ | 9531/12384 [20:13:37<6:05:27, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 77%|███████▋ | 9532/12384 [20:13:37<6:04:24, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 77%|███████▋ | 9532/12384 [20:13:44<6:04:24, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 77%|███████▋ | 9533/12384 [20:13:44<6:03:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 77%|███████▋ | 9533/12384 [20:13:52<6:03:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 77%|███████▋ | 9534/12384 [20:13:52<6:02:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 77%|███████▋ | 9534/12384 [20:14:00<6:02:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 77%|███████▋ | 9535/12384 [20:14:00<6:02:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 77%|███████▋ | 9535/12384 [20:14:07<6:02:02, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 0: 77%|███████▋ | 9536/12384 [20:14:07<6:01:53, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 0: 77%|███████▋ | 9536/12384 [20:14:15<6:01:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 77%|███████▋ | 9537/12384 [20:14:15<6:01:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 77%|███████▋ | 9537/12384 [20:14:22<6:01:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 77%|███████▋ | 9538/12384 [20:14:22<6:01:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 77%|███████▋ | 9538/12384 [20:14:30<6:01:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 77%|███████▋ | 9539/12384 [20:14:30<6:01:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 77%|███████▋ | 9539/12384 [20:14:38<6:01:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 0: 77%|███████▋ | 9540/12384 [20:14:38<6:00:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 0: 77%|███████▋ | 9540/12384 [20:14:45<6:00:43, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.06s]
Epoch 0: 77%|███████▋ | 9541/12384 [20:14:45<6:00:30, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.06s]
Epoch 0: 77%|███████▋ | 9541/12384 [20:14:53<6:00:30, 7.61s/it, loss=0.0010, acc=0.9948, iter_time=7.60s]
Epoch 0: 77%|███████▋ | 9542/12384 [20:14:53<6:00:18, 7.61s/it, loss=0.0010, acc=0.9948, iter_time=7.60s]
Epoch 0: 77%|███████▋ | 9542/12384 [20:15:00<6:00:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 77%|███████▋ | 9543/12384 [20:15:00<6:00:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 77%|███████▋ | 9543/12384 [20:15:08<6:00:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 0: 77%|███████▋ | 9544/12384 [20:15:08<5:59:57, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 0: 77%|███████▋ | 9544/12384 [20:15:16<5:59:57, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 77%|███████▋ | 9545/12384 [20:15:16<5:59:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 77%|███████▋ | 9545/12384 [20:15:23<5:59:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 0: 77%|███████▋ | 9546/12384 [20:15:23<6:00:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 0: 77%|███████▋ | 9546/12384 [20:15:31<6:00:00, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.37s]
Epoch 0: 77%|███████▋ | 9547/12384 [20:15:31<5:59:52, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.37s]
Epoch 0: 77%|███████▋ | 9547/12384 [20:15:39<5:59:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 0: 77%|███████▋ | 9548/12384 [20:15:39<5:59:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 0: 77%|███████▋ | 9548/12384 [20:15:46<5:59:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 77%|███████▋ | 9549/12384 [20:15:46<5:59:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 77%|███████▋ | 9549/12384 [20:15:54<5:59:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.82s]
Epoch 0: 77%|███████▋ | 9550/12384 [20:15:54<5:59:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.82s]
Epoch 0: 77%|███████▋ | 9550/12384 [20:16:02<5:59:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 0: 77%|███████▋ | 9551/12384 [20:16:02<6:04:13, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 0: 77%|███████▋ | 9551/12384 [20:16:09<6:04:13, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 0: 77%|███████▋ | 9552/12384 [20:16:09<6:02:49, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 0: 77%|███████▋ | 9552/12384 [20:16:17<6:02:49, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 77%|███████▋ | 9553/12384 [20:16:17<6:01:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 77%|███████▋ | 9553/12384 [20:16:25<6:01:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 77%|███████▋ | 9554/12384 [20:16:25<6:00:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 77%|███████▋ | 9554/12384 [20:16:32<6:00:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 77%|███████▋ | 9555/12384 [20:16:32<5:59:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 77%|███████▋ | 9555/12384 [20:16:40<5:59:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 0: 77%|███████▋ | 9556/12384 [20:16:40<5:59:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 0: 77%|███████▋ | 9556/12384 [20:16:47<5:59:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 0: 77%|███████▋ | 9557/12384 [20:16:47<5:59:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 0: 77%|███████▋ | 9557/12384 [20:16:55<5:59:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 77%|███████▋ | 9558/12384 [20:16:55<5:58:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 77%|███████▋ | 9558/12384 [20:17:03<5:58:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 77%|███████▋ | 9559/12384 [20:17:03<5:58:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 77%|███████▋ | 9559/12384 [20:17:10<5:58:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 77%|███████▋ | 9560/12384 [20:17:10<5:58:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 77%|███████▋ | 9560/12384 [20:17:18<5:58:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 77%|███████▋ | 9561/12384 [20:17:18<5:58:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 77%|███████▋ | 9561/12384 [20:17:25<5:58:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.20s]
Epoch 0: 77%|███████▋ | 9562/12384 [20:17:25<5:58:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.20s]
Epoch 0: 77%|███████▋ | 9562/12384 [20:17:33<5:58:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.39s]
Epoch 0: 77%|███████▋ | 9563/12384 [20:17:33<5:57:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.39s]
Epoch 0: 77%|███████▋ | 9563/12384 [20:17:41<5:57:58, 7.61s/it, loss=0.0001, acc=0.9985, iter_time=8.23s]
Epoch 0: 77%|███████▋ | 9564/12384 [20:17:41<5:57:28, 7.61s/it, loss=0.0001, acc=0.9985, iter_time=8.23s]
Epoch 0: 77%|███████▋ | 9564/12384 [20:17:48<5:57:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 0: 77%|███████▋ | 9565/12384 [20:17:48<5:58:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 0: 77%|███████▋ | 9565/12384 [20:17:56<5:58:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.96s]
Epoch 0: 77%|███████▋ | 9566/12384 [20:17:56<5:57:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.96s]
Epoch 0: 77%|███████▋ | 9566/12384 [20:18:04<5:57:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 0: 77%|███████▋ | 9567/12384 [20:18:04<5:57:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 0: 77%|███████▋ | 9567/12384 [20:18:11<5:57:23, 7.61s/it, loss=0.0003, acc=0.9983, iter_time=8.00s]
Epoch 0: 77%|███████▋ | 9568/12384 [20:18:11<5:57:04, 7.61s/it, loss=0.0003, acc=0.9983, iter_time=8.00s]
Epoch 0: 77%|███████▋ | 9568/12384 [20:18:19<5:57:04, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.20s]
Epoch 0: 77%|███████▋ | 9569/12384 [20:18:19<5:56:55, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.20s]
Epoch 0: 77%|███████▋ | 9569/12384 [20:18:26<5:56:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 77%|███████▋ | 9570/12384 [20:18:26<5:56:32, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 77%|███████▋ | 9570/12384 [20:18:34<5:56:32, 7.60s/it, loss=0.0001, acc=0.9992, iter_time=7.59s]
Epoch 0: 77%|███████▋ | 9571/12384 [20:18:34<5:56:38, 7.61s/it, loss=0.0001, acc=0.9992, iter_time=7.59s]
Epoch 0: 77%|███████▋ | 9571/12384 [20:18:42<5:56:38, 7.61s/it, loss=0.0001, acc=0.9996, iter_time=7.63s]
Epoch 0: 77%|███████▋ | 9572/12384 [20:18:42<5:56:33, 7.61s/it, loss=0.0001, acc=0.9996, iter_time=7.63s]
Epoch 0: 77%|███████▋ | 9572/12384 [20:18:49<5:56:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 0: 77%|███████▋ | 9573/12384 [20:18:49<5:56:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 0: 77%|███████▋ | 9573/12384 [20:18:57<5:56:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 0: 77%|███████▋ | 9574/12384 [20:18:57<5:56:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 0: 77%|███████▋ | 9574/12384 [20:19:04<5:56:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.43s]
Epoch 0: 77%|███████▋ | 9575/12384 [20:19:04<5:56:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.43s]
Epoch 0: 77%|███████▋ | 9575/12384 [20:19:12<5:56:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 77%|███████▋ | 9576/12384 [20:19:12<5:56:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 77%|███████▋ | 9576/12384 [20:19:20<5:56:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.35s]
Epoch 0: 77%|███████▋ | 9577/12384 [20:19:20<6:01:18, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.35s]
Epoch 0: 77%|███████▋ | 9577/12384 [20:19:28<6:01:18, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.87s]
Epoch 0: 77%|███████▋ | 9578/12384 [20:19:28<5:59:52, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.87s]
Epoch 0: 77%|███████▋ | 9578/12384 [20:19:35<5:59:52, 7.70s/it, loss=0.0003, acc=1.0000, iter_time=5.10s]
Epoch 0: 77%|███████▋ | 9579/12384 [20:19:35<5:59:24, 7.69s/it, loss=0.0003, acc=1.0000, iter_time=5.10s]
Epoch 0: 77%|███████▋ | 9579/12384 [20:19:43<5:59:24, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 0: 77%|███████▋ | 9580/12384 [20:19:43<5:57:53, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 0: 77%|███████▋ | 9580/12384 [20:19:50<5:57:53, 7.66s/it, loss=0.0001, acc=0.9996, iter_time=7.60s]
Epoch 0: 77%|███████▋ | 9581/12384 [20:19:50<5:56:55, 7.64s/it, loss=0.0001, acc=0.9996, iter_time=7.60s]
Epoch 0: 77%|███████▋ | 9581/12384 [20:19:58<5:56:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 77%|███████▋ | 9582/12384 [20:19:58<5:56:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 77%|███████▋ | 9582/12384 [20:20:06<5:56:29, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.92s]
Epoch 0: 77%|███████▋ | 9583/12384 [20:20:06<6:00:02, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.92s]
Epoch 0: 77%|███████▋ | 9583/12384 [20:20:14<6:00:02, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 77%|███████▋ | 9584/12384 [20:20:14<5:58:45, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 77%|███████▋ | 9584/12384 [20:20:21<5:58:45, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.92s]
Epoch 0: 77%|███████▋ | 9585/12384 [20:20:21<5:57:36, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.92s]
Epoch 0: 77%|███████▋ | 9585/12384 [20:20:29<5:57:36, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 0: 77%|███████▋ | 9586/12384 [20:20:29<5:56:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 0: 77%|███████▋ | 9586/12384 [20:20:36<5:56:25, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=9.92s]
Epoch 0: 77%|███████▋ | 9587/12384 [20:20:36<5:55:50, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.92s]
Epoch 0: 77%|███████▋ | 9587/12384 [20:20:44<5:55:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 0: 77%|███████▋ | 9588/12384 [20:20:44<5:55:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 0: 77%|███████▋ | 9588/12384 [20:20:52<5:55:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 0: 77%|███████▋ | 9589/12384 [20:20:52<5:54:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 0: 77%|███████▋ | 9589/12384 [20:20:59<5:54:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 0: 77%|███████▋ | 9590/12384 [20:20:59<5:54:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 0: 77%|███████▋ | 9590/12384 [20:21:07<5:54:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.37s]
Epoch 0: 77%|███████▋ | 9591/12384 [20:21:07<5:54:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.37s]
Epoch 0: 77%|███████▋ | 9591/12384 [20:21:14<5:54:29, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.24s]
Epoch 0: 77%|███████▋ | 9592/12384 [20:21:14<5:54:34, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.24s]
Epoch 0: 77%|███████▋ | 9592/12384 [20:21:22<5:54:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 0: 77%|███████▋ | 9593/12384 [20:21:22<5:54:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 0: 77%|███████▋ | 9593/12384 [20:21:30<5:54:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 77%|███████▋ | 9594/12384 [20:21:30<5:54:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 77%|███████▋ | 9594/12384 [20:21:37<5:54:00, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 77%|███████▋ | 9595/12384 [20:21:37<5:53:50, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 77%|███████▋ | 9595/12384 [20:21:45<5:53:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 0: 77%|███████▋ | 9596/12384 [20:21:45<5:53:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 0: 77%|███████▋ | 9596/12384 [20:21:53<5:53:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 0: 77%|███████▋ | 9597/12384 [20:21:53<5:53:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 0: 77%|███████▋ | 9597/12384 [20:22:00<5:53:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 0: 78%|███████▊ | 9598/12384 [20:22:00<5:53:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 0: 78%|███████▊ | 9598/12384 [20:22:08<5:53:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 0: 78%|███████▊ | 9599/12384 [20:22:08<5:53:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 0: 78%|███████▊ | 9599/12384 [20:22:15<5:53:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.66s]
Epoch 0: 78%|███████▊ | 9600/12384 [20:22:15<5:53:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.66s]
Epoch 0: 78%|███████▊ | 9600/12384 [20:22:23<5:53:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.85s]
Epoch 0: 78%|███████▊ | 9601/12384 [20:22:23<5:53:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.85s]
Epoch 0: 78%|███████▊ | 9601/12384 [20:22:31<5:53:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 0: 78%|███████▊ | 9602/12384 [20:22:31<5:52:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 0: 78%|███████▊ | 9602/12384 [20:22:39<5:52:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 0: 78%|███████▊ | 9603/12384 [20:22:39<5:57:23, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 0: 78%|███████▊ | 9603/12384 [20:22:46<5:57:23, 7.71s/it, loss=0.0016, acc=0.9969, iter_time=9.10s]
Epoch 0: 78%|███████▊ | 9604/12384 [20:22:46<5:55:41, 7.68s/it, loss=0.0016, acc=0.9969, iter_time=9.10s]
Epoch 0: 78%|███████▊ | 9604/12384 [20:22:54<5:55:41, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 78%|███████▊ | 9605/12384 [20:22:54<5:54:37, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 78%|███████▊ | 9605/12384 [20:23:01<5:54:37, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.26s]
Epoch 0: 78%|███████▊ | 9606/12384 [20:23:01<5:53:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.26s]
Epoch 0: 78%|███████▊ | 9606/12384 [20:23:09<5:53:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 0: 78%|███████▊ | 9607/12384 [20:23:09<5:52:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 0: 78%|███████▊ | 9607/12384 [20:23:17<5:52:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 78%|███████▊ | 9608/12384 [20:23:17<5:52:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 78%|███████▊ | 9608/12384 [20:23:24<5:52:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 0: 78%|███████▊ | 9609/12384 [20:23:24<5:56:21, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 0: 78%|███████▊ | 9609/12384 [20:23:32<5:56:21, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 78%|███████▊ | 9610/12384 [20:23:32<5:54:53, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 78%|███████▊ | 9610/12384 [20:23:40<5:54:53, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 78%|███████▊ | 9611/12384 [20:23:40<5:54:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 78%|███████▊ | 9611/12384 [20:23:47<5:54:05, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 78%|███████▊ | 9612/12384 [20:23:47<5:53:19, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 78%|███████▊ | 9612/12384 [20:23:55<5:53:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 78%|███████▊ | 9613/12384 [20:23:55<5:52:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 78%|███████▊ | 9613/12384 [20:24:03<5:52:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 0: 78%|███████▊ | 9614/12384 [20:24:03<5:51:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 0: 78%|███████▊ | 9614/12384 [20:24:10<5:51:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.69s]
Epoch 0: 78%|███████▊ | 9615/12384 [20:24:10<5:51:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.69s]
Epoch 0: 78%|███████▊ | 9615/12384 [20:24:18<5:51:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.50s]
Epoch 0: 78%|███████▊ | 9616/12384 [20:24:18<5:51:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.50s]
Epoch 0: 78%|███████▊ | 9616/12384 [20:24:25<5:51:39, 7.62s/it, loss=0.0012, acc=0.9961, iter_time=5.46s]
Epoch 0: 78%|███████▊ | 9617/12384 [20:24:25<5:51:06, 7.61s/it, loss=0.0012, acc=0.9961, iter_time=5.46s]
Epoch 0: 78%|███████▊ | 9617/12384 [20:24:33<5:51:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 0: 78%|███████▊ | 9618/12384 [20:24:33<5:50:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 0: 78%|███████▊ | 9618/12384 [20:24:41<5:50:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 0: 78%|███████▊ | 9619/12384 [20:24:41<5:50:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 0: 78%|███████▊ | 9619/12384 [20:24:48<5:50:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 78%|███████▊ | 9620/12384 [20:24:48<5:50:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 78%|███████▊ | 9620/12384 [20:24:56<5:50:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 78%|███████▊ | 9621/12384 [20:24:56<5:50:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 78%|███████▊ | 9621/12384 [20:25:03<5:50:43, 7.62s/it, loss=0.0005, acc=0.9974, iter_time=5.60s]
Epoch 0: 78%|███████▊ | 9622/12384 [20:25:03<5:50:37, 7.62s/it, loss=0.0005, acc=0.9974, iter_time=5.60s]
Epoch 0: 78%|███████▊ | 9622/12384 [20:25:11<5:50:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.61s]
Epoch 0: 78%|███████▊ | 9623/12384 [20:25:11<5:50:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.61s]
Epoch 0: 78%|███████▊ | 9623/12384 [20:25:19<5:50:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 0: 78%|███████▊ | 9624/12384 [20:25:19<5:50:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 0: 78%|███████▊ | 9624/12384 [20:25:26<5:50:02, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.02s]
Epoch 0: 78%|███████▊ | 9625/12384 [20:25:26<5:49:51, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.02s]
Epoch 0: 78%|███████▊ | 9625/12384 [20:25:34<5:49:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 0: 78%|███████▊ | 9626/12384 [20:25:34<5:49:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 0: 78%|███████▊ | 9626/12384 [20:25:41<5:49:28, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=5.86s]
Epoch 0: 78%|███████▊ | 9627/12384 [20:25:41<5:49:34, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.86s]
Epoch 0: 78%|███████▊ | 9627/12384 [20:25:49<5:49:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 0: 78%|███████▊ | 9628/12384 [20:25:49<5:49:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 0: 78%|███████▊ | 9628/12384 [20:25:57<5:49:09, 7.60s/it, loss=0.0002, acc=1.0000, iter_time=7.65s]
Epoch 0: 78%|███████▊ | 9629/12384 [20:25:57<5:53:38, 7.70s/it, loss=0.0002, acc=1.0000, iter_time=7.65s]
Epoch 0: 78%|███████▊ | 9629/12384 [20:26:05<5:53:38, 7.70s/it, loss=0.0006, acc=0.9984, iter_time=7.88s]
Epoch 0: 78%|███████▊ | 9630/12384 [20:26:05<5:52:13, 7.67s/it, loss=0.0006, acc=0.9984, iter_time=7.88s]
Epoch 0: 78%|███████▊ | 9630/12384 [20:26:12<5:52:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 78%|███████▊ | 9631/12384 [20:26:12<5:52:43, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 78%|███████▊ | 9631/12384 [20:26:20<5:52:43, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.42s]
Epoch 0: 78%|███████▊ | 9632/12384 [20:26:20<5:52:26, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.42s]
Epoch 0: 78%|███████▊ | 9632/12384 [20:26:28<5:52:26, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 0: 78%|███████▊ | 9633/12384 [20:26:28<5:51:30, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 0: 78%|███████▊ | 9633/12384 [20:26:35<5:51:30, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 78%|███████▊ | 9634/12384 [20:26:35<5:50:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 78%|███████▊ | 9634/12384 [20:26:43<5:50:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 0: 78%|███████▊ | 9635/12384 [20:26:43<5:50:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 0: 78%|███████▊ | 9635/12384 [20:26:50<5:50:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 0: 78%|███████▊ | 9636/12384 [20:26:50<5:49:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 0: 78%|███████▊ | 9636/12384 [20:26:58<5:49:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 0: 78%|███████▊ | 9637/12384 [20:26:58<5:49:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 0: 78%|███████▊ | 9637/12384 [20:27:06<5:49:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.88s]
Epoch 0: 78%|███████▊ | 9638/12384 [20:27:06<5:49:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.88s]
Epoch 0: 78%|███████▊ | 9638/12384 [20:27:13<5:49:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.37s]
Epoch 0: 78%|███████▊ | 9639/12384 [20:27:13<5:49:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.37s]
Epoch 0: 78%|███████▊ | 9639/12384 [20:27:21<5:49:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 78%|███████▊ | 9640/12384 [20:27:21<5:48:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 78%|███████▊ | 9640/12384 [20:27:29<5:48:51, 7.63s/it, loss=0.0003, acc=0.9981, iter_time=7.67s]
Epoch 0: 78%|███████▊ | 9641/12384 [20:27:29<5:48:37, 7.63s/it, loss=0.0003, acc=0.9981, iter_time=7.67s]
Epoch 0: 78%|███████▊ | 9641/12384 [20:27:36<5:48:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 0: 78%|███████▊ | 9642/12384 [20:27:36<5:48:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 0: 78%|███████▊ | 9642/12384 [20:27:44<5:48:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 0: 78%|███████▊ | 9643/12384 [20:27:44<5:47:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 0: 78%|███████▊ | 9643/12384 [20:27:51<5:47:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 0: 78%|███████▊ | 9644/12384 [20:27:51<5:47:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 0: 78%|███████▊ | 9644/12384 [20:27:59<5:47:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 0: 78%|███████▊ | 9645/12384 [20:27:59<5:47:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 0: 78%|███████▊ | 9645/12384 [20:28:07<5:47:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 78%|███████▊ | 9646/12384 [20:28:07<5:47:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 78%|███████▊ | 9646/12384 [20:28:14<5:47:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 0: 78%|███████▊ | 9647/12384 [20:28:14<5:47:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 0: 78%|███████▊ | 9647/12384 [20:28:22<5:47:21, 7.61s/it, loss=0.0007, acc=0.9976, iter_time=8.60s]
Epoch 0: 78%|███████▊ | 9648/12384 [20:28:22<5:47:01, 7.61s/it, loss=0.0007, acc=0.9976, iter_time=8.60s]
Epoch 0: 78%|███████▊ | 9648/12384 [20:28:29<5:47:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.67s]
Epoch 0: 78%|███████▊ | 9649/12384 [20:28:29<5:46:31, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.67s]
Epoch 0: 78%|███████▊ | 9649/12384 [20:28:37<5:46:31, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.56s]
Epoch 0: 78%|███████▊ | 9650/12384 [20:28:37<5:46:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.56s]
Epoch 0: 78%|███████▊ | 9650/12384 [20:28:45<5:46:43, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.20s]
Epoch 0: 78%|███████▊ | 9651/12384 [20:28:45<5:46:51, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.20s]
Epoch 0: 78%|███████▊ | 9651/12384 [20:28:52<5:46:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 78%|███████▊ | 9652/12384 [20:28:52<5:46:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 78%|███████▊ | 9652/12384 [20:29:00<5:46:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 78%|███████▊ | 9653/12384 [20:29:00<5:46:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 78%|███████▊ | 9653/12384 [20:29:08<5:46:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 0: 78%|███████▊ | 9654/12384 [20:29:08<5:46:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 0: 78%|███████▊ | 9654/12384 [20:29:15<5:46:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 0: 78%|███████▊ | 9655/12384 [20:29:15<5:46:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 0: 78%|███████▊ | 9655/12384 [20:29:23<5:46:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 0: 78%|███████▊ | 9656/12384 [20:29:23<5:51:15, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 0: 78%|███████▊ | 9656/12384 [20:29:31<5:51:15, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=5.15s]
Epoch 0: 78%|███████▊ | 9657/12384 [20:29:31<5:49:25, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.15s]
Epoch 0: 78%|███████▊ | 9657/12384 [20:29:38<5:49:25, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.77s]
Epoch 0: 78%|███████▊ | 9658/12384 [20:29:38<5:48:23, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.77s]
Epoch 0: 78%|███████▊ | 9658/12384 [20:29:46<5:48:23, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.35s]
Epoch 0: 78%|███████▊ | 9659/12384 [20:29:46<5:48:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.35s]
Epoch 0: 78%|███████▊ | 9659/12384 [20:29:54<5:48:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.26s]
Epoch 0: 78%|███████▊ | 9660/12384 [20:29:54<5:49:15, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.26s]
Epoch 0: 78%|███████▊ | 9660/12384 [20:30:01<5:49:15, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 78%|███████▊ | 9661/12384 [20:30:01<5:48:08, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 78%|███████▊ | 9661/12384 [20:30:09<5:48:08, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.93s]
Epoch 0: 78%|███████▊ | 9662/12384 [20:30:09<5:51:04, 7.74s/it, loss=0.0001, acc=1.0000, iter_time=7.93s]
Epoch 0: 78%|███████▊ | 9662/12384 [20:30:17<5:51:04, 7.74s/it, loss=0.0001, acc=1.0000, iter_time=5.80s]
Epoch 0: 78%|███████▊ | 9663/12384 [20:30:17<5:49:21, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=5.80s]
Epoch 0: 78%|███████▊ | 9663/12384 [20:30:24<5:49:21, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 0: 78%|███████▊ | 9664/12384 [20:30:24<5:47:46, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 0: 78%|███████▊ | 9664/12384 [20:30:32<5:47:46, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 0: 78%|███████▊ | 9665/12384 [20:30:32<5:47:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 0: 78%|███████▊ | 9665/12384 [20:30:40<5:47:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 0: 78%|███████▊ | 9666/12384 [20:30:40<5:46:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 0: 78%|███████▊ | 9666/12384 [20:30:47<5:46:18, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=7.59s]
Epoch 0: 78%|███████▊ | 9667/12384 [20:30:47<5:45:42, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.59s]
Epoch 0: 78%|███████▊ | 9667/12384 [20:30:55<5:45:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 0: 78%|███████▊ | 9668/12384 [20:30:55<5:45:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 0: 78%|███████▊ | 9668/12384 [20:31:03<5:45:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 0: 78%|███████▊ | 9669/12384 [20:31:03<5:44:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 0: 78%|███████▊ | 9669/12384 [20:31:10<5:44:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 0: 78%|███████▊ | 9670/12384 [20:31:10<5:44:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 0: 78%|███████▊ | 9670/12384 [20:31:18<5:44:47, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.97s]
Epoch 0: 78%|███████▊ | 9671/12384 [20:31:18<5:44:45, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.97s]
Epoch 0: 78%|███████▊ | 9671/12384 [20:31:25<5:44:45, 7.62s/it, loss=0.0012, acc=0.9970, iter_time=8.01s]
Epoch 0: 78%|███████▊ | 9672/12384 [20:31:25<5:44:18, 7.62s/it, loss=0.0012, acc=0.9970, iter_time=8.01s]
Epoch 0: 78%|███████▊ | 9672/12384 [20:31:33<5:44:18, 7.62s/it, loss=0.0004, acc=0.9978, iter_time=4.96s]
Epoch 0: 78%|███████▊ | 9673/12384 [20:31:33<5:44:20, 7.62s/it, loss=0.0004, acc=0.9978, iter_time=4.96s]
Epoch 0: 78%|███████▊ | 9673/12384 [20:31:41<5:44:20, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.79s]
Epoch 0: 78%|███████▊ | 9674/12384 [20:31:41<5:44:12, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.79s]
Epoch 0: 78%|███████▊ | 9674/12384 [20:31:48<5:44:12, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=8.23s]
Epoch 0: 78%|███████▊ | 9675/12384 [20:31:48<5:45:08, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=8.23s]
Epoch 0: 78%|███████▊ | 9675/12384 [20:31:56<5:45:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 0: 78%|███████▊ | 9676/12384 [20:31:56<5:45:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 0: 78%|███████▊ | 9676/12384 [20:32:04<5:45:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 78%|███████▊ | 9677/12384 [20:32:04<5:44:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 78%|███████▊ | 9677/12384 [20:32:11<5:44:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.24s]
Epoch 0: 78%|███████▊ | 9678/12384 [20:32:11<5:43:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.24s]
Epoch 0: 78%|███████▊ | 9678/12384 [20:32:19<5:43:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.96s]
Epoch 0: 78%|███████▊ | 9679/12384 [20:32:19<5:43:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.96s]
Epoch 0: 78%|███████▊ | 9679/12384 [20:32:26<5:43:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 78%|███████▊ | 9680/12384 [20:32:26<5:43:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 78%|███████▊ | 9680/12384 [20:32:34<5:43:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.18s]
Epoch 0: 78%|███████▊ | 9681/12384 [20:32:34<5:43:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.18s]
Epoch 0: 78%|███████▊ | 9681/12384 [20:32:42<5:43:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 78%|███████▊ | 9682/12384 [20:32:42<5:47:17, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 78%|███████▊ | 9682/12384 [20:32:50<5:47:17, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 78%|███████▊ | 9683/12384 [20:32:50<5:45:47, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 78%|███████▊ | 9683/12384 [20:32:57<5:45:47, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 78%|███████▊ | 9684/12384 [20:32:57<5:44:59, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 78%|███████▊ | 9684/12384 [20:33:05<5:44:59, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 0: 78%|███████▊ | 9685/12384 [20:33:05<5:46:01, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 0: 78%|███████▊ | 9685/12384 [20:33:13<5:46:01, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 0: 78%|███████▊ | 9686/12384 [20:33:13<5:44:53, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 0: 78%|███████▊ | 9686/12384 [20:33:20<5:44:53, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 78%|███████▊ | 9687/12384 [20:33:20<5:43:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 78%|███████▊ | 9687/12384 [20:33:28<5:43:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 0: 78%|███████▊ | 9688/12384 [20:33:28<5:47:21, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 0: 78%|███████▊ | 9688/12384 [20:33:36<5:47:21, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=5.13s]
Epoch 0: 78%|███████▊ | 9689/12384 [20:33:36<5:45:13, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.13s]
Epoch 0: 78%|███████▊ | 9689/12384 [20:33:43<5:45:13, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 0: 78%|███████▊ | 9690/12384 [20:33:43<5:44:17, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 0: 78%|███████▊ | 9690/12384 [20:33:51<5:44:17, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 78%|███████▊ | 9691/12384 [20:33:51<5:43:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 78%|███████▊ | 9691/12384 [20:33:59<5:43:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 0: 78%|███████▊ | 9692/12384 [20:33:59<5:42:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 0: 78%|███████▊ | 9692/12384 [20:34:06<5:42:45, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=9.13s]
Epoch 0: 78%|███████▊ | 9693/12384 [20:34:06<5:42:20, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=9.13s]
Epoch 0: 78%|███████▊ | 9693/12384 [20:34:14<5:42:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 78%|███████▊ | 9694/12384 [20:34:14<5:42:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 78%|███████▊ | 9694/12384 [20:34:21<5:42:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 0: 78%|███████▊ | 9695/12384 [20:34:21<5:41:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 0: 78%|███████▊ | 9695/12384 [20:34:29<5:41:23, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=8.75s]
Epoch 0: 78%|███████▊ | 9696/12384 [20:34:29<5:41:43, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=8.75s]
Epoch 0: 78%|███████▊ | 9696/12384 [20:34:37<5:41:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 0: 78%|███████▊ | 9697/12384 [20:34:37<5:41:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 0: 78%|███████▊ | 9697/12384 [20:34:44<5:41:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.04s]
Epoch 0: 78%|███████▊ | 9698/12384 [20:34:44<5:40:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.04s]
Epoch 0: 78%|███████▊ | 9698/12384 [20:34:52<5:40:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.21s]
Epoch 0: 78%|███████▊ | 9699/12384 [20:34:52<5:40:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.21s]
Epoch 0: 78%|███████▊ | 9699/12384 [20:34:59<5:40:40, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=11.03s]
Epoch 0: 78%|███████▊ | 9700/12384 [20:34:59<5:40:31, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=11.03s]
Epoch 0: 78%|███████▊ | 9700/12384 [20:35:07<5:40:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 78%|███████▊ | 9701/12384 [20:35:07<5:40:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 78%|███████▊ | 9701/12384 [20:35:15<5:40:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.35s]
Epoch 0: 78%|███████▊ | 9702/12384 [20:35:15<5:40:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.35s]
Epoch 0: 78%|███████▊ | 9702/12384 [20:35:22<5:40:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.45s]
Epoch 0: 78%|███████▊ | 9703/12384 [20:35:22<5:40:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.45s]
Epoch 0: 78%|███████▊ | 9703/12384 [20:35:30<5:40:27, 7.62s/it, loss=0.0004, acc=0.9989, iter_time=7.56s]
Epoch 0: 78%|███████▊ | 9704/12384 [20:35:30<5:40:15, 7.62s/it, loss=0.0004, acc=0.9989, iter_time=7.56s]
Epoch 0: 78%|███████▊ | 9704/12384 [20:35:38<5:40:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 78%|███████▊ | 9705/12384 [20:35:38<5:40:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 78%|███████▊ | 9705/12384 [20:35:45<5:40:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 0: 78%|███████▊ | 9706/12384 [20:35:45<5:40:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 0: 78%|███████▊ | 9706/12384 [20:35:53<5:40:09, 7.62s/it, loss=0.0004, acc=0.9980, iter_time=9.66s]
Epoch 0: 78%|███████▊ | 9707/12384 [20:35:53<5:39:43, 7.61s/it, loss=0.0004, acc=0.9980, iter_time=9.66s]
Epoch 0: 78%|███████▊ | 9707/12384 [20:36:00<5:39:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 78%|███████▊ | 9708/12384 [20:36:00<5:39:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 78%|███████▊ | 9708/12384 [20:36:08<5:39:38, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.78s]
Epoch 0: 78%|███████▊ | 9709/12384 [20:36:08<5:43:42, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.78s]
Epoch 0: 78%|███████▊ | 9709/12384 [20:36:16<5:43:42, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.77s]
Epoch 0: 78%|███████▊ | 9710/12384 [20:36:16<5:42:15, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.77s]
Epoch 0: 78%|███████▊ | 9710/12384 [20:36:24<5:42:15, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 78%|███████▊ | 9711/12384 [20:36:24<5:41:53, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 78%|███████▊ | 9711/12384 [20:36:31<5:41:53, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 0: 78%|███████▊ | 9712/12384 [20:36:31<5:41:06, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 0: 78%|███████▊ | 9712/12384 [20:36:39<5:41:06, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 78%|███████▊ | 9713/12384 [20:36:39<5:40:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 78%|███████▊ | 9713/12384 [20:36:47<5:40:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 78%|███████▊ | 9714/12384 [20:36:47<5:43:05, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 78%|███████▊ | 9714/12384 [20:36:54<5:43:05, 7.71s/it, loss=0.0004, acc=0.9983, iter_time=5.55s]
Epoch 0: 78%|███████▊ | 9715/12384 [20:36:54<5:41:41, 7.68s/it, loss=0.0004, acc=0.9983, iter_time=5.55s]
Epoch 0: 78%|███████▊ | 9715/12384 [20:37:02<5:41:41, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 0: 78%|███████▊ | 9716/12384 [20:37:02<5:40:38, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 0: 78%|███████▊ | 9716/12384 [20:37:10<5:40:38, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 0: 78%|███████▊ | 9717/12384 [20:37:10<5:39:57, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 0: 78%|███████▊ | 9717/12384 [20:37:17<5:39:57, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.81s]
Epoch 0: 78%|███████▊ | 9718/12384 [20:37:17<5:39:03, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.81s]
Epoch 0: 78%|███████▊ | 9718/12384 [20:37:25<5:39:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 78%|███████▊ | 9719/12384 [20:37:25<5:38:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 78%|███████▊ | 9719/12384 [20:37:32<5:38:37, 7.62s/it, loss=0.0001, acc=0.9995, iter_time=8.02s]
Epoch 0: 78%|███████▊ | 9720/12384 [20:37:32<5:38:30, 7.62s/it, loss=0.0001, acc=0.9995, iter_time=8.02s]
Epoch 0: 78%|███████▊ | 9720/12384 [20:37:40<5:38:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 78%|███████▊ | 9721/12384 [20:37:40<5:38:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 78%|███████▊ | 9721/12384 [20:37:48<5:38:18, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.04s]
Epoch 0: 79%|███████▊ | 9722/12384 [20:37:48<5:38:13, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.04s]
Epoch 0: 79%|███████▊ | 9722/12384 [20:37:55<5:38:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 0: 79%|███████▊ | 9723/12384 [20:37:55<5:38:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 0: 79%|███████▊ | 9723/12384 [20:38:03<5:38:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 79%|███████▊ | 9724/12384 [20:38:03<5:37:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 79%|███████▊ | 9724/12384 [20:38:10<5:37:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 79%|███████▊ | 9725/12384 [20:38:10<5:37:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 79%|███████▊ | 9725/12384 [20:38:18<5:37:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 79%|███████▊ | 9726/12384 [20:38:18<5:37:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 79%|███████▊ | 9726/12384 [20:38:26<5:37:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 79%|███████▊ | 9727/12384 [20:38:26<5:36:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 79%|███████▊ | 9727/12384 [20:38:33<5:36:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 79%|███████▊ | 9728/12384 [20:38:33<5:36:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 79%|███████▊ | 9728/12384 [20:38:41<5:36:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 0: 79%|███████▊ | 9729/12384 [20:38:41<5:36:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 0: 79%|███████▊ | 9729/12384 [20:38:49<5:36:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 0: 79%|███████▊ | 9730/12384 [20:38:49<5:36:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 0: 79%|███████▊ | 9730/12384 [20:38:56<5:36:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 0: 79%|███████▊ | 9731/12384 [20:38:56<5:36:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 0: 79%|███████▊ | 9731/12384 [20:39:04<5:36:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 0: 79%|███████▊ | 9732/12384 [20:39:04<5:36:04, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 0: 79%|███████▊ | 9732/12384 [20:39:11<5:36:04, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.73s]
Epoch 0: 79%|███████▊ | 9733/12384 [20:39:11<5:35:59, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.73s]
Epoch 0: 79%|███████▊ | 9733/12384 [20:39:19<5:35:59, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 0: 79%|███████▊ | 9734/12384 [20:39:19<5:35:40, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 0: 79%|███████▊ | 9734/12384 [20:39:27<5:35:40, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.80s]
Epoch 0: 79%|███████▊ | 9735/12384 [20:39:27<5:39:49, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.80s]
Epoch 0: 79%|███████▊ | 9735/12384 [20:39:34<5:39:49, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.35s]
Epoch 0: 79%|███████▊ | 9736/12384 [20:39:34<5:38:40, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.35s]
Epoch 0: 79%|███████▊ | 9736/12384 [20:39:42<5:38:40, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 0: 79%|███████▊ | 9737/12384 [20:39:42<5:37:46, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 0: 79%|███████▊ | 9737/12384 [20:39:50<5:37:46, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 0: 79%|███████▊ | 9738/12384 [20:39:50<5:37:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 0: 79%|███████▊ | 9738/12384 [20:39:57<5:37:02, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=10.20s]
Epoch 0: 79%|███████▊ | 9739/12384 [20:39:57<5:37:34, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=10.20s]
Epoch 0: 79%|███████▊ | 9739/12384 [20:40:05<5:37:34, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 79%|███████▊ | 9740/12384 [20:40:05<5:40:42, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 79%|███████▊ | 9740/12384 [20:40:13<5:40:42, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 0: 79%|███████▊ | 9741/12384 [20:40:13<5:39:02, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 0: 79%|███████▊ | 9741/12384 [20:40:21<5:39:02, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 0: 79%|███████▊ | 9742/12384 [20:40:21<5:37:53, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 0: 79%|███████▊ | 9742/12384 [20:40:28<5:37:53, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 0: 79%|███████▊ | 9743/12384 [20:40:28<5:36:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 0: 79%|███████▊ | 9743/12384 [20:40:36<5:36:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.79s]
Epoch 0: 79%|███████▊ | 9744/12384 [20:40:36<5:36:49, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.79s]
Epoch 0: 79%|███████▊ | 9744/12384 [20:40:43<5:36:49, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 0: 79%|███████▊ | 9745/12384 [20:40:43<5:36:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 0: 79%|███████▊ | 9745/12384 [20:40:51<5:36:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 79%|███████▊ | 9746/12384 [20:40:51<5:35:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 79%|███████▊ | 9746/12384 [20:40:59<5:35:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 79%|███████▊ | 9747/12384 [20:40:59<5:35:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 79%|███████▊ | 9747/12384 [20:41:06<5:35:06, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.50s]
Epoch 0: 79%|███████▊ | 9748/12384 [20:41:06<5:34:59, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.50s]
Epoch 0: 79%|███████▊ | 9748/12384 [20:41:14<5:34:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.20s]
Epoch 0: 79%|███████▊ | 9749/12384 [20:41:14<5:34:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.20s]
Epoch 0: 79%|███████▊ | 9749/12384 [20:41:21<5:34:46, 7.62s/it, loss=0.0005, acc=0.9976, iter_time=11.52s]
Epoch 0: 79%|███████▊ | 9750/12384 [20:41:21<5:34:17, 7.61s/it, loss=0.0005, acc=0.9976, iter_time=11.52s]
Epoch 0: 79%|███████▊ | 9750/12384 [20:41:29<5:34:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 0: 79%|███████▊ | 9751/12384 [20:41:29<5:34:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 0: 79%|███████▊ | 9751/12384 [20:41:37<5:34:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 0: 79%|███████▊ | 9752/12384 [20:41:37<5:34:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 0: 79%|███████▊ | 9752/12384 [20:41:44<5:34:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 0: 79%|███████▉ | 9753/12384 [20:41:44<5:33:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 0: 79%|███████▉ | 9753/12384 [20:41:52<5:33:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 0: 79%|███████▉ | 9754/12384 [20:41:52<5:33:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 0: 79%|███████▉ | 9754/12384 [20:42:00<5:33:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 79%|███████▉ | 9755/12384 [20:42:00<5:33:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 79%|███████▉ | 9755/12384 [20:42:07<5:33:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 79%|███████▉ | 9756/12384 [20:42:07<5:33:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 79%|███████▉ | 9756/12384 [20:42:15<5:33:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 0: 79%|███████▉ | 9757/12384 [20:42:15<5:33:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 0: 79%|███████▉ | 9757/12384 [20:42:22<5:33:06, 7.61s/it, loss=0.0002, acc=0.9987, iter_time=6.75s]
Epoch 0: 79%|███████▉ | 9758/12384 [20:42:22<5:33:09, 7.61s/it, loss=0.0002, acc=0.9987, iter_time=6.75s]
Epoch 0: 79%|███████▉ | 9758/12384 [20:42:30<5:33:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.48s]
Epoch 0: 79%|███████▉ | 9759/12384 [20:42:30<5:33:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.48s]
Epoch 0: 79%|███████▉ | 9759/12384 [20:42:38<5:33:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 0: 79%|███████▉ | 9760/12384 [20:42:38<5:32:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 0: 79%|███████▉ | 9760/12384 [20:42:45<5:32:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.39s]
Epoch 0: 79%|███████▉ | 9761/12384 [20:42:45<5:36:52, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.39s]
Epoch 0: 79%|███████▉ | 9761/12384 [20:42:53<5:36:52, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 0: 79%|███████▉ | 9762/12384 [20:42:53<5:35:22, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 0: 79%|███████▉ | 9762/12384 [20:43:01<5:35:22, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=8.83s]
Epoch 0: 79%|███████▉ | 9763/12384 [20:43:01<5:34:31, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=8.83s]
Epoch 0: 79%|███████▉ | 9763/12384 [20:43:08<5:34:31, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 0: 79%|███████▉ | 9764/12384 [20:43:08<5:34:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 0: 79%|███████▉ | 9764/12384 [20:43:16<5:34:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 0: 79%|███████▉ | 9765/12384 [20:43:16<5:33:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 0: 79%|███████▉ | 9765/12384 [20:43:24<5:33:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 0: 79%|███████▉ | 9766/12384 [20:43:24<5:33:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 0: 79%|███████▉ | 9766/12384 [20:43:31<5:33:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 0: 79%|███████▉ | 9767/12384 [20:43:31<5:36:30, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 0: 79%|███████▉ | 9767/12384 [20:43:39<5:36:30, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 0: 79%|███████▉ | 9768/12384 [20:43:39<5:35:16, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 0: 79%|███████▉ | 9768/12384 [20:43:47<5:35:16, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 79%|███████▉ | 9769/12384 [20:43:47<5:33:50, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 79%|███████▉ | 9769/12384 [20:43:54<5:33:50, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 0: 79%|███████▉ | 9770/12384 [20:43:54<5:33:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 0: 79%|███████▉ | 9770/12384 [20:44:02<5:33:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.98s]
Epoch 0: 79%|███████▉ | 9771/12384 [20:44:02<5:32:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.98s]
Epoch 0: 79%|███████▉ | 9771/12384 [20:44:10<5:32:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 0: 79%|███████▉ | 9772/12384 [20:44:10<5:32:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 0: 79%|███████▉ | 9772/12384 [20:44:17<5:32:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 79%|███████▉ | 9773/12384 [20:44:17<5:31:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 79%|███████▉ | 9773/12384 [20:44:25<5:31:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 79%|███████▉ | 9774/12384 [20:44:25<5:31:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 79%|███████▉ | 9774/12384 [20:44:32<5:31:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 0: 79%|███████▉ | 9775/12384 [20:44:32<5:31:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 0: 79%|███████▉ | 9775/12384 [20:44:40<5:31:08, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.24s]
Epoch 0: 79%|███████▉ | 9776/12384 [20:44:40<5:31:12, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.24s]
Epoch 0: 79%|███████▉ | 9776/12384 [20:44:48<5:31:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 79%|███████▉ | 9777/12384 [20:44:48<5:31:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 79%|███████▉ | 9777/12384 [20:44:55<5:31:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 79%|███████▉ | 9778/12384 [20:44:55<5:30:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 79%|███████▉ | 9778/12384 [20:45:03<5:30:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 0: 79%|███████▉ | 9779/12384 [20:45:03<5:30:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 0: 79%|███████▉ | 9779/12384 [20:45:10<5:30:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 0: 79%|███████▉ | 9780/12384 [20:45:10<5:30:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 0: 79%|███████▉ | 9780/12384 [20:45:18<5:30:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 0: 79%|███████▉ | 9781/12384 [20:45:18<5:30:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 0: 79%|███████▉ | 9781/12384 [20:45:26<5:30:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 0: 79%|███████▉ | 9782/12384 [20:45:26<5:30:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 0: 79%|███████▉ | 9782/12384 [20:45:33<5:30:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 0: 79%|███████▉ | 9783/12384 [20:45:33<5:29:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 0: 79%|███████▉ | 9783/12384 [20:45:41<5:29:53, 7.61s/it, loss=0.0000, acc=0.9996, iter_time=7.99s]
Epoch 0: 79%|███████▉ | 9784/12384 [20:45:41<5:30:30, 7.63s/it, loss=0.0000, acc=0.9996, iter_time=7.99s]
Epoch 0: 79%|███████▉ | 9784/12384 [20:45:49<5:30:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 0: 79%|███████▉ | 9785/12384 [20:45:49<5:30:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 0: 79%|███████▉ | 9785/12384 [20:45:56<5:30:03, 7.62s/it, loss=0.0002, acc=0.9989, iter_time=5.30s]
Epoch 0: 79%|███████▉ | 9786/12384 [20:45:56<5:29:50, 7.62s/it, loss=0.0002, acc=0.9989, iter_time=5.30s]
Epoch 0: 79%|███████▉ | 9786/12384 [20:46:04<5:29:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.98s]
Epoch 0: 79%|███████▉ | 9787/12384 [20:46:04<5:34:10, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.98s]
Epoch 0: 79%|███████▉ | 9787/12384 [20:46:12<5:34:10, 7.72s/it, loss=0.0002, acc=1.0000, iter_time=7.91s]
Epoch 0: 79%|███████▉ | 9788/12384 [20:46:12<5:32:26, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=7.91s]
Epoch 0: 79%|███████▉ | 9788/12384 [20:46:19<5:32:26, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 0: 79%|███████▉ | 9789/12384 [20:46:19<5:31:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 0: 79%|███████▉ | 9789/12384 [20:46:27<5:31:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 0: 79%|███████▉ | 9790/12384 [20:46:27<5:30:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 0: 79%|███████▉ | 9790/12384 [20:46:35<5:30:30, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 79%|███████▉ | 9791/12384 [20:46:35<5:29:46, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 79%|███████▉ | 9791/12384 [20:46:42<5:29:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 79%|███████▉ | 9792/12384 [20:46:42<5:29:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 79%|███████▉ | 9792/12384 [20:46:50<5:29:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 0: 79%|███████▉ | 9793/12384 [20:46:50<5:33:11, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 0: 79%|███████▉ | 9793/12384 [20:46:58<5:33:11, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 79%|███████▉ | 9794/12384 [20:46:58<5:31:34, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 79%|███████▉ | 9794/12384 [20:47:05<5:31:34, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=3.65s]
Epoch 0: 79%|███████▉ | 9795/12384 [20:47:05<5:30:39, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=3.65s]
Epoch 0: 79%|███████▉ | 9795/12384 [20:47:13<5:30:39, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=11.56s]
Epoch 0: 79%|███████▉ | 9796/12384 [20:47:13<5:30:07, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=11.56s]
Epoch 0: 79%|███████▉ | 9796/12384 [20:47:21<5:30:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 79%|███████▉ | 9797/12384 [20:47:21<5:30:12, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 79%|███████▉ | 9797/12384 [20:47:28<5:30:12, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 0: 79%|███████▉ | 9798/12384 [20:47:28<5:30:29, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 0: 79%|███████▉ | 9798/12384 [20:47:36<5:30:29, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.04s]
Epoch 0: 79%|███████▉ | 9799/12384 [20:47:36<5:29:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.04s]
Epoch 0: 79%|███████▉ | 9799/12384 [20:47:44<5:29:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 79%|███████▉ | 9800/12384 [20:47:44<5:28:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 79%|███████▉ | 9800/12384 [20:47:51<5:28:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 79%|███████▉ | 9801/12384 [20:47:51<5:28:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 79%|███████▉ | 9801/12384 [20:47:59<5:28:25, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 79%|███████▉ | 9802/12384 [20:47:59<5:28:15, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 79%|███████▉ | 9802/12384 [20:48:06<5:28:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 79%|███████▉ | 9803/12384 [20:48:06<5:27:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 79%|███████▉ | 9803/12384 [20:48:14<5:27:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 0: 79%|███████▉ | 9804/12384 [20:48:14<5:26:48, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 0: 79%|███████▉ | 9804/12384 [20:48:22<5:26:48, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 0: 79%|███████▉ | 9805/12384 [20:48:22<5:27:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 0: 79%|███████▉ | 9805/12384 [20:48:29<5:27:01, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.01s]
Epoch 0: 79%|███████▉ | 9806/12384 [20:48:29<5:26:31, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=9.01s]
Epoch 0: 79%|███████▉ | 9806/12384 [20:48:37<5:26:31, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 0: 79%|███████▉ | 9807/12384 [20:48:37<5:26:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 0: 79%|███████▉ | 9807/12384 [20:48:44<5:26:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 79%|███████▉ | 9808/12384 [20:48:44<5:26:27, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 79%|███████▉ | 9808/12384 [20:48:52<5:26:27, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.43s]
Epoch 0: 79%|███████▉ | 9809/12384 [20:48:52<5:26:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.43s]
Epoch 0: 79%|███████▉ | 9809/12384 [20:49:00<5:26:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.39s]
Epoch 0: 79%|███████▉ | 9810/12384 [20:49:00<5:26:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.39s]
Epoch 0: 79%|███████▉ | 9810/12384 [20:49:07<5:26:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 0: 79%|███████▉ | 9811/12384 [20:49:07<5:27:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 0: 79%|███████▉ | 9811/12384 [20:49:15<5:27:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 79%|███████▉ | 9812/12384 [20:49:15<5:26:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 79%|███████▉ | 9812/12384 [20:49:23<5:26:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 79%|███████▉ | 9813/12384 [20:49:23<5:30:41, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 79%|███████▉ | 9813/12384 [20:49:30<5:30:41, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 79%|███████▉ | 9814/12384 [20:49:30<5:29:39, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 79%|███████▉ | 9814/12384 [20:49:38<5:29:39, 7.70s/it, loss=0.0003, acc=0.9977, iter_time=7.61s]
Epoch 0: 79%|███████▉ | 9815/12384 [20:49:38<5:28:52, 7.68s/it, loss=0.0003, acc=0.9977, iter_time=7.61s]
Epoch 0: 79%|███████▉ | 9815/12384 [20:49:46<5:28:52, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 0: 79%|███████▉ | 9816/12384 [20:49:46<5:28:02, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 0: 79%|███████▉ | 9816/12384 [20:49:53<5:28:02, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.61s]
Epoch 0: 79%|███████▉ | 9817/12384 [20:49:53<5:28:08, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.61s]
Epoch 0: 79%|███████▉ | 9817/12384 [20:50:01<5:28:08, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 0: 79%|███████▉ | 9818/12384 [20:50:01<5:27:54, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 0: 79%|███████▉ | 9818/12384 [20:50:09<5:27:54, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 0: 79%|███████▉ | 9819/12384 [20:50:09<5:26:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 0: 79%|███████▉ | 9819/12384 [20:50:16<5:26:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 79%|███████▉ | 9820/12384 [20:50:16<5:29:41, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 79%|███████▉ | 9820/12384 [20:50:24<5:29:41, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 0: 79%|███████▉ | 9821/12384 [20:50:24<5:28:31, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 0: 79%|███████▉ | 9821/12384 [20:50:32<5:28:31, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 0: 79%|███████▉ | 9822/12384 [20:50:32<5:27:28, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 0: 79%|███████▉ | 9822/12384 [20:50:39<5:27:28, 7.67s/it, loss=0.0002, acc=0.9994, iter_time=9.40s]
Epoch 0: 79%|███████▉ | 9823/12384 [20:50:39<5:26:41, 7.65s/it, loss=0.0002, acc=0.9994, iter_time=9.40s]
Epoch 0: 79%|███████▉ | 9823/12384 [20:50:47<5:26:41, 7.65s/it, loss=0.0001, acc=0.9993, iter_time=8.02s]
Epoch 0: 79%|███████▉ | 9824/12384 [20:50:47<5:26:20, 7.65s/it, loss=0.0001, acc=0.9993, iter_time=8.02s]
Epoch 0: 79%|███████▉ | 9824/12384 [20:50:55<5:26:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.94s]
Epoch 0: 79%|███████▉ | 9825/12384 [20:50:55<5:25:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.94s]
Epoch 0: 79%|███████▉ | 9825/12384 [20:51:02<5:25:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 79%|███████▉ | 9826/12384 [20:51:02<5:26:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 79%|███████▉ | 9826/12384 [20:51:10<5:26:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 79%|███████▉ | 9827/12384 [20:51:10<5:25:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 79%|███████▉ | 9827/12384 [20:51:17<5:25:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 79%|███████▉ | 9828/12384 [20:51:17<5:24:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 79%|███████▉ | 9828/12384 [20:51:25<5:24:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 79%|███████▉ | 9829/12384 [20:51:25<5:24:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 79%|███████▉ | 9829/12384 [20:51:33<5:24:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 0: 79%|███████▉ | 9830/12384 [20:51:33<5:24:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 0: 79%|███████▉ | 9830/12384 [20:51:40<5:24:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.62s]
Epoch 0: 79%|███████▉ | 9831/12384 [20:51:40<5:23:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.62s]
Epoch 0: 79%|███████▉ | 9831/12384 [20:51:48<5:23:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 79%|███████▉ | 9832/12384 [20:51:48<5:24:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 79%|███████▉ | 9832/12384 [20:51:56<5:24:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 79%|███████▉ | 9833/12384 [20:51:56<5:23:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 79%|███████▉ | 9833/12384 [20:52:03<5:23:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 0: 79%|███████▉ | 9834/12384 [20:52:03<5:23:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 0: 79%|███████▉ | 9834/12384 [20:52:11<5:23:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 0: 79%|███████▉ | 9835/12384 [20:52:11<5:23:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 0: 79%|███████▉ | 9835/12384 [20:52:18<5:23:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 0: 79%|███████▉ | 9836/12384 [20:52:18<5:23:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 0: 79%|███████▉ | 9836/12384 [20:52:26<5:23:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.28s]
Epoch 0: 79%|███████▉ | 9837/12384 [20:52:26<5:22:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.28s]
Epoch 0: 79%|███████▉ | 9837/12384 [20:52:34<5:22:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.40s]
Epoch 0: 79%|███████▉ | 9838/12384 [20:52:34<5:22:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.40s]
Epoch 0: 79%|███████▉ | 9838/12384 [20:52:41<5:22:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 0: 79%|███████▉ | 9839/12384 [20:52:41<5:22:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 0: 79%|███████▉ | 9839/12384 [20:52:49<5:22:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 0: 79%|███████▉ | 9840/12384 [20:52:49<5:27:32, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 0: 79%|███████▉ | 9840/12384 [20:52:57<5:27:32, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 0: 79%|███████▉ | 9841/12384 [20:52:57<5:26:43, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 0: 79%|███████▉ | 9841/12384 [20:53:04<5:26:43, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 79%|███████▉ | 9842/12384 [20:53:04<5:25:31, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 79%|███████▉ | 9842/12384 [20:53:12<5:25:31, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 79%|███████▉ | 9843/12384 [20:53:12<5:24:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 79%|███████▉ | 9843/12384 [20:53:20<5:24:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 0: 79%|███████▉ | 9844/12384 [20:53:20<5:23:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 0: 79%|███████▉ | 9844/12384 [20:53:27<5:23:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 0: 79%|███████▉ | 9845/12384 [20:53:27<5:22:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 0: 79%|███████▉ | 9845/12384 [20:53:35<5:22:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.29s]
Epoch 0: 80%|███████▉ | 9846/12384 [20:53:35<5:22:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.29s]
Epoch 0: 80%|███████▉ | 9846/12384 [20:53:42<5:22:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.91s]
Epoch 0: 80%|███████▉ | 9847/12384 [20:53:42<5:22:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.91s]
Epoch 0: 80%|███████▉ | 9847/12384 [20:53:50<5:22:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 80%|███████▉ | 9848/12384 [20:53:50<5:21:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 80%|███████▉ | 9848/12384 [20:53:58<5:21:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 80%|███████▉ | 9849/12384 [20:53:58<5:21:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 80%|███████▉ | 9849/12384 [20:54:05<5:21:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 80%|███████▉ | 9850/12384 [20:54:05<5:21:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 80%|███████▉ | 9850/12384 [20:54:13<5:21:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 80%|███████▉ | 9851/12384 [20:54:13<5:21:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 80%|███████▉ | 9851/12384 [20:54:21<5:21:12, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 80%|███████▉ | 9852/12384 [20:54:21<5:21:08, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 80%|███████▉ | 9852/12384 [20:54:28<5:21:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 80%|███████▉ | 9853/12384 [20:54:28<5:21:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 80%|███████▉ | 9853/12384 [20:54:36<5:21:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 80%|███████▉ | 9854/12384 [20:54:36<5:20:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 80%|███████▉ | 9854/12384 [20:54:43<5:20:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 0: 80%|███████▉ | 9855/12384 [20:54:43<5:20:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 0: 80%|███████▉ | 9855/12384 [20:54:51<5:20:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.19s]
Epoch 0: 80%|███████▉ | 9856/12384 [20:54:51<5:20:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.19s]
Epoch 0: 80%|███████▉ | 9856/12384 [20:54:59<5:20:34, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.69s]
Epoch 0: 80%|███████▉ | 9857/12384 [20:54:59<5:20:31, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.69s]
Epoch 0: 80%|███████▉ | 9857/12384 [20:55:06<5:20:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 0: 80%|███████▉ | 9858/12384 [20:55:06<5:20:05, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 0: 80%|███████▉ | 9858/12384 [20:55:14<5:20:05, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 80%|███████▉ | 9859/12384 [20:55:14<5:20:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 80%|███████▉ | 9859/12384 [20:55:21<5:20:06, 7.61s/it, loss=0.0002, acc=0.9994, iter_time=7.61s]
Epoch 0: 80%|███████▉ | 9860/12384 [20:55:21<5:20:02, 7.61s/it, loss=0.0002, acc=0.9994, iter_time=7.61s]
Epoch 0: 80%|███████▉ | 9860/12384 [20:55:29<5:20:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 80%|███████▉ | 9861/12384 [20:55:29<5:19:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 80%|███████▉ | 9861/12384 [20:55:37<5:19:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 0: 80%|███████▉ | 9862/12384 [20:55:37<5:19:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 0: 80%|███████▉ | 9862/12384 [20:55:44<5:19:48, 7.61s/it, loss=0.0004, acc=0.9994, iter_time=10.45s]
Epoch 0: 80%|███████▉ | 9863/12384 [20:55:44<5:19:35, 7.61s/it, loss=0.0004, acc=0.9994, iter_time=10.45s]
Epoch 0: 80%|███████▉ | 9863/12384 [20:55:52<5:19:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 80%|███████▉ | 9864/12384 [20:55:52<5:19:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 80%|███████▉ | 9864/12384 [20:55:59<5:19:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 80%|███████▉ | 9865/12384 [20:55:59<5:19:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 80%|███████▉ | 9865/12384 [20:56:07<5:19:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 80%|███████▉ | 9866/12384 [20:56:07<5:24:01, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 80%|███████▉ | 9866/12384 [20:56:15<5:24:01, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=4.54s]
Epoch 0: 80%|███████▉ | 9867/12384 [20:56:15<5:22:16, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.54s]
Epoch 0: 80%|███████▉ | 9867/12384 [20:56:23<5:22:16, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.95s]
Epoch 0: 80%|███████▉ | 9868/12384 [20:56:23<5:20:57, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.95s]
Epoch 0: 80%|███████▉ | 9868/12384 [20:56:30<5:20:57, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 80%|███████▉ | 9869/12384 [20:56:30<5:20:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 80%|███████▉ | 9869/12384 [20:56:38<5:20:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 80%|███████▉ | 9870/12384 [20:56:38<5:20:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 80%|███████▉ | 9870/12384 [20:56:45<5:20:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 80%|███████▉ | 9871/12384 [20:56:45<5:19:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 80%|███████▉ | 9871/12384 [20:56:53<5:19:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 80%|███████▉ | 9872/12384 [20:56:53<5:19:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 80%|███████▉ | 9872/12384 [20:57:01<5:19:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 80%|███████▉ | 9873/12384 [20:57:01<5:19:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 80%|███████▉ | 9873/12384 [20:57:08<5:19:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 80%|███████▉ | 9874/12384 [20:57:08<5:18:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 80%|███████▉ | 9874/12384 [20:57:16<5:18:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 80%|███████▉ | 9875/12384 [20:57:16<5:18:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 80%|███████▉ | 9875/12384 [20:57:24<5:18:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 80%|███████▉ | 9876/12384 [20:57:24<5:18:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 80%|███████▉ | 9876/12384 [20:57:31<5:18:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 80%|███████▉ | 9877/12384 [20:57:31<5:17:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 80%|███████▉ | 9877/12384 [20:57:39<5:17:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 80%|███████▉ | 9878/12384 [20:57:39<5:17:33, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 80%|███████▉ | 9878/12384 [20:57:46<5:17:33, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.54s]
Epoch 0: 80%|███████▉ | 9879/12384 [20:57:46<5:17:29, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.54s]
Epoch 0: 80%|███████▉ | 9879/12384 [20:57:54<5:17:29, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.05s]
Epoch 0: 80%|███████▉ | 9880/12384 [20:57:54<5:17:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.05s]
Epoch 0: 80%|███████▉ | 9880/12384 [20:58:02<5:17:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.92s]
Epoch 0: 80%|███████▉ | 9881/12384 [20:58:02<5:17:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.92s]
Epoch 0: 80%|███████▉ | 9881/12384 [20:58:09<5:17:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 0: 80%|███████▉ | 9882/12384 [20:58:09<5:17:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 0: 80%|███████▉ | 9882/12384 [20:58:17<5:17:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.99s]
Epoch 0: 80%|███████▉ | 9883/12384 [20:58:17<5:17:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.99s]
Epoch 0: 80%|███████▉ | 9883/12384 [20:58:24<5:17:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 80%|███████▉ | 9884/12384 [20:58:24<5:17:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 80%|███████▉ | 9884/12384 [20:58:32<5:17:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 80%|███████▉ | 9885/12384 [20:58:32<5:17:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 80%|███████▉ | 9885/12384 [20:58:40<5:17:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 0: 80%|███████▉ | 9886/12384 [20:58:40<5:17:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 0: 80%|███████▉ | 9886/12384 [20:58:47<5:17:12, 7.62s/it, loss=0.0006, acc=0.9968, iter_time=8.82s]
Epoch 0: 80%|███████▉ | 9887/12384 [20:58:47<5:16:58, 7.62s/it, loss=0.0006, acc=0.9968, iter_time=8.82s]
Epoch 0: 80%|███████▉ | 9887/12384 [20:58:55<5:16:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.76s]
Epoch 0: 80%|███████▉ | 9888/12384 [20:58:55<5:16:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.76s]
Epoch 0: 80%|███████▉ | 9888/12384 [20:59:02<5:16:58, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=6.55s]
Epoch 0: 80%|███████▉ | 9889/12384 [20:59:02<5:16:29, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=6.55s]
Epoch 0: 80%|███████▉ | 9889/12384 [20:59:10<5:16:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 0: 80%|███████▉ | 9890/12384 [20:59:10<5:17:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 0: 80%|███████▉ | 9890/12384 [20:59:18<5:17:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 0: 80%|███████▉ | 9891/12384 [20:59:18<5:17:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 0: 80%|███████▉ | 9891/12384 [20:59:25<5:17:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 0: 80%|███████▉ | 9892/12384 [20:59:25<5:16:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 0: 80%|███████▉ | 9892/12384 [20:59:33<5:16:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 0: 80%|███████▉ | 9893/12384 [20:59:33<5:20:27, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 0: 80%|███████▉ | 9893/12384 [20:59:41<5:20:27, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 80%|███████▉ | 9894/12384 [20:59:41<5:18:55, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 80%|███████▉ | 9894/12384 [20:59:49<5:18:55, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 0: 80%|███████▉ | 9895/12384 [20:59:49<5:17:52, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 0: 80%|███████▉ | 9895/12384 [20:59:56<5:17:52, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.31s]
Epoch 0: 80%|███████▉ | 9896/12384 [20:59:56<5:16:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.31s]
Epoch 0: 80%|███████▉ | 9896/12384 [21:00:04<5:16:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 80%|███████▉ | 9897/12384 [21:00:04<5:16:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 80%|███████▉ | 9897/12384 [21:00:12<5:16:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 0: 80%|███████▉ | 9898/12384 [21:00:12<5:20:18, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 0: 80%|███████▉ | 9898/12384 [21:00:19<5:20:18, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 80%|███████▉ | 9899/12384 [21:00:19<5:18:41, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 80%|███████▉ | 9899/12384 [21:00:27<5:18:41, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 80%|███████▉ | 9900/12384 [21:00:27<5:17:39, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 80%|███████▉ | 9900/12384 [21:00:35<5:17:39, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=3.24s]
Epoch 0: 80%|███████▉ | 9901/12384 [21:00:35<5:16:55, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=3.24s]
Epoch 0: 80%|███████▉ | 9901/12384 [21:00:42<5:16:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=11.59s]
Epoch 0: 80%|███████▉ | 9902/12384 [21:00:42<5:16:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.59s]
Epoch 0: 80%|███████▉ | 9902/12384 [21:00:50<5:16:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 80%|███████▉ | 9903/12384 [21:00:50<5:15:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 80%|███████▉ | 9903/12384 [21:00:57<5:15:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 80%|███████▉ | 9904/12384 [21:00:57<5:15:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 80%|███████▉ | 9904/12384 [21:01:05<5:15:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.12s]
Epoch 0: 80%|███████▉ | 9905/12384 [21:01:05<5:14:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.12s]
Epoch 0: 80%|███████▉ | 9905/12384 [21:01:13<5:14:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 0: 80%|███████▉ | 9906/12384 [21:01:13<5:14:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 0: 80%|███████▉ | 9906/12384 [21:01:20<5:14:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 80%|███████▉ | 9907/12384 [21:01:20<5:14:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 80%|███████▉ | 9907/12384 [21:01:28<5:14:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 80%|████████ | 9908/12384 [21:01:28<5:14:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 80%|████████ | 9908/12384 [21:01:35<5:14:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 80%|████████ | 9909/12384 [21:01:35<5:13:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 80%|████████ | 9909/12384 [21:01:43<5:13:57, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=5.27s]
Epoch 0: 80%|████████ | 9910/12384 [21:01:43<5:13:43, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=5.27s]
Epoch 0: 80%|████████ | 9910/12384 [21:01:51<5:13:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 0: 80%|████████ | 9911/12384 [21:01:51<5:13:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 0: 80%|████████ | 9911/12384 [21:01:58<5:13:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 80%|████████ | 9912/12384 [21:01:58<5:13:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 80%|████████ | 9912/12384 [21:02:06<5:13:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 80%|████████ | 9913/12384 [21:02:06<5:13:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 80%|████████ | 9913/12384 [21:02:14<5:13:41, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=7.63s]
Epoch 0: 80%|████████ | 9914/12384 [21:02:14<5:13:27, 7.61s/it, loss=0.0002, acc=0.9998, iter_time=7.63s]
Epoch 0: 80%|████████ | 9914/12384 [21:02:21<5:13:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 80%|████████ | 9915/12384 [21:02:21<5:13:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 80%|████████ | 9915/12384 [21:02:29<5:13:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 80%|████████ | 9916/12384 [21:02:29<5:13:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 80%|████████ | 9916/12384 [21:02:36<5:13:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 80%|████████ | 9917/12384 [21:02:36<5:13:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 80%|████████ | 9917/12384 [21:02:44<5:13:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 80%|████████ | 9918/12384 [21:02:44<5:12:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 80%|████████ | 9918/12384 [21:02:52<5:12:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 80%|████████ | 9919/12384 [21:02:52<5:16:43, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 80%|████████ | 9919/12384 [21:03:00<5:16:43, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.39s]
Epoch 0: 80%|████████ | 9920/12384 [21:03:00<5:16:27, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.39s]
Epoch 0: 80%|████████ | 9920/12384 [21:03:07<5:16:27, 7.71s/it, loss=0.0003, acc=0.9977, iter_time=5.68s]
Epoch 0: 80%|████████ | 9921/12384 [21:03:07<5:14:59, 7.67s/it, loss=0.0003, acc=0.9977, iter_time=5.68s]
Epoch 0: 80%|████████ | 9921/12384 [21:03:15<5:14:59, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 80%|████████ | 9922/12384 [21:03:15<5:14:50, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 80%|████████ | 9922/12384 [21:03:23<5:14:50, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 0: 80%|████████ | 9923/12384 [21:03:23<5:14:15, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 0: 80%|████████ | 9923/12384 [21:03:30<5:14:15, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 0: 80%|████████ | 9924/12384 [21:03:30<5:13:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 0: 80%|████████ | 9924/12384 [21:03:38<5:13:43, 7.65s/it, loss=0.0009, acc=0.9989, iter_time=9.96s]
Epoch 0: 80%|████████ | 9925/12384 [21:03:38<5:13:11, 7.64s/it, loss=0.0009, acc=0.9989, iter_time=9.96s]
Epoch 0: 80%|████████ | 9925/12384 [21:03:45<5:13:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 0: 80%|████████ | 9926/12384 [21:03:45<5:12:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 0: 80%|████████ | 9926/12384 [21:03:53<5:12:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 0: 80%|████████ | 9927/12384 [21:03:53<5:12:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 0: 80%|████████ | 9927/12384 [21:04:01<5:12:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 80%|████████ | 9928/12384 [21:04:01<5:12:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 80%|████████ | 9928/12384 [21:04:08<5:12:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.15s]
Epoch 0: 80%|████████ | 9929/12384 [21:04:08<5:11:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.15s]
Epoch 0: 80%|████████ | 9929/12384 [21:04:16<5:11:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 0: 80%|████████ | 9930/12384 [21:04:16<5:11:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 0: 80%|████████ | 9930/12384 [21:04:23<5:11:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 0: 80%|████████ | 9931/12384 [21:04:23<5:11:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 0: 80%|████████ | 9931/12384 [21:04:31<5:11:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 80%|████████ | 9932/12384 [21:04:31<5:11:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 80%|████████ | 9932/12384 [21:04:39<5:11:12, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 80%|████████ | 9933/12384 [21:04:39<5:11:07, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 80%|████████ | 9933/12384 [21:04:46<5:11:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 80%|████████ | 9934/12384 [21:04:46<5:11:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 80%|████████ | 9934/12384 [21:04:54<5:11:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 0: 80%|████████ | 9935/12384 [21:04:54<5:11:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 0: 80%|████████ | 9935/12384 [21:05:02<5:11:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 80%|████████ | 9936/12384 [21:05:02<5:11:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 80%|████████ | 9936/12384 [21:05:09<5:11:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 0: 80%|████████ | 9937/12384 [21:05:09<5:10:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 0: 80%|████████ | 9937/12384 [21:05:17<5:10:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 0: 80%|████████ | 9938/12384 [21:05:17<5:10:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 0: 80%|████████ | 9938/12384 [21:05:24<5:10:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 0: 80%|████████ | 9939/12384 [21:05:24<5:10:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 0: 80%|████████ | 9939/12384 [21:05:32<5:10:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.24s]
Epoch 0: 80%|████████ | 9940/12384 [21:05:32<5:11:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.24s]
Epoch 0: 80%|████████ | 9940/12384 [21:05:40<5:11:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 80%|████████ | 9941/12384 [21:05:40<5:10:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 80%|████████ | 9941/12384 [21:05:47<5:10:38, 7.63s/it, loss=0.0000, acc=0.9998, iter_time=5.86s]
Epoch 0: 80%|████████ | 9942/12384 [21:05:47<5:10:18, 7.62s/it, loss=0.0000, acc=0.9998, iter_time=5.86s]
Epoch 0: 80%|████████ | 9942/12384 [21:05:55<5:10:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 0: 80%|████████ | 9943/12384 [21:05:55<5:10:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 0: 80%|████████ | 9943/12384 [21:06:03<5:10:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 0: 80%|████████ | 9944/12384 [21:06:03<5:09:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 0: 80%|████████ | 9944/12384 [21:06:10<5:09:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 0: 80%|████████ | 9945/12384 [21:06:10<5:13:37, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 0: 80%|████████ | 9945/12384 [21:06:18<5:13:37, 7.72s/it, loss=0.0002, acc=1.0000, iter_time=7.87s]
Epoch 0: 80%|████████ | 9946/12384 [21:06:18<5:12:19, 7.69s/it, loss=0.0002, acc=1.0000, iter_time=7.87s]
Epoch 0: 80%|████████ | 9946/12384 [21:06:26<5:12:19, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 0: 80%|████████ | 9947/12384 [21:06:26<5:11:20, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 0: 80%|████████ | 9947/12384 [21:06:33<5:11:20, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.42s]
Epoch 0: 80%|████████ | 9948/12384 [21:06:33<5:10:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.42s]
Epoch 0: 80%|████████ | 9948/12384 [21:06:41<5:10:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.35s]
Epoch 0: 80%|████████ | 9949/12384 [21:06:41<5:09:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.35s]
Epoch 0: 80%|████████ | 9949/12384 [21:06:49<5:09:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 80%|████████ | 9950/12384 [21:06:49<5:09:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 80%|████████ | 9950/12384 [21:06:56<5:09:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 0: 80%|████████ | 9951/12384 [21:06:56<5:12:49, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 0: 80%|████████ | 9951/12384 [21:07:04<5:12:49, 7.71s/it, loss=0.0003, acc=1.0000, iter_time=7.97s]
Epoch 0: 80%|████████ | 9952/12384 [21:07:04<5:11:09, 7.68s/it, loss=0.0003, acc=1.0000, iter_time=7.97s]
Epoch 0: 80%|████████ | 9952/12384 [21:07:12<5:11:09, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 80%|████████ | 9953/12384 [21:07:12<5:10:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 80%|████████ | 9953/12384 [21:07:19<5:10:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 80%|████████ | 9954/12384 [21:07:19<5:09:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 80%|████████ | 9954/12384 [21:07:27<5:09:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 80%|████████ | 9955/12384 [21:07:27<5:08:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 80%|████████ | 9955/12384 [21:07:34<5:08:48, 7.63s/it, loss=0.0005, acc=0.9978, iter_time=7.60s]
Epoch 0: 80%|████████ | 9956/12384 [21:07:34<5:08:25, 7.62s/it, loss=0.0005, acc=0.9978, iter_time=7.60s]
Epoch 0: 80%|████████ | 9956/12384 [21:07:42<5:08:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 0: 80%|████████ | 9957/12384 [21:07:42<5:08:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 0: 80%|████████ | 9957/12384 [21:07:50<5:08:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 0: 80%|████████ | 9958/12384 [21:07:50<5:09:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 0: 80%|████████ | 9958/12384 [21:07:57<5:09:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 0: 80%|████████ | 9959/12384 [21:07:57<5:08:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 0: 80%|████████ | 9959/12384 [21:08:05<5:08:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 80%|████████ | 9960/12384 [21:08:05<5:08:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 80%|████████ | 9960/12384 [21:08:13<5:08:02, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.87s]
Epoch 0: 80%|████████ | 9961/12384 [21:08:13<5:07:31, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.87s]
Epoch 0: 80%|████████ | 9961/12384 [21:08:20<5:07:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 0: 80%|████████ | 9962/12384 [21:08:20<5:07:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 0: 80%|████████ | 9962/12384 [21:08:28<5:07:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 0: 80%|████████ | 9963/12384 [21:08:28<5:07:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 0: 80%|████████ | 9963/12384 [21:08:35<5:07:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 0: 80%|████████ | 9964/12384 [21:08:35<5:07:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 0: 80%|████████ | 9964/12384 [21:08:43<5:07:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 80%|████████ | 9965/12384 [21:08:43<5:07:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 80%|████████ | 9965/12384 [21:08:51<5:07:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.19s]
Epoch 0: 80%|████████ | 9966/12384 [21:08:51<5:07:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.19s]
Epoch 0: 80%|████████ | 9966/12384 [21:08:58<5:07:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.15s]
Epoch 0: 80%|████████ | 9967/12384 [21:08:58<5:06:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.15s]
Epoch 0: 80%|████████ | 9967/12384 [21:09:06<5:06:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 0: 80%|████████ | 9968/12384 [21:09:06<5:06:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 0: 80%|████████ | 9968/12384 [21:09:14<5:06:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 0: 80%|████████ | 9969/12384 [21:09:14<5:06:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 0: 80%|████████ | 9969/12384 [21:09:21<5:06:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.05s]
Epoch 0: 81%|████████ | 9970/12384 [21:09:21<5:06:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.05s]
Epoch 0: 81%|████████ | 9970/12384 [21:09:29<5:06:24, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.14s]
Epoch 0: 81%|████████ | 9971/12384 [21:09:29<5:10:09, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=10.14s]
Epoch 0: 81%|████████ | 9971/12384 [21:09:37<5:10:09, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 0: 81%|████████ | 9972/12384 [21:09:37<5:09:13, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 0: 81%|████████ | 9972/12384 [21:09:44<5:09:13, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 0: 81%|████████ | 9973/12384 [21:09:44<5:08:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 0: 81%|████████ | 9973/12384 [21:09:52<5:08:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 0: 81%|████████ | 9974/12384 [21:09:52<5:07:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 0: 81%|████████ | 9974/12384 [21:10:00<5:07:20, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=9.15s]
Epoch 0: 81%|████████ | 9975/12384 [21:10:00<5:06:59, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=9.15s]
Epoch 0: 81%|████████ | 9975/12384 [21:10:07<5:06:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.12s]
Epoch 0: 81%|████████ | 9976/12384 [21:10:07<5:06:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.12s]
Epoch 0: 81%|████████ | 9976/12384 [21:10:15<5:06:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 0: 81%|████████ | 9977/12384 [21:10:15<5:09:24, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 0: 81%|████████ | 9977/12384 [21:10:23<5:09:24, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 0: 81%|████████ | 9978/12384 [21:10:23<5:08:09, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 0: 81%|████████ | 9978/12384 [21:10:30<5:08:09, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.41s]
Epoch 0: 81%|████████ | 9979/12384 [21:10:30<5:06:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.41s]
Epoch 0: 81%|████████ | 9979/12384 [21:10:38<5:06:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.62s]
Epoch 0: 81%|████████ | 9980/12384 [21:10:38<5:06:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.62s]
Epoch 0: 81%|████████ | 9980/12384 [21:10:45<5:06:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 0: 81%|████████ | 9981/12384 [21:10:45<5:05:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 0: 81%|████████ | 9981/12384 [21:10:53<5:05:23, 7.63s/it, loss=0.0005, acc=0.9985, iter_time=7.59s]
Epoch 0: 81%|████████ | 9982/12384 [21:10:53<5:04:59, 7.62s/it, loss=0.0005, acc=0.9985, iter_time=7.59s]
Epoch 0: 81%|████████ | 9982/12384 [21:11:01<5:04:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 0: 81%|████████ | 9983/12384 [21:11:01<5:04:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 0: 81%|████████ | 9983/12384 [21:11:08<5:04:27, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.14s]
Epoch 0: 81%|████████ | 9984/12384 [21:11:08<5:04:35, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.14s]
Epoch 0: 81%|████████ | 9984/12384 [21:11:16<5:04:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 0: 81%|████████ | 9985/12384 [21:11:16<5:04:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 0: 81%|████████ | 9985/12384 [21:11:24<5:04:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 0: 81%|████████ | 9986/12384 [21:11:24<5:04:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 0: 81%|████████ | 9986/12384 [21:11:31<5:04:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 81%|████████ | 9987/12384 [21:11:31<5:04:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 81%|████████ | 9987/12384 [21:11:39<5:04:08, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.85s]
Epoch 0: 81%|████████ | 9988/12384 [21:11:39<5:04:59, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=5.85s]
Epoch 0: 81%|████████ | 9988/12384 [21:11:46<5:04:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 0: 81%|████████ | 9989/12384 [21:11:46<5:04:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 0: 81%|████████ | 9989/12384 [21:11:54<5:04:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 0: 81%|████████ | 9990/12384 [21:11:54<5:04:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 0: 81%|████████ | 9990/12384 [21:12:02<5:04:07, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.73s]
Epoch 0: 81%|████████ | 9991/12384 [21:12:02<5:04:01, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.73s]
Epoch 0: 81%|████████ | 9991/12384 [21:12:09<5:04:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 81%|████████ | 9992/12384 [21:12:09<5:03:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 81%|████████ | 9992/12384 [21:12:17<5:03:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 81%|████████ | 9993/12384 [21:12:17<5:03:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 81%|████████ | 9993/12384 [21:12:25<5:03:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 81%|████████ | 9994/12384 [21:12:25<5:03:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 81%|████████ | 9994/12384 [21:12:32<5:03:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.00s]
Epoch 0: 81%|████████ | 9995/12384 [21:12:32<5:03:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.00s]
Epoch 0: 81%|████████ | 9995/12384 [21:12:40<5:03:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 0: 81%|████████ | 9996/12384 [21:12:40<5:02:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 0: 81%|████████ | 9996/12384 [21:12:48<5:02:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 81%|████████ | 9997/12384 [21:12:48<5:06:08, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 81%|████████ | 9997/12384 [21:12:55<5:06:08, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 0: 81%|████████ | 9998/12384 [21:12:55<5:06:09, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 0: 81%|████████ | 9998/12384 [21:13:03<5:06:09, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=8.17s]
Epoch 0: 81%|████████ | 9999/12384 [21:13:03<5:05:12, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=8.17s]
Epoch 0: 81%|████████ | 9999/12384 [21:13:11<5:05:12, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.36s]
Epoch 0: 81%|████████ | 10000/12384 [21:13:11<5:06:45, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.36s]
Epoch 0: 81%|████████ | 10000/12384 [21:13:18<5:06:45, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 0: 81%|████████ | 10001/12384 [21:13:18<5:05:24, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 0: 81%|████████ | 10001/12384 [21:13:26<5:05:24, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 81%|████████ | 10002/12384 [21:13:26<5:04:27, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 81%|████████ | 10002/12384 [21:13:34<5:04:27, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 0: 81%|████████ | 10003/12384 [21:13:34<5:03:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 0: 81%|████████ | 10003/12384 [21:13:41<5:03:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 81%|████████ | 10004/12384 [21:13:41<5:03:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 81%|████████ | 10004/12384 [21:13:49<5:03:01, 7.64s/it, loss=0.0012, acc=0.9989, iter_time=10.20s]
Epoch 0: 81%|████████ | 10005/12384 [21:13:49<5:02:27, 7.63s/it, loss=0.0012, acc=0.9989, iter_time=10.20s]
Epoch 0: 81%|████████ | 10005/12384 [21:13:56<5:02:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 81%|████████ | 10006/12384 [21:13:56<5:02:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 81%|████████ | 10006/12384 [21:14:04<5:02:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 81%|████████ | 10007/12384 [21:14:04<5:03:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 81%|████████ | 10007/12384 [21:14:12<5:03:03, 7.65s/it, loss=0.0002, acc=0.9992, iter_time=7.99s]
Epoch 0: 81%|████████ | 10008/12384 [21:14:12<5:02:53, 7.65s/it, loss=0.0002, acc=0.9992, iter_time=7.99s]
Epoch 0: 81%|████████ | 10008/12384 [21:14:19<5:02:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 0: 81%|████████ | 10009/12384 [21:14:19<5:03:07, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 0: 81%|████████ | 10009/12384 [21:14:27<5:03:07, 7.66s/it, loss=0.0004, acc=0.9986, iter_time=10.46s]
Epoch 0: 81%|████████ | 10010/12384 [21:14:27<5:02:21, 7.64s/it, loss=0.0004, acc=0.9986, iter_time=10.46s]
Epoch 0: 81%|████████ | 10010/12384 [21:14:35<5:02:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 81%|████████ | 10011/12384 [21:14:35<5:01:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 81%|████████ | 10011/12384 [21:14:42<5:01:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 0: 81%|████████ | 10012/12384 [21:14:42<5:01:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 0: 81%|████████ | 10012/12384 [21:14:50<5:01:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.63s]
Epoch 0: 81%|████████ | 10013/12384 [21:14:50<5:01:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.63s]
Epoch 0: 81%|████████ | 10013/12384 [21:14:58<5:01:45, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=10.52s]
Epoch 0: 81%|████████ | 10014/12384 [21:14:58<5:01:32, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=10.52s]
Epoch 0: 81%|████████ | 10014/12384 [21:15:05<5:01:32, 7.63s/it, loss=0.0004, acc=0.9981, iter_time=7.63s]
Epoch 0: 81%|████████ | 10015/12384 [21:15:05<5:01:23, 7.63s/it, loss=0.0004, acc=0.9981, iter_time=7.63s]
Epoch 0: 81%|████████ | 10015/12384 [21:15:13<5:01:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 81%|████████ | 10016/12384 [21:15:13<5:00:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 81%|████████ | 10016/12384 [21:15:20<5:00:52, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.05s]
Epoch 0: 81%|████████ | 10017/12384 [21:15:20<5:00:40, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.05s]
Epoch 0: 81%|████████ | 10017/12384 [21:15:28<5:00:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 0: 81%|████████ | 10018/12384 [21:15:28<5:00:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 0: 81%|████████ | 10018/12384 [21:15:36<5:00:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 81%|████████ | 10019/12384 [21:15:36<5:01:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 81%|████████ | 10019/12384 [21:15:43<5:01:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 0: 81%|████████ | 10020/12384 [21:15:43<5:00:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 0: 81%|████████ | 10020/12384 [21:15:51<5:00:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 81%|████████ | 10021/12384 [21:15:51<5:00:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 81%|████████ | 10021/12384 [21:15:59<5:00:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.86s]
Epoch 0: 81%|████████ | 10022/12384 [21:15:59<4:59:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.86s]
Epoch 0: 81%|████████ | 10022/12384 [21:16:06<4:59:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.33s]
Epoch 0: 81%|████████ | 10023/12384 [21:16:06<4:59:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.33s]
Epoch 0: 81%|████████ | 10023/12384 [21:16:14<4:59:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 0: 81%|████████ | 10024/12384 [21:16:14<5:02:27, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 0: 81%|████████ | 10024/12384 [21:16:22<5:02:27, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.41s]
Epoch 0: 81%|████████ | 10025/12384 [21:16:22<5:01:19, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.41s]
Epoch 0: 81%|████████ | 10025/12384 [21:16:29<5:01:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 0: 81%|████████ | 10026/12384 [21:16:29<5:00:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 0: 81%|████████ | 10026/12384 [21:16:37<5:00:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 0: 81%|████████ | 10027/12384 [21:16:37<4:59:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 0: 81%|████████ | 10027/12384 [21:16:44<4:59:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 81%|████████ | 10028/12384 [21:16:44<4:59:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 81%|████████ | 10028/12384 [21:16:52<4:59:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 81%|████████ | 10029/12384 [21:16:52<4:58:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 81%|████████ | 10029/12384 [21:17:00<4:58:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.89s]
Epoch 0: 81%|████████ | 10030/12384 [21:17:00<4:58:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.89s]
Epoch 0: 81%|████████ | 10030/12384 [21:17:07<4:58:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 0: 81%|████████ | 10031/12384 [21:17:07<4:59:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 0: 81%|████████ | 10031/12384 [21:17:15<4:59:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 0: 81%|████████ | 10032/12384 [21:17:15<4:59:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 0: 81%|████████ | 10032/12384 [21:17:23<4:59:36, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.25s]
Epoch 0: 81%|████████ | 10033/12384 [21:17:23<4:59:07, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.25s]
Epoch 0: 81%|████████ | 10033/12384 [21:17:30<4:59:07, 7.63s/it, loss=0.0023, acc=0.9931, iter_time=5.01s]
Epoch 0: 81%|████████ | 10034/12384 [21:17:30<4:58:52, 7.63s/it, loss=0.0023, acc=0.9931, iter_time=5.01s]
Epoch 0: 81%|████████ | 10034/12384 [21:17:38<4:58:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 0: 81%|████████ | 10035/12384 [21:17:38<4:58:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 0: 81%|████████ | 10035/12384 [21:17:46<4:58:43, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 81%|████████ | 10036/12384 [21:17:46<4:58:22, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 81%|████████ | 10036/12384 [21:17:53<4:58:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 0: 81%|████████ | 10037/12384 [21:17:53<4:57:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 0: 81%|████████ | 10037/12384 [21:18:01<4:57:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 0: 81%|████████ | 10038/12384 [21:18:01<4:57:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 0: 81%|████████ | 10038/12384 [21:18:08<4:57:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 0: 81%|████████ | 10039/12384 [21:18:08<4:57:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 0: 81%|████████ | 10039/12384 [21:18:16<4:57:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 0: 81%|████████ | 10040/12384 [21:18:16<4:57:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 0: 81%|████████ | 10040/12384 [21:18:24<4:57:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.29s]
Epoch 0: 81%|████████ | 10041/12384 [21:18:24<4:57:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.29s]
Epoch 0: 81%|████████ | 10041/12384 [21:18:31<4:57:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.91s]
Epoch 0: 81%|████████ | 10042/12384 [21:18:31<4:57:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.91s]
Epoch 0: 81%|████████ | 10042/12384 [21:18:39<4:57:18, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.66s]
Epoch 0: 81%|████████ | 10043/12384 [21:18:39<4:57:11, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.66s]
Epoch 0: 81%|████████ | 10043/12384 [21:18:46<4:57:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 81%|████████ | 10044/12384 [21:18:46<4:56:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 81%|████████ | 10044/12384 [21:18:54<4:56:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 81%|████████ | 10045/12384 [21:18:54<4:56:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 81%|████████ | 10045/12384 [21:19:02<4:56:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 81%|████████ | 10046/12384 [21:19:02<4:56:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 81%|████████ | 10046/12384 [21:19:09<4:56:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 81%|████████ | 10047/12384 [21:19:09<4:57:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 81%|████████ | 10047/12384 [21:19:17<4:57:29, 7.64s/it, loss=0.0038, acc=0.9917, iter_time=8.09s]
Epoch 0: 81%|████████ | 10048/12384 [21:19:17<4:56:54, 7.63s/it, loss=0.0038, acc=0.9917, iter_time=8.09s]
Epoch 0: 81%|████████ | 10048/12384 [21:19:25<4:56:54, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.20s]
Epoch 0: 81%|████████ | 10049/12384 [21:19:25<4:57:39, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.20s]
Epoch 0: 81%|████████ | 10049/12384 [21:19:33<4:57:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.44s]
Epoch 0: 81%|████████ | 10050/12384 [21:19:33<5:00:54, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.44s]
Epoch 0: 81%|████████ | 10050/12384 [21:19:40<5:00:54, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 81%|████████ | 10051/12384 [21:19:40<4:59:20, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 81%|████████ | 10051/12384 [21:19:48<4:59:20, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 81%|████████ | 10052/12384 [21:19:48<4:58:20, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 81%|████████ | 10052/12384 [21:19:55<4:58:20, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 81%|████████ | 10053/12384 [21:19:55<4:57:34, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 81%|████████ | 10053/12384 [21:20:03<4:57:34, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 81%|████████ | 10054/12384 [21:20:03<4:56:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 81%|████████ | 10054/12384 [21:20:11<4:56:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 81%|████████ | 10055/12384 [21:20:11<4:56:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 81%|████████ | 10055/12384 [21:20:18<4:56:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 81%|████████ | 10056/12384 [21:20:18<4:55:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 81%|████████ | 10056/12384 [21:20:26<4:55:59, 7.63s/it, loss=0.0003, acc=0.9999, iter_time=7.51s]
Epoch 0: 81%|████████ | 10057/12384 [21:20:26<4:58:48, 7.70s/it, loss=0.0003, acc=0.9999, iter_time=7.51s]
Epoch 0: 81%|████████ | 10057/12384 [21:20:34<4:58:48, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 81%|████████ | 10058/12384 [21:20:34<4:57:36, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 81%|████████ | 10058/12384 [21:20:41<4:57:36, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 81%|████████ | 10059/12384 [21:20:41<4:56:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 81%|████████ | 10059/12384 [21:20:49<4:56:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.25s]
Epoch 0: 81%|████████ | 10060/12384 [21:20:49<4:56:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.25s]
Epoch 0: 81%|████████ | 10060/12384 [21:20:57<4:56:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 0: 81%|████████ | 10061/12384 [21:20:57<4:55:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 0: 81%|████████ | 10061/12384 [21:21:04<4:55:30, 7.63s/it, loss=0.0013, acc=0.9976, iter_time=4.59s]
Epoch 0: 81%|████████▏ | 10062/12384 [21:21:04<4:55:14, 7.63s/it, loss=0.0013, acc=0.9976, iter_time=4.59s]
Epoch 0: 81%|████████▏ | 10062/12384 [21:21:12<4:55:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.50s]
Epoch 0: 81%|████████▏ | 10063/12384 [21:21:12<4:55:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.50s]
Epoch 0: 81%|████████▏ | 10063/12384 [21:21:19<4:55:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 0: 81%|████████▏ | 10064/12384 [21:21:19<4:54:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 0: 81%|████████▏ | 10064/12384 [21:21:27<4:54:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 81%|████████▏ | 10065/12384 [21:21:27<4:54:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 81%|████████▏ | 10065/12384 [21:21:35<4:54:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 81%|████████▏ | 10066/12384 [21:21:35<4:54:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 81%|████████▏ | 10066/12384 [21:21:42<4:54:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 0: 81%|████████▏ | 10067/12384 [21:21:42<4:54:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 0: 81%|████████▏ | 10067/12384 [21:21:50<4:54:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 0: 81%|████████▏ | 10068/12384 [21:21:50<4:53:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 0: 81%|████████▏ | 10068/12384 [21:21:57<4:53:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.46s]
Epoch 0: 81%|████████▏ | 10069/12384 [21:21:57<4:53:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.46s]
Epoch 0: 81%|████████▏ | 10069/12384 [21:22:05<4:53:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 0: 81%|████████▏ | 10070/12384 [21:22:05<4:53:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 0: 81%|████████▏ | 10070/12384 [21:22:13<4:53:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 0: 81%|████████▏ | 10071/12384 [21:22:13<4:53:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 0: 81%|████████▏ | 10071/12384 [21:22:20<4:53:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 0: 81%|████████▏ | 10072/12384 [21:22:20<4:53:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 0: 81%|████████▏ | 10072/12384 [21:22:28<4:53:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 81%|████████▏ | 10073/12384 [21:22:28<4:53:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 81%|████████▏ | 10073/12384 [21:22:36<4:53:18, 7.62s/it, loss=0.0006, acc=0.9983, iter_time=7.07s]
Epoch 0: 81%|████████▏ | 10074/12384 [21:22:36<4:52:44, 7.60s/it, loss=0.0006, acc=0.9983, iter_time=7.07s]
Epoch 0: 81%|████████▏ | 10074/12384 [21:22:43<4:52:44, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 0: 81%|████████▏ | 10075/12384 [21:22:43<4:52:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 0: 81%|████████▏ | 10075/12384 [21:22:51<4:52:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.97s]
Epoch 0: 81%|████████▏ | 10076/12384 [21:22:51<4:53:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.97s]
Epoch 0: 81%|████████▏ | 10076/12384 [21:22:59<4:53:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 0: 81%|████████▏ | 10077/12384 [21:22:59<4:56:21, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 0: 81%|████████▏ | 10077/12384 [21:23:06<4:56:21, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.39s]
Epoch 0: 81%|████████▏ | 10078/12384 [21:23:06<4:55:04, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.39s]
Epoch 0: 81%|████████▏ | 10078/12384 [21:23:14<4:55:04, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 0: 81%|████████▏ | 10079/12384 [21:23:14<4:54:20, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 0: 81%|████████▏ | 10079/12384 [21:23:22<4:54:20, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 0: 81%|████████▏ | 10080/12384 [21:23:22<4:54:45, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 0: 81%|████████▏ | 10080/12384 [21:23:29<4:54:45, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 81%|████████▏ | 10081/12384 [21:23:29<4:53:52, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 81%|████████▏ | 10081/12384 [21:23:37<4:53:52, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 81%|████████▏ | 10082/12384 [21:23:37<4:53:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 81%|████████▏ | 10082/12384 [21:23:45<4:53:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 81%|████████▏ | 10083/12384 [21:23:45<4:55:57, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 81%|████████▏ | 10083/12384 [21:23:52<4:55:57, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 81%|████████▏ | 10084/12384 [21:23:52<4:54:29, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 81%|████████▏ | 10084/12384 [21:24:00<4:54:29, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.57s]
Epoch 0: 81%|████████▏ | 10085/12384 [21:24:00<4:53:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.57s]
Epoch 0: 81%|████████▏ | 10085/12384 [21:24:08<4:53:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 0: 81%|████████▏ | 10086/12384 [21:24:08<4:52:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 0: 81%|████████▏ | 10086/12384 [21:24:15<4:52:59, 7.65s/it, loss=0.0008, acc=0.9985, iter_time=9.71s]
Epoch 0: 81%|████████▏ | 10087/12384 [21:24:15<4:52:51, 7.65s/it, loss=0.0008, acc=0.9985, iter_time=9.71s]
Epoch 0: 81%|████████▏ | 10087/12384 [21:24:23<4:52:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 0: 81%|████████▏ | 10088/12384 [21:24:23<4:52:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 0: 81%|████████▏ | 10088/12384 [21:24:30<4:52:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 81%|████████▏ | 10089/12384 [21:24:30<4:51:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 81%|████████▏ | 10089/12384 [21:24:38<4:51:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 0: 81%|████████▏ | 10090/12384 [21:24:38<4:51:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 0: 81%|████████▏ | 10090/12384 [21:24:46<4:51:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 81%|████████▏ | 10091/12384 [21:24:46<4:51:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 81%|████████▏ | 10091/12384 [21:24:53<4:51:20, 7.62s/it, loss=0.0004, acc=0.9979, iter_time=9.11s]
Epoch 0: 81%|████████▏ | 10092/12384 [21:24:53<4:51:13, 7.62s/it, loss=0.0004, acc=0.9979, iter_time=9.11s]
Epoch 0: 81%|████████▏ | 10092/12384 [21:25:01<4:51:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 82%|████████▏ | 10093/12384 [21:25:01<4:50:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 82%|████████▏ | 10093/12384 [21:25:09<4:50:56, 7.62s/it, loss=0.0003, acc=0.9993, iter_time=7.59s]
Epoch 0: 82%|████████▏ | 10094/12384 [21:25:09<4:50:28, 7.61s/it, loss=0.0003, acc=0.9993, iter_time=7.59s]
Epoch 0: 82%|████████▏ | 10094/12384 [21:25:16<4:50:28, 7.61s/it, loss=0.0006, acc=0.9975, iter_time=7.60s]
Epoch 0: 82%|████████▏ | 10095/12384 [21:25:16<4:50:08, 7.61s/it, loss=0.0006, acc=0.9975, iter_time=7.60s]
Epoch 0: 82%|████████▏ | 10095/12384 [21:25:24<4:50:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 82%|████████▏ | 10096/12384 [21:25:24<4:50:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 82%|████████▏ | 10096/12384 [21:25:31<4:50:23, 7.62s/it, loss=0.0005, acc=0.9987, iter_time=7.66s]
Epoch 0: 82%|████████▏ | 10097/12384 [21:25:31<4:50:13, 7.61s/it, loss=0.0005, acc=0.9987, iter_time=7.66s]
Epoch 0: 82%|████████▏ | 10097/12384 [21:25:39<4:50:13, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.68s]
Epoch 0: 82%|████████▏ | 10098/12384 [21:25:39<4:50:34, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.68s]
Epoch 0: 82%|████████▏ | 10098/12384 [21:25:47<4:50:34, 7.63s/it, loss=0.0003, acc=0.9983, iter_time=7.60s]
Epoch 0: 82%|████████▏ | 10099/12384 [21:25:47<4:50:41, 7.63s/it, loss=0.0003, acc=0.9983, iter_time=7.60s]
Epoch 0: 82%|████████▏ | 10099/12384 [21:25:54<4:50:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 0: 82%|████████▏ | 10100/12384 [21:25:54<4:50:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 0: 82%|████████▏ | 10100/12384 [21:26:02<4:50:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 82%|████████▏ | 10101/12384 [21:26:02<4:50:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 82%|████████▏ | 10101/12384 [21:26:10<4:50:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 82%|████████▏ | 10102/12384 [21:26:10<4:49:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 82%|████████▏ | 10102/12384 [21:26:17<4:49:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 82%|████████▏ | 10103/12384 [21:26:17<4:53:26, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 82%|████████▏ | 10103/12384 [21:26:25<4:53:26, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 0: 82%|████████▏ | 10104/12384 [21:26:25<4:51:56, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 0: 82%|████████▏ | 10104/12384 [21:26:33<4:51:56, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 82%|████████▏ | 10105/12384 [21:26:33<4:51:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 82%|████████▏ | 10105/12384 [21:26:40<4:51:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 82%|████████▏ | 10106/12384 [21:26:40<4:50:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 82%|████████▏ | 10106/12384 [21:26:48<4:50:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 82%|████████▏ | 10107/12384 [21:26:48<4:49:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 82%|████████▏ | 10107/12384 [21:26:56<4:49:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 82%|████████▏ | 10108/12384 [21:26:56<4:49:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 82%|████████▏ | 10108/12384 [21:27:03<4:49:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 0: 82%|████████▏ | 10109/12384 [21:27:03<4:51:53, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 0: 82%|████████▏ | 10109/12384 [21:27:11<4:51:53, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 82%|████████▏ | 10110/12384 [21:27:11<4:50:38, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 82%|████████▏ | 10110/12384 [21:27:19<4:50:38, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 0: 82%|████████▏ | 10111/12384 [21:27:19<4:49:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 0: 82%|████████▏ | 10111/12384 [21:27:26<4:49:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 82%|████████▏ | 10112/12384 [21:27:26<4:49:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 82%|████████▏ | 10112/12384 [21:27:34<4:49:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 82%|████████▏ | 10113/12384 [21:27:34<4:48:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 82%|████████▏ | 10113/12384 [21:27:41<4:48:56, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.64s]
Epoch 0: 82%|████████▏ | 10114/12384 [21:27:41<4:48:28, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=7.64s]
Epoch 0: 82%|████████▏ | 10114/12384 [21:27:49<4:48:28, 7.62s/it, loss=0.0002, acc=0.9991, iter_time=7.59s]
Epoch 0: 82%|████████▏ | 10115/12384 [21:27:49<4:48:09, 7.62s/it, loss=0.0002, acc=0.9991, iter_time=7.59s]
Epoch 0: 82%|████████▏ | 10115/12384 [21:27:57<4:48:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 82%|████████▏ | 10116/12384 [21:27:57<4:47:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 82%|████████▏ | 10116/12384 [21:28:04<4:47:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 0: 82%|████████▏ | 10117/12384 [21:28:04<4:48:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 0: 82%|████████▏ | 10117/12384 [21:28:12<4:48:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 82%|████████▏ | 10118/12384 [21:28:12<4:48:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 82%|████████▏ | 10118/12384 [21:28:20<4:48:17, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.28s]
Epoch 0: 82%|████████▏ | 10119/12384 [21:28:20<4:48:24, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.28s]
Epoch 0: 82%|████████▏ | 10119/12384 [21:28:27<4:48:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 82%|████████▏ | 10120/12384 [21:28:27<4:48:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 82%|████████▏ | 10120/12384 [21:28:35<4:48:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 82%|████████▏ | 10121/12384 [21:28:35<4:47:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 82%|████████▏ | 10121/12384 [21:28:42<4:47:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 0: 82%|████████▏ | 10122/12384 [21:28:42<4:47:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 0: 82%|████████▏ | 10122/12384 [21:28:50<4:47:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 0: 82%|████████▏ | 10123/12384 [21:28:50<4:47:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 0: 82%|████████▏ | 10123/12384 [21:28:58<4:47:12, 7.62s/it, loss=0.0002, acc=0.9984, iter_time=7.32s]
Epoch 0: 82%|████████▏ | 10124/12384 [21:28:58<4:47:48, 7.64s/it, loss=0.0002, acc=0.9984, iter_time=7.32s]
Epoch 0: 82%|████████▏ | 10124/12384 [21:29:05<4:47:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 82%|████████▏ | 10125/12384 [21:29:05<4:47:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 82%|████████▏ | 10125/12384 [21:29:13<4:47:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.06s]
Epoch 0: 82%|████████▏ | 10126/12384 [21:29:13<4:46:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.06s]
Epoch 0: 82%|████████▏ | 10126/12384 [21:29:21<4:46:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 0: 82%|████████▏ | 10127/12384 [21:29:21<4:46:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 0: 82%|████████▏ | 10127/12384 [21:29:28<4:46:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 82%|████████▏ | 10128/12384 [21:29:28<4:46:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 82%|████████▏ | 10128/12384 [21:29:36<4:46:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 82%|████████▏ | 10129/12384 [21:29:36<4:50:20, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 82%|████████▏ | 10129/12384 [21:29:44<4:50:20, 7.73s/it, loss=0.0001, acc=1.0000, iter_time=4.79s]
Epoch 0: 82%|████████▏ | 10130/12384 [21:29:44<4:48:51, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=4.79s]
Epoch 0: 82%|████████▏ | 10130/12384 [21:29:51<4:48:51, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 0: 82%|████████▏ | 10131/12384 [21:29:51<4:47:43, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 0: 82%|████████▏ | 10131/12384 [21:29:59<4:47:43, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 82%|████████▏ | 10132/12384 [21:29:59<4:47:01, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 82%|████████▏ | 10132/12384 [21:30:07<4:47:01, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 82%|████████▏ | 10133/12384 [21:30:07<4:46:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 82%|████████▏ | 10133/12384 [21:30:14<4:46:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 0: 82%|████████▏ | 10134/12384 [21:30:14<4:43:14, 7.55s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 0: 82%|████████▏ | 10134/12384 [21:30:22<4:43:14, 7.55s/it, loss=0.0001, acc=1.0000, iter_time=8.62s]
Epoch 0: 82%|████████▏ | 10135/12384 [21:30:22<4:47:03, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=8.62s]
Epoch 0: 82%|████████▏ | 10135/12384 [21:30:29<4:47:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 82%|████████▏ | 10136/12384 [21:30:29<4:46:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 82%|████████▏ | 10136/12384 [21:30:37<4:46:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.44s]
Epoch 0: 82%|████████▏ | 10137/12384 [21:30:37<4:45:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.44s]
Epoch 0: 82%|████████▏ | 10137/12384 [21:30:45<4:45:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.84s]
Epoch 0: 82%|████████▏ | 10138/12384 [21:30:45<4:45:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.84s]
Epoch 0: 82%|████████▏ | 10138/12384 [21:30:52<4:45:35, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.82s]
Epoch 0: 82%|████████▏ | 10139/12384 [21:30:52<4:45:22, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.82s]
Epoch 0: 82%|████████▏ | 10139/12384 [21:31:00<4:45:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 0: 82%|████████▏ | 10140/12384 [21:31:00<4:45:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 0: 82%|████████▏ | 10140/12384 [21:31:08<4:45:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 82%|████████▏ | 10141/12384 [21:31:08<4:44:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 82%|████████▏ | 10141/12384 [21:31:15<4:44:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 82%|████████▏ | 10142/12384 [21:31:15<4:44:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 82%|████████▏ | 10142/12384 [21:31:23<4:44:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 82%|████████▏ | 10143/12384 [21:31:23<4:44:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 82%|████████▏ | 10143/12384 [21:31:30<4:44:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.95s]
Epoch 0: 82%|████████▏ | 10144/12384 [21:31:30<4:44:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.95s]
Epoch 0: 82%|████████▏ | 10144/12384 [21:31:38<4:44:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 82%|████████▏ | 10145/12384 [21:31:38<4:44:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 82%|████████▏ | 10145/12384 [21:31:46<4:44:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 82%|████████▏ | 10146/12384 [21:31:46<4:44:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 82%|████████▏ | 10146/12384 [21:31:53<4:44:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 82%|████████▏ | 10147/12384 [21:31:53<4:44:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 82%|████████▏ | 10147/12384 [21:32:01<4:44:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 82%|████████▏ | 10148/12384 [21:32:01<4:44:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 82%|████████▏ | 10148/12384 [21:32:09<4:44:09, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 82%|████████▏ | 10149/12384 [21:32:09<4:44:29, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 82%|████████▏ | 10149/12384 [21:32:16<4:44:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 0: 82%|████████▏ | 10150/12384 [21:32:16<4:44:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 0: 82%|████████▏ | 10150/12384 [21:32:24<4:44:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 82%|████████▏ | 10151/12384 [21:32:24<4:44:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 82%|████████▏ | 10151/12384 [21:32:31<4:44:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 0: 82%|████████▏ | 10152/12384 [21:32:31<4:43:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 0: 82%|████████▏ | 10152/12384 [21:32:39<4:43:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.94s]
Epoch 0: 82%|████████▏ | 10153/12384 [21:32:39<4:43:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.94s]
Epoch 0: 82%|████████▏ | 10153/12384 [21:32:47<4:43:35, 7.63s/it, loss=0.0001, acc=0.9996, iter_time=10.05s]
Epoch 0: 82%|████████▏ | 10154/12384 [21:32:47<4:45:04, 7.67s/it, loss=0.0001, acc=0.9996, iter_time=10.05s]
Epoch 0: 82%|████████▏ | 10154/12384 [21:32:55<4:45:04, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 82%|████████▏ | 10155/12384 [21:32:55<4:47:54, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 82%|████████▏ | 10155/12384 [21:33:02<4:47:54, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 0: 82%|████████▏ | 10156/12384 [21:33:02<4:46:38, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 0: 82%|████████▏ | 10156/12384 [21:33:10<4:46:38, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.48s]
Epoch 0: 82%|████████▏ | 10157/12384 [21:33:10<4:46:12, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.48s]
Epoch 0: 82%|████████▏ | 10157/12384 [21:33:18<4:46:12, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 82%|████████▏ | 10158/12384 [21:33:18<4:45:03, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 82%|████████▏ | 10158/12384 [21:33:25<4:45:03, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 82%|████████▏ | 10159/12384 [21:33:25<4:44:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 82%|████████▏ | 10159/12384 [21:33:33<4:44:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 0: 82%|████████▏ | 10160/12384 [21:33:33<4:43:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 0: 82%|████████▏ | 10160/12384 [21:33:41<4:43:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 0: 82%|████████▏ | 10161/12384 [21:33:41<4:45:50, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 0: 82%|████████▏ | 10161/12384 [21:33:48<4:45:50, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 82%|████████▏ | 10162/12384 [21:33:48<4:44:38, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 82%|████████▏ | 10162/12384 [21:33:56<4:44:38, 7.69s/it, loss=0.0001, acc=0.9991, iter_time=7.63s]
Epoch 0: 82%|████████▏ | 10163/12384 [21:33:56<4:43:55, 7.67s/it, loss=0.0001, acc=0.9991, iter_time=7.63s]
Epoch 0: 82%|████████▏ | 10163/12384 [21:34:04<4:43:55, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 82%|████████▏ | 10164/12384 [21:34:04<4:43:18, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 82%|████████▏ | 10164/12384 [21:34:11<4:43:18, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 82%|████████▏ | 10165/12384 [21:34:11<4:42:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 82%|████████▏ | 10165/12384 [21:34:19<4:42:47, 7.65s/it, loss=0.0003, acc=0.9994, iter_time=7.63s]
Epoch 0: 82%|████████▏ | 10166/12384 [21:34:19<4:42:21, 7.64s/it, loss=0.0003, acc=0.9994, iter_time=7.63s]
Epoch 0: 82%|████████▏ | 10166/12384 [21:34:27<4:42:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 82%|████████▏ | 10167/12384 [21:34:27<4:41:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 82%|████████▏ | 10167/12384 [21:34:34<4:41:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 82%|████████▏ | 10168/12384 [21:34:34<4:41:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 82%|████████▏ | 10168/12384 [21:34:42<4:41:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 0: 82%|████████▏ | 10169/12384 [21:34:42<4:41:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 0: 82%|████████▏ | 10169/12384 [21:34:49<4:41:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 0: 82%|████████▏ | 10170/12384 [21:34:49<4:41:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 0: 82%|████████▏ | 10170/12384 [21:34:57<4:41:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 0: 82%|████████▏ | 10171/12384 [21:34:57<4:40:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 0: 82%|████████▏ | 10171/12384 [21:35:05<4:40:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 82%|████████▏ | 10172/12384 [21:35:05<4:40:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 82%|████████▏ | 10172/12384 [21:35:12<4:40:37, 7.61s/it, loss=0.0003, acc=0.9986, iter_time=7.62s]
Epoch 0: 82%|████████▏ | 10173/12384 [21:35:12<4:40:35, 7.61s/it, loss=0.0003, acc=0.9986, iter_time=7.62s]
Epoch 0: 82%|████████▏ | 10173/12384 [21:35:20<4:40:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 82%|████████▏ | 10174/12384 [21:35:20<4:40:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 82%|████████▏ | 10174/12384 [21:35:27<4:40:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.10s]
Epoch 0: 82%|████████▏ | 10175/12384 [21:35:27<4:40:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.10s]
Epoch 0: 82%|████████▏ | 10175/12384 [21:35:35<4:40:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.51s]
Epoch 0: 82%|████████▏ | 10176/12384 [21:35:35<4:39:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.51s]
Epoch 0: 82%|████████▏ | 10176/12384 [21:35:43<4:39:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 82%|████████▏ | 10177/12384 [21:35:43<4:39:42, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 82%|████████▏ | 10177/12384 [21:35:50<4:39:42, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 82%|████████▏ | 10178/12384 [21:35:50<4:39:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 82%|████████▏ | 10178/12384 [21:35:58<4:39:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 0: 82%|████████▏ | 10179/12384 [21:35:58<4:40:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 0: 82%|████████▏ | 10179/12384 [21:36:06<4:40:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.66s]
Epoch 0: 82%|████████▏ | 10180/12384 [21:36:06<4:39:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.66s]
Epoch 0: 82%|████████▏ | 10180/12384 [21:36:13<4:39:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 0: 82%|████████▏ | 10181/12384 [21:36:13<4:43:23, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 0: 82%|████████▏ | 10181/12384 [21:36:21<4:43:23, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 82%|████████▏ | 10182/12384 [21:36:21<4:41:56, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 82%|████████▏ | 10182/12384 [21:36:29<4:41:56, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 0: 82%|████████▏ | 10183/12384 [21:36:29<4:40:53, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 0: 82%|████████▏ | 10183/12384 [21:36:36<4:40:53, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 0: 82%|████████▏ | 10184/12384 [21:36:36<4:39:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 0: 82%|████████▏ | 10184/12384 [21:36:44<4:39:55, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 82%|████████▏ | 10185/12384 [21:36:44<4:39:38, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 82%|████████▏ | 10185/12384 [21:36:51<4:39:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 0: 82%|████████▏ | 10186/12384 [21:36:51<4:39:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 0: 82%|████████▏ | 10186/12384 [21:36:59<4:39:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.19s]
Epoch 0: 82%|████████▏ | 10187/12384 [21:36:59<4:43:10, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=9.19s]
Epoch 0: 82%|████████▏ | 10187/12384 [21:37:07<4:43:10, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 82%|████████▏ | 10188/12384 [21:37:07<4:41:23, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 82%|████████▏ | 10188/12384 [21:37:15<4:41:23, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 82%|████████▏ | 10189/12384 [21:37:15<4:40:07, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 82%|████████▏ | 10189/12384 [21:37:22<4:40:07, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 82%|████████▏ | 10190/12384 [21:37:22<4:39:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 82%|████████▏ | 10190/12384 [21:37:30<4:39:48, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 82%|████████▏ | 10191/12384 [21:37:30<4:39:19, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 82%|████████▏ | 10191/12384 [21:37:38<4:39:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 82%|████████▏ | 10192/12384 [21:37:38<4:38:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 82%|████████▏ | 10192/12384 [21:37:45<4:38:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 82%|████████▏ | 10193/12384 [21:37:45<4:38:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 82%|████████▏ | 10193/12384 [21:37:53<4:38:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 0: 82%|████████▏ | 10194/12384 [21:37:53<4:37:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 0: 82%|████████▏ | 10194/12384 [21:38:00<4:37:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 0: 82%|████████▏ | 10195/12384 [21:38:00<4:37:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 0: 82%|████████▏ | 10195/12384 [21:38:08<4:37:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 0: 82%|████████▏ | 10196/12384 [21:38:08<4:37:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 0: 82%|████████▏ | 10196/12384 [21:38:16<4:37:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.82s]
Epoch 0: 82%|████████▏ | 10197/12384 [21:38:16<4:38:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.82s]
Epoch 0: 82%|████████▏ | 10197/12384 [21:38:23<4:38:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.78s]
Epoch 0: 82%|████████▏ | 10198/12384 [21:38:23<4:37:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.78s]
Epoch 0: 82%|████████▏ | 10198/12384 [21:38:31<4:37:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 0: 82%|████████▏ | 10199/12384 [21:38:31<4:37:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 0: 82%|████████▏ | 10199/12384 [21:38:39<4:37:45, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.00s]
Epoch 0: 82%|████████▏ | 10200/12384 [21:38:39<4:37:37, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.00s]
Epoch 0: 82%|████████▏ | 10200/12384 [21:38:46<4:37:37, 7.63s/it, loss=0.0001, acc=0.9995, iter_time=7.19s]
Epoch 0: 82%|████████▏ | 10201/12384 [21:38:46<4:37:20, 7.62s/it, loss=0.0001, acc=0.9995, iter_time=7.19s]
Epoch 0: 82%|████████▏ | 10201/12384 [21:38:54<4:37:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 82%|████████▏ | 10202/12384 [21:38:54<4:37:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 82%|████████▏ | 10202/12384 [21:39:01<4:37:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 82%|████████▏ | 10203/12384 [21:39:01<4:36:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 82%|████████▏ | 10203/12384 [21:39:09<4:36:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 0: 82%|████████▏ | 10204/12384 [21:39:09<4:36:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 0: 82%|████████▏ | 10204/12384 [21:39:17<4:36:28, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.12s]
Epoch 0: 82%|████████▏ | 10205/12384 [21:39:17<4:36:15, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.12s]
Epoch 0: 82%|████████▏ | 10205/12384 [21:39:24<4:36:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 82%|████████▏ | 10206/12384 [21:39:24<4:36:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 82%|████████▏ | 10206/12384 [21:39:32<4:36:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 82%|████████▏ | 10207/12384 [21:39:32<4:36:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 82%|████████▏ | 10207/12384 [21:39:40<4:36:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 82%|████████▏ | 10208/12384 [21:39:40<4:39:55, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 82%|████████▏ | 10208/12384 [21:39:47<4:39:55, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 82%|████████▏ | 10209/12384 [21:39:47<4:38:32, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 82%|████████▏ | 10209/12384 [21:39:55<4:38:32, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 0: 82%|████████▏ | 10210/12384 [21:39:55<4:37:38, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 0: 82%|████████▏ | 10210/12384 [21:40:03<4:37:38, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.93s]
Epoch 0: 82%|████████▏ | 10211/12384 [21:40:03<4:36:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.93s]
Epoch 0: 82%|████████▏ | 10211/12384 [21:40:10<4:36:49, 7.64s/it, loss=0.0002, acc=0.9997, iter_time=9.13s]
Epoch 0: 82%|████████▏ | 10212/12384 [21:40:10<4:37:24, 7.66s/it, loss=0.0002, acc=0.9997, iter_time=9.13s]
Epoch 0: 82%|████████▏ | 10212/12384 [21:40:18<4:37:24, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.70s]
Epoch 0: 82%|████████▏ | 10213/12384 [21:40:18<4:36:56, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.70s]
Epoch 0: 82%|████████▏ | 10213/12384 [21:40:26<4:36:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 82%|████████▏ | 10214/12384 [21:40:26<4:39:23, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 82%|████████▏ | 10214/12384 [21:40:33<4:39:23, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 82%|████████▏ | 10215/12384 [21:40:33<4:38:20, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 82%|████████▏ | 10215/12384 [21:40:41<4:38:20, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 82%|████████▏ | 10216/12384 [21:40:41<4:37:21, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 82%|████████▏ | 10216/12384 [21:40:49<4:37:21, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 83%|████████▎ | 10217/12384 [21:40:49<4:36:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 83%|████████▎ | 10217/12384 [21:40:56<4:36:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 83%|████████▎ | 10218/12384 [21:40:56<4:35:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 83%|████████▎ | 10218/12384 [21:41:04<4:35:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.29s]
Epoch 0: 83%|████████▎ | 10219/12384 [21:41:04<4:35:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.29s]
Epoch 0: 83%|████████▎ | 10219/12384 [21:41:11<4:35:23, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=8.13s]
Epoch 0: 83%|████████▎ | 10220/12384 [21:41:11<4:35:13, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=8.13s]
Epoch 0: 83%|████████▎ | 10220/12384 [21:41:19<4:35:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 0: 83%|████████▎ | 10221/12384 [21:41:19<4:34:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 0: 83%|████████▎ | 10221/12384 [21:41:27<4:34:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 0: 83%|████████▎ | 10222/12384 [21:41:27<4:34:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 0: 83%|████████▎ | 10222/12384 [21:41:34<4:34:29, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.73s]
Epoch 0: 83%|████████▎ | 10223/12384 [21:41:34<4:34:15, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.73s]
Epoch 0: 83%|████████▎ | 10223/12384 [21:41:42<4:34:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 83%|████████▎ | 10224/12384 [21:41:42<4:34:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 83%|████████▎ | 10224/12384 [21:41:50<4:34:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.62s]
Epoch 0: 83%|████████▎ | 10225/12384 [21:41:50<4:33:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.62s]
Epoch 0: 83%|████████▎ | 10225/12384 [21:41:57<4:33:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 0: 83%|████████▎ | 10226/12384 [21:41:57<4:34:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 0: 83%|████████▎ | 10226/12384 [21:42:05<4:34:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 0: 83%|████████▎ | 10227/12384 [21:42:05<4:33:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 0: 83%|████████▎ | 10227/12384 [21:42:12<4:33:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 0: 83%|████████▎ | 10228/12384 [21:42:12<4:33:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 0: 83%|████████▎ | 10228/12384 [21:42:20<4:33:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 0: 83%|████████▎ | 10229/12384 [21:42:20<4:33:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 0: 83%|████████▎ | 10229/12384 [21:42:28<4:33:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 83%|████████▎ | 10230/12384 [21:42:28<4:33:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 83%|████████▎ | 10230/12384 [21:42:35<4:33:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 83%|████████▎ | 10231/12384 [21:42:35<4:32:52, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 83%|████████▎ | 10231/12384 [21:42:43<4:32:52, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 0: 83%|████████▎ | 10232/12384 [21:42:43<4:32:39, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 0: 83%|████████▎ | 10232/12384 [21:42:50<4:32:39, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 83%|████████▎ | 10233/12384 [21:42:50<4:32:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 83%|████████▎ | 10233/12384 [21:42:58<4:32:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.59s]
Epoch 0: 83%|████████▎ | 10234/12384 [21:42:58<4:36:23, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=3.59s]
Epoch 0: 83%|████████▎ | 10234/12384 [21:43:06<4:36:23, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=12.00s]
Epoch 0: 83%|████████▎ | 10235/12384 [21:43:06<4:35:15, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=12.00s]
Epoch 0: 83%|████████▎ | 10235/12384 [21:43:14<4:35:15, 7.69s/it, loss=0.0002, acc=1.0000, iter_time=5.87s]
Epoch 0: 83%|████████▎ | 10236/12384 [21:43:14<4:34:24, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=5.87s]
Epoch 0: 83%|████████▎ | 10236/12384 [21:43:21<4:34:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.58s]
Epoch 0: 83%|████████▎ | 10237/12384 [21:43:21<4:33:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.58s]
Epoch 0: 83%|████████▎ | 10237/12384 [21:43:29<4:33:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 0: 83%|████████▎ | 10238/12384 [21:43:29<4:32:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 0: 83%|████████▎ | 10238/12384 [21:43:36<4:32:59, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.92s]
Epoch 0: 83%|████████▎ | 10239/12384 [21:43:36<4:32:30, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.92s]
Epoch 0: 83%|████████▎ | 10239/12384 [21:43:44<4:32:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 0: 83%|████████▎ | 10240/12384 [21:43:44<4:32:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 0: 83%|████████▎ | 10240/12384 [21:43:52<4:32:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 83%|████████▎ | 10241/12384 [21:43:52<4:34:39, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 83%|████████▎ | 10241/12384 [21:43:59<4:34:39, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 83%|████████▎ | 10242/12384 [21:43:59<4:33:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 83%|████████▎ | 10242/12384 [21:44:07<4:33:26, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=6.74s]
Epoch 0: 83%|████████▎ | 10243/12384 [21:44:07<4:32:39, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.74s]
Epoch 0: 83%|████████▎ | 10243/12384 [21:44:15<4:32:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 0: 83%|████████▎ | 10244/12384 [21:44:15<4:32:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 0: 83%|████████▎ | 10244/12384 [21:44:22<4:32:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.28s]
Epoch 0: 83%|████████▎ | 10245/12384 [21:44:22<4:32:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.28s]
Epoch 0: 83%|████████▎ | 10245/12384 [21:44:30<4:32:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.98s]
Epoch 0: 83%|████████▎ | 10246/12384 [21:44:30<4:31:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.98s]
Epoch 0: 83%|████████▎ | 10246/12384 [21:44:38<4:31:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 0: 83%|████████▎ | 10247/12384 [21:44:38<4:31:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 0: 83%|████████▎ | 10247/12384 [21:44:45<4:31:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.36s]
Epoch 0: 83%|████████▎ | 10248/12384 [21:44:45<4:31:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.36s]
Epoch 0: 83%|████████▎ | 10248/12384 [21:44:53<4:31:30, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=6.34s]
Epoch 0: 83%|████████▎ | 10249/12384 [21:44:53<4:30:57, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=6.34s]
Epoch 0: 83%|████████▎ | 10249/12384 [21:45:00<4:30:57, 7.61s/it, loss=0.0001, acc=0.9992, iter_time=8.86s]
Epoch 0: 83%|████████▎ | 10250/12384 [21:45:00<4:30:47, 7.61s/it, loss=0.0001, acc=0.9992, iter_time=8.86s]
Epoch 0: 83%|████████▎ | 10250/12384 [21:45:08<4:30:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.68s]
Epoch 0: 83%|████████▎ | 10251/12384 [21:45:08<4:30:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.68s]
Epoch 0: 83%|████████▎ | 10251/12384 [21:45:16<4:30:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 0: 83%|████████▎ | 10252/12384 [21:45:16<4:30:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 0: 83%|████████▎ | 10252/12384 [21:45:23<4:30:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 83%|████████▎ | 10253/12384 [21:45:23<4:30:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 83%|████████▎ | 10253/12384 [21:45:31<4:30:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 83%|████████▎ | 10254/12384 [21:45:31<4:30:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 83%|████████▎ | 10254/12384 [21:45:38<4:30:14, 7.61s/it, loss=0.0005, acc=0.9979, iter_time=7.60s]
Epoch 0: 83%|████████▎ | 10255/12384 [21:45:38<4:30:10, 7.61s/it, loss=0.0005, acc=0.9979, iter_time=7.60s]
Epoch 0: 83%|████████▎ | 10255/12384 [21:45:46<4:30:10, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.58s]
Epoch 0: 83%|████████▎ | 10256/12384 [21:45:46<4:30:04, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.58s]
Epoch 0: 83%|████████▎ | 10256/12384 [21:45:54<4:30:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 83%|████████▎ | 10257/12384 [21:45:54<4:30:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 83%|████████▎ | 10257/12384 [21:46:01<4:30:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 83%|████████▎ | 10258/12384 [21:46:01<4:29:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 83%|████████▎ | 10258/12384 [21:46:09<4:29:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 0: 83%|████████▎ | 10259/12384 [21:46:09<4:29:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 0: 83%|████████▎ | 10259/12384 [21:46:17<4:29:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 0: 83%|████████▎ | 10260/12384 [21:46:17<4:29:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 0: 83%|████████▎ | 10260/12384 [21:46:25<4:29:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.47s]
Epoch 0: 83%|████████▎ | 10261/12384 [21:46:25<4:33:19, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.47s]
Epoch 0: 83%|████████▎ | 10261/12384 [21:46:32<4:33:19, 7.72s/it, loss=0.0002, acc=0.9985, iter_time=7.64s]
Epoch 0: 83%|████████▎ | 10262/12384 [21:46:32<4:31:50, 7.69s/it, loss=0.0002, acc=0.9985, iter_time=7.64s]
Epoch 0: 83%|████████▎ | 10262/12384 [21:46:40<4:31:50, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 83%|████████▎ | 10263/12384 [21:46:40<4:30:46, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 83%|████████▎ | 10263/12384 [21:46:47<4:30:46, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 83%|████████▎ | 10264/12384 [21:46:47<4:30:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 83%|████████▎ | 10264/12384 [21:46:55<4:30:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 83%|████████▎ | 10265/12384 [21:46:55<4:29:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 83%|████████▎ | 10265/12384 [21:47:03<4:29:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 83%|████████▎ | 10266/12384 [21:47:03<4:29:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 83%|████████▎ | 10266/12384 [21:47:10<4:29:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 83%|████████▎ | 10267/12384 [21:47:10<4:32:06, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 83%|████████▎ | 10267/12384 [21:47:18<4:32:06, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 83%|████████▎ | 10268/12384 [21:47:18<4:30:55, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 83%|████████▎ | 10268/12384 [21:47:26<4:30:55, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=4.31s]
Epoch 0: 83%|████████▎ | 10269/12384 [21:47:26<4:30:00, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=4.31s]
Epoch 0: 83%|████████▎ | 10269/12384 [21:47:33<4:30:00, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.91s]
Epoch 0: 83%|████████▎ | 10270/12384 [21:47:33<4:29:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.91s]
Epoch 0: 83%|████████▎ | 10270/12384 [21:47:41<4:29:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 0: 83%|████████▎ | 10271/12384 [21:47:41<4:28:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 0: 83%|████████▎ | 10271/12384 [21:47:49<4:28:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.50s]
Epoch 0: 83%|████████▎ | 10272/12384 [21:47:49<4:28:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.50s]
Epoch 0: 83%|████████▎ | 10272/12384 [21:47:56<4:28:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 0: 83%|████████▎ | 10273/12384 [21:47:56<4:28:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 0: 83%|████████▎ | 10273/12384 [21:48:04<4:28:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 83%|████████▎ | 10274/12384 [21:48:04<4:28:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 83%|████████▎ | 10274/12384 [21:48:11<4:28:08, 7.62s/it, loss=0.0007, acc=0.9982, iter_time=7.61s]
Epoch 0: 83%|████████▎ | 10275/12384 [21:48:11<4:27:50, 7.62s/it, loss=0.0007, acc=0.9982, iter_time=7.61s]
Epoch 0: 83%|████████▎ | 10275/12384 [21:48:19<4:27:50, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 83%|████████▎ | 10276/12384 [21:48:19<4:27:29, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 83%|████████▎ | 10276/12384 [21:48:27<4:27:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 83%|████████▎ | 10277/12384 [21:48:27<4:27:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 83%|████████▎ | 10277/12384 [21:48:34<4:27:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 0: 83%|████████▎ | 10278/12384 [21:48:34<4:27:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 0: 83%|████████▎ | 10278/12384 [21:48:42<4:27:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 0: 83%|████████▎ | 10279/12384 [21:48:42<4:26:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 0: 83%|████████▎ | 10279/12384 [21:48:49<4:26:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 83%|████████▎ | 10280/12384 [21:48:49<4:26:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 83%|████████▎ | 10280/12384 [21:48:57<4:26:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 0: 83%|████████▎ | 10281/12384 [21:48:57<4:27:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 0: 83%|████████▎ | 10281/12384 [21:49:05<4:27:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 0: 83%|████████▎ | 10282/12384 [21:49:05<4:26:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 0: 83%|████████▎ | 10282/12384 [21:49:12<4:26:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 0: 83%|████████▎ | 10283/12384 [21:49:12<4:26:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 0: 83%|████████▎ | 10283/12384 [21:49:20<4:26:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 83%|████████▎ | 10284/12384 [21:49:20<4:26:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 83%|████████▎ | 10284/12384 [21:49:28<4:26:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 0: 83%|████████▎ | 10285/12384 [21:49:28<4:26:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 0: 83%|████████▎ | 10285/12384 [21:49:35<4:26:13, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=9.89s]
Epoch 0: 83%|████████▎ | 10286/12384 [21:49:35<4:26:05, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=9.89s]
Epoch 0: 83%|████████▎ | 10286/12384 [21:49:43<4:26:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 83%|████████▎ | 10287/12384 [21:49:43<4:29:43, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 83%|████████▎ | 10287/12384 [21:49:51<4:29:43, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 0: 83%|████████▎ | 10288/12384 [21:49:51<4:30:46, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 0: 83%|████████▎ | 10288/12384 [21:49:59<4:30:46, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 0: 83%|████████▎ | 10289/12384 [21:49:59<4:29:11, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 0: 83%|████████▎ | 10289/12384 [21:50:06<4:29:11, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 83%|████████▎ | 10290/12384 [21:50:06<4:28:00, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 83%|████████▎ | 10290/12384 [21:50:14<4:28:00, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 83%|████████▎ | 10291/12384 [21:50:14<4:26:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 83%|████████▎ | 10291/12384 [21:50:21<4:26:59, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 83%|████████▎ | 10292/12384 [21:50:21<4:26:14, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 83%|████████▎ | 10292/12384 [21:50:29<4:26:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 83%|████████▎ | 10293/12384 [21:50:29<4:29:47, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 83%|████████▎ | 10293/12384 [21:50:37<4:29:47, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=5.49s]
Epoch 0: 83%|████████▎ | 10294/12384 [21:50:37<4:28:38, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.49s]
Epoch 0: 83%|████████▎ | 10294/12384 [21:50:44<4:28:38, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 0: 83%|████████▎ | 10295/12384 [21:50:44<4:26:37, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 0: 83%|████████▎ | 10295/12384 [21:50:52<4:26:37, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.70s]
Epoch 0: 83%|████████▎ | 10296/12384 [21:50:52<4:26:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.70s]
Epoch 0: 83%|████████▎ | 10296/12384 [21:51:00<4:26:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 83%|████████▎ | 10297/12384 [21:51:00<4:25:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 83%|████████▎ | 10297/12384 [21:51:07<4:25:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 83%|████████▎ | 10298/12384 [21:51:07<4:25:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 83%|████████▎ | 10298/12384 [21:51:15<4:25:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 0: 83%|████████▎ | 10299/12384 [21:51:15<4:24:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 0: 83%|████████▎ | 10299/12384 [21:51:23<4:24:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 0: 83%|████████▎ | 10300/12384 [21:51:23<4:24:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 0: 83%|████████▎ | 10300/12384 [21:51:30<4:24:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 83%|████████▎ | 10301/12384 [21:51:30<4:24:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 83%|████████▎ | 10301/12384 [21:51:38<4:24:09, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.43s]
Epoch 0: 83%|████████▎ | 10302/12384 [21:51:38<4:24:09, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.43s]
Epoch 0: 83%|████████▎ | 10302/12384 [21:51:45<4:24:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 0: 83%|████████▎ | 10303/12384 [21:51:45<4:24:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 0: 83%|████████▎ | 10303/12384 [21:51:53<4:24:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 83%|████████▎ | 10304/12384 [21:51:53<4:24:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 83%|████████▎ | 10304/12384 [21:52:01<4:24:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 83%|████████▎ | 10305/12384 [21:52:01<4:23:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 83%|████████▎ | 10305/12384 [21:52:08<4:23:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 83%|████████▎ | 10306/12384 [21:52:08<4:23:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 83%|████████▎ | 10306/12384 [21:52:16<4:23:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 0: 83%|████████▎ | 10307/12384 [21:52:16<4:23:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 0: 83%|████████▎ | 10307/12384 [21:52:23<4:23:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.88s]
Epoch 0: 83%|████████▎ | 10308/12384 [21:52:23<4:23:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.88s]
Epoch 0: 83%|████████▎ | 10308/12384 [21:52:31<4:23:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 83%|████████▎ | 10309/12384 [21:52:31<4:23:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 83%|████████▎ | 10309/12384 [21:52:39<4:23:24, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.01s]
Epoch 0: 83%|████████▎ | 10310/12384 [21:52:39<4:23:19, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.01s]
Epoch 0: 83%|████████▎ | 10310/12384 [21:52:46<4:23:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 0: 83%|████████▎ | 10311/12384 [21:52:46<4:23:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 0: 83%|████████▎ | 10311/12384 [21:52:54<4:23:04, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.54s]
Epoch 0: 83%|████████▎ | 10312/12384 [21:52:54<4:22:46, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.54s]
Epoch 0: 83%|████████▎ | 10312/12384 [21:53:02<4:22:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 83%|████████▎ | 10313/12384 [21:53:02<4:26:00, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 83%|████████▎ | 10313/12384 [21:53:09<4:26:00, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 0: 83%|████████▎ | 10314/12384 [21:53:09<4:24:46, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 0: 83%|████████▎ | 10314/12384 [21:53:17<4:24:46, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.69s]
Epoch 0: 83%|████████▎ | 10315/12384 [21:53:17<4:24:06, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.69s]
Epoch 0: 83%|████████▎ | 10315/12384 [21:53:25<4:24:06, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.54s]
Epoch 0: 83%|████████▎ | 10316/12384 [21:53:25<4:23:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.54s]
Epoch 0: 83%|████████▎ | 10316/12384 [21:53:32<4:23:38, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=10.21s]
Epoch 0: 83%|████████▎ | 10317/12384 [21:53:32<4:22:59, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=10.21s]
Epoch 0: 83%|████████▎ | 10317/12384 [21:53:40<4:22:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 83%|████████▎ | 10318/12384 [21:53:40<4:22:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 83%|████████▎ | 10318/12384 [21:53:48<4:22:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 83%|████████▎ | 10319/12384 [21:53:48<4:25:08, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 83%|████████▎ | 10319/12384 [21:53:55<4:25:08, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 83%|████████▎ | 10320/12384 [21:53:55<4:24:08, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 83%|████████▎ | 10320/12384 [21:54:03<4:24:08, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 83%|████████▎ | 10321/12384 [21:54:03<4:23:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 83%|████████▎ | 10321/12384 [21:54:11<4:23:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 0: 83%|████████▎ | 10322/12384 [21:54:11<4:23:23, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 0: 83%|████████▎ | 10322/12384 [21:54:18<4:23:23, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 0: 83%|████████▎ | 10323/12384 [21:54:18<4:22:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 0: 83%|████████▎ | 10323/12384 [21:54:26<4:22:34, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=5.00s]
Epoch 0: 83%|████████▎ | 10324/12384 [21:54:26<4:22:13, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=5.00s]
Epoch 0: 83%|████████▎ | 10324/12384 [21:54:33<4:22:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 83%|████████▎ | 10325/12384 [21:54:33<4:21:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 83%|████████▎ | 10325/12384 [21:54:41<4:21:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 83%|████████▎ | 10326/12384 [21:54:41<4:21:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 83%|████████▎ | 10326/12384 [21:54:49<4:21:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.69s]
Epoch 0: 83%|████████▎ | 10327/12384 [21:54:49<4:21:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.69s]
Epoch 0: 83%|████████▎ | 10327/12384 [21:54:56<4:21:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 0: 83%|████████▎ | 10328/12384 [21:54:56<4:21:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 0: 83%|████████▎ | 10328/12384 [21:55:04<4:21:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 0: 83%|████████▎ | 10329/12384 [21:55:04<4:21:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 0: 83%|████████▎ | 10329/12384 [21:55:12<4:21:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 0: 83%|████████▎ | 10330/12384 [21:55:12<4:21:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 0: 83%|████████▎ | 10330/12384 [21:55:19<4:21:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 0: 83%|████████▎ | 10331/12384 [21:55:19<4:21:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 0: 83%|████████▎ | 10331/12384 [21:55:27<4:21:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 83%|████████▎ | 10332/12384 [21:55:27<4:20:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 83%|████████▎ | 10332/12384 [21:55:34<4:20:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 83%|████████▎ | 10333/12384 [21:55:34<4:20:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 83%|████████▎ | 10333/12384 [21:55:42<4:20:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 0: 83%|████████▎ | 10334/12384 [21:55:42<4:19:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 0: 83%|████████▎ | 10334/12384 [21:55:50<4:19:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 0: 83%|████████▎ | 10335/12384 [21:55:50<4:19:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 0: 83%|████████▎ | 10335/12384 [21:55:57<4:19:30, 7.60s/it, loss=0.0031, acc=0.9974, iter_time=11.70s]
Epoch 0: 83%|████████▎ | 10336/12384 [21:55:57<4:19:33, 7.60s/it, loss=0.0031, acc=0.9974, iter_time=11.70s]
Epoch 0: 83%|████████▎ | 10336/12384 [21:56:05<4:19:33, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 83%|████████▎ | 10337/12384 [21:56:05<4:19:24, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 83%|████████▎ | 10337/12384 [21:56:12<4:19:24, 7.60s/it, loss=0.0002, acc=0.9998, iter_time=6.43s]
Epoch 0: 83%|████████▎ | 10338/12384 [21:56:12<4:19:21, 7.61s/it, loss=0.0002, acc=0.9998, iter_time=6.43s]
Epoch 0: 83%|████████▎ | 10338/12384 [21:56:20<4:19:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 0: 83%|████████▎ | 10339/12384 [21:56:20<4:22:46, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 0: 83%|████████▎ | 10339/12384 [21:56:28<4:22:46, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 0: 83%|████████▎ | 10340/12384 [21:56:28<4:21:36, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 0: 83%|████████▎ | 10340/12384 [21:56:36<4:21:36, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 0: 84%|████████▎ | 10341/12384 [21:56:36<4:21:35, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 0: 84%|████████▎ | 10341/12384 [21:56:43<4:21:35, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.54s]
Epoch 0: 84%|████████▎ | 10342/12384 [21:56:43<4:20:56, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.54s]
Epoch 0: 84%|████████▎ | 10342/12384 [21:56:51<4:20:56, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 84%|████████▎ | 10343/12384 [21:56:51<4:20:34, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 84%|████████▎ | 10343/12384 [21:56:59<4:20:34, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 0: 84%|████████▎ | 10344/12384 [21:56:59<4:19:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 0: 84%|████████▎ | 10344/12384 [21:57:07<4:19:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 0: 84%|████████▎ | 10345/12384 [21:57:07<4:22:14, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 0: 84%|████████▎ | 10345/12384 [21:57:14<4:22:14, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 84%|████████▎ | 10346/12384 [21:57:14<4:21:02, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 84%|████████▎ | 10346/12384 [21:57:22<4:21:02, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 84%|████████▎ | 10347/12384 [21:57:22<4:20:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 84%|████████▎ | 10347/12384 [21:57:29<4:20:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.89s]
Epoch 0: 84%|████████▎ | 10348/12384 [21:57:29<4:19:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.89s]
Epoch 0: 84%|████████▎ | 10348/12384 [21:57:37<4:19:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.30s]
Epoch 0: 84%|████████▎ | 10349/12384 [21:57:37<4:18:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.30s]
Epoch 0: 84%|████████▎ | 10349/12384 [21:57:45<4:18:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 84%|████████▎ | 10350/12384 [21:57:45<4:18:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 84%|████████▎ | 10350/12384 [21:57:52<4:18:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 84%|████████▎ | 10351/12384 [21:57:52<4:17:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 84%|████████▎ | 10351/12384 [21:58:00<4:17:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 84%|████████▎ | 10352/12384 [21:58:00<4:17:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 84%|████████▎ | 10352/12384 [21:58:07<4:17:54, 7.62s/it, loss=0.0002, acc=0.9999, iter_time=5.79s]
Epoch 0: 84%|████████▎ | 10353/12384 [21:58:07<4:17:39, 7.61s/it, loss=0.0002, acc=0.9999, iter_time=5.79s]
Epoch 0: 84%|████████▎ | 10353/12384 [21:58:15<4:17:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 0: 84%|████████▎ | 10354/12384 [21:58:15<4:17:14, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 0: 84%|████████▎ | 10354/12384 [21:58:23<4:17:14, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 0: 84%|████████▎ | 10355/12384 [21:58:23<4:17:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 0: 84%|████████▎ | 10355/12384 [21:58:30<4:17:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.72s]
Epoch 0: 84%|████████▎ | 10356/12384 [21:58:30<4:16:59, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.72s]
Epoch 0: 84%|████████▎ | 10356/12384 [21:58:38<4:16:59, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 84%|████████▎ | 10357/12384 [21:58:38<4:16:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 84%|████████▎ | 10357/12384 [21:58:45<4:16:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 0: 84%|████████▎ | 10358/12384 [21:58:45<4:16:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 0: 84%|████████▎ | 10358/12384 [21:58:53<4:16:54, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.13s]
Epoch 0: 84%|████████▎ | 10359/12384 [21:58:53<4:16:45, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.13s]
Epoch 0: 84%|████████▎ | 10359/12384 [21:59:01<4:16:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 84%|████████▎ | 10360/12384 [21:59:01<4:16:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 84%|████████▎ | 10360/12384 [21:59:08<4:16:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 84%|████████▎ | 10361/12384 [21:59:08<4:16:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 84%|████████▎ | 10361/12384 [21:59:16<4:16:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 84%|████████▎ | 10362/12384 [21:59:16<4:16:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 84%|████████▎ | 10362/12384 [21:59:23<4:16:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 84%|████████▎ | 10363/12384 [21:59:23<4:16:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 84%|████████▎ | 10363/12384 [21:59:31<4:16:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.78s]
Epoch 0: 84%|████████▎ | 10364/12384 [21:59:31<4:15:57, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.78s]
Epoch 0: 84%|████████▎ | 10364/12384 [21:59:39<4:15:57, 7.60s/it, loss=0.0024, acc=0.9939, iter_time=9.43s]
Epoch 0: 84%|████████▎ | 10365/12384 [21:59:39<4:19:08, 7.70s/it, loss=0.0024, acc=0.9939, iter_time=9.43s]
Epoch 0: 84%|████████▎ | 10365/12384 [21:59:47<4:19:08, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 84%|████████▎ | 10366/12384 [21:59:47<4:18:04, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 84%|████████▎ | 10366/12384 [21:59:54<4:18:04, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 0: 84%|████████▎ | 10367/12384 [21:59:54<4:17:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 0: 84%|████████▎ | 10367/12384 [22:00:02<4:17:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.06s]
Epoch 0: 84%|████████▎ | 10368/12384 [22:00:02<4:17:23, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.06s]
Epoch 0: 84%|████████▎ | 10368/12384 [22:00:09<4:17:23, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 0: 84%|████████▎ | 10369/12384 [22:00:09<4:16:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 0: 84%|████████▎ | 10369/12384 [22:00:17<4:16:46, 7.65s/it, loss=0.0001, acc=0.9998, iter_time=8.77s]
Epoch 0: 84%|████████▎ | 10370/12384 [22:00:17<4:16:11, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=8.77s]
Epoch 0: 84%|████████▎ | 10370/12384 [22:00:25<4:16:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 84%|████████▎ | 10371/12384 [22:00:25<4:15:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 84%|████████▎ | 10371/12384 [22:00:32<4:15:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 0: 84%|████████▍ | 10372/12384 [22:00:32<4:15:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 0: 84%|████████▍ | 10372/12384 [22:00:40<4:15:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 84%|████████▍ | 10373/12384 [22:00:40<4:15:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 84%|████████▍ | 10373/12384 [22:00:47<4:15:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 0: 84%|████████▍ | 10374/12384 [22:00:47<4:15:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 0: 84%|████████▍ | 10374/12384 [22:00:55<4:15:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 0: 84%|████████▍ | 10375/12384 [22:00:55<4:15:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 0: 84%|████████▍ | 10375/12384 [22:01:03<4:15:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 0: 84%|████████▍ | 10376/12384 [22:01:03<4:15:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 0: 84%|████████▍ | 10376/12384 [22:01:10<4:15:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.36s]
Epoch 0: 84%|████████▍ | 10377/12384 [22:01:10<4:14:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.36s]
Epoch 0: 84%|████████▍ | 10377/12384 [22:01:18<4:14:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 0: 84%|████████▍ | 10378/12384 [22:01:18<4:14:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 0: 84%|████████▍ | 10378/12384 [22:01:26<4:14:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 0: 84%|████████▍ | 10379/12384 [22:01:26<4:14:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 0: 84%|████████▍ | 10379/12384 [22:01:33<4:14:26, 7.61s/it, loss=0.0021, acc=0.9930, iter_time=5.01s]
Epoch 0: 84%|████████▍ | 10380/12384 [22:01:33<4:14:11, 7.61s/it, loss=0.0021, acc=0.9930, iter_time=5.01s]
Epoch 0: 84%|████████▍ | 10380/12384 [22:01:41<4:14:11, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.20s]
Epoch 0: 84%|████████▍ | 10381/12384 [22:01:41<4:13:50, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=10.20s]
Epoch 0: 84%|████████▍ | 10381/12384 [22:01:48<4:13:50, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 84%|████████▍ | 10382/12384 [22:01:48<4:14:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 84%|████████▍ | 10382/12384 [22:01:56<4:14:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.57s]
Epoch 0: 84%|████████▍ | 10383/12384 [22:01:56<4:14:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.57s]
Epoch 0: 84%|████████▍ | 10383/12384 [22:02:04<4:14:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 0: 84%|████████▍ | 10384/12384 [22:02:04<4:13:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 0: 84%|████████▍ | 10384/12384 [22:02:11<4:13:59, 7.62s/it, loss=0.0002, acc=0.9997, iter_time=6.34s]
Epoch 0: 84%|████████▍ | 10385/12384 [22:02:11<4:13:36, 7.61s/it, loss=0.0002, acc=0.9997, iter_time=6.34s]
Epoch 0: 84%|████████▍ | 10385/12384 [22:02:19<4:13:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 0: 84%|████████▍ | 10386/12384 [22:02:19<4:13:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 0: 84%|████████▍ | 10386/12384 [22:02:26<4:13:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 0: 84%|████████▍ | 10387/12384 [22:02:26<4:13:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 0: 84%|████████▍ | 10387/12384 [22:02:34<4:13:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 84%|████████▍ | 10388/12384 [22:02:34<4:13:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 84%|████████▍ | 10388/12384 [22:02:42<4:13:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 84%|████████▍ | 10389/12384 [22:02:42<4:12:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 84%|████████▍ | 10389/12384 [22:02:49<4:12:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 84%|████████▍ | 10390/12384 [22:02:49<4:13:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 84%|████████▍ | 10390/12384 [22:02:57<4:13:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 84%|████████▍ | 10391/12384 [22:02:57<4:12:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 84%|████████▍ | 10391/12384 [22:03:05<4:12:45, 7.61s/it, loss=0.0001, acc=0.9995, iter_time=8.05s]
Epoch 0: 84%|████████▍ | 10392/12384 [22:03:05<4:16:42, 7.73s/it, loss=0.0001, acc=0.9995, iter_time=8.05s]
Epoch 0: 84%|████████▍ | 10392/12384 [22:03:13<4:16:42, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=4.95s]
Epoch 0: 84%|████████▍ | 10393/12384 [22:03:13<4:15:21, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.95s]
Epoch 0: 84%|████████▍ | 10393/12384 [22:03:20<4:15:21, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 0: 84%|████████▍ | 10394/12384 [22:03:20<4:14:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 0: 84%|████████▍ | 10394/12384 [22:03:28<4:14:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 0: 84%|████████▍ | 10395/12384 [22:03:28<4:14:25, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 0: 84%|████████▍ | 10395/12384 [22:03:35<4:14:25, 7.68s/it, loss=0.0001, acc=0.9999, iter_time=9.47s]
Epoch 0: 84%|████████▍ | 10396/12384 [22:03:35<4:13:50, 7.66s/it, loss=0.0001, acc=0.9999, iter_time=9.47s]
Epoch 0: 84%|████████▍ | 10396/12384 [22:03:43<4:13:50, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 84%|████████▍ | 10397/12384 [22:03:43<4:13:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 84%|████████▍ | 10397/12384 [22:03:51<4:13:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 0: 84%|████████▍ | 10398/12384 [22:03:51<4:12:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 0: 84%|████████▍ | 10398/12384 [22:03:58<4:12:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 0: 84%|████████▍ | 10399/12384 [22:03:58<4:12:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 0: 84%|████████▍ | 10399/12384 [22:04:06<4:12:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 0: 84%|████████▍ | 10400/12384 [22:04:06<4:12:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 0: 84%|████████▍ | 10400/12384 [22:04:14<4:12:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.69s]
Epoch 0: 84%|████████▍ | 10401/12384 [22:04:14<4:11:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.69s]
Epoch 0: 84%|████████▍ | 10401/12384 [22:04:21<4:11:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 0: 84%|████████▍ | 10402/12384 [22:04:21<4:11:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 0: 84%|████████▍ | 10402/12384 [22:04:29<4:11:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 0: 84%|████████▍ | 10403/12384 [22:04:29<4:11:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 0: 84%|████████▍ | 10403/12384 [22:04:36<4:11:20, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.91s]
Epoch 0: 84%|████████▍ | 10404/12384 [22:04:36<4:11:10, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.91s]
Epoch 0: 84%|████████▍ | 10404/12384 [22:04:44<4:11:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 84%|████████▍ | 10405/12384 [22:04:44<4:11:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 84%|████████▍ | 10405/12384 [22:04:52<4:11:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 0: 84%|████████▍ | 10406/12384 [22:04:52<4:10:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 0: 84%|████████▍ | 10406/12384 [22:04:59<4:10:56, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.73s]
Epoch 0: 84%|████████▍ | 10407/12384 [22:04:59<4:10:40, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.73s]
Epoch 0: 84%|████████▍ | 10407/12384 [22:05:07<4:10:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 84%|████████▍ | 10408/12384 [22:05:07<4:10:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 84%|████████▍ | 10408/12384 [22:05:14<4:10:34, 7.61s/it, loss=0.0004, acc=1.0000, iter_time=7.66s]
Epoch 0: 84%|████████▍ | 10409/12384 [22:05:14<4:10:21, 7.61s/it, loss=0.0004, acc=1.0000, iter_time=7.66s]
Epoch 0: 84%|████████▍ | 10409/12384 [22:05:22<4:10:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 0: 84%|████████▍ | 10410/12384 [22:05:22<4:11:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 0: 84%|████████▍ | 10410/12384 [22:05:30<4:11:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.83s]
Epoch 0: 84%|████████▍ | 10411/12384 [22:05:30<4:11:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.83s]
Epoch 0: 84%|████████▍ | 10411/12384 [22:05:37<4:11:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 0: 84%|████████▍ | 10412/12384 [22:05:37<4:10:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 0: 84%|████████▍ | 10412/12384 [22:05:45<4:10:52, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.54s]
Epoch 0: 84%|████████▍ | 10413/12384 [22:05:45<4:10:32, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.54s]
Epoch 0: 84%|████████▍ | 10413/12384 [22:05:53<4:10:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 0: 84%|████████▍ | 10414/12384 [22:05:53<4:10:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 0: 84%|████████▍ | 10414/12384 [22:06:00<4:10:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.64s]
Epoch 0: 84%|████████▍ | 10415/12384 [22:06:00<4:10:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.64s]
Epoch 0: 84%|████████▍ | 10415/12384 [22:06:08<4:10:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.81s]
Epoch 0: 84%|████████▍ | 10416/12384 [22:06:08<4:09:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.81s]
Epoch 0: 84%|████████▍ | 10416/12384 [22:06:16<4:09:58, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=3.65s]
Epoch 0: 84%|████████▍ | 10417/12384 [22:06:16<4:10:36, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=3.65s]
Epoch 0: 84%|████████▍ | 10417/12384 [22:06:23<4:10:36, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=11.29s]
Epoch 0: 84%|████████▍ | 10418/12384 [22:06:23<4:13:26, 7.73s/it, loss=0.0002, acc=1.0000, iter_time=11.29s]
Epoch 0: 84%|████████▍ | 10418/12384 [22:06:31<4:13:26, 7.73s/it, loss=0.0003, acc=1.0000, iter_time=7.97s]
Epoch 0: 84%|████████▍ | 10419/12384 [22:06:31<4:12:30, 7.71s/it, loss=0.0003, acc=1.0000, iter_time=7.97s]
Epoch 0: 84%|████████▍ | 10419/12384 [22:06:39<4:12:30, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 84%|████████▍ | 10420/12384 [22:06:39<4:11:31, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 84%|████████▍ | 10420/12384 [22:06:46<4:11:31, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 84%|████████▍ | 10421/12384 [22:06:46<4:11:26, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 84%|████████▍ | 10421/12384 [22:06:54<4:11:26, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.63s]
Epoch 0: 84%|████████▍ | 10422/12384 [22:06:54<4:10:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.63s]
Epoch 0: 84%|████████▍ | 10422/12384 [22:07:02<4:10:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.61s]
Epoch 0: 84%|████████▍ | 10423/12384 [22:07:02<4:09:57, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.61s]
Epoch 0: 84%|████████▍ | 10423/12384 [22:07:09<4:09:57, 7.65s/it, loss=0.0002, acc=0.9986, iter_time=10.07s]
Epoch 0: 84%|████████▍ | 10424/12384 [22:07:09<4:09:22, 7.63s/it, loss=0.0002, acc=0.9986, iter_time=10.07s]
Epoch 0: 84%|████████▍ | 10424/12384 [22:07:17<4:09:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.48s]
Epoch 0: 84%|████████▍ | 10425/12384 [22:07:17<4:11:30, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.48s]
Epoch 0: 84%|████████▍ | 10425/12384 [22:07:25<4:11:30, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 84%|████████▍ | 10426/12384 [22:07:25<4:10:29, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 84%|████████▍ | 10426/12384 [22:07:32<4:10:29, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 0: 84%|████████▍ | 10427/12384 [22:07:32<4:09:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 0: 84%|████████▍ | 10427/12384 [22:07:40<4:09:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 0: 84%|████████▍ | 10428/12384 [22:07:40<4:09:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 0: 84%|████████▍ | 10428/12384 [22:07:48<4:09:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 84%|████████▍ | 10429/12384 [22:07:48<4:08:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 84%|████████▍ | 10429/12384 [22:07:55<4:08:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 84%|████████▍ | 10430/12384 [22:07:55<4:09:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 84%|████████▍ | 10430/12384 [22:08:03<4:09:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 84%|████████▍ | 10431/12384 [22:08:03<4:08:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 84%|████████▍ | 10431/12384 [22:08:10<4:08:33, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=7.98s]
Epoch 0: 84%|████████▍ | 10432/12384 [22:08:10<4:08:03, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=7.98s]
Epoch 0: 84%|████████▍ | 10432/12384 [22:08:18<4:08:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.57s]
Epoch 0: 84%|████████▍ | 10433/12384 [22:08:18<4:07:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.57s]
Epoch 0: 84%|████████▍ | 10433/12384 [22:08:26<4:07:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 0: 84%|████████▍ | 10434/12384 [22:08:26<4:07:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 0: 84%|████████▍ | 10434/12384 [22:08:33<4:07:59, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.86s]
Epoch 0: 84%|████████▍ | 10435/12384 [22:08:33<4:07:51, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.86s]
Epoch 0: 84%|████████▍ | 10435/12384 [22:08:41<4:07:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 0: 84%|████████▍ | 10436/12384 [22:08:41<4:10:04, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 0: 84%|████████▍ | 10436/12384 [22:08:49<4:10:04, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.76s]
Epoch 0: 84%|████████▍ | 10437/12384 [22:08:49<4:10:47, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.76s]
Epoch 0: 84%|████████▍ | 10437/12384 [22:08:57<4:10:47, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 0: 84%|████████▍ | 10438/12384 [22:08:57<4:11:49, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 0: 84%|████████▍ | 10438/12384 [22:09:04<4:11:49, 7.76s/it, loss=0.0002, acc=1.0000, iter_time=7.84s]
Epoch 0: 84%|████████▍ | 10439/12384 [22:09:04<4:10:10, 7.72s/it, loss=0.0002, acc=1.0000, iter_time=7.84s]
Epoch 0: 84%|████████▍ | 10439/12384 [22:09:12<4:10:10, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.22s]
Epoch 0: 84%|████████▍ | 10440/12384 [22:09:12<4:09:06, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.22s]
Epoch 0: 84%|████████▍ | 10440/12384 [22:09:20<4:09:06, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 0: 84%|████████▍ | 10441/12384 [22:09:20<4:08:29, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 0: 84%|████████▍ | 10441/12384 [22:09:27<4:08:29, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.41s]
Epoch 0: 84%|████████▍ | 10442/12384 [22:09:27<4:07:51, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.41s]
Epoch 0: 84%|████████▍ | 10442/12384 [22:09:35<4:07:51, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 84%|████████▍ | 10443/12384 [22:09:35<4:07:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 84%|████████▍ | 10443/12384 [22:09:43<4:07:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 84%|████████▍ | 10444/12384 [22:09:43<4:06:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 84%|████████▍ | 10444/12384 [22:09:51<4:06:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 84%|████████▍ | 10445/12384 [22:09:51<4:10:10, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 84%|████████▍ | 10445/12384 [22:09:58<4:10:10, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 84%|████████▍ | 10446/12384 [22:09:58<4:08:40, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 84%|████████▍ | 10446/12384 [22:10:06<4:08:40, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 0: 84%|████████▍ | 10447/12384 [22:10:06<4:07:33, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 0: 84%|████████▍ | 10447/12384 [22:10:13<4:07:33, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 0: 84%|████████▍ | 10448/12384 [22:10:13<4:07:06, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 0: 84%|████████▍ | 10448/12384 [22:10:21<4:07:06, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 84%|████████▍ | 10449/12384 [22:10:21<4:06:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 84%|████████▍ | 10449/12384 [22:10:29<4:06:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 0: 84%|████████▍ | 10450/12384 [22:10:29<4:06:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 0: 84%|████████▍ | 10450/12384 [22:10:36<4:06:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 84%|████████▍ | 10451/12384 [22:10:36<4:06:42, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 84%|████████▍ | 10451/12384 [22:10:44<4:06:42, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 84%|████████▍ | 10452/12384 [22:10:44<4:06:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 84%|████████▍ | 10452/12384 [22:10:52<4:06:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 84%|████████▍ | 10453/12384 [22:10:52<4:05:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 84%|████████▍ | 10453/12384 [22:10:59<4:05:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 84%|████████▍ | 10454/12384 [22:10:59<4:05:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 84%|████████▍ | 10454/12384 [22:11:07<4:05:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 84%|████████▍ | 10455/12384 [22:11:07<4:04:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 84%|████████▍ | 10455/12384 [22:11:14<4:04:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 84%|████████▍ | 10456/12384 [22:11:14<4:04:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 84%|████████▍ | 10456/12384 [22:11:22<4:04:47, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 84%|████████▍ | 10457/12384 [22:11:22<4:04:42, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 84%|████████▍ | 10457/12384 [22:11:30<4:04:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 84%|████████▍ | 10458/12384 [22:11:30<4:04:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 84%|████████▍ | 10458/12384 [22:11:37<4:04:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 0: 84%|████████▍ | 10459/12384 [22:11:37<4:04:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 0: 84%|████████▍ | 10459/12384 [22:11:45<4:04:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 0: 84%|████████▍ | 10460/12384 [22:11:45<4:05:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 0: 84%|████████▍ | 10460/12384 [22:11:53<4:05:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.51s]
Epoch 0: 84%|████████▍ | 10461/12384 [22:11:53<4:04:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.51s]
Epoch 0: 84%|████████▍ | 10461/12384 [22:12:00<4:04:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=12.08s]
Epoch 0: 84%|████████▍ | 10462/12384 [22:12:00<4:04:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=12.08s]
Epoch 0: 84%|████████▍ | 10462/12384 [22:12:08<4:04:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 84%|████████▍ | 10463/12384 [22:12:08<4:03:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 84%|████████▍ | 10463/12384 [22:12:15<4:03:56, 7.62s/it, loss=0.0006, acc=0.9994, iter_time=8.00s]
Epoch 0: 84%|████████▍ | 10464/12384 [22:12:15<4:03:45, 7.62s/it, loss=0.0006, acc=0.9994, iter_time=8.00s]
Epoch 0: 84%|████████▍ | 10464/12384 [22:12:23<4:03:45, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=5.41s]
Epoch 0: 85%|████████▍ | 10465/12384 [22:12:23<4:03:46, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=5.41s]
Epoch 0: 85%|████████▍ | 10465/12384 [22:12:31<4:03:46, 7.62s/it, loss=0.0006, acc=0.9998, iter_time=6.62s]
Epoch 0: 85%|████████▍ | 10466/12384 [22:12:31<4:03:30, 7.62s/it, loss=0.0006, acc=0.9998, iter_time=6.62s]
Epoch 0: 85%|████████▍ | 10466/12384 [22:12:38<4:03:30, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.11s]
Epoch 0: 85%|████████▍ | 10467/12384 [22:12:38<4:03:14, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.11s]
Epoch 0: 85%|████████▍ | 10467/12384 [22:12:46<4:03:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 85%|████████▍ | 10468/12384 [22:12:46<4:03:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 85%|████████▍ | 10468/12384 [22:12:53<4:03:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 0: 85%|████████▍ | 10469/12384 [22:12:53<4:02:43, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 0: 85%|████████▍ | 10469/12384 [22:13:01<4:02:43, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 0: 85%|████████▍ | 10470/12384 [22:13:01<4:02:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 0: 85%|████████▍ | 10470/12384 [22:13:09<4:02:26, 7.60s/it, loss=0.0003, acc=0.9987, iter_time=8.72s]
Epoch 0: 85%|████████▍ | 10471/12384 [22:13:09<4:05:43, 7.71s/it, loss=0.0003, acc=0.9987, iter_time=8.72s]
Epoch 0: 85%|████████▍ | 10471/12384 [22:13:17<4:05:43, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.79s]
Epoch 0: 85%|████████▍ | 10472/12384 [22:13:17<4:04:34, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.79s]
Epoch 0: 85%|████████▍ | 10472/12384 [22:13:24<4:04:34, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 85%|████████▍ | 10473/12384 [22:13:24<4:03:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 85%|████████▍ | 10473/12384 [22:13:32<4:03:55, 7.66s/it, loss=0.0002, acc=0.9984, iter_time=7.63s]
Epoch 0: 85%|████████▍ | 10474/12384 [22:13:32<4:03:24, 7.65s/it, loss=0.0002, acc=0.9984, iter_time=7.63s]
Epoch 0: 85%|████████▍ | 10474/12384 [22:13:39<4:03:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 0: 85%|████████▍ | 10475/12384 [22:13:39<4:03:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 0: 85%|████████▍ | 10475/12384 [22:13:47<4:03:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 85%|████████▍ | 10476/12384 [22:13:47<4:03:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 85%|████████▍ | 10476/12384 [22:13:55<4:03:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 85%|████████▍ | 10477/12384 [22:13:55<4:02:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 85%|████████▍ | 10477/12384 [22:14:02<4:02:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 85%|████████▍ | 10478/12384 [22:14:02<4:02:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 85%|████████▍ | 10478/12384 [22:14:10<4:02:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 85%|████████▍ | 10479/12384 [22:14:10<4:02:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 85%|████████▍ | 10479/12384 [22:14:18<4:02:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 85%|████████▍ | 10480/12384 [22:14:18<4:02:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 85%|████████▍ | 10480/12384 [22:14:25<4:02:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 85%|████████▍ | 10481/12384 [22:14:25<4:02:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 85%|████████▍ | 10481/12384 [22:14:33<4:02:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 0: 85%|████████▍ | 10482/12384 [22:14:33<4:01:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 0: 85%|████████▍ | 10482/12384 [22:14:40<4:01:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 0: 85%|████████▍ | 10483/12384 [22:14:40<4:01:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 0: 85%|████████▍ | 10483/12384 [22:14:48<4:01:12, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=8.55s]
Epoch 0: 85%|████████▍ | 10484/12384 [22:14:48<4:01:16, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=8.55s]
Epoch 0: 85%|████████▍ | 10484/12384 [22:14:56<4:01:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 0: 85%|████████▍ | 10485/12384 [22:14:56<4:01:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 0: 85%|████████▍ | 10485/12384 [22:15:03<4:01:01, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.15s]
Epoch 0: 85%|████████▍ | 10486/12384 [22:15:03<4:00:49, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.15s]
Epoch 0: 85%|████████▍ | 10486/12384 [22:15:11<4:00:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 85%|████████▍ | 10487/12384 [22:15:11<4:00:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 85%|████████▍ | 10487/12384 [22:15:18<4:00:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 0: 85%|████████▍ | 10488/12384 [22:15:18<4:00:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 0: 85%|████████▍ | 10488/12384 [22:15:26<4:00:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.69s]
Epoch 0: 85%|████████▍ | 10489/12384 [22:15:26<4:00:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.69s]
Epoch 0: 85%|████████▍ | 10489/12384 [22:15:34<4:00:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.08s]
Epoch 0: 85%|████████▍ | 10490/12384 [22:15:34<4:00:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.08s]
Epoch 0: 85%|████████▍ | 10490/12384 [22:15:41<4:00:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 85%|████████▍ | 10491/12384 [22:15:41<4:00:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 85%|████████▍ | 10491/12384 [22:15:49<4:00:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 85%|████████▍ | 10492/12384 [22:15:49<3:59:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 85%|████████▍ | 10492/12384 [22:15:57<3:59:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 0: 85%|████████▍ | 10493/12384 [22:15:57<4:00:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 0: 85%|████████▍ | 10493/12384 [22:16:04<4:00:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 85%|████████▍ | 10494/12384 [22:16:04<4:00:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 85%|████████▍ | 10494/12384 [22:16:12<4:00:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 85%|████████▍ | 10495/12384 [22:16:12<4:00:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 85%|████████▍ | 10495/12384 [22:16:20<4:00:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.94s]
Epoch 0: 85%|████████▍ | 10496/12384 [22:16:20<4:00:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.94s]
Epoch 0: 85%|████████▍ | 10496/12384 [22:16:27<4:00:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 0: 85%|████████▍ | 10497/12384 [22:16:27<4:02:40, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 0: 85%|████████▍ | 10497/12384 [22:16:35<4:02:40, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 0: 85%|████████▍ | 10498/12384 [22:16:35<4:01:18, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 0: 85%|████████▍ | 10498/12384 [22:16:43<4:01:18, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 0: 85%|████████▍ | 10499/12384 [22:16:43<4:00:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 0: 85%|████████▍ | 10499/12384 [22:16:50<4:00:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.47s]
Epoch 0: 85%|████████▍ | 10500/12384 [22:16:50<4:01:47, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.47s]
Epoch 0: 85%|████████▍ | 10500/12384 [22:16:58<4:01:47, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 0: 85%|████████▍ | 10501/12384 [22:16:58<4:00:39, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 0: 85%|████████▍ | 10501/12384 [22:17:06<4:00:39, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 0: 85%|████████▍ | 10502/12384 [22:17:06<4:00:10, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 0: 85%|████████▍ | 10502/12384 [22:17:13<4:00:10, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 0: 85%|████████▍ | 10503/12384 [22:17:13<3:59:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 0: 85%|████████▍ | 10503/12384 [22:17:21<3:59:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 85%|████████▍ | 10504/12384 [22:17:21<3:59:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 85%|████████▍ | 10504/12384 [22:17:28<3:59:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 85%|████████▍ | 10505/12384 [22:17:28<3:58:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 85%|████████▍ | 10505/12384 [22:17:36<3:58:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.55s]
Epoch 0: 85%|████████▍ | 10506/12384 [22:17:36<3:58:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.55s]
Epoch 0: 85%|████████▍ | 10506/12384 [22:17:44<3:58:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 0: 85%|████████▍ | 10507/12384 [22:17:44<3:58:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 0: 85%|████████▍ | 10507/12384 [22:17:51<3:58:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 85%|████████▍ | 10508/12384 [22:17:51<3:57:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 85%|████████▍ | 10508/12384 [22:17:59<3:57:53, 7.61s/it, loss=0.0001, acc=0.9994, iter_time=7.60s]
Epoch 0: 85%|████████▍ | 10509/12384 [22:17:59<3:57:35, 7.60s/it, loss=0.0001, acc=0.9994, iter_time=7.60s]
Epoch 0: 85%|████████▍ | 10509/12384 [22:18:06<3:57:35, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 0: 85%|████████▍ | 10510/12384 [22:18:06<3:57:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 0: 85%|████████▍ | 10510/12384 [22:18:14<3:57:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 0: 85%|████████▍ | 10511/12384 [22:18:14<3:57:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 0: 85%|████████▍ | 10511/12384 [22:18:22<3:57:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 85%|████████▍ | 10512/12384 [22:18:22<3:57:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 85%|████████▍ | 10512/12384 [22:18:29<3:57:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 85%|████████▍ | 10513/12384 [22:18:29<3:57:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 85%|████████▍ | 10513/12384 [22:18:37<3:57:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 85%|████████▍ | 10514/12384 [22:18:37<3:57:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 85%|████████▍ | 10514/12384 [22:18:45<3:57:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 85%|████████▍ | 10515/12384 [22:18:45<3:57:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 85%|████████▍ | 10515/12384 [22:18:52<3:57:46, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.97s]
Epoch 0: 85%|████████▍ | 10516/12384 [22:18:52<3:57:21, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.97s]
Epoch 0: 85%|████████▍ | 10516/12384 [22:19:00<3:57:21, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 85%|████████▍ | 10517/12384 [22:19:00<3:57:17, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 85%|████████▍ | 10517/12384 [22:19:07<3:57:17, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=5.88s]
Epoch 0: 85%|████████▍ | 10518/12384 [22:19:07<3:56:49, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=5.88s]
Epoch 0: 85%|████████▍ | 10518/12384 [22:19:15<3:56:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.33s]
Epoch 0: 85%|████████▍ | 10519/12384 [22:19:15<3:56:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.33s]
Epoch 0: 85%|████████▍ | 10519/12384 [22:19:23<3:56:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 85%|████████▍ | 10520/12384 [22:19:23<3:56:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 85%|████████▍ | 10520/12384 [22:19:30<3:56:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.57s]
Epoch 0: 85%|████████▍ | 10521/12384 [22:19:30<3:56:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.57s]
Epoch 0: 85%|████████▍ | 10521/12384 [22:19:38<3:56:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 0: 85%|████████▍ | 10522/12384 [22:19:38<3:56:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 0: 85%|████████▍ | 10522/12384 [22:19:46<3:56:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 85%|████████▍ | 10523/12384 [22:19:46<4:00:13, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 85%|████████▍ | 10523/12384 [22:19:54<4:00:13, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 85%|████████▍ | 10524/12384 [22:19:54<3:59:04, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 85%|████████▍ | 10524/12384 [22:20:01<3:59:04, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.51s]
Epoch 0: 85%|████████▍ | 10525/12384 [22:20:01<3:58:01, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.51s]
Epoch 0: 85%|████████▍ | 10525/12384 [22:20:09<3:58:01, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=10.73s]
Epoch 0: 85%|████████▍ | 10526/12384 [22:20:09<3:57:18, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=10.73s]
Epoch 0: 85%|████████▍ | 10526/12384 [22:20:16<3:57:18, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 85%|████████▌ | 10527/12384 [22:20:16<3:56:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 85%|████████▌ | 10527/12384 [22:20:24<3:56:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 0: 85%|████████▌ | 10528/12384 [22:20:24<3:58:49, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 0: 85%|████████▌ | 10528/12384 [22:20:32<3:58:49, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 85%|████████▌ | 10529/12384 [22:20:32<3:58:41, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 85%|████████▌ | 10529/12384 [22:20:40<3:58:41, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 0: 85%|████████▌ | 10530/12384 [22:20:40<3:57:35, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 0: 85%|████████▌ | 10530/12384 [22:20:47<3:57:35, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 85%|████████▌ | 10531/12384 [22:20:47<3:57:17, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 85%|████████▌ | 10531/12384 [22:20:55<3:57:17, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 85%|████████▌ | 10532/12384 [22:20:55<3:56:27, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 85%|████████▌ | 10532/12384 [22:21:03<3:56:27, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 85%|████████▌ | 10533/12384 [22:21:03<3:55:58, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 85%|████████▌ | 10533/12384 [22:21:10<3:55:58, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 85%|████████▌ | 10534/12384 [22:21:10<3:55:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 85%|████████▌ | 10534/12384 [22:21:18<3:55:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 0: 85%|████████▌ | 10535/12384 [22:21:18<3:55:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 0: 85%|████████▌ | 10535/12384 [22:21:25<3:55:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 0: 85%|████████▌ | 10536/12384 [22:21:25<3:55:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 0: 85%|████████▌ | 10536/12384 [22:21:33<3:55:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 0: 85%|████████▌ | 10537/12384 [22:21:33<3:54:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 0: 85%|████████▌ | 10537/12384 [22:21:41<3:54:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 0: 85%|████████▌ | 10538/12384 [22:21:41<3:55:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 0: 85%|████████▌ | 10538/12384 [22:21:48<3:55:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 85%|████████▌ | 10539/12384 [22:21:48<3:54:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 85%|████████▌ | 10539/12384 [22:21:56<3:54:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 85%|████████▌ | 10540/12384 [22:21:56<3:54:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 85%|████████▌ | 10540/12384 [22:22:04<3:54:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 0: 85%|████████▌ | 10541/12384 [22:22:04<3:54:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 0: 85%|████████▌ | 10541/12384 [22:22:11<3:54:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 0: 85%|████████▌ | 10542/12384 [22:22:11<3:54:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 0: 85%|████████▌ | 10542/12384 [22:22:19<3:54:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 85%|████████▌ | 10543/12384 [22:22:19<3:54:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 85%|████████▌ | 10543/12384 [22:22:26<3:54:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 0: 85%|████████▌ | 10544/12384 [22:22:26<3:53:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 0: 85%|████████▌ | 10544/12384 [22:22:34<3:53:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 85%|████████▌ | 10545/12384 [22:22:34<3:53:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 85%|████████▌ | 10545/12384 [22:22:42<3:53:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 85%|████████▌ | 10546/12384 [22:22:42<3:53:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 85%|████████▌ | 10546/12384 [22:22:49<3:53:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 85%|████████▌ | 10547/12384 [22:22:49<3:54:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 85%|████████▌ | 10547/12384 [22:22:57<3:54:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.14s]
Epoch 0: 85%|████████▌ | 10548/12384 [22:22:57<3:53:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.14s]
Epoch 0: 85%|████████▌ | 10548/12384 [22:23:05<3:53:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 0: 85%|████████▌ | 10549/12384 [22:23:05<3:56:07, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 0: 85%|████████▌ | 10549/12384 [22:23:13<3:56:07, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.48s]
Epoch 0: 85%|████████▌ | 10550/12384 [22:23:13<3:55:48, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.48s]
Epoch 0: 85%|████████▌ | 10550/12384 [22:23:20<3:55:48, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.15s]
Epoch 0: 85%|████████▌ | 10551/12384 [22:23:20<3:54:45, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.15s]
Epoch 0: 85%|████████▌ | 10551/12384 [22:23:28<3:54:45, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 0: 85%|████████▌ | 10552/12384 [22:23:28<3:54:07, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 0: 85%|████████▌ | 10552/12384 [22:23:36<3:54:07, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 85%|████████▌ | 10553/12384 [22:23:36<3:53:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 85%|████████▌ | 10553/12384 [22:23:43<3:53:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 0: 85%|████████▌ | 10554/12384 [22:23:43<3:55:47, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 0: 85%|████████▌ | 10554/12384 [22:23:51<3:55:47, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 85%|████████▌ | 10555/12384 [22:23:51<3:54:30, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 85%|████████▌ | 10555/12384 [22:23:59<3:54:30, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 85%|████████▌ | 10556/12384 [22:23:59<3:53:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 85%|████████▌ | 10556/12384 [22:24:06<3:53:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 85%|████████▌ | 10557/12384 [22:24:06<3:53:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 85%|████████▌ | 10557/12384 [22:24:14<3:53:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 85%|████████▌ | 10558/12384 [22:24:14<3:52:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 85%|████████▌ | 10558/12384 [22:24:21<3:52:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 85%|████████▌ | 10559/12384 [22:24:21<3:51:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 85%|████████▌ | 10559/12384 [22:24:29<3:51:56, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=7.56s]
Epoch 0: 85%|████████▌ | 10560/12384 [22:24:29<3:51:45, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=7.56s]
Epoch 0: 85%|████████▌ | 10560/12384 [22:24:37<3:51:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.39s]
Epoch 0: 85%|████████▌ | 10561/12384 [22:24:37<3:51:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.39s]
Epoch 0: 85%|████████▌ | 10561/12384 [22:24:44<3:51:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 0: 85%|████████▌ | 10562/12384 [22:24:44<3:52:44, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 0: 85%|████████▌ | 10562/12384 [22:24:52<3:52:44, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=4.95s]
Epoch 0: 85%|████████▌ | 10563/12384 [22:24:52<3:52:55, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=4.95s]
Epoch 0: 85%|████████▌ | 10563/12384 [22:25:00<3:52:55, 7.67s/it, loss=0.0009, acc=0.9991, iter_time=10.71s]
Epoch 0: 85%|████████▌ | 10564/12384 [22:25:00<3:52:18, 7.66s/it, loss=0.0009, acc=0.9991, iter_time=10.71s]
Epoch 0: 85%|████████▌ | 10564/12384 [22:25:07<3:52:18, 7.66s/it, loss=0.0001, acc=0.9999, iter_time=6.71s]
Epoch 0: 85%|████████▌ | 10565/12384 [22:25:07<3:51:50, 7.65s/it, loss=0.0001, acc=0.9999, iter_time=6.71s]
Epoch 0: 85%|████████▌ | 10565/12384 [22:25:15<3:51:50, 7.65s/it, loss=0.0001, acc=0.9994, iter_time=8.54s]
Epoch 0: 85%|████████▌ | 10566/12384 [22:25:15<3:51:25, 7.64s/it, loss=0.0001, acc=0.9994, iter_time=8.54s]
Epoch 0: 85%|████████▌ | 10566/12384 [22:25:23<3:51:25, 7.64s/it, loss=0.0001, acc=0.9996, iter_time=6.43s]
Epoch 0: 85%|████████▌ | 10567/12384 [22:25:23<3:51:00, 7.63s/it, loss=0.0001, acc=0.9996, iter_time=6.43s]
Epoch 0: 85%|████████▌ | 10567/12384 [22:25:30<3:51:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 0: 85%|████████▌ | 10568/12384 [22:25:30<3:50:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 0: 85%|████████▌ | 10568/12384 [22:25:38<3:50:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 0: 85%|████████▌ | 10569/12384 [22:25:38<3:50:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 0: 85%|████████▌ | 10569/12384 [22:25:45<3:50:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 0: 85%|████████▌ | 10570/12384 [22:25:45<3:50:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 0: 85%|████████▌ | 10570/12384 [22:25:53<3:50:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 0: 85%|████████▌ | 10571/12384 [22:25:53<3:50:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 0: 85%|████████▌ | 10571/12384 [22:26:01<3:50:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 0: 85%|████████▌ | 10572/12384 [22:26:01<3:50:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 0: 85%|████████▌ | 10572/12384 [22:26:08<3:50:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 0: 85%|████████▌ | 10573/12384 [22:26:08<3:49:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 0: 85%|████████▌ | 10573/12384 [22:26:16<3:49:57, 7.62s/it, loss=0.0005, acc=0.9984, iter_time=8.24s]
Epoch 0: 85%|████████▌ | 10574/12384 [22:26:16<3:49:53, 7.62s/it, loss=0.0005, acc=0.9984, iter_time=8.24s]
Epoch 0: 85%|████████▌ | 10574/12384 [22:26:24<3:49:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 85%|████████▌ | 10575/12384 [22:26:24<3:49:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 85%|████████▌ | 10575/12384 [22:26:32<3:49:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 85%|████████▌ | 10576/12384 [22:26:32<3:52:41, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 85%|████████▌ | 10576/12384 [22:26:39<3:52:41, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 0: 85%|████████▌ | 10577/12384 [22:26:39<3:51:32, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 0: 85%|████████▌ | 10577/12384 [22:26:47<3:51:32, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 0: 85%|████████▌ | 10578/12384 [22:26:47<3:51:06, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 0: 85%|████████▌ | 10578/12384 [22:26:54<3:51:06, 7.68s/it, loss=0.0001, acc=0.9998, iter_time=7.30s]
Epoch 0: 85%|████████▌ | 10579/12384 [22:26:54<3:50:58, 7.68s/it, loss=0.0001, acc=0.9998, iter_time=7.30s]
Epoch 0: 85%|████████▌ | 10579/12384 [22:27:02<3:50:58, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 0: 85%|████████▌ | 10580/12384 [22:27:02<3:50:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 0: 85%|████████▌ | 10580/12384 [22:27:10<3:50:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 0: 85%|████████▌ | 10581/12384 [22:27:10<3:49:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 0: 85%|████████▌ | 10581/12384 [22:27:17<3:49:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 0: 85%|████████▌ | 10582/12384 [22:27:17<3:49:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 0: 85%|████████▌ | 10582/12384 [22:27:25<3:49:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 0: 85%|████████▌ | 10583/12384 [22:27:25<3:48:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 0: 85%|████████▌ | 10583/12384 [22:27:33<3:48:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 0: 85%|████████▌ | 10584/12384 [22:27:33<3:49:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 0: 85%|████████▌ | 10584/12384 [22:27:40<3:49:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 85%|████████▌ | 10585/12384 [22:27:40<3:48:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 85%|████████▌ | 10585/12384 [22:27:48<3:48:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 85%|████████▌ | 10586/12384 [22:27:48<3:48:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 85%|████████▌ | 10586/12384 [22:27:55<3:48:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 85%|████████▌ | 10587/12384 [22:27:55<3:48:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 85%|████████▌ | 10587/12384 [22:28:03<3:48:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 85%|████████▌ | 10588/12384 [22:28:03<3:47:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 85%|████████▌ | 10588/12384 [22:28:11<3:47:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 86%|████████▌ | 10589/12384 [22:28:11<3:47:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 86%|████████▌ | 10589/12384 [22:28:18<3:47:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 86%|████████▌ | 10590/12384 [22:28:18<3:47:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 86%|████████▌ | 10590/12384 [22:28:26<3:47:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 86%|████████▌ | 10591/12384 [22:28:26<3:47:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 86%|████████▌ | 10591/12384 [22:28:33<3:47:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 0: 86%|████████▌ | 10592/12384 [22:28:33<3:47:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 0: 86%|████████▌ | 10592/12384 [22:28:41<3:47:08, 7.61s/it, loss=0.0001, acc=0.9992, iter_time=7.34s]
Epoch 0: 86%|████████▌ | 10593/12384 [22:28:41<3:47:11, 7.61s/it, loss=0.0001, acc=0.9992, iter_time=7.34s]
Epoch 0: 86%|████████▌ | 10593/12384 [22:28:49<3:47:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 0: 86%|████████▌ | 10594/12384 [22:28:49<3:47:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 0: 86%|████████▌ | 10594/12384 [22:28:56<3:47:07, 7.61s/it, loss=0.0001, acc=0.9992, iter_time=7.62s]
Epoch 0: 86%|████████▌ | 10595/12384 [22:28:56<3:46:51, 7.61s/it, loss=0.0001, acc=0.9992, iter_time=7.62s]
Epoch 0: 86%|████████▌ | 10595/12384 [22:29:04<3:46:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 0: 86%|████████▌ | 10596/12384 [22:29:04<3:46:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 0: 86%|████████▌ | 10596/12384 [22:29:12<3:46:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 0: 86%|████████▌ | 10597/12384 [22:29:12<3:46:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 0: 86%|████████▌ | 10597/12384 [22:29:19<3:46:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 0: 86%|████████▌ | 10598/12384 [22:29:19<3:46:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 0: 86%|████████▌ | 10598/12384 [22:29:27<3:46:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 86%|████████▌ | 10599/12384 [22:29:27<3:46:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 86%|████████▌ | 10599/12384 [22:29:34<3:46:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 86%|████████▌ | 10600/12384 [22:29:34<3:46:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 86%|████████▌ | 10600/12384 [22:29:42<3:46:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 86%|████████▌ | 10601/12384 [22:29:42<3:46:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 86%|████████▌ | 10601/12384 [22:29:50<3:46:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 0: 86%|████████▌ | 10602/12384 [22:29:50<3:48:57, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 0: 86%|████████▌ | 10602/12384 [22:29:57<3:48:57, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 0: 86%|████████▌ | 10603/12384 [22:29:57<3:47:49, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 0: 86%|████████▌ | 10603/12384 [22:30:05<3:47:49, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 86%|████████▌ | 10604/12384 [22:30:05<3:47:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 86%|████████▌ | 10604/12384 [22:30:13<3:47:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 86%|████████▌ | 10605/12384 [22:30:13<3:46:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 86%|████████▌ | 10605/12384 [22:30:20<3:46:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 0: 86%|████████▌ | 10606/12384 [22:30:20<3:46:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 0: 86%|████████▌ | 10606/12384 [22:30:28<3:46:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.59s]
Epoch 0: 86%|████████▌ | 10607/12384 [22:30:28<3:45:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.59s]
Epoch 0: 86%|████████▌ | 10607/12384 [22:30:36<3:45:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.50s]
Epoch 0: 86%|████████▌ | 10608/12384 [22:30:36<3:45:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.50s]
Epoch 0: 86%|████████▌ | 10608/12384 [22:30:43<3:45:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 86%|████████▌ | 10609/12384 [22:30:43<3:45:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 86%|████████▌ | 10609/12384 [22:30:51<3:45:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 86%|████████▌ | 10610/12384 [22:30:51<3:45:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 86%|████████▌ | 10610/12384 [22:30:58<3:45:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 86%|████████▌ | 10611/12384 [22:30:58<3:44:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 86%|████████▌ | 10611/12384 [22:31:06<3:44:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 0: 86%|████████▌ | 10612/12384 [22:31:06<3:44:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 0: 86%|████████▌ | 10612/12384 [22:31:14<3:44:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 0: 86%|████████▌ | 10613/12384 [22:31:14<3:44:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 0: 86%|████████▌ | 10613/12384 [22:31:21<3:44:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 0: 86%|████████▌ | 10614/12384 [22:31:21<3:45:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 0: 86%|████████▌ | 10614/12384 [22:31:29<3:45:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 0: 86%|████████▌ | 10615/12384 [22:31:29<3:44:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 0: 86%|████████▌ | 10615/12384 [22:31:36<3:44:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.77s]
Epoch 0: 86%|████████▌ | 10616/12384 [22:31:36<3:44:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.77s]
Epoch 0: 86%|████████▌ | 10616/12384 [22:31:44<3:44:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 86%|████████▌ | 10617/12384 [22:31:44<3:44:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 86%|████████▌ | 10617/12384 [22:31:52<3:44:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.78s]
Epoch 0: 86%|████████▌ | 10618/12384 [22:31:52<3:44:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.78s]
Epoch 0: 86%|████████▌ | 10618/12384 [22:31:59<3:44:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 86%|████████▌ | 10619/12384 [22:31:59<3:44:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 86%|████████▌ | 10619/12384 [22:32:07<3:44:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 0: 86%|████████▌ | 10620/12384 [22:32:07<3:43:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 0: 86%|████████▌ | 10620/12384 [22:32:15<3:43:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 86%|████████▌ | 10621/12384 [22:32:15<3:44:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 86%|████████▌ | 10621/12384 [22:32:22<3:44:23, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 86%|████████▌ | 10622/12384 [22:32:22<3:44:13, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 86%|████████▌ | 10622/12384 [22:32:30<3:44:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 0: 86%|████████▌ | 10623/12384 [22:32:30<3:43:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 0: 86%|████████▌ | 10623/12384 [22:32:37<3:43:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.82s]
Epoch 0: 86%|████████▌ | 10624/12384 [22:32:37<3:43:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.82s]
Epoch 0: 86%|████████▌ | 10624/12384 [22:32:45<3:43:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 86%|████████▌ | 10625/12384 [22:32:45<3:43:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 86%|████████▌ | 10625/12384 [22:32:53<3:43:26, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 86%|████████▌ | 10626/12384 [22:32:53<3:43:03, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 86%|████████▌ | 10626/12384 [22:33:00<3:43:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 86%|████████▌ | 10627/12384 [22:33:00<3:42:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 86%|████████▌ | 10627/12384 [22:33:08<3:42:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 86%|████████▌ | 10628/12384 [22:33:08<3:42:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 86%|████████▌ | 10628/12384 [22:33:16<3:42:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 86%|████████▌ | 10629/12384 [22:33:16<3:45:30, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 86%|████████▌ | 10629/12384 [22:33:23<3:45:30, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.90s]
Epoch 0: 86%|████████▌ | 10630/12384 [22:33:23<3:44:31, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.90s]
Epoch 0: 86%|████████▌ | 10630/12384 [22:33:31<3:44:31, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 86%|████████▌ | 10631/12384 [22:33:31<3:43:43, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 86%|████████▌ | 10631/12384 [22:33:39<3:43:43, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 0: 86%|████████▌ | 10632/12384 [22:33:39<3:43:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 0: 86%|████████▌ | 10632/12384 [22:33:47<3:43:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 86%|████████▌ | 10633/12384 [22:33:47<3:44:58, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 86%|████████▌ | 10633/12384 [22:33:54<3:44:58, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.78s]
Epoch 0: 86%|████████▌ | 10634/12384 [22:33:54<3:44:02, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.78s]
Epoch 0: 86%|████████▌ | 10634/12384 [22:34:02<3:44:02, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 0: 86%|████████▌ | 10635/12384 [22:34:02<3:43:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 0: 86%|████████▌ | 10635/12384 [22:34:09<3:43:21, 7.66s/it, loss=0.0001, acc=0.9998, iter_time=7.60s]
Epoch 0: 86%|████████▌ | 10636/12384 [22:34:09<3:42:51, 7.65s/it, loss=0.0001, acc=0.9998, iter_time=7.60s]
Epoch 0: 86%|████████▌ | 10636/12384 [22:34:17<3:42:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 86%|████████▌ | 10637/12384 [22:34:17<3:42:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 86%|████████▌ | 10637/12384 [22:34:25<3:42:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 0: 86%|████████▌ | 10638/12384 [22:34:25<3:41:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 0: 86%|████████▌ | 10638/12384 [22:34:32<3:41:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.39s]
Epoch 0: 86%|████████▌ | 10639/12384 [22:34:32<3:41:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.39s]
Epoch 0: 86%|████████▌ | 10639/12384 [22:34:40<3:41:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 86%|████████▌ | 10640/12384 [22:34:40<3:41:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 86%|████████▌ | 10640/12384 [22:34:47<3:41:35, 7.62s/it, loss=0.0004, acc=0.9979, iter_time=4.05s]
Epoch 0: 86%|████████▌ | 10641/12384 [22:34:47<3:41:09, 7.61s/it, loss=0.0004, acc=0.9979, iter_time=4.05s]
Epoch 0: 86%|████████▌ | 10641/12384 [22:34:55<3:41:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.24s]
Epoch 0: 86%|████████▌ | 10642/12384 [22:34:55<3:41:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.24s]
Epoch 0: 86%|████████▌ | 10642/12384 [22:35:03<3:41:16, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.78s]
Epoch 0: 86%|████████▌ | 10643/12384 [22:35:03<3:41:05, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.78s]
Epoch 0: 86%|████████▌ | 10643/12384 [22:35:10<3:41:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 0: 86%|████████▌ | 10644/12384 [22:35:10<3:40:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 0: 86%|████████▌ | 10644/12384 [22:35:18<3:40:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 0: 86%|████████▌ | 10645/12384 [22:35:18<3:40:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 0: 86%|████████▌ | 10645/12384 [22:35:26<3:40:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.41s]
Epoch 0: 86%|████████▌ | 10646/12384 [22:35:26<3:40:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.41s]
Epoch 0: 86%|████████▌ | 10646/12384 [22:35:33<3:40:26, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.12s]
Epoch 0: 86%|████████▌ | 10647/12384 [22:35:33<3:40:22, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.12s]
Epoch 0: 86%|████████▌ | 10647/12384 [22:35:41<3:40:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 86%|████████▌ | 10648/12384 [22:35:41<3:40:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 86%|████████▌ | 10648/12384 [22:35:48<3:40:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 0: 86%|████████▌ | 10649/12384 [22:35:48<3:39:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 0: 86%|████████▌ | 10649/12384 [22:35:56<3:39:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.79s]
Epoch 0: 86%|████████▌ | 10650/12384 [22:35:56<3:39:43, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.79s]
Epoch 0: 86%|████████▌ | 10650/12384 [22:36:04<3:39:43, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.19s]
Epoch 0: 86%|████████▌ | 10651/12384 [22:36:04<3:39:43, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.19s]
Epoch 0: 86%|████████▌ | 10651/12384 [22:36:11<3:39:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 0: 86%|████████▌ | 10652/12384 [22:36:11<3:39:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 0: 86%|████████▌ | 10652/12384 [22:36:19<3:39:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.27s]
Epoch 0: 86%|████████▌ | 10653/12384 [22:36:19<3:39:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.27s]
Epoch 0: 86%|████████▌ | 10653/12384 [22:36:26<3:39:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 0: 86%|████████▌ | 10654/12384 [22:36:26<3:39:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 0: 86%|████████▌ | 10654/12384 [22:36:34<3:39:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 86%|████████▌ | 10655/12384 [22:36:34<3:42:16, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 86%|████████▌ | 10655/12384 [22:36:42<3:42:16, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 0: 86%|████████▌ | 10656/12384 [22:36:42<3:41:15, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 0: 86%|████████▌ | 10656/12384 [22:36:50<3:41:15, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 86%|████████▌ | 10657/12384 [22:36:50<3:40:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 86%|████████▌ | 10657/12384 [22:36:57<3:40:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 86%|████████▌ | 10658/12384 [22:36:57<3:40:01, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 86%|████████▌ | 10658/12384 [22:37:05<3:40:01, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 86%|████████▌ | 10659/12384 [22:37:05<3:42:01, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 86%|████████▌ | 10659/12384 [22:37:13<3:42:01, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 86%|████████▌ | 10660/12384 [22:37:13<3:41:03, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 86%|████████▌ | 10660/12384 [22:37:20<3:41:03, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 0: 86%|████████▌ | 10661/12384 [22:37:20<3:40:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 0: 86%|████████▌ | 10661/12384 [22:37:28<3:40:13, 7.67s/it, loss=0.0001, acc=0.9997, iter_time=9.39s]
Epoch 0: 86%|████████▌ | 10662/12384 [22:37:28<3:39:35, 7.65s/it, loss=0.0001, acc=0.9997, iter_time=9.39s]
Epoch 0: 86%|████████▌ | 10662/12384 [22:37:36<3:39:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 0: 86%|████████▌ | 10663/12384 [22:37:36<3:40:11, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 0: 86%|████████▌ | 10663/12384 [22:37:43<3:40:11, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 0: 86%|████████▌ | 10664/12384 [22:37:43<3:39:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 0: 86%|████████▌ | 10664/12384 [22:37:51<3:39:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.75s]
Epoch 0: 86%|████████▌ | 10665/12384 [22:37:51<3:38:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.75s]
Epoch 0: 86%|████████▌ | 10665/12384 [22:37:58<3:38:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 0: 86%|████████▌ | 10666/12384 [22:37:58<3:38:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 0: 86%|████████▌ | 10666/12384 [22:38:06<3:38:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 86%|████████▌ | 10667/12384 [22:38:06<3:38:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 86%|████████▌ | 10667/12384 [22:38:14<3:38:05, 7.62s/it, loss=0.0000, acc=0.9999, iter_time=7.63s]
Epoch 0: 86%|████████▌ | 10668/12384 [22:38:14<3:38:03, 7.62s/it, loss=0.0000, acc=0.9999, iter_time=7.63s]
Epoch 0: 86%|████████▌ | 10668/12384 [22:38:21<3:38:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 0: 86%|████████▌ | 10669/12384 [22:38:21<3:38:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 0: 86%|████████▌ | 10669/12384 [22:38:29<3:38:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.76s]
Epoch 0: 86%|████████▌ | 10670/12384 [22:38:29<3:37:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.76s]
Epoch 0: 86%|████████▌ | 10670/12384 [22:38:37<3:37:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 86%|████████▌ | 10671/12384 [22:38:37<3:37:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 86%|████████▌ | 10671/12384 [22:38:44<3:37:37, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.01s]
Epoch 0: 86%|████████▌ | 10672/12384 [22:38:44<3:37:19, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.01s]
Epoch 0: 86%|████████▌ | 10672/12384 [22:38:52<3:37:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 86%|████████▌ | 10673/12384 [22:38:52<3:37:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 86%|████████▌ | 10673/12384 [22:38:59<3:37:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 0: 86%|████████▌ | 10674/12384 [22:38:59<3:36:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 0: 86%|████████▌ | 10674/12384 [22:39:07<3:36:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 0: 86%|████████▌ | 10675/12384 [22:39:07<3:36:32, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 0: 86%|████████▌ | 10675/12384 [22:39:15<3:36:32, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 0: 86%|████████▌ | 10676/12384 [22:39:15<3:36:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 0: 86%|████████▌ | 10676/12384 [22:39:22<3:36:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.36s]
Epoch 0: 86%|████████▌ | 10677/12384 [22:39:22<3:36:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.36s]
Epoch 0: 86%|████████▌ | 10677/12384 [22:39:30<3:36:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.94s]
Epoch 0: 86%|████████▌ | 10678/12384 [22:39:30<3:36:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.94s]
Epoch 0: 86%|████████▌ | 10678/12384 [22:39:37<3:36:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 86%|████████▌ | 10679/12384 [22:39:37<3:36:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 86%|████████▌ | 10679/12384 [22:39:45<3:36:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 86%|████████▌ | 10680/12384 [22:39:45<3:36:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 86%|████████▌ | 10680/12384 [22:39:53<3:36:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 0: 86%|████████▌ | 10681/12384 [22:39:53<3:38:58, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 0: 86%|████████▌ | 10681/12384 [22:40:01<3:38:58, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 0: 86%|████████▋ | 10682/12384 [22:40:01<3:38:31, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 0: 86%|████████▋ | 10682/12384 [22:40:08<3:38:31, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 86%|████████▋ | 10683/12384 [22:40:08<3:37:31, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 86%|████████▋ | 10683/12384 [22:40:16<3:37:31, 7.67s/it, loss=0.0010, acc=0.9971, iter_time=6.39s]
Epoch 0: 86%|████████▋ | 10684/12384 [22:40:16<3:36:46, 7.65s/it, loss=0.0010, acc=0.9971, iter_time=6.39s]
Epoch 0: 86%|████████▋ | 10684/12384 [22:40:24<3:36:46, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=9.10s]
Epoch 0: 86%|████████▋ | 10685/12384 [22:40:24<3:38:29, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=9.10s]
Epoch 0: 86%|████████▋ | 10685/12384 [22:40:31<3:38:29, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=4.57s]
Epoch 0: 86%|████████▋ | 10686/12384 [22:40:31<3:37:25, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=4.57s]
Epoch 0: 86%|████████▋ | 10686/12384 [22:40:39<3:37:25, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 0: 86%|████████▋ | 10687/12384 [22:40:39<3:37:05, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 0: 86%|████████▋ | 10687/12384 [22:40:47<3:37:05, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 86%|████████▋ | 10688/12384 [22:40:47<3:36:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 86%|████████▋ | 10688/12384 [22:40:54<3:36:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 0: 86%|████████▋ | 10689/12384 [22:40:54<3:35:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 0: 86%|████████▋ | 10689/12384 [22:41:02<3:35:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 0: 86%|████████▋ | 10690/12384 [22:41:02<3:35:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 0: 86%|████████▋ | 10690/12384 [22:41:09<3:35:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.95s]
Epoch 0: 86%|████████▋ | 10691/12384 [22:41:09<3:35:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.95s]
Epoch 0: 86%|████████▋ | 10691/12384 [22:41:17<3:35:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.58s]
Epoch 0: 86%|████████▋ | 10692/12384 [22:41:17<3:34:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.58s]
Epoch 0: 86%|████████▋ | 10692/12384 [22:41:25<3:34:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 86%|████████▋ | 10693/12384 [22:41:25<3:34:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 86%|████████▋ | 10693/12384 [22:41:32<3:34:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 86%|████████▋ | 10694/12384 [22:41:32<3:34:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 86%|████████▋ | 10694/12384 [22:41:40<3:34:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 86%|████████▋ | 10695/12384 [22:41:40<3:34:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 86%|████████▋ | 10695/12384 [22:41:47<3:34:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 0: 86%|████████▋ | 10696/12384 [22:41:47<3:33:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 0: 86%|████████▋ | 10696/12384 [22:41:55<3:33:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.00s]
Epoch 0: 86%|████████▋ | 10697/12384 [22:41:55<3:33:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.00s]
Epoch 0: 86%|████████▋ | 10697/12384 [22:42:03<3:33:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 0: 86%|████████▋ | 10698/12384 [22:42:03<3:33:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 0: 86%|████████▋ | 10698/12384 [22:42:10<3:33:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 86%|████████▋ | 10699/12384 [22:42:10<3:33:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 86%|████████▋ | 10699/12384 [22:42:18<3:33:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 86%|████████▋ | 10700/12384 [22:42:18<3:33:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 86%|████████▋ | 10700/12384 [22:42:26<3:33:43, 7.61s/it, loss=0.0004, acc=0.9985, iter_time=5.40s]
Epoch 0: 86%|████████▋ | 10701/12384 [22:42:26<3:33:34, 7.61s/it, loss=0.0004, acc=0.9985, iter_time=5.40s]
Epoch 0: 86%|████████▋ | 10701/12384 [22:42:33<3:33:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 0: 86%|████████▋ | 10702/12384 [22:42:33<3:33:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 0: 86%|████████▋ | 10702/12384 [22:42:41<3:33:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 86%|████████▋ | 10703/12384 [22:42:41<3:33:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 86%|████████▋ | 10703/12384 [22:42:48<3:33:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 0: 86%|████████▋ | 10704/12384 [22:42:48<3:33:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 0: 86%|████████▋ | 10704/12384 [22:42:56<3:33:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 86%|████████▋ | 10705/12384 [22:42:56<3:33:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 86%|████████▋ | 10705/12384 [22:43:04<3:33:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 86%|████████▋ | 10706/12384 [22:43:04<3:33:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 86%|████████▋ | 10706/12384 [22:43:12<3:33:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 86%|████████▋ | 10707/12384 [22:43:12<3:35:28, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 86%|████████▋ | 10707/12384 [22:43:19<3:35:28, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=6.13s]
Epoch 0: 86%|████████▋ | 10708/12384 [22:43:19<3:35:28, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=6.13s]
Epoch 0: 86%|████████▋ | 10708/12384 [22:43:27<3:35:28, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.47s]
Epoch 0: 86%|████████▋ | 10709/12384 [22:43:27<3:34:31, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.47s]
Epoch 0: 86%|████████▋ | 10709/12384 [22:43:34<3:34:31, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 86%|████████▋ | 10710/12384 [22:43:34<3:33:39, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 86%|████████▋ | 10710/12384 [22:43:42<3:33:39, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 0: 86%|████████▋ | 10711/12384 [22:43:42<3:33:56, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 0: 86%|████████▋ | 10711/12384 [22:43:50<3:33:56, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.99s]
Epoch 0: 86%|████████▋ | 10712/12384 [22:43:50<3:33:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.99s]
Epoch 0: 86%|████████▋ | 10712/12384 [22:43:57<3:33:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.64s]
Epoch 0: 87%|████████▋ | 10713/12384 [22:43:57<3:32:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.64s]
Epoch 0: 87%|████████▋ | 10713/12384 [22:44:05<3:32:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 0: 87%|████████▋ | 10714/12384 [22:44:05<3:33:17, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 0: 87%|████████▋ | 10714/12384 [22:44:13<3:33:17, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 87%|████████▋ | 10715/12384 [22:44:13<3:32:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 87%|████████▋ | 10715/12384 [22:44:20<3:32:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 87%|████████▋ | 10716/12384 [22:44:20<3:32:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 87%|████████▋ | 10716/12384 [22:44:28<3:32:08, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 87%|████████▋ | 10717/12384 [22:44:28<3:31:50, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 87%|████████▋ | 10717/12384 [22:44:36<3:31:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 0: 87%|████████▋ | 10718/12384 [22:44:36<3:32:40, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 0: 87%|████████▋ | 10718/12384 [22:44:43<3:32:40, 7.66s/it, loss=0.0001, acc=0.9991, iter_time=10.32s]
Epoch 0: 87%|████████▋ | 10719/12384 [22:44:43<3:32:07, 7.64s/it, loss=0.0001, acc=0.9991, iter_time=10.32s]
Epoch 0: 87%|████████▋ | 10719/12384 [22:44:51<3:32:07, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.54s]
Epoch 0: 87%|████████▋ | 10720/12384 [22:44:51<3:31:29, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.54s]
Epoch 0: 87%|████████▋ | 10720/12384 [22:44:59<3:31:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 0: 87%|████████▋ | 10721/12384 [22:44:59<3:31:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 0: 87%|████████▋ | 10721/12384 [22:45:06<3:31:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.22s]
Epoch 0: 87%|████████▋ | 10722/12384 [22:45:06<3:31:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.22s]
Epoch 0: 87%|████████▋ | 10722/12384 [22:45:14<3:31:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 87%|████████▋ | 10723/12384 [22:45:14<3:31:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 87%|████████▋ | 10723/12384 [22:45:21<3:31:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 87%|████████▋ | 10724/12384 [22:45:21<3:30:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 87%|████████▋ | 10724/12384 [22:45:29<3:30:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 0: 87%|████████▋ | 10725/12384 [22:45:29<3:30:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 0: 87%|████████▋ | 10725/12384 [22:45:37<3:30:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 0: 87%|████████▋ | 10726/12384 [22:45:37<3:30:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 0: 87%|████████▋ | 10726/12384 [22:45:44<3:30:30, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=4.91s]
Epoch 0: 87%|████████▋ | 10727/12384 [22:45:44<3:30:12, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=4.91s]
Epoch 0: 87%|████████▋ | 10727/12384 [22:45:52<3:30:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.84s]
Epoch 0: 87%|████████▋ | 10728/12384 [22:45:52<3:30:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.84s]
Epoch 0: 87%|████████▋ | 10728/12384 [22:46:00<3:30:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 87%|████████▋ | 10729/12384 [22:46:00<3:30:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 87%|████████▋ | 10729/12384 [22:46:07<3:30:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.16s]
Epoch 0: 87%|████████▋ | 10730/12384 [22:46:07<3:30:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.16s]
Epoch 0: 87%|████████▋ | 10730/12384 [22:46:15<3:30:45, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=10.21s]
Epoch 0: 87%|████████▋ | 10731/12384 [22:46:15<3:30:06, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=10.21s]
Epoch 0: 87%|████████▋ | 10731/12384 [22:46:22<3:30:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 87%|████████▋ | 10732/12384 [22:46:22<3:29:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 87%|████████▋ | 10732/12384 [22:46:30<3:29:50, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=7.44s]
Epoch 0: 87%|████████▋ | 10733/12384 [22:46:30<3:32:07, 7.71s/it, loss=0.0001, acc=0.9998, iter_time=7.44s]
Epoch 0: 87%|████████▋ | 10733/12384 [22:46:38<3:32:07, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 0: 87%|████████▋ | 10734/12384 [22:46:38<3:31:16, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 0: 87%|████████▋ | 10734/12384 [22:46:46<3:31:16, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 87%|████████▋ | 10735/12384 [22:46:46<3:30:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 87%|████████▋ | 10735/12384 [22:46:53<3:30:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 0: 87%|████████▋ | 10736/12384 [22:46:53<3:29:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 0: 87%|████████▋ | 10736/12384 [22:47:01<3:29:45, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.48s]
Epoch 0: 87%|████████▋ | 10737/12384 [22:47:01<3:31:33, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.48s]
Epoch 0: 87%|████████▋ | 10737/12384 [22:47:09<3:31:33, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 0: 87%|████████▋ | 10738/12384 [22:47:09<3:30:36, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 0: 87%|████████▋ | 10738/12384 [22:47:16<3:30:36, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.87s]
Epoch 0: 87%|████████▋ | 10739/12384 [22:47:16<3:29:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.87s]
Epoch 0: 87%|████████▋ | 10739/12384 [22:47:24<3:29:45, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=9.86s]
Epoch 0: 87%|████████▋ | 10740/12384 [22:47:24<3:29:13, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=9.86s]
Epoch 0: 87%|████████▋ | 10740/12384 [22:47:31<3:29:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 87%|████████▋ | 10741/12384 [22:47:31<3:28:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 87%|████████▋ | 10741/12384 [22:47:39<3:28:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 87%|████████▋ | 10742/12384 [22:47:39<3:28:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 87%|████████▋ | 10742/12384 [22:47:47<3:28:42, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=6.70s]
Epoch 0: 87%|████████▋ | 10743/12384 [22:47:47<3:28:53, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=6.70s]
Epoch 0: 87%|████████▋ | 10743/12384 [22:47:54<3:28:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 0: 87%|████████▋ | 10744/12384 [22:47:54<3:28:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 0: 87%|████████▋ | 10744/12384 [22:48:02<3:28:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 87%|████████▋ | 10745/12384 [22:48:02<3:28:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 87%|████████▋ | 10745/12384 [22:48:10<3:28:19, 7.63s/it, loss=0.0004, acc=0.9985, iter_time=4.56s]
Epoch 0: 87%|████████▋ | 10746/12384 [22:48:10<3:28:14, 7.63s/it, loss=0.0004, acc=0.9985, iter_time=4.56s]
Epoch 0: 87%|████████▋ | 10746/12384 [22:48:17<3:28:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.20s]
Epoch 0: 87%|████████▋ | 10747/12384 [22:48:17<3:27:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.20s]
Epoch 0: 87%|████████▋ | 10747/12384 [22:48:25<3:27:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 0: 87%|████████▋ | 10748/12384 [22:48:25<3:27:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 0: 87%|████████▋ | 10748/12384 [22:48:32<3:27:26, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 87%|████████▋ | 10749/12384 [22:48:32<3:27:34, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 87%|████████▋ | 10749/12384 [22:48:40<3:27:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 87%|████████▋ | 10750/12384 [22:48:40<3:27:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 87%|████████▋ | 10750/12384 [22:48:48<3:27:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 87%|████████▋ | 10751/12384 [22:48:48<3:27:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 87%|████████▋ | 10751/12384 [22:48:55<3:27:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 87%|████████▋ | 10752/12384 [22:48:55<3:27:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 87%|████████▋ | 10752/12384 [22:49:03<3:27:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 0: 87%|████████▋ | 10753/12384 [22:49:03<3:27:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 0: 87%|████████▋ | 10753/12384 [22:49:10<3:27:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 0: 87%|████████▋ | 10754/12384 [22:49:10<3:27:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 0: 87%|████████▋ | 10754/12384 [22:49:18<3:27:02, 7.62s/it, loss=0.0004, acc=0.9988, iter_time=9.40s]
Epoch 0: 87%|████████▋ | 10755/12384 [22:49:18<3:26:41, 7.61s/it, loss=0.0004, acc=0.9988, iter_time=9.40s]
Epoch 0: 87%|████████▋ | 10755/12384 [22:49:26<3:26:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 87%|████████▋ | 10756/12384 [22:49:26<3:26:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 87%|████████▋ | 10756/12384 [22:49:33<3:26:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 87%|████████▋ | 10757/12384 [22:49:33<3:26:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 87%|████████▋ | 10757/12384 [22:49:41<3:26:23, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 87%|████████▋ | 10758/12384 [22:49:41<3:26:09, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 87%|████████▋ | 10758/12384 [22:49:49<3:26:09, 7.61s/it, loss=0.0008, acc=0.9979, iter_time=6.40s]
Epoch 0: 87%|████████▋ | 10759/12384 [22:49:49<3:26:01, 7.61s/it, loss=0.0008, acc=0.9979, iter_time=6.40s]
Epoch 0: 87%|████████▋ | 10759/12384 [22:49:56<3:26:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.25s]
Epoch 0: 87%|████████▋ | 10760/12384 [22:49:56<3:28:30, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.25s]
Epoch 0: 87%|████████▋ | 10760/12384 [22:50:04<3:28:30, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.89s]
Epoch 0: 87%|████████▋ | 10761/12384 [22:50:04<3:27:46, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.89s]
Epoch 0: 87%|████████▋ | 10761/12384 [22:50:12<3:27:46, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 87%|████████▋ | 10762/12384 [22:50:12<3:27:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 87%|████████▋ | 10762/12384 [22:50:19<3:27:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 0: 87%|████████▋ | 10763/12384 [22:50:19<3:26:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 0: 87%|████████▋ | 10763/12384 [22:50:27<3:26:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 0: 87%|████████▋ | 10764/12384 [22:50:27<3:26:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 0: 87%|████████▋ | 10764/12384 [22:50:34<3:26:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.86s]
Epoch 0: 87%|████████▋ | 10765/12384 [22:50:34<3:25:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.86s]
Epoch 0: 87%|████████▋ | 10765/12384 [22:50:42<3:25:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 0: 87%|████████▋ | 10766/12384 [22:50:42<3:25:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 0: 87%|████████▋ | 10766/12384 [22:50:50<3:25:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 0: 87%|████████▋ | 10767/12384 [22:50:50<3:25:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 0: 87%|████████▋ | 10767/12384 [22:50:57<3:25:33, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=10.59s]
Epoch 0: 87%|████████▋ | 10768/12384 [22:50:57<3:25:37, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=10.59s]
Epoch 0: 87%|████████▋ | 10768/12384 [22:51:05<3:25:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.15s]
Epoch 0: 87%|████████▋ | 10769/12384 [22:51:05<3:25:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.15s]
Epoch 0: 87%|████████▋ | 10769/12384 [22:51:13<3:25:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 0: 87%|████████▋ | 10770/12384 [22:51:13<3:24:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 0: 87%|████████▋ | 10770/12384 [22:51:20<3:24:56, 7.62s/it, loss=0.0007, acc=0.9973, iter_time=8.14s]
Epoch 0: 87%|████████▋ | 10771/12384 [22:51:20<3:24:35, 7.61s/it, loss=0.0007, acc=0.9973, iter_time=8.14s]
Epoch 0: 87%|████████▋ | 10771/12384 [22:51:28<3:24:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 87%|████████▋ | 10772/12384 [22:51:28<3:24:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 87%|████████▋ | 10772/12384 [22:51:35<3:24:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 0: 87%|████████▋ | 10773/12384 [22:51:35<3:24:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 0: 87%|████████▋ | 10773/12384 [22:51:43<3:24:20, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.92s]
Epoch 0: 87%|████████▋ | 10774/12384 [22:51:43<3:24:16, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.92s]
Epoch 0: 87%|████████▋ | 10774/12384 [22:51:51<3:24:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 0: 87%|████████▋ | 10775/12384 [22:51:51<3:24:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 0: 87%|████████▋ | 10775/12384 [22:51:58<3:24:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 0: 87%|████████▋ | 10776/12384 [22:51:58<3:24:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 0: 87%|████████▋ | 10776/12384 [22:52:06<3:24:07, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 87%|████████▋ | 10777/12384 [22:52:06<3:24:06, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 87%|████████▋ | 10777/12384 [22:52:14<3:24:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 0: 87%|████████▋ | 10778/12384 [22:52:14<3:23:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 0: 87%|████████▋ | 10778/12384 [22:52:21<3:23:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 0: 87%|████████▋ | 10779/12384 [22:52:21<3:23:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 0: 87%|████████▋ | 10779/12384 [22:52:29<3:23:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 87%|████████▋ | 10780/12384 [22:52:29<3:23:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 87%|████████▋ | 10780/12384 [22:52:36<3:23:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 87%|████████▋ | 10781/12384 [22:52:36<3:23:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 87%|████████▋ | 10781/12384 [22:52:44<3:23:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.99s]
Epoch 0: 87%|████████▋ | 10782/12384 [22:52:44<3:23:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.99s]
Epoch 0: 87%|████████▋ | 10782/12384 [22:52:52<3:23:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.21s]
Epoch 0: 87%|████████▋ | 10783/12384 [22:52:52<3:23:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.21s]
Epoch 0: 87%|████████▋ | 10783/12384 [22:52:59<3:23:00, 7.61s/it, loss=0.0001, acc=0.9988, iter_time=7.57s]
Epoch 0: 87%|████████▋ | 10784/12384 [22:52:59<3:23:01, 7.61s/it, loss=0.0001, acc=0.9988, iter_time=7.57s]
Epoch 0: 87%|████████▋ | 10784/12384 [22:53:07<3:23:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 87%|████████▋ | 10785/12384 [22:53:07<3:22:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 87%|████████▋ | 10785/12384 [22:53:15<3:22:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 87%|████████▋ | 10786/12384 [22:53:15<3:25:26, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 87%|████████▋ | 10786/12384 [22:53:22<3:25:26, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 0: 87%|████████▋ | 10787/12384 [22:53:22<3:24:24, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 0: 87%|████████▋ | 10787/12384 [22:53:30<3:24:24, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=7.63s]
Epoch 0: 87%|████████▋ | 10788/12384 [22:53:30<3:23:45, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.63s]
Epoch 0: 87%|████████▋ | 10788/12384 [22:53:38<3:23:45, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 0: 87%|████████▋ | 10789/12384 [22:53:38<3:23:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 0: 87%|████████▋ | 10789/12384 [22:53:45<3:23:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 0: 87%|████████▋ | 10790/12384 [22:53:45<3:22:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 0: 87%|████████▋ | 10790/12384 [22:53:53<3:22:42, 7.63s/it, loss=0.0008, acc=0.9976, iter_time=8.52s]
Epoch 0: 87%|████████▋ | 10791/12384 [22:53:53<3:22:20, 7.62s/it, loss=0.0008, acc=0.9976, iter_time=8.52s]
Epoch 0: 87%|████████▋ | 10791/12384 [22:54:00<3:22:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 87%|████████▋ | 10792/12384 [22:54:00<3:22:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 87%|████████▋ | 10792/12384 [22:54:08<3:22:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 0: 87%|████████▋ | 10793/12384 [22:54:08<3:22:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 0: 87%|████████▋ | 10793/12384 [22:54:16<3:22:40, 7.64s/it, loss=0.0004, acc=0.9985, iter_time=7.63s]
Epoch 0: 87%|████████▋ | 10794/12384 [22:54:16<3:22:32, 7.64s/it, loss=0.0004, acc=0.9985, iter_time=7.63s]
Epoch 0: 87%|████████▋ | 10794/12384 [22:54:23<3:22:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 0: 87%|████████▋ | 10795/12384 [22:54:23<3:22:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 0: 87%|████████▋ | 10795/12384 [22:54:31<3:22:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 0: 87%|████████▋ | 10796/12384 [22:54:31<3:22:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 0: 87%|████████▋ | 10796/12384 [22:54:39<3:22:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.27s]
Epoch 0: 87%|████████▋ | 10797/12384 [22:54:39<3:21:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.27s]
Epoch 0: 87%|████████▋ | 10797/12384 [22:54:46<3:21:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.93s]
Epoch 0: 87%|████████▋ | 10798/12384 [22:54:46<3:21:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.93s]
Epoch 0: 87%|████████▋ | 10798/12384 [22:54:54<3:21:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 0: 87%|████████▋ | 10799/12384 [22:54:54<3:21:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 0: 87%|████████▋ | 10799/12384 [22:55:01<3:21:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.30s]
Epoch 0: 87%|████████▋ | 10800/12384 [22:55:01<3:21:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.30s]
Epoch 0: 87%|████████▋ | 10800/12384 [22:55:09<3:21:10, 7.62s/it, loss=0.0008, acc=0.9976, iter_time=7.21s]
Epoch 0: 87%|████████▋ | 10801/12384 [22:55:09<3:21:05, 7.62s/it, loss=0.0008, acc=0.9976, iter_time=7.21s]
Epoch 0: 87%|████████▋ | 10801/12384 [22:55:17<3:21:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 87%|████████▋ | 10802/12384 [22:55:17<3:20:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 87%|████████▋ | 10802/12384 [22:55:24<3:20:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 87%|████████▋ | 10803/12384 [22:55:24<3:20:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 87%|████████▋ | 10803/12384 [22:55:32<3:20:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 0: 87%|████████▋ | 10804/12384 [22:55:32<3:20:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 0: 87%|████████▋ | 10804/12384 [22:55:40<3:20:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.63s]
Epoch 0: 87%|████████▋ | 10805/12384 [22:55:40<3:20:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.63s]
Epoch 0: 87%|████████▋ | 10805/12384 [22:55:47<3:20:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 0: 87%|████████▋ | 10806/12384 [22:55:47<3:19:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 0: 87%|████████▋ | 10806/12384 [22:55:55<3:19:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 87%|████████▋ | 10807/12384 [22:55:55<3:19:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 87%|████████▋ | 10807/12384 [22:56:02<3:19:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 87%|████████▋ | 10808/12384 [22:56:02<3:19:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 87%|████████▋ | 10808/12384 [22:56:10<3:19:50, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=7.22s]
Epoch 0: 87%|████████▋ | 10809/12384 [22:56:10<3:19:37, 7.60s/it, loss=0.0003, acc=1.0000, iter_time=7.22s]
Epoch 0: 87%|████████▋ | 10809/12384 [22:56:18<3:19:37, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 0: 87%|████████▋ | 10810/12384 [22:56:18<3:19:24, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 0: 87%|████████▋ | 10810/12384 [22:56:25<3:19:24, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 0: 87%|████████▋ | 10811/12384 [22:56:25<3:19:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 0: 87%|████████▋ | 10811/12384 [22:56:33<3:19:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 87%|████████▋ | 10812/12384 [22:56:33<3:19:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 87%|████████▋ | 10812/12384 [22:56:41<3:19:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.13s]
Epoch 0: 87%|████████▋ | 10813/12384 [22:56:41<3:21:44, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.13s]
Epoch 0: 87%|████████▋ | 10813/12384 [22:56:48<3:21:44, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.63s]
Epoch 0: 87%|████████▋ | 10814/12384 [22:56:48<3:20:50, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.63s]
Epoch 0: 87%|████████▋ | 10814/12384 [22:56:56<3:20:50, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 0: 87%|████████▋ | 10815/12384 [22:56:56<3:20:12, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 0: 87%|████████▋ | 10815/12384 [22:57:04<3:20:12, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 87%|████████▋ | 10816/12384 [22:57:04<3:19:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 87%|████████▋ | 10816/12384 [22:57:11<3:19:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 0: 87%|████████▋ | 10817/12384 [22:57:11<3:21:32, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 0: 87%|████████▋ | 10817/12384 [22:57:19<3:21:32, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.59s]
Epoch 0: 87%|████████▋ | 10818/12384 [22:57:19<3:20:36, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.59s]
Epoch 0: 87%|████████▋ | 10818/12384 [22:57:27<3:20:36, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.62s]
Epoch 0: 87%|████████▋ | 10819/12384 [22:57:27<3:19:52, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.62s]
Epoch 0: 87%|████████▋ | 10819/12384 [22:57:34<3:19:52, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 87%|████████▋ | 10820/12384 [22:57:34<3:19:38, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 87%|████████▋ | 10820/12384 [22:57:42<3:19:38, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 87%|████████▋ | 10821/12384 [22:57:42<3:19:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 87%|████████▋ | 10821/12384 [22:57:50<3:19:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 0: 87%|████████▋ | 10822/12384 [22:57:50<3:18:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 0: 87%|████████▋ | 10822/12384 [22:57:57<3:18:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 0: 87%|████████▋ | 10823/12384 [22:57:57<3:19:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 0: 87%|████████▋ | 10823/12384 [22:58:05<3:19:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 0: 87%|████████▋ | 10824/12384 [22:58:05<3:18:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 0: 87%|████████▋ | 10824/12384 [22:58:12<3:18:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 87%|████████▋ | 10825/12384 [22:58:12<3:18:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 87%|████████▋ | 10825/12384 [22:58:20<3:18:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 0: 87%|████████▋ | 10826/12384 [22:58:20<3:17:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 0: 87%|████████▋ | 10826/12384 [22:58:28<3:17:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.72s]
Epoch 0: 87%|████████▋ | 10827/12384 [22:58:28<3:17:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.72s]
Epoch 0: 87%|████████▋ | 10827/12384 [22:58:35<3:17:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 0: 87%|████████▋ | 10828/12384 [22:58:35<3:17:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 0: 87%|████████▋ | 10828/12384 [22:58:43<3:17:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 0: 87%|████████▋ | 10829/12384 [22:58:43<3:17:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 0: 87%|████████▋ | 10829/12384 [22:58:50<3:17:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 87%|████████▋ | 10830/12384 [22:58:50<3:17:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 87%|████████▋ | 10830/12384 [22:58:58<3:17:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 0: 87%|████████▋ | 10831/12384 [22:58:58<3:16:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 0: 87%|████████▋ | 10831/12384 [22:59:06<3:16:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.07s]
Epoch 0: 87%|████████▋ | 10832/12384 [22:59:06<3:16:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.07s]
Epoch 0: 87%|████████▋ | 10832/12384 [22:59:13<3:16:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.59s]
Epoch 0: 87%|████████▋ | 10833/12384 [22:59:13<3:16:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.59s]
Epoch 0: 87%|████████▋ | 10833/12384 [22:59:21<3:16:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.69s]
Epoch 0: 87%|████████▋ | 10834/12384 [22:59:21<3:16:12, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=5.69s]
Epoch 0: 87%|████████▋ | 10834/12384 [22:59:28<3:16:12, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=10.11s]
Epoch 0: 87%|████████▋ | 10835/12384 [22:59:28<3:16:17, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.11s]
Epoch 0: 87%|████████▋ | 10835/12384 [22:59:36<3:16:17, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 0: 88%|████████▊ | 10836/12384 [22:59:36<3:16:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 0: 88%|████████▊ | 10836/12384 [22:59:44<3:16:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 0: 88%|████████▊ | 10837/12384 [22:59:44<3:16:04, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 0: 88%|████████▊ | 10837/12384 [22:59:51<3:16:04, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=6.17s]
Epoch 0: 88%|████████▊ | 10838/12384 [22:59:51<3:16:10, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.17s]
Epoch 0: 88%|████████▊ | 10838/12384 [22:59:59<3:16:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 0: 88%|████████▊ | 10839/12384 [22:59:59<3:18:23, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 0: 88%|████████▊ | 10839/12384 [23:00:07<3:18:23, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 0: 88%|████████▊ | 10840/12384 [23:00:07<3:17:37, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 0: 88%|████████▊ | 10840/12384 [23:00:14<3:17:37, 7.68s/it, loss=0.0002, acc=0.9987, iter_time=7.24s]
Epoch 0: 88%|████████▊ | 10841/12384 [23:00:14<3:16:55, 7.66s/it, loss=0.0002, acc=0.9987, iter_time=7.24s]
Epoch 0: 88%|████████▊ | 10841/12384 [23:00:22<3:16:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 0: 88%|████████▊ | 10842/12384 [23:00:22<3:16:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 0: 88%|████████▊ | 10842/12384 [23:00:30<3:16:15, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=9.12s]
Epoch 0: 88%|████████▊ | 10843/12384 [23:00:30<3:15:47, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=9.12s]
Epoch 0: 88%|████████▊ | 10843/12384 [23:00:37<3:15:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 0: 88%|████████▊ | 10844/12384 [23:00:37<3:15:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 0: 88%|████████▊ | 10844/12384 [23:00:45<3:15:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 88%|████████▊ | 10845/12384 [23:00:45<3:15:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 88%|████████▊ | 10845/12384 [23:00:52<3:15:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 88%|████████▊ | 10846/12384 [23:00:52<3:15:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 88%|████████▊ | 10846/12384 [23:01:00<3:15:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.38s]
Epoch 0: 88%|████████▊ | 10847/12384 [23:01:00<3:15:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.38s]
Epoch 0: 88%|████████▊ | 10847/12384 [23:01:08<3:15:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.87s]
Epoch 0: 88%|████████▊ | 10848/12384 [23:01:08<3:15:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.87s]
Epoch 0: 88%|████████▊ | 10848/12384 [23:01:15<3:15:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 88%|████████▊ | 10849/12384 [23:01:15<3:14:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 88%|████████▊ | 10849/12384 [23:01:23<3:14:48, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.02s]
Epoch 0: 88%|████████▊ | 10850/12384 [23:01:23<3:14:45, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.02s]
Epoch 0: 88%|████████▊ | 10850/12384 [23:01:31<3:14:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 88%|████████▊ | 10851/12384 [23:01:31<3:14:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 88%|████████▊ | 10851/12384 [23:01:38<3:14:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 0: 88%|████████▊ | 10852/12384 [23:01:38<3:14:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 0: 88%|████████▊ | 10852/12384 [23:01:46<3:14:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 0: 88%|████████▊ | 10853/12384 [23:01:46<3:14:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 0: 88%|████████▊ | 10853/12384 [23:01:53<3:14:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.28s]
Epoch 0: 88%|████████▊ | 10854/12384 [23:01:53<3:14:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.28s]
Epoch 0: 88%|████████▊ | 10854/12384 [23:02:01<3:14:10, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=10.64s]
Epoch 0: 88%|████████▊ | 10855/12384 [23:02:01<3:14:04, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=10.64s]
Epoch 0: 88%|████████▊ | 10855/12384 [23:02:09<3:14:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 0: 88%|████████▊ | 10856/12384 [23:02:09<3:14:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 0: 88%|████████▊ | 10856/12384 [23:02:16<3:14:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 0: 88%|████████▊ | 10857/12384 [23:02:16<3:13:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 0: 88%|████████▊ | 10857/12384 [23:02:24<3:13:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 0: 88%|████████▊ | 10858/12384 [23:02:24<3:14:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 0: 88%|████████▊ | 10858/12384 [23:02:32<3:14:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 88%|████████▊ | 10859/12384 [23:02:32<3:13:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 88%|████████▊ | 10859/12384 [23:02:39<3:13:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 88%|████████▊ | 10860/12384 [23:02:39<3:13:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 88%|████████▊ | 10860/12384 [23:02:47<3:13:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 88%|████████▊ | 10861/12384 [23:02:47<3:13:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 88%|████████▊ | 10861/12384 [23:02:54<3:13:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 88%|████████▊ | 10862/12384 [23:02:54<3:13:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 88%|████████▊ | 10862/12384 [23:03:02<3:13:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 88%|████████▊ | 10863/12384 [23:03:02<3:12:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 88%|████████▊ | 10863/12384 [23:03:10<3:12:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 88%|████████▊ | 10864/12384 [23:03:10<3:12:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 88%|████████▊ | 10864/12384 [23:03:17<3:12:45, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.26s]
Epoch 0: 88%|████████▊ | 10865/12384 [23:03:17<3:15:09, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.26s]
Epoch 0: 88%|████████▊ | 10865/12384 [23:03:25<3:15:09, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 88%|████████▊ | 10866/12384 [23:03:25<3:14:21, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 88%|████████▊ | 10866/12384 [23:03:33<3:14:21, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 88%|████████▊ | 10867/12384 [23:03:33<3:13:44, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 88%|████████▊ | 10867/12384 [23:03:40<3:13:44, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 88%|████████▊ | 10868/12384 [23:03:40<3:13:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 88%|████████▊ | 10868/12384 [23:03:48<3:13:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 0: 88%|████████▊ | 10869/12384 [23:03:48<3:14:46, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 0: 88%|████████▊ | 10869/12384 [23:03:56<3:14:46, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.54s]
Epoch 0: 88%|████████▊ | 10870/12384 [23:03:56<3:14:03, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.54s]
Epoch 0: 88%|████████▊ | 10870/12384 [23:04:03<3:14:03, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 0: 88%|████████▊ | 10871/12384 [23:04:03<3:13:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 0: 88%|████████▊ | 10871/12384 [23:04:11<3:13:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 88%|████████▊ | 10872/12384 [23:04:11<3:13:18, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 88%|████████▊ | 10872/12384 [23:04:19<3:13:18, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=5.89s]
Epoch 0: 88%|████████▊ | 10873/12384 [23:04:19<3:12:48, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=5.89s]
Epoch 0: 88%|████████▊ | 10873/12384 [23:04:26<3:12:48, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 0: 88%|████████▊ | 10874/12384 [23:04:26<3:12:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 0: 88%|████████▊ | 10874/12384 [23:04:34<3:12:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 88%|████████▊ | 10875/12384 [23:04:34<3:12:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 88%|████████▊ | 10875/12384 [23:04:42<3:12:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 0: 88%|████████▊ | 10876/12384 [23:04:42<3:11:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 0: 88%|████████▊ | 10876/12384 [23:04:49<3:11:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 0: 88%|████████▊ | 10877/12384 [23:04:49<3:11:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 0: 88%|████████▊ | 10877/12384 [23:04:57<3:11:29, 7.62s/it, loss=0.0004, acc=0.9969, iter_time=5.50s]
Epoch 0: 88%|████████▊ | 10878/12384 [23:04:57<3:11:21, 7.62s/it, loss=0.0004, acc=0.9969, iter_time=5.50s]
Epoch 0: 88%|████████▊ | 10878/12384 [23:05:04<3:11:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 0: 88%|████████▊ | 10879/12384 [23:05:04<3:10:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 0: 88%|████████▊ | 10879/12384 [23:05:12<3:10:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 0: 88%|████████▊ | 10880/12384 [23:05:12<3:10:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 0: 88%|████████▊ | 10880/12384 [23:05:20<3:10:49, 7.61s/it, loss=0.0003, acc=0.9981, iter_time=7.22s]
Epoch 0: 88%|████████▊ | 10881/12384 [23:05:20<3:10:46, 7.62s/it, loss=0.0003, acc=0.9981, iter_time=7.22s]
Epoch 0: 88%|████████▊ | 10881/12384 [23:05:27<3:10:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 0: 88%|████████▊ | 10882/12384 [23:05:27<3:10:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 0: 88%|████████▊ | 10882/12384 [23:05:35<3:10:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 0: 88%|████████▊ | 10883/12384 [23:05:35<3:10:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 0: 88%|████████▊ | 10883/12384 [23:05:42<3:10:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 0: 88%|████████▊ | 10884/12384 [23:05:42<3:10:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 0: 88%|████████▊ | 10884/12384 [23:05:50<3:10:17, 7.61s/it, loss=0.0008, acc=0.9987, iter_time=6.09s]
Epoch 0: 88%|████████▊ | 10885/12384 [23:05:50<3:09:57, 7.60s/it, loss=0.0008, acc=0.9987, iter_time=6.09s]
Epoch 0: 88%|████████▊ | 10885/12384 [23:05:58<3:09:57, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 0: 88%|████████▊ | 10886/12384 [23:05:58<3:09:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 0: 88%|████████▊ | 10886/12384 [23:06:05<3:09:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 0: 88%|████████▊ | 10887/12384 [23:06:05<3:09:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 0: 88%|████████▊ | 10887/12384 [23:06:13<3:09:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 0: 88%|████████▊ | 10888/12384 [23:06:13<3:10:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 0: 88%|████████▊ | 10888/12384 [23:06:21<3:10:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 88%|████████▊ | 10889/12384 [23:06:21<3:09:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 88%|████████▊ | 10889/12384 [23:06:28<3:09:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 88%|████████▊ | 10890/12384 [23:06:28<3:09:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 88%|████████▊ | 10890/12384 [23:06:36<3:09:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 88%|████████▊ | 10891/12384 [23:06:36<3:11:59, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 88%|████████▊ | 10891/12384 [23:06:44<3:11:59, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 0: 88%|████████▊ | 10892/12384 [23:06:44<3:11:04, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 0: 88%|████████▊ | 10892/12384 [23:06:51<3:11:04, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 88%|████████▊ | 10893/12384 [23:06:51<3:10:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 88%|████████▊ | 10893/12384 [23:06:59<3:10:24, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 88%|████████▊ | 10894/12384 [23:06:59<3:09:52, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 88%|████████▊ | 10894/12384 [23:07:07<3:09:52, 7.65s/it, loss=0.0030, acc=0.9932, iter_time=7.91s]
Epoch 0: 88%|████████▊ | 10895/12384 [23:07:07<3:11:43, 7.73s/it, loss=0.0030, acc=0.9932, iter_time=7.91s]
Epoch 0: 88%|████████▊ | 10895/12384 [23:07:14<3:11:43, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 0: 88%|████████▊ | 10896/12384 [23:07:14<3:10:31, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 0: 88%|████████▊ | 10896/12384 [23:07:22<3:10:31, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 0: 88%|████████▊ | 10897/12384 [23:07:22<3:09:56, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 0: 88%|████████▊ | 10897/12384 [23:07:30<3:09:56, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 0: 88%|████████▊ | 10898/12384 [23:07:30<3:09:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 0: 88%|████████▊ | 10898/12384 [23:07:37<3:09:28, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 88%|████████▊ | 10899/12384 [23:07:37<3:09:02, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 88%|████████▊ | 10899/12384 [23:07:45<3:09:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 88%|████████▊ | 10900/12384 [23:07:45<3:08:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 88%|████████▊ | 10900/12384 [23:07:53<3:08:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 88%|████████▊ | 10901/12384 [23:07:53<3:08:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 88%|████████▊ | 10901/12384 [23:08:00<3:08:25, 7.62s/it, loss=0.0001, acc=0.9986, iter_time=6.13s]
Epoch 0: 88%|████████▊ | 10902/12384 [23:08:00<3:08:02, 7.61s/it, loss=0.0001, acc=0.9986, iter_time=6.13s]
Epoch 0: 88%|████████▊ | 10902/12384 [23:08:08<3:08:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 0: 88%|████████▊ | 10903/12384 [23:08:08<3:07:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 0: 88%|████████▊ | 10903/12384 [23:08:15<3:07:50, 7.61s/it, loss=0.0001, acc=0.9989, iter_time=7.99s]
Epoch 0: 88%|████████▊ | 10904/12384 [23:08:15<3:08:16, 7.63s/it, loss=0.0001, acc=0.9989, iter_time=7.99s]
Epoch 0: 88%|████████▊ | 10904/12384 [23:08:23<3:08:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 0: 88%|████████▊ | 10905/12384 [23:08:23<3:07:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 0: 88%|████████▊ | 10905/12384 [23:08:31<3:07:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.23s]
Epoch 0: 88%|████████▊ | 10906/12384 [23:08:31<3:07:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.23s]
Epoch 0: 88%|████████▊ | 10906/12384 [23:08:38<3:07:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 0: 88%|████████▊ | 10907/12384 [23:08:38<3:07:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 0: 88%|████████▊ | 10907/12384 [23:08:46<3:07:30, 7.62s/it, loss=0.0003, acc=0.9992, iter_time=7.63s]
Epoch 0: 88%|████████▊ | 10908/12384 [23:08:46<3:07:19, 7.61s/it, loss=0.0003, acc=0.9992, iter_time=7.63s]
Epoch 0: 88%|████████▊ | 10908/12384 [23:08:53<3:07:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 88%|████████▊ | 10909/12384 [23:08:53<3:07:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 88%|████████▊ | 10909/12384 [23:09:01<3:07:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 0: 88%|████████▊ | 10910/12384 [23:09:01<3:06:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 0: 88%|████████▊ | 10910/12384 [23:09:09<3:06:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 0: 88%|████████▊ | 10911/12384 [23:09:09<3:06:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 0: 88%|████████▊ | 10911/12384 [23:09:16<3:06:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 0: 88%|████████▊ | 10912/12384 [23:09:16<3:07:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 0: 88%|████████▊ | 10912/12384 [23:09:24<3:07:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 88%|████████▊ | 10913/12384 [23:09:24<3:07:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 88%|████████▊ | 10913/12384 [23:09:32<3:07:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 0: 88%|████████▊ | 10914/12384 [23:09:32<3:06:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 0: 88%|████████▊ | 10914/12384 [23:09:39<3:06:50, 7.63s/it, loss=0.0003, acc=0.9978, iter_time=7.53s]
Epoch 0: 88%|████████▊ | 10915/12384 [23:09:39<3:06:33, 7.62s/it, loss=0.0003, acc=0.9978, iter_time=7.53s]
Epoch 0: 88%|████████▊ | 10915/12384 [23:09:47<3:06:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.69s]
Epoch 0: 88%|████████▊ | 10916/12384 [23:09:47<3:06:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.69s]
Epoch 0: 88%|████████▊ | 10916/12384 [23:09:55<3:06:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.16s]
Epoch 0: 88%|████████▊ | 10917/12384 [23:09:55<3:08:42, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.16s]
Epoch 0: 88%|████████▊ | 10917/12384 [23:10:02<3:08:42, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 88%|████████▊ | 10918/12384 [23:10:02<3:07:39, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 88%|████████▊ | 10918/12384 [23:10:10<3:07:39, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 88%|████████▊ | 10919/12384 [23:10:10<3:06:56, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 88%|████████▊ | 10919/12384 [23:10:18<3:06:56, 7.66s/it, loss=0.0003, acc=0.9988, iter_time=7.56s]
Epoch 0: 88%|████████▊ | 10920/12384 [23:10:18<3:06:33, 7.65s/it, loss=0.0003, acc=0.9988, iter_time=7.56s]
Epoch 0: 88%|████████▊ | 10920/12384 [23:10:25<3:06:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.80s]
Epoch 0: 88%|████████▊ | 10921/12384 [23:10:25<3:06:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.80s]
Epoch 0: 88%|████████▊ | 10921/12384 [23:10:33<3:06:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 0: 88%|████████▊ | 10922/12384 [23:10:33<3:05:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 0: 88%|████████▊ | 10922/12384 [23:10:40<3:05:50, 7.63s/it, loss=0.0000, acc=0.9996, iter_time=7.61s]
Epoch 0: 88%|████████▊ | 10923/12384 [23:10:40<3:05:35, 7.62s/it, loss=0.0000, acc=0.9996, iter_time=7.61s]
Epoch 0: 88%|████████▊ | 10923/12384 [23:10:48<3:05:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 88%|████████▊ | 10924/12384 [23:10:48<3:05:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 88%|████████▊ | 10924/12384 [23:10:56<3:05:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 88%|████████▊ | 10925/12384 [23:10:56<3:05:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 88%|████████▊ | 10925/12384 [23:11:03<3:05:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 0: 88%|████████▊ | 10926/12384 [23:11:03<3:05:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 0: 88%|████████▊ | 10926/12384 [23:11:11<3:05:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 0: 88%|████████▊ | 10927/12384 [23:11:11<3:04:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 0: 88%|████████▊ | 10927/12384 [23:11:18<3:04:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 88%|████████▊ | 10928/12384 [23:11:18<3:04:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 88%|████████▊ | 10928/12384 [23:11:26<3:04:40, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=4.40s]
Epoch 0: 88%|████████▊ | 10929/12384 [23:11:26<3:04:28, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=4.40s]
Epoch 0: 88%|████████▊ | 10929/12384 [23:11:34<3:04:28, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.41s]
Epoch 0: 88%|████████▊ | 10930/12384 [23:11:34<3:04:14, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=10.41s]
Epoch 0: 88%|████████▊ | 10930/12384 [23:11:41<3:04:14, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 88%|████████▊ | 10931/12384 [23:11:41<3:04:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 88%|████████▊ | 10931/12384 [23:11:49<3:04:52, 7.63s/it, loss=0.0003, acc=0.9993, iter_time=7.70s]
Epoch 0: 88%|████████▊ | 10932/12384 [23:11:49<3:04:40, 7.63s/it, loss=0.0003, acc=0.9993, iter_time=7.70s]
Epoch 0: 88%|████████▊ | 10932/12384 [23:11:57<3:04:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.19s]
Epoch 0: 88%|████████▊ | 10933/12384 [23:11:57<3:04:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.19s]
Epoch 0: 88%|████████▊ | 10933/12384 [23:12:04<3:04:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 0: 88%|████████▊ | 10934/12384 [23:12:04<3:04:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 0: 88%|████████▊ | 10934/12384 [23:12:12<3:04:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 88%|████████▊ | 10935/12384 [23:12:12<3:04:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 88%|████████▊ | 10935/12384 [23:12:19<3:04:18, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 0: 88%|████████▊ | 10936/12384 [23:12:19<3:04:10, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 0: 88%|████████▊ | 10936/12384 [23:12:27<3:04:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 88%|████████▊ | 10937/12384 [23:12:27<3:03:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 88%|████████▊ | 10937/12384 [23:12:35<3:03:51, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 88%|████████▊ | 10938/12384 [23:12:35<3:03:29, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 88%|████████▊ | 10938/12384 [23:12:42<3:03:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 88%|████████▊ | 10939/12384 [23:12:42<3:03:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 88%|████████▊ | 10939/12384 [23:12:50<3:03:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.77s]
Epoch 0: 88%|████████▊ | 10940/12384 [23:12:50<3:03:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.77s]
Epoch 0: 88%|████████▊ | 10940/12384 [23:12:58<3:03:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.16s]
Epoch 0: 88%|████████▊ | 10941/12384 [23:12:58<3:03:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.16s]
Epoch 0: 88%|████████▊ | 10941/12384 [23:13:05<3:03:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.92s]
Epoch 0: 88%|████████▊ | 10942/12384 [23:13:05<3:03:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.92s]
Epoch 0: 88%|████████▊ | 10942/12384 [23:13:13<3:03:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 88%|████████▊ | 10943/12384 [23:13:13<3:02:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 88%|████████▊ | 10943/12384 [23:13:21<3:02:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 0: 88%|████████▊ | 10944/12384 [23:13:21<3:05:07, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 0: 88%|████████▊ | 10944/12384 [23:13:28<3:05:07, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.20s]
Epoch 0: 88%|████████▊ | 10945/12384 [23:13:28<3:04:17, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.20s]
Epoch 0: 88%|████████▊ | 10945/12384 [23:13:36<3:04:17, 7.68s/it, loss=0.0001, acc=0.9999, iter_time=9.71s]
Epoch 0: 88%|████████▊ | 10946/12384 [23:13:36<3:03:37, 7.66s/it, loss=0.0001, acc=0.9999, iter_time=9.71s]
Epoch 0: 88%|████████▊ | 10946/12384 [23:13:44<3:03:37, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 0: 88%|████████▊ | 10947/12384 [23:13:44<3:05:18, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 0: 88%|████████▊ | 10947/12384 [23:13:51<3:05:18, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 0: 88%|████████▊ | 10948/12384 [23:13:51<3:04:06, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 0: 88%|████████▊ | 10948/12384 [23:13:59<3:04:06, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.38s]
Epoch 0: 88%|████████▊ | 10949/12384 [23:13:59<3:03:21, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.38s]
Epoch 0: 88%|████████▊ | 10949/12384 [23:14:07<3:03:21, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 88%|████████▊ | 10950/12384 [23:14:07<3:02:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 88%|████████▊ | 10950/12384 [23:14:14<3:02:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 0: 88%|████████▊ | 10951/12384 [23:14:14<3:02:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 0: 88%|████████▊ | 10951/12384 [23:14:22<3:02:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 0: 88%|████████▊ | 10952/12384 [23:14:22<3:01:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 0: 88%|████████▊ | 10952/12384 [23:14:29<3:01:52, 7.62s/it, loss=0.0003, acc=0.9988, iter_time=7.22s]
Epoch 0: 88%|████████▊ | 10953/12384 [23:14:29<3:01:41, 7.62s/it, loss=0.0003, acc=0.9988, iter_time=7.22s]
Epoch 0: 88%|████████▊ | 10953/12384 [23:14:37<3:01:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 88%|████████▊ | 10954/12384 [23:14:37<3:01:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 88%|████████▊ | 10954/12384 [23:14:45<3:01:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 88%|████████▊ | 10955/12384 [23:14:45<3:01:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 88%|████████▊ | 10955/12384 [23:14:52<3:01:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 88%|████████▊ | 10956/12384 [23:14:52<3:01:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 88%|████████▊ | 10956/12384 [23:15:00<3:01:05, 7.61s/it, loss=0.0003, acc=0.9978, iter_time=7.29s]
Epoch 0: 88%|████████▊ | 10957/12384 [23:15:00<3:01:02, 7.61s/it, loss=0.0003, acc=0.9978, iter_time=7.29s]
Epoch 0: 88%|████████▊ | 10957/12384 [23:15:08<3:01:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 0: 88%|████████▊ | 10958/12384 [23:15:08<3:00:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 0: 88%|████████▊ | 10958/12384 [23:15:15<3:00:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.31s]
Epoch 0: 88%|████████▊ | 10959/12384 [23:15:15<3:00:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.31s]
Epoch 0: 88%|████████▊ | 10959/12384 [23:15:23<3:00:54, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=10.53s]
Epoch 0: 89%|████████▊ | 10960/12384 [23:15:23<3:00:44, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=10.53s]
Epoch 0: 89%|████████▊ | 10960/12384 [23:15:30<3:00:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 0: 89%|████████▊ | 10961/12384 [23:15:30<3:00:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 0: 89%|████████▊ | 10961/12384 [23:15:38<3:00:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 0: 89%|████████▊ | 10962/12384 [23:15:38<3:00:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 0: 89%|████████▊ | 10962/12384 [23:15:46<3:00:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 0: 89%|████████▊ | 10963/12384 [23:15:46<3:00:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 0: 89%|████████▊ | 10963/12384 [23:15:53<3:00:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 89%|████████▊ | 10964/12384 [23:15:53<3:00:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 89%|████████▊ | 10964/12384 [23:16:01<3:00:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 89%|████████▊ | 10965/12384 [23:16:01<2:59:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 89%|████████▊ | 10965/12384 [23:16:08<2:59:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 89%|████████▊ | 10966/12384 [23:16:08<2:59:41, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 89%|████████▊ | 10966/12384 [23:16:16<2:59:41, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 0: 89%|████████▊ | 10967/12384 [23:16:16<2:59:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 0: 89%|████████▊ | 10967/12384 [23:16:24<2:59:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 89%|████████▊ | 10968/12384 [23:16:24<2:59:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 89%|████████▊ | 10968/12384 [23:16:31<2:59:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.73s]
Epoch 0: 89%|████████▊ | 10969/12384 [23:16:31<2:59:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.73s]
Epoch 0: 89%|████████▊ | 10969/12384 [23:16:39<2:59:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.16s]
Epoch 0: 89%|████████▊ | 10970/12384 [23:16:39<3:01:43, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.16s]
Epoch 0: 89%|████████▊ | 10970/12384 [23:16:47<3:01:43, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 89%|████████▊ | 10971/12384 [23:16:47<3:00:47, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 89%|████████▊ | 10971/12384 [23:16:54<3:00:47, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 89%|████████▊ | 10972/12384 [23:16:54<3:00:13, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 89%|████████▊ | 10972/12384 [23:17:02<3:00:13, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 89%|████████▊ | 10973/12384 [23:17:02<2:59:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 89%|████████▊ | 10973/12384 [23:17:10<2:59:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 89%|████████▊ | 10974/12384 [23:17:10<3:01:24, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 89%|████████▊ | 10974/12384 [23:17:18<3:01:24, 7.72s/it, loss=0.0002, acc=0.9997, iter_time=7.60s]
Epoch 0: 89%|████████▊ | 10975/12384 [23:17:18<3:00:26, 7.68s/it, loss=0.0002, acc=0.9997, iter_time=7.60s]
Epoch 0: 89%|████████▊ | 10975/12384 [23:17:25<3:00:26, 7.68s/it, loss=0.0001, acc=0.9999, iter_time=8.01s]
Epoch 0: 89%|████████▊ | 10976/12384 [23:17:25<2:59:51, 7.66s/it, loss=0.0001, acc=0.9999, iter_time=8.01s]
Epoch 0: 89%|████████▊ | 10976/12384 [23:17:33<2:59:51, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.26s]
Epoch 0: 89%|████████▊ | 10977/12384 [23:17:33<2:59:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.26s]
Epoch 0: 89%|████████▊ | 10977/12384 [23:17:40<2:59:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.00s]
Epoch 0: 89%|████████▊ | 10978/12384 [23:17:40<2:59:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.00s]
Epoch 0: 89%|████████▊ | 10978/12384 [23:17:48<2:59:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 0: 89%|████████▊ | 10979/12384 [23:17:48<2:58:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 0: 89%|████████▊ | 10979/12384 [23:17:56<2:58:42, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.08s]
Epoch 0: 89%|████████▊ | 10980/12384 [23:17:56<2:58:17, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.08s]
Epoch 0: 89%|████████▊ | 10980/12384 [23:18:03<2:58:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 0: 89%|████████▊ | 10981/12384 [23:18:03<2:58:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 0: 89%|████████▊ | 10981/12384 [23:18:11<2:58:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.63s]
Epoch 0: 89%|████████▊ | 10982/12384 [23:18:11<2:57:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.63s]
Epoch 0: 89%|████████▊ | 10982/12384 [23:18:18<2:57:58, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=6.39s]
Epoch 0: 89%|████████▊ | 10983/12384 [23:18:18<2:57:51, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=6.39s]
Epoch 0: 89%|████████▊ | 10983/12384 [23:18:26<2:57:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.20s]
Epoch 0: 89%|████████▊ | 10984/12384 [23:18:26<2:57:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.20s]
Epoch 0: 89%|████████▊ | 10984/12384 [23:18:34<2:57:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 89%|████████▊ | 10985/12384 [23:18:34<2:57:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 89%|████████▊ | 10985/12384 [23:18:41<2:57:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 0: 89%|████████▊ | 10986/12384 [23:18:41<2:57:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 0: 89%|████████▊ | 10986/12384 [23:18:49<2:57:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 0: 89%|████████▊ | 10987/12384 [23:18:49<2:57:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 0: 89%|████████▊ | 10987/12384 [23:18:56<2:57:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 0: 89%|████████▊ | 10988/12384 [23:18:56<2:56:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 0: 89%|████████▊ | 10988/12384 [23:19:04<2:56:55, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=9.37s]
Epoch 0: 89%|████████▊ | 10989/12384 [23:19:04<2:57:04, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.37s]
Epoch 0: 89%|████████▊ | 10989/12384 [23:19:12<2:57:04, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.85s]
Epoch 0: 89%|████████▊ | 10990/12384 [23:19:12<2:57:08, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.85s]
Epoch 0: 89%|████████▊ | 10990/12384 [23:19:19<2:57:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 89%|████████▉ | 10991/12384 [23:19:19<2:56:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 89%|████████▉ | 10991/12384 [23:19:27<2:56:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 0: 89%|████████▉ | 10992/12384 [23:19:27<2:56:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 0: 89%|████████▉ | 10992/12384 [23:19:35<2:56:37, 7.61s/it, loss=0.0004, acc=0.9991, iter_time=7.20s]
Epoch 0: 89%|████████▉ | 10993/12384 [23:19:35<2:56:29, 7.61s/it, loss=0.0004, acc=0.9991, iter_time=7.20s]
Epoch 0: 89%|████████▉ | 10993/12384 [23:19:42<2:56:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 89%|████████▉ | 10994/12384 [23:19:42<2:56:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 89%|████████▉ | 10994/12384 [23:19:50<2:56:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 89%|████████▉ | 10995/12384 [23:19:50<2:56:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 89%|████████▉ | 10995/12384 [23:19:57<2:56:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 89%|████████▉ | 10996/12384 [23:19:57<2:56:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 89%|████████▉ | 10996/12384 [23:20:05<2:56:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 0: 89%|████████▉ | 10997/12384 [23:20:05<2:58:20, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 0: 89%|████████▉ | 10997/12384 [23:20:13<2:58:20, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.05s]
Epoch 0: 89%|████████▉ | 10998/12384 [23:20:13<2:57:29, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.05s]
Epoch 0: 89%|████████▉ | 10998/12384 [23:20:21<2:57:29, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.33s]
Epoch 0: 89%|████████▉ | 10999/12384 [23:20:21<2:56:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.33s]
Epoch 0: 89%|████████▉ | 10999/12384 [23:20:28<2:56:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.05s]
Epoch 0: 89%|████████▉ | 11000/12384 [23:20:28<2:57:38, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.05s]
Epoch 0: 89%|████████▉ | 11000/12384 [23:20:36<2:57:38, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 89%|████████▉ | 11001/12384 [23:20:36<2:58:48, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 89%|████████▉ | 11001/12384 [23:20:44<2:58:48, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=5.00s]
Epoch 0: 89%|████████▉ | 11002/12384 [23:20:44<2:58:06, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=5.00s]
Epoch 0: 89%|████████▉ | 11002/12384 [23:20:52<2:58:06, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=10.28s]
Epoch 0: 89%|████████▉ | 11003/12384 [23:20:52<2:57:15, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.28s]
Epoch 0: 89%|████████▉ | 11003/12384 [23:20:59<2:57:15, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 89%|████████▉ | 11004/12384 [23:20:59<2:56:27, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 89%|████████▉ | 11004/12384 [23:21:07<2:56:27, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 89%|████████▉ | 11005/12384 [23:21:07<2:55:45, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 89%|████████▉ | 11005/12384 [23:21:14<2:55:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 0: 89%|████████▉ | 11006/12384 [23:21:14<2:55:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 0: 89%|████████▉ | 11006/12384 [23:21:22<2:55:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 0: 89%|████████▉ | 11007/12384 [23:21:22<2:54:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 0: 89%|████████▉ | 11007/12384 [23:21:30<2:54:51, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 0: 89%|████████▉ | 11008/12384 [23:21:30<2:54:46, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 0: 89%|████████▉ | 11008/12384 [23:21:37<2:54:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 89%|████████▉ | 11009/12384 [23:21:37<2:54:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 89%|████████▉ | 11009/12384 [23:21:45<2:54:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 89%|████████▉ | 11010/12384 [23:21:45<2:54:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 89%|████████▉ | 11010/12384 [23:21:52<2:54:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 89%|████████▉ | 11011/12384 [23:21:52<2:54:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 89%|████████▉ | 11011/12384 [23:22:00<2:54:15, 7.62s/it, loss=0.0017, acc=0.9963, iter_time=7.60s]
Epoch 0: 89%|████████▉ | 11012/12384 [23:22:00<2:54:04, 7.61s/it, loss=0.0017, acc=0.9963, iter_time=7.60s]
Epoch 0: 89%|████████▉ | 11012/12384 [23:22:08<2:54:04, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.99s]
Epoch 0: 89%|████████▉ | 11013/12384 [23:22:08<2:53:44, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=6.99s]
Epoch 0: 89%|████████▉ | 11013/12384 [23:22:15<2:53:44, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 0: 89%|████████▉ | 11014/12384 [23:22:15<2:54:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 0: 89%|████████▉ | 11014/12384 [23:22:23<2:54:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 0: 89%|████████▉ | 11015/12384 [23:22:23<2:53:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 0: 89%|████████▉ | 11015/12384 [23:22:30<2:53:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.52s]
Epoch 0: 89%|████████▉ | 11016/12384 [23:22:30<2:53:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.52s]
Epoch 0: 89%|████████▉ | 11016/12384 [23:22:38<2:53:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 89%|████████▉ | 11017/12384 [23:22:38<2:53:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 89%|████████▉ | 11017/12384 [23:22:46<2:53:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 0: 89%|████████▉ | 11018/12384 [23:22:46<2:53:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 0: 89%|████████▉ | 11018/12384 [23:22:53<2:53:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 0: 89%|████████▉ | 11019/12384 [23:22:53<2:53:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 0: 89%|████████▉ | 11019/12384 [23:23:01<2:53:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 0: 89%|████████▉ | 11020/12384 [23:23:01<2:53:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 0: 89%|████████▉ | 11020/12384 [23:23:09<2:53:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 89%|████████▉ | 11021/12384 [23:23:09<2:53:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 89%|████████▉ | 11021/12384 [23:23:16<2:53:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.55s]
Epoch 0: 89%|████████▉ | 11022/12384 [23:23:16<2:52:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.55s]
Epoch 0: 89%|████████▉ | 11022/12384 [23:23:24<2:52:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 0: 89%|████████▉ | 11023/12384 [23:23:24<2:55:04, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 0: 89%|████████▉ | 11023/12384 [23:23:32<2:55:04, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 0: 89%|████████▉ | 11024/12384 [23:23:32<2:54:20, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 0: 89%|████████▉ | 11024/12384 [23:23:39<2:54:20, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 89%|████████▉ | 11025/12384 [23:23:39<2:53:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 89%|████████▉ | 11025/12384 [23:23:47<2:53:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 89%|████████▉ | 11026/12384 [23:23:47<2:53:27, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 89%|████████▉ | 11026/12384 [23:23:55<2:53:27, 7.66s/it, loss=0.0014, acc=0.9977, iter_time=5.86s]
Epoch 0: 89%|████████▉ | 11027/12384 [23:23:55<2:52:58, 7.65s/it, loss=0.0014, acc=0.9977, iter_time=5.86s]
Epoch 0: 89%|████████▉ | 11027/12384 [23:24:02<2:52:58, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 0: 89%|████████▉ | 11028/12384 [23:24:02<2:54:22, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 0: 89%|████████▉ | 11028/12384 [23:24:10<2:54:22, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 89%|████████▉ | 11029/12384 [23:24:10<2:53:30, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 89%|████████▉ | 11029/12384 [23:24:18<2:53:30, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 89%|████████▉ | 11030/12384 [23:24:18<2:52:46, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 89%|████████▉ | 11030/12384 [23:24:25<2:52:46, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 89%|████████▉ | 11031/12384 [23:24:25<2:52:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 89%|████████▉ | 11031/12384 [23:24:33<2:52:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 0: 89%|████████▉ | 11032/12384 [23:24:33<2:52:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 0: 89%|████████▉ | 11032/12384 [23:24:41<2:52:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 0: 89%|████████▉ | 11033/12384 [23:24:41<2:52:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 0: 89%|████████▉ | 11033/12384 [23:24:48<2:52:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 0: 89%|████████▉ | 11034/12384 [23:24:48<2:51:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 0: 89%|████████▉ | 11034/12384 [23:24:56<2:51:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 89%|████████▉ | 11035/12384 [23:24:56<2:51:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 89%|████████▉ | 11035/12384 [23:25:03<2:51:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 89%|████████▉ | 11036/12384 [23:25:03<2:51:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 89%|████████▉ | 11036/12384 [23:25:11<2:51:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.55s]
Epoch 0: 89%|████████▉ | 11037/12384 [23:25:11<2:51:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.55s]
Epoch 0: 89%|████████▉ | 11037/12384 [23:25:19<2:51:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.11s]
Epoch 0: 89%|████████▉ | 11038/12384 [23:25:19<2:50:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.11s]
Epoch 0: 89%|████████▉ | 11038/12384 [23:25:26<2:50:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 0: 89%|████████▉ | 11039/12384 [23:25:26<2:50:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 0: 89%|████████▉ | 11039/12384 [23:25:34<2:50:31, 7.61s/it, loss=0.0005, acc=0.9987, iter_time=8.00s]
Epoch 0: 89%|████████▉ | 11040/12384 [23:25:34<2:50:27, 7.61s/it, loss=0.0005, acc=0.9987, iter_time=8.00s]
Epoch 0: 89%|████████▉ | 11040/12384 [23:25:41<2:50:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 89%|████████▉ | 11041/12384 [23:25:41<2:50:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 89%|████████▉ | 11041/12384 [23:25:49<2:50:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 89%|████████▉ | 11042/12384 [23:25:49<2:50:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 89%|████████▉ | 11042/12384 [23:25:57<2:50:10, 7.61s/it, loss=0.0003, acc=0.9989, iter_time=7.61s]
Epoch 0: 89%|████████▉ | 11043/12384 [23:25:57<2:49:58, 7.61s/it, loss=0.0003, acc=0.9989, iter_time=7.61s]
Epoch 0: 89%|████████▉ | 11043/12384 [23:26:04<2:49:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 89%|████████▉ | 11044/12384 [23:26:04<2:49:45, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 89%|████████▉ | 11044/12384 [23:26:12<2:49:45, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 89%|████████▉ | 11045/12384 [23:26:12<2:49:46, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 89%|████████▉ | 11045/12384 [23:26:19<2:49:46, 7.61s/it, loss=0.0005, acc=0.9991, iter_time=7.01s]
Epoch 0: 89%|████████▉ | 11046/12384 [23:26:19<2:49:38, 7.61s/it, loss=0.0005, acc=0.9991, iter_time=7.01s]
Epoch 0: 89%|████████▉ | 11046/12384 [23:26:27<2:49:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 0: 89%|████████▉ | 11047/12384 [23:26:27<2:49:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 0: 89%|████████▉ | 11047/12384 [23:26:35<2:49:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.15s]
Epoch 0: 89%|████████▉ | 11048/12384 [23:26:35<2:49:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.15s]
Epoch 0: 89%|████████▉ | 11048/12384 [23:26:43<2:49:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 0: 89%|████████▉ | 11049/12384 [23:26:43<2:51:44, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 0: 89%|████████▉ | 11049/12384 [23:26:50<2:51:44, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.33s]
Epoch 0: 89%|████████▉ | 11050/12384 [23:26:50<2:51:35, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.33s]
Epoch 0: 89%|████████▉ | 11050/12384 [23:26:58<2:51:35, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 0: 89%|████████▉ | 11051/12384 [23:26:58<2:50:45, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 0: 89%|████████▉ | 11051/12384 [23:27:06<2:50:45, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 0: 89%|████████▉ | 11052/12384 [23:27:06<2:50:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 0: 89%|████████▉ | 11052/12384 [23:27:13<2:50:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 0: 89%|████████▉ | 11053/12384 [23:27:13<2:49:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 0: 89%|████████▉ | 11053/12384 [23:27:21<2:49:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.03s]
Epoch 0: 89%|████████▉ | 11054/12384 [23:27:21<2:51:41, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=10.03s]
Epoch 0: 89%|████████▉ | 11054/12384 [23:27:29<2:51:41, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 0: 89%|████████▉ | 11055/12384 [23:27:29<2:50:37, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 0: 89%|████████▉ | 11055/12384 [23:27:36<2:50:37, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 0: 89%|████████▉ | 11056/12384 [23:27:36<2:49:57, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 0: 89%|████████▉ | 11056/12384 [23:27:44<2:49:57, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 89%|████████▉ | 11057/12384 [23:27:44<2:49:20, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 89%|████████▉ | 11057/12384 [23:27:52<2:49:20, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 0: 89%|████████▉ | 11058/12384 [23:27:52<2:48:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 0: 89%|████████▉ | 11058/12384 [23:27:59<2:48:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 0: 89%|████████▉ | 11059/12384 [23:27:59<2:48:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 0: 89%|████████▉ | 11059/12384 [23:28:07<2:48:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 0: 89%|████████▉ | 11060/12384 [23:28:07<2:48:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 0: 89%|████████▉ | 11060/12384 [23:28:14<2:48:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 89%|████████▉ | 11061/12384 [23:28:14<2:47:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 89%|████████▉ | 11061/12384 [23:28:22<2:47:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 0: 89%|████████▉ | 11062/12384 [23:28:24<2:58:01, 8.08s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 0: 89%|████████▉ | 11062/12384 [23:28:31<2:58:01, 8.08s/it, loss=0.0000, acc=1.0000, iter_time=10.95s]
Epoch 0: 89%|████████▉ | 11063/12384 [23:28:31<2:54:43, 7.94s/it, loss=0.0000, acc=1.0000, iter_time=10.95s]
Epoch 0: 89%|████████▉ | 11063/12384 [23:28:39<2:54:43, 7.94s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 0: 89%|████████▉ | 11064/12384 [23:28:39<2:52:20, 7.83s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 0: 89%|████████▉ | 11064/12384 [23:28:46<2:52:20, 7.83s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 89%|████████▉ | 11065/12384 [23:28:46<2:50:44, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 89%|████████▉ | 11065/12384 [23:28:54<2:50:44, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 89%|████████▉ | 11066/12384 [23:28:54<2:49:39, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 89%|████████▉ | 11066/12384 [23:29:02<2:49:39, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 89%|████████▉ | 11067/12384 [23:29:02<2:48:44, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 89%|████████▉ | 11067/12384 [23:29:09<2:48:44, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 89%|████████▉ | 11068/12384 [23:29:09<2:48:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 89%|████████▉ | 11068/12384 [23:29:17<2:48:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 89%|████████▉ | 11069/12384 [23:29:17<2:47:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 89%|████████▉ | 11069/12384 [23:29:24<2:47:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 0: 89%|████████▉ | 11070/12384 [23:29:24<2:47:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 0: 89%|████████▉ | 11070/12384 [23:29:32<2:47:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 0: 89%|████████▉ | 11071/12384 [23:29:32<2:47:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 0: 89%|████████▉ | 11071/12384 [23:29:40<2:47:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 0: 89%|████████▉ | 11072/12384 [23:29:40<2:46:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 0: 89%|████████▉ | 11072/12384 [23:29:47<2:46:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 89%|████████▉ | 11073/12384 [23:29:47<2:46:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 89%|████████▉ | 11073/12384 [23:29:55<2:46:33, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=7.61s]
Epoch 0: 89%|████████▉ | 11074/12384 [23:29:55<2:46:20, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=7.61s]
Epoch 0: 89%|████████▉ | 11074/12384 [23:30:03<2:46:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 89%|████████▉ | 11075/12384 [23:30:03<2:48:15, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 89%|████████▉ | 11075/12384 [23:30:10<2:48:15, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.82s]
Epoch 0: 89%|████████▉ | 11076/12384 [23:30:10<2:47:17, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.82s]
Epoch 0: 89%|████████▉ | 11076/12384 [23:30:18<2:47:17, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.01s]
Epoch 0: 89%|████████▉ | 11077/12384 [23:30:18<2:46:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.01s]
Epoch 0: 89%|████████▉ | 11077/12384 [23:30:26<2:46:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 0: 89%|████████▉ | 11078/12384 [23:30:26<2:46:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 0: 89%|████████▉ | 11078/12384 [23:30:33<2:46:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 0: 89%|████████▉ | 11079/12384 [23:30:33<2:45:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 0: 89%|████████▉ | 11079/12384 [23:30:41<2:45:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 0: 89%|████████▉ | 11080/12384 [23:30:41<2:47:23, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 0: 89%|████████▉ | 11080/12384 [23:30:49<2:47:23, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 89%|████████▉ | 11081/12384 [23:30:49<2:46:38, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 89%|████████▉ | 11081/12384 [23:30:56<2:46:38, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 0: 89%|████████▉ | 11082/12384 [23:30:56<2:46:08, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 0: 89%|████████▉ | 11082/12384 [23:31:04<2:46:08, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 0: 89%|████████▉ | 11083/12384 [23:31:04<2:45:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 0: 89%|████████▉ | 11083/12384 [23:31:12<2:45:37, 7.64s/it, loss=0.0001, acc=0.9999, iter_time=6.68s]
Epoch 0: 90%|████████▉ | 11084/12384 [23:31:12<2:45:19, 7.63s/it, loss=0.0001, acc=0.9999, iter_time=6.68s]
Epoch 0: 90%|████████▉ | 11084/12384 [23:31:19<2:45:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 0: 90%|████████▉ | 11085/12384 [23:31:19<2:45:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 0: 90%|████████▉ | 11085/12384 [23:31:27<2:45:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 90%|████████▉ | 11086/12384 [23:31:27<2:44:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 90%|████████▉ | 11086/12384 [23:31:34<2:44:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 0: 90%|████████▉ | 11087/12384 [23:31:34<2:45:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 0: 90%|████████▉ | 11087/12384 [23:31:42<2:45:14, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=8.83s]
Epoch 0: 90%|████████▉ | 11088/12384 [23:31:42<2:44:44, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=8.83s]
Epoch 0: 90%|████████▉ | 11088/12384 [23:31:50<2:44:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 90%|████████▉ | 11089/12384 [23:31:50<2:45:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 90%|████████▉ | 11089/12384 [23:31:57<2:45:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 90%|████████▉ | 11090/12384 [23:31:57<2:44:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 90%|████████▉ | 11090/12384 [23:32:05<2:44:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 0: 90%|████████▉ | 11091/12384 [23:32:05<2:44:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 0: 90%|████████▉ | 11091/12384 [23:32:13<2:44:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 0: 90%|████████▉ | 11092/12384 [23:32:13<2:44:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 0: 90%|████████▉ | 11092/12384 [23:32:20<2:44:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 90%|████████▉ | 11093/12384 [23:32:20<2:44:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 90%|████████▉ | 11093/12384 [23:32:28<2:44:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 90%|████████▉ | 11094/12384 [23:32:28<2:43:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 90%|████████▉ | 11094/12384 [23:32:36<2:43:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 90%|████████▉ | 11095/12384 [23:32:36<2:44:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 90%|████████▉ | 11095/12384 [23:32:43<2:44:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 0: 90%|████████▉ | 11096/12384 [23:32:43<2:44:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 0: 90%|████████▉ | 11096/12384 [23:32:51<2:44:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.69s]
Epoch 0: 90%|████████▉ | 11097/12384 [23:32:51<2:43:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.69s]
Epoch 0: 90%|████████▉ | 11097/12384 [23:32:58<2:43:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 90%|████████▉ | 11098/12384 [23:32:58<2:43:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 90%|████████▉ | 11098/12384 [23:33:06<2:43:31, 7.63s/it, loss=0.0004, acc=1.0000, iter_time=6.55s]
Epoch 0: 90%|████████▉ | 11099/12384 [23:33:06<2:43:20, 7.63s/it, loss=0.0004, acc=1.0000, iter_time=6.55s]
Epoch 0: 90%|████████▉ | 11099/12384 [23:33:14<2:43:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.60s]
Epoch 0: 90%|████████▉ | 11100/12384 [23:33:14<2:43:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.60s]
Epoch 0: 90%|████████▉ | 11100/12384 [23:33:22<2:43:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 90%|████████▉ | 11101/12384 [23:33:22<2:44:59, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 90%|████████▉ | 11101/12384 [23:33:29<2:44:59, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 90%|████████▉ | 11102/12384 [23:33:29<2:44:13, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 90%|████████▉ | 11102/12384 [23:33:37<2:44:13, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 90%|████████▉ | 11103/12384 [23:33:37<2:43:28, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 90%|████████▉ | 11103/12384 [23:33:44<2:43:28, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 0: 90%|████████▉ | 11104/12384 [23:33:44<2:42:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 0: 90%|████████▉ | 11104/12384 [23:33:52<2:42:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 0: 90%|████████▉ | 11105/12384 [23:33:52<2:44:25, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 0: 90%|████████▉ | 11105/12384 [23:34:00<2:44:25, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 0: 90%|████████▉ | 11106/12384 [23:34:00<2:43:32, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 0: 90%|████████▉ | 11106/12384 [23:34:08<2:43:32, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.39s]
Epoch 0: 90%|████████▉ | 11107/12384 [23:34:08<2:43:14, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.39s]
Epoch 0: 90%|████████▉ | 11107/12384 [23:34:15<2:43:14, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 0: 90%|████████▉ | 11108/12384 [23:34:15<2:42:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 0: 90%|████████▉ | 11108/12384 [23:34:23<2:42:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 0: 90%|████████▉ | 11109/12384 [23:34:23<2:42:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 0: 90%|████████▉ | 11109/12384 [23:34:30<2:42:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 90%|████████▉ | 11110/12384 [23:34:30<2:42:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 90%|████████▉ | 11110/12384 [23:34:38<2:42:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 90%|████████▉ | 11111/12384 [23:34:38<2:41:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 90%|████████▉ | 11111/12384 [23:34:46<2:41:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 90%|████████▉ | 11112/12384 [23:34:46<2:41:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 90%|████████▉ | 11112/12384 [23:34:53<2:41:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 0: 90%|████████▉ | 11113/12384 [23:34:53<2:41:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 0: 90%|████████▉ | 11113/12384 [23:35:01<2:41:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 0: 90%|████████▉ | 11114/12384 [23:35:01<2:41:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 0: 90%|████████▉ | 11114/12384 [23:35:08<2:41:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 90%|████████▉ | 11115/12384 [23:35:08<2:41:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 90%|████████▉ | 11115/12384 [23:35:16<2:41:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 0: 90%|████████▉ | 11116/12384 [23:35:16<2:40:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 0: 90%|████████▉ | 11116/12384 [23:35:24<2:40:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 0: 90%|████████▉ | 11117/12384 [23:35:24<2:40:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 0: 90%|████████▉ | 11117/12384 [23:35:31<2:40:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 0: 90%|████████▉ | 11118/12384 [23:35:31<2:40:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 0: 90%|████████▉ | 11118/12384 [23:35:39<2:40:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 0: 90%|████████▉ | 11119/12384 [23:35:39<2:40:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 0: 90%|████████▉ | 11119/12384 [23:35:47<2:40:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.84s]
Epoch 0: 90%|████████▉ | 11120/12384 [23:35:47<2:40:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.84s]
Epoch 0: 90%|████████▉ | 11120/12384 [23:35:54<2:40:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 0: 90%|████████▉ | 11121/12384 [23:35:54<2:40:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 0: 90%|████████▉ | 11121/12384 [23:36:02<2:40:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.24s]
Epoch 0: 90%|████████▉ | 11122/12384 [23:36:02<2:40:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.24s]
Epoch 0: 90%|████████▉ | 11122/12384 [23:36:09<2:40:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.96s]
Epoch 0: 90%|████████▉ | 11123/12384 [23:36:09<2:40:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.96s]
Epoch 0: 90%|████████▉ | 11123/12384 [23:36:17<2:40:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 90%|████████▉ | 11124/12384 [23:36:17<2:39:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 90%|████████▉ | 11124/12384 [23:36:25<2:39:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 90%|████████▉ | 11125/12384 [23:36:25<2:40:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 90%|████████▉ | 11125/12384 [23:36:32<2:40:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 90%|████████▉ | 11126/12384 [23:36:32<2:39:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 90%|████████▉ | 11126/12384 [23:36:40<2:39:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 90%|████████▉ | 11127/12384 [23:36:40<2:39:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 90%|████████▉ | 11127/12384 [23:36:48<2:39:36, 7.62s/it, loss=0.0002, acc=0.9997, iter_time=8.05s]
Epoch 0: 90%|████████▉ | 11128/12384 [23:36:48<2:41:34, 7.72s/it, loss=0.0002, acc=0.9997, iter_time=8.05s]
Epoch 0: 90%|████████▉ | 11128/12384 [23:36:55<2:41:34, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.49s]
Epoch 0: 90%|████████▉ | 11129/12384 [23:36:55<2:40:47, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.49s]
Epoch 0: 90%|████████▉ | 11129/12384 [23:37:03<2:40:47, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 0: 90%|████████▉ | 11130/12384 [23:37:03<2:40:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 0: 90%|████████▉ | 11130/12384 [23:37:11<2:40:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 0: 90%|████████▉ | 11131/12384 [23:37:11<2:39:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 0: 90%|████████▉ | 11131/12384 [23:37:18<2:39:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 0: 90%|████████▉ | 11132/12384 [23:37:18<2:39:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 0: 90%|████████▉ | 11132/12384 [23:37:26<2:39:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 90%|████████▉ | 11133/12384 [23:37:26<2:39:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 90%|████████▉ | 11133/12384 [23:37:34<2:39:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.44s]
Epoch 0: 90%|████████▉ | 11134/12384 [23:37:34<2:39:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.44s]
Epoch 0: 90%|████████▉ | 11134/12384 [23:37:41<2:39:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 0: 90%|████████▉ | 11135/12384 [23:37:41<2:38:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 0: 90%|████████▉ | 11135/12384 [23:37:49<2:38:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.02s]
Epoch 0: 90%|████████▉ | 11136/12384 [23:37:49<2:38:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.02s]
Epoch 0: 90%|████████▉ | 11136/12384 [23:37:56<2:38:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.47s]
Epoch 0: 90%|████████▉ | 11137/12384 [23:37:56<2:38:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.47s]
Epoch 0: 90%|████████▉ | 11137/12384 [23:38:04<2:38:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 90%|████████▉ | 11138/12384 [23:38:04<2:38:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 90%|████████▉ | 11138/12384 [23:38:12<2:38:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 0: 90%|████████▉ | 11139/12384 [23:38:12<2:37:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 0: 90%|████████▉ | 11139/12384 [23:38:19<2:37:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.22s]
Epoch 0: 90%|████████▉ | 11140/12384 [23:38:19<2:37:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.22s]
Epoch 0: 90%|████████▉ | 11140/12384 [23:38:27<2:37:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.48s]
Epoch 0: 90%|████████▉ | 11141/12384 [23:38:27<2:37:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.48s]
Epoch 0: 90%|████████▉ | 11141/12384 [23:38:34<2:37:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 90%|████████▉ | 11142/12384 [23:38:34<2:37:24, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 90%|████████▉ | 11142/12384 [23:38:42<2:37:24, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 90%|████████▉ | 11143/12384 [23:38:42<2:37:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 90%|████████▉ | 11143/12384 [23:38:50<2:37:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 0: 90%|████████▉ | 11144/12384 [23:38:50<2:37:05, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 0: 90%|████████▉ | 11144/12384 [23:38:57<2:37:05, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 90%|████████▉ | 11145/12384 [23:38:57<2:36:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 90%|████████▉ | 11145/12384 [23:39:05<2:36:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 90%|█████████ | 11146/12384 [23:39:05<2:36:50, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 90%|█████████ | 11146/12384 [23:39:12<2:36:50, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 90%|█████████ | 11147/12384 [23:39:12<2:36:36, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 90%|█████████ | 11147/12384 [23:39:20<2:36:36, 7.60s/it, loss=0.0001, acc=0.9997, iter_time=6.67s]
Epoch 0: 90%|█████████ | 11148/12384 [23:39:20<2:36:29, 7.60s/it, loss=0.0001, acc=0.9997, iter_time=6.67s]
Epoch 0: 90%|█████████ | 11148/12384 [23:39:28<2:36:29, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 0: 90%|█████████ | 11149/12384 [23:39:28<2:36:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 0: 90%|█████████ | 11149/12384 [23:39:35<2:36:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 0: 90%|█████████ | 11150/12384 [23:39:35<2:36:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 0: 90%|█████████ | 11150/12384 [23:39:43<2:36:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 90%|█████████ | 11151/12384 [23:39:43<2:36:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 90%|█████████ | 11151/12384 [23:39:50<2:36:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 90%|█████████ | 11152/12384 [23:39:50<2:36:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 90%|█████████ | 11152/12384 [23:39:58<2:36:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 90%|█████████ | 11153/12384 [23:39:58<2:36:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 90%|█████████ | 11153/12384 [23:40:06<2:36:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 0: 90%|█████████ | 11154/12384 [23:40:06<2:38:32, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 0: 90%|█████████ | 11154/12384 [23:40:14<2:38:32, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=10.82s]
Epoch 0: 90%|█████████ | 11155/12384 [23:40:14<2:37:31, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.82s]
Epoch 0: 90%|█████████ | 11155/12384 [23:40:21<2:37:31, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 0: 90%|█████████ | 11156/12384 [23:40:21<2:36:51, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 0: 90%|█████████ | 11156/12384 [23:40:29<2:36:51, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=6.78s]
Epoch 0: 90%|█████████ | 11157/12384 [23:40:29<2:36:37, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=6.78s]
Epoch 0: 90%|█████████ | 11157/12384 [23:40:37<2:36:37, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 90%|█████████ | 11158/12384 [23:40:37<2:36:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 90%|█████████ | 11158/12384 [23:40:44<2:36:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 0: 90%|█████████ | 11159/12384 [23:40:44<2:35:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 0: 90%|█████████ | 11159/12384 [23:40:52<2:35:45, 7.63s/it, loss=0.0001, acc=0.9988, iter_time=7.99s]
Epoch 0: 90%|█████████ | 11160/12384 [23:40:52<2:35:28, 7.62s/it, loss=0.0001, acc=0.9988, iter_time=7.99s]
Epoch 0: 90%|█████████ | 11160/12384 [23:40:59<2:35:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 90%|█████████ | 11161/12384 [23:40:59<2:35:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 90%|█████████ | 11161/12384 [23:41:07<2:35:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 90%|█████████ | 11162/12384 [23:41:07<2:35:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 90%|█████████ | 11162/12384 [23:41:15<2:35:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 0: 90%|█████████ | 11163/12384 [23:41:15<2:34:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 0: 90%|█████████ | 11163/12384 [23:41:22<2:34:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 0: 90%|█████████ | 11164/12384 [23:41:22<2:34:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 0: 90%|█████████ | 11164/12384 [23:41:30<2:34:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 0: 90%|█████████ | 11165/12384 [23:41:30<2:34:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 0: 90%|█████████ | 11165/12384 [23:41:37<2:34:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 0: 90%|█████████ | 11166/12384 [23:41:37<2:34:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 0: 90%|█████████ | 11166/12384 [23:41:45<2:34:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 0: 90%|█████████ | 11167/12384 [23:41:45<2:35:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 0: 90%|█████████ | 11167/12384 [23:41:53<2:35:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 0: 90%|█████████ | 11168/12384 [23:41:53<2:34:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 0: 90%|█████████ | 11168/12384 [23:42:00<2:34:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 0: 90%|█████████ | 11169/12384 [23:42:00<2:34:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 0: 90%|█████████ | 11169/12384 [23:42:08<2:34:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 0: 90%|█████████ | 11170/12384 [23:42:08<2:34:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 0: 90%|█████████ | 11170/12384 [23:42:16<2:34:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 0: 90%|█████████ | 11171/12384 [23:42:16<2:34:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 0: 90%|█████████ | 11171/12384 [23:42:23<2:34:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 0: 90%|█████████ | 11172/12384 [23:42:23<2:34:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 0: 90%|█████████ | 11172/12384 [23:42:31<2:34:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 0: 90%|█████████ | 11173/12384 [23:42:31<2:33:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 0: 90%|█████████ | 11173/12384 [23:42:38<2:33:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 90%|█████████ | 11174/12384 [23:42:38<2:33:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 90%|█████████ | 11174/12384 [23:42:46<2:33:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 90%|█████████ | 11175/12384 [23:42:46<2:33:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 90%|█████████ | 11175/12384 [23:42:54<2:33:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 90%|█████████ | 11176/12384 [23:42:54<2:33:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 90%|█████████ | 11176/12384 [23:43:01<2:33:23, 7.62s/it, loss=0.0006, acc=0.9989, iter_time=7.21s]
Epoch 0: 90%|█████████ | 11177/12384 [23:43:01<2:33:19, 7.62s/it, loss=0.0006, acc=0.9989, iter_time=7.21s]
Epoch 0: 90%|█████████ | 11177/12384 [23:43:09<2:33:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 90%|█████████ | 11178/12384 [23:43:09<2:33:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 90%|█████████ | 11178/12384 [23:43:17<2:33:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 90%|█████████ | 11179/12384 [23:43:17<2:33:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 90%|█████████ | 11179/12384 [23:43:24<2:33:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 0: 90%|█████████ | 11180/12384 [23:43:24<2:32:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 0: 90%|█████████ | 11180/12384 [23:43:32<2:32:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 0: 90%|█████████ | 11181/12384 [23:43:32<2:34:56, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 0: 90%|█████████ | 11181/12384 [23:43:40<2:34:56, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=11.39s]
Epoch 0: 90%|█████████ | 11182/12384 [23:43:40<2:34:09, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=11.39s]
Epoch 0: 90%|█████████ | 11182/12384 [23:43:47<2:34:09, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 90%|█████████ | 11183/12384 [23:43:47<2:33:27, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 90%|█████████ | 11183/12384 [23:43:55<2:33:27, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 90%|█████████ | 11184/12384 [23:43:55<2:33:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 90%|█████████ | 11184/12384 [23:44:03<2:33:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 90%|█████████ | 11185/12384 [23:44:03<2:33:08, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 90%|█████████ | 11185/12384 [23:44:10<2:33:08, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 90%|█████████ | 11186/12384 [23:44:10<2:32:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 90%|█████████ | 11186/12384 [23:44:18<2:32:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 90%|█████████ | 11187/12384 [23:44:18<2:32:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 90%|█████████ | 11187/12384 [23:44:26<2:32:21, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.32s]
Epoch 0: 90%|█████████ | 11188/12384 [23:44:26<2:32:00, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.32s]
Epoch 0: 90%|█████████ | 11188/12384 [23:44:33<2:32:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 0: 90%|█████████ | 11189/12384 [23:44:33<2:31:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 0: 90%|█████████ | 11189/12384 [23:44:41<2:31:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 90%|█████████ | 11190/12384 [23:44:41<2:31:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 90%|█████████ | 11190/12384 [23:44:48<2:31:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 90%|█████████ | 11191/12384 [23:44:48<2:31:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 90%|█████████ | 11191/12384 [23:44:56<2:31:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 90%|█████████ | 11192/12384 [23:44:56<2:31:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 90%|█████████ | 11192/12384 [23:45:04<2:31:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 90%|█████████ | 11193/12384 [23:45:04<2:31:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 90%|█████████ | 11193/12384 [23:45:11<2:31:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 90%|█████████ | 11194/12384 [23:45:11<2:31:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 90%|█████████ | 11194/12384 [23:45:19<2:31:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 0: 90%|█████████ | 11195/12384 [23:45:19<2:30:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 0: 90%|█████████ | 11195/12384 [23:45:26<2:30:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 0: 90%|█████████ | 11196/12384 [23:45:26<2:30:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 0: 90%|█████████ | 11196/12384 [23:45:34<2:30:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.40s]
Epoch 0: 90%|█████████ | 11197/12384 [23:45:34<2:30:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.40s]
Epoch 0: 90%|█████████ | 11197/12384 [23:45:42<2:30:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.82s]
Epoch 0: 90%|█████████ | 11198/12384 [23:45:42<2:30:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.82s]
Epoch 0: 90%|█████████ | 11198/12384 [23:45:49<2:30:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 0: 90%|█████████ | 11199/12384 [23:45:49<2:30:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 0: 90%|█████████ | 11199/12384 [23:45:57<2:30:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 90%|█████████ | 11200/12384 [23:45:57<2:30:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 90%|█████████ | 11200/12384 [23:46:04<2:30:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 90%|█████████ | 11201/12384 [23:46:04<2:30:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 90%|█████████ | 11201/12384 [23:46:12<2:30:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 90%|█████████ | 11202/12384 [23:46:12<2:29:46, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 90%|█████████ | 11202/12384 [23:46:20<2:29:46, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 90%|█████████ | 11203/12384 [23:46:20<2:29:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 90%|█████████ | 11203/12384 [23:46:27<2:29:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 90%|█████████ | 11204/12384 [23:46:27<2:29:24, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 90%|█████████ | 11204/12384 [23:46:35<2:29:24, 7.60s/it, loss=0.0029, acc=0.9961, iter_time=7.59s]
Epoch 0: 90%|█████████ | 11205/12384 [23:46:35<2:29:17, 7.60s/it, loss=0.0029, acc=0.9961, iter_time=7.59s]
Epoch 0: 90%|█████████ | 11205/12384 [23:46:42<2:29:17, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 90%|█████████ | 11206/12384 [23:46:42<2:29:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 90%|█████████ | 11206/12384 [23:46:50<2:29:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.65s]
Epoch 0: 90%|█████████ | 11207/12384 [23:46:50<2:31:21, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.65s]
Epoch 0: 90%|█████████ | 11207/12384 [23:46:58<2:31:21, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 0: 91%|█████████ | 11208/12384 [23:46:58<2:30:39, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 0: 91%|█████████ | 11208/12384 [23:47:06<2:30:39, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.68s]
Epoch 0: 91%|█████████ | 11209/12384 [23:47:06<2:29:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.68s]
Epoch 0: 91%|█████████ | 11209/12384 [23:47:13<2:29:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 0: 91%|█████████ | 11210/12384 [23:47:13<2:29:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 0: 91%|█████████ | 11210/12384 [23:47:21<2:29:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 91%|█████████ | 11211/12384 [23:47:21<2:29:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 91%|█████████ | 11211/12384 [23:47:28<2:29:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 0: 91%|█████████ | 11212/12384 [23:47:28<2:28:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 0: 91%|█████████ | 11212/12384 [23:47:36<2:28:49, 7.62s/it, loss=0.0004, acc=0.9983, iter_time=10.39s]
Epoch 0: 91%|█████████ | 11213/12384 [23:47:36<2:28:39, 7.62s/it, loss=0.0004, acc=0.9983, iter_time=10.39s]
Epoch 0: 91%|█████████ | 11213/12384 [23:47:44<2:28:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 91%|█████████ | 11214/12384 [23:47:44<2:28:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 91%|█████████ | 11214/12384 [23:47:51<2:28:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 91%|█████████ | 11215/12384 [23:47:51<2:28:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 91%|█████████ | 11215/12384 [23:47:59<2:28:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 91%|█████████ | 11216/12384 [23:47:59<2:28:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 91%|█████████ | 11216/12384 [23:48:06<2:28:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 91%|█████████ | 11217/12384 [23:48:06<2:27:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 91%|█████████ | 11217/12384 [23:48:14<2:27:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 0: 91%|█████████ | 11218/12384 [23:48:14<2:27:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 0: 91%|█████████ | 11218/12384 [23:48:22<2:27:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.62s]
Epoch 0: 91%|█████████ | 11219/12384 [23:48:22<2:27:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.62s]
Epoch 0: 91%|█████████ | 11219/12384 [23:48:29<2:27:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.41s]
Epoch 0: 91%|█████████ | 11220/12384 [23:48:29<2:27:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.41s]
Epoch 0: 91%|█████████ | 11220/12384 [23:48:37<2:27:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 91%|█████████ | 11221/12384 [23:48:37<2:27:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 91%|█████████ | 11221/12384 [23:48:45<2:27:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 91%|█████████ | 11222/12384 [23:48:45<2:27:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 91%|█████████ | 11222/12384 [23:48:52<2:27:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 0: 91%|█████████ | 11223/12384 [23:48:52<2:27:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 0: 91%|█████████ | 11223/12384 [23:49:00<2:27:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 91%|█████████ | 11224/12384 [23:49:00<2:27:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 91%|█████████ | 11224/12384 [23:49:07<2:27:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 91%|█████████ | 11225/12384 [23:49:07<2:27:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 91%|█████████ | 11225/12384 [23:49:15<2:27:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.42s]
Epoch 0: 91%|█████████ | 11226/12384 [23:49:15<2:27:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.42s]
Epoch 0: 91%|█████████ | 11226/12384 [23:49:23<2:27:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 0: 91%|█████████ | 11227/12384 [23:49:23<2:26:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 0: 91%|█████████ | 11227/12384 [23:49:30<2:26:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 0: 91%|█████████ | 11228/12384 [23:49:30<2:26:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 0: 91%|█████████ | 11228/12384 [23:49:38<2:26:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 0: 91%|█████████ | 11229/12384 [23:49:38<2:26:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 0: 91%|█████████ | 11229/12384 [23:49:45<2:26:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 0: 91%|█████████ | 11230/12384 [23:49:45<2:26:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 0: 91%|█████████ | 11230/12384 [23:49:53<2:26:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 0: 91%|█████████ | 11231/12384 [23:49:53<2:26:07, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 0: 91%|█████████ | 11231/12384 [23:50:01<2:26:07, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 0: 91%|█████████ | 11232/12384 [23:50:01<2:26:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 0: 91%|█████████ | 11232/12384 [23:50:09<2:26:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 91%|█████████ | 11233/12384 [23:50:09<2:27:45, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 91%|█████████ | 11233/12384 [23:50:16<2:27:45, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 91%|█████████ | 11234/12384 [23:50:16<2:27:17, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 91%|█████████ | 11234/12384 [23:50:24<2:27:17, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 91%|█████████ | 11235/12384 [23:50:24<2:28:20, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 91%|█████████ | 11235/12384 [23:50:32<2:28:20, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 91%|█████████ | 11236/12384 [23:50:32<2:27:28, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 91%|█████████ | 11236/12384 [23:50:39<2:27:28, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 91%|█████████ | 11237/12384 [23:50:39<2:26:40, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 91%|█████████ | 11237/12384 [23:50:47<2:26:40, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 91%|█████████ | 11238/12384 [23:50:47<2:26:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 91%|█████████ | 11238/12384 [23:50:55<2:26:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.78s]
Epoch 0: 91%|█████████ | 11239/12384 [23:50:55<2:25:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.78s]
Epoch 0: 91%|█████████ | 11239/12384 [23:51:02<2:25:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.81s]
Epoch 0: 91%|█████████ | 11240/12384 [23:51:02<2:26:07, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.81s]
Epoch 0: 91%|█████████ | 11240/12384 [23:51:10<2:26:07, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 0: 91%|█████████ | 11241/12384 [23:51:10<2:25:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 0: 91%|█████████ | 11241/12384 [23:51:17<2:25:33, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=9.63s]
Epoch 0: 91%|█████████ | 11242/12384 [23:51:17<2:25:17, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.63s]
Epoch 0: 91%|█████████ | 11242/12384 [23:51:25<2:25:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 0: 91%|█████████ | 11243/12384 [23:51:25<2:25:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 0: 91%|█████████ | 11243/12384 [23:51:33<2:25:05, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=8.10s]
Epoch 0: 91%|█████████ | 11244/12384 [23:51:33<2:24:54, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=8.10s]
Epoch 0: 91%|█████████ | 11244/12384 [23:51:40<2:24:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 0: 91%|█████████ | 11245/12384 [23:51:40<2:24:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 0: 91%|█████████ | 11245/12384 [23:51:48<2:24:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 91%|█████████ | 11246/12384 [23:51:48<2:24:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 91%|█████████ | 11246/12384 [23:51:56<2:24:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 91%|█████████ | 11247/12384 [23:51:56<2:24:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 91%|█████████ | 11247/12384 [23:52:03<2:24:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 0: 91%|█████████ | 11248/12384 [23:52:03<2:24:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 0: 91%|█████████ | 11248/12384 [23:52:11<2:24:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 91%|█████████ | 11249/12384 [23:52:11<2:24:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 91%|█████████ | 11249/12384 [23:52:18<2:24:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 91%|█████████ | 11250/12384 [23:52:18<2:23:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 91%|█████████ | 11250/12384 [23:52:26<2:23:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 91%|█████████ | 11251/12384 [23:52:26<2:23:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 91%|█████████ | 11251/12384 [23:52:34<2:23:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 91%|█████████ | 11252/12384 [23:52:34<2:23:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 91%|█████████ | 11252/12384 [23:52:41<2:23:32, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=6.67s]
Epoch 0: 91%|█████████ | 11253/12384 [23:52:41<2:23:21, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=6.67s]
Epoch 0: 91%|█████████ | 11253/12384 [23:52:49<2:23:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 0: 91%|█████████ | 11254/12384 [23:52:49<2:23:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 0: 91%|█████████ | 11254/12384 [23:52:56<2:23:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 0: 91%|█████████ | 11255/12384 [23:52:56<2:23:01, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 0: 91%|█████████ | 11255/12384 [23:53:04<2:23:01, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.98s]
Epoch 0: 91%|█████████ | 11256/12384 [23:53:04<2:22:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.98s]
Epoch 0: 91%|█████████ | 11256/12384 [23:53:12<2:22:56, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 0: 91%|█████████ | 11257/12384 [23:53:12<2:22:46, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 0: 91%|█████████ | 11257/12384 [23:53:19<2:22:46, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 91%|█████████ | 11258/12384 [23:53:19<2:22:40, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 91%|█████████ | 11258/12384 [23:53:27<2:22:40, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 91%|█████████ | 11259/12384 [23:53:27<2:24:26, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 91%|█████████ | 11259/12384 [23:53:35<2:24:26, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 0: 91%|█████████ | 11260/12384 [23:53:35<2:24:18, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 0: 91%|█████████ | 11260/12384 [23:53:43<2:24:18, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 91%|█████████ | 11261/12384 [23:53:43<2:25:18, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 91%|█████████ | 11261/12384 [23:53:50<2:25:18, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 91%|█████████ | 11262/12384 [23:53:50<2:24:38, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 91%|█████████ | 11262/12384 [23:53:58<2:24:38, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 0: 91%|█████████ | 11263/12384 [23:53:58<2:23:40, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 0: 91%|█████████ | 11263/12384 [23:54:06<2:23:40, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=11.25s]
Epoch 0: 91%|█████████ | 11264/12384 [23:54:06<2:23:04, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=11.25s]
Epoch 0: 91%|█████████ | 11264/12384 [23:54:13<2:23:04, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 91%|█████████ | 11265/12384 [23:54:13<2:22:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 91%|█████████ | 11265/12384 [23:54:21<2:22:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 0: 91%|█████████ | 11266/12384 [23:54:21<2:22:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 0: 91%|█████████ | 11266/12384 [23:54:28<2:22:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.11s]
Epoch 0: 91%|█████████ | 11267/12384 [23:54:28<2:22:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.11s]
Epoch 0: 91%|█████████ | 11267/12384 [23:54:36<2:22:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 91%|█████████ | 11268/12384 [23:54:36<2:21:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 91%|█████████ | 11268/12384 [23:54:44<2:21:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 91%|█████████ | 11269/12384 [23:54:44<2:21:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 91%|█████████ | 11269/12384 [23:54:51<2:21:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 91%|█████████ | 11270/12384 [23:54:51<2:21:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 91%|█████████ | 11270/12384 [23:54:59<2:21:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 91%|█████████ | 11271/12384 [23:54:59<2:21:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 91%|█████████ | 11271/12384 [23:55:07<2:21:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 91%|█████████ | 11272/12384 [23:55:07<2:21:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 91%|█████████ | 11272/12384 [23:55:14<2:21:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 0: 91%|█████████ | 11273/12384 [23:55:14<2:21:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 0: 91%|█████████ | 11273/12384 [23:55:22<2:21:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 0: 91%|█████████ | 11274/12384 [23:55:22<2:21:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 0: 91%|█████████ | 11274/12384 [23:55:29<2:21:03, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.78s]
Epoch 0: 91%|█████████ | 11275/12384 [23:55:29<2:20:47, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.78s]
Epoch 0: 91%|█████████ | 11275/12384 [23:55:37<2:20:47, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=7.59s]
Epoch 0: 91%|█████████ | 11276/12384 [23:55:37<2:20:34, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=7.59s]
Epoch 0: 91%|█████████ | 11276/12384 [23:55:45<2:20:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 91%|█████████ | 11277/12384 [23:55:45<2:20:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 91%|█████████ | 11277/12384 [23:55:52<2:20:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 91%|█████████ | 11278/12384 [23:55:52<2:20:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 91%|█████████ | 11278/12384 [23:56:00<2:20:19, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 91%|█████████ | 11279/12384 [23:56:00<2:20:05, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 91%|█████████ | 11279/12384 [23:56:07<2:20:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 91%|█████████ | 11280/12384 [23:56:07<2:20:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 91%|█████████ | 11280/12384 [23:56:15<2:20:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.45s]
Epoch 0: 91%|█████████ | 11281/12384 [23:56:15<2:19:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.45s]
Epoch 0: 91%|█████████ | 11281/12384 [23:56:23<2:19:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 0: 91%|█████████ | 11282/12384 [23:56:23<2:19:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 0: 91%|█████████ | 11282/12384 [23:56:30<2:19:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 0: 91%|█████████ | 11283/12384 [23:56:30<2:19:32, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 0: 91%|█████████ | 11283/12384 [23:56:38<2:19:32, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 0: 91%|█████████ | 11284/12384 [23:56:38<2:19:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 0: 91%|█████████ | 11284/12384 [23:56:46<2:19:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 0: 91%|█████████ | 11285/12384 [23:56:46<2:21:14, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 0: 91%|█████████ | 11285/12384 [23:56:53<2:21:14, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.92s]
Epoch 0: 91%|█████████ | 11286/12384 [23:56:53<2:20:31, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.92s]
Epoch 0: 91%|█████████ | 11286/12384 [23:57:01<2:20:31, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.57s]
Epoch 0: 91%|█████████ | 11287/12384 [23:57:01<2:20:09, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.57s]
Epoch 0: 91%|█████████ | 11287/12384 [23:57:09<2:20:09, 7.67s/it, loss=0.0005, acc=0.9976, iter_time=8.05s]
Epoch 0: 91%|█████████ | 11288/12384 [23:57:09<2:19:42, 7.65s/it, loss=0.0005, acc=0.9976, iter_time=8.05s]
Epoch 0: 91%|█████████ | 11288/12384 [23:57:16<2:19:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.69s]
Epoch 0: 91%|█████████ | 11289/12384 [23:57:16<2:19:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.69s]
Epoch 0: 91%|█████████ | 11289/12384 [23:57:24<2:19:16, 7.63s/it, loss=0.0001, acc=0.9994, iter_time=9.13s]
Epoch 0: 91%|█████████ | 11290/12384 [23:57:24<2:19:03, 7.63s/it, loss=0.0001, acc=0.9994, iter_time=9.13s]
Epoch 0: 91%|█████████ | 11290/12384 [23:57:32<2:19:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 91%|█████████ | 11291/12384 [23:57:32<2:18:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 91%|█████████ | 11291/12384 [23:57:39<2:18:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 0: 91%|█████████ | 11292/12384 [23:57:39<2:18:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 0: 91%|█████████ | 11292/12384 [23:57:47<2:18:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 0: 91%|█████████ | 11293/12384 [23:57:47<2:18:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 0: 91%|█████████ | 11293/12384 [23:57:54<2:18:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 0: 91%|█████████ | 11294/12384 [23:57:54<2:18:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 0: 91%|█████████ | 11294/12384 [23:58:02<2:18:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 0: 91%|█████████ | 11295/12384 [23:58:02<2:18:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 0: 91%|█████████ | 11295/12384 [23:58:10<2:18:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 0: 91%|█████████ | 11296/12384 [23:58:10<2:18:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 0: 91%|█████████ | 11296/12384 [23:58:17<2:18:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 91%|█████████ | 11297/12384 [23:58:17<2:17:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 91%|█████████ | 11297/12384 [23:58:25<2:17:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 91%|█████████ | 11298/12384 [23:58:25<2:17:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 91%|█████████ | 11298/12384 [23:58:32<2:17:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 0: 91%|█████████ | 11299/12384 [23:58:32<2:17:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 0: 91%|█████████ | 11299/12384 [23:58:40<2:17:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.24s]
Epoch 0: 91%|█████████ | 11300/12384 [23:58:40<2:17:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.24s]
Epoch 0: 91%|█████████ | 11300/12384 [23:58:48<2:17:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.63s]
Epoch 0: 91%|█████████▏| 11301/12384 [23:58:48<2:17:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.63s]
Epoch 0: 91%|█████████▏| 11301/12384 [23:58:55<2:17:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.18s]
Epoch 0: 91%|█████████▏| 11302/12384 [23:58:55<2:17:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.18s]
Epoch 0: 91%|█████████▏| 11302/12384 [23:59:03<2:17:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 91%|█████████▏| 11303/12384 [23:59:03<2:17:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 91%|█████████▏| 11303/12384 [23:59:10<2:17:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 91%|█████████▏| 11304/12384 [23:59:10<2:17:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 91%|█████████▏| 11304/12384 [23:59:18<2:17:00, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.56s]
Epoch 0: 91%|█████████▏| 11305/12384 [23:59:18<2:17:11, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.56s]
Epoch 0: 91%|█████████▏| 11305/12384 [23:59:26<2:17:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 0: 91%|█████████▏| 11306/12384 [23:59:26<2:17:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 0: 91%|█████████▏| 11306/12384 [23:59:33<2:17:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 0: 91%|█████████▏| 11307/12384 [23:59:33<2:16:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 0: 91%|█████████▏| 11307/12384 [23:59:41<2:16:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 0: 91%|█████████▏| 11308/12384 [23:59:41<2:16:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 0: 91%|█████████▏| 11308/12384 [23:59:49<2:16:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 91%|█████████▏| 11309/12384 [23:59:49<2:16:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 91%|█████████▏| 11309/12384 [23:59:56<2:16:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 91%|█████████▏| 11310/12384 [23:59:56<2:16:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 91%|█████████▏| 11310/12384 [24:00:04<2:16:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 0: 91%|█████████▏| 11311/12384 [24:00:04<2:16:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 0: 91%|█████████▏| 11311/12384 [24:00:12<2:16:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.19s]
Epoch 0: 91%|█████████▏| 11312/12384 [24:00:12<2:18:13, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=9.19s]
Epoch 0: 91%|█████████▏| 11312/12384 [24:00:19<2:18:13, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 0: 91%|█████████▏| 11313/12384 [24:00:19<2:17:18, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 0: 91%|█████████▏| 11313/12384 [24:00:27<2:17:18, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 0: 91%|█████████▏| 11314/12384 [24:00:27<2:16:50, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 0: 91%|█████████▏| 11314/12384 [24:00:35<2:16:50, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 0: 91%|█████████▏| 11315/12384 [24:00:35<2:16:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 0: 91%|█████████▏| 11315/12384 [24:00:42<2:16:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 91%|█████████▏| 11316/12384 [24:00:42<2:15:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 91%|█████████▏| 11316/12384 [24:00:50<2:15:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 0: 91%|█████████▏| 11317/12384 [24:00:50<2:15:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 0: 91%|█████████▏| 11317/12384 [24:00:58<2:15:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.38s]
Epoch 0: 91%|█████████▏| 11318/12384 [24:00:58<2:15:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.38s]
Epoch 0: 91%|█████████▏| 11318/12384 [24:01:05<2:15:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.78s]
Epoch 0: 91%|█████████▏| 11319/12384 [24:01:05<2:15:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.78s]
Epoch 0: 91%|█████████▏| 11319/12384 [24:01:13<2:15:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.53s]
Epoch 0: 91%|█████████▏| 11320/12384 [24:01:13<2:15:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.53s]
Epoch 0: 91%|█████████▏| 11320/12384 [24:01:20<2:15:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 0: 91%|█████████▏| 11321/12384 [24:01:20<2:14:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 0: 91%|█████████▏| 11321/12384 [24:01:28<2:14:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 91%|█████████▏| 11322/12384 [24:01:28<2:14:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 91%|█████████▏| 11322/12384 [24:01:36<2:14:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 91%|█████████▏| 11323/12384 [24:01:36<2:14:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 91%|█████████▏| 11323/12384 [24:01:43<2:14:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 0: 91%|█████████▏| 11324/12384 [24:01:43<2:14:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 0: 91%|█████████▏| 11324/12384 [24:01:51<2:14:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 0: 91%|█████████▏| 11325/12384 [24:01:51<2:14:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 0: 91%|█████████▏| 11325/12384 [24:01:58<2:14:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 91%|█████████▏| 11326/12384 [24:01:58<2:14:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 91%|█████████▏| 11326/12384 [24:02:06<2:14:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.28s]
Epoch 0: 91%|█████████▏| 11327/12384 [24:02:06<2:13:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.28s]
Epoch 0: 91%|█████████▏| 11327/12384 [24:02:14<2:13:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.87s]
Epoch 0: 91%|█████████▏| 11328/12384 [24:02:14<2:13:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.87s]
Epoch 0: 91%|█████████▏| 11328/12384 [24:02:21<2:13:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.12s]
Epoch 0: 91%|█████████▏| 11329/12384 [24:02:21<2:13:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.12s]
Epoch 0: 91%|█████████▏| 11329/12384 [24:02:29<2:13:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.94s]
Epoch 0: 91%|█████████▏| 11330/12384 [24:02:29<2:13:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.94s]
Epoch 0: 91%|█████████▏| 11330/12384 [24:02:36<2:13:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 0: 91%|█████████▏| 11331/12384 [24:02:36<2:13:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 0: 91%|█████████▏| 11331/12384 [24:02:44<2:13:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 92%|█████████▏| 11332/12384 [24:02:44<2:13:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 92%|█████████▏| 11332/12384 [24:02:52<2:13:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 92%|█████████▏| 11333/12384 [24:02:52<2:13:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 92%|█████████▏| 11333/12384 [24:02:59<2:13:13, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 92%|█████████▏| 11334/12384 [24:02:59<2:13:07, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 92%|█████████▏| 11334/12384 [24:03:07<2:13:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 0: 92%|█████████▏| 11335/12384 [24:03:07<2:13:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 0: 92%|█████████▏| 11335/12384 [24:03:15<2:13:04, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.03s]
Epoch 0: 92%|█████████▏| 11336/12384 [24:03:15<2:13:03, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.03s]
Epoch 0: 92%|█████████▏| 11336/12384 [24:03:22<2:13:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 0: 92%|█████████▏| 11337/12384 [24:03:22<2:13:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 0: 92%|█████████▏| 11337/12384 [24:03:30<2:13:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.95s]
Epoch 0: 92%|█████████▏| 11338/12384 [24:03:30<2:14:56, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.95s]
Epoch 0: 92%|█████████▏| 11338/12384 [24:03:38<2:14:56, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 0: 92%|█████████▏| 11339/12384 [24:03:38<2:15:38, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 0: 92%|█████████▏| 11339/12384 [24:03:46<2:15:38, 7.79s/it, loss=0.0001, acc=1.0000, iter_time=4.44s]
Epoch 0: 92%|█████████▏| 11340/12384 [24:03:46<2:14:31, 7.73s/it, loss=0.0001, acc=1.0000, iter_time=4.44s]
Epoch 0: 92%|█████████▏| 11340/12384 [24:03:53<2:14:31, 7.73s/it, loss=0.0001, acc=1.0000, iter_time=7.72s]
Epoch 0: 92%|█████████▏| 11341/12384 [24:03:53<2:13:50, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.72s]
Epoch 0: 92%|█████████▏| 11341/12384 [24:04:01<2:13:50, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=10.66s]
Epoch 0: 92%|█████████▏| 11342/12384 [24:04:01<2:13:13, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=10.66s]
Epoch 0: 92%|█████████▏| 11342/12384 [24:04:09<2:13:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 92%|█████████▏| 11343/12384 [24:04:09<2:12:49, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 92%|█████████▏| 11343/12384 [24:04:16<2:12:49, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 92%|█████████▏| 11344/12384 [24:04:16<2:12:45, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 92%|█████████▏| 11344/12384 [24:04:24<2:12:45, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 0: 92%|█████████▏| 11345/12384 [24:04:24<2:12:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 0: 92%|█████████▏| 11345/12384 [24:04:31<2:12:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 92%|█████████▏| 11346/12384 [24:04:31<2:12:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 92%|█████████▏| 11346/12384 [24:04:39<2:12:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 0: 92%|█████████▏| 11347/12384 [24:04:39<2:11:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 0: 92%|█████████▏| 11347/12384 [24:04:47<2:11:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 0: 92%|█████████▏| 11348/12384 [24:04:47<2:11:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 0: 92%|█████████▏| 11348/12384 [24:04:54<2:11:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 92%|█████████▏| 11349/12384 [24:04:54<2:11:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 92%|█████████▏| 11349/12384 [24:05:02<2:11:24, 7.62s/it, loss=0.0003, acc=0.9997, iter_time=8.02s]
Epoch 0: 92%|█████████▏| 11350/12384 [24:05:02<2:11:17, 7.62s/it, loss=0.0003, acc=0.9997, iter_time=8.02s]
Epoch 0: 92%|█████████▏| 11350/12384 [24:05:10<2:11:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 92%|█████████▏| 11351/12384 [24:05:10<2:11:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 92%|█████████▏| 11351/12384 [24:05:17<2:11:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 92%|█████████▏| 11352/12384 [24:05:17<2:10:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 92%|█████████▏| 11352/12384 [24:05:25<2:10:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 92%|█████████▏| 11353/12384 [24:05:25<2:10:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 92%|█████████▏| 11353/12384 [24:05:32<2:10:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 92%|█████████▏| 11354/12384 [24:05:32<2:10:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 92%|█████████▏| 11354/12384 [24:05:40<2:10:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 92%|█████████▏| 11355/12384 [24:05:40<2:10:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 92%|█████████▏| 11355/12384 [24:05:48<2:10:38, 7.62s/it, loss=0.0004, acc=0.9979, iter_time=7.64s]
Epoch 0: 92%|█████████▏| 11356/12384 [24:05:48<2:10:32, 7.62s/it, loss=0.0004, acc=0.9979, iter_time=7.64s]
Epoch 0: 92%|█████████▏| 11356/12384 [24:05:55<2:10:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 92%|█████████▏| 11357/12384 [24:05:55<2:10:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 92%|█████████▏| 11357/12384 [24:06:03<2:10:21, 7.62s/it, loss=0.0004, acc=0.9985, iter_time=7.60s]
Epoch 0: 92%|█████████▏| 11358/12384 [24:06:03<2:10:09, 7.61s/it, loss=0.0004, acc=0.9985, iter_time=7.60s]
Epoch 0: 92%|█████████▏| 11358/12384 [24:06:10<2:10:09, 7.61s/it, loss=0.0005, acc=0.9987, iter_time=7.61s]
Epoch 0: 92%|█████████▏| 11359/12384 [24:06:10<2:10:04, 7.61s/it, loss=0.0005, acc=0.9987, iter_time=7.61s]
Epoch 0: 92%|█████████▏| 11359/12384 [24:06:18<2:10:04, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=7.99s]
Epoch 0: 92%|█████████▏| 11360/12384 [24:06:18<2:09:59, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=7.99s]
Epoch 0: 92%|█████████▏| 11360/12384 [24:06:26<2:09:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 92%|█████████▏| 11361/12384 [24:06:26<2:09:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 92%|█████████▏| 11361/12384 [24:06:33<2:09:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.25s]
Epoch 0: 92%|█████████▏| 11362/12384 [24:06:33<2:09:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.25s]
Epoch 0: 92%|█████████▏| 11362/12384 [24:06:41<2:09:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.01s]
Epoch 0: 92%|█████████▏| 11363/12384 [24:06:41<2:09:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.01s]
Epoch 0: 92%|█████████▏| 11363/12384 [24:06:48<2:09:34, 7.61s/it, loss=0.0004, acc=0.9981, iter_time=7.58s]
Epoch 0: 92%|█████████▏| 11364/12384 [24:06:48<2:09:15, 7.60s/it, loss=0.0004, acc=0.9981, iter_time=7.58s]
Epoch 0: 92%|█████████▏| 11364/12384 [24:06:56<2:09:15, 7.60s/it, loss=0.0003, acc=0.9992, iter_time=7.64s]
Epoch 0: 92%|█████████▏| 11365/12384 [24:06:56<2:10:46, 7.70s/it, loss=0.0003, acc=0.9992, iter_time=7.64s]
Epoch 0: 92%|█████████▏| 11365/12384 [24:07:04<2:10:46, 7.70s/it, loss=0.0007, acc=0.9975, iter_time=8.18s]
Epoch 0: 92%|█████████▏| 11366/12384 [24:07:04<2:11:41, 7.76s/it, loss=0.0007, acc=0.9975, iter_time=8.18s]
Epoch 0: 92%|█████████▏| 11366/12384 [24:07:12<2:11:41, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 0: 92%|█████████▏| 11367/12384 [24:07:12<2:10:49, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 0: 92%|█████████▏| 11367/12384 [24:07:20<2:10:49, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.44s]
Epoch 0: 92%|█████████▏| 11368/12384 [24:07:20<2:10:06, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.44s]
Epoch 0: 92%|█████████▏| 11368/12384 [24:07:27<2:10:06, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 92%|█████████▏| 11369/12384 [24:07:27<2:09:39, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 92%|█████████▏| 11369/12384 [24:07:35<2:09:39, 7.66s/it, loss=0.0008, acc=0.9978, iter_time=7.62s]
Epoch 0: 92%|█████████▏| 11370/12384 [24:07:35<2:09:08, 7.64s/it, loss=0.0008, acc=0.9978, iter_time=7.62s]
Epoch 0: 92%|█████████▏| 11370/12384 [24:07:42<2:09:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 92%|█████████▏| 11371/12384 [24:07:42<2:08:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 92%|█████████▏| 11371/12384 [24:07:50<2:08:41, 7.62s/it, loss=0.0004, acc=0.9986, iter_time=7.60s]
Epoch 0: 92%|█████████▏| 11372/12384 [24:07:50<2:08:28, 7.62s/it, loss=0.0004, acc=0.9986, iter_time=7.60s]
Epoch 0: 92%|█████████▏| 11372/12384 [24:07:58<2:08:28, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.69s]
Epoch 0: 92%|█████████▏| 11373/12384 [24:07:58<2:08:46, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.69s]
Epoch 0: 92%|█████████▏| 11373/12384 [24:08:05<2:08:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 92%|█████████▏| 11374/12384 [24:08:05<2:08:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 92%|█████████▏| 11374/12384 [24:08:13<2:08:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 92%|█████████▏| 11375/12384 [24:08:13<2:08:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 92%|█████████▏| 11375/12384 [24:08:20<2:08:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 0: 92%|█████████▏| 11376/12384 [24:08:20<2:07:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 0: 92%|█████████▏| 11376/12384 [24:08:28<2:07:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 92%|█████████▏| 11377/12384 [24:08:28<2:07:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 92%|█████████▏| 11377/12384 [24:08:36<2:07:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 92%|█████████▏| 11378/12384 [24:08:36<2:07:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 92%|█████████▏| 11378/12384 [24:08:43<2:07:35, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.61s]
Epoch 0: 92%|█████████▏| 11379/12384 [24:08:43<2:07:31, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.61s]
Epoch 0: 92%|█████████▏| 11379/12384 [24:08:51<2:07:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 92%|█████████▏| 11380/12384 [24:08:51<2:07:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 92%|█████████▏| 11380/12384 [24:08:58<2:07:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 0: 92%|█████████▏| 11381/12384 [24:08:58<2:07:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 0: 92%|█████████▏| 11381/12384 [24:09:06<2:07:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.11s]
Epoch 0: 92%|█████████▏| 11382/12384 [24:09:06<2:07:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.11s]
Epoch 0: 92%|█████████▏| 11382/12384 [24:09:14<2:07:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 0: 92%|█████████▏| 11383/12384 [24:09:14<2:08:06, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 0: 92%|█████████▏| 11383/12384 [24:09:22<2:08:06, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 92%|█████████▏| 11384/12384 [24:09:22<2:07:41, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 92%|█████████▏| 11384/12384 [24:09:29<2:07:41, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 92%|█████████▏| 11385/12384 [24:09:29<2:07:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 92%|█████████▏| 11385/12384 [24:09:37<2:07:19, 7.65s/it, loss=0.0006, acc=0.9986, iter_time=7.63s]
Epoch 0: 92%|█████████▏| 11386/12384 [24:09:37<2:07:00, 7.64s/it, loss=0.0006, acc=0.9986, iter_time=7.63s]
Epoch 0: 92%|█████████▏| 11386/12384 [24:09:44<2:07:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 0: 92%|█████████▏| 11387/12384 [24:09:44<2:06:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 0: 92%|█████████▏| 11387/12384 [24:09:52<2:06:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 0: 92%|█████████▏| 11388/12384 [24:09:52<2:06:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 0: 92%|█████████▏| 11388/12384 [24:10:00<2:06:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 92%|█████████▏| 11389/12384 [24:10:00<2:06:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 92%|█████████▏| 11389/12384 [24:10:07<2:06:14, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 92%|█████████▏| 11390/12384 [24:10:07<2:06:07, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 92%|█████████▏| 11390/12384 [24:10:15<2:06:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 0: 92%|█████████▏| 11391/12384 [24:10:15<2:07:38, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 0: 92%|█████████▏| 11391/12384 [24:10:23<2:07:38, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 0: 92%|█████████▏| 11392/12384 [24:10:23<2:06:53, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 0: 92%|█████████▏| 11392/12384 [24:10:31<2:06:53, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.49s]
Epoch 0: 92%|█████████▏| 11393/12384 [24:10:31<2:07:45, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.49s]
Epoch 0: 92%|█████████▏| 11393/12384 [24:10:38<2:07:45, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 0: 92%|█████████▏| 11394/12384 [24:10:38<2:06:58, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 0: 92%|█████████▏| 11394/12384 [24:10:46<2:06:58, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.11s]
Epoch 0: 92%|█████████▏| 11395/12384 [24:10:46<2:06:23, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.11s]
Epoch 0: 92%|█████████▏| 11395/12384 [24:10:53<2:06:23, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 0: 92%|█████████▏| 11396/12384 [24:10:53<2:06:04, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 0: 92%|█████████▏| 11396/12384 [24:11:01<2:06:04, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.25s]
Epoch 0: 92%|█████████▏| 11397/12384 [24:11:01<2:05:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.25s]
Epoch 0: 92%|█████████▏| 11397/12384 [24:11:09<2:05:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 92%|█████████▏| 11398/12384 [24:11:09<2:05:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 92%|█████████▏| 11398/12384 [24:11:16<2:05:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 92%|█████████▏| 11399/12384 [24:11:16<2:05:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 92%|█████████▏| 11399/12384 [24:11:24<2:05:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 92%|█████████▏| 11400/12384 [24:11:24<2:04:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 92%|█████████▏| 11400/12384 [24:11:31<2:04:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 92%|█████████▏| 11401/12384 [24:11:31<2:04:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 92%|█████████▏| 11401/12384 [24:11:39<2:04:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 92%|█████████▏| 11402/12384 [24:11:39<2:04:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 92%|█████████▏| 11402/12384 [24:11:47<2:04:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 92%|█████████▏| 11403/12384 [24:11:47<2:04:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 92%|█████████▏| 11403/12384 [24:11:54<2:04:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 0: 92%|█████████▏| 11404/12384 [24:11:54<2:04:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 0: 92%|█████████▏| 11404/12384 [24:12:02<2:04:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.86s]
Epoch 0: 92%|█████████▏| 11405/12384 [24:12:02<2:04:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.86s]
Epoch 0: 92%|█████████▏| 11405/12384 [24:12:10<2:04:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 0: 92%|█████████▏| 11406/12384 [24:12:10<2:04:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 0: 92%|█████████▏| 11406/12384 [24:12:17<2:04:14, 7.62s/it, loss=0.0005, acc=0.9975, iter_time=7.59s]
Epoch 0: 92%|█████████▏| 11407/12384 [24:12:17<2:04:00, 7.62s/it, loss=0.0005, acc=0.9975, iter_time=7.59s]
Epoch 0: 92%|█████████▏| 11407/12384 [24:12:25<2:04:00, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 0: 92%|█████████▏| 11408/12384 [24:12:25<2:03:48, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 0: 92%|█████████▏| 11408/12384 [24:12:32<2:03:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.42s]
Epoch 0: 92%|█████████▏| 11409/12384 [24:12:32<2:03:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.42s]
Epoch 0: 92%|█████████▏| 11409/12384 [24:12:40<2:03:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 0: 92%|█████████▏| 11410/12384 [24:12:40<2:03:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 0: 92%|█████████▏| 11410/12384 [24:12:48<2:03:29, 7.61s/it, loss=0.0014, acc=0.9988, iter_time=7.43s]
Epoch 0: 92%|█████████▏| 11411/12384 [24:12:48<2:03:26, 7.61s/it, loss=0.0014, acc=0.9988, iter_time=7.43s]
Epoch 0: 92%|█████████▏| 11411/12384 [24:12:55<2:03:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.45s]
Epoch 0: 92%|█████████▏| 11412/12384 [24:12:55<2:03:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.45s]
Epoch 0: 92%|█████████▏| 11412/12384 [24:13:03<2:03:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.16s]
Epoch 0: 92%|█████████▏| 11413/12384 [24:13:03<2:03:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.16s]
Epoch 0: 92%|█████████▏| 11413/12384 [24:13:10<2:03:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 0: 92%|█████████▏| 11414/12384 [24:13:10<2:02:46, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 0: 92%|█████████▏| 11414/12384 [24:13:18<2:02:46, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 0: 92%|█████████▏| 11415/12384 [24:13:18<2:02:46, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 0: 92%|█████████▏| 11415/12384 [24:13:26<2:02:46, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 0: 92%|█████████▏| 11416/12384 [24:13:26<2:02:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 0: 92%|█████████▏| 11416/12384 [24:13:34<2:02:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.55s]
Epoch 0: 92%|█████████▏| 11417/12384 [24:13:34<2:04:38, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=4.55s]
Epoch 0: 92%|█████████▏| 11417/12384 [24:13:41<2:04:38, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=11.15s]
Epoch 0: 92%|█████████▏| 11418/12384 [24:13:41<2:04:02, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=11.15s]
Epoch 0: 92%|█████████▏| 11418/12384 [24:13:49<2:04:02, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.95s]
Epoch 0: 92%|█████████▏| 11419/12384 [24:13:49<2:03:20, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.95s]
Epoch 0: 92%|█████████▏| 11419/12384 [24:13:57<2:03:20, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 0: 92%|█████████▏| 11420/12384 [24:13:57<2:02:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 0: 92%|█████████▏| 11420/12384 [24:14:04<2:02:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 0: 92%|█████████▏| 11421/12384 [24:14:04<2:02:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 0: 92%|█████████▏| 11421/12384 [24:14:12<2:02:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.43s]
Epoch 0: 92%|█████████▏| 11422/12384 [24:14:12<2:02:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.43s]
Epoch 0: 92%|█████████▏| 11422/12384 [24:14:19<2:02:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 92%|█████████▏| 11423/12384 [24:14:19<2:02:39, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 92%|█████████▏| 11423/12384 [24:14:27<2:02:39, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 92%|█████████▏| 11424/12384 [24:14:27<2:02:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 92%|█████████▏| 11424/12384 [24:14:34<2:02:29, 7.66s/it, loss=0.0006, acc=0.9977, iter_time=4.75s]
Epoch 0: 92%|█████████▏| 11425/12384 [24:14:34<1:58:47, 7.43s/it, loss=0.0006, acc=0.9977, iter_time=4.75s]
Epoch 0: 92%|█████████▏| 11425/12384 [24:14:42<1:58:47, 7.43s/it, loss=0.0008, acc=0.9989, iter_time=8.96s]
Epoch 0: 92%|█████████▏| 11426/12384 [24:14:42<1:59:23, 7.48s/it, loss=0.0008, acc=0.9989, iter_time=8.96s]
Epoch 0: 92%|█████████▏| 11426/12384 [24:14:49<1:59:23, 7.48s/it, loss=0.0000, acc=1.0000, iter_time=8.46s]
Epoch 0: 92%|█████████▏| 11427/12384 [24:14:49<2:00:27, 7.55s/it, loss=0.0000, acc=1.0000, iter_time=8.46s]
Epoch 0: 92%|█████████▏| 11427/12384 [24:14:57<2:00:27, 7.55s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 0: 92%|█████████▏| 11428/12384 [24:14:57<2:00:39, 7.57s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 0: 92%|█████████▏| 11428/12384 [24:15:05<2:00:39, 7.57s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 92%|█████████▏| 11429/12384 [24:15:05<2:00:44, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 92%|█████████▏| 11429/12384 [24:15:12<2:00:44, 7.59s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 92%|█████████▏| 11430/12384 [24:15:12<2:00:43, 7.59s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 92%|█████████▏| 11430/12384 [24:15:20<2:00:43, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 92%|█████████▏| 11431/12384 [24:15:20<2:00:39, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 92%|█████████▏| 11431/12384 [24:15:27<2:00:39, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 0: 92%|█████████▏| 11432/12384 [24:15:27<2:00:37, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 0: 92%|█████████▏| 11432/12384 [24:15:35<2:00:37, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 0: 92%|█████████▏| 11433/12384 [24:15:35<2:00:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 0: 92%|█████████▏| 11433/12384 [24:15:43<2:00:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 92%|█████████▏| 11434/12384 [24:15:43<2:00:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 92%|█████████▏| 11434/12384 [24:15:50<2:00:41, 7.62s/it, loss=0.0005, acc=0.9980, iter_time=7.61s]
Epoch 0: 92%|█████████▏| 11435/12384 [24:15:50<2:00:24, 7.61s/it, loss=0.0005, acc=0.9980, iter_time=7.61s]
Epoch 0: 92%|█████████▏| 11435/12384 [24:15:58<2:00:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 92%|█████████▏| 11436/12384 [24:15:58<2:00:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 92%|█████████▏| 11436/12384 [24:16:06<2:00:21, 7.62s/it, loss=0.0001, acc=0.9990, iter_time=7.64s]
Epoch 0: 92%|█████████▏| 11437/12384 [24:16:06<2:00:08, 7.61s/it, loss=0.0001, acc=0.9990, iter_time=7.64s]
Epoch 0: 92%|█████████▏| 11437/12384 [24:16:13<2:00:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 92%|█████████▏| 11438/12384 [24:16:13<1:59:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 92%|█████████▏| 11438/12384 [24:16:21<1:59:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 92%|█████████▏| 11439/12384 [24:16:21<1:59:46, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 92%|█████████▏| 11439/12384 [24:16:28<1:59:46, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 92%|█████████▏| 11440/12384 [24:16:28<1:59:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 92%|█████████▏| 11440/12384 [24:16:36<1:59:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 92%|█████████▏| 11441/12384 [24:16:36<1:59:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 92%|█████████▏| 11441/12384 [24:16:44<1:59:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 92%|█████████▏| 11442/12384 [24:16:44<1:59:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 92%|█████████▏| 11442/12384 [24:16:52<1:59:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.38s]
Epoch 0: 92%|█████████▏| 11443/12384 [24:16:52<2:00:58, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.38s]
Epoch 0: 92%|█████████▏| 11443/12384 [24:16:59<2:00:58, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.54s]
Epoch 0: 92%|█████████▏| 11444/12384 [24:16:59<2:00:18, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.54s]
Epoch 0: 92%|█████████▏| 11444/12384 [24:17:07<2:00:18, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 0: 92%|█████████▏| 11445/12384 [24:17:07<1:59:56, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 0: 92%|█████████▏| 11445/12384 [24:17:14<1:59:56, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 92%|█████████▏| 11446/12384 [24:17:14<1:59:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 92%|█████████▏| 11446/12384 [24:17:22<1:59:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 92%|█████████▏| 11447/12384 [24:17:22<1:59:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 92%|█████████▏| 11447/12384 [24:17:30<1:59:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 92%|█████████▏| 11448/12384 [24:17:30<1:59:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 92%|█████████▏| 11448/12384 [24:17:37<1:59:01, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.20s]
Epoch 0: 92%|█████████▏| 11449/12384 [24:17:37<1:58:43, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=7.20s]
Epoch 0: 92%|█████████▏| 11449/12384 [24:17:45<1:58:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 92%|█████████▏| 11450/12384 [24:17:45<1:58:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 92%|█████████▏| 11450/12384 [24:17:52<1:58:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 92%|█████████▏| 11451/12384 [24:17:52<1:58:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 92%|█████████▏| 11451/12384 [24:18:00<1:58:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 92%|█████████▏| 11452/12384 [24:18:00<1:58:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 92%|█████████▏| 11452/12384 [24:18:08<1:58:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 92%|█████████▏| 11453/12384 [24:18:08<1:58:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 92%|█████████▏| 11453/12384 [24:18:15<1:58:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 92%|█████████▏| 11454/12384 [24:18:15<1:57:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 92%|█████████▏| 11454/12384 [24:18:23<1:57:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.85s]
Epoch 0: 92%|█████████▏| 11455/12384 [24:18:23<1:57:40, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=3.85s]
Epoch 0: 92%|█████████▏| 11455/12384 [24:18:30<1:57:40, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.29s]
Epoch 0: 93%|█████████▎| 11456/12384 [24:18:30<1:57:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.29s]
Epoch 0: 93%|█████████▎| 11456/12384 [24:18:38<1:57:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 93%|█████████▎| 11457/12384 [24:18:38<1:57:29, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 93%|█████████▎| 11457/12384 [24:18:46<1:57:29, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 93%|█████████▎| 11458/12384 [24:18:46<1:57:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 93%|█████████▎| 11458/12384 [24:18:53<1:57:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 93%|█████████▎| 11459/12384 [24:18:53<1:57:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 93%|█████████▎| 11459/12384 [24:19:01<1:57:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 0: 93%|█████████▎| 11460/12384 [24:19:01<1:57:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 0: 93%|█████████▎| 11460/12384 [24:19:09<1:57:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.32s]
Epoch 0: 93%|█████████▎| 11461/12384 [24:19:09<1:57:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.32s]
Epoch 0: 93%|█████████▎| 11461/12384 [24:19:16<1:57:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.33s]
Epoch 0: 93%|█████████▎| 11462/12384 [24:19:16<1:57:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.33s]
Epoch 0: 93%|█████████▎| 11462/12384 [24:19:24<1:57:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 0: 93%|█████████▎| 11463/12384 [24:19:24<1:56:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 0: 93%|█████████▎| 11463/12384 [24:19:31<1:56:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 93%|█████████▎| 11464/12384 [24:19:31<1:56:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 93%|█████████▎| 11464/12384 [24:19:39<1:56:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 93%|█████████▎| 11465/12384 [24:19:39<1:56:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 93%|█████████▎| 11465/12384 [24:19:47<1:56:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 0: 93%|█████████▎| 11466/12384 [24:19:47<1:56:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 0: 93%|█████████▎| 11466/12384 [24:19:54<1:56:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 0: 93%|█████████▎| 11467/12384 [24:19:54<1:56:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 0: 93%|█████████▎| 11467/12384 [24:20:02<1:56:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.59s]
Epoch 0: 93%|█████████▎| 11468/12384 [24:20:02<1:56:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.59s]
Epoch 0: 93%|█████████▎| 11468/12384 [24:20:10<1:56:40, 7.64s/it, loss=0.0003, acc=0.9998, iter_time=11.08s]
Epoch 0: 93%|█████████▎| 11469/12384 [24:20:10<1:58:19, 7.76s/it, loss=0.0003, acc=0.9998, iter_time=11.08s]
Epoch 0: 93%|█████████▎| 11469/12384 [24:20:18<1:58:19, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 93%|█████████▎| 11470/12384 [24:20:18<1:57:32, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 93%|█████████▎| 11470/12384 [24:20:25<1:57:32, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 0: 93%|█████████▎| 11471/12384 [24:20:25<1:56:49, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 0: 93%|█████████▎| 11471/12384 [24:20:33<1:56:49, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 0: 93%|█████████▎| 11472/12384 [24:20:33<1:56:25, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 0: 93%|█████████▎| 11472/12384 [24:20:40<1:56:25, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 93%|█████████▎| 11473/12384 [24:20:40<1:56:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 93%|█████████▎| 11473/12384 [24:20:48<1:56:01, 7.64s/it, loss=0.0002, acc=0.9994, iter_time=5.52s]
Epoch 0: 93%|█████████▎| 11474/12384 [24:20:48<1:55:46, 7.63s/it, loss=0.0002, acc=0.9994, iter_time=5.52s]
Epoch 0: 93%|█████████▎| 11474/12384 [24:20:56<1:55:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 0: 93%|█████████▎| 11475/12384 [24:20:56<1:55:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 0: 93%|█████████▎| 11475/12384 [24:21:03<1:55:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.63s]
Epoch 0: 93%|█████████▎| 11476/12384 [24:21:03<1:55:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.63s]
Epoch 0: 93%|█████████▎| 11476/12384 [24:21:11<1:55:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 0: 93%|█████████▎| 11477/12384 [24:21:11<1:55:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 0: 93%|█████████▎| 11477/12384 [24:21:18<1:55:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 0: 93%|█████████▎| 11478/12384 [24:21:18<1:54:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 0: 93%|█████████▎| 11478/12384 [24:21:26<1:54:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 93%|█████████▎| 11479/12384 [24:21:26<1:54:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 93%|█████████▎| 11479/12384 [24:21:34<1:54:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.91s]
Epoch 0: 93%|█████████▎| 11480/12384 [24:21:34<1:54:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.91s]
Epoch 0: 93%|█████████▎| 11480/12384 [24:21:41<1:54:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 93%|█████████▎| 11481/12384 [24:21:41<1:54:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 93%|█████████▎| 11481/12384 [24:21:49<1:54:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 0: 93%|█████████▎| 11482/12384 [24:21:49<1:54:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 0: 93%|█████████▎| 11482/12384 [24:21:56<1:54:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 0: 93%|█████████▎| 11483/12384 [24:21:56<1:54:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 0: 93%|█████████▎| 11483/12384 [24:22:04<1:54:14, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.13s]
Epoch 0: 93%|█████████▎| 11484/12384 [24:22:04<1:54:13, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.13s]
Epoch 0: 93%|█████████▎| 11484/12384 [24:22:12<1:54:13, 7.61s/it, loss=0.0003, acc=0.9982, iter_time=10.21s]
Epoch 0: 93%|█████████▎| 11485/12384 [24:22:12<1:54:03, 7.61s/it, loss=0.0003, acc=0.9982, iter_time=10.21s]
Epoch 0: 93%|█████████▎| 11485/12384 [24:22:19<1:54:03, 7.61s/it, loss=0.0003, acc=0.9980, iter_time=7.61s]
Epoch 0: 93%|█████████▎| 11486/12384 [24:22:19<1:53:52, 7.61s/it, loss=0.0003, acc=0.9980, iter_time=7.61s]
Epoch 0: 93%|█████████▎| 11486/12384 [24:22:27<1:53:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 93%|█████████▎| 11487/12384 [24:22:27<1:53:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 93%|█████████▎| 11487/12384 [24:22:34<1:53:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 93%|█████████▎| 11488/12384 [24:22:34<1:53:29, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 93%|█████████▎| 11488/12384 [24:22:42<1:53:29, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.19s]
Epoch 0: 93%|█████████▎| 11489/12384 [24:22:42<1:53:24, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.19s]
Epoch 0: 93%|█████████▎| 11489/12384 [24:22:50<1:53:24, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=8.63s]
Epoch 0: 93%|█████████▎| 11490/12384 [24:22:50<1:53:11, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=8.63s]
Epoch 0: 93%|█████████▎| 11490/12384 [24:22:57<1:53:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 0: 93%|█████████▎| 11491/12384 [24:22:57<1:53:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 0: 93%|█████████▎| 11491/12384 [24:23:05<1:53:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 0: 93%|█████████▎| 11492/12384 [24:23:05<1:53:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 0: 93%|█████████▎| 11492/12384 [24:23:13<1:53:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.32s]
Epoch 0: 93%|█████████▎| 11493/12384 [24:23:13<1:53:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.32s]
Epoch 0: 93%|█████████▎| 11493/12384 [24:23:20<1:53:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 0: 93%|█████████▎| 11494/12384 [24:23:20<1:52:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 0: 93%|█████████▎| 11494/12384 [24:23:28<1:52:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 93%|█████████▎| 11495/12384 [24:23:28<1:52:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 93%|█████████▎| 11495/12384 [24:23:36<1:52:41, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=8.06s]
Epoch 0: 93%|█████████▎| 11496/12384 [24:23:36<1:53:52, 7.69s/it, loss=0.0003, acc=1.0000, iter_time=8.06s]
Epoch 0: 93%|█████████▎| 11496/12384 [24:23:43<1:53:52, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.39s]
Epoch 0: 93%|█████████▎| 11497/12384 [24:23:43<1:53:22, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.39s]
Epoch 0: 93%|█████████▎| 11497/12384 [24:23:51<1:53:22, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 0: 93%|█████████▎| 11498/12384 [24:23:51<1:52:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 0: 93%|█████████▎| 11498/12384 [24:23:58<1:52:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 93%|█████████▎| 11499/12384 [24:23:58<1:52:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 93%|█████████▎| 11499/12384 [24:24:06<1:52:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 93%|█████████▎| 11500/12384 [24:24:06<1:53:11, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 93%|█████████▎| 11500/12384 [24:24:14<1:53:11, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.06s]
Epoch 0: 93%|█████████▎| 11501/12384 [24:24:14<1:52:40, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.06s]
Epoch 0: 93%|█████████▎| 11501/12384 [24:24:21<1:52:40, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.96s]
Epoch 0: 93%|█████████▎| 11502/12384 [24:24:21<1:52:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.96s]
Epoch 0: 93%|█████████▎| 11502/12384 [24:24:29<1:52:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 93%|█████████▎| 11503/12384 [24:24:29<1:52:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 93%|█████████▎| 11503/12384 [24:24:37<1:52:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 93%|█████████▎| 11504/12384 [24:24:37<1:51:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 93%|█████████▎| 11504/12384 [24:24:44<1:51:57, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 93%|█████████▎| 11505/12384 [24:24:44<1:51:45, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 93%|█████████▎| 11505/12384 [24:24:52<1:51:45, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.62s]
Epoch 0: 93%|█████████▎| 11506/12384 [24:24:52<1:51:32, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=7.62s]
Epoch 0: 93%|█████████▎| 11506/12384 [24:25:00<1:51:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 93%|█████████▎| 11507/12384 [24:25:00<1:51:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 93%|█████████▎| 11507/12384 [24:25:07<1:51:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 93%|█████████▎| 11508/12384 [24:25:07<1:51:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 93%|█████████▎| 11508/12384 [24:25:15<1:51:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 0: 93%|█████████▎| 11509/12384 [24:25:15<1:50:53, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 0: 93%|█████████▎| 11509/12384 [24:25:22<1:50:53, 7.60s/it, loss=0.0001, acc=0.9999, iter_time=5.64s]
Epoch 0: 93%|█████████▎| 11510/12384 [24:25:22<1:50:45, 7.60s/it, loss=0.0001, acc=0.9999, iter_time=5.64s]
Epoch 0: 93%|█████████▎| 11510/12384 [24:25:30<1:50:45, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 0: 93%|█████████▎| 11511/12384 [24:25:30<1:50:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 0: 93%|█████████▎| 11511/12384 [24:25:38<1:50:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.86s]
Epoch 0: 93%|█████████▎| 11512/12384 [24:25:38<1:50:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.86s]
Epoch 0: 93%|█████████▎| 11512/12384 [24:25:45<1:50:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.86s]
Epoch 0: 93%|█████████▎| 11513/12384 [24:25:45<1:50:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.86s]
Epoch 0: 93%|█████████▎| 11513/12384 [24:25:53<1:50:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 0: 93%|█████████▎| 11514/12384 [24:25:53<1:50:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 0: 93%|█████████▎| 11514/12384 [24:26:00<1:50:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 0: 93%|█████████▎| 11515/12384 [24:26:00<1:50:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 0: 93%|█████████▎| 11515/12384 [24:26:08<1:50:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 0: 93%|█████████▎| 11516/12384 [24:26:08<1:50:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 0: 93%|█████████▎| 11516/12384 [24:26:16<1:50:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 0: 93%|█████████▎| 11517/12384 [24:26:16<1:49:50, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 0: 93%|█████████▎| 11517/12384 [24:26:23<1:49:50, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 93%|█████████▎| 11518/12384 [24:26:23<1:49:43, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 93%|█████████▎| 11518/12384 [24:26:31<1:49:43, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 93%|█████████▎| 11519/12384 [24:26:31<1:49:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 93%|█████████▎| 11519/12384 [24:26:38<1:49:44, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.72s]
Epoch 0: 93%|█████████▎| 11520/12384 [24:26:38<1:49:29, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.72s]
Epoch 0: 93%|█████████▎| 11520/12384 [24:26:46<1:49:29, 7.60s/it, loss=0.0027, acc=0.9897, iter_time=7.48s]
Epoch 0: 93%|█████████▎| 11521/12384 [24:26:46<1:49:29, 7.61s/it, loss=0.0027, acc=0.9897, iter_time=7.48s]
Epoch 0: 93%|█████████▎| 11521/12384 [24:26:54<1:49:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 93%|█████████▎| 11522/12384 [24:26:54<1:50:46, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 93%|█████████▎| 11522/12384 [24:27:02<1:50:46, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.36s]
Epoch 0: 93%|█████████▎| 11523/12384 [24:27:02<1:50:08, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.36s]
Epoch 0: 93%|█████████▎| 11523/12384 [24:27:09<1:50:08, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 0: 93%|█████████▎| 11524/12384 [24:27:09<1:50:00, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 0: 93%|█████████▎| 11524/12384 [24:27:17<1:50:00, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 0: 93%|█████████▎| 11525/12384 [24:27:17<1:49:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 0: 93%|█████████▎| 11525/12384 [24:27:24<1:49:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 93%|█████████▎| 11526/12384 [24:27:24<1:49:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 93%|█████████▎| 11526/12384 [24:27:32<1:49:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 0: 93%|█████████▎| 11527/12384 [24:27:32<1:48:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 0: 93%|█████████▎| 11527/12384 [24:27:40<1:48:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 0: 93%|█████████▎| 11528/12384 [24:27:40<1:48:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 0: 93%|█████████▎| 11528/12384 [24:27:47<1:48:47, 7.63s/it, loss=0.0004, acc=0.9993, iter_time=7.65s]
Epoch 0: 93%|█████████▎| 11529/12384 [24:27:47<1:48:31, 7.62s/it, loss=0.0004, acc=0.9993, iter_time=7.65s]
Epoch 0: 93%|█████████▎| 11529/12384 [24:27:55<1:48:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 93%|█████████▎| 11530/12384 [24:27:55<1:48:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 93%|█████████▎| 11530/12384 [24:28:02<1:48:26, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.52s]
Epoch 0: 93%|█████████▎| 11531/12384 [24:28:02<1:48:12, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.52s]
Epoch 0: 93%|█████████▎| 11531/12384 [24:28:10<1:48:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 0: 93%|█████████▎| 11532/12384 [24:28:10<1:48:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 0: 93%|█████████▎| 11532/12384 [24:28:18<1:48:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 93%|█████████▎| 11533/12384 [24:28:18<1:48:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 93%|█████████▎| 11533/12384 [24:28:25<1:48:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 93%|█████████▎| 11534/12384 [24:28:25<1:47:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 93%|█████████▎| 11534/12384 [24:28:33<1:47:55, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=7.63s]
Epoch 0: 93%|█████████▎| 11535/12384 [24:28:33<1:47:47, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=7.63s]
Epoch 0: 93%|█████████▎| 11535/12384 [24:28:41<1:47:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 93%|█████████▎| 11536/12384 [24:28:41<1:47:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 93%|█████████▎| 11536/12384 [24:28:48<1:47:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 0: 93%|█████████▎| 11537/12384 [24:28:48<1:47:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 0: 93%|█████████▎| 11537/12384 [24:28:56<1:47:29, 7.61s/it, loss=0.0003, acc=0.9982, iter_time=6.13s]
Epoch 0: 93%|█████████▎| 11538/12384 [24:28:56<1:47:17, 7.61s/it, loss=0.0003, acc=0.9982, iter_time=6.13s]
Epoch 0: 93%|█████████▎| 11538/12384 [24:29:03<1:47:17, 7.61s/it, loss=0.0001, acc=0.9996, iter_time=9.07s]
Epoch 0: 93%|█████████▎| 11539/12384 [24:29:03<1:47:05, 7.60s/it, loss=0.0001, acc=0.9996, iter_time=9.07s]
Epoch 0: 93%|█████████▎| 11539/12384 [24:29:11<1:47:05, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 93%|█████████▎| 11540/12384 [24:29:11<1:46:58, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 93%|█████████▎| 11540/12384 [24:29:19<1:46:58, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 0: 93%|█████████▎| 11541/12384 [24:29:19<1:46:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 0: 93%|█████████▎| 11541/12384 [24:29:26<1:46:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 0: 93%|█████████▎| 11542/12384 [24:29:26<1:46:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 0: 93%|█████████▎| 11542/12384 [24:29:34<1:46:48, 7.61s/it, loss=0.0005, acc=0.9982, iter_time=9.69s]
Epoch 0: 93%|█████████▎| 11543/12384 [24:29:34<1:46:49, 7.62s/it, loss=0.0005, acc=0.9982, iter_time=9.69s]
Epoch 0: 93%|█████████▎| 11543/12384 [24:29:41<1:46:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 0: 93%|█████████▎| 11544/12384 [24:29:41<1:46:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 0: 93%|█████████▎| 11544/12384 [24:29:49<1:46:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 93%|█████████▎| 11545/12384 [24:29:49<1:46:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 93%|█████████▎| 11545/12384 [24:29:57<1:46:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 93%|█████████▎| 11546/12384 [24:29:57<1:46:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 93%|█████████▎| 11546/12384 [24:30:04<1:46:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.00s]
Epoch 0: 93%|█████████▎| 11547/12384 [24:30:04<1:46:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.00s]
Epoch 0: 93%|█████████▎| 11547/12384 [24:30:12<1:46:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 0: 93%|█████████▎| 11548/12384 [24:30:12<1:46:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 0: 93%|█████████▎| 11548/12384 [24:30:20<1:46:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 0: 93%|█████████▎| 11549/12384 [24:30:20<1:47:08, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 0: 93%|█████████▎| 11549/12384 [24:30:27<1:47:08, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.32s]
Epoch 0: 93%|█████████▎| 11550/12384 [24:30:27<1:46:38, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.32s]
Epoch 0: 93%|█████████▎| 11550/12384 [24:30:35<1:46:38, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 0: 93%|█████████▎| 11551/12384 [24:30:35<1:46:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 0: 93%|█████████▎| 11551/12384 [24:30:43<1:46:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 0: 93%|█████████▎| 11552/12384 [24:30:43<1:45:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 0: 93%|█████████▎| 11552/12384 [24:30:50<1:45:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 93%|█████████▎| 11553/12384 [24:30:50<1:45:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 93%|█████████▎| 11553/12384 [24:30:58<1:45:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 93%|█████████▎| 11554/12384 [24:30:58<1:45:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 93%|█████████▎| 11554/12384 [24:31:05<1:45:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 93%|█████████▎| 11555/12384 [24:31:05<1:45:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 93%|█████████▎| 11555/12384 [24:31:13<1:45:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 93%|█████████▎| 11556/12384 [24:31:13<1:45:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 93%|█████████▎| 11556/12384 [24:31:21<1:45:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 0: 93%|█████████▎| 11557/12384 [24:31:21<1:45:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 0: 93%|█████████▎| 11557/12384 [24:31:28<1:45:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.26s]
Epoch 0: 93%|█████████▎| 11558/12384 [24:31:28<1:44:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.26s]
Epoch 0: 93%|█████████▎| 11558/12384 [24:31:36<1:44:45, 7.61s/it, loss=0.0004, acc=0.9971, iter_time=6.41s]
Epoch 0: 93%|█████████▎| 11559/12384 [24:31:36<1:44:37, 7.61s/it, loss=0.0004, acc=0.9971, iter_time=6.41s]
Epoch 0: 93%|█████████▎| 11559/12384 [24:31:43<1:44:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.31s]
Epoch 0: 93%|█████████▎| 11560/12384 [24:31:43<1:44:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.31s]
Epoch 0: 93%|█████████▎| 11560/12384 [24:31:51<1:44:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 93%|█████████▎| 11561/12384 [24:31:51<1:44:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 93%|█████████▎| 11561/12384 [24:31:59<1:44:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 93%|█████████▎| 11562/12384 [24:31:59<1:44:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 93%|█████████▎| 11562/12384 [24:32:06<1:44:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.03s]
Epoch 0: 93%|█████████▎| 11563/12384 [24:32:06<1:44:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.03s]
Epoch 0: 93%|█████████▎| 11563/12384 [24:32:14<1:44:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.22s]
Epoch 0: 93%|█████████▎| 11564/12384 [24:32:14<1:44:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.22s]
Epoch 0: 93%|█████████▎| 11564/12384 [24:32:22<1:44:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 93%|█████████▎| 11565/12384 [24:32:22<1:43:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 93%|█████████▎| 11565/12384 [24:32:29<1:43:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 0: 93%|█████████▎| 11566/12384 [24:32:29<1:43:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 0: 93%|█████████▎| 11566/12384 [24:32:37<1:43:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.43s]
Epoch 0: 93%|█████████▎| 11567/12384 [24:32:37<1:43:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.43s]
Epoch 0: 93%|█████████▎| 11567/12384 [24:32:44<1:43:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.31s]
Epoch 0: 93%|█████████▎| 11568/12384 [24:32:44<1:43:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.31s]
Epoch 0: 93%|█████████▎| 11568/12384 [24:32:52<1:43:27, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 0: 93%|█████████▎| 11569/12384 [24:32:52<1:43:20, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 0: 93%|█████████▎| 11569/12384 [24:33:00<1:43:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 93%|█████████▎| 11570/12384 [24:33:00<1:43:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 93%|█████████▎| 11570/12384 [24:33:07<1:43:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 0: 93%|█████████▎| 11571/12384 [24:33:07<1:43:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 0: 93%|█████████▎| 11571/12384 [24:33:15<1:43:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 0: 93%|█████████▎| 11572/12384 [24:33:15<1:43:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 0: 93%|█████████▎| 11572/12384 [24:33:22<1:43:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 0: 93%|█████████▎| 11573/12384 [24:33:22<1:42:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 0: 93%|█████████▎| 11573/12384 [24:33:30<1:42:55, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.08s]
Epoch 0: 93%|█████████▎| 11574/12384 [24:33:30<1:42:48, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.08s]
Epoch 0: 93%|█████████▎| 11574/12384 [24:33:38<1:42:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 0: 93%|█████████▎| 11575/12384 [24:33:38<1:44:00, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 0: 93%|█████████▎| 11575/12384 [24:33:46<1:44:00, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 93%|█████████▎| 11576/12384 [24:33:46<1:43:38, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 93%|█████████▎| 11576/12384 [24:33:53<1:43:38, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 0: 93%|█████████▎| 11577/12384 [24:33:53<1:43:20, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 0: 93%|█████████▎| 11577/12384 [24:34:01<1:43:20, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 0: 93%|█████████▎| 11578/12384 [24:34:01<1:42:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 0: 93%|█████████▎| 11578/12384 [24:34:09<1:42:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 0: 93%|█████████▎| 11579/12384 [24:34:09<1:42:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 0: 93%|█████████▎| 11579/12384 [24:34:16<1:42:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.89s]
Epoch 0: 94%|█████████▎| 11580/12384 [24:34:16<1:42:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.89s]
Epoch 0: 94%|█████████▎| 11580/12384 [24:34:24<1:42:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.62s]
Epoch 0: 94%|█████████▎| 11581/12384 [24:34:24<1:42:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.62s]
Epoch 0: 94%|█████████▎| 11581/12384 [24:34:31<1:42:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 0: 94%|█████████▎| 11582/12384 [24:34:31<1:41:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 0: 94%|█████████▎| 11582/12384 [24:34:39<1:41:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.20s]
Epoch 0: 94%|█████████▎| 11583/12384 [24:34:39<1:41:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.20s]
Epoch 0: 94%|█████████▎| 11583/12384 [24:34:47<1:41:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 94%|█████████▎| 11584/12384 [24:34:47<1:41:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 94%|█████████▎| 11584/12384 [24:34:54<1:41:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 94%|█████████▎| 11585/12384 [24:34:54<1:41:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 94%|█████████▎| 11585/12384 [24:35:02<1:41:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 94%|█████████▎| 11586/12384 [24:35:02<1:41:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 94%|█████████▎| 11586/12384 [24:35:09<1:41:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 94%|█████████▎| 11587/12384 [24:35:09<1:40:57, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 94%|█████████▎| 11587/12384 [24:35:17<1:40:57, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 0: 94%|█████████▎| 11588/12384 [24:35:17<1:40:43, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 0: 94%|█████████▎| 11588/12384 [24:35:25<1:40:43, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=8.44s]
Epoch 0: 94%|█████████▎| 11589/12384 [24:35:25<1:40:41, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.44s]
Epoch 0: 94%|█████████▎| 11589/12384 [24:35:32<1:40:41, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 0: 94%|█████████▎| 11590/12384 [24:35:32<1:40:32, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 0: 94%|█████████▎| 11590/12384 [24:35:40<1:40:32, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 0: 94%|█████████▎| 11591/12384 [24:35:40<1:40:27, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 0: 94%|█████████▎| 11591/12384 [24:35:47<1:40:27, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 0: 94%|█████████▎| 11592/12384 [24:35:47<1:40:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 0: 94%|█████████▎| 11592/12384 [24:35:55<1:40:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.20s]
Epoch 0: 94%|█████████▎| 11593/12384 [24:35:55<1:40:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.20s]
Epoch 0: 94%|█████████▎| 11593/12384 [24:36:03<1:40:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.74s]
Epoch 0: 94%|█████████▎| 11594/12384 [24:36:03<1:40:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.74s]
Epoch 0: 94%|█████████▎| 11594/12384 [24:36:10<1:40:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 0: 94%|█████████▎| 11595/12384 [24:36:10<1:40:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 0: 94%|█████████▎| 11595/12384 [24:36:18<1:40:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 94%|█████████▎| 11596/12384 [24:36:18<1:40:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 94%|█████████▎| 11596/12384 [24:36:26<1:40:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 0: 94%|█████████▎| 11597/12384 [24:36:26<1:40:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 0: 94%|█████████▎| 11597/12384 [24:36:33<1:40:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 0: 94%|█████████▎| 11598/12384 [24:36:33<1:39:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 0: 94%|█████████▎| 11598/12384 [24:36:41<1:39:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 94%|█████████▎| 11599/12384 [24:36:41<1:39:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 94%|█████████▎| 11599/12384 [24:36:49<1:39:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 0: 94%|█████████▎| 11600/12384 [24:36:49<1:39:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 0: 94%|█████████▎| 11600/12384 [24:36:57<1:39:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 94%|█████████▎| 11601/12384 [24:36:57<1:41:03, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 94%|█████████▎| 11601/12384 [24:37:04<1:41:03, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 0: 94%|█████████▎| 11602/12384 [24:37:04<1:41:42, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 0: 94%|█████████▎| 11602/12384 [24:37:12<1:41:42, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 94%|█████████▎| 11603/12384 [24:37:12<1:40:57, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 94%|█████████▎| 11603/12384 [24:37:20<1:40:57, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=4.51s]
Epoch 0: 94%|█████████▎| 11604/12384 [24:37:20<1:40:15, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.51s]
Epoch 0: 94%|█████████▎| 11604/12384 [24:37:27<1:40:15, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.75s]
Epoch 0: 94%|█████████▎| 11605/12384 [24:37:27<1:39:45, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.75s]
Epoch 0: 94%|█████████▎| 11605/12384 [24:37:35<1:39:45, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 0: 94%|█████████▎| 11606/12384 [24:37:35<1:39:17, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 0: 94%|█████████▎| 11606/12384 [24:37:43<1:39:17, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.68s]
Epoch 0: 94%|█████████▎| 11607/12384 [24:37:43<1:38:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.68s]
Epoch 0: 94%|█████████▎| 11607/12384 [24:37:50<1:38:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.25s]
Epoch 0: 94%|█████████▎| 11608/12384 [24:37:50<1:38:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.25s]
Epoch 0: 94%|█████████▎| 11608/12384 [24:37:58<1:38:38, 7.63s/it, loss=0.0003, acc=0.9990, iter_time=5.11s]
Epoch 0: 94%|█████████▎| 11609/12384 [24:37:58<1:38:26, 7.62s/it, loss=0.0003, acc=0.9990, iter_time=5.11s]
Epoch 0: 94%|█████████▎| 11609/12384 [24:38:05<1:38:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 0: 94%|█████████▍| 11610/12384 [24:38:05<1:38:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 0: 94%|█████████▍| 11610/12384 [24:38:13<1:38:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 94%|█████████▍| 11611/12384 [24:38:13<1:38:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 94%|█████████▍| 11611/12384 [24:38:21<1:38:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 94%|█████████▍| 11612/12384 [24:38:21<1:37:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 94%|█████████▍| 11612/12384 [24:38:28<1:37:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 0: 94%|█████████▍| 11613/12384 [24:38:28<1:37:41, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 0: 94%|█████████▍| 11613/12384 [24:38:36<1:37:41, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.44s]
Epoch 0: 94%|█████████▍| 11614/12384 [24:38:36<1:37:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.44s]
Epoch 0: 94%|█████████▍| 11614/12384 [24:38:43<1:37:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 94%|█████████▍| 11615/12384 [24:38:43<1:37:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 94%|█████████▍| 11615/12384 [24:38:51<1:37:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 94%|█████████▍| 11616/12384 [24:38:51<1:37:17, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 94%|█████████▍| 11616/12384 [24:38:59<1:37:17, 7.60s/it, loss=0.0004, acc=0.9999, iter_time=7.27s]
Epoch 0: 94%|█████████▍| 11617/12384 [24:38:59<1:37:30, 7.63s/it, loss=0.0004, acc=0.9999, iter_time=7.27s]
Epoch 0: 94%|█████████▍| 11617/12384 [24:39:06<1:37:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.08s]
Epoch 0: 94%|█████████▍| 11618/12384 [24:39:06<1:37:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.08s]
Epoch 0: 94%|█████████▍| 11618/12384 [24:39:14<1:37:19, 7.62s/it, loss=0.0014, acc=0.9967, iter_time=8.16s]
Epoch 0: 94%|█████████▍| 11619/12384 [24:39:14<1:37:05, 7.61s/it, loss=0.0014, acc=0.9967, iter_time=8.16s]
Epoch 0: 94%|█████████▍| 11619/12384 [24:39:21<1:37:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 94%|█████████▍| 11620/12384 [24:39:21<1:37:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 94%|█████████▍| 11620/12384 [24:39:29<1:37:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 94%|█████████▍| 11621/12384 [24:39:29<1:37:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 94%|█████████▍| 11621/12384 [24:39:37<1:37:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 94%|█████████▍| 11622/12384 [24:39:37<1:36:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 94%|█████████▍| 11622/12384 [24:39:44<1:36:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 94%|█████████▍| 11623/12384 [24:39:44<1:36:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 94%|█████████▍| 11623/12384 [24:39:52<1:36:35, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.99s]
Epoch 0: 94%|█████████▍| 11624/12384 [24:39:52<1:36:43, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.99s]
Epoch 0: 94%|█████████▍| 11624/12384 [24:40:00<1:36:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 0: 94%|█████████▍| 11625/12384 [24:40:00<1:36:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 0: 94%|█████████▍| 11625/12384 [24:40:07<1:36:25, 7.62s/it, loss=0.0019, acc=0.9958, iter_time=8.78s]
Epoch 0: 94%|█████████▍| 11626/12384 [24:40:07<1:36:15, 7.62s/it, loss=0.0019, acc=0.9958, iter_time=8.78s]
Epoch 0: 94%|█████████▍| 11626/12384 [24:40:15<1:36:15, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.54s]
Epoch 0: 94%|█████████▍| 11627/12384 [24:40:15<1:37:22, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=4.54s]
Epoch 0: 94%|█████████▍| 11627/12384 [24:40:23<1:37:22, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.19s]
Epoch 0: 94%|█████████▍| 11628/12384 [24:40:23<1:36:42, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.19s]
Epoch 0: 94%|█████████▍| 11628/12384 [24:40:30<1:36:42, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 0: 94%|█████████▍| 11629/12384 [24:40:30<1:36:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 0: 94%|█████████▍| 11629/12384 [24:40:38<1:36:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 94%|█████████▍| 11630/12384 [24:40:38<1:36:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 94%|█████████▍| 11630/12384 [24:40:46<1:36:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 0: 94%|█████████▍| 11631/12384 [24:40:46<1:35:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 0: 94%|█████████▍| 11631/12384 [24:40:53<1:35:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 0: 94%|█████████▍| 11632/12384 [24:40:53<1:35:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 0: 94%|█████████▍| 11632/12384 [24:41:01<1:35:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 0: 94%|█████████▍| 11633/12384 [24:41:01<1:35:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 0: 94%|█████████▍| 11633/12384 [24:41:08<1:35:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.61s]
Epoch 0: 94%|█████████▍| 11634/12384 [24:41:08<1:35:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.61s]
Epoch 0: 94%|█████████▍| 11634/12384 [24:41:16<1:35:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 94%|█████████▍| 11635/12384 [24:41:16<1:35:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 94%|█████████▍| 11635/12384 [24:41:24<1:35:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 94%|█████████▍| 11636/12384 [24:41:24<1:34:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 94%|█████████▍| 11636/12384 [24:41:31<1:34:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 94%|█████████▍| 11637/12384 [24:41:31<1:34:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 94%|█████████▍| 11637/12384 [24:41:39<1:34:46, 7.61s/it, loss=0.0004, acc=1.0000, iter_time=7.35s]
Epoch 0: 94%|█████████▍| 11638/12384 [24:41:39<1:34:40, 7.62s/it, loss=0.0004, acc=1.0000, iter_time=7.35s]
Epoch 0: 94%|█████████▍| 11638/12384 [24:41:47<1:34:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 0: 94%|█████████▍| 11639/12384 [24:41:47<1:34:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 0: 94%|█████████▍| 11639/12384 [24:41:54<1:34:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 0: 94%|█████████▍| 11640/12384 [24:41:54<1:34:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 0: 94%|█████████▍| 11640/12384 [24:42:02<1:34:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.19s]
Epoch 0: 94%|█████████▍| 11641/12384 [24:42:02<1:34:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.19s]
Epoch 0: 94%|█████████▍| 11641/12384 [24:42:09<1:34:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 0: 94%|█████████▍| 11642/12384 [24:42:09<1:34:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 0: 94%|█████████▍| 11642/12384 [24:42:17<1:34:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 0: 94%|█████████▍| 11643/12384 [24:42:17<1:33:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 0: 94%|█████████▍| 11643/12384 [24:42:25<1:33:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 0: 94%|█████████▍| 11644/12384 [24:42:25<1:33:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 0: 94%|█████████▍| 11644/12384 [24:42:32<1:33:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 0: 94%|█████████▍| 11645/12384 [24:42:32<1:33:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 0: 94%|█████████▍| 11645/12384 [24:42:40<1:33:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 94%|█████████▍| 11646/12384 [24:42:40<1:33:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 94%|█████████▍| 11646/12384 [24:42:47<1:33:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 0: 94%|█████████▍| 11647/12384 [24:42:47<1:33:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 0: 94%|█████████▍| 11647/12384 [24:42:55<1:33:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 0: 94%|█████████▍| 11648/12384 [24:42:55<1:33:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 0: 94%|█████████▍| 11648/12384 [24:43:03<1:33:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 0: 94%|█████████▍| 11649/12384 [24:43:03<1:33:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 0: 94%|█████████▍| 11649/12384 [24:43:10<1:33:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.35s]
Epoch 0: 94%|█████████▍| 11650/12384 [24:43:10<1:33:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.35s]
Epoch 0: 94%|█████████▍| 11650/12384 [24:43:18<1:33:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.36s]
Epoch 0: 94%|█████████▍| 11651/12384 [24:43:18<1:33:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.36s]
Epoch 0: 94%|█████████▍| 11651/12384 [24:43:26<1:33:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 0: 94%|█████████▍| 11652/12384 [24:43:26<1:33:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 0: 94%|█████████▍| 11652/12384 [24:43:34<1:33:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.70s]
Epoch 0: 94%|█████████▍| 11653/12384 [24:43:34<1:34:02, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.70s]
Epoch 0: 94%|█████████▍| 11653/12384 [24:43:41<1:34:02, 7.72s/it, loss=0.0008, acc=0.9963, iter_time=10.43s]
Epoch 0: 94%|█████████▍| 11654/12384 [24:43:41<1:34:28, 7.77s/it, loss=0.0008, acc=0.9963, iter_time=10.43s]
Epoch 0: 94%|█████████▍| 11654/12384 [24:43:49<1:34:28, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 94%|█████████▍| 11655/12384 [24:43:49<1:33:45, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 94%|█████████▍| 11655/12384 [24:43:57<1:33:45, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 0: 94%|█████████▍| 11656/12384 [24:43:57<1:33:12, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 0: 94%|█████████▍| 11656/12384 [24:44:04<1:33:12, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 94%|█████████▍| 11657/12384 [24:44:04<1:32:49, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 94%|█████████▍| 11657/12384 [24:44:12<1:32:49, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 94%|█████████▍| 11658/12384 [24:44:12<1:32:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 94%|█████████▍| 11658/12384 [24:44:19<1:32:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 94%|█████████▍| 11659/12384 [24:44:19<1:32:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 94%|█████████▍| 11659/12384 [24:44:27<1:32:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 94%|█████████▍| 11660/12384 [24:44:27<1:31:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 94%|█████████▍| 11660/12384 [24:44:35<1:31:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 0: 94%|█████████▍| 11661/12384 [24:44:35<1:32:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 0: 94%|█████████▍| 11661/12384 [24:44:42<1:32:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.36s]
Epoch 0: 94%|█████████▍| 11662/12384 [24:44:42<1:31:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.36s]
Epoch 0: 94%|█████████▍| 11662/12384 [24:44:50<1:31:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 94%|█████████▍| 11663/12384 [24:44:50<1:31:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 94%|█████████▍| 11663/12384 [24:44:58<1:31:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 94%|█████████▍| 11664/12384 [24:44:58<1:31:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 94%|█████████▍| 11664/12384 [24:45:05<1:31:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 0: 94%|█████████▍| 11665/12384 [24:45:05<1:31:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 0: 94%|█████████▍| 11665/12384 [24:45:13<1:31:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 0: 94%|█████████▍| 11666/12384 [24:45:13<1:31:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 0: 94%|█████████▍| 11666/12384 [24:45:21<1:31:18, 7.63s/it, loss=0.0002, acc=0.9996, iter_time=7.63s]
Epoch 0: 94%|█████████▍| 11667/12384 [24:45:21<1:31:09, 7.63s/it, loss=0.0002, acc=0.9996, iter_time=7.63s]
Epoch 0: 94%|█████████▍| 11667/12384 [24:45:28<1:31:09, 7.63s/it, loss=0.0001, acc=0.9992, iter_time=7.61s]
Epoch 0: 94%|█████████▍| 11668/12384 [24:45:28<1:31:00, 7.63s/it, loss=0.0001, acc=0.9992, iter_time=7.61s]
Epoch 0: 94%|█████████▍| 11668/12384 [24:45:36<1:31:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 94%|█████████▍| 11669/12384 [24:45:36<1:30:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 94%|█████████▍| 11669/12384 [24:45:43<1:30:50, 7.62s/it, loss=0.0004, acc=0.9985, iter_time=7.62s]
Epoch 0: 94%|█████████▍| 11670/12384 [24:45:43<1:30:35, 7.61s/it, loss=0.0004, acc=0.9985, iter_time=7.62s]
Epoch 0: 94%|█████████▍| 11670/12384 [24:45:51<1:30:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 94%|█████████▍| 11671/12384 [24:45:51<1:30:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 94%|█████████▍| 11671/12384 [24:45:59<1:30:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 94%|█████████▍| 11672/12384 [24:45:59<1:30:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 94%|█████████▍| 11672/12384 [24:46:06<1:30:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.95s]
Epoch 0: 94%|█████████▍| 11673/12384 [24:46:06<1:30:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.95s]
Epoch 0: 94%|█████████▍| 11673/12384 [24:46:14<1:30:17, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.81s]
Epoch 0: 94%|█████████▍| 11674/12384 [24:46:14<1:30:04, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.81s]
Epoch 0: 94%|█████████▍| 11674/12384 [24:46:21<1:30:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.36s]
Epoch 0: 94%|█████████▍| 11675/12384 [24:46:21<1:29:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.36s]
Epoch 0: 94%|█████████▍| 11675/12384 [24:46:29<1:29:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 94%|█████████▍| 11676/12384 [24:46:29<1:29:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 94%|█████████▍| 11676/12384 [24:46:37<1:29:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 94%|█████████▍| 11677/12384 [24:46:37<1:29:36, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 94%|█████████▍| 11677/12384 [24:46:44<1:29:36, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 0: 94%|█████████▍| 11678/12384 [24:46:44<1:29:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 0: 94%|█████████▍| 11678/12384 [24:46:52<1:29:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 0: 94%|█████████▍| 11679/12384 [24:46:52<1:29:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 0: 94%|█████████▍| 11679/12384 [24:47:00<1:29:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.02s]
Epoch 0: 94%|█████████▍| 11680/12384 [24:47:00<1:30:37, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.02s]
Epoch 0: 94%|█████████▍| 11680/12384 [24:47:07<1:30:37, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 94%|█████████▍| 11681/12384 [24:47:07<1:30:04, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 94%|█████████▍| 11681/12384 [24:47:15<1:30:04, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 0: 94%|█████████▍| 11682/12384 [24:47:15<1:29:47, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 0: 94%|█████████▍| 11682/12384 [24:47:23<1:29:47, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 0: 94%|█████████▍| 11683/12384 [24:47:23<1:29:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 0: 94%|█████████▍| 11683/12384 [24:47:30<1:29:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 94%|█████████▍| 11684/12384 [24:47:30<1:29:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 94%|█████████▍| 11684/12384 [24:47:38<1:29:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 94%|█████████▍| 11685/12384 [24:47:38<1:28:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 94%|█████████▍| 11685/12384 [24:47:46<1:28:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.02s]
Epoch 0: 94%|█████████▍| 11686/12384 [24:47:46<1:28:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.02s]
Epoch 0: 94%|█████████▍| 11686/12384 [24:47:53<1:28:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.21s]
Epoch 0: 94%|█████████▍| 11687/12384 [24:47:53<1:28:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.21s]
Epoch 0: 94%|█████████▍| 11687/12384 [24:48:01<1:28:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 0: 94%|█████████▍| 11688/12384 [24:48:01<1:28:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 0: 94%|█████████▍| 11688/12384 [24:48:08<1:28:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.93s]
Epoch 0: 94%|█████████▍| 11689/12384 [24:48:08<1:28:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.93s]
Epoch 0: 94%|█████████▍| 11689/12384 [24:48:16<1:28:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 0: 94%|█████████▍| 11690/12384 [24:48:16<1:28:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 0: 94%|█████████▍| 11690/12384 [24:48:24<1:28:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.21s]
Epoch 0: 94%|█████████▍| 11691/12384 [24:48:24<1:27:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.21s]
Epoch 0: 94%|█████████▍| 11691/12384 [24:48:31<1:27:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 0: 94%|█████████▍| 11692/12384 [24:48:31<1:27:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 0: 94%|█████████▍| 11692/12384 [24:48:39<1:27:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 94%|█████████▍| 11693/12384 [24:48:39<1:27:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 94%|█████████▍| 11693/12384 [24:48:46<1:27:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 94%|█████████▍| 11694/12384 [24:48:46<1:27:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 94%|█████████▍| 11694/12384 [24:48:54<1:27:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 94%|█████████▍| 11695/12384 [24:48:54<1:27:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 94%|█████████▍| 11695/12384 [24:49:02<1:27:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 94%|█████████▍| 11696/12384 [24:49:02<1:27:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 94%|█████████▍| 11696/12384 [24:49:09<1:27:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.91s]
Epoch 0: 94%|█████████▍| 11697/12384 [24:49:09<1:27:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.91s]
Epoch 0: 94%|█████████▍| 11697/12384 [24:49:17<1:27:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.91s]
Epoch 0: 94%|█████████▍| 11698/12384 [24:49:17<1:27:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.91s]
Epoch 0: 94%|█████████▍| 11698/12384 [24:49:25<1:27:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 94%|█████████▍| 11699/12384 [24:49:25<1:27:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 94%|█████████▍| 11699/12384 [24:49:32<1:27:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 0: 94%|█████████▍| 11700/12384 [24:49:32<1:26:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 0: 94%|█████████▍| 11700/12384 [24:49:40<1:26:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 94%|█████████▍| 11701/12384 [24:49:40<1:26:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 94%|█████████▍| 11701/12384 [24:49:47<1:26:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 94%|█████████▍| 11702/12384 [24:49:47<1:26:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 94%|█████████▍| 11702/12384 [24:49:55<1:26:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 95%|█████████▍| 11703/12384 [24:49:55<1:26:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 95%|█████████▍| 11703/12384 [24:50:03<1:26:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 95%|█████████▍| 11704/12384 [24:50:03<1:26:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 95%|█████████▍| 11704/12384 [24:50:10<1:26:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 0: 95%|█████████▍| 11705/12384 [24:50:10<1:26:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 0: 95%|█████████▍| 11705/12384 [24:50:18<1:26:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 95%|█████████▍| 11706/12384 [24:50:18<1:27:24, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 95%|█████████▍| 11706/12384 [24:50:26<1:27:24, 7.74s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 95%|█████████▍| 11707/12384 [24:50:26<1:26:50, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 95%|█████████▍| 11707/12384 [24:50:34<1:26:50, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 95%|█████████▍| 11708/12384 [24:50:34<1:26:21, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 95%|█████████▍| 11708/12384 [24:50:41<1:26:21, 7.67s/it, loss=0.0004, acc=0.9981, iter_time=7.59s]
Epoch 0: 95%|█████████▍| 11709/12384 [24:50:41<1:26:05, 7.65s/it, loss=0.0004, acc=0.9981, iter_time=7.59s]
Epoch 0: 95%|█████████▍| 11709/12384 [24:50:49<1:26:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 0: 95%|█████████▍| 11710/12384 [24:50:49<1:25:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 0: 95%|█████████▍| 11710/12384 [24:50:56<1:25:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 0: 95%|█████████▍| 11711/12384 [24:50:56<1:25:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 0: 95%|█████████▍| 11711/12384 [24:51:04<1:25:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 95%|█████████▍| 11712/12384 [24:51:04<1:25:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 95%|█████████▍| 11712/12384 [24:51:12<1:25:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 95%|█████████▍| 11713/12384 [24:51:12<1:25:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 95%|█████████▍| 11713/12384 [24:51:19<1:25:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 95%|█████████▍| 11714/12384 [24:51:19<1:25:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 95%|█████████▍| 11714/12384 [24:51:27<1:25:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 95%|█████████▍| 11715/12384 [24:51:27<1:24:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 95%|█████████▍| 11715/12384 [24:51:34<1:24:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 95%|█████████▍| 11716/12384 [24:51:34<1:24:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 95%|█████████▍| 11716/12384 [24:51:42<1:24:46, 7.61s/it, loss=0.0004, acc=1.0000, iter_time=7.02s]
Epoch 0: 95%|█████████▍| 11717/12384 [24:51:42<1:24:32, 7.61s/it, loss=0.0004, acc=1.0000, iter_time=7.02s]
Epoch 0: 95%|█████████▍| 11717/12384 [24:51:50<1:24:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 0: 95%|█████████▍| 11718/12384 [24:51:50<1:24:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 0: 95%|█████████▍| 11718/12384 [24:51:57<1:24:25, 7.61s/it, loss=0.0003, acc=0.9981, iter_time=6.73s]
Epoch 0: 95%|█████████▍| 11719/12384 [24:51:57<1:24:13, 7.60s/it, loss=0.0003, acc=0.9981, iter_time=6.73s]
Epoch 0: 95%|█████████▍| 11719/12384 [24:52:05<1:24:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 0: 95%|█████████▍| 11720/12384 [24:52:05<1:24:07, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 0: 95%|█████████▍| 11720/12384 [24:52:12<1:24:07, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 95%|█████████▍| 11721/12384 [24:52:12<1:23:59, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 95%|█████████▍| 11721/12384 [24:52:20<1:23:59, 7.60s/it, loss=0.0001, acc=0.9991, iter_time=7.61s]
Epoch 0: 95%|█████████▍| 11722/12384 [24:52:20<1:23:50, 7.60s/it, loss=0.0001, acc=0.9991, iter_time=7.61s]
Epoch 0: 95%|█████████▍| 11722/12384 [24:52:28<1:23:50, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.31s]
Epoch 0: 95%|█████████▍| 11723/12384 [24:52:28<1:23:43, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.31s]
Epoch 0: 95%|█████████▍| 11723/12384 [24:52:35<1:23:43, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 95%|█████████▍| 11724/12384 [24:52:35<1:23:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 95%|█████████▍| 11724/12384 [24:52:43<1:23:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 0: 95%|█████████▍| 11725/12384 [24:52:43<1:23:29, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 0: 95%|█████████▍| 11725/12384 [24:52:50<1:23:29, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 95%|█████████▍| 11726/12384 [24:52:50<1:23:23, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 95%|█████████▍| 11726/12384 [24:52:58<1:23:23, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 95%|█████████▍| 11727/12384 [24:52:58<1:23:19, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 95%|█████████▍| 11727/12384 [24:53:06<1:23:19, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.65s]
Epoch 0: 95%|█████████▍| 11728/12384 [24:53:06<1:23:30, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.65s]
Epoch 0: 95%|█████████▍| 11728/12384 [24:53:13<1:23:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 0: 95%|█████████▍| 11729/12384 [24:53:13<1:23:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 0: 95%|█████████▍| 11729/12384 [24:53:21<1:23:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 0: 95%|█████████▍| 11730/12384 [24:53:21<1:23:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 0: 95%|█████████▍| 11730/12384 [24:53:29<1:23:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 0: 95%|█████████▍| 11731/12384 [24:53:29<1:22:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 0: 95%|█████████▍| 11731/12384 [24:53:36<1:22:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 0: 95%|█████████▍| 11732/12384 [24:53:36<1:22:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 0: 95%|█████████▍| 11732/12384 [24:53:44<1:22:50, 7.62s/it, loss=0.0019, acc=0.9969, iter_time=8.63s]
Epoch 0: 95%|█████████▍| 11733/12384 [24:53:44<1:23:48, 7.72s/it, loss=0.0019, acc=0.9969, iter_time=8.63s]
Epoch 0: 95%|█████████▍| 11733/12384 [24:53:52<1:23:48, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 95%|█████████▍| 11734/12384 [24:53:52<1:23:21, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 95%|█████████▍| 11734/12384 [24:54:00<1:23:21, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 95%|█████████▍| 11735/12384 [24:54:00<1:23:15, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 95%|█████████▍| 11735/12384 [24:54:07<1:23:15, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.40s]
Epoch 0: 95%|█████████▍| 11736/12384 [24:54:07<1:22:48, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.40s]
Epoch 0: 95%|█████████▍| 11736/12384 [24:54:15<1:22:48, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 95%|█████████▍| 11737/12384 [24:54:15<1:22:48, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 95%|█████████▍| 11737/12384 [24:54:22<1:22:48, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 0: 95%|█████████▍| 11738/12384 [24:54:22<1:22:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 0: 95%|█████████▍| 11738/12384 [24:54:30<1:22:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 0: 95%|█████████▍| 11739/12384 [24:54:30<1:22:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 0: 95%|█████████▍| 11739/12384 [24:54:38<1:22:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 0: 95%|█████████▍| 11740/12384 [24:54:38<1:21:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 0: 95%|█████████▍| 11740/12384 [24:54:45<1:21:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 0: 95%|█████████▍| 11741/12384 [24:54:45<1:21:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 0: 95%|█████████▍| 11741/12384 [24:54:53<1:21:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 0: 95%|█████████▍| 11742/12384 [24:54:53<1:21:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 0: 95%|█████████▍| 11742/12384 [24:55:00<1:21:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 95%|█████████▍| 11743/12384 [24:55:00<1:21:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 95%|█████████▍| 11743/12384 [24:55:08<1:21:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 95%|█████████▍| 11744/12384 [24:55:08<1:21:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 95%|█████████▍| 11744/12384 [24:55:16<1:21:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 95%|█████████▍| 11745/12384 [24:55:16<1:21:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 95%|█████████▍| 11745/12384 [24:55:23<1:21:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.26s]
Epoch 0: 95%|█████████▍| 11746/12384 [24:55:23<1:20:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.26s]
Epoch 0: 95%|█████████▍| 11746/12384 [24:55:31<1:20:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.47s]
Epoch 0: 95%|█████████▍| 11747/12384 [24:55:31<1:20:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.47s]
Epoch 0: 95%|█████████▍| 11747/12384 [24:55:38<1:20:45, 7.61s/it, loss=0.0003, acc=0.9972, iter_time=9.15s]
Epoch 0: 95%|█████████▍| 11748/12384 [24:55:38<1:20:46, 7.62s/it, loss=0.0003, acc=0.9972, iter_time=9.15s]
Epoch 0: 95%|█████████▍| 11748/12384 [24:55:46<1:20:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 95%|█████████▍| 11749/12384 [24:55:46<1:20:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 95%|█████████▍| 11749/12384 [24:55:54<1:20:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 95%|█████████▍| 11750/12384 [24:55:54<1:20:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 95%|█████████▍| 11750/12384 [24:56:01<1:20:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 95%|█████████▍| 11751/12384 [24:56:01<1:20:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 95%|█████████▍| 11751/12384 [24:56:09<1:20:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 95%|█████████▍| 11752/12384 [24:56:09<1:20:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 95%|█████████▍| 11752/12384 [24:56:17<1:20:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.73s]
Epoch 0: 95%|█████████▍| 11753/12384 [24:56:17<1:20:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.73s]
Epoch 0: 95%|█████████▍| 11753/12384 [24:56:24<1:20:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 0: 95%|█████████▍| 11754/12384 [24:56:24<1:20:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 0: 95%|█████████▍| 11754/12384 [24:56:32<1:20:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.37s]
Epoch 0: 95%|█████████▍| 11755/12384 [24:56:32<1:19:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.37s]
Epoch 0: 95%|█████████▍| 11755/12384 [24:56:39<1:19:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 0: 95%|█████████▍| 11756/12384 [24:56:39<1:19:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 0: 95%|█████████▍| 11756/12384 [24:56:47<1:19:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.83s]
Epoch 0: 95%|█████████▍| 11757/12384 [24:56:47<1:19:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.83s]
Epoch 0: 95%|█████████▍| 11757/12384 [24:56:55<1:19:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.50s]
Epoch 0: 95%|█████████▍| 11758/12384 [24:56:55<1:20:17, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=11.50s]
Epoch 0: 95%|█████████▍| 11758/12384 [24:57:03<1:20:17, 7.70s/it, loss=0.0002, acc=1.0000, iter_time=7.65s]
Epoch 0: 95%|█████████▍| 11759/12384 [24:57:03<1:20:50, 7.76s/it, loss=0.0002, acc=1.0000, iter_time=7.65s]
Epoch 0: 95%|█████████▍| 11759/12384 [24:57:10<1:20:50, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 0: 95%|█████████▍| 11760/12384 [24:57:10<1:20:16, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 0: 95%|█████████▍| 11760/12384 [24:57:18<1:20:16, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 95%|█████████▍| 11761/12384 [24:57:18<1:19:46, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 95%|█████████▍| 11761/12384 [24:57:26<1:19:46, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 95%|█████████▍| 11762/12384 [24:57:26<1:19:29, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 0: 95%|█████████▍| 11762/12384 [24:57:33<1:19:29, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.56s]
Epoch 0: 95%|█████████▍| 11763/12384 [24:57:33<1:19:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.56s]
Epoch 0: 95%|█████████▍| 11763/12384 [24:57:41<1:19:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.60s]
Epoch 0: 95%|█████████▍| 11764/12384 [24:57:41<1:18:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.60s]
Epoch 0: 95%|█████████▍| 11764/12384 [24:57:49<1:18:59, 7.64s/it, loss=0.0002, acc=0.9986, iter_time=7.64s]
Epoch 0: 95%|█████████▌| 11765/12384 [24:57:49<1:18:44, 7.63s/it, loss=0.0002, acc=0.9986, iter_time=7.64s]
Epoch 0: 95%|█████████▌| 11765/12384 [24:57:56<1:18:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 0: 95%|█████████▌| 11766/12384 [24:57:56<1:18:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 0: 95%|█████████▌| 11766/12384 [24:58:04<1:18:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 0: 95%|█████████▌| 11767/12384 [24:58:04<1:18:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 0: 95%|█████████▌| 11767/12384 [24:58:11<1:18:17, 7.61s/it, loss=0.0004, acc=0.9980, iter_time=9.72s]
Epoch 0: 95%|█████████▌| 11768/12384 [24:58:11<1:18:14, 7.62s/it, loss=0.0004, acc=0.9980, iter_time=9.72s]
Epoch 0: 95%|█████████▌| 11768/12384 [24:58:19<1:18:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 0: 95%|█████████▌| 11769/12384 [24:58:19<1:18:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 0: 95%|█████████▌| 11769/12384 [24:58:27<1:18:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.71s]
Epoch 0: 95%|█████████▌| 11770/12384 [24:58:27<1:17:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.71s]
Epoch 0: 95%|█████████▌| 11770/12384 [24:58:34<1:17:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.26s]
Epoch 0: 95%|█████████▌| 11771/12384 [24:58:34<1:18:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.26s]
Epoch 0: 95%|█████████▌| 11771/12384 [24:58:42<1:18:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 0: 95%|█████████▌| 11772/12384 [24:58:42<1:17:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 0: 95%|█████████▌| 11772/12384 [24:58:49<1:17:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.23s]
Epoch 0: 95%|█████████▌| 11773/12384 [24:58:49<1:17:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.23s]
Epoch 0: 95%|█████████▌| 11773/12384 [24:58:57<1:17:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.88s]
Epoch 0: 95%|█████████▌| 11774/12384 [24:58:57<1:17:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.88s]
Epoch 0: 95%|█████████▌| 11774/12384 [24:59:05<1:17:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 95%|█████████▌| 11775/12384 [24:59:05<1:17:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 95%|█████████▌| 11775/12384 [24:59:12<1:17:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.12s]
Epoch 0: 95%|█████████▌| 11776/12384 [24:59:12<1:17:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.12s]
Epoch 0: 95%|█████████▌| 11776/12384 [24:59:20<1:17:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 0: 95%|█████████▌| 11777/12384 [24:59:20<1:17:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 0: 95%|█████████▌| 11777/12384 [24:59:28<1:17:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 0: 95%|█████████▌| 11778/12384 [24:59:28<1:17:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 0: 95%|█████████▌| 11778/12384 [24:59:35<1:17:03, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.92s]
Epoch 0: 95%|█████████▌| 11779/12384 [24:59:35<1:17:01, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=9.92s]
Epoch 0: 95%|█████████▌| 11779/12384 [24:59:43<1:17:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 95%|█████████▌| 11780/12384 [24:59:43<1:16:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 95%|█████████▌| 11780/12384 [24:59:51<1:16:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 95%|█████████▌| 11781/12384 [24:59:51<1:16:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 95%|█████████▌| 11781/12384 [24:59:58<1:16:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 95%|█████████▌| 11782/12384 [24:59:58<1:16:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 95%|█████████▌| 11782/12384 [25:00:06<1:16:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 0: 95%|█████████▌| 11783/12384 [25:00:06<1:16:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 0: 95%|█████████▌| 11783/12384 [25:00:13<1:16:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.09s]
Epoch 0: 95%|█████████▌| 11784/12384 [25:00:13<1:16:01, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.09s]
Epoch 0: 95%|█████████▌| 11784/12384 [25:00:21<1:16:01, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.39s]
Epoch 0: 95%|█████████▌| 11785/12384 [25:00:21<1:17:02, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.39s]
Epoch 0: 95%|█████████▌| 11785/12384 [25:00:29<1:17:02, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.81s]
Epoch 0: 95%|█████████▌| 11786/12384 [25:00:29<1:16:38, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.81s]
Epoch 0: 95%|█████████▌| 11786/12384 [25:00:37<1:16:38, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 95%|█████████▌| 11787/12384 [25:00:37<1:16:18, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 95%|█████████▌| 11787/12384 [25:00:44<1:16:18, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=3.89s]
Epoch 0: 95%|█████████▌| 11788/12384 [25:00:44<1:16:12, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=3.89s]
Epoch 0: 95%|█████████▌| 11788/12384 [25:00:52<1:16:12, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 0: 95%|█████████▌| 11789/12384 [25:00:52<1:15:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 0: 95%|█████████▌| 11789/12384 [25:00:59<1:15:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 0: 95%|█████████▌| 11790/12384 [25:00:59<1:15:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 0: 95%|█████████▌| 11790/12384 [25:01:07<1:15:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 0: 95%|█████████▌| 11791/12384 [25:01:07<1:15:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 0: 95%|█████████▌| 11791/12384 [25:01:15<1:15:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 0: 95%|█████████▌| 11792/12384 [25:01:15<1:15:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 0: 95%|█████████▌| 11792/12384 [25:01:22<1:15:11, 7.62s/it, loss=0.0016, acc=0.9973, iter_time=4.59s]
Epoch 0: 95%|█████████▌| 11793/12384 [25:01:22<1:14:59, 7.61s/it, loss=0.0016, acc=0.9973, iter_time=4.59s]
Epoch 0: 95%|█████████▌| 11793/12384 [25:01:30<1:14:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 0: 95%|█████████▌| 11794/12384 [25:01:30<1:14:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 0: 95%|█████████▌| 11794/12384 [25:01:37<1:14:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.65s]
Epoch 0: 95%|█████████▌| 11795/12384 [25:01:37<1:14:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.65s]
Epoch 0: 95%|█████████▌| 11795/12384 [25:01:45<1:14:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 0: 95%|█████████▌| 11796/12384 [25:01:45<1:14:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 0: 95%|█████████▌| 11796/12384 [25:01:53<1:14:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.46s]
Epoch 0: 95%|█████████▌| 11797/12384 [25:01:53<1:14:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.46s]
Epoch 0: 95%|█████████▌| 11797/12384 [25:02:00<1:14:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 0: 95%|█████████▌| 11798/12384 [25:02:00<1:14:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 0: 95%|█████████▌| 11798/12384 [25:02:08<1:14:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 0: 95%|█████████▌| 11799/12384 [25:02:08<1:14:05, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 0: 95%|█████████▌| 11799/12384 [25:02:15<1:14:05, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.20s]
Epoch 0: 95%|█████████▌| 11800/12384 [25:02:15<1:14:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.20s]
Epoch 0: 95%|█████████▌| 11800/12384 [25:02:23<1:14:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.13s]
Epoch 0: 95%|█████████▌| 11801/12384 [25:02:23<1:13:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.13s]
Epoch 0: 95%|█████████▌| 11801/12384 [25:02:31<1:13:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.36s]
Epoch 0: 95%|█████████▌| 11802/12384 [25:02:31<1:13:45, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.36s]
Epoch 0: 95%|█████████▌| 11802/12384 [25:02:38<1:13:45, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.19s]
Epoch 0: 95%|█████████▌| 11803/12384 [25:02:38<1:13:36, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.19s]
Epoch 0: 95%|█████████▌| 11803/12384 [25:02:46<1:13:36, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.32s]
Epoch 0: 95%|█████████▌| 11804/12384 [25:02:46<1:13:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.32s]
Epoch 0: 95%|█████████▌| 11804/12384 [25:02:53<1:13:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 95%|█████████▌| 11805/12384 [25:02:53<1:13:17, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 95%|█████████▌| 11805/12384 [25:03:01<1:13:17, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 95%|█████████▌| 11806/12384 [25:03:01<1:13:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 95%|█████████▌| 11806/12384 [25:03:09<1:13:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 95%|█████████▌| 11807/12384 [25:03:09<1:13:04, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 95%|█████████▌| 11807/12384 [25:03:16<1:13:04, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 95%|█████████▌| 11808/12384 [25:03:16<1:13:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 95%|█████████▌| 11808/12384 [25:03:24<1:13:02, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=6.57s]
Epoch 0: 95%|█████████▌| 11809/12384 [25:03:24<1:12:07, 7.53s/it, loss=0.0003, acc=1.0000, iter_time=6.57s]
Epoch 0: 95%|█████████▌| 11809/12384 [25:03:31<1:12:07, 7.53s/it, loss=0.0004, acc=0.9997, iter_time=7.05s]
Epoch 0: 95%|█████████▌| 11810/12384 [25:03:31<1:12:12, 7.55s/it, loss=0.0004, acc=0.9997, iter_time=7.05s]
Epoch 0: 95%|█████████▌| 11810/12384 [25:03:39<1:12:12, 7.55s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 0: 95%|█████████▌| 11811/12384 [25:03:39<1:13:25, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 0: 95%|█████████▌| 11811/12384 [25:03:47<1:13:25, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.10s]
Epoch 0: 95%|█████████▌| 11812/12384 [25:03:47<1:13:07, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.10s]
Epoch 0: 95%|█████████▌| 11812/12384 [25:03:54<1:13:07, 7.67s/it, loss=0.0001, acc=0.9998, iter_time=9.41s]
Epoch 0: 95%|█████████▌| 11813/12384 [25:03:54<1:12:50, 7.65s/it, loss=0.0001, acc=0.9998, iter_time=9.41s]
Epoch 0: 95%|█████████▌| 11813/12384 [25:04:02<1:12:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 0: 95%|█████████▌| 11814/12384 [25:04:02<1:12:44, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 0: 95%|█████████▌| 11814/12384 [25:04:10<1:12:44, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.68s]
Epoch 0: 95%|█████████▌| 11815/12384 [25:04:10<1:12:26, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.68s]
Epoch 0: 95%|█████████▌| 11815/12384 [25:04:17<1:12:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 95%|█████████▌| 11816/12384 [25:04:17<1:12:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 95%|█████████▌| 11816/12384 [25:04:25<1:12:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 95%|█████████▌| 11817/12384 [25:04:25<1:12:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 95%|█████████▌| 11817/12384 [25:04:33<1:12:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 95%|█████████▌| 11818/12384 [25:04:33<1:11:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 95%|█████████▌| 11818/12384 [25:04:40<1:11:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 95%|█████████▌| 11819/12384 [25:04:40<1:11:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 95%|█████████▌| 11819/12384 [25:04:48<1:11:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 0: 95%|█████████▌| 11820/12384 [25:04:48<1:11:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 0: 95%|█████████▌| 11820/12384 [25:04:55<1:11:41, 7.63s/it, loss=0.0004, acc=0.9978, iter_time=8.79s]
Epoch 0: 95%|█████████▌| 11821/12384 [25:04:55<1:11:30, 7.62s/it, loss=0.0004, acc=0.9978, iter_time=8.79s]
Epoch 0: 95%|█████████▌| 11821/12384 [25:05:03<1:11:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 95%|█████████▌| 11822/12384 [25:05:03<1:11:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 95%|█████████▌| 11822/12384 [25:05:11<1:11:16, 7.61s/it, loss=0.0011, acc=0.9978, iter_time=7.60s]
Epoch 0: 95%|█████████▌| 11823/12384 [25:05:11<1:11:11, 7.61s/it, loss=0.0011, acc=0.9978, iter_time=7.60s]
Epoch 0: 95%|█████████▌| 11823/12384 [25:05:18<1:11:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 95%|█████████▌| 11824/12384 [25:05:18<1:11:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 95%|█████████▌| 11824/12384 [25:05:26<1:11:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 95%|█████████▌| 11825/12384 [25:05:26<1:10:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 95%|█████████▌| 11825/12384 [25:05:34<1:10:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 0: 95%|█████████▌| 11826/12384 [25:05:34<1:10:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 0: 95%|█████████▌| 11826/12384 [25:05:41<1:10:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 0: 96%|█████████▌| 11827/12384 [25:05:41<1:10:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 0: 96%|█████████▌| 11827/12384 [25:05:49<1:10:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 0: 96%|█████████▌| 11828/12384 [25:05:49<1:10:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 0: 96%|█████████▌| 11828/12384 [25:05:56<1:10:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 0: 96%|█████████▌| 11829/12384 [25:05:56<1:10:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 0: 96%|█████████▌| 11829/12384 [25:06:04<1:10:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 0: 96%|█████████▌| 11830/12384 [25:06:04<1:10:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 0: 96%|█████████▌| 11830/12384 [25:06:12<1:10:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 96%|█████████▌| 11831/12384 [25:06:12<1:10:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 96%|█████████▌| 11831/12384 [25:06:19<1:10:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 96%|█████████▌| 11832/12384 [25:06:19<1:10:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 96%|█████████▌| 11832/12384 [25:06:27<1:10:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.11s]
Epoch 0: 96%|█████████▌| 11833/12384 [25:06:27<1:09:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.11s]
Epoch 0: 96%|█████████▌| 11833/12384 [25:06:34<1:09:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.23s]
Epoch 0: 96%|█████████▌| 11834/12384 [25:06:34<1:09:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.23s]
Epoch 0: 96%|█████████▌| 11834/12384 [25:06:42<1:09:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.25s]
Epoch 0: 96%|█████████▌| 11835/12384 [25:06:42<1:09:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.25s]
Epoch 0: 96%|█████████▌| 11835/12384 [25:06:50<1:09:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.44s]
Epoch 0: 96%|█████████▌| 11836/12384 [25:06:50<1:09:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.44s]
Epoch 0: 96%|█████████▌| 11836/12384 [25:06:58<1:09:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 0: 96%|█████████▌| 11837/12384 [25:06:58<1:10:35, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 0: 96%|█████████▌| 11837/12384 [25:07:05<1:10:35, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.44s]
Epoch 0: 96%|█████████▌| 11838/12384 [25:07:05<1:10:05, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.44s]
Epoch 0: 96%|█████████▌| 11838/12384 [25:07:13<1:10:05, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 0: 96%|█████████▌| 11839/12384 [25:07:13<1:09:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 0: 96%|█████████▌| 11839/12384 [25:07:20<1:09:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.39s]
Epoch 0: 96%|█████████▌| 11840/12384 [25:07:20<1:09:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.39s]
Epoch 0: 96%|█████████▌| 11840/12384 [25:07:28<1:09:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 0: 96%|█████████▌| 11841/12384 [25:07:28<1:09:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 0: 96%|█████████▌| 11841/12384 [25:07:36<1:09:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 0: 96%|█████████▌| 11842/12384 [25:07:36<1:08:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 0: 96%|█████████▌| 11842/12384 [25:07:43<1:08:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 0: 96%|█████████▌| 11843/12384 [25:07:43<1:08:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 0: 96%|█████████▌| 11843/12384 [25:07:51<1:08:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 0: 96%|█████████▌| 11844/12384 [25:07:51<1:08:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 0: 96%|█████████▌| 11844/12384 [25:07:59<1:08:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 0: 96%|█████████▌| 11845/12384 [25:07:59<1:08:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 0: 96%|█████████▌| 11845/12384 [25:08:06<1:08:23, 7.61s/it, loss=0.0004, acc=0.9986, iter_time=7.59s]
Epoch 0: 96%|█████████▌| 11846/12384 [25:08:06<1:08:22, 7.63s/it, loss=0.0004, acc=0.9986, iter_time=7.59s]
Epoch 0: 96%|█████████▌| 11846/12384 [25:08:14<1:08:22, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.39s]
Epoch 0: 96%|█████████▌| 11847/12384 [25:08:14<1:08:12, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.39s]
Epoch 0: 96%|█████████▌| 11847/12384 [25:08:21<1:08:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.85s]
Epoch 0: 96%|█████████▌| 11848/12384 [25:08:21<1:08:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.85s]
Epoch 0: 96%|█████████▌| 11848/12384 [25:08:29<1:08:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 96%|█████████▌| 11849/12384 [25:08:29<1:07:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 96%|█████████▌| 11849/12384 [25:08:37<1:07:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 96%|█████████▌| 11850/12384 [25:08:37<1:07:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 96%|█████████▌| 11850/12384 [25:08:44<1:07:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 96%|█████████▌| 11851/12384 [25:08:44<1:07:32, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 96%|█████████▌| 11851/12384 [25:08:52<1:07:32, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 0: 96%|█████████▌| 11852/12384 [25:08:52<1:07:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 0: 96%|█████████▌| 11852/12384 [25:08:59<1:07:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.68s]
Epoch 0: 96%|█████████▌| 11853/12384 [25:08:59<1:07:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.68s]
Epoch 0: 96%|█████████▌| 11853/12384 [25:09:07<1:07:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 0: 96%|█████████▌| 11854/12384 [25:09:07<1:07:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 0: 96%|█████████▌| 11854/12384 [25:09:15<1:07:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.63s]
Epoch 0: 96%|█████████▌| 11855/12384 [25:09:15<1:07:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.63s]
Epoch 0: 96%|█████████▌| 11855/12384 [25:09:22<1:07:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 0: 96%|█████████▌| 11856/12384 [25:09:22<1:07:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 0: 96%|█████████▌| 11856/12384 [25:09:30<1:07:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 96%|█████████▌| 11857/12384 [25:09:30<1:06:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 96%|█████████▌| 11857/12384 [25:09:37<1:06:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 0: 96%|█████████▌| 11858/12384 [25:09:37<1:06:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 0: 96%|█████████▌| 11858/12384 [25:09:45<1:06:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 0: 96%|█████████▌| 11859/12384 [25:09:45<1:06:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 0: 96%|█████████▌| 11859/12384 [25:09:53<1:06:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 96%|█████████▌| 11860/12384 [25:09:53<1:06:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 96%|█████████▌| 11860/12384 [25:10:00<1:06:28, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.83s]
Epoch 0: 96%|█████████▌| 11861/12384 [25:10:00<1:06:19, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.83s]
Epoch 0: 96%|█████████▌| 11861/12384 [25:10:08<1:06:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 96%|█████████▌| 11862/12384 [25:10:08<1:06:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 96%|█████████▌| 11862/12384 [25:10:16<1:06:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.02s]
Epoch 0: 96%|█████████▌| 11863/12384 [25:10:16<1:06:45, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=11.02s]
Epoch 0: 96%|█████████▌| 11863/12384 [25:10:24<1:06:45, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.91s]
Epoch 0: 96%|█████████▌| 11864/12384 [25:10:24<1:07:24, 7.78s/it, loss=0.0001, acc=1.0000, iter_time=7.91s]
Epoch 0: 96%|█████████▌| 11864/12384 [25:10:31<1:07:24, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 96%|█████████▌| 11865/12384 [25:10:31<1:06:49, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 96%|█████████▌| 11865/12384 [25:10:39<1:06:49, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 96%|█████████▌| 11866/12384 [25:10:39<1:06:26, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 96%|█████████▌| 11866/12384 [25:10:47<1:06:26, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 96%|█████████▌| 11867/12384 [25:10:47<1:06:03, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 96%|█████████▌| 11867/12384 [25:10:54<1:06:03, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 0: 96%|█████████▌| 11868/12384 [25:10:54<1:05:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 0: 96%|█████████▌| 11868/12384 [25:11:02<1:05:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.30s]
Epoch 0: 96%|█████████▌| 11869/12384 [25:11:02<1:05:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.30s]
Epoch 0: 96%|█████████▌| 11869/12384 [25:11:09<1:05:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 0: 96%|█████████▌| 11870/12384 [25:11:09<1:05:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 0: 96%|█████████▌| 11870/12384 [25:11:17<1:05:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 96%|█████████▌| 11871/12384 [25:11:17<1:05:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 96%|█████████▌| 11871/12384 [25:11:25<1:05:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 96%|█████████▌| 11872/12384 [25:11:25<1:05:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 96%|█████████▌| 11872/12384 [25:11:32<1:05:03, 7.62s/it, loss=0.0002, acc=0.9992, iter_time=7.54s]
Epoch 0: 96%|█████████▌| 11873/12384 [25:11:32<1:04:54, 7.62s/it, loss=0.0002, acc=0.9992, iter_time=7.54s]
Epoch 0: 96%|█████████▌| 11873/12384 [25:11:40<1:04:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 0: 96%|█████████▌| 11874/12384 [25:11:40<1:04:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 0: 96%|█████████▌| 11874/12384 [25:11:47<1:04:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 0: 96%|█████████▌| 11875/12384 [25:11:47<1:04:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 0: 96%|█████████▌| 11875/12384 [25:11:55<1:04:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 0: 96%|█████████▌| 11876/12384 [25:11:55<1:04:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 0: 96%|█████████▌| 11876/12384 [25:12:03<1:04:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 0: 96%|█████████▌| 11877/12384 [25:12:03<1:04:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 0: 96%|█████████▌| 11877/12384 [25:12:10<1:04:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 0: 96%|█████████▌| 11878/12384 [25:12:10<1:04:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 0: 96%|█████████▌| 11878/12384 [25:12:18<1:04:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 0: 96%|█████████▌| 11879/12384 [25:12:18<1:04:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 0: 96%|█████████▌| 11879/12384 [25:12:26<1:04:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.52s]
Epoch 0: 96%|█████████▌| 11880/12384 [25:12:26<1:04:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.52s]
Epoch 0: 96%|█████████▌| 11880/12384 [25:12:33<1:04:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 96%|█████████▌| 11881/12384 [25:12:33<1:03:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 96%|█████████▌| 11881/12384 [25:12:41<1:03:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 0: 96%|█████████▌| 11882/12384 [25:12:41<1:03:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 0: 96%|█████████▌| 11882/12384 [25:12:48<1:03:40, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.90s]
Epoch 0: 96%|█████████▌| 11883/12384 [25:12:48<1:03:31, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.90s]
Epoch 0: 96%|█████████▌| 11883/12384 [25:12:56<1:03:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 96%|█████████▌| 11884/12384 [25:12:56<1:03:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 96%|█████████▌| 11884/12384 [25:13:04<1:03:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 96%|█████████▌| 11885/12384 [25:13:04<1:03:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 96%|█████████▌| 11885/12384 [25:13:11<1:03:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 96%|█████████▌| 11886/12384 [25:13:11<1:03:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 96%|█████████▌| 11886/12384 [25:13:19<1:03:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 0: 96%|█████████▌| 11887/12384 [25:13:19<1:03:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 0: 96%|█████████▌| 11887/12384 [25:13:26<1:03:00, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.29s]
Epoch 0: 96%|█████████▌| 11888/12384 [25:13:26<1:02:54, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.29s]
Epoch 0: 96%|█████████▌| 11888/12384 [25:13:34<1:02:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 0: 96%|█████████▌| 11889/12384 [25:13:34<1:03:25, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 0: 96%|█████████▌| 11889/12384 [25:13:42<1:03:25, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 96%|█████████▌| 11890/12384 [25:13:42<1:03:51, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 96%|█████████▌| 11890/12384 [25:13:50<1:03:51, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 0: 96%|█████████▌| 11891/12384 [25:13:50<1:03:23, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 0: 96%|█████████▌| 11891/12384 [25:13:57<1:03:23, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 96%|█████████▌| 11892/12384 [25:13:57<1:03:00, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 96%|█████████▌| 11892/12384 [25:14:05<1:03:00, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 96%|█████████▌| 11893/12384 [25:14:05<1:02:42, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 96%|█████████▌| 11893/12384 [25:14:13<1:02:42, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 0: 96%|█████████▌| 11894/12384 [25:14:13<1:02:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 0: 96%|█████████▌| 11894/12384 [25:14:20<1:02:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 0: 96%|█████████▌| 11895/12384 [25:14:20<1:02:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 0: 96%|█████████▌| 11895/12384 [25:14:28<1:02:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 0: 96%|█████████▌| 11896/12384 [25:14:28<1:01:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 0: 96%|█████████▌| 11896/12384 [25:14:35<1:01:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.46s]
Epoch 0: 96%|█████████▌| 11897/12384 [25:14:35<1:01:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.46s]
Epoch 0: 96%|█████████▌| 11897/12384 [25:14:43<1:01:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 0: 96%|█████████▌| 11898/12384 [25:14:43<1:01:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 0: 96%|█████████▌| 11898/12384 [25:14:51<1:01:40, 7.61s/it, loss=0.0009, acc=0.9972, iter_time=10.48s]
Epoch 0: 96%|█████████▌| 11899/12384 [25:14:51<1:01:29, 7.61s/it, loss=0.0009, acc=0.9972, iter_time=10.48s]
Epoch 0: 96%|█████████▌| 11899/12384 [25:14:58<1:01:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 96%|█████████▌| 11900/12384 [25:14:58<1:01:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 96%|█████████▌| 11900/12384 [25:15:06<1:01:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 96%|█████████▌| 11901/12384 [25:15:06<1:01:10, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 96%|█████████▌| 11901/12384 [25:15:13<1:01:10, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 0: 96%|█████████▌| 11902/12384 [25:15:13<1:01:01, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 0: 96%|█████████▌| 11902/12384 [25:15:21<1:01:01, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 0: 96%|█████████▌| 11903/12384 [25:15:21<1:00:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 0: 96%|█████████▌| 11903/12384 [25:15:29<1:00:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 96%|█████████▌| 11904/12384 [25:15:29<1:00:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 96%|█████████▌| 11904/12384 [25:15:36<1:00:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 96%|█████████▌| 11905/12384 [25:15:36<1:00:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 96%|█████████▌| 11905/12384 [25:15:44<1:00:44, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 96%|█████████▌| 11906/12384 [25:15:44<1:00:40, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 96%|█████████▌| 11906/12384 [25:15:52<1:00:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 96%|█████████▌| 11907/12384 [25:15:52<1:00:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 96%|█████████▌| 11907/12384 [25:15:59<1:00:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.24s]
Epoch 0: 96%|█████████▌| 11908/12384 [25:15:59<1:00:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.24s]
Epoch 0: 96%|█████████▌| 11908/12384 [25:16:07<1:00:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 96%|█████████▌| 11909/12384 [25:16:07<1:00:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 96%|█████████▌| 11909/12384 [25:16:14<1:00:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.12s]
Epoch 0: 96%|█████████▌| 11910/12384 [25:16:14<1:00:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.12s]
Epoch 0: 96%|█████████▌| 11910/12384 [25:16:22<1:00:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 0: 96%|█████████▌| 11911/12384 [25:16:22<1:00:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 0: 96%|█████████▌| 11911/12384 [25:16:30<1:00:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 0: 96%|█████████▌| 11912/12384 [25:16:30<1:00:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 0: 96%|█████████▌| 11912/12384 [25:16:37<1:00:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 96%|█████████▌| 11913/12384 [25:16:37<59:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 0: 96%|█████████▌| 11913/12384 [25:16:45<59:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 96%|█████████▌| 11914/12384 [25:16:45<59:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 96%|█████████▌| 11914/12384 [25:16:53<59:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 0: 96%|█████████▌| 11915/12384 [25:16:53<59:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 0: 96%|█████████▌| 11915/12384 [25:17:00<59:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 0: 96%|█████████▌| 11916/12384 [25:17:00<59:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 0: 96%|█████████▌| 11916/12384 [25:17:08<59:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 0: 96%|█████████▌| 11917/12384 [25:17:08<1:00:00, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 0: 96%|█████████▌| 11917/12384 [25:17:16<1:00:00, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 96%|█████████▌| 11918/12384 [25:17:16<59:36, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 0: 96%|█████████▌| 11918/12384 [25:17:23<59:36, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 96%|█████████▌| 11919/12384 [25:17:23<59:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 96%|█████████▌| 11919/12384 [25:17:31<59:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 0: 96%|█████████▋| 11920/12384 [25:17:31<59:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 0: 96%|█████████▋| 11920/12384 [25:17:38<59:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 0: 96%|█████████▋| 11921/12384 [25:17:38<58:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 0: 96%|█████████▋| 11921/12384 [25:17:46<58:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 0: 96%|█████████▋| 11922/12384 [25:17:46<58:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 0: 96%|█████████▋| 11922/12384 [25:17:54<58:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.57s]
Epoch 0: 96%|█████████▋| 11923/12384 [25:17:54<58:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.57s]
Epoch 0: 96%|█████████▋| 11923/12384 [25:18:01<58:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.88s]
Epoch 0: 96%|█████████▋| 11924/12384 [25:18:01<58:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.88s]
Epoch 0: 96%|█████████▋| 11924/12384 [25:18:09<58:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 0: 96%|█████████▋| 11925/12384 [25:18:09<58:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 0: 96%|█████████▋| 11925/12384 [25:18:17<58:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 0: 96%|█████████▋| 11926/12384 [25:18:17<58:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 0: 96%|█████████▋| 11926/12384 [25:18:24<58:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 0: 96%|█████████▋| 11927/12384 [25:18:24<58:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 0: 96%|█████████▋| 11927/12384 [25:18:32<58:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.10s]
Epoch 0: 96%|█████████▋| 11928/12384 [25:18:32<57:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.10s]
Epoch 0: 96%|█████████▋| 11928/12384 [25:18:39<57:52, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.22s]
Epoch 0: 96%|█████████▋| 11929/12384 [25:18:39<57:42, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.22s]
Epoch 0: 96%|█████████▋| 11929/12384 [25:18:47<57:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 0: 96%|█████████▋| 11930/12384 [25:18:47<57:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 0: 96%|█████████▋| 11930/12384 [25:18:55<57:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 0: 96%|█████████▋| 11931/12384 [25:18:55<57:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 0: 96%|█████████▋| 11931/12384 [25:19:02<57:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 0: 96%|█████████▋| 11932/12384 [25:19:02<57:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 0: 96%|█████████▋| 11932/12384 [25:19:10<57:24, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=8.26s]
Epoch 0: 96%|█████████▋| 11933/12384 [25:19:10<57:18, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=8.26s]
Epoch 0: 96%|█████████▋| 11933/12384 [25:19:18<57:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 0: 96%|█████████▋| 11934/12384 [25:19:18<57:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 0: 96%|█████████▋| 11934/12384 [25:19:25<57:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.14s]
Epoch 0: 96%|█████████▋| 11935/12384 [25:19:25<57:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.14s]
Epoch 0: 96%|█████████▋| 11935/12384 [25:19:33<57:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 0: 96%|█████████▋| 11936/12384 [25:19:33<57:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 0: 96%|█████████▋| 11936/12384 [25:19:40<57:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 96%|█████████▋| 11937/12384 [25:19:40<56:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 96%|█████████▋| 11937/12384 [25:19:48<56:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 0: 96%|█████████▋| 11938/12384 [25:19:48<56:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 0: 96%|█████████▋| 11938/12384 [25:19:56<56:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 0: 96%|█████████▋| 11939/12384 [25:19:56<56:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 0: 96%|█████████▋| 11939/12384 [25:20:03<56:36, 7.63s/it, loss=0.0001, acc=0.9996, iter_time=10.48s]
Epoch 0: 96%|█████████▋| 11940/12384 [25:20:03<56:27, 7.63s/it, loss=0.0001, acc=0.9996, iter_time=10.48s]
Epoch 0: 96%|█████████▋| 11940/12384 [25:20:11<56:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 96%|█████████▋| 11941/12384 [25:20:11<56:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 96%|█████████▋| 11941/12384 [25:20:19<56:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 96%|█████████▋| 11942/12384 [25:20:19<56:44, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 96%|█████████▋| 11942/12384 [25:20:27<56:44, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 0: 96%|█████████▋| 11943/12384 [25:20:27<57:03, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 0: 96%|█████████▋| 11943/12384 [25:20:34<57:03, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=9.54s]
Epoch 0: 96%|█████████▋| 11944/12384 [25:20:34<56:34, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.54s]
Epoch 0: 96%|█████████▋| 11944/12384 [25:20:42<56:34, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 0: 96%|█████████▋| 11945/12384 [25:20:42<56:18, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 0: 96%|█████████▋| 11945/12384 [25:20:50<56:18, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.89s]
Epoch 0: 96%|█████████▋| 11946/12384 [25:20:50<55:58, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.89s]
Epoch 0: 96%|█████████▋| 11946/12384 [25:20:57<55:58, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 96%|█████████▋| 11947/12384 [25:20:57<55:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 96%|█████████▋| 11947/12384 [25:21:05<55:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.47s]
Epoch 0: 96%|█████████▋| 11948/12384 [25:21:05<55:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.47s]
Epoch 0: 96%|█████████▋| 11948/12384 [25:21:12<55:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 0: 96%|█████████▋| 11949/12384 [25:21:12<55:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 0: 96%|█████████▋| 11949/12384 [25:21:20<55:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 96%|█████████▋| 11950/12384 [25:21:20<55:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 96%|█████████▋| 11950/12384 [25:21:28<55:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.34s]
Epoch 0: 97%|█████████▋| 11951/12384 [25:21:28<54:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.34s]
Epoch 0: 97%|█████████▋| 11951/12384 [25:21:35<54:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 0: 97%|█████████▋| 11952/12384 [25:21:35<55:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 0: 97%|█████████▋| 11952/12384 [25:21:43<55:03, 7.65s/it, loss=0.0003, acc=0.9999, iter_time=7.67s]
Epoch 0: 97%|█████████▋| 11953/12384 [25:21:43<54:49, 7.63s/it, loss=0.0003, acc=0.9999, iter_time=7.67s]
Epoch 0: 97%|█████████▋| 11953/12384 [25:21:51<54:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 97%|█████████▋| 11954/12384 [25:21:51<54:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 97%|█████████▋| 11954/12384 [25:21:58<54:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 97%|█████████▋| 11955/12384 [25:21:58<54:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 97%|█████████▋| 11955/12384 [25:22:06<54:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 97%|█████████▋| 11956/12384 [25:22:06<54:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 97%|█████████▋| 11956/12384 [25:22:13<54:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.36s]
Epoch 0: 97%|█████████▋| 11957/12384 [25:22:13<54:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.36s]
Epoch 0: 97%|█████████▋| 11957/12384 [25:22:21<54:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.86s]
Epoch 0: 97%|█████████▋| 11958/12384 [25:22:21<54:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.86s]
Epoch 0: 97%|█████████▋| 11958/12384 [25:22:29<54:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 97%|█████████▋| 11959/12384 [25:22:29<54:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 97%|█████████▋| 11959/12384 [25:22:36<54:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 97%|█████████▋| 11960/12384 [25:22:36<53:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 97%|█████████▋| 11960/12384 [25:22:44<53:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 97%|█████████▋| 11961/12384 [25:22:44<53:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 97%|█████████▋| 11961/12384 [25:22:52<53:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 97%|█████████▋| 11962/12384 [25:22:52<53:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 97%|█████████▋| 11962/12384 [25:22:59<53:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 97%|█████████▋| 11963/12384 [25:22:59<53:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 97%|█████████▋| 11963/12384 [25:23:07<53:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 97%|█████████▋| 11964/12384 [25:23:07<53:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 97%|█████████▋| 11964/12384 [25:23:14<53:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 97%|█████████▋| 11965/12384 [25:23:14<53:05, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 97%|█████████▋| 11965/12384 [25:23:22<53:05, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 97%|█████████▋| 11966/12384 [25:23:22<52:58, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 97%|█████████▋| 11966/12384 [25:23:30<52:58, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 97%|█████████▋| 11967/12384 [25:23:30<52:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 97%|█████████▋| 11967/12384 [25:23:37<52:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 97%|█████████▋| 11968/12384 [25:23:37<52:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 97%|█████████▋| 11968/12384 [25:23:45<52:47, 7.61s/it, loss=0.0010, acc=0.9985, iter_time=7.51s]
Epoch 0: 97%|█████████▋| 11969/12384 [25:23:45<53:23, 7.72s/it, loss=0.0010, acc=0.9985, iter_time=7.51s]
Epoch 0: 97%|█████████▋| 11969/12384 [25:23:53<53:23, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 97%|█████████▋| 11970/12384 [25:23:53<53:02, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 97%|█████████▋| 11970/12384 [25:24:00<53:02, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 97%|█████████▋| 11971/12384 [25:24:00<52:50, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 97%|█████████▋| 11971/12384 [25:24:08<52:50, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 97%|█████████▋| 11972/12384 [25:24:08<52:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 97%|█████████▋| 11972/12384 [25:24:16<52:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 97%|█████████▋| 11973/12384 [25:24:16<52:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 97%|█████████▋| 11973/12384 [25:24:23<52:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.23s]
Epoch 0: 97%|█████████▋| 11974/12384 [25:24:23<52:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.23s]
Epoch 0: 97%|█████████▋| 11974/12384 [25:24:31<52:08, 7.63s/it, loss=0.0002, acc=0.9995, iter_time=11.00s]
Epoch 0: 97%|█████████▋| 11975/12384 [25:24:31<52:08, 7.65s/it, loss=0.0002, acc=0.9995, iter_time=11.00s]
Epoch 0: 97%|█████████▋| 11975/12384 [25:24:38<52:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 0: 97%|█████████▋| 11976/12384 [25:24:38<51:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 0: 97%|█████████▋| 11976/12384 [25:24:46<51:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 97%|█████████▋| 11977/12384 [25:24:46<51:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 97%|█████████▋| 11977/12384 [25:24:54<51:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 0: 97%|█████████▋| 11978/12384 [25:24:54<51:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 0: 97%|█████████▋| 11978/12384 [25:25:01<51:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 0: 97%|█████████▋| 11979/12384 [25:25:01<51:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 0: 97%|█████████▋| 11979/12384 [25:25:09<51:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 97%|█████████▋| 11980/12384 [25:25:09<51:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 97%|█████████▋| 11980/12384 [25:25:17<51:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 97%|█████████▋| 11981/12384 [25:25:17<51:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 97%|█████████▋| 11981/12384 [25:25:24<51:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 0: 97%|█████████▋| 11982/12384 [25:25:24<50:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 0: 97%|█████████▋| 11982/12384 [25:25:32<50:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 0: 97%|█████████▋| 11983/12384 [25:25:32<50:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 0: 97%|█████████▋| 11983/12384 [25:25:39<50:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 97%|█████████▋| 11984/12384 [25:25:39<50:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 97%|█████████▋| 11984/12384 [25:25:47<50:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 97%|█████████▋| 11985/12384 [25:25:47<50:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 97%|█████████▋| 11985/12384 [25:25:55<50:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 0: 97%|█████████▋| 11986/12384 [25:25:55<50:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 0: 97%|█████████▋| 11986/12384 [25:26:02<50:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.72s]
Epoch 0: 97%|█████████▋| 11987/12384 [25:26:02<50:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.72s]
Epoch 0: 97%|█████████▋| 11987/12384 [25:26:10<50:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 97%|█████████▋| 11988/12384 [25:26:10<50:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 97%|█████████▋| 11988/12384 [25:26:17<50:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 0: 97%|█████████▋| 11989/12384 [25:26:17<50:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 0: 97%|█████████▋| 11989/12384 [25:26:25<50:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.25s]
Epoch 0: 97%|█████████▋| 11990/12384 [25:26:25<49:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.25s]
Epoch 0: 97%|█████████▋| 11990/12384 [25:26:33<49:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.75s]
Epoch 0: 97%|█████████▋| 11991/12384 [25:26:33<49:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.75s]
Epoch 0: 97%|█████████▋| 11991/12384 [25:26:40<49:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 97%|█████████▋| 11992/12384 [25:26:40<49:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 97%|█████████▋| 11992/12384 [25:26:48<49:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.90s]
Epoch 0: 97%|█████████▋| 11993/12384 [25:26:48<49:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.90s]
Epoch 0: 97%|█████████▋| 11993/12384 [25:26:55<49:35, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.92s]
Epoch 0: 97%|█████████▋| 11994/12384 [25:26:55<49:26, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.92s]
Epoch 0: 97%|█████████▋| 11994/12384 [25:27:03<49:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 97%|█████████▋| 11995/12384 [25:27:03<49:59, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 97%|█████████▋| 11995/12384 [25:27:11<49:59, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 0: 97%|█████████▋| 11996/12384 [25:27:11<49:40, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 0: 97%|█████████▋| 11996/12384 [25:27:19<49:40, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 97%|█████████▋| 11997/12384 [25:27:19<49:23, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 97%|█████████▋| 11997/12384 [25:27:26<49:23, 7.66s/it, loss=0.0032, acc=0.9978, iter_time=6.67s]
Epoch 0: 97%|█████████▋| 11998/12384 [25:27:26<49:10, 7.64s/it, loss=0.0032, acc=0.9978, iter_time=6.67s]
Epoch 0: 97%|█████████▋| 11998/12384 [25:27:34<49:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 0: 97%|█████████▋| 11999/12384 [25:27:34<48:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 0: 97%|█████████▋| 11999/12384 [25:27:41<48:56, 7.63s/it, loss=0.0001, acc=0.9999, iter_time=9.20s]
Epoch 0: 97%|█████████▋| 12000/12384 [25:27:42<49:10, 7.68s/it, loss=0.0001, acc=0.9999, iter_time=9.20s]
Epoch 0: 97%|█████████▋| 12000/12384 [25:27:49<49:10, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.41s]
Epoch 0: 97%|█████████▋| 12001/12384 [25:27:49<48:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.41s]
Epoch 0: 97%|█████████▋| 12001/12384 [25:27:57<48:54, 7.66s/it, loss=0.0157, acc=0.9605, iter_time=7.60s]
Epoch 0: 97%|█████████▋| 12002/12384 [25:27:57<48:39, 7.64s/it, loss=0.0157, acc=0.9605, iter_time=7.60s]
Epoch 0: 97%|█████████▋| 12002/12384 [25:28:04<48:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 97%|█████████▋| 12003/12384 [25:28:04<48:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 97%|█████████▋| 12003/12384 [25:28:12<48:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.22s]
Epoch 0: 97%|█████████▋| 12004/12384 [25:28:12<48:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.22s]
Epoch 0: 97%|█████████▋| 12004/12384 [25:28:20<48:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.96s]
Epoch 0: 97%|█████████▋| 12005/12384 [25:28:20<48:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.96s]
Epoch 0: 97%|█████████▋| 12005/12384 [25:28:27<48:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 0: 97%|█████████▋| 12006/12384 [25:28:27<47:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 0: 97%|█████████▋| 12006/12384 [25:28:35<47:59, 7.62s/it, loss=0.0003, acc=0.9984, iter_time=8.23s]
Epoch 0: 97%|█████████▋| 12007/12384 [25:28:35<47:48, 7.61s/it, loss=0.0003, acc=0.9984, iter_time=8.23s]
Epoch 0: 97%|█████████▋| 12007/12384 [25:28:43<47:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 97%|█████████▋| 12008/12384 [25:28:43<47:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 97%|█████████▋| 12008/12384 [25:28:50<47:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.92s]
Epoch 0: 97%|█████████▋| 12009/12384 [25:28:50<47:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.92s]
Epoch 0: 97%|█████████▋| 12009/12384 [25:28:58<47:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.36s]
Epoch 0: 97%|█████████▋| 12010/12384 [25:28:58<47:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.36s]
Epoch 0: 97%|█████████▋| 12010/12384 [25:29:05<47:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 97%|█████████▋| 12011/12384 [25:29:05<47:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 0: 97%|█████████▋| 12011/12384 [25:29:14<47:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.38s]
Epoch 0: 97%|█████████▋| 12012/12384 [25:29:14<48:44, 7.86s/it, loss=0.0000, acc=1.0000, iter_time=8.38s]
Epoch 0: 97%|█████████▋| 12012/12384 [25:29:22<48:44, 7.86s/it, loss=0.0000, acc=1.0000, iter_time=8.12s]
Epoch 0: 97%|█████████▋| 12013/12384 [25:29:22<49:04, 7.94s/it, loss=0.0000, acc=1.0000, iter_time=8.12s]
Epoch 0: 97%|█████████▋| 12013/12384 [25:29:31<49:04, 7.94s/it, loss=0.0000, acc=1.0000, iter_time=8.69s]
Epoch 0: 97%|█████████▋| 12014/12384 [25:29:31<50:21, 8.17s/it, loss=0.0000, acc=1.0000, iter_time=8.69s]
Epoch 0: 97%|█████████▋| 12014/12384 [25:29:39<50:21, 8.17s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 97%|█████████▋| 12015/12384 [25:29:39<49:59, 8.13s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 97%|█████████▋| 12015/12384 [25:29:46<49:59, 8.13s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 0: 97%|█████████▋| 12016/12384 [25:29:46<48:59, 7.99s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 0: 97%|█████████▋| 12016/12384 [25:29:54<48:59, 7.99s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 97%|█████████▋| 12017/12384 [25:29:54<48:17, 7.90s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 97%|█████████▋| 12017/12384 [25:30:02<48:17, 7.90s/it, loss=0.0000, acc=1.0000, iter_time=5.14s]
Epoch 0: 97%|█████████▋| 12018/12384 [25:30:02<47:42, 7.82s/it, loss=0.0000, acc=1.0000, iter_time=5.14s]
Epoch 0: 97%|█████████▋| 12018/12384 [25:30:09<47:42, 7.82s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 0: 97%|█████████▋| 12019/12384 [25:30:09<47:18, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 0: 97%|█████████▋| 12019/12384 [25:30:17<47:18, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=9.53s]
Epoch 0: 97%|█████████▋| 12020/12384 [25:30:17<47:17, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=9.53s]
Epoch 0: 97%|█████████▋| 12020/12384 [25:30:25<47:17, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 97%|█████████▋| 12021/12384 [25:30:25<47:37, 7.87s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 0: 97%|█████████▋| 12021/12384 [25:30:33<47:37, 7.87s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 0: 97%|█████████▋| 12022/12384 [25:30:33<47:15, 7.83s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 0: 97%|█████████▋| 12022/12384 [25:30:41<47:15, 7.83s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 97%|█████████▋| 12023/12384 [25:30:41<46:44, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 97%|█████████▋| 12023/12384 [25:30:48<46:44, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 0: 97%|█████████▋| 12024/12384 [25:30:48<46:20, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 0: 97%|█████████▋| 12024/12384 [25:30:56<46:20, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.18s]
Epoch 0: 97%|█████████▋| 12025/12384 [25:30:56<46:02, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.18s]
Epoch 0: 97%|█████████▋| 12025/12384 [25:31:03<46:02, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=5.93s]
Epoch 0: 97%|█████████▋| 12026/12384 [25:31:03<45:48, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=5.93s]
Epoch 0: 97%|█████████▋| 12026/12384 [25:31:11<45:48, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.08s]
Epoch 0: 97%|█████████▋| 12027/12384 [25:31:11<45:36, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.08s]
Epoch 0: 97%|█████████▋| 12027/12384 [25:31:19<45:36, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 0: 97%|█████████▋| 12028/12384 [25:31:19<45:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 0: 97%|█████████▋| 12028/12384 [25:31:26<45:24, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 97%|█████████▋| 12029/12384 [25:31:26<45:12, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 97%|█████████▋| 12029/12384 [25:31:34<45:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 0: 97%|█████████▋| 12030/12384 [25:31:34<45:19, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 0: 97%|█████████▋| 12030/12384 [25:31:42<45:19, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 0: 97%|█████████▋| 12031/12384 [25:31:42<45:47, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 0: 97%|█████████▋| 12031/12384 [25:31:50<45:47, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 97%|█████████▋| 12032/12384 [25:31:50<45:24, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 97%|█████████▋| 12032/12384 [25:31:57<45:24, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 97%|█████████▋| 12033/12384 [25:31:57<45:02, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 97%|█████████▋| 12033/12384 [25:32:05<45:02, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 97%|█████████▋| 12034/12384 [25:32:05<44:47, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 97%|█████████▋| 12034/12384 [25:32:13<44:47, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 97%|█████████▋| 12035/12384 [25:32:13<44:32, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 97%|█████████▋| 12035/12384 [25:32:20<44:32, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 97%|█████████▋| 12036/12384 [25:32:20<44:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 97%|█████████▋| 12036/12384 [25:32:28<44:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 97%|█████████▋| 12037/12384 [25:32:28<44:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 97%|█████████▋| 12037/12384 [25:32:35<44:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 97%|█████████▋| 12038/12384 [25:32:35<43:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 97%|█████████▋| 12038/12384 [25:32:43<43:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 97%|█████████▋| 12039/12384 [25:32:43<43:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 97%|█████████▋| 12039/12384 [25:32:51<43:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 0: 97%|█████████▋| 12040/12384 [25:32:51<43:57, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 0: 97%|█████████▋| 12040/12384 [25:32:58<43:57, 7.67s/it, loss=0.0005, acc=1.0000, iter_time=7.35s]
Epoch 0: 97%|█████████▋| 12041/12384 [25:32:58<43:48, 7.66s/it, loss=0.0005, acc=1.0000, iter_time=7.35s]
Epoch 0: 97%|█████████▋| 12041/12384 [25:33:06<43:48, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 97%|█████████▋| 12042/12384 [25:33:06<43:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 97%|█████████▋| 12042/12384 [25:33:14<43:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 0: 97%|█████████▋| 12043/12384 [25:33:14<43:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 0: 97%|█████████▋| 12043/12384 [25:33:21<43:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 0: 97%|█████████▋| 12044/12384 [25:33:21<43:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 0: 97%|█████████▋| 12044/12384 [25:33:29<43:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 97%|█████████▋| 12045/12384 [25:33:29<43:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 97%|█████████▋| 12045/12384 [25:33:37<43:06, 7.63s/it, loss=0.0007, acc=0.9976, iter_time=7.92s]
Epoch 0: 97%|█████████▋| 12046/12384 [25:33:37<43:28, 7.72s/it, loss=0.0007, acc=0.9976, iter_time=7.92s]
Epoch 0: 97%|█████████▋| 12046/12384 [25:33:45<43:28, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 97%|█████████▋| 12047/12384 [25:33:45<43:11, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 97%|█████████▋| 12047/12384 [25:33:52<43:11, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 0: 97%|█████████▋| 12048/12384 [25:33:52<43:24, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 0: 97%|█████████▋| 12048/12384 [25:34:00<43:24, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 97%|█████████▋| 12049/12384 [25:34:00<43:05, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 97%|█████████▋| 12049/12384 [25:34:08<43:05, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 0: 97%|█████████▋| 12050/12384 [25:34:08<42:46, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 0: 97%|█████████▋| 12050/12384 [25:34:15<42:46, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 0: 97%|█████████▋| 12051/12384 [25:34:15<42:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 0: 97%|█████████▋| 12051/12384 [25:34:23<42:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 0: 97%|█████████▋| 12052/12384 [25:34:23<42:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 0: 97%|█████████▋| 12052/12384 [25:34:30<42:16, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.48s]
Epoch 0: 97%|█████████▋| 12053/12384 [25:34:30<42:04, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.48s]
Epoch 0: 97%|█████████▋| 12053/12384 [25:34:38<42:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 0: 97%|█████████▋| 12054/12384 [25:34:38<41:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 0: 97%|█████████▋| 12054/12384 [25:34:46<41:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 97%|█████████▋| 12055/12384 [25:34:46<41:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 97%|█████████▋| 12055/12384 [25:34:53<41:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 97%|█████████▋| 12056/12384 [25:34:53<41:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 97%|█████████▋| 12056/12384 [25:35:01<41:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 97%|█████████▋| 12057/12384 [25:35:01<41:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 97%|█████████▋| 12057/12384 [25:35:09<41:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 97%|█████████▋| 12058/12384 [25:35:09<41:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 97%|█████████▋| 12058/12384 [25:35:16<41:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 97%|█████████▋| 12059/12384 [25:35:16<41:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 97%|█████████▋| 12059/12384 [25:35:24<41:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.25s]
Epoch 0: 97%|█████████▋| 12060/12384 [25:35:24<41:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.25s]
Epoch 0: 97%|█████████▋| 12060/12384 [25:35:31<41:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 0: 97%|█████████▋| 12061/12384 [25:35:31<40:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 0: 97%|█████████▋| 12061/12384 [25:35:39<40:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 97%|█████████▋| 12062/12384 [25:35:39<40:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 97%|█████████▋| 12062/12384 [25:35:47<40:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 97%|█████████▋| 12063/12384 [25:35:47<40:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 97%|█████████▋| 12063/12384 [25:35:54<40:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 97%|█████████▋| 12064/12384 [25:35:54<40:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 97%|█████████▋| 12064/12384 [25:36:02<40:38, 7.62s/it, loss=0.0002, acc=0.9993, iter_time=7.21s]
Epoch 0: 97%|█████████▋| 12065/12384 [25:36:02<40:28, 7.61s/it, loss=0.0002, acc=0.9993, iter_time=7.21s]
Epoch 0: 97%|█████████▋| 12065/12384 [25:36:09<40:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 0: 97%|█████████▋| 12066/12384 [25:36:09<40:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 0: 97%|█████████▋| 12066/12384 [25:36:17<40:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 0: 97%|█████████▋| 12067/12384 [25:36:17<40:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 0: 97%|█████████▋| 12067/12384 [25:36:25<40:13, 7.61s/it, loss=0.0004, acc=0.9998, iter_time=5.82s]
Epoch 0: 97%|█████████▋| 12068/12384 [25:36:25<40:04, 7.61s/it, loss=0.0004, acc=0.9998, iter_time=5.82s]
Epoch 0: 97%|█████████▋| 12068/12384 [25:36:32<40:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 0: 97%|█████████▋| 12069/12384 [25:36:32<39:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 0: 97%|█████████▋| 12069/12384 [25:36:40<39:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 0: 97%|█████████▋| 12070/12384 [25:36:40<39:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 0: 97%|█████████▋| 12070/12384 [25:36:47<39:50, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=9.62s]
Epoch 0: 97%|█████████▋| 12071/12384 [25:36:47<39:41, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=9.62s]
Epoch 0: 97%|█████████▋| 12071/12384 [25:36:55<39:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 0: 97%|█████████▋| 12072/12384 [25:36:55<40:04, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 0: 97%|█████████▋| 12072/12384 [25:37:03<40:04, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 0: 97%|█████████▋| 12073/12384 [25:37:03<40:04, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 0: 97%|█████████▋| 12073/12384 [25:37:11<40:04, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 0: 97%|█████████▋| 12074/12384 [25:37:11<40:19, 7.81s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 0: 97%|█████████▋| 12074/12384 [25:37:19<40:19, 7.81s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 98%|█████████▊| 12075/12384 [25:37:19<39:54, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 98%|█████████▊| 12075/12384 [25:37:26<39:54, 7.75s/it, loss=0.0002, acc=0.9993, iter_time=7.62s]
Epoch 0: 98%|█████████▊| 12076/12384 [25:37:26<39:37, 7.72s/it, loss=0.0002, acc=0.9993, iter_time=7.62s]
Epoch 0: 98%|█████████▊| 12076/12384 [25:37:34<39:37, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 0: 98%|█████████▊| 12077/12384 [25:37:34<39:19, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 0: 98%|█████████▊| 12077/12384 [25:37:42<39:19, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 0: 98%|█████████▊| 12078/12384 [25:37:42<39:04, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 0: 98%|█████████▊| 12078/12384 [25:37:49<39:04, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 98%|█████████▊| 12079/12384 [25:37:49<38:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 98%|█████████▊| 12079/12384 [25:37:57<38:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 98%|█████████▊| 12080/12384 [25:37:57<38:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 98%|█████████▊| 12080/12384 [25:38:05<38:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.58s]
Epoch 0: 98%|█████████▊| 12081/12384 [25:38:05<38:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.58s]
Epoch 0: 98%|█████████▊| 12081/12384 [25:38:12<38:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 0: 98%|█████████▊| 12082/12384 [25:38:12<38:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 0: 98%|█████████▊| 12082/12384 [25:38:20<38:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 98%|█████████▊| 12083/12384 [25:38:20<38:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 98%|█████████▊| 12083/12384 [25:38:27<38:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 98%|█████████▊| 12084/12384 [25:38:27<38:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 98%|█████████▊| 12084/12384 [25:38:35<38:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 0: 98%|█████████▊| 12085/12384 [25:38:35<37:53, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 0: 98%|█████████▊| 12085/12384 [25:38:43<37:53, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 0: 98%|█████████▊| 12086/12384 [25:38:43<37:45, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 0: 98%|█████████▊| 12086/12384 [25:38:50<37:45, 7.60s/it, loss=0.0009, acc=0.9987, iter_time=7.59s]
Epoch 0: 98%|█████████▊| 12087/12384 [25:38:50<37:36, 7.60s/it, loss=0.0009, acc=0.9987, iter_time=7.59s]
Epoch 0: 98%|█████████▊| 12087/12384 [25:38:58<37:36, 7.60s/it, loss=0.0002, acc=0.9981, iter_time=7.98s]
Epoch 0: 98%|█████████▊| 12088/12384 [25:38:58<37:29, 7.60s/it, loss=0.0002, acc=0.9981, iter_time=7.98s]
Epoch 0: 98%|█████████▊| 12088/12384 [25:39:05<37:29, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 98%|█████████▊| 12089/12384 [25:39:05<37:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 98%|█████████▊| 12089/12384 [25:39:13<37:24, 7.61s/it, loss=0.0002, acc=0.9990, iter_time=7.32s]
Epoch 0: 98%|█████████▊| 12090/12384 [25:39:13<37:20, 7.62s/it, loss=0.0002, acc=0.9990, iter_time=7.32s]
Epoch 0: 98%|█████████▊| 12090/12384 [25:39:21<37:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 0: 98%|█████████▊| 12091/12384 [25:39:21<37:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 0: 98%|█████████▊| 12091/12384 [25:39:28<37:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 98%|█████████▊| 12092/12384 [25:39:28<37:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 98%|█████████▊| 12092/12384 [25:39:37<37:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.41s]
Epoch 0: 98%|█████████▊| 12093/12384 [25:39:37<38:04, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=8.41s]
Epoch 0: 98%|█████████▊| 12093/12384 [25:39:44<38:04, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 98%|█████████▊| 12094/12384 [25:39:44<37:37, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 98%|█████████▊| 12094/12384 [25:39:52<37:37, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 98%|█████████▊| 12095/12384 [25:39:52<37:13, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 98%|█████████▊| 12095/12384 [25:39:59<37:13, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 98%|█████████▊| 12096/12384 [25:39:59<36:54, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 98%|█████████▊| 12096/12384 [25:40:07<36:54, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.57s]
Epoch 0: 98%|█████████▊| 12097/12384 [25:40:07<36:39, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.57s]
Epoch 0: 98%|█████████▊| 12097/12384 [25:40:15<36:39, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 0: 98%|█████████▊| 12098/12384 [25:40:15<36:53, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 0: 98%|█████████▊| 12098/12384 [25:40:23<36:53, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 98%|█████████▊| 12099/12384 [25:40:23<36:41, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 98%|█████████▊| 12099/12384 [25:40:30<36:41, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 0: 98%|█████████▊| 12100/12384 [25:40:30<36:24, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 0: 98%|█████████▊| 12100/12384 [25:40:38<36:24, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 0: 98%|█████████▊| 12101/12384 [25:40:38<36:38, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 0: 98%|█████████▊| 12101/12384 [25:40:46<36:38, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 98%|█████████▊| 12102/12384 [25:40:46<36:16, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 0: 98%|█████████▊| 12102/12384 [25:40:53<36:16, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 98%|█████████▊| 12103/12384 [25:40:53<35:59, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 0: 98%|█████████▊| 12103/12384 [25:41:01<35:59, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.62s]
Epoch 0: 98%|█████████▊| 12104/12384 [25:41:01<35:44, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.62s]
Epoch 0: 98%|█████████▊| 12104/12384 [25:41:09<35:44, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 98%|█████████▊| 12105/12384 [25:41:09<35:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 98%|█████████▊| 12105/12384 [25:41:16<35:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 98%|█████████▊| 12106/12384 [25:41:16<35:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 98%|█████████▊| 12106/12384 [25:41:24<35:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 0: 98%|█████████▊| 12107/12384 [25:41:24<35:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 0: 98%|█████████▊| 12107/12384 [25:41:31<35:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 0: 98%|█████████▊| 12108/12384 [25:41:31<35:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 0: 98%|█████████▊| 12108/12384 [25:41:39<35:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 0: 98%|█████████▊| 12109/12384 [25:41:39<34:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 0: 98%|█████████▊| 12109/12384 [25:41:47<34:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 0: 98%|█████████▊| 12110/12384 [25:41:47<34:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 0: 98%|█████████▊| 12110/12384 [25:41:54<34:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 0: 98%|█████████▊| 12111/12384 [25:41:54<34:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 0: 98%|█████████▊| 12111/12384 [25:42:02<34:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.27s]
Epoch 0: 98%|█████████▊| 12112/12384 [25:42:02<34:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.27s]
Epoch 0: 98%|█████████▊| 12112/12384 [25:42:09<34:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.87s]
Epoch 0: 98%|█████████▊| 12113/12384 [25:42:09<34:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.87s]
Epoch 0: 98%|█████████▊| 12113/12384 [25:42:17<34:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 0: 98%|█████████▊| 12114/12384 [25:42:17<34:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 0: 98%|█████████▊| 12114/12384 [25:42:25<34:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.22s]
Epoch 0: 98%|█████████▊| 12115/12384 [25:42:25<34:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.22s]
Epoch 0: 98%|█████████▊| 12115/12384 [25:42:32<34:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 0: 98%|█████████▊| 12116/12384 [25:42:32<34:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 0: 98%|█████████▊| 12116/12384 [25:42:40<34:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 0: 98%|█████████▊| 12117/12384 [25:42:40<33:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 0: 98%|█████████▊| 12117/12384 [25:42:48<33:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.85s]
Epoch 0: 98%|█████████▊| 12118/12384 [25:42:48<33:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.85s]
Epoch 0: 98%|█████████▊| 12118/12384 [25:42:55<33:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.67s]
Epoch 0: 98%|█████████▊| 12119/12384 [25:42:55<33:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.67s]
Epoch 0: 98%|█████████▊| 12119/12384 [25:43:03<33:38, 7.62s/it, loss=0.0017, acc=0.9953, iter_time=9.97s]
Epoch 0: 98%|█████████▊| 12120/12384 [25:43:03<33:33, 7.63s/it, loss=0.0017, acc=0.9953, iter_time=9.97s]
Epoch 0: 98%|█████████▊| 12120/12384 [25:43:11<33:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.41s]
Epoch 0: 98%|█████████▊| 12121/12384 [25:43:11<33:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.41s]
Epoch 0: 98%|█████████▊| 12121/12384 [25:43:18<33:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 98%|█████████▊| 12122/12384 [25:43:18<33:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 98%|█████████▊| 12122/12384 [25:43:26<33:22, 7.64s/it, loss=0.0022, acc=0.9976, iter_time=4.48s]
Epoch 0: 98%|█████████▊| 12123/12384 [25:43:26<33:12, 7.63s/it, loss=0.0022, acc=0.9976, iter_time=4.48s]
Epoch 0: 98%|█████████▊| 12123/12384 [25:43:34<33:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.03s]
Epoch 0: 98%|█████████▊| 12124/12384 [25:43:34<33:24, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=11.03s]
Epoch 0: 98%|█████████▊| 12124/12384 [25:43:41<33:24, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 98%|█████████▊| 12125/12384 [25:43:41<33:07, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 98%|█████████▊| 12125/12384 [25:43:49<33:07, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 98%|█████████▊| 12126/12384 [25:43:49<32:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 98%|█████████▊| 12126/12384 [25:43:57<32:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.33s]
Epoch 0: 98%|█████████▊| 12127/12384 [25:43:57<33:07, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=4.33s]
Epoch 0: 98%|█████████▊| 12127/12384 [25:44:05<33:07, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=11.22s]
Epoch 0: 98%|█████████▊| 12128/12384 [25:44:05<32:57, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=11.22s]
Epoch 0: 98%|█████████▊| 12128/12384 [25:44:12<32:57, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 98%|█████████▊| 12129/12384 [25:44:12<32:40, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 98%|█████████▊| 12129/12384 [25:44:20<32:40, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 98%|█████████▊| 12130/12384 [25:44:20<32:25, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 98%|█████████▊| 12130/12384 [25:44:27<32:25, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 0: 98%|█████████▊| 12131/12384 [25:44:27<32:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 0: 98%|█████████▊| 12131/12384 [25:44:35<32:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.92s]
Epoch 0: 98%|█████████▊| 12132/12384 [25:44:35<32:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.92s]
Epoch 0: 98%|█████████▊| 12132/12384 [25:44:43<32:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 0: 98%|█████████▊| 12133/12384 [25:44:43<31:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 0: 98%|█████████▊| 12133/12384 [25:44:50<31:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 0: 98%|█████████▊| 12134/12384 [25:44:50<31:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 0: 98%|█████████▊| 12134/12384 [25:44:58<31:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 0: 98%|█████████▊| 12135/12384 [25:44:58<31:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 0: 98%|█████████▊| 12135/12384 [25:45:05<31:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 98%|█████████▊| 12136/12384 [25:45:05<31:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 98%|█████████▊| 12136/12384 [25:45:13<31:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 98%|█████████▊| 12137/12384 [25:45:13<31:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 98%|█████████▊| 12137/12384 [25:45:21<31:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 98%|█████████▊| 12138/12384 [25:45:21<31:10, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 98%|█████████▊| 12138/12384 [25:45:28<31:10, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 0: 98%|█████████▊| 12139/12384 [25:45:28<31:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 0: 98%|█████████▊| 12139/12384 [25:45:36<31:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.44s]
Epoch 0: 98%|█████████▊| 12140/12384 [25:45:36<30:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.44s]
Epoch 0: 98%|█████████▊| 12140/12384 [25:45:43<30:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.31s]
Epoch 0: 98%|█████████▊| 12141/12384 [25:45:43<30:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.31s]
Epoch 0: 98%|█████████▊| 12141/12384 [25:45:51<30:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 0: 98%|█████████▊| 12142/12384 [25:45:51<30:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 0: 98%|█████████▊| 12142/12384 [25:45:59<30:43, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=4.55s]
Epoch 0: 98%|█████████▊| 12143/12384 [25:45:59<30:34, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=4.55s]
Epoch 0: 98%|█████████▊| 12143/12384 [25:46:06<30:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.62s]
Epoch 0: 98%|█████████▊| 12144/12384 [25:46:06<30:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.62s]
Epoch 0: 98%|█████████▊| 12144/12384 [25:46:14<30:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 98%|█████████▊| 12145/12384 [25:46:14<30:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 98%|█████████▊| 12145/12384 [25:46:22<30:19, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.55s]
Epoch 0: 98%|█████████▊| 12146/12384 [25:46:22<30:13, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.55s]
Epoch 0: 98%|█████████▊| 12146/12384 [25:46:29<30:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 0: 98%|█████████▊| 12147/12384 [25:46:29<30:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 0: 98%|█████████▊| 12147/12384 [25:46:37<30:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 98%|█████████▊| 12148/12384 [25:46:37<29:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 98%|█████████▊| 12148/12384 [25:46:44<29:57, 7.62s/it, loss=0.0008, acc=0.9982, iter_time=7.63s]
Epoch 0: 98%|█████████▊| 12149/12384 [25:46:44<29:53, 7.63s/it, loss=0.0008, acc=0.9982, iter_time=7.63s]
Epoch 0: 98%|█████████▊| 12149/12384 [25:46:52<29:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 0: 98%|█████████▊| 12150/12384 [25:46:52<29:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 0: 98%|█████████▊| 12150/12384 [25:47:00<29:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 98%|█████████▊| 12151/12384 [25:47:00<29:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 98%|█████████▊| 12151/12384 [25:47:07<29:35, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.01s]
Epoch 0: 98%|█████████▊| 12152/12384 [25:47:07<29:27, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.01s]
Epoch 0: 98%|█████████▊| 12152/12384 [25:47:15<29:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 0: 98%|█████████▊| 12153/12384 [25:47:15<29:44, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 0: 98%|█████████▊| 12153/12384 [25:47:23<29:44, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 0: 98%|█████████▊| 12154/12384 [25:47:23<29:35, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 0: 98%|█████████▊| 12154/12384 [25:47:31<29:35, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 0: 98%|█████████▊| 12155/12384 [25:47:31<29:21, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 0: 98%|█████████▊| 12155/12384 [25:47:38<29:21, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 0: 98%|█████████▊| 12156/12384 [25:47:38<29:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 0: 98%|█████████▊| 12156/12384 [25:47:46<29:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 0: 98%|█████████▊| 12157/12384 [25:47:46<29:03, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 0: 98%|█████████▊| 12157/12384 [25:47:53<29:03, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.33s]
Epoch 0: 98%|█████████▊| 12158/12384 [25:47:53<28:51, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.33s]
Epoch 0: 98%|█████████▊| 12158/12384 [25:48:01<28:51, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 98%|█████████▊| 12159/12384 [25:48:01<28:39, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 98%|█████████▊| 12159/12384 [25:48:09<28:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 0: 98%|█████████▊| 12160/12384 [25:48:09<28:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 0: 98%|█████████▊| 12160/12384 [25:48:16<28:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.85s]
Epoch 0: 98%|█████████▊| 12161/12384 [25:48:16<28:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.85s]
Epoch 0: 98%|█████████▊| 12161/12384 [25:48:24<28:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.98s]
Epoch 0: 98%|█████████▊| 12162/12384 [25:48:24<28:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.98s]
Epoch 0: 98%|█████████▊| 12162/12384 [25:48:32<28:12, 7.62s/it, loss=0.0000, acc=0.9999, iter_time=9.06s]
Epoch 0: 98%|█████████▊| 12163/12384 [25:48:32<28:03, 7.62s/it, loss=0.0000, acc=0.9999, iter_time=9.06s]
Epoch 0: 98%|█████████▊| 12163/12384 [25:48:39<28:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 0: 98%|█████████▊| 12164/12384 [25:48:39<27:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 0: 98%|█████████▊| 12164/12384 [25:48:47<27:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 0: 98%|█████████▊| 12165/12384 [25:48:47<27:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 0: 98%|█████████▊| 12165/12384 [25:48:54<27:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 98%|█████████▊| 12166/12384 [25:48:54<27:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 98%|█████████▊| 12166/12384 [25:49:02<27:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 98%|█████████▊| 12167/12384 [25:49:02<27:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 98%|█████████▊| 12167/12384 [25:49:10<27:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 98%|█████████▊| 12168/12384 [25:49:10<27:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 98%|█████████▊| 12168/12384 [25:49:17<27:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 98%|█████████▊| 12169/12384 [25:49:17<27:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 98%|█████████▊| 12169/12384 [25:49:25<27:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 0: 98%|█████████▊| 12170/12384 [25:49:25<27:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 0: 98%|█████████▊| 12170/12384 [25:49:33<27:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 0: 98%|█████████▊| 12171/12384 [25:49:33<27:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 0: 98%|█████████▊| 12171/12384 [25:49:40<27:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 98%|█████████▊| 12172/12384 [25:49:40<26:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 98%|█████████▊| 12172/12384 [25:49:48<26:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 0: 98%|█████████▊| 12173/12384 [25:49:48<26:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 0: 98%|█████████▊| 12173/12384 [25:49:56<26:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.76s]
Epoch 0: 98%|█████████▊| 12174/12384 [25:49:56<26:49, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.76s]
Epoch 0: 98%|█████████▊| 12174/12384 [25:50:04<26:49, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 0: 98%|█████████▊| 12175/12384 [25:50:04<27:16, 7.83s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 0: 98%|█████████▊| 12175/12384 [25:50:11<27:16, 7.83s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 98%|█████████▊| 12176/12384 [25:50:11<26:54, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 98%|█████████▊| 12176/12384 [25:50:19<26:54, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 0: 98%|█████████▊| 12177/12384 [25:50:19<26:54, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 0: 98%|█████████▊| 12177/12384 [25:50:27<26:54, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 98%|█████████▊| 12178/12384 [25:50:27<26:35, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 98%|█████████▊| 12178/12384 [25:50:35<26:35, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=5.42s]
Epoch 0: 98%|█████████▊| 12179/12384 [25:50:35<26:39, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=5.42s]
Epoch 0: 98%|█████████▊| 12179/12384 [25:50:42<26:39, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 0: 98%|█████████▊| 12180/12384 [25:50:42<26:20, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 0: 98%|█████████▊| 12180/12384 [25:50:50<26:20, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 0: 98%|█████████▊| 12181/12384 [25:50:50<26:06, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 0: 98%|█████████▊| 12181/12384 [25:50:58<26:06, 7.72s/it, loss=0.0001, acc=0.9996, iter_time=9.13s]
Epoch 0: 98%|█████████▊| 12182/12384 [25:50:58<25:52, 7.69s/it, loss=0.0001, acc=0.9996, iter_time=9.13s]
Epoch 0: 98%|█████████▊| 12182/12384 [25:51:05<25:52, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 98%|█████████▊| 12183/12384 [25:51:05<25:40, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 98%|█████████▊| 12183/12384 [25:51:13<25:40, 7.66s/it, loss=0.0037, acc=0.9957, iter_time=8.00s]
Epoch 0: 98%|█████████▊| 12184/12384 [25:51:13<25:30, 7.65s/it, loss=0.0037, acc=0.9957, iter_time=8.00s]
Epoch 0: 98%|█████████▊| 12184/12384 [25:51:21<25:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.44s]
Epoch 0: 98%|█████████▊| 12185/12384 [25:51:21<25:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.44s]
Epoch 0: 98%|█████████▊| 12185/12384 [25:51:28<25:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 0: 98%|█████████▊| 12186/12384 [25:51:28<25:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 0: 98%|█████████▊| 12186/12384 [25:51:36<25:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.83s]
Epoch 0: 98%|█████████▊| 12187/12384 [25:51:36<25:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.83s]
Epoch 0: 98%|█████████▊| 12187/12384 [25:51:43<25:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.87s]
Epoch 0: 98%|█████████▊| 12188/12384 [25:51:43<24:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.87s]
Epoch 0: 98%|█████████▊| 12188/12384 [25:51:51<24:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 0: 98%|█████████▊| 12189/12384 [25:51:51<24:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 0: 98%|█████████▊| 12189/12384 [25:51:59<24:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.50s]
Epoch 0: 98%|█████████▊| 12190/12384 [25:51:59<24:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.50s]
Epoch 0: 98%|█████████▊| 12190/12384 [25:52:06<24:36, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.19s]
Epoch 0: 98%|█████████▊| 12191/12384 [25:52:06<24:29, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.19s]
Epoch 0: 98%|█████████▊| 12191/12384 [25:52:14<24:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.53s]
Epoch 0: 98%|█████████▊| 12192/12384 [25:52:14<24:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.53s]
Epoch 0: 98%|█████████▊| 12192/12384 [25:52:21<24:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 98%|█████████▊| 12193/12384 [25:52:21<24:12, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 0: 98%|█████████▊| 12193/12384 [25:52:29<24:12, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 0: 98%|█████████▊| 12194/12384 [25:52:29<24:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 0: 98%|█████████▊| 12194/12384 [25:52:37<24:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 0: 98%|█████████▊| 12195/12384 [25:52:37<23:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 0: 98%|█████████▊| 12195/12384 [25:52:44<23:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 98%|█████████▊| 12196/12384 [25:52:44<23:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 98%|█████████▊| 12196/12384 [25:52:52<23:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 0: 98%|█████████▊| 12197/12384 [25:52:52<23:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 0: 98%|█████████▊| 12197/12384 [25:52:59<23:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 0: 98%|█████████▊| 12198/12384 [25:52:59<23:33, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 0: 98%|█████████▊| 12198/12384 [25:53:07<23:33, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 99%|█████████▊| 12199/12384 [25:53:07<23:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 99%|█████████▊| 12199/12384 [25:53:15<23:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 0: 99%|█████████▊| 12200/12384 [25:53:15<23:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 0: 99%|█████████▊| 12200/12384 [25:53:22<23:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.18s]
Epoch 0: 99%|█████████▊| 12201/12384 [25:53:22<23:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.18s]
Epoch 0: 99%|█████████▊| 12201/12384 [25:53:30<23:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 99%|█████████▊| 12202/12384 [25:53:30<23:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 99%|█████████▊| 12202/12384 [25:53:38<23:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 99%|█████████▊| 12203/12384 [25:53:38<23:13, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 99%|█████████▊| 12203/12384 [25:53:45<23:13, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 99%|█████████▊| 12204/12384 [25:53:45<23:01, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 99%|█████████▊| 12204/12384 [25:53:53<23:01, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 99%|█████████▊| 12205/12384 [25:53:53<23:10, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 99%|█████████▊| 12205/12384 [25:54:01<23:10, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 99%|█████████▊| 12206/12384 [25:54:01<22:54, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 99%|█████████▊| 12206/12384 [25:54:09<22:54, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 99%|█████████▊| 12207/12384 [25:54:09<22:40, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 99%|█████████▊| 12207/12384 [25:54:16<22:40, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 0: 99%|█████████▊| 12208/12384 [25:54:16<22:28, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 0: 99%|█████████▊| 12208/12384 [25:54:24<22:28, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.70s]
Epoch 0: 99%|█████████▊| 12209/12384 [25:54:24<22:21, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.70s]
Epoch 0: 99%|█████████▊| 12209/12384 [25:54:31<22:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 99%|█████████▊| 12210/12384 [25:54:31<22:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 99%|█████████▊| 12210/12384 [25:54:39<22:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 0: 99%|█████████▊| 12211/12384 [25:54:39<22:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 0: 99%|█████████▊| 12211/12384 [25:54:47<22:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 0: 99%|█████████▊| 12212/12384 [25:54:47<21:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 0: 99%|█████████▊| 12212/12384 [25:54:54<21:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 99%|█████████▊| 12213/12384 [25:54:54<21:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 99%|█████████▊| 12213/12384 [25:55:02<21:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 99%|█████████▊| 12214/12384 [25:55:02<21:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 99%|█████████▊| 12214/12384 [25:55:10<21:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 0: 99%|█████████▊| 12215/12384 [25:55:10<21:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 0: 99%|█████████▊| 12215/12384 [25:55:17<21:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 0: 99%|█████████▊| 12216/12384 [25:55:17<21:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 0: 99%|█████████▊| 12216/12384 [25:55:25<21:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 0: 99%|█████████▊| 12217/12384 [25:55:25<21:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 0: 99%|█████████▊| 12217/12384 [25:55:32<21:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 0: 99%|█████████▊| 12218/12384 [25:55:32<21:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 0: 99%|█████████▊| 12218/12384 [25:55:40<21:03, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 99%|█████████▊| 12219/12384 [25:55:40<20:55, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 99%|█████████▊| 12219/12384 [25:55:48<20:55, 7.61s/it, loss=0.0004, acc=0.9986, iter_time=7.61s]
Epoch 0: 99%|█████████▊| 12220/12384 [25:55:48<20:50, 7.62s/it, loss=0.0004, acc=0.9986, iter_time=7.61s]
Epoch 0: 99%|█████████▊| 12220/12384 [25:55:55<20:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 99%|█████████▊| 12221/12384 [25:55:55<20:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 99%|█████████▊| 12221/12384 [25:56:04<20:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 0: 99%|█████████▊| 12222/12384 [25:56:04<21:25, 7.94s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 0: 99%|█████████▊| 12222/12384 [25:56:12<21:25, 7.94s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 99%|█████████▊| 12223/12384 [25:56:12<21:01, 7.84s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 99%|█████████▊| 12223/12384 [25:56:19<21:01, 7.84s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 99%|█████████▊| 12224/12384 [25:56:19<20:43, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 99%|█████████▊| 12224/12384 [25:56:27<20:43, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 99%|█████████▊| 12225/12384 [25:56:27<20:30, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 99%|█████████▊| 12225/12384 [25:56:35<20:30, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 99%|█████████▊| 12226/12384 [25:56:35<20:16, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 99%|█████████▊| 12226/12384 [25:56:42<20:16, 7.70s/it, loss=0.0003, acc=0.9999, iter_time=7.62s]
Epoch 0: 99%|█████████▊| 12227/12384 [25:56:42<20:05, 7.68s/it, loss=0.0003, acc=0.9999, iter_time=7.62s]
Epoch 0: 99%|█████████▊| 12227/12384 [25:56:50<20:05, 7.68s/it, loss=0.0018, acc=0.9954, iter_time=7.62s]
Epoch 0: 99%|█████████▊| 12228/12384 [25:56:50<19:53, 7.65s/it, loss=0.0018, acc=0.9954, iter_time=7.62s]
Epoch 0: 99%|█████████▊| 12228/12384 [25:56:58<19:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 99%|█████████▊| 12229/12384 [25:56:58<20:01, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 99%|█████████▊| 12229/12384 [25:57:05<20:01, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 99%|█████████▉| 12230/12384 [25:57:05<19:47, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 99%|█████████▉| 12230/12384 [25:57:13<19:47, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.78s]
Epoch 0: 99%|█████████▉| 12231/12384 [25:57:13<19:37, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.78s]
Epoch 0: 99%|█████████▉| 12231/12384 [25:57:21<19:37, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 0: 99%|█████████▉| 12232/12384 [25:57:21<19:38, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 0: 99%|█████████▉| 12232/12384 [25:57:29<19:38, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 99%|█████████▉| 12233/12384 [25:57:29<19:25, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 99%|█████████▉| 12233/12384 [25:57:36<19:25, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 99%|█████████▉| 12234/12384 [25:57:36<19:12, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 99%|█████████▉| 12234/12384 [25:57:44<19:12, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 99%|█████████▉| 12235/12384 [25:57:44<19:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 99%|█████████▉| 12235/12384 [25:57:51<19:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 99%|█████████▉| 12236/12384 [25:57:51<18:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 99%|█████████▉| 12236/12384 [25:57:59<18:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 0: 99%|█████████▉| 12237/12384 [25:57:59<18:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 0: 99%|█████████▉| 12237/12384 [25:58:07<18:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 0: 99%|█████████▉| 12238/12384 [25:58:07<18:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 0: 99%|█████████▉| 12238/12384 [25:58:14<18:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 0: 99%|█████████▉| 12239/12384 [25:58:14<18:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 0: 99%|█████████▉| 12239/12384 [25:58:22<18:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 0: 99%|█████████▉| 12240/12384 [25:58:22<18:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 0: 99%|█████████▉| 12240/12384 [25:58:29<18:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 99%|█████████▉| 12241/12384 [25:58:29<18:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 99%|█████████▉| 12241/12384 [25:58:37<18:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 99%|█████████▉| 12242/12384 [25:58:37<18:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 99%|█████████▉| 12242/12384 [25:58:45<18:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 99%|█████████▉| 12243/12384 [25:58:45<17:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 99%|█████████▉| 12243/12384 [25:58:52<17:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 99%|█████████▉| 12244/12384 [25:58:52<17:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 99%|█████████▉| 12244/12384 [25:59:00<17:47, 7.62s/it, loss=0.0002, acc=0.9982, iter_time=7.62s]
Epoch 0: 99%|█████████▉| 12245/12384 [25:59:00<17:38, 7.62s/it, loss=0.0002, acc=0.9982, iter_time=7.62s]
Epoch 0: 99%|█████████▉| 12245/12384 [25:59:07<17:38, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=4.46s]
Epoch 0: 99%|█████████▉| 12246/12384 [25:59:07<17:30, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=4.46s]
Epoch 0: 99%|█████████▉| 12246/12384 [25:59:15<17:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 0: 99%|█████████▉| 12247/12384 [25:59:15<17:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 0: 99%|█████████▉| 12247/12384 [25:59:23<17:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 99%|█████████▉| 12248/12384 [25:59:23<17:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 99%|█████████▉| 12248/12384 [25:59:30<17:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 99%|█████████▉| 12249/12384 [25:59:30<17:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 99%|█████████▉| 12249/12384 [25:59:38<17:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 99%|█████████▉| 12250/12384 [25:59:38<17:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 0: 99%|█████████▉| 12250/12384 [25:59:46<17:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 99%|█████████▉| 12251/12384 [25:59:46<16:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 0: 99%|█████████▉| 12251/12384 [25:59:53<16:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 99%|█████████▉| 12252/12384 [25:59:53<16:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 99%|█████████▉| 12252/12384 [26:00:01<16:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 0: 99%|█████████▉| 12253/12384 [26:00:01<16:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 0: 99%|█████████▉| 12253/12384 [26:00:08<16:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.91s]
Epoch 0: 99%|█████████▉| 12254/12384 [26:00:08<16:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.91s]
Epoch 0: 99%|█████████▉| 12254/12384 [26:00:16<16:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 0: 99%|█████████▉| 12255/12384 [26:00:16<16:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 0: 99%|█████████▉| 12255/12384 [26:00:24<16:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.61s]
Epoch 0: 99%|█████████▉| 12256/12384 [26:00:24<16:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.61s]
Epoch 0: 99%|█████████▉| 12256/12384 [26:00:31<16:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.71s]
Epoch 0: 99%|█████████▉| 12257/12384 [26:00:31<16:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.71s]
Epoch 0: 99%|█████████▉| 12257/12384 [26:00:39<16:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 0: 99%|█████████▉| 12258/12384 [26:00:39<16:13, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 0: 99%|█████████▉| 12258/12384 [26:00:47<16:13, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 99%|█████████▉| 12259/12384 [26:00:47<16:03, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 99%|█████████▉| 12259/12384 [26:00:55<16:03, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 99%|█████████▉| 12260/12384 [26:00:55<15:51, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 99%|█████████▉| 12260/12384 [26:01:02<15:51, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.98s]
Epoch 0: 99%|█████████▉| 12261/12384 [26:01:02<15:41, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.98s]
Epoch 0: 99%|█████████▉| 12261/12384 [26:01:10<15:41, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.23s]
Epoch 0: 99%|█████████▉| 12262/12384 [26:01:10<15:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.23s]
Epoch 0: 99%|█████████▉| 12262/12384 [26:01:17<15:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 0: 99%|█████████▉| 12263/12384 [26:01:17<15:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 0: 99%|█████████▉| 12263/12384 [26:01:25<15:24, 7.64s/it, loss=0.0002, acc=0.9998, iter_time=9.19s]
Epoch 0: 99%|█████████▉| 12264/12384 [26:01:25<15:16, 7.63s/it, loss=0.0002, acc=0.9998, iter_time=9.19s]
Epoch 0: 99%|█████████▉| 12264/12384 [26:01:33<15:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 99%|█████████▉| 12265/12384 [26:01:33<15:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 0: 99%|█████████▉| 12265/12384 [26:01:40<15:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 0: 99%|█████████▉| 12266/12384 [26:01:40<14:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 0: 99%|█████████▉| 12266/12384 [26:01:48<14:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.48s]
Epoch 0: 99%|█████████▉| 12267/12384 [26:01:48<14:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.48s]
Epoch 0: 99%|█████████▉| 12267/12384 [26:01:56<14:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 99%|█████████▉| 12268/12384 [26:01:56<14:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 99%|█████████▉| 12268/12384 [26:02:03<14:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 0: 99%|█████████▉| 12269/12384 [26:02:03<14:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 0: 99%|█████████▉| 12269/12384 [26:02:11<14:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 0: 99%|█████████▉| 12270/12384 [26:02:11<14:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 0: 99%|█████████▉| 12270/12384 [26:02:18<14:30, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=10.43s]
Epoch 0: 99%|█████████▉| 12271/12384 [26:02:18<14:22, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=10.43s]
Epoch 0: 99%|█████████▉| 12271/12384 [26:02:26<14:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 99%|█████████▉| 12272/12384 [26:02:26<14:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 99%|█████████▉| 12272/12384 [26:02:34<14:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 99%|█████████▉| 12273/12384 [26:02:34<14:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 0: 99%|█████████▉| 12273/12384 [26:02:41<14:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.98s]
Epoch 0: 99%|█████████▉| 12274/12384 [26:02:41<13:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.98s]
Epoch 0: 99%|█████████▉| 12274/12384 [26:02:49<13:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 0: 99%|█████████▉| 12275/12384 [26:02:49<13:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 0: 99%|█████████▉| 12275/12384 [26:02:56<13:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 0: 99%|█████████▉| 12276/12384 [26:02:56<13:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 0: 99%|█████████▉| 12276/12384 [26:03:04<13:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 0: 99%|█████████▉| 12277/12384 [26:03:04<13:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 0: 99%|█████████▉| 12277/12384 [26:03:12<13:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 99%|█████████▉| 12278/12384 [26:03:12<13:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 99%|█████████▉| 12278/12384 [26:03:19<13:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 0: 99%|█████████▉| 12279/12384 [26:03:19<13:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 0: 99%|█████████▉| 12279/12384 [26:03:27<13:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.50s]
Epoch 0: 99%|█████████▉| 12280/12384 [26:03:27<13:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.50s]
Epoch 0: 99%|█████████▉| 12280/12384 [26:03:35<13:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 0: 99%|█████████▉| 12281/12384 [26:03:35<13:11, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 0: 99%|█████████▉| 12281/12384 [26:03:42<13:11, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 99%|█████████▉| 12282/12384 [26:03:42<13:01, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 99%|█████████▉| 12282/12384 [26:03:50<13:01, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 99%|█████████▉| 12283/12384 [26:03:50<12:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 0: 99%|█████████▉| 12283/12384 [26:03:58<12:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 99%|█████████▉| 12284/12384 [26:03:58<12:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 99%|█████████▉| 12284/12384 [26:04:06<12:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 99%|█████████▉| 12285/12384 [26:04:06<12:45, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 99%|█████████▉| 12285/12384 [26:04:13<12:45, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 99%|█████████▉| 12286/12384 [26:04:13<12:33, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 99%|█████████▉| 12286/12384 [26:04:21<12:33, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 0: 99%|█████████▉| 12287/12384 [26:04:21<12:24, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 0: 99%|█████████▉| 12287/12384 [26:04:28<12:24, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=11.30s]
Epoch 0: 99%|█████████▉| 12288/12384 [26:04:28<12:15, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=11.30s]
Epoch 0: 99%|█████████▉| 12288/12384 [26:04:36<12:15, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=5.73s]
Epoch 0: 99%|█████████▉| 12289/12384 [26:04:36<12:06, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=5.73s]
Epoch 0: 99%|█████████▉| 12289/12384 [26:04:44<12:06, 7.65s/it, loss=0.0025, acc=0.9939, iter_time=8.25s]
Epoch 0: 99%|█████████▉| 12290/12384 [26:04:44<11:59, 7.66s/it, loss=0.0025, acc=0.9939, iter_time=8.25s]
Epoch 0: 99%|█████████▉| 12290/12384 [26:04:51<11:59, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 0: 99%|█████████▉| 12291/12384 [26:04:51<11:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 0: 99%|█████████▉| 12291/12384 [26:04:59<11:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 0: 99%|█████████▉| 12292/12384 [26:04:59<11:45, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 0: 99%|█████████▉| 12292/12384 [26:05:07<11:45, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 99%|█████████▉| 12293/12384 [26:05:07<11:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 99%|█████████▉| 12293/12384 [26:05:14<11:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 99%|█████████▉| 12294/12384 [26:05:14<11:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 99%|█████████▉| 12294/12384 [26:05:22<11:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 99%|█████████▉| 12295/12384 [26:05:22<11:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 99%|█████████▉| 12295/12384 [26:05:30<11:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 0: 99%|█████████▉| 12296/12384 [26:05:30<11:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 0: 99%|█████████▉| 12296/12384 [26:05:37<11:11, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.21s]
Epoch 0: 99%|█████████▉| 12297/12384 [26:05:37<11:03, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.21s]
Epoch 0: 99%|█████████▉| 12297/12384 [26:05:45<11:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 0: 99%|█████████▉| 12298/12384 [26:05:45<10:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 0: 99%|█████████▉| 12298/12384 [26:05:52<10:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.91s]
Epoch 0: 99%|█████████▉| 12299/12384 [26:05:52<10:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.91s]
Epoch 0: 99%|█████████▉| 12299/12384 [26:06:00<10:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 99%|█████████▉| 12300/12384 [26:06:00<10:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 0: 99%|█████████▉| 12300/12384 [26:06:08<10:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 99%|█████████▉| 12301/12384 [26:06:08<10:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 0: 99%|█████████▉| 12301/12384 [26:06:15<10:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 99%|█████████▉| 12302/12384 [26:06:15<10:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 99%|█████████▉| 12302/12384 [26:06:23<10:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 99%|█████████▉| 12303/12384 [26:06:23<10:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 99%|█████████▉| 12303/12384 [26:06:30<10:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 99%|█████████▉| 12304/12384 [26:06:30<10:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 0: 99%|█████████▉| 12304/12384 [26:06:38<10:08, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.19s]
Epoch 0: 99%|█████████▉| 12305/12384 [26:06:38<10:00, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.19s]
Epoch 0: 99%|█████████▉| 12305/12384 [26:06:46<10:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 99%|█████████▉| 12306/12384 [26:06:46<09:53, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 99%|█████████▉| 12306/12384 [26:06:53<09:53, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 99%|█████████▉| 12307/12384 [26:06:53<09:52, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 99%|█████████▉| 12307/12384 [26:07:01<09:52, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 0: 99%|█████████▉| 12308/12384 [26:07:01<09:42, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 0: 99%|█████████▉| 12308/12384 [26:07:09<09:42, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 0: 99%|█████████▉| 12309/12384 [26:07:09<09:35, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 0: 99%|█████████▉| 12309/12384 [26:07:16<09:35, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.59s]
Epoch 0: 99%|█████████▉| 12310/12384 [26:07:16<09:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.59s]
Epoch 0: 99%|█████████▉| 12310/12384 [26:07:24<09:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 0: 99%|█████████▉| 12311/12384 [26:07:24<09:25, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 0: 99%|█████████▉| 12311/12384 [26:07:32<09:25, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=11.45s]
Epoch 0: 99%|█████████▉| 12312/12384 [26:07:32<09:14, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=11.45s]
Epoch 0: 99%|█████████▉| 12312/12384 [26:07:40<09:14, 7.71s/it, loss=0.0021, acc=0.9947, iter_time=4.27s]
Epoch 0: 99%|█████████▉| 12313/12384 [26:07:40<09:05, 7.68s/it, loss=0.0021, acc=0.9947, iter_time=4.27s]
Epoch 0: 99%|█████████▉| 12313/12384 [26:07:47<09:05, 7.68s/it, loss=0.0002, acc=0.9985, iter_time=10.97s]
Epoch 0: 99%|█████████▉| 12314/12384 [26:07:47<08:55, 7.65s/it, loss=0.0002, acc=0.9985, iter_time=10.97s]
Epoch 0: 99%|█████████▉| 12314/12384 [26:07:55<08:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 99%|█████████▉| 12315/12384 [26:07:55<08:48, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 99%|█████████▉| 12315/12384 [26:08:02<08:48, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 99%|█████████▉| 12316/12384 [26:08:02<08:40, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 99%|█████████▉| 12316/12384 [26:08:10<08:40, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 99%|█████████▉| 12317/12384 [26:08:10<08:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 99%|█████████▉| 12317/12384 [26:08:18<08:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 99%|█████████▉| 12318/12384 [26:08:18<08:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 99%|█████████▉| 12318/12384 [26:08:25<08:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 99%|█████████▉| 12319/12384 [26:08:25<08:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 99%|█████████▉| 12319/12384 [26:08:33<08:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 99%|█████████▉| 12320/12384 [26:08:33<08:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 99%|█████████▉| 12320/12384 [26:08:41<08:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.69s]
Epoch 0: 99%|█████████▉| 12321/12384 [26:08:41<08:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.69s]
Epoch 0: 99%|█████████▉| 12321/12384 [26:08:48<08:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.23s]
Epoch 0: 99%|█████████▉| 12322/12384 [26:08:48<07:55, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=11.23s]
Epoch 0: 99%|█████████▉| 12322/12384 [26:08:56<07:55, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.37s]
Epoch 0: 100%|█████████▉| 12323/12384 [26:08:56<07:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.37s]
Epoch 0: 100%|█████████▉| 12323/12384 [26:09:04<07:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 0: 100%|█████████▉| 12324/12384 [26:09:04<07:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 0: 100%|█████████▉| 12324/12384 [26:09:11<07:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 100%|█████████▉| 12325/12384 [26:09:11<07:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 0: 100%|█████████▉| 12325/12384 [26:09:19<07:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 0: 100%|█████████▉| 12326/12384 [26:09:19<07:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 0: 100%|█████████▉| 12326/12384 [26:09:26<07:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 0: 100%|█████████▉| 12327/12384 [26:09:26<07:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 0: 100%|█████████▉| 12327/12384 [26:09:34<07:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 100%|█████████▉| 12328/12384 [26:09:34<07:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 100%|█████████▉| 12328/12384 [26:09:42<07:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 100%|█████████▉| 12329/12384 [26:09:42<06:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 100%|█████████▉| 12329/12384 [26:09:49<06:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 100%|█████████▉| 12330/12384 [26:09:49<06:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 100%|█████████▉| 12330/12384 [26:09:57<06:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.12s]
Epoch 0: 100%|█████████▉| 12331/12384 [26:09:57<06:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.12s]
Epoch 0: 100%|█████████▉| 12331/12384 [26:10:05<06:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.15s]
Epoch 0: 100%|█████████▉| 12332/12384 [26:10:05<06:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.15s]
Epoch 0: 100%|█████████▉| 12332/12384 [26:10:12<06:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 100%|█████████▉| 12333/12384 [26:10:12<06:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 100%|█████████▉| 12333/12384 [26:10:20<06:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 100%|█████████▉| 12334/12384 [26:10:20<06:25, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 0: 100%|█████████▉| 12334/12384 [26:10:28<06:25, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 100%|█████████▉| 12335/12384 [26:10:28<06:16, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 100%|█████████▉| 12335/12384 [26:10:35<06:16, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 100%|█████████▉| 12336/12384 [26:10:35<06:08, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 100%|█████████▉| 12336/12384 [26:10:43<06:08, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 100%|█████████▉| 12337/12384 [26:10:43<06:04, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 0: 100%|█████████▉| 12337/12384 [26:10:51<06:04, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 100%|█████████▉| 12338/12384 [26:10:51<05:54, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 100%|█████████▉| 12338/12384 [26:10:59<05:54, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 0: 100%|█████████▉| 12339/12384 [26:10:59<05:45, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 0: 100%|█████████▉| 12339/12384 [26:11:06<05:45, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 0: 100%|█████████▉| 12340/12384 [26:11:06<05:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 0: 100%|█████████▉| 12340/12384 [26:11:14<05:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 0: 100%|█████████▉| 12341/12384 [26:11:14<05:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 0: 100%|█████████▉| 12341/12384 [26:11:21<05:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 0: 100%|█████████▉| 12342/12384 [26:11:21<05:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 0: 100%|█████████▉| 12342/12384 [26:11:29<05:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.04s]
Epoch 0: 100%|█████████▉| 12343/12384 [26:11:29<05:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.04s]
Epoch 0: 100%|█████████▉| 12343/12384 [26:11:37<05:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.59s]
Epoch 0: 100%|█████████▉| 12344/12384 [26:11:37<05:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.59s]
Epoch 0: 100%|█████████▉| 12344/12384 [26:11:44<05:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.28s]
Epoch 0: 100%|█████████▉| 12345/12384 [26:11:44<04:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.28s]
Epoch 0: 100%|█████████▉| 12345/12384 [26:11:52<04:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 0: 100%|█████████▉| 12346/12384 [26:11:52<04:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 0: 100%|█████████▉| 12346/12384 [26:12:00<04:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 100%|█████████▉| 12347/12384 [26:12:00<04:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 100%|█████████▉| 12347/12384 [26:12:07<04:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.25s]
Epoch 0: 100%|█████████▉| 12348/12384 [26:12:07<04:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.25s]
Epoch 0: 100%|█████████▉| 12348/12384 [26:12:15<04:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 0: 100%|█████████▉| 12349/12384 [26:12:15<04:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 0: 100%|█████████▉| 12349/12384 [26:12:22<04:26, 7.62s/it, loss=0.0007, acc=0.9979, iter_time=8.14s]
Epoch 0: 100%|█████████▉| 12350/12384 [26:12:22<04:19, 7.65s/it, loss=0.0007, acc=0.9979, iter_time=8.14s]
Epoch 0: 100%|█████████▉| 12350/12384 [26:12:30<04:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.94s]
Epoch 0: 100%|█████████▉| 12351/12384 [26:12:30<04:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.94s]
Epoch 0: 100%|█████████▉| 12351/12384 [26:12:38<04:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.25s]
Epoch 0: 100%|█████████▉| 12352/12384 [26:12:38<04:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.25s]
Epoch 0: 100%|█████████▉| 12352/12384 [26:12:45<04:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.95s]
Epoch 0: 100%|█████████▉| 12353/12384 [26:12:45<03:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.95s]
Epoch 0: 100%|█████████▉| 12353/12384 [26:12:53<03:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.54s]
Epoch 0: 100%|█████████▉| 12354/12384 [26:12:53<03:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.54s]
Epoch 0: 100%|█████████▉| 12354/12384 [26:13:01<03:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 0: 100%|█████████▉| 12355/12384 [26:13:01<03:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 0: 100%|█████████▉| 12355/12384 [26:13:08<03:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 0: 100%|█████████▉| 12356/12384 [26:13:08<03:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 0: 100%|█████████▉| 12356/12384 [26:13:16<03:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.20s]
Epoch 0: 100%|█████████▉| 12357/12384 [26:13:16<03:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.20s]
Epoch 0: 100%|█████████▉| 12357/12384 [26:13:23<03:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 100%|█████████▉| 12358/12384 [26:13:23<03:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 100%|█████████▉| 12358/12384 [26:13:31<03:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 100%|█████████▉| 12359/12384 [26:13:31<03:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 100%|█████████▉| 12359/12384 [26:13:39<03:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 100%|█████████▉| 12360/12384 [26:13:39<03:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 0: 100%|█████████▉| 12360/12384 [26:13:46<03:02, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.59s]
Epoch 0: 100%|█████████▉| 12361/12384 [26:13:46<02:55, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.59s]
Epoch 0: 100%|█████████▉| 12361/12384 [26:13:54<02:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.70s]
Epoch 0: 100%|█████████▉| 12362/12384 [26:13:54<02:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.70s]
Epoch 0: 100%|█████████▉| 12362/12384 [26:14:02<02:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 100%|█████████▉| 12363/12384 [26:14:02<02:42, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 100%|█████████▉| 12363/12384 [26:14:09<02:42, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 100%|█████████▉| 12364/12384 [26:14:09<02:33, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 100%|█████████▉| 12364/12384 [26:14:17<02:33, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 0: 100%|█████████▉| 12365/12384 [26:14:17<02:25, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 0: 100%|█████████▉| 12365/12384 [26:14:25<02:25, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 0: 100%|█████████▉| 12366/12384 [26:14:25<02:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 0: 100%|█████████▉| 12366/12384 [26:14:32<02:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.89s]
Epoch 0: 100%|█████████▉| 12367/12384 [26:14:32<02:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.89s]
Epoch 0: 100%|█████████▉| 12367/12384 [26:14:40<02:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.32s]
Epoch 0: 100%|█████████▉| 12368/12384 [26:14:40<02:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.32s]
Epoch 0: 100%|█████████▉| 12368/12384 [26:14:47<02:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.44s]
Epoch 0: 100%|█████████▉| 12369/12384 [26:14:47<01:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.44s]
Epoch 0: 100%|█████████▉| 12369/12384 [26:14:55<01:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 100%|█████████▉| 12370/12384 [26:14:55<01:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 0: 100%|█████████▉| 12370/12384 [26:15:03<01:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.11s]
Epoch 0: 100%|█████████▉| 12371/12384 [26:15:03<01:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.11s]
Epoch 0: 100%|█████████▉| 12371/12384 [26:15:10<01:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 0: 100%|█████████▉| 12372/12384 [26:15:10<01:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 0: 100%|█████████▉| 12372/12384 [26:15:18<01:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 0: 100%|█████████▉| 12373/12384 [26:15:18<01:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 0: 100%|█████████▉| 12373/12384 [26:15:26<01:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 100%|█████████▉| 12374/12384 [26:15:26<01:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 100%|█████████▉| 12374/12384 [26:15:33<01:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 100%|█████████▉| 12375/12384 [26:15:33<01:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 0: 100%|█████████▉| 12375/12384 [26:15:41<01:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 100%|█████████▉| 12376/12384 [26:15:41<01:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 100%|█████████▉| 12376/12384 [26:15:48<01:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.03s]
Epoch 0: 100%|█████████▉| 12377/12384 [26:15:48<00:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.03s]
Epoch 0: 100%|█████████▉| 12377/12384 [26:15:56<00:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 0: 100%|█████████▉| 12378/12384 [26:15:56<00:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 0: 100%|█████████▉| 12378/12384 [26:16:04<00:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 100%|█████████▉| 12379/12384 [26:16:04<00:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 100%|█████████▉| 12379/12384 [26:16:11<00:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 100%|█████████▉| 12380/12384 [26:16:11<00:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 100%|█████████▉| 12380/12384 [26:16:19<00:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 100%|█████████▉| 12381/12384 [26:16:19<00:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 0: 100%|█████████▉| 12381/12384 [26:16:27<00:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 100%|█████████▉| 12382/12384 [26:16:27<00:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 0: 100%|█████████▉| 12382/12384 [26:16:34<00:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 0: 100%|█████████▉| 12383/12384 [26:16:34<00:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 0: 100%|█████████▉| 12383/12384 [26:16:42<00:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.56s]
Epoch 0: 100%|██████████| 12384/12384 [26:16:42<00:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.56s]
Epoch 0: 100%|██████████| 12384/12384 [26:16:42<00:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.56s]
+
Epoch 1: 0%| | 0/12384 [00:00, ?it/s]
Epoch 1: 0%| | 0/12384 [00:07, ?it/s, loss=0.0000, acc=1.0000, iter_time=6.34s]
Epoch 1: 0%| | 1/12384 [00:07<26:17:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.34s]
Epoch 1: 0%| | 1/12384 [00:15<26:17:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 0%| | 2/12384 [00:15<26:14:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 0%| | 2/12384 [00:22<26:14:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.69s]
Epoch 1: 0%| | 3/12384 [00:22<26:11:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.69s]
Epoch 1: 0%| | 3/12384 [00:30<26:11:57, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=10.15s]
Epoch 1: 0%| | 4/12384 [00:30<26:15:21, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=10.15s]
Epoch 1: 0%| | 4/12384 [00:38<26:15:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.77s]
Epoch 1: 0%| | 5/12384 [00:38<26:37:25, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.77s]
Epoch 1: 0%| | 5/12384 [00:46<26:37:25, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.82s]
Epoch 1: 0%| | 6/12384 [00:46<26:27:15, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.82s]
Epoch 1: 0%| | 6/12384 [00:53<26:27:15, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 0%| | 7/12384 [00:53<26:22:40, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 0%| | 7/12384 [01:01<26:22:40, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 0%| | 8/12384 [01:01<26:18:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 0%| | 8/12384 [01:08<26:18:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 1: 0%| | 9/12384 [01:08<26:15:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 1: 0%| | 9/12384 [01:16<26:15:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 1: 0%| | 10/12384 [01:16<26:12:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 1: 0%| | 10/12384 [01:24<26:12:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.76s]
Epoch 1: 0%| | 11/12384 [01:24<26:11:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.76s]
Epoch 1: 0%| | 11/12384 [01:31<26:11:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.19s]
Epoch 1: 0%| | 12/12384 [01:31<26:11:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.19s]
Epoch 1: 0%| | 12/12384 [01:39<26:11:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.87s]
Epoch 1: 0%| | 13/12384 [01:39<26:12:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.87s]
Epoch 1: 0%| | 13/12384 [01:46<26:12:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 0%| | 14/12384 [01:46<26:10:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 0%| | 14/12384 [01:54<26:10:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 0%| | 15/12384 [01:54<26:13:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 0%| | 15/12384 [02:02<26:13:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 1: 0%| | 16/12384 [02:02<26:12:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 1: 0%| | 16/12384 [02:09<26:12:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 0%| | 17/12384 [02:09<26:15:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 0%| | 17/12384 [02:17<26:15:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 0%| | 18/12384 [02:17<26:12:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 0%| | 18/12384 [02:25<26:12:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 1: 0%| | 19/12384 [02:25<26:10:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 1: 0%| | 19/12384 [02:32<26:10:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 1: 0%| | 20/12384 [02:32<26:09:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 1: 0%| | 20/12384 [02:40<26:09:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 0%| | 21/12384 [02:40<26:09:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 0%| | 21/12384 [02:47<26:09:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 0%| | 22/12384 [02:47<26:09:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 0%| | 22/12384 [02:55<26:09:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 1: 0%| | 23/12384 [02:55<26:09:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 1: 0%| | 23/12384 [03:03<26:09:58, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.27s]
Epoch 1: 0%| | 24/12384 [03:03<26:12:07, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=10.27s]
Epoch 1: 0%| | 24/12384 [03:10<26:12:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 0%| | 25/12384 [03:10<26:11:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 0%| | 25/12384 [03:18<26:11:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 0%| | 26/12384 [03:18<26:14:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 0%| | 26/12384 [03:26<26:14:56, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.68s]
Epoch 1: 0%| | 27/12384 [03:26<26:12:36, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.68s]
Epoch 1: 0%| | 27/12384 [03:33<26:12:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 0%| | 28/12384 [03:33<26:15:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 0%| | 28/12384 [03:41<26:15:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 1: 0%| | 29/12384 [03:41<26:29:00, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 1: 0%| | 29/12384 [03:49<26:29:00, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 0%| | 30/12384 [03:49<26:23:08, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 0%| | 30/12384 [03:56<26:23:08, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.38s]
Epoch 1: 0%| | 31/12384 [03:56<26:16:43, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.38s]
Epoch 1: 0%| | 31/12384 [04:04<26:16:43, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 1: 0%| | 32/12384 [04:04<26:37:54, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 1: 0%| | 32/12384 [04:12<26:37:54, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=6.46s]
Epoch 1: 0%| | 33/12384 [04:12<26:27:07, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.46s]
Epoch 1: 0%| | 33/12384 [04:20<26:27:07, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.75s]
Epoch 1: 0%| | 34/12384 [04:20<26:21:28, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.75s]
Epoch 1: 0%| | 34/12384 [04:27<26:21:28, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 1: 0%| | 35/12384 [04:27<26:17:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 1: 0%| | 35/12384 [04:35<26:17:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 1: 0%| | 36/12384 [04:35<26:14:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 1: 0%| | 36/12384 [04:43<26:14:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.20s]
Epoch 1: 0%| | 37/12384 [04:43<26:13:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.20s]
Epoch 1: 0%| | 37/12384 [04:50<26:13:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 1: 0%| | 38/12384 [04:50<26:12:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 1: 0%| | 38/12384 [04:58<26:12:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.39s]
Epoch 1: 0%| | 39/12384 [04:58<26:10:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.39s]
Epoch 1: 0%| | 39/12384 [05:05<26:10:57, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 1: 0%| | 40/12384 [05:05<26:10:09, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 1: 0%| | 40/12384 [05:13<26:10:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 0%| | 41/12384 [05:13<26:07:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 0%| | 41/12384 [05:21<26:07:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 0%| | 42/12384 [05:21<26:06:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 0%| | 42/12384 [05:28<26:06:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 1: 0%| | 43/12384 [05:28<26:07:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 1: 0%| | 43/12384 [05:36<26:07:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 1: 0%| | 44/12384 [05:36<26:05:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 1: 0%| | 44/12384 [05:43<26:05:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 0%| | 45/12384 [05:43<26:04:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 0%| | 45/12384 [05:51<26:04:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 0%| | 46/12384 [05:51<26:05:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 0%| | 46/12384 [05:59<26:05:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 0%| | 47/12384 [05:59<26:05:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 0%| | 47/12384 [06:06<26:05:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 0%| | 48/12384 [06:06<26:05:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 0%| | 48/12384 [06:14<26:05:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 0%| | 49/12384 [06:14<26:04:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 0%| | 49/12384 [06:22<26:04:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 0%| | 50/12384 [06:22<26:03:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 0%| | 50/12384 [06:29<26:03:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 1: 0%| | 51/12384 [06:29<26:03:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 1: 0%| | 51/12384 [06:37<26:03:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.87s]
Epoch 1: 0%| | 52/12384 [06:37<26:02:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.87s]
Epoch 1: 0%| | 52/12384 [06:44<26:02:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.39s]
Epoch 1: 0%| | 53/12384 [06:44<26:02:34, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.39s]
Epoch 1: 0%| | 53/12384 [06:52<26:02:34, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 1: 0%| | 54/12384 [06:52<26:02:10, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 1: 0%| | 54/12384 [07:00<26:02:10, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 0%| | 55/12384 [07:00<26:02:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 0%| | 55/12384 [07:07<26:02:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.51s]
Epoch 1: 0%| | 56/12384 [07:07<26:03:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.51s]
Epoch 1: 0%| | 56/12384 [07:15<26:03:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 0%| | 57/12384 [07:15<26:03:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 0%| | 57/12384 [07:23<26:03:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 0%| | 58/12384 [07:23<26:23:39, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 0%| | 58/12384 [07:30<26:23:39, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 1: 0%| | 59/12384 [07:30<26:15:58, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 1: 0%| | 59/12384 [07:38<26:15:58, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 0%| | 60/12384 [07:38<26:12:25, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 0%| | 60/12384 [07:45<26:12:25, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 1: 0%| | 61/12384 [07:45<26:09:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 1: 0%| | 61/12384 [07:53<26:09:09, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=9.70s]
Epoch 1: 1%| | 62/12384 [07:53<26:06:37, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.70s]
Epoch 1: 1%| | 62/12384 [08:01<26:06:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.86s]
Epoch 1: 1%| | 63/12384 [08:01<26:24:25, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.86s]
Epoch 1: 1%| | 63/12384 [08:09<26:24:25, 7.72s/it, loss=0.0002, acc=0.9994, iter_time=7.98s]
Epoch 1: 1%| | 64/12384 [08:09<26:22:15, 7.71s/it, loss=0.0002, acc=0.9994, iter_time=7.98s]
Epoch 1: 1%| | 64/12384 [08:16<26:22:15, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.72s]
Epoch 1: 1%| | 65/12384 [08:16<26:16:29, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.72s]
Epoch 1: 1%| | 65/12384 [08:24<26:16:29, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.58s]
Epoch 1: 1%| | 66/12384 [08:24<26:11:34, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.58s]
Epoch 1: 1%| | 66/12384 [08:32<26:11:34, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 1%| | 67/12384 [08:32<26:09:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 1%| | 67/12384 [08:39<26:09:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 1: 1%| | 68/12384 [08:39<26:07:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 1: 1%| | 68/12384 [08:47<26:07:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 1: 1%| | 69/12384 [08:47<26:05:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 1: 1%| | 69/12384 [08:54<26:05:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 1%| | 70/12384 [08:54<26:05:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 1%| | 70/12384 [09:02<26:05:57, 7.63s/it, loss=0.0005, acc=0.9977, iter_time=7.63s]
Epoch 1: 1%| | 71/12384 [09:02<26:03:48, 7.62s/it, loss=0.0005, acc=0.9977, iter_time=7.63s]
Epoch 1: 1%| | 71/12384 [09:10<26:03:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 1%| | 72/12384 [09:10<26:03:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 1%| | 72/12384 [09:17<26:03:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 1%| | 73/12384 [09:17<26:03:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 1%| | 73/12384 [09:25<26:03:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 1%| | 74/12384 [09:25<26:01:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 1%| | 74/12384 [09:32<26:01:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 1: 1%| | 75/12384 [09:32<26:01:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 1: 1%| | 75/12384 [09:40<26:01:04, 7.61s/it, loss=0.0002, acc=0.9999, iter_time=10.50s]
Epoch 1: 1%| | 76/12384 [09:40<26:00:32, 7.61s/it, loss=0.0002, acc=0.9999, iter_time=10.50s]
Epoch 1: 1%| | 76/12384 [09:48<26:00:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 1: 1%| | 77/12384 [09:48<25:59:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 1: 1%| | 77/12384 [09:55<25:59:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 1%| | 78/12384 [09:55<26:00:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 1%| | 78/12384 [10:03<26:00:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 1%| | 79/12384 [10:03<25:59:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 1%| | 79/12384 [10:10<25:59:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 1%| | 80/12384 [10:10<25:59:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 1%| | 80/12384 [10:18<25:59:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 1%| | 81/12384 [10:18<26:15:11, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 1%| | 81/12384 [10:26<26:15:11, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 1: 1%| | 82/12384 [10:26<26:11:48, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 1: 1%| | 82/12384 [10:34<26:11:48, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.85s]
Epoch 1: 1%| | 83/12384 [10:34<26:06:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.85s]
Epoch 1: 1%| | 83/12384 [10:41<26:06:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 1: 1%| | 84/12384 [10:41<26:04:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 1: 1%| | 84/12384 [10:49<26:04:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 1%| | 85/12384 [10:49<26:24:00, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 1%| | 85/12384 [10:57<26:24:00, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 1: 1%| | 86/12384 [10:57<26:16:42, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 1: 1%| | 86/12384 [11:04<26:16:42, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 1%| | 87/12384 [11:04<26:11:38, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 1%| | 87/12384 [11:12<26:11:38, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 1%| | 88/12384 [11:12<26:07:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 1%| | 88/12384 [11:20<26:07:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 1%| | 89/12384 [11:20<26:05:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 1%| | 89/12384 [11:27<26:05:51, 7.64s/it, loss=0.0000, acc=0.9995, iter_time=7.71s]
Epoch 1: 1%| | 90/12384 [11:27<26:08:38, 7.66s/it, loss=0.0000, acc=0.9995, iter_time=7.71s]
Epoch 1: 1%| | 90/12384 [11:35<26:08:38, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 1%| | 91/12384 [11:35<26:05:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 1%| | 91/12384 [11:42<26:05:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 1: 1%| | 92/12384 [11:42<26:04:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 1: 1%| | 92/12384 [11:50<26:04:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 1%| | 93/12384 [11:50<26:02:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 1%| | 93/12384 [11:58<26:02:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 1%| | 94/12384 [11:58<26:00:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 1%| | 94/12384 [12:05<26:00:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 1%| | 95/12384 [12:05<26:00:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 1%| | 95/12384 [12:13<26:00:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 1%| | 96/12384 [12:13<25:59:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 1%| | 96/12384 [12:20<25:59:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.19s]
Epoch 1: 1%| | 97/12384 [12:20<25:57:14, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.19s]
Epoch 1: 1%| | 97/12384 [12:28<25:57:14, 7.60s/it, loss=0.0004, acc=1.0000, iter_time=10.59s]
Epoch 1: 1%| | 98/12384 [12:28<25:58:05, 7.61s/it, loss=0.0004, acc=1.0000, iter_time=10.59s]
Epoch 1: 1%| | 98/12384 [12:36<25:58:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 1%| | 99/12384 [12:36<25:58:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 1%| | 99/12384 [12:43<25:58:13, 7.61s/it, loss=0.0012, acc=0.9972, iter_time=7.64s]
Epoch 1: 1%| | 100/12384 [12:43<25:57:57, 7.61s/it, loss=0.0012, acc=0.9972, iter_time=7.64s]
Epoch 1: 1%| | 100/12384 [12:51<25:57:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 1%| | 101/12384 [12:51<25:57:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 1%| | 101/12384 [12:59<25:57:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 1%| | 102/12384 [12:59<25:58:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 1%| | 102/12384 [13:06<25:58:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 1: 1%| | 103/12384 [13:06<26:03:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 1: 1%| | 103/12384 [13:14<26:03:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 1: 1%| | 104/12384 [13:14<26:03:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 1: 1%| | 104/12384 [13:21<26:03:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.13s]
Epoch 1: 1%| | 105/12384 [13:21<26:00:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.13s]
Epoch 1: 1%| | 105/12384 [13:29<26:00:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 1%| | 106/12384 [13:29<26:00:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 1%| | 106/12384 [13:37<26:00:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 1: 1%| | 107/12384 [13:37<26:16:56, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 1: 1%| | 107/12384 [13:45<26:16:56, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 1%| | 108/12384 [13:45<26:11:29, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 1%| | 108/12384 [13:52<26:11:29, 7.68s/it, loss=0.0004, acc=0.9998, iter_time=7.02s]
Epoch 1: 1%| | 109/12384 [13:52<26:05:11, 7.65s/it, loss=0.0004, acc=0.9998, iter_time=7.02s]
Epoch 1: 1%| | 109/12384 [14:00<26:05:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 1: 1%| | 110/12384 [14:00<26:03:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 1: 1%| | 110/12384 [14:08<26:03:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 1%| | 111/12384 [14:08<26:19:45, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 1%| | 111/12384 [14:15<26:19:45, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 1: 1%| | 112/12384 [14:15<26:13:17, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 1: 1%| | 112/12384 [14:23<26:13:17, 7.69s/it, loss=0.0002, acc=0.9999, iter_time=7.66s]
Epoch 1: 1%| | 113/12384 [14:23<26:06:58, 7.66s/it, loss=0.0002, acc=0.9999, iter_time=7.66s]
Epoch 1: 1%| | 113/12384 [14:31<26:06:58, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 1: 1%| | 114/12384 [14:31<26:02:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 1: 1%| | 114/12384 [14:38<26:02:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 1: 1%| | 115/12384 [14:38<26:00:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 1: 1%| | 115/12384 [14:46<26:00:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 1: 1%| | 116/12384 [14:46<26:21:33, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 1: 1%| | 116/12384 [14:54<26:21:33, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.42s]
Epoch 1: 1%| | 117/12384 [14:54<26:15:12, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.42s]
Epoch 1: 1%| | 117/12384 [15:01<26:15:12, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 1: 1%| | 118/12384 [15:01<26:11:23, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 1: 1%| | 118/12384 [15:09<26:11:23, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 1%| | 119/12384 [15:09<26:04:50, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 1%| | 119/12384 [15:17<26:04:50, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 1%| | 120/12384 [15:17<26:07:40, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 1%| | 120/12384 [15:24<26:07:40, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.98s]
Epoch 1: 1%| | 121/12384 [15:24<26:03:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.98s]
Epoch 1: 1%| | 121/12384 [15:32<26:03:35, 7.65s/it, loss=0.0003, acc=0.9997, iter_time=9.92s]
Epoch 1: 1%| | 122/12384 [15:32<26:00:07, 7.63s/it, loss=0.0003, acc=0.9997, iter_time=9.92s]
Epoch 1: 1%| | 122/12384 [15:40<26:00:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 1: 1%| | 123/12384 [15:40<26:14:50, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 1: 1%| | 123/12384 [15:47<26:14:50, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 1: 1%| | 124/12384 [15:47<26:13:20, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 1: 1%| | 124/12384 [15:55<26:13:20, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 1%| | 125/12384 [15:55<26:08:38, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 1%| | 125/12384 [16:03<26:08:38, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 1: 1%| | 126/12384 [16:03<26:04:34, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 1: 1%| | 126/12384 [16:10<26:04:34, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.49s]
Epoch 1: 1%| | 127/12384 [16:10<26:05:56, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.49s]
Epoch 1: 1%| | 127/12384 [16:18<26:05:56, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 1%| | 128/12384 [16:18<26:02:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 1%| | 128/12384 [16:26<26:02:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.45s]
Epoch 1: 1%| | 129/12384 [16:26<25:58:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.45s]
Epoch 1: 1%| | 129/12384 [16:33<25:58:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 1: 1%| | 130/12384 [16:33<25:58:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 1: 1%| | 130/12384 [16:41<25:58:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 1: 1%| | 131/12384 [16:41<25:58:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 1: 1%| | 131/12384 [16:48<25:58:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.25s]
Epoch 1: 1%| | 132/12384 [16:48<25:58:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.25s]
Epoch 1: 1%| | 132/12384 [16:56<25:58:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.20s]
Epoch 1: 1%| | 133/12384 [16:56<25:57:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.20s]
Epoch 1: 1%| | 133/12384 [17:04<25:57:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 1%| | 134/12384 [17:04<26:13:32, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 1%| | 134/12384 [17:12<26:13:32, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 1%| | 135/12384 [17:12<26:06:18, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 1%| | 135/12384 [17:19<26:06:18, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 1%| | 136/12384 [17:19<26:09:29, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 1%| | 136/12384 [17:27<26:09:29, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 1: 1%| | 137/12384 [17:27<26:23:35, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 1: 1%| | 137/12384 [17:35<26:23:35, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 1: 1%| | 138/12384 [17:35<26:14:48, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 1: 1%| | 138/12384 [17:42<26:14:48, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 1%| | 139/12384 [17:42<26:07:35, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 1%| | 139/12384 [17:50<26:07:35, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 1%| | 140/12384 [17:50<26:03:04, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 1%| | 140/12384 [17:58<26:03:04, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.50s]
Epoch 1: 1%| | 141/12384 [17:58<26:00:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.50s]
Epoch 1: 1%| | 141/12384 [18:05<26:00:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.93s]
Epoch 1: 1%| | 142/12384 [18:05<25:58:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.93s]
Epoch 1: 1%| | 142/12384 [18:13<25:58:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.77s]
Epoch 1: 1%| | 143/12384 [18:13<25:56:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.77s]
Epoch 1: 1%| | 143/12384 [18:20<25:56:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 1: 1%| | 144/12384 [18:20<25:54:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 1: 1%| | 144/12384 [18:28<25:54:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 1%| | 145/12384 [18:28<25:52:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 1%| | 145/12384 [18:36<25:52:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 1%| | 146/12384 [18:36<25:53:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 1%| | 146/12384 [18:43<25:53:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.59s]
Epoch 1: 1%| | 147/12384 [18:43<25:53:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.59s]
Epoch 1: 1%| | 147/12384 [18:51<25:53:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 1%| | 148/12384 [18:51<25:53:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 1%| | 148/12384 [18:59<25:53:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 1: 1%| | 149/12384 [18:59<25:52:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 1: 1%| | 149/12384 [19:06<25:52:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 1%| | 150/12384 [19:06<25:51:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 1%| | 150/12384 [19:14<25:51:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 1: 1%| | 151/12384 [19:14<25:50:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 1: 1%| | 151/12384 [19:21<25:50:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.80s]
Epoch 1: 1%| | 152/12384 [19:21<25:49:05, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.80s]
Epoch 1: 1%| | 152/12384 [19:29<25:49:05, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.44s]
Epoch 1: 1%| | 153/12384 [19:29<25:48:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.44s]
Epoch 1: 1%| | 153/12384 [19:37<25:48:22, 7.60s/it, loss=0.0001, acc=0.9995, iter_time=10.64s]
Epoch 1: 1%| | 154/12384 [19:37<25:48:42, 7.60s/it, loss=0.0001, acc=0.9995, iter_time=10.64s]
Epoch 1: 1%| | 154/12384 [19:44<25:48:42, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 1%|▏ | 155/12384 [19:44<25:48:59, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 1%|▏ | 155/12384 [19:52<25:48:59, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 1%|▏ | 156/12384 [19:52<25:49:34, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 1%|▏ | 156/12384 [19:59<25:49:34, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 1%|▏ | 157/12384 [19:59<25:49:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 1%|▏ | 157/12384 [20:07<25:49:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 1: 1%|▏ | 158/12384 [20:07<25:51:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 1: 1%|▏ | 158/12384 [20:15<25:51:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.55s]
Epoch 1: 1%|▏ | 159/12384 [20:15<25:49:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.55s]
Epoch 1: 1%|▏ | 159/12384 [20:22<25:49:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.10s]
Epoch 1: 1%|▏ | 160/12384 [20:22<25:49:07, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.10s]
Epoch 1: 1%|▏ | 160/12384 [20:30<25:49:07, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.49s]
Epoch 1: 1%|▏ | 161/12384 [20:30<26:05:32, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.49s]
Epoch 1: 1%|▏ | 161/12384 [20:38<26:05:32, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 1%|▏ | 162/12384 [20:38<26:03:33, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 1%|▏ | 162/12384 [20:46<26:03:33, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 1%|▏ | 163/12384 [20:46<26:20:46, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 1%|▏ | 163/12384 [20:53<26:20:46, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 1%|▏ | 164/12384 [20:53<26:12:07, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 1%|▏ | 164/12384 [21:01<26:12:07, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 1%|▏ | 165/12384 [21:01<26:04:33, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 1%|▏ | 165/12384 [21:09<26:04:33, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 1: 1%|▏ | 166/12384 [21:09<26:04:27, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 1: 1%|▏ | 166/12384 [21:16<26:04:27, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=7.21s]
Epoch 1: 1%|▏ | 167/12384 [21:16<25:59:00, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.21s]
Epoch 1: 1%|▏ | 167/12384 [21:24<25:59:00, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 1%|▏ | 168/12384 [21:24<25:55:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 1%|▏ | 168/12384 [21:31<25:55:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 1%|▏ | 169/12384 [21:31<25:53:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 1%|▏ | 169/12384 [21:39<25:53:24, 7.63s/it, loss=0.0004, acc=0.9984, iter_time=7.60s]
Epoch 1: 1%|▏ | 170/12384 [21:39<25:52:37, 7.63s/it, loss=0.0004, acc=0.9984, iter_time=7.60s]
Epoch 1: 1%|▏ | 170/12384 [21:47<25:52:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 1%|▏ | 171/12384 [21:47<25:51:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 1%|▏ | 171/12384 [21:54<25:51:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 1: 1%|▏ | 172/12384 [21:54<25:51:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 1: 1%|▏ | 172/12384 [22:02<25:51:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 1%|▏ | 173/12384 [22:02<25:50:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 1%|▏ | 173/12384 [22:09<25:50:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 1: 1%|▏ | 174/12384 [22:09<25:50:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 1: 1%|▏ | 174/12384 [22:17<25:50:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 1: 1%|▏ | 175/12384 [22:17<25:54:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 1: 1%|▏ | 175/12384 [22:25<25:54:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 1: 1%|▏ | 176/12384 [22:25<25:53:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 1: 1%|▏ | 176/12384 [22:32<25:53:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 1%|▏ | 177/12384 [22:32<25:51:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 1%|▏ | 177/12384 [22:40<25:51:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 1%|▏ | 178/12384 [22:40<25:49:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 1%|▏ | 178/12384 [22:48<25:49:41, 7.62s/it, loss=0.0005, acc=0.9982, iter_time=5.80s]
Epoch 1: 1%|▏ | 179/12384 [22:48<25:49:11, 7.62s/it, loss=0.0005, acc=0.9982, iter_time=5.80s]
Epoch 1: 1%|▏ | 179/12384 [22:55<25:49:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 1%|▏ | 180/12384 [22:55<25:47:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 1%|▏ | 180/12384 [23:03<25:47:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 1%|▏ | 181/12384 [23:03<25:46:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 1%|▏ | 181/12384 [23:10<25:46:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 1%|▏ | 182/12384 [23:10<25:47:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 1%|▏ | 182/12384 [23:18<25:47:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 1%|▏ | 183/12384 [23:18<25:48:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 1%|▏ | 183/12384 [23:26<25:48:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 1: 1%|▏ | 184/12384 [23:26<25:49:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 1: 1%|▏ | 184/12384 [23:33<25:49:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 1: 1%|▏ | 185/12384 [23:33<25:48:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 1: 1%|▏ | 185/12384 [23:41<25:48:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 2%|▏ | 186/12384 [23:41<25:48:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 2%|▏ | 186/12384 [23:48<25:48:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 1: 2%|▏ | 187/12384 [23:48<25:47:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 1: 2%|▏ | 187/12384 [23:56<25:47:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.20s]
Epoch 1: 2%|▏ | 188/12384 [23:56<25:49:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.20s]
Epoch 1: 2%|▏ | 188/12384 [24:04<25:49:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.34s]
Epoch 1: 2%|▏ | 189/12384 [24:04<26:09:50, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=11.34s]
Epoch 1: 2%|▏ | 189/12384 [24:12<26:09:50, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 1: 2%|▏ | 190/12384 [24:12<26:02:59, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 1: 2%|▏ | 190/12384 [24:19<26:02:59, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.56s]
Epoch 1: 2%|▏ | 191/12384 [24:19<25:59:02, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.56s]
Epoch 1: 2%|▏ | 191/12384 [24:27<25:59:02, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=11.07s]
Epoch 1: 2%|▏ | 192/12384 [24:27<25:55:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.07s]
Epoch 1: 2%|▏ | 192/12384 [24:35<25:55:17, 7.65s/it, loss=0.0000, acc=0.9999, iter_time=7.23s]
Epoch 1: 2%|▏ | 193/12384 [24:35<25:52:11, 7.64s/it, loss=0.0000, acc=0.9999, iter_time=7.23s]
Epoch 1: 2%|▏ | 193/12384 [24:42<25:52:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 2%|▏ | 194/12384 [24:42<25:50:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 2%|▏ | 194/12384 [24:50<25:50:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 2%|▏ | 195/12384 [24:50<25:49:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 2%|▏ | 195/12384 [24:57<25:49:04, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=5.81s]
Epoch 1: 2%|▏ | 196/12384 [24:57<25:46:35, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=5.81s]
Epoch 1: 2%|▏ | 196/12384 [25:05<25:46:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 2%|▏ | 197/12384 [25:05<25:46:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 2%|▏ | 197/12384 [25:13<25:46:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 2%|▏ | 198/12384 [25:13<25:46:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 2%|▏ | 198/12384 [25:20<25:46:07, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=2.68s]
Epoch 1: 2%|▏ | 199/12384 [25:20<25:44:07, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=2.68s]
Epoch 1: 2%|▏ | 199/12384 [25:28<25:44:07, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=12.90s]
Epoch 1: 2%|▏ | 200/12384 [25:28<25:44:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=12.90s]
Epoch 1: 2%|▏ | 200/12384 [25:35<25:44:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.90s]
Epoch 1: 2%|▏ | 201/12384 [25:35<25:42:17, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.90s]
Epoch 1: 2%|▏ | 201/12384 [25:43<25:42:17, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.95s]
Epoch 1: 2%|▏ | 202/12384 [25:43<25:42:40, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.95s]
Epoch 1: 2%|▏ | 202/12384 [25:51<25:42:40, 7.60s/it, loss=0.0004, acc=0.9983, iter_time=8.53s]
Epoch 1: 2%|▏ | 203/12384 [25:51<25:42:10, 7.60s/it, loss=0.0004, acc=0.9983, iter_time=8.53s]
Epoch 1: 2%|▏ | 203/12384 [25:58<25:42:10, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 2%|▏ | 204/12384 [25:58<25:42:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 2%|▏ | 204/12384 [26:06<25:42:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 2%|▏ | 205/12384 [26:06<25:49:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 2%|▏ | 205/12384 [26:13<25:49:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 1: 2%|▏ | 206/12384 [26:13<25:47:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 1: 2%|▏ | 206/12384 [26:21<25:47:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.77s]
Epoch 1: 2%|▏ | 207/12384 [26:21<25:46:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.77s]
Epoch 1: 2%|▏ | 207/12384 [26:29<25:46:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.84s]
Epoch 1: 2%|▏ | 208/12384 [26:29<25:48:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.84s]
Epoch 1: 2%|▏ | 208/12384 [26:36<25:48:26, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.27s]
Epoch 1: 2%|▏ | 209/12384 [26:36<25:47:38, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.27s]
Epoch 1: 2%|▏ | 209/12384 [26:44<25:47:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 2%|▏ | 210/12384 [26:44<25:46:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 2%|▏ | 210/12384 [26:52<25:46:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 1: 2%|▏ | 211/12384 [26:52<25:50:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 1: 2%|▏ | 211/12384 [26:59<25:50:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.56s]
Epoch 1: 2%|▏ | 212/12384 [26:59<25:48:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.56s]
Epoch 1: 2%|▏ | 212/12384 [27:07<25:48:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 2%|▏ | 213/12384 [27:07<25:46:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 2%|▏ | 213/12384 [27:14<25:46:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.95s]
Epoch 1: 2%|▏ | 214/12384 [27:14<25:46:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.95s]
Epoch 1: 2%|▏ | 214/12384 [27:22<25:46:19, 7.62s/it, loss=0.0006, acc=0.9979, iter_time=6.20s]
Epoch 1: 2%|▏ | 215/12384 [27:22<25:45:57, 7.62s/it, loss=0.0006, acc=0.9979, iter_time=6.20s]
Epoch 1: 2%|▏ | 215/12384 [27:30<25:45:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.51s]
Epoch 1: 2%|▏ | 216/12384 [27:30<26:08:52, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=10.51s]
Epoch 1: 2%|▏ | 216/12384 [27:38<26:08:52, 7.74s/it, loss=0.0001, acc=0.9999, iter_time=7.21s]
Epoch 1: 2%|▏ | 217/12384 [27:38<26:01:02, 7.70s/it, loss=0.0001, acc=0.9999, iter_time=7.21s]
Epoch 1: 2%|▏ | 217/12384 [27:45<26:01:02, 7.70s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 1: 2%|▏ | 218/12384 [27:45<25:55:42, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 1: 2%|▏ | 218/12384 [27:53<25:55:42, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 1: 2%|▏ | 219/12384 [27:53<25:53:15, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 1: 2%|▏ | 219/12384 [28:01<25:53:15, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 1: 2%|▏ | 220/12384 [28:01<25:50:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 1: 2%|▏ | 220/12384 [28:08<25:50:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.55s]
Epoch 1: 2%|▏ | 221/12384 [28:08<25:48:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.55s]
Epoch 1: 2%|▏ | 221/12384 [28:16<25:48:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.66s]
Epoch 1: 2%|▏ | 222/12384 [28:16<25:45:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.66s]
Epoch 1: 2%|▏ | 222/12384 [28:23<25:45:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 2%|▏ | 223/12384 [28:23<25:43:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 2%|▏ | 223/12384 [28:31<25:43:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 2%|▏ | 224/12384 [28:31<25:44:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 2%|▏ | 224/12384 [28:39<25:44:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 2%|▏ | 225/12384 [28:39<25:42:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 2%|▏ | 225/12384 [28:46<25:42:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 1: 2%|▏ | 226/12384 [28:46<25:42:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 1: 2%|▏ | 226/12384 [28:54<25:42:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 1: 2%|▏ | 227/12384 [28:54<25:44:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 1: 2%|▏ | 227/12384 [29:01<25:44:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 2%|▏ | 228/12384 [29:01<25:42:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 2%|▏ | 228/12384 [29:09<25:42:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 1: 2%|▏ | 229/12384 [29:09<25:42:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 1: 2%|▏ | 229/12384 [29:17<25:42:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 2%|▏ | 230/12384 [29:17<25:41:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 2%|▏ | 230/12384 [29:24<25:41:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 2%|▏ | 231/12384 [29:24<25:42:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 2%|▏ | 231/12384 [29:32<25:42:06, 7.61s/it, loss=0.0002, acc=0.9999, iter_time=8.00s]
Epoch 1: 2%|▏ | 232/12384 [29:32<25:44:29, 7.63s/it, loss=0.0002, acc=0.9999, iter_time=8.00s]
Epoch 1: 2%|▏ | 232/12384 [29:40<25:44:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 2%|▏ | 233/12384 [29:40<25:41:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 2%|▏ | 233/12384 [29:47<25:41:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 2%|▏ | 234/12384 [29:47<25:40:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 2%|▏ | 234/12384 [29:55<25:40:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 2%|▏ | 235/12384 [29:55<25:40:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 2%|▏ | 235/12384 [30:02<25:40:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.89s]
Epoch 1: 2%|▏ | 236/12384 [30:02<25:40:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.89s]
Epoch 1: 2%|▏ | 236/12384 [30:10<25:40:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 1: 2%|▏ | 237/12384 [30:10<25:40:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 1: 2%|▏ | 237/12384 [30:18<25:40:55, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.01s]
Epoch 1: 2%|▏ | 238/12384 [30:18<25:41:01, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.01s]
Epoch 1: 2%|▏ | 238/12384 [30:25<25:41:01, 7.61s/it, loss=0.0000, acc=0.9998, iter_time=6.00s]
Epoch 1: 2%|▏ | 239/12384 [30:25<25:41:08, 7.61s/it, loss=0.0000, acc=0.9998, iter_time=6.00s]
Epoch 1: 2%|▏ | 239/12384 [30:33<25:41:08, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.83s]
Epoch 1: 2%|▏ | 240/12384 [30:33<25:58:16, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=10.83s]
Epoch 1: 2%|▏ | 240/12384 [30:41<25:58:16, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.22s]
Epoch 1: 2%|▏ | 241/12384 [30:41<25:51:10, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.22s]
Epoch 1: 2%|▏ | 241/12384 [30:49<25:51:10, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.42s]
Epoch 1: 2%|▏ | 242/12384 [30:49<26:08:57, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=8.42s]
Epoch 1: 2%|▏ | 242/12384 [30:56<26:08:57, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 1: 2%|▏ | 243/12384 [30:56<26:01:19, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 1: 2%|▏ | 243/12384 [31:04<26:01:19, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 2%|▏ | 244/12384 [31:04<25:57:04, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 2%|▏ | 244/12384 [31:12<25:57:04, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 2%|▏ | 245/12384 [31:12<25:52:46, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 2%|▏ | 245/12384 [31:19<25:52:46, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 2%|▏ | 246/12384 [31:19<25:51:42, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 2%|▏ | 246/12384 [31:27<25:51:42, 7.67s/it, loss=0.0002, acc=0.9979, iter_time=5.90s]
Epoch 1: 2%|▏ | 247/12384 [31:27<25:48:58, 7.66s/it, loss=0.0002, acc=0.9979, iter_time=5.90s]
Epoch 1: 2%|▏ | 247/12384 [31:34<25:48:58, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.79s]
Epoch 1: 2%|▏ | 248/12384 [31:34<25:48:52, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.79s]
Epoch 1: 2%|▏ | 248/12384 [31:42<25:48:52, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 2%|▏ | 249/12384 [31:42<25:45:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 2%|▏ | 249/12384 [31:50<25:45:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 2%|▏ | 250/12384 [31:50<25:43:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 2%|▏ | 250/12384 [31:57<25:43:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 1: 2%|▏ | 251/12384 [31:57<25:42:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 1: 2%|▏ | 251/12384 [32:05<25:42:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 1: 2%|▏ | 252/12384 [32:05<25:40:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 1: 2%|▏ | 252/12384 [32:13<25:40:55, 7.62s/it, loss=0.0003, acc=0.9985, iter_time=10.36s]
Epoch 1: 2%|▏ | 253/12384 [32:13<25:42:22, 7.63s/it, loss=0.0003, acc=0.9985, iter_time=10.36s]
Epoch 1: 2%|▏ | 253/12384 [32:20<25:42:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 2%|▏ | 254/12384 [32:20<25:45:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 2%|▏ | 254/12384 [32:28<25:45:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 2%|▏ | 255/12384 [32:28<25:43:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 2%|▏ | 255/12384 [32:36<25:43:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 2%|▏ | 256/12384 [32:36<25:45:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 2%|▏ | 256/12384 [32:43<25:45:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 2%|▏ | 257/12384 [32:43<25:42:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 2%|▏ | 257/12384 [32:51<25:42:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 2%|▏ | 258/12384 [32:51<25:42:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 2%|▏ | 258/12384 [32:58<25:42:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 1: 2%|▏ | 259/12384 [32:58<25:40:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 1: 2%|▏ | 259/12384 [33:06<25:40:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 1: 2%|▏ | 260/12384 [33:06<25:42:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 1: 2%|▏ | 260/12384 [33:14<25:42:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 2%|▏ | 261/12384 [33:14<25:40:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 2%|▏ | 261/12384 [33:21<25:40:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 1: 2%|▏ | 262/12384 [33:21<25:39:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 1: 2%|▏ | 262/12384 [33:29<25:39:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 1: 2%|▏ | 263/12384 [33:29<25:42:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 1: 2%|▏ | 263/12384 [33:36<25:42:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 1: 2%|▏ | 264/12384 [33:36<25:40:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 1: 2%|▏ | 264/12384 [33:44<25:40:06, 7.62s/it, loss=0.0007, acc=0.9978, iter_time=7.53s]
Epoch 1: 2%|▏ | 265/12384 [33:44<25:57:08, 7.71s/it, loss=0.0007, acc=0.9978, iter_time=7.53s]
Epoch 1: 2%|▏ | 265/12384 [33:52<25:57:08, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 2%|▏ | 266/12384 [33:52<25:49:24, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 2%|▏ | 266/12384 [34:00<25:49:24, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 2%|▏ | 267/12384 [34:00<25:46:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 2%|▏ | 267/12384 [34:07<25:46:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 2%|▏ | 268/12384 [34:07<25:43:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 2%|▏ | 268/12384 [34:15<25:43:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 2%|▏ | 269/12384 [34:15<25:58:00, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 2%|▏ | 269/12384 [34:23<25:58:00, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 1: 2%|▏ | 270/12384 [34:23<25:52:24, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 1: 2%|▏ | 270/12384 [34:30<25:52:24, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 1: 2%|▏ | 271/12384 [34:30<25:46:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 1: 2%|▏ | 271/12384 [34:38<25:46:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 2%|▏ | 272/12384 [34:38<25:46:46, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 2%|▏ | 272/12384 [34:46<25:46:46, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 2%|▏ | 273/12384 [34:46<25:44:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 2%|▏ | 273/12384 [34:53<25:44:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 1: 2%|▏ | 274/12384 [34:53<25:40:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 1: 2%|▏ | 274/12384 [35:01<25:40:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 1: 2%|▏ | 275/12384 [35:01<25:40:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 1: 2%|▏ | 275/12384 [35:08<25:40:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 1: 2%|▏ | 276/12384 [35:08<25:39:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 1: 2%|▏ | 276/12384 [35:16<25:39:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 2%|▏ | 277/12384 [35:16<25:37:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 2%|▏ | 277/12384 [35:24<25:37:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 2%|▏ | 278/12384 [35:24<25:37:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 2%|▏ | 278/12384 [35:31<25:37:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 2%|▏ | 279/12384 [35:31<25:36:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 2%|▏ | 279/12384 [35:39<25:36:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 2%|▏ | 280/12384 [35:39<25:34:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 2%|▏ | 280/12384 [35:46<25:34:49, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.19s]
Epoch 1: 2%|▏ | 281/12384 [35:46<25:33:24, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.19s]
Epoch 1: 2%|▏ | 281/12384 [35:54<25:33:24, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 1: 2%|▏ | 282/12384 [35:54<25:34:08, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 1: 2%|▏ | 282/12384 [36:02<25:34:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 1: 2%|▏ | 283/12384 [36:02<25:35:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 1: 2%|▏ | 283/12384 [36:09<25:35:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 1: 2%|▏ | 284/12384 [36:09<25:36:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 1: 2%|▏ | 284/12384 [36:17<25:36:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 1: 2%|▏ | 285/12384 [36:17<25:34:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 1: 2%|▏ | 285/12384 [36:25<25:34:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 1: 2%|▏ | 286/12384 [36:25<25:34:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 1: 2%|▏ | 286/12384 [36:32<25:34:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 2%|▏ | 287/12384 [36:32<25:36:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 2%|▏ | 287/12384 [36:40<25:36:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 2%|▏ | 288/12384 [36:40<25:39:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 2%|▏ | 288/12384 [36:47<25:39:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 2%|▏ | 289/12384 [36:47<25:36:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 2%|▏ | 289/12384 [36:55<25:36:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 1: 2%|▏ | 290/12384 [36:55<25:36:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 1: 2%|▏ | 290/12384 [37:03<25:36:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 1: 2%|▏ | 291/12384 [37:03<25:35:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 1: 2%|▏ | 291/12384 [37:10<25:35:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 1: 2%|▏ | 292/12384 [37:10<25:33:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 1: 2%|▏ | 292/12384 [37:18<25:33:47, 7.61s/it, loss=0.0007, acc=0.9965, iter_time=7.59s]
Epoch 1: 2%|▏ | 293/12384 [37:18<25:32:45, 7.61s/it, loss=0.0007, acc=0.9965, iter_time=7.59s]
Epoch 1: 2%|▏ | 293/12384 [37:25<25:32:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 2%|▏ | 294/12384 [37:25<25:33:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 2%|▏ | 294/12384 [37:33<25:33:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 1: 2%|▏ | 295/12384 [37:33<25:52:48, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 1: 2%|▏ | 295/12384 [37:41<25:52:48, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.50s]
Epoch 1: 2%|▏ | 296/12384 [37:41<25:46:54, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.50s]
Epoch 1: 2%|▏ | 296/12384 [37:49<25:46:54, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.29s]
Epoch 1: 2%|▏ | 297/12384 [37:49<25:43:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.29s]
Epoch 1: 2%|▏ | 297/12384 [37:56<25:43:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 1: 2%|▏ | 298/12384 [37:56<25:40:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 1: 2%|▏ | 298/12384 [38:04<25:40:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 2%|▏ | 299/12384 [38:04<25:38:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 2%|▏ | 299/12384 [38:11<25:38:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 1: 2%|▏ | 300/12384 [38:11<25:36:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 1: 2%|▏ | 300/12384 [38:19<25:36:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 1: 2%|▏ | 301/12384 [38:19<25:37:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 1: 2%|▏ | 301/12384 [38:27<25:37:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 2%|▏ | 302/12384 [38:27<25:34:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 2%|▏ | 302/12384 [38:34<25:34:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 1: 2%|▏ | 303/12384 [38:34<25:31:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 1: 2%|▏ | 303/12384 [38:42<25:31:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.91s]
Epoch 1: 2%|▏ | 304/12384 [38:42<25:31:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.91s]
Epoch 1: 2%|▏ | 304/12384 [38:50<25:31:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 1: 2%|▏ | 305/12384 [38:50<25:31:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 1: 2%|▏ | 305/12384 [38:57<25:31:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.72s]
Epoch 1: 2%|▏ | 306/12384 [38:57<25:30:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.72s]
Epoch 1: 2%|▏ | 306/12384 [39:05<25:30:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 2%|▏ | 307/12384 [39:05<25:31:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 2%|▏ | 307/12384 [39:12<25:31:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 2%|▏ | 308/12384 [39:12<25:33:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 2%|▏ | 308/12384 [39:20<25:33:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 2%|▏ | 309/12384 [39:20<25:31:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 2%|▏ | 309/12384 [39:28<25:31:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 1: 3%|▎ | 310/12384 [39:28<25:30:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 1: 3%|▎ | 310/12384 [39:35<25:30:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.44s]
Epoch 1: 3%|▎ | 311/12384 [39:35<25:36:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.44s]
Epoch 1: 3%|▎ | 311/12384 [39:43<25:36:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 3%|▎ | 312/12384 [39:43<25:34:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 3%|▎ | 312/12384 [39:50<25:34:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 3%|▎ | 313/12384 [39:50<25:32:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 3%|▎ | 313/12384 [39:58<25:32:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 1: 3%|▎ | 314/12384 [39:58<25:32:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 1: 3%|▎ | 314/12384 [40:06<25:32:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.94s]
Epoch 1: 3%|▎ | 315/12384 [40:06<25:28:40, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.94s]
Epoch 1: 3%|▎ | 315/12384 [40:13<25:28:40, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.10s]
Epoch 1: 3%|▎ | 316/12384 [40:13<25:29:29, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.10s]
Epoch 1: 3%|▎ | 316/12384 [40:21<25:29:29, 7.60s/it, loss=0.0008, acc=0.9974, iter_time=7.19s]
Epoch 1: 3%|▎ | 317/12384 [40:21<25:31:58, 7.62s/it, loss=0.0008, acc=0.9974, iter_time=7.19s]
Epoch 1: 3%|▎ | 317/12384 [40:29<25:31:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 3%|▎ | 318/12384 [40:29<25:31:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 3%|▎ | 318/12384 [40:36<25:31:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 3%|▎ | 319/12384 [40:36<25:32:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 3%|▎ | 319/12384 [40:44<25:32:48, 7.62s/it, loss=0.0006, acc=0.9976, iter_time=8.04s]
Epoch 1: 3%|▎ | 320/12384 [40:44<25:31:42, 7.62s/it, loss=0.0006, acc=0.9976, iter_time=8.04s]
Epoch 1: 3%|▎ | 320/12384 [40:52<25:31:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 3%|▎ | 321/12384 [40:52<25:50:17, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 3%|▎ | 321/12384 [40:59<25:50:17, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 1: 3%|▎ | 322/12384 [40:59<25:48:52, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 1: 3%|▎ | 322/12384 [41:07<25:48:52, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.76s]
Epoch 1: 3%|▎ | 323/12384 [41:07<25:42:28, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.76s]
Epoch 1: 3%|▎ | 323/12384 [41:15<25:42:28, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 1: 3%|▎ | 324/12384 [41:15<25:37:01, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 1: 3%|▎ | 324/12384 [41:22<25:37:01, 7.65s/it, loss=0.0006, acc=0.9951, iter_time=8.51s]
Epoch 1: 3%|▎ | 325/12384 [41:22<25:33:28, 7.63s/it, loss=0.0006, acc=0.9951, iter_time=8.51s]
Epoch 1: 3%|▎ | 325/12384 [41:30<25:33:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 3%|▎ | 326/12384 [41:30<25:31:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 3%|▎ | 326/12384 [41:37<25:31:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 3%|▎ | 327/12384 [41:37<25:31:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 3%|▎ | 327/12384 [41:45<25:31:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 1: 3%|▎ | 328/12384 [41:45<25:33:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 1: 3%|▎ | 328/12384 [41:53<25:33:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 3%|▎ | 329/12384 [41:53<25:31:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 3%|▎ | 329/12384 [42:00<25:31:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 1: 3%|▎ | 330/12384 [42:00<25:31:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 1: 3%|▎ | 330/12384 [42:08<25:31:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 1: 3%|▎ | 331/12384 [42:08<25:30:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 1: 3%|▎ | 331/12384 [42:15<25:30:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 3%|▎ | 332/12384 [42:15<25:30:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 3%|▎ | 332/12384 [42:23<25:30:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 3%|▎ | 333/12384 [42:23<25:29:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 3%|▎ | 333/12384 [42:31<25:29:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 1: 3%|▎ | 334/12384 [42:31<25:29:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 1: 3%|▎ | 334/12384 [42:38<25:29:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.38s]
Epoch 1: 3%|▎ | 335/12384 [42:38<25:34:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.38s]
Epoch 1: 3%|▎ | 335/12384 [42:46<25:34:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 3%|▎ | 336/12384 [42:46<25:35:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 3%|▎ | 336/12384 [42:54<25:35:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 1: 3%|▎ | 337/12384 [42:54<25:31:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 1: 3%|▎ | 337/12384 [43:01<25:31:13, 7.63s/it, loss=0.0007, acc=0.9972, iter_time=10.41s]
Epoch 1: 3%|▎ | 338/12384 [43:01<25:29:55, 7.62s/it, loss=0.0007, acc=0.9972, iter_time=10.41s]
Epoch 1: 3%|▎ | 338/12384 [43:09<25:29:55, 7.62s/it, loss=0.0002, acc=0.9992, iter_time=7.63s]
Epoch 1: 3%|▎ | 339/12384 [43:09<25:28:30, 7.61s/it, loss=0.0002, acc=0.9992, iter_time=7.63s]
Epoch 1: 3%|▎ | 339/12384 [43:16<25:28:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 1: 3%|▎ | 340/12384 [43:16<25:27:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 1: 3%|▎ | 340/12384 [43:24<25:27:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 1: 3%|▎ | 341/12384 [43:24<25:26:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 1: 3%|▎ | 341/12384 [43:32<25:26:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.95s]
Epoch 1: 3%|▎ | 342/12384 [43:32<25:45:11, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.95s]
Epoch 1: 3%|▎ | 342/12384 [43:40<25:45:11, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 3%|▎ | 343/12384 [43:40<25:38:31, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 3%|▎ | 343/12384 [43:47<25:38:31, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.97s]
Epoch 1: 3%|▎ | 344/12384 [43:47<25:34:12, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.97s]
Epoch 1: 3%|▎ | 344/12384 [43:55<25:34:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 3%|▎ | 345/12384 [43:55<25:33:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 3%|▎ | 345/12384 [44:02<25:33:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 3%|▎ | 346/12384 [44:02<25:33:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 3%|▎ | 346/12384 [44:10<25:33:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 3%|▎ | 347/12384 [44:10<25:52:37, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 3%|▎ | 347/12384 [44:18<25:52:37, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 3%|▎ | 348/12384 [44:18<25:43:56, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 3%|▎ | 348/12384 [44:26<25:43:56, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 3%|▎ | 349/12384 [44:26<25:38:32, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 3%|▎ | 349/12384 [44:33<25:38:32, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 3%|▎ | 350/12384 [44:33<25:37:39, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 3%|▎ | 350/12384 [44:41<25:37:39, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 3%|▎ | 351/12384 [44:41<25:33:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 3%|▎ | 351/12384 [44:48<25:33:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 3%|▎ | 352/12384 [44:48<25:33:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 3%|▎ | 352/12384 [44:56<25:33:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 3%|▎ | 353/12384 [44:56<25:36:49, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 3%|▎ | 353/12384 [45:04<25:36:49, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 3%|▎ | 354/12384 [45:04<25:33:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 3%|▎ | 354/12384 [45:11<25:33:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 3%|▎ | 355/12384 [45:11<25:31:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 3%|▎ | 355/12384 [45:19<25:31:18, 7.64s/it, loss=0.0006, acc=0.9973, iter_time=7.60s]
Epoch 1: 3%|▎ | 356/12384 [45:19<25:28:38, 7.63s/it, loss=0.0006, acc=0.9973, iter_time=7.60s]
Epoch 1: 3%|▎ | 356/12384 [45:27<25:28:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.58s]
Epoch 1: 3%|▎ | 357/12384 [45:27<25:26:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.58s]
Epoch 1: 3%|▎ | 357/12384 [45:34<25:26:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.60s]
Epoch 1: 3%|▎ | 358/12384 [45:34<25:26:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.60s]
Epoch 1: 3%|▎ | 358/12384 [45:42<25:26:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 3%|▎ | 359/12384 [45:42<25:29:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 3%|▎ | 359/12384 [45:49<25:29:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 3%|▎ | 360/12384 [45:49<25:27:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 3%|▎ | 360/12384 [45:57<25:27:02, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=3.91s]
Epoch 1: 3%|▎ | 361/12384 [45:57<25:27:55, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=3.91s]
Epoch 1: 3%|▎ | 361/12384 [46:05<25:27:55, 7.63s/it, loss=0.0004, acc=1.0000, iter_time=11.37s]
Epoch 1: 3%|▎ | 362/12384 [46:05<25:27:21, 7.62s/it, loss=0.0004, acc=1.0000, iter_time=11.37s]
Epoch 1: 3%|▎ | 362/12384 [46:12<25:27:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 3%|▎ | 363/12384 [46:12<25:26:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 3%|▎ | 363/12384 [46:20<25:26:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 3%|▎ | 364/12384 [46:20<25:25:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 3%|▎ | 364/12384 [46:28<25:25:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 3%|▎ | 365/12384 [46:28<25:27:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 3%|▎ | 365/12384 [46:35<25:27:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 3%|▎ | 366/12384 [46:35<25:25:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 3%|▎ | 366/12384 [46:43<25:25:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.67s]
Epoch 1: 3%|▎ | 367/12384 [46:43<25:23:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.67s]
Epoch 1: 3%|▎ | 367/12384 [46:50<25:23:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 1: 3%|▎ | 368/12384 [46:50<25:26:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 1: 3%|▎ | 368/12384 [46:58<25:26:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 1: 3%|▎ | 369/12384 [46:58<25:25:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 1: 3%|▎ | 369/12384 [47:06<25:25:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 1: 3%|▎ | 370/12384 [47:06<25:28:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 1: 3%|▎ | 370/12384 [47:13<25:28:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.92s]
Epoch 1: 3%|▎ | 371/12384 [47:13<25:26:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.92s]
Epoch 1: 3%|▎ | 371/12384 [47:21<25:26:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 3%|▎ | 372/12384 [47:21<25:25:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 3%|▎ | 372/12384 [47:29<25:25:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 1: 3%|▎ | 373/12384 [47:29<25:44:35, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 1: 3%|▎ | 373/12384 [47:36<25:44:35, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=7.89s]
Epoch 1: 3%|▎ | 374/12384 [47:36<25:37:11, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.89s]
Epoch 1: 3%|▎ | 374/12384 [47:44<25:37:11, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 3%|▎ | 375/12384 [47:44<25:33:13, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 3%|▎ | 375/12384 [47:52<25:33:13, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 3%|▎ | 376/12384 [47:52<25:29:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 3%|▎ | 376/12384 [47:59<25:29:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.40s]
Epoch 1: 3%|▎ | 377/12384 [47:59<25:26:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.40s]
Epoch 1: 3%|▎ | 377/12384 [48:07<25:26:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 3%|▎ | 378/12384 [48:07<25:24:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 3%|▎ | 378/12384 [48:14<25:24:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 1: 3%|▎ | 379/12384 [48:14<25:24:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 1: 3%|▎ | 379/12384 [48:22<25:24:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 1: 3%|▎ | 380/12384 [48:22<25:22:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 1: 3%|▎ | 380/12384 [48:30<25:22:57, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=7.69s]
Epoch 1: 3%|▎ | 381/12384 [48:30<25:27:33, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=7.69s]
Epoch 1: 3%|▎ | 381/12384 [48:37<25:27:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 3%|▎ | 382/12384 [48:37<25:25:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 3%|▎ | 382/12384 [48:45<25:25:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 3%|▎ | 383/12384 [48:45<25:23:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 3%|▎ | 383/12384 [48:53<25:23:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 3%|▎ | 384/12384 [48:53<25:24:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 3%|▎ | 384/12384 [49:00<25:24:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.39s]
Epoch 1: 3%|▎ | 385/12384 [49:00<25:23:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.39s]
Epoch 1: 3%|▎ | 385/12384 [49:08<25:23:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 1: 3%|▎ | 386/12384 [49:08<25:22:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 1: 3%|▎ | 386/12384 [49:15<25:22:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 1: 3%|▎ | 387/12384 [49:15<25:22:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 1: 3%|▎ | 387/12384 [49:23<25:22:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 3%|▎ | 388/12384 [49:23<25:21:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 3%|▎ | 388/12384 [49:31<25:21:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.99s]
Epoch 1: 3%|▎ | 389/12384 [49:31<25:21:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.99s]
Epoch 1: 3%|▎ | 389/12384 [49:38<25:21:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 3%|▎ | 390/12384 [49:38<25:20:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 3%|▎ | 390/12384 [49:46<25:20:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 3%|▎ | 391/12384 [49:46<25:25:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 3%|▎ | 391/12384 [49:54<25:25:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 1: 3%|▎ | 392/12384 [49:54<25:24:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 1: 3%|▎ | 392/12384 [50:01<25:24:23, 7.63s/it, loss=0.0009, acc=0.9970, iter_time=7.20s]
Epoch 1: 3%|▎ | 393/12384 [50:01<25:23:13, 7.62s/it, loss=0.0009, acc=0.9970, iter_time=7.20s]
Epoch 1: 3%|▎ | 393/12384 [50:09<25:23:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 3%|▎ | 394/12384 [50:09<25:21:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 3%|▎ | 394/12384 [50:17<25:21:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 3%|▎ | 395/12384 [50:17<25:37:38, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 3%|▎ | 395/12384 [50:24<25:37:38, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.49s]
Epoch 1: 3%|▎ | 396/12384 [50:24<25:34:04, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.49s]
Epoch 1: 3%|▎ | 396/12384 [50:32<25:34:04, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.74s]
Epoch 1: 3%|▎ | 397/12384 [50:32<25:29:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.74s]
Epoch 1: 3%|▎ | 397/12384 [50:39<25:29:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 3%|▎ | 398/12384 [50:39<25:26:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 3%|▎ | 398/12384 [50:47<25:26:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 3%|▎ | 399/12384 [50:47<25:23:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 3%|▎ | 399/12384 [50:55<25:23:28, 7.63s/it, loss=0.0001, acc=0.9997, iter_time=8.05s]
Epoch 1: 3%|▎ | 400/12384 [50:55<25:41:32, 7.72s/it, loss=0.0001, acc=0.9997, iter_time=8.05s]
Epoch 1: 3%|▎ | 400/12384 [51:03<25:41:32, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.42s]
Epoch 1: 3%|▎ | 401/12384 [51:03<25:34:08, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.42s]
Epoch 1: 3%|▎ | 401/12384 [51:10<25:34:08, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.63s]
Epoch 1: 3%|▎ | 402/12384 [51:10<25:30:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.63s]
Epoch 1: 3%|▎ | 402/12384 [51:18<25:30:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 3%|▎ | 403/12384 [51:18<25:25:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 3%|▎ | 403/12384 [51:25<25:25:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 3%|▎ | 404/12384 [51:25<25:24:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 3%|▎ | 404/12384 [51:33<25:24:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 3%|▎ | 405/12384 [51:33<25:24:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 3%|▎ | 405/12384 [51:41<25:24:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 3%|▎ | 406/12384 [51:41<25:23:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 3%|▎ | 406/12384 [51:48<25:23:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.08s]
Epoch 1: 3%|▎ | 407/12384 [51:48<25:22:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.08s]
Epoch 1: 3%|▎ | 407/12384 [51:56<25:22:33, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.57s]
Epoch 1: 3%|▎ | 408/12384 [51:56<25:21:39, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.57s]
Epoch 1: 3%|▎ | 408/12384 [52:04<25:21:39, 7.62s/it, loss=0.0023, acc=0.9967, iter_time=4.96s]
Epoch 1: 3%|▎ | 409/12384 [52:04<25:19:22, 7.61s/it, loss=0.0023, acc=0.9967, iter_time=4.96s]
Epoch 1: 3%|▎ | 409/12384 [52:11<25:19:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 1: 3%|▎ | 410/12384 [52:11<25:17:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 1: 3%|▎ | 410/12384 [52:19<25:17:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.00s]
Epoch 1: 3%|▎ | 411/12384 [52:19<25:21:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.00s]
Epoch 1: 3%|▎ | 411/12384 [52:26<25:21:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.20s]
Epoch 1: 3%|▎ | 412/12384 [52:26<25:24:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.20s]
Epoch 1: 3%|▎ | 412/12384 [52:34<25:24:03, 7.64s/it, loss=0.0001, acc=0.9999, iter_time=7.68s]
Epoch 1: 3%|▎ | 413/12384 [52:34<25:21:41, 7.63s/it, loss=0.0001, acc=0.9999, iter_time=7.68s]
Epoch 1: 3%|▎ | 413/12384 [52:42<25:21:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 3%|▎ | 414/12384 [52:42<25:20:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 3%|▎ | 414/12384 [52:49<25:20:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 1: 3%|▎ | 415/12384 [52:49<25:19:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 1: 3%|▎ | 415/12384 [52:57<25:19:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.93s]
Epoch 1: 3%|▎ | 416/12384 [52:57<25:18:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.93s]
Epoch 1: 3%|▎ | 416/12384 [53:04<25:18:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.84s]
Epoch 1: 3%|▎ | 417/12384 [53:04<25:18:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.84s]
Epoch 1: 3%|▎ | 417/12384 [53:12<25:18:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.95s]
Epoch 1: 3%|▎ | 418/12384 [53:12<25:17:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.95s]
Epoch 1: 3%|▎ | 418/12384 [53:20<25:17:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 3%|▎ | 419/12384 [53:20<25:17:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 3%|▎ | 419/12384 [53:27<25:17:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 3%|▎ | 420/12384 [53:27<25:22:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 3%|▎ | 420/12384 [53:35<25:22:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 3%|▎ | 421/12384 [53:35<25:37:18, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 3%|▎ | 421/12384 [53:43<25:37:18, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 3%|▎ | 422/12384 [53:43<25:31:53, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 3%|▎ | 422/12384 [53:51<25:31:53, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 1: 3%|▎ | 423/12384 [53:51<25:27:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 1: 3%|▎ | 423/12384 [53:58<25:27:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 1: 3%|▎ | 424/12384 [53:58<25:24:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 1: 3%|▎ | 424/12384 [54:06<25:24:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 3%|▎ | 425/12384 [54:06<25:26:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 3%|▎ | 425/12384 [54:14<25:26:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=3.97s]
Epoch 1: 3%|▎ | 426/12384 [54:14<25:39:59, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=3.97s]
Epoch 1: 3%|▎ | 426/12384 [54:21<25:39:59, 7.73s/it, loss=0.0004, acc=0.9986, iter_time=11.29s]
Epoch 1: 3%|▎ | 427/12384 [54:21<25:33:36, 7.70s/it, loss=0.0004, acc=0.9986, iter_time=11.29s]
Epoch 1: 3%|▎ | 427/12384 [54:29<25:33:36, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 3%|▎ | 428/12384 [54:29<25:28:58, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 3%|▎ | 428/12384 [54:37<25:28:58, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 3%|▎ | 429/12384 [54:37<25:25:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 3%|▎ | 429/12384 [54:44<25:25:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 3%|▎ | 430/12384 [54:44<25:22:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 3%|▎ | 430/12384 [54:52<25:22:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 3%|▎ | 431/12384 [54:52<25:20:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 3%|▎ | 431/12384 [54:59<25:20:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 1: 3%|▎ | 432/12384 [54:59<25:24:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 1: 3%|▎ | 432/12384 [55:07<25:24:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 3%|▎ | 433/12384 [55:07<25:21:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 3%|▎ | 433/12384 [55:15<25:21:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 4%|▎ | 434/12384 [55:15<25:20:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 4%|▎ | 434/12384 [55:22<25:20:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 4%|▎ | 435/12384 [55:22<25:17:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 4%|▎ | 435/12384 [55:30<25:17:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 4%|▎ | 436/12384 [55:30<25:17:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 4%|▎ | 436/12384 [55:38<25:17:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 4%|▎ | 437/12384 [55:38<25:17:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 4%|▎ | 437/12384 [55:45<25:17:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 4%|▎ | 438/12384 [55:45<25:17:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 4%|▎ | 438/12384 [55:53<25:17:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 4%|▎ | 439/12384 [55:53<25:19:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 4%|▎ | 439/12384 [56:00<25:19:41, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.64s]
Epoch 1: 4%|▎ | 440/12384 [56:00<25:19:07, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.64s]
Epoch 1: 4%|▎ | 440/12384 [56:08<25:19:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 1: 4%|▎ | 441/12384 [56:08<25:16:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 1: 4%|▎ | 441/12384 [56:16<25:16:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.91s]
Epoch 1: 4%|▎ | 442/12384 [56:16<25:14:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.91s]
Epoch 1: 4%|▎ | 442/12384 [56:23<25:14:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 4%|▎ | 443/12384 [56:23<25:13:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 4%|▎ | 443/12384 [56:31<25:13:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 4%|▎ | 444/12384 [56:31<25:18:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 4%|▎ | 444/12384 [56:39<25:18:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.29s]
Epoch 1: 4%|▎ | 445/12384 [56:39<25:17:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.29s]
Epoch 1: 4%|▎ | 445/12384 [56:46<25:17:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 1: 4%|▎ | 446/12384 [56:46<25:14:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 1: 4%|▎ | 446/12384 [56:54<25:14:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 4%|▎ | 447/12384 [56:54<25:29:54, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 4%|▎ | 447/12384 [57:02<25:29:54, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 4%|▎ | 448/12384 [57:02<25:25:03, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 4%|▎ | 448/12384 [57:09<25:25:03, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 1: 4%|▎ | 449/12384 [57:09<25:21:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 1: 4%|▎ | 449/12384 [57:17<25:21:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 1: 4%|▎ | 450/12384 [57:17<25:19:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 1: 4%|▎ | 450/12384 [57:24<25:19:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 1: 4%|▎ | 451/12384 [57:24<25:18:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 1: 4%|▎ | 451/12384 [57:32<25:18:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 1: 4%|▎ | 452/12384 [57:32<25:17:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 1: 4%|▎ | 452/12384 [57:40<25:17:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 1: 4%|▎ | 453/12384 [57:40<25:37:10, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 1: 4%|▎ | 453/12384 [57:48<25:37:10, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 4%|▎ | 454/12384 [57:48<25:33:34, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 4%|▎ | 454/12384 [57:55<25:33:34, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.43s]
Epoch 1: 4%|▎ | 455/12384 [57:55<25:25:52, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.43s]
Epoch 1: 4%|▎ | 455/12384 [58:03<25:25:52, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 1: 4%|▎ | 456/12384 [58:03<25:28:18, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 1: 4%|▎ | 456/12384 [58:11<25:28:18, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 1: 4%|▎ | 457/12384 [58:11<25:25:36, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 1: 4%|▎ | 457/12384 [58:18<25:25:36, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 4%|▎ | 458/12384 [58:18<25:22:12, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 4%|▎ | 458/12384 [58:26<25:22:12, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 4%|▎ | 459/12384 [58:26<25:19:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 4%|▎ | 459/12384 [58:33<25:19:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 4%|▎ | 460/12384 [58:33<25:16:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 4%|▎ | 460/12384 [58:41<25:16:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 4%|▎ | 461/12384 [58:41<25:15:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 4%|▎ | 461/12384 [58:49<25:15:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 4%|▎ | 462/12384 [58:49<25:14:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 4%|▎ | 462/12384 [58:56<25:14:50, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 1: 4%|▎ | 463/12384 [58:56<25:12:58, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 1: 4%|▎ | 463/12384 [59:04<25:12:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 4%|▎ | 464/12384 [59:04<25:13:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 4%|▎ | 464/12384 [59:12<25:13:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 4%|▍ | 465/12384 [59:12<25:12:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 4%|▍ | 465/12384 [59:19<25:12:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 4%|▍ | 466/12384 [59:19<25:13:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 4%|▍ | 466/12384 [59:27<25:13:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 4%|▍ | 467/12384 [59:27<25:14:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 4%|▍ | 467/12384 [59:34<25:14:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 1: 4%|▍ | 468/12384 [59:34<25:13:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 1: 4%|▍ | 468/12384 [59:42<25:13:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 1: 4%|▍ | 469/12384 [59:42<25:13:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 1: 4%|▍ | 469/12384 [59:50<25:13:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 4%|▍ | 470/12384 [59:50<25:11:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 4%|▍ | 470/12384 [59:57<25:11:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 4%|▍ | 471/12384 [59:57<25:10:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 4%|▍ | 471/12384 [1:00:05<25:10:47, 7.61s/it, loss=0.0004, acc=1.0000, iter_time=7.98s]
Epoch 1: 4%|▍ | 472/12384 [1:00:05<25:10:37, 7.61s/it, loss=0.0004, acc=1.0000, iter_time=7.98s]
Epoch 1: 4%|▍ | 472/12384 [1:00:13<25:10:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.49s]
Epoch 1: 4%|▍ | 473/12384 [1:00:13<25:26:23, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.49s]
Epoch 1: 4%|▍ | 473/12384 [1:00:20<25:26:23, 7.69s/it, loss=0.0001, acc=0.9990, iter_time=7.59s]
Epoch 1: 4%|▍ | 474/12384 [1:00:20<25:20:39, 7.66s/it, loss=0.0001, acc=0.9990, iter_time=7.59s]
Epoch 1: 4%|▍ | 474/12384 [1:00:28<25:20:39, 7.66s/it, loss=0.0005, acc=0.9981, iter_time=7.60s]
Epoch 1: 4%|▍ | 475/12384 [1:00:28<25:16:44, 7.64s/it, loss=0.0005, acc=0.9981, iter_time=7.60s]
Epoch 1: 4%|▍ | 475/12384 [1:00:36<25:16:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 1: 4%|▍ | 476/12384 [1:00:36<25:14:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 1: 4%|▍ | 476/12384 [1:00:43<25:14:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 1: 4%|▍ | 477/12384 [1:00:43<25:13:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 1: 4%|▍ | 477/12384 [1:00:51<25:13:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 4%|▍ | 478/12384 [1:00:51<25:12:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 4%|▍ | 478/12384 [1:00:59<25:12:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 1: 4%|▍ | 479/12384 [1:00:59<25:28:57, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 1: 4%|▍ | 479/12384 [1:01:06<25:28:57, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 4%|▍ | 480/12384 [1:01:06<25:22:59, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 4%|▍ | 480/12384 [1:01:14<25:22:59, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 4%|▍ | 481/12384 [1:01:14<25:18:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 4%|▍ | 481/12384 [1:01:21<25:18:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 4%|▍ | 482/12384 [1:01:21<25:16:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 4%|▍ | 482/12384 [1:01:29<25:16:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 4%|▍ | 483/12384 [1:01:29<25:13:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 4%|▍ | 483/12384 [1:01:37<25:13:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 1: 4%|▍ | 484/12384 [1:01:37<25:12:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 1: 4%|▍ | 484/12384 [1:01:44<25:12:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 1: 4%|▍ | 485/12384 [1:01:44<25:13:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 1: 4%|▍ | 485/12384 [1:01:52<25:13:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 1: 4%|▍ | 486/12384 [1:01:52<25:13:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 1: 4%|▍ | 486/12384 [1:02:00<25:13:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 1: 4%|▍ | 487/12384 [1:02:00<25:11:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 1: 4%|▍ | 487/12384 [1:02:07<25:11:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 1: 4%|▍ | 488/12384 [1:02:07<25:11:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 1: 4%|▍ | 488/12384 [1:02:15<25:11:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 1: 4%|▍ | 489/12384 [1:02:15<25:13:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 1: 4%|▍ | 489/12384 [1:02:22<25:13:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 1: 4%|▍ | 490/12384 [1:02:22<25:12:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 1: 4%|▍ | 490/12384 [1:02:30<25:12:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 1: 4%|▍ | 491/12384 [1:02:30<25:09:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 1: 4%|▍ | 491/12384 [1:02:38<25:09:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 4%|▍ | 492/12384 [1:02:38<25:09:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 4%|▍ | 492/12384 [1:02:45<25:09:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 1: 4%|▍ | 493/12384 [1:02:45<25:13:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 1: 4%|▍ | 493/12384 [1:02:53<25:13:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 1: 4%|▍ | 494/12384 [1:02:53<25:10:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 1: 4%|▍ | 494/12384 [1:03:01<25:10:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 1: 4%|▍ | 495/12384 [1:03:01<25:09:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 1: 4%|▍ | 495/12384 [1:03:08<25:09:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.11s]
Epoch 1: 4%|▍ | 496/12384 [1:03:08<25:09:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.11s]
Epoch 1: 4%|▍ | 496/12384 [1:03:16<25:09:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 4%|▍ | 497/12384 [1:03:16<25:14:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 4%|▍ | 497/12384 [1:03:23<25:14:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 4%|▍ | 498/12384 [1:03:23<25:12:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 4%|▍ | 498/12384 [1:03:31<25:12:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.94s]
Epoch 1: 4%|▍ | 499/12384 [1:03:31<25:10:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.94s]
Epoch 1: 4%|▍ | 499/12384 [1:03:39<25:10:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 1: 4%|▍ | 500/12384 [1:03:39<25:09:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 1: 4%|▍ | 500/12384 [1:03:46<25:09:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 4%|▍ | 501/12384 [1:03:46<25:09:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 4%|▍ | 501/12384 [1:03:54<25:09:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 4%|▍ | 502/12384 [1:03:54<25:08:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 4%|▍ | 502/12384 [1:04:02<25:08:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 1: 4%|▍ | 503/12384 [1:04:02<25:07:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 1: 4%|▍ | 503/12384 [1:04:09<25:07:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 4%|▍ | 504/12384 [1:04:09<25:08:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 4%|▍ | 504/12384 [1:04:17<25:08:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 4%|▍ | 505/12384 [1:04:17<25:27:05, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 4%|▍ | 505/12384 [1:04:25<25:27:05, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.85s]
Epoch 1: 4%|▍ | 506/12384 [1:04:25<25:19:37, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.85s]
Epoch 1: 4%|▍ | 506/12384 [1:04:32<25:19:37, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 1: 4%|▍ | 507/12384 [1:04:32<25:17:44, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 1: 4%|▍ | 507/12384 [1:04:40<25:17:44, 7.67s/it, loss=0.0002, acc=0.9990, iter_time=8.85s]
Epoch 1: 4%|▍ | 508/12384 [1:04:40<25:14:36, 7.65s/it, loss=0.0002, acc=0.9990, iter_time=8.85s]
Epoch 1: 4%|▍ | 508/12384 [1:04:48<25:14:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 4%|▍ | 509/12384 [1:04:48<25:13:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 4%|▍ | 509/12384 [1:04:55<25:13:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 4%|▍ | 510/12384 [1:04:55<25:11:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 4%|▍ | 510/12384 [1:05:03<25:11:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 1: 4%|▍ | 511/12384 [1:05:03<25:08:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 1: 4%|▍ | 511/12384 [1:05:10<25:08:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.87s]
Epoch 1: 4%|▍ | 512/12384 [1:05:10<25:08:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.87s]
Epoch 1: 4%|▍ | 512/12384 [1:05:18<25:08:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.64s]
Epoch 1: 4%|▍ | 513/12384 [1:05:18<25:05:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.64s]
Epoch 1: 4%|▍ | 513/12384 [1:05:26<25:05:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.58s]
Epoch 1: 4%|▍ | 514/12384 [1:05:26<25:09:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.58s]
Epoch 1: 4%|▍ | 514/12384 [1:05:33<25:09:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.90s]
Epoch 1: 4%|▍ | 515/12384 [1:05:33<25:07:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.90s]
Epoch 1: 4%|▍ | 515/12384 [1:05:41<25:07:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.85s]
Epoch 1: 4%|▍ | 516/12384 [1:05:41<25:09:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.85s]
Epoch 1: 4%|▍ | 516/12384 [1:05:49<25:09:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.68s]
Epoch 1: 4%|▍ | 517/12384 [1:05:49<25:11:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.68s]
Epoch 1: 4%|▍ | 517/12384 [1:05:56<25:11:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.63s]
Epoch 1: 4%|▍ | 518/12384 [1:05:56<25:10:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.63s]
Epoch 1: 4%|▍ | 518/12384 [1:06:04<25:10:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 4%|▍ | 519/12384 [1:06:04<25:10:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 4%|▍ | 519/12384 [1:06:11<25:10:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.05s]
Epoch 1: 4%|▍ | 520/12384 [1:06:11<25:07:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.05s]
Epoch 1: 4%|▍ | 520/12384 [1:06:19<25:07:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 4%|▍ | 521/12384 [1:06:19<25:06:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 4%|▍ | 521/12384 [1:06:27<25:06:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 4%|▍ | 522/12384 [1:06:27<25:06:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 4%|▍ | 522/12384 [1:06:34<25:06:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 1: 4%|▍ | 523/12384 [1:06:34<25:06:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 1: 4%|▍ | 523/12384 [1:06:42<25:06:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 4%|▍ | 524/12384 [1:06:42<25:04:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 4%|▍ | 524/12384 [1:06:50<25:04:38, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 1: 4%|▍ | 525/12384 [1:06:50<25:04:55, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 1: 4%|▍ | 525/12384 [1:06:57<25:04:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 4%|▍ | 526/12384 [1:06:57<25:21:57, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 4%|▍ | 526/12384 [1:07:05<25:21:57, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 4%|▍ | 527/12384 [1:07:05<25:15:42, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 4%|▍ | 527/12384 [1:07:13<25:15:42, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 4%|▍ | 528/12384 [1:07:13<25:11:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 4%|▍ | 528/12384 [1:07:20<25:11:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 1: 4%|▍ | 529/12384 [1:07:20<25:07:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 1: 4%|▍ | 529/12384 [1:07:28<25:07:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 1: 4%|▍ | 530/12384 [1:07:28<25:05:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 1: 4%|▍ | 530/12384 [1:07:36<25:05:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 4%|▍ | 531/12384 [1:07:36<25:27:01, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 4%|▍ | 531/12384 [1:07:43<25:27:01, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=4.86s]
Epoch 1: 4%|▍ | 532/12384 [1:07:43<25:18:09, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.86s]
Epoch 1: 4%|▍ | 532/12384 [1:07:51<25:18:09, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.68s]
Epoch 1: 4%|▍ | 533/12384 [1:07:51<25:15:26, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.68s]
Epoch 1: 4%|▍ | 533/12384 [1:07:59<25:15:26, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 1: 4%|▍ | 534/12384 [1:07:59<25:11:19, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 1: 4%|▍ | 534/12384 [1:08:06<25:11:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 4%|▍ | 535/12384 [1:08:06<25:07:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 4%|▍ | 535/12384 [1:08:14<25:07:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 4%|▍ | 536/12384 [1:08:14<25:06:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 4%|▍ | 536/12384 [1:08:21<25:06:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 4%|▍ | 537/12384 [1:08:21<25:05:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 4%|▍ | 537/12384 [1:08:29<25:05:01, 7.62s/it, loss=0.0003, acc=0.9983, iter_time=7.63s]
Epoch 1: 4%|▍ | 538/12384 [1:08:29<25:04:37, 7.62s/it, loss=0.0003, acc=0.9983, iter_time=7.63s]
Epoch 1: 4%|▍ | 538/12384 [1:08:37<25:04:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 4%|▍ | 539/12384 [1:08:37<25:02:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 4%|▍ | 539/12384 [1:08:44<25:02:18, 7.61s/it, loss=0.0002, acc=0.9999, iter_time=7.60s]
Epoch 1: 4%|▍ | 540/12384 [1:08:44<25:01:52, 7.61s/it, loss=0.0002, acc=0.9999, iter_time=7.60s]
Epoch 1: 4%|▍ | 540/12384 [1:08:52<25:01:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 4%|▍ | 541/12384 [1:08:52<25:00:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 4%|▍ | 541/12384 [1:08:59<25:00:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 4%|▍ | 542/12384 [1:08:59<25:01:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 4%|▍ | 542/12384 [1:09:07<25:01:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 4%|▍ | 543/12384 [1:09:07<25:02:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 4%|▍ | 543/12384 [1:09:15<25:02:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 4%|▍ | 544/12384 [1:09:15<25:01:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 4%|▍ | 544/12384 [1:09:22<25:01:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 4%|▍ | 545/12384 [1:09:22<25:00:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 4%|▍ | 545/12384 [1:09:30<25:00:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 4%|▍ | 546/12384 [1:09:30<25:00:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 4%|▍ | 546/12384 [1:09:37<25:00:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 4%|▍ | 547/12384 [1:09:37<24:59:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 4%|▍ | 547/12384 [1:09:45<24:59:26, 7.60s/it, loss=0.0004, acc=1.0000, iter_time=8.53s]
Epoch 1: 4%|▍ | 548/12384 [1:09:45<24:59:09, 7.60s/it, loss=0.0004, acc=1.0000, iter_time=8.53s]
Epoch 1: 4%|▍ | 548/12384 [1:09:53<24:59:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 4%|▍ | 549/12384 [1:09:53<24:59:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 4%|▍ | 549/12384 [1:10:00<24:59:56, 7.60s/it, loss=0.0001, acc=0.9995, iter_time=5.62s]
Epoch 1: 4%|▍ | 550/12384 [1:10:00<25:00:30, 7.61s/it, loss=0.0001, acc=0.9995, iter_time=5.62s]
Epoch 1: 4%|▍ | 550/12384 [1:10:08<25:00:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.31s]
Epoch 1: 4%|▍ | 551/12384 [1:10:08<25:01:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.31s]
Epoch 1: 4%|▍ | 551/12384 [1:10:16<25:01:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.29s]
Epoch 1: 4%|▍ | 552/12384 [1:10:16<25:01:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.29s]
Epoch 1: 4%|▍ | 552/12384 [1:10:23<25:01:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.40s]
Epoch 1: 4%|▍ | 553/12384 [1:10:23<25:00:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.40s]
Epoch 1: 4%|▍ | 553/12384 [1:10:31<25:00:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 1: 4%|▍ | 554/12384 [1:10:31<25:00:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 1: 4%|▍ | 554/12384 [1:10:38<25:00:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 4%|▍ | 555/12384 [1:10:38<24:59:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 4%|▍ | 555/12384 [1:10:46<24:59:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 1: 4%|▍ | 556/12384 [1:10:46<25:00:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 1: 4%|▍ | 556/12384 [1:10:54<25:00:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 4%|▍ | 557/12384 [1:10:54<25:20:36, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 4%|▍ | 557/12384 [1:11:02<25:20:36, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 5%|▍ | 558/12384 [1:11:02<25:14:23, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 5%|▍ | 558/12384 [1:11:09<25:14:23, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 5%|▍ | 559/12384 [1:11:09<25:13:09, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 5%|▍ | 559/12384 [1:11:17<25:13:09, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=8.09s]
Epoch 1: 5%|▍ | 560/12384 [1:11:17<25:14:02, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=8.09s]
Epoch 1: 5%|▍ | 560/12384 [1:11:25<25:14:02, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=3.81s]
Epoch 1: 5%|▍ | 561/12384 [1:11:25<25:10:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=3.81s]
Epoch 1: 5%|▍ | 561/12384 [1:11:32<25:10:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=11.03s]
Epoch 1: 5%|▍ | 562/12384 [1:11:32<25:06:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.03s]
Epoch 1: 5%|▍ | 562/12384 [1:11:40<25:06:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 5%|▍ | 563/12384 [1:11:40<25:04:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 5%|▍ | 563/12384 [1:11:47<25:04:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 5%|▍ | 564/12384 [1:11:47<25:03:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 5%|▍ | 564/12384 [1:11:55<25:03:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 5%|▍ | 565/12384 [1:11:55<25:01:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 5%|▍ | 565/12384 [1:12:03<25:01:11, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=7.99s]
Epoch 1: 5%|▍ | 566/12384 [1:12:03<24:59:48, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=7.99s]
Epoch 1: 5%|▍ | 566/12384 [1:12:10<24:59:48, 7.61s/it, loss=0.0003, acc=0.9983, iter_time=7.22s]
Epoch 1: 5%|▍ | 567/12384 [1:12:10<24:59:20, 7.61s/it, loss=0.0003, acc=0.9983, iter_time=7.22s]
Epoch 1: 5%|▍ | 567/12384 [1:12:18<24:59:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 5%|▍ | 568/12384 [1:12:18<24:59:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 5%|▍ | 568/12384 [1:12:25<24:59:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=2.96s]
Epoch 1: 5%|▍ | 569/12384 [1:12:25<24:57:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=2.96s]
Epoch 1: 5%|▍ | 569/12384 [1:12:33<24:57:21, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=12.28s]
Epoch 1: 5%|▍ | 570/12384 [1:12:33<24:58:11, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=12.28s]
Epoch 1: 5%|▍ | 570/12384 [1:12:41<24:58:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 5%|▍ | 571/12384 [1:12:41<24:57:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 5%|▍ | 571/12384 [1:12:48<24:57:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 5%|▍ | 572/12384 [1:12:48<24:58:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 5%|▍ | 572/12384 [1:12:56<24:58:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 1: 5%|▍ | 573/12384 [1:12:56<24:56:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 1: 5%|▍ | 573/12384 [1:13:03<24:56:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 1: 5%|▍ | 574/12384 [1:13:03<24:55:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 1: 5%|▍ | 574/12384 [1:13:11<24:55:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 5%|▍ | 575/12384 [1:13:11<24:57:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 5%|▍ | 575/12384 [1:13:19<24:57:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 5%|▍ | 576/12384 [1:13:19<24:57:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 5%|▍ | 576/12384 [1:13:26<24:57:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 5%|▍ | 577/12384 [1:13:26<24:56:12, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 5%|▍ | 577/12384 [1:13:34<24:56:12, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 5%|▍ | 578/12384 [1:13:34<24:59:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 5%|▍ | 578/12384 [1:13:42<24:59:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 5%|▍ | 579/12384 [1:13:42<25:15:39, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 5%|▍ | 579/12384 [1:13:49<25:15:39, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 5%|▍ | 580/12384 [1:13:49<25:10:04, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 5%|▍ | 580/12384 [1:13:57<25:10:04, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 5%|▍ | 581/12384 [1:13:57<25:05:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 5%|▍ | 581/12384 [1:14:05<25:05:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 5%|▍ | 582/12384 [1:14:05<25:07:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 5%|▍ | 582/12384 [1:14:12<25:07:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 1: 5%|▍ | 583/12384 [1:14:12<25:07:25, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 1: 5%|▍ | 583/12384 [1:14:20<25:07:25, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.89s]
Epoch 1: 5%|▍ | 584/12384 [1:14:20<25:23:24, 7.75s/it, loss=0.0002, acc=1.0000, iter_time=7.89s]
Epoch 1: 5%|▍ | 584/12384 [1:14:28<25:23:24, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=6.52s]
Epoch 1: 5%|▍ | 585/12384 [1:14:28<25:15:36, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.52s]
Epoch 1: 5%|▍ | 585/12384 [1:14:35<25:15:36, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.94s]
Epoch 1: 5%|▍ | 586/12384 [1:14:35<25:09:44, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.94s]
Epoch 1: 5%|▍ | 586/12384 [1:14:43<25:09:44, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 1: 5%|▍ | 587/12384 [1:14:43<25:05:45, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 1: 5%|▍ | 587/12384 [1:14:51<25:05:45, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 1: 5%|▍ | 588/12384 [1:14:51<25:01:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 1: 5%|▍ | 588/12384 [1:14:58<25:01:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 5%|▍ | 589/12384 [1:14:58<24:59:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 5%|▍ | 589/12384 [1:15:06<24:59:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 5%|▍ | 590/12384 [1:15:06<25:01:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 5%|▍ | 590/12384 [1:15:14<25:01:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 5%|▍ | 591/12384 [1:15:14<24:58:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 5%|▍ | 591/12384 [1:15:21<24:58:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 5%|▍ | 592/12384 [1:15:21<24:58:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 5%|▍ | 592/12384 [1:15:29<24:58:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 5%|▍ | 593/12384 [1:15:29<24:58:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 5%|▍ | 593/12384 [1:15:36<24:58:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 1: 5%|▍ | 594/12384 [1:15:36<24:58:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 1: 5%|▍ | 594/12384 [1:15:44<24:58:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.43s]
Epoch 1: 5%|▍ | 595/12384 [1:15:44<25:00:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.43s]
Epoch 1: 5%|▍ | 595/12384 [1:15:52<25:00:22, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.67s]
Epoch 1: 5%|▍ | 596/12384 [1:15:52<24:58:34, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.67s]
Epoch 1: 5%|▍ | 596/12384 [1:15:59<24:58:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 5%|▍ | 597/12384 [1:15:59<24:56:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 5%|▍ | 597/12384 [1:16:07<24:56:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 5%|▍ | 598/12384 [1:16:07<24:55:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 5%|▍ | 598/12384 [1:16:14<24:55:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 5%|▍ | 599/12384 [1:16:14<24:54:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 5%|▍ | 599/12384 [1:16:22<24:54:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 5%|▍ | 600/12384 [1:16:22<24:53:07, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 5%|▍ | 600/12384 [1:16:30<24:53:07, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 1: 5%|▍ | 601/12384 [1:16:30<24:54:24, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 1: 5%|▍ | 601/12384 [1:16:37<24:54:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 5%|▍ | 602/12384 [1:16:37<24:54:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 5%|▍ | 602/12384 [1:16:45<24:54:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 5%|▍ | 603/12384 [1:16:45<24:54:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 5%|▍ | 603/12384 [1:16:53<24:54:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 5%|▍ | 604/12384 [1:16:53<24:55:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 5%|▍ | 604/12384 [1:17:00<24:55:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 1: 5%|▍ | 605/12384 [1:17:00<24:55:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 1: 5%|▍ | 605/12384 [1:17:08<24:55:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 1: 5%|▍ | 606/12384 [1:17:08<24:54:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 1: 5%|▍ | 606/12384 [1:17:15<24:54:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.55s]
Epoch 1: 5%|▍ | 607/12384 [1:17:15<24:53:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.55s]
Epoch 1: 5%|▍ | 607/12384 [1:17:23<24:53:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 1: 5%|▍ | 608/12384 [1:17:23<24:53:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 1: 5%|▍ | 608/12384 [1:17:31<24:53:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 1: 5%|▍ | 609/12384 [1:17:31<24:54:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 1: 5%|▍ | 609/12384 [1:17:39<24:54:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 5%|▍ | 610/12384 [1:17:39<25:14:49, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 5%|▍ | 610/12384 [1:17:46<25:14:49, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 5%|▍ | 611/12384 [1:17:46<25:08:49, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 5%|▍ | 611/12384 [1:17:54<25:08:49, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 5%|▍ | 612/12384 [1:17:54<25:04:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 5%|▍ | 612/12384 [1:18:01<25:04:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 5%|▍ | 613/12384 [1:18:01<25:01:01, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 5%|▍ | 613/12384 [1:18:09<25:01:01, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 5%|▍ | 614/12384 [1:18:09<24:59:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 5%|▍ | 614/12384 [1:18:17<24:59:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 5%|▍ | 615/12384 [1:18:17<24:58:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 5%|▍ | 615/12384 [1:18:24<24:58:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 5%|▍ | 616/12384 [1:18:24<25:08:04, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 5%|▍ | 616/12384 [1:18:32<25:08:04, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 1: 5%|▍ | 617/12384 [1:18:32<25:02:45, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 1: 5%|▍ | 617/12384 [1:18:40<25:02:45, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 5%|▍ | 618/12384 [1:18:40<24:59:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 5%|▍ | 618/12384 [1:18:47<24:59:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 5%|▍ | 619/12384 [1:18:47<24:55:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 5%|▍ | 619/12384 [1:18:55<24:55:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 5%|▌ | 620/12384 [1:18:55<24:54:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 5%|▌ | 620/12384 [1:19:02<24:54:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 5%|▌ | 621/12384 [1:19:02<24:53:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 5%|▌ | 621/12384 [1:19:10<24:53:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 5%|▌ | 622/12384 [1:19:10<24:55:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 5%|▌ | 622/12384 [1:19:18<24:55:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 5%|▌ | 623/12384 [1:19:18<24:56:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 5%|▌ | 623/12384 [1:19:25<24:56:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 5%|▌ | 624/12384 [1:19:25<24:55:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 5%|▌ | 624/12384 [1:19:33<24:55:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.89s]
Epoch 1: 5%|▌ | 625/12384 [1:19:33<24:53:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.89s]
Epoch 1: 5%|▌ | 625/12384 [1:19:41<24:53:40, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.57s]
Epoch 1: 5%|▌ | 626/12384 [1:19:41<24:57:41, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.57s]
Epoch 1: 5%|▌ | 626/12384 [1:19:48<24:57:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 5%|▌ | 627/12384 [1:19:48<24:56:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 5%|▌ | 627/12384 [1:19:56<24:56:34, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=11.41s]
Epoch 1: 5%|▌ | 628/12384 [1:19:56<25:01:39, 7.66s/it, loss=0.0001, acc=0.9998, iter_time=11.41s]
Epoch 1: 5%|▌ | 628/12384 [1:20:04<25:01:39, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=3.81s]
Epoch 1: 5%|▌ | 629/12384 [1:20:04<24:59:49, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=3.81s]
Epoch 1: 5%|▌ | 629/12384 [1:20:11<24:59:49, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=8.46s]
Epoch 1: 5%|▌ | 630/12384 [1:20:11<24:56:21, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.46s]
Epoch 1: 5%|▌ | 630/12384 [1:20:19<24:56:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 1: 5%|▌ | 631/12384 [1:20:19<24:54:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 1: 5%|▌ | 631/12384 [1:20:27<24:54:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 1: 5%|▌ | 632/12384 [1:20:27<24:54:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 1: 5%|▌ | 632/12384 [1:20:34<24:54:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 5%|▌ | 633/12384 [1:20:34<24:53:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 5%|▌ | 633/12384 [1:20:42<24:53:28, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 5%|▌ | 634/12384 [1:20:42<24:51:59, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 5%|▌ | 634/12384 [1:20:49<24:51:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 1: 5%|▌ | 635/12384 [1:20:49<24:52:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 1: 5%|▌ | 635/12384 [1:20:57<24:52:45, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.91s]
Epoch 1: 5%|▌ | 636/12384 [1:20:57<24:56:29, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=10.91s]
Epoch 1: 5%|▌ | 636/12384 [1:21:05<24:56:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 1: 5%|▌ | 637/12384 [1:21:05<25:13:33, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 1: 5%|▌ | 637/12384 [1:21:13<25:13:33, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 1: 5%|▌ | 638/12384 [1:21:13<25:04:45, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 1: 5%|▌ | 638/12384 [1:21:20<25:04:45, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 5%|▌ | 639/12384 [1:21:20<25:00:36, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 5%|▌ | 639/12384 [1:21:28<25:00:36, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 5%|▌ | 640/12384 [1:21:28<24:57:57, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 5%|▌ | 640/12384 [1:21:35<24:57:57, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 1: 5%|▌ | 641/12384 [1:21:35<24:55:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 1: 5%|▌ | 641/12384 [1:21:43<24:55:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.36s]
Epoch 1: 5%|▌ | 642/12384 [1:21:43<24:54:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.36s]
Epoch 1: 5%|▌ | 642/12384 [1:21:51<24:54:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 5%|▌ | 643/12384 [1:21:51<24:53:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 5%|▌ | 643/12384 [1:21:58<24:53:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.11s]
Epoch 1: 5%|▌ | 644/12384 [1:21:58<24:51:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.11s]
Epoch 1: 5%|▌ | 644/12384 [1:22:06<24:51:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 1: 5%|▌ | 645/12384 [1:22:06<24:49:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 1: 5%|▌ | 645/12384 [1:22:13<24:49:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 1: 5%|▌ | 646/12384 [1:22:13<24:48:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 1: 5%|▌ | 646/12384 [1:22:21<24:48:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 5%|▌ | 647/12384 [1:22:21<24:47:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 5%|▌ | 647/12384 [1:22:29<24:47:54, 7.61s/it, loss=0.0001, acc=0.9991, iter_time=8.01s]
Epoch 1: 5%|▌ | 648/12384 [1:22:29<24:49:15, 7.61s/it, loss=0.0001, acc=0.9991, iter_time=8.01s]
Epoch 1: 5%|▌ | 648/12384 [1:22:36<24:49:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 5%|▌ | 649/12384 [1:22:36<24:49:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 5%|▌ | 649/12384 [1:22:44<24:49:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 5%|▌ | 650/12384 [1:22:44<24:48:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 5%|▌ | 650/12384 [1:22:52<24:48:53, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=7.60s]
Epoch 1: 5%|▌ | 651/12384 [1:22:52<24:48:07, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=7.60s]
Epoch 1: 5%|▌ | 651/12384 [1:22:59<24:48:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 1: 5%|▌ | 652/12384 [1:22:59<24:47:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 1: 5%|▌ | 652/12384 [1:23:07<24:47:53, 7.61s/it, loss=0.0002, acc=0.9998, iter_time=9.87s]
Epoch 1: 5%|▌ | 653/12384 [1:23:07<24:54:54, 7.65s/it, loss=0.0002, acc=0.9998, iter_time=9.87s]
Epoch 1: 5%|▌ | 653/12384 [1:23:14<24:54:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 1: 5%|▌ | 654/12384 [1:23:14<24:51:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 1: 5%|▌ | 654/12384 [1:23:22<24:51:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 5%|▌ | 655/12384 [1:23:22<24:50:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 5%|▌ | 655/12384 [1:23:30<24:50:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 5%|▌ | 656/12384 [1:23:30<24:50:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 5%|▌ | 656/12384 [1:23:37<24:50:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 5%|▌ | 657/12384 [1:23:37<24:50:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 5%|▌ | 657/12384 [1:23:45<24:50:07, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 1: 5%|▌ | 658/12384 [1:23:45<24:50:12, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 1: 5%|▌ | 658/12384 [1:23:53<24:50:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 5%|▌ | 659/12384 [1:23:53<24:47:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 5%|▌ | 659/12384 [1:24:00<24:47:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.00s]
Epoch 1: 5%|▌ | 660/12384 [1:24:00<24:46:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.00s]
Epoch 1: 5%|▌ | 660/12384 [1:24:08<24:46:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.25s]
Epoch 1: 5%|▌ | 661/12384 [1:24:08<24:51:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.25s]
Epoch 1: 5%|▌ | 661/12384 [1:24:15<24:51:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.63s]
Epoch 1: 5%|▌ | 662/12384 [1:24:15<24:50:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.63s]
Epoch 1: 5%|▌ | 662/12384 [1:24:23<24:50:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 1: 5%|▌ | 663/12384 [1:24:23<25:12:08, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 1: 5%|▌ | 663/12384 [1:24:31<25:12:08, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=9.54s]
Epoch 1: 5%|▌ | 664/12384 [1:24:31<25:04:24, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.54s]
Epoch 1: 5%|▌ | 664/12384 [1:24:39<25:04:24, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.19s]
Epoch 1: 5%|▌ | 665/12384 [1:24:39<25:02:19, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.19s]
Epoch 1: 5%|▌ | 665/12384 [1:24:46<25:02:19, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 1: 5%|▌ | 666/12384 [1:24:46<24:58:32, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 1: 5%|▌ | 666/12384 [1:24:54<24:58:32, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 5%|▌ | 667/12384 [1:24:54<24:54:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 5%|▌ | 667/12384 [1:25:02<24:54:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 5%|▌ | 668/12384 [1:25:02<24:50:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 5%|▌ | 668/12384 [1:25:09<24:50:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 5%|▌ | 669/12384 [1:25:09<24:48:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 5%|▌ | 669/12384 [1:25:17<24:48:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 5%|▌ | 670/12384 [1:25:17<24:47:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 5%|▌ | 670/12384 [1:25:24<24:47:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 5%|▌ | 671/12384 [1:25:24<24:46:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 5%|▌ | 671/12384 [1:25:32<24:46:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 5%|▌ | 672/12384 [1:25:32<24:46:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 5%|▌ | 672/12384 [1:25:40<24:46:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 5%|▌ | 673/12384 [1:25:40<24:48:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 5%|▌ | 673/12384 [1:25:47<24:48:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.35s]
Epoch 1: 5%|▌ | 674/12384 [1:25:47<24:47:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.35s]
Epoch 1: 5%|▌ | 674/12384 [1:25:55<24:47:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.77s]
Epoch 1: 5%|▌ | 675/12384 [1:25:55<24:47:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.77s]
Epoch 1: 5%|▌ | 675/12384 [1:26:02<24:47:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.78s]
Epoch 1: 5%|▌ | 676/12384 [1:26:02<24:46:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.78s]
Epoch 1: 5%|▌ | 676/12384 [1:26:10<24:46:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.54s]
Epoch 1: 5%|▌ | 677/12384 [1:26:10<24:45:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.54s]
Epoch 1: 5%|▌ | 677/12384 [1:26:18<24:45:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.70s]
Epoch 1: 5%|▌ | 678/12384 [1:26:18<24:47:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.70s]
Epoch 1: 5%|▌ | 678/12384 [1:26:25<24:47:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 5%|▌ | 679/12384 [1:26:25<24:51:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 5%|▌ | 679/12384 [1:26:33<24:51:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 5%|▌ | 680/12384 [1:26:33<24:48:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 5%|▌ | 680/12384 [1:26:41<24:48:46, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 1: 5%|▌ | 681/12384 [1:26:41<24:46:42, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 1: 5%|▌ | 681/12384 [1:26:49<24:46:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 6%|▌ | 682/12384 [1:26:49<25:03:06, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 6%|▌ | 682/12384 [1:26:56<25:03:06, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 6%|▌ | 683/12384 [1:26:56<24:59:09, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 6%|▌ | 683/12384 [1:27:04<24:59:09, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 6%|▌ | 684/12384 [1:27:04<24:58:27, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 6%|▌ | 684/12384 [1:27:11<24:58:27, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 6%|▌ | 685/12384 [1:27:11<24:54:23, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 6%|▌ | 685/12384 [1:27:19<24:54:23, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=4.81s]
Epoch 1: 6%|▌ | 686/12384 [1:27:19<24:51:54, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=4.81s]
Epoch 1: 6%|▌ | 686/12384 [1:27:27<24:51:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 1: 6%|▌ | 687/12384 [1:27:27<24:51:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 1: 6%|▌ | 687/12384 [1:27:34<24:51:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 6%|▌ | 688/12384 [1:27:34<24:48:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 6%|▌ | 688/12384 [1:27:42<24:48:37, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.69s]
Epoch 1: 6%|▌ | 689/12384 [1:27:42<25:06:38, 7.73s/it, loss=0.0001, acc=1.0000, iter_time=7.69s]
Epoch 1: 6%|▌ | 689/12384 [1:27:50<25:06:38, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 6%|▌ | 690/12384 [1:27:50<25:00:02, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 6%|▌ | 690/12384 [1:27:58<25:00:02, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 1: 6%|▌ | 691/12384 [1:27:58<24:54:23, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 1: 6%|▌ | 691/12384 [1:28:05<24:54:23, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 1: 6%|▌ | 692/12384 [1:28:05<24:51:25, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 1: 6%|▌ | 692/12384 [1:28:13<24:51:25, 7.65s/it, loss=0.0006, acc=0.9996, iter_time=7.58s]
Epoch 1: 6%|▌ | 693/12384 [1:28:13<24:48:40, 7.64s/it, loss=0.0006, acc=0.9996, iter_time=7.58s]
Epoch 1: 6%|▌ | 693/12384 [1:28:20<24:48:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.64s]
Epoch 1: 6%|▌ | 694/12384 [1:28:20<24:46:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.64s]
Epoch 1: 6%|▌ | 694/12384 [1:28:28<24:46:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.30s]
Epoch 1: 6%|▌ | 695/12384 [1:28:28<24:45:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.30s]
Epoch 1: 6%|▌ | 695/12384 [1:28:36<24:45:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 1: 6%|▌ | 696/12384 [1:28:36<24:44:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 1: 6%|▌ | 696/12384 [1:28:43<24:44:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 6%|▌ | 697/12384 [1:28:43<24:42:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 6%|▌ | 697/12384 [1:28:51<24:42:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 6%|▌ | 698/12384 [1:28:51<24:49:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 6%|▌ | 698/12384 [1:28:59<24:49:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 1: 6%|▌ | 699/12384 [1:28:59<24:50:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 1: 6%|▌ | 699/12384 [1:29:06<24:50:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 1: 6%|▌ | 700/12384 [1:29:06<24:48:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 1: 6%|▌ | 700/12384 [1:29:14<24:48:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.62s]
Epoch 1: 6%|▌ | 701/12384 [1:29:14<24:45:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.62s]
Epoch 1: 6%|▌ | 701/12384 [1:29:21<24:45:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 1: 6%|▌ | 702/12384 [1:29:21<24:43:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 1: 6%|▌ | 702/12384 [1:29:29<24:43:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 1: 6%|▌ | 703/12384 [1:29:29<24:44:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 1: 6%|▌ | 703/12384 [1:29:37<24:44:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 6%|▌ | 704/12384 [1:29:37<24:48:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 6%|▌ | 704/12384 [1:29:44<24:48:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 6%|▌ | 705/12384 [1:29:44<24:45:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 6%|▌ | 705/12384 [1:29:52<24:45:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.25s]
Epoch 1: 6%|▌ | 706/12384 [1:29:52<24:45:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.25s]
Epoch 1: 6%|▌ | 706/12384 [1:30:00<24:45:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 6%|▌ | 707/12384 [1:30:00<24:47:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 6%|▌ | 707/12384 [1:30:07<24:47:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 1: 6%|▌ | 708/12384 [1:30:07<24:44:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 1: 6%|▌ | 708/12384 [1:30:15<24:44:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.78s]
Epoch 1: 6%|▌ | 709/12384 [1:30:15<24:44:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.78s]
Epoch 1: 6%|▌ | 709/12384 [1:30:22<24:44:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 1: 6%|▌ | 710/12384 [1:30:22<24:42:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 1: 6%|▌ | 710/12384 [1:30:30<24:42:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 6%|▌ | 711/12384 [1:30:30<24:43:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 6%|▌ | 711/12384 [1:30:38<24:43:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 6%|▌ | 712/12384 [1:30:38<24:44:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 6%|▌ | 712/12384 [1:30:45<24:44:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 6%|▌ | 713/12384 [1:30:45<24:43:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 6%|▌ | 713/12384 [1:30:53<24:43:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 1: 6%|▌ | 714/12384 [1:30:53<24:42:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 1: 6%|▌ | 714/12384 [1:31:01<24:42:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 1: 6%|▌ | 715/12384 [1:31:01<25:01:57, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 1: 6%|▌ | 715/12384 [1:31:08<25:01:57, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.92s]
Epoch 1: 6%|▌ | 716/12384 [1:31:08<24:53:21, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.92s]
Epoch 1: 6%|▌ | 716/12384 [1:31:16<24:53:21, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 6%|▌ | 717/12384 [1:31:16<24:48:37, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 6%|▌ | 717/12384 [1:31:24<24:48:37, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 6%|▌ | 718/12384 [1:31:24<24:44:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 6%|▌ | 718/12384 [1:31:31<24:44:31, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 1: 6%|▌ | 719/12384 [1:31:31<24:43:39, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 1: 6%|▌ | 719/12384 [1:31:39<24:43:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 6%|▌ | 720/12384 [1:31:39<24:40:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 6%|▌ | 720/12384 [1:31:46<24:40:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.44s]
Epoch 1: 6%|▌ | 721/12384 [1:31:46<24:39:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.44s]
Epoch 1: 6%|▌ | 721/12384 [1:31:54<24:39:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 6%|▌ | 722/12384 [1:31:54<24:37:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 6%|▌ | 722/12384 [1:32:02<24:37:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 1: 6%|▌ | 723/12384 [1:32:02<24:37:39, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 1: 6%|▌ | 723/12384 [1:32:09<24:37:39, 7.60s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 1: 6%|▌ | 724/12384 [1:32:09<24:43:09, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 1: 6%|▌ | 724/12384 [1:32:17<24:43:09, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.71s]
Epoch 1: 6%|▌ | 725/12384 [1:32:17<24:41:20, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.71s]
Epoch 1: 6%|▌ | 725/12384 [1:32:25<24:41:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 6%|▌ | 726/12384 [1:32:25<24:40:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 6%|▌ | 726/12384 [1:32:32<24:40:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 6%|▌ | 727/12384 [1:32:32<24:39:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 6%|▌ | 727/12384 [1:32:40<24:39:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 6%|▌ | 728/12384 [1:32:40<24:38:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 6%|▌ | 728/12384 [1:32:47<24:38:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 6%|▌ | 729/12384 [1:32:47<24:38:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 6%|▌ | 729/12384 [1:32:55<24:38:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 6%|▌ | 730/12384 [1:32:55<24:37:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 6%|▌ | 730/12384 [1:33:03<24:37:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 6%|▌ | 731/12384 [1:33:03<24:37:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 6%|▌ | 731/12384 [1:33:10<24:37:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 6%|▌ | 732/12384 [1:33:10<24:37:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 6%|▌ | 732/12384 [1:33:18<24:37:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 1: 6%|▌ | 733/12384 [1:33:18<24:37:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 1: 6%|▌ | 733/12384 [1:33:26<24:37:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 1: 6%|▌ | 734/12384 [1:33:26<24:54:47, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 1: 6%|▌ | 734/12384 [1:33:33<24:54:47, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 6%|▌ | 735/12384 [1:33:33<24:49:35, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 6%|▌ | 735/12384 [1:33:41<24:49:35, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=8.00s]
Epoch 1: 6%|▌ | 736/12384 [1:33:41<24:44:44, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.00s]
Epoch 1: 6%|▌ | 736/12384 [1:33:49<24:44:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 6%|▌ | 737/12384 [1:33:49<24:41:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 6%|▌ | 737/12384 [1:33:56<24:41:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 1: 6%|▌ | 738/12384 [1:33:56<24:40:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 1: 6%|▌ | 738/12384 [1:34:04<24:40:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 1: 6%|▌ | 739/12384 [1:34:04<24:37:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 1: 6%|▌ | 739/12384 [1:34:11<24:37:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 6%|▌ | 740/12384 [1:34:11<24:39:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 6%|▌ | 740/12384 [1:34:19<24:39:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 1: 6%|▌ | 741/12384 [1:34:19<24:59:11, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 1: 6%|▌ | 741/12384 [1:34:27<24:59:11, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 1: 6%|▌ | 742/12384 [1:34:27<24:51:36, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 1: 6%|▌ | 742/12384 [1:34:35<24:51:36, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 1: 6%|▌ | 743/12384 [1:34:35<24:45:51, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 1: 6%|▌ | 743/12384 [1:34:42<24:45:51, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 1: 6%|▌ | 744/12384 [1:34:42<24:44:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 1: 6%|▌ | 744/12384 [1:34:50<24:44:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 6%|▌ | 745/12384 [1:34:50<24:41:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 6%|▌ | 745/12384 [1:34:57<24:41:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 6%|▌ | 746/12384 [1:34:57<24:43:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 6%|▌ | 746/12384 [1:35:05<24:43:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 6%|▌ | 747/12384 [1:35:05<24:41:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 6%|▌ | 747/12384 [1:35:13<24:41:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 6%|▌ | 748/12384 [1:35:13<24:40:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 6%|▌ | 748/12384 [1:35:20<24:40:01, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.32s]
Epoch 1: 6%|▌ | 749/12384 [1:35:20<24:37:46, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.32s]
Epoch 1: 6%|▌ | 749/12384 [1:35:28<24:37:46, 7.62s/it, loss=0.0003, acc=0.9972, iter_time=7.83s]
Epoch 1: 6%|▌ | 750/12384 [1:35:28<24:36:20, 7.61s/it, loss=0.0003, acc=0.9972, iter_time=7.83s]
Epoch 1: 6%|▌ | 750/12384 [1:35:35<24:36:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 6%|▌ | 751/12384 [1:35:35<24:34:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 6%|▌ | 751/12384 [1:35:43<24:34:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 6%|▌ | 752/12384 [1:35:43<24:35:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 6%|▌ | 752/12384 [1:35:51<24:35:15, 7.61s/it, loss=0.0006, acc=0.9997, iter_time=7.20s]
Epoch 1: 6%|▌ | 753/12384 [1:35:51<24:34:22, 7.61s/it, loss=0.0006, acc=0.9997, iter_time=7.20s]
Epoch 1: 6%|▌ | 753/12384 [1:35:58<24:34:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 6%|▌ | 754/12384 [1:35:58<24:34:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 6%|▌ | 754/12384 [1:36:06<24:34:31, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 1: 6%|▌ | 755/12384 [1:36:06<24:33:44, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 1: 6%|▌ | 755/12384 [1:36:13<24:33:44, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 1: 6%|▌ | 756/12384 [1:36:13<24:34:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 1: 6%|▌ | 756/12384 [1:36:21<24:34:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 1: 6%|▌ | 757/12384 [1:36:21<24:34:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 1: 6%|▌ | 757/12384 [1:36:29<24:34:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 6%|▌ | 758/12384 [1:36:29<24:34:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 6%|▌ | 758/12384 [1:36:36<24:34:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 6%|▌ | 759/12384 [1:36:36<24:34:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 6%|▌ | 759/12384 [1:36:44<24:34:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 6%|▌ | 760/12384 [1:36:44<24:33:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 6%|▌ | 760/12384 [1:36:52<24:33:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.53s]
Epoch 1: 6%|▌ | 761/12384 [1:36:52<24:38:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.53s]
Epoch 1: 6%|▌ | 761/12384 [1:36:59<24:38:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 1: 6%|▌ | 762/12384 [1:36:59<24:38:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 1: 6%|▌ | 762/12384 [1:37:07<24:38:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.61s]
Epoch 1: 6%|▌ | 763/12384 [1:37:07<24:34:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.61s]
Epoch 1: 6%|▌ | 763/12384 [1:37:14<24:34:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 6%|▌ | 764/12384 [1:37:14<24:34:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 6%|▌ | 764/12384 [1:37:22<24:34:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 6%|▌ | 765/12384 [1:37:22<24:35:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 6%|▌ | 765/12384 [1:37:30<24:35:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 1: 6%|▌ | 766/12384 [1:37:30<24:35:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 1: 6%|▌ | 766/12384 [1:37:37<24:35:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 1: 6%|▌ | 767/12384 [1:37:37<24:35:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 1: 6%|▌ | 767/12384 [1:37:45<24:35:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.50s]
Epoch 1: 6%|▌ | 768/12384 [1:37:45<24:52:54, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.50s]
Epoch 1: 6%|▌ | 768/12384 [1:37:53<24:52:54, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.59s]
Epoch 1: 6%|▌ | 769/12384 [1:37:53<24:47:16, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.59s]
Epoch 1: 6%|▌ | 769/12384 [1:38:00<24:47:16, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=9.69s]
Epoch 1: 6%|▌ | 770/12384 [1:38:00<24:43:44, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=9.69s]
Epoch 1: 6%|▌ | 770/12384 [1:38:08<24:43:44, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 6%|▌ | 771/12384 [1:38:08<24:41:37, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 6%|▌ | 771/12384 [1:38:16<24:41:37, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 6%|▌ | 772/12384 [1:38:16<24:39:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 6%|▌ | 772/12384 [1:38:23<24:39:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 6%|▌ | 773/12384 [1:38:23<24:43:53, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 6%|▌ | 773/12384 [1:38:31<24:43:53, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.13s]
Epoch 1: 6%|▋ | 774/12384 [1:38:31<24:41:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.13s]
Epoch 1: 6%|▋ | 774/12384 [1:38:39<24:41:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 6%|▋ | 775/12384 [1:38:39<24:37:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 6%|▋ | 775/12384 [1:38:46<24:37:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.94s]
Epoch 1: 6%|▋ | 776/12384 [1:38:46<24:36:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.94s]
Epoch 1: 6%|▋ | 776/12384 [1:38:54<24:36:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 6%|▋ | 777/12384 [1:38:54<24:35:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 6%|▋ | 777/12384 [1:39:01<24:35:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 1: 6%|▋ | 778/12384 [1:39:01<24:32:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 1: 6%|▋ | 778/12384 [1:39:09<24:32:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.39s]
Epoch 1: 6%|▋ | 779/12384 [1:39:09<24:31:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.39s]
Epoch 1: 6%|▋ | 779/12384 [1:39:17<24:31:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 1: 6%|▋ | 780/12384 [1:39:17<24:30:27, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 1: 6%|▋ | 780/12384 [1:39:24<24:30:27, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 1: 6%|▋ | 781/12384 [1:39:24<24:29:59, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 1: 6%|▋ | 781/12384 [1:39:32<24:29:59, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.72s]
Epoch 1: 6%|▋ | 782/12384 [1:39:32<24:31:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.72s]
Epoch 1: 6%|▋ | 782/12384 [1:39:39<24:31:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 6%|▋ | 783/12384 [1:39:39<24:30:12, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 6%|▋ | 783/12384 [1:39:47<24:30:12, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 6%|▋ | 784/12384 [1:39:47<24:31:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 6%|▋ | 784/12384 [1:39:55<24:31:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 6%|▋ | 785/12384 [1:39:55<24:31:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 6%|▋ | 785/12384 [1:40:02<24:31:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 6%|▋ | 786/12384 [1:40:02<24:30:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 6%|▋ | 786/12384 [1:40:10<24:30:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 6%|▋ | 787/12384 [1:40:10<24:47:25, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 6%|▋ | 787/12384 [1:40:18<24:47:25, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 1: 6%|▋ | 788/12384 [1:40:18<24:42:14, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 1: 6%|▋ | 788/12384 [1:40:25<24:42:14, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=11.14s]
Epoch 1: 6%|▋ | 789/12384 [1:40:25<24:37:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.14s]
Epoch 1: 6%|▋ | 789/12384 [1:40:33<24:37:45, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 1: 6%|▋ | 790/12384 [1:40:33<24:35:35, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 1: 6%|▋ | 790/12384 [1:40:41<24:35:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 6%|▋ | 791/12384 [1:40:41<24:33:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 6%|▋ | 791/12384 [1:40:48<24:33:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 6%|▋ | 792/12384 [1:40:48<24:32:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 6%|▋ | 792/12384 [1:40:56<24:32:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 6%|▋ | 793/12384 [1:40:56<24:32:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 6%|▋ | 793/12384 [1:41:04<24:32:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 1: 6%|▋ | 794/12384 [1:41:04<24:50:32, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 1: 6%|▋ | 794/12384 [1:41:11<24:50:32, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 6%|▋ | 795/12384 [1:41:11<24:44:07, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 6%|▋ | 795/12384 [1:41:19<24:44:07, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 6%|▋ | 796/12384 [1:41:19<24:40:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 6%|▋ | 796/12384 [1:41:27<24:40:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 6%|▋ | 797/12384 [1:41:27<24:37:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 6%|▋ | 797/12384 [1:41:34<24:37:00, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=6.16s]
Epoch 1: 6%|▋ | 798/12384 [1:41:34<24:35:16, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.16s]
Epoch 1: 6%|▋ | 798/12384 [1:41:42<24:35:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.77s]
Epoch 1: 6%|▋ | 799/12384 [1:41:42<24:32:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.77s]
Epoch 1: 6%|▋ | 799/12384 [1:41:49<24:32:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.85s]
Epoch 1: 6%|▋ | 800/12384 [1:41:49<24:31:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.85s]
Epoch 1: 6%|▋ | 800/12384 [1:41:57<24:31:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.62s]
Epoch 1: 6%|▋ | 801/12384 [1:41:57<24:32:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.62s]
Epoch 1: 6%|▋ | 801/12384 [1:42:05<24:32:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.67s]
Epoch 1: 6%|▋ | 802/12384 [1:42:05<24:31:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.67s]
Epoch 1: 6%|▋ | 802/12384 [1:42:12<24:31:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 1: 6%|▋ | 803/12384 [1:42:12<24:29:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 1: 6%|▋ | 803/12384 [1:42:20<24:29:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.04s]
Epoch 1: 6%|▋ | 804/12384 [1:42:20<24:28:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.04s]
Epoch 1: 6%|▋ | 804/12384 [1:42:28<24:28:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 1: 7%|▋ | 805/12384 [1:42:28<24:28:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 1: 7%|▋ | 805/12384 [1:42:35<24:28:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 1: 7%|▋ | 806/12384 [1:42:35<24:28:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 1: 7%|▋ | 806/12384 [1:42:43<24:28:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 1: 7%|▋ | 807/12384 [1:42:43<24:28:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 1: 7%|▋ | 807/12384 [1:42:50<24:28:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.20s]
Epoch 1: 7%|▋ | 808/12384 [1:42:50<24:28:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.20s]
Epoch 1: 7%|▋ | 808/12384 [1:42:58<24:28:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 1: 7%|▋ | 809/12384 [1:42:58<24:33:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 1: 7%|▋ | 809/12384 [1:43:06<24:33:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.34s]
Epoch 1: 7%|▋ | 810/12384 [1:43:06<24:33:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.34s]
Epoch 1: 7%|▋ | 810/12384 [1:43:13<24:33:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.80s]
Epoch 1: 7%|▋ | 811/12384 [1:43:13<24:32:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.80s]
Epoch 1: 7%|▋ | 811/12384 [1:43:21<24:32:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 1: 7%|▋ | 812/12384 [1:43:21<24:30:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 1: 7%|▋ | 812/12384 [1:43:28<24:30:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 1: 7%|▋ | 813/12384 [1:43:28<24:28:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 1: 7%|▋ | 813/12384 [1:43:36<24:28:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 1: 7%|▋ | 814/12384 [1:43:36<24:30:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 1: 7%|▋ | 814/12384 [1:43:44<24:30:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 1: 7%|▋ | 815/12384 [1:43:44<24:28:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 1: 7%|▋ | 815/12384 [1:43:51<24:28:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.32s]
Epoch 1: 7%|▋ | 816/12384 [1:43:51<24:28:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.32s]
Epoch 1: 7%|▋ | 816/12384 [1:43:59<24:28:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.91s]
Epoch 1: 7%|▋ | 817/12384 [1:43:59<24:27:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.91s]
Epoch 1: 7%|▋ | 817/12384 [1:44:07<24:27:06, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=10.91s]
Epoch 1: 7%|▋ | 818/12384 [1:44:07<24:27:19, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=10.91s]
Epoch 1: 7%|▋ | 818/12384 [1:44:14<24:27:19, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 1: 7%|▋ | 819/12384 [1:44:14<24:32:23, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 1: 7%|▋ | 819/12384 [1:44:22<24:32:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 7%|▋ | 820/12384 [1:44:22<24:34:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 7%|▋ | 820/12384 [1:44:30<24:34:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.18s]
Epoch 1: 7%|▋ | 821/12384 [1:44:30<24:51:53, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.18s]
Epoch 1: 7%|▋ | 821/12384 [1:44:38<24:51:53, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=6.94s]
Epoch 1: 7%|▋ | 822/12384 [1:44:38<24:43:28, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.94s]
Epoch 1: 7%|▋ | 822/12384 [1:44:45<24:43:28, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 1: 7%|▋ | 823/12384 [1:44:45<24:38:22, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 1: 7%|▋ | 823/12384 [1:44:53<24:38:22, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.12s]
Epoch 1: 7%|▋ | 824/12384 [1:44:53<24:34:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.12s]
Epoch 1: 7%|▋ | 824/12384 [1:45:00<24:34:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 7%|▋ | 825/12384 [1:45:00<24:31:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 7%|▋ | 825/12384 [1:45:08<24:31:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 7%|▋ | 826/12384 [1:45:08<24:29:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 7%|▋ | 826/12384 [1:45:16<24:29:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 7%|▋ | 827/12384 [1:45:16<24:28:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 7%|▋ | 827/12384 [1:45:23<24:28:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 1: 7%|▋ | 828/12384 [1:45:23<24:27:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 1: 7%|▋ | 828/12384 [1:45:31<24:27:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 7%|▋ | 829/12384 [1:45:31<24:28:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 7%|▋ | 829/12384 [1:45:38<24:28:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 1: 7%|▋ | 830/12384 [1:45:38<24:27:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 1: 7%|▋ | 830/12384 [1:45:46<24:27:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 1: 7%|▋ | 831/12384 [1:45:46<24:25:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 1: 7%|▋ | 831/12384 [1:45:54<24:25:58, 7.61s/it, loss=0.0064, acc=0.9975, iter_time=7.99s]
Epoch 1: 7%|▋ | 832/12384 [1:45:54<24:25:16, 7.61s/it, loss=0.0064, acc=0.9975, iter_time=7.99s]
Epoch 1: 7%|▋ | 832/12384 [1:46:01<24:25:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.89s]
Epoch 1: 7%|▋ | 833/12384 [1:46:01<24:25:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.89s]
Epoch 1: 7%|▋ | 833/12384 [1:46:09<24:25:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.17s]
Epoch 1: 7%|▋ | 834/12384 [1:46:09<24:23:32, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.17s]
Epoch 1: 7%|▋ | 834/12384 [1:46:16<24:23:32, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=10.35s]
Epoch 1: 7%|▋ | 835/12384 [1:46:16<24:23:47, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=10.35s]
Epoch 1: 7%|▋ | 835/12384 [1:46:24<24:23:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 7%|▋ | 836/12384 [1:46:24<24:29:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 7%|▋ | 836/12384 [1:46:32<24:29:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 1: 7%|▋ | 837/12384 [1:46:32<24:27:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 1: 7%|▋ | 837/12384 [1:46:39<24:27:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 7%|▋ | 838/12384 [1:46:39<24:30:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 7%|▋ | 838/12384 [1:46:47<24:30:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 7%|▋ | 839/12384 [1:46:47<24:28:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 7%|▋ | 839/12384 [1:46:55<24:28:36, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.68s]
Epoch 1: 7%|▋ | 840/12384 [1:46:55<24:27:35, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.68s]
Epoch 1: 7%|▋ | 840/12384 [1:47:02<24:27:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.33s]
Epoch 1: 7%|▋ | 841/12384 [1:47:02<24:26:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.33s]
Epoch 1: 7%|▋ | 841/12384 [1:47:10<24:26:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 1: 7%|▋ | 842/12384 [1:47:10<24:26:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 1: 7%|▋ | 842/12384 [1:47:18<24:26:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.86s]
Epoch 1: 7%|▋ | 843/12384 [1:47:18<24:28:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.86s]
Epoch 1: 7%|▋ | 843/12384 [1:47:25<24:28:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.71s]
Epoch 1: 7%|▋ | 844/12384 [1:47:25<24:27:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.71s]
Epoch 1: 7%|▋ | 844/12384 [1:47:33<24:27:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.33s]
Epoch 1: 7%|▋ | 845/12384 [1:47:33<24:26:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.33s]
Epoch 1: 7%|▋ | 845/12384 [1:47:40<24:26:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.94s]
Epoch 1: 7%|▋ | 846/12384 [1:47:40<24:32:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.94s]
Epoch 1: 7%|▋ | 846/12384 [1:47:48<24:32:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.76s]
Epoch 1: 7%|▋ | 847/12384 [1:47:48<24:50:43, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.76s]
Epoch 1: 7%|▋ | 847/12384 [1:47:56<24:50:43, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=8.35s]
Epoch 1: 7%|▋ | 848/12384 [1:47:56<24:45:53, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.35s]
Epoch 1: 7%|▋ | 848/12384 [1:48:04<24:45:53, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 7%|▋ | 849/12384 [1:48:04<24:38:12, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 7%|▋ | 849/12384 [1:48:11<24:38:12, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 7%|▋ | 850/12384 [1:48:11<24:33:25, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 7%|▋ | 850/12384 [1:48:19<24:33:25, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 7%|▋ | 851/12384 [1:48:19<24:29:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 7%|▋ | 851/12384 [1:48:27<24:29:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 7%|▋ | 852/12384 [1:48:27<24:26:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 7%|▋ | 852/12384 [1:48:34<24:26:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 1: 7%|▋ | 853/12384 [1:48:34<24:26:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 1: 7%|▋ | 853/12384 [1:48:42<24:26:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.43s]
Epoch 1: 7%|▋ | 854/12384 [1:48:42<24:25:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.43s]
Epoch 1: 7%|▋ | 854/12384 [1:48:49<24:25:42, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 7%|▋ | 855/12384 [1:48:49<24:24:55, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 7%|▋ | 855/12384 [1:48:57<24:24:55, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.55s]
Epoch 1: 7%|▋ | 856/12384 [1:48:57<24:22:59, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.55s]
Epoch 1: 7%|▋ | 856/12384 [1:49:05<24:22:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.52s]
Epoch 1: 7%|▋ | 857/12384 [1:49:05<24:22:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.52s]
Epoch 1: 7%|▋ | 857/12384 [1:49:12<24:22:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 1: 7%|▋ | 858/12384 [1:49:12<24:22:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 1: 7%|▋ | 858/12384 [1:49:20<24:22:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 7%|▋ | 859/12384 [1:49:20<24:22:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 7%|▋ | 859/12384 [1:49:27<24:22:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 7%|▋ | 860/12384 [1:49:27<24:21:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 7%|▋ | 860/12384 [1:49:35<24:21:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 7%|▋ | 861/12384 [1:49:35<24:24:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 7%|▋ | 861/12384 [1:49:43<24:24:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 7%|▋ | 862/12384 [1:49:43<24:23:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 7%|▋ | 862/12384 [1:49:50<24:23:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 7%|▋ | 863/12384 [1:49:50<24:22:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 7%|▋ | 863/12384 [1:49:58<24:22:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 7%|▋ | 864/12384 [1:49:58<24:21:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 7%|▋ | 864/12384 [1:50:06<24:21:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 1: 7%|▋ | 865/12384 [1:50:06<24:37:42, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 1: 7%|▋ | 865/12384 [1:50:13<24:37:42, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 7%|▋ | 866/12384 [1:50:13<24:32:35, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 7%|▋ | 866/12384 [1:50:21<24:32:35, 7.67s/it, loss=0.0007, acc=0.9981, iter_time=7.21s]
Epoch 1: 7%|▋ | 867/12384 [1:50:21<24:28:37, 7.65s/it, loss=0.0007, acc=0.9981, iter_time=7.21s]
Epoch 1: 7%|▋ | 867/12384 [1:50:29<24:28:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.53s]
Epoch 1: 7%|▋ | 868/12384 [1:50:29<24:31:50, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.53s]
Epoch 1: 7%|▋ | 868/12384 [1:50:36<24:31:50, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.83s]
Epoch 1: 7%|▋ | 869/12384 [1:50:36<24:31:05, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.83s]
Epoch 1: 7%|▋ | 869/12384 [1:50:44<24:31:05, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 7%|▋ | 870/12384 [1:50:44<24:26:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 7%|▋ | 870/12384 [1:50:52<24:26:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.25s]
Epoch 1: 7%|▋ | 871/12384 [1:50:52<24:27:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.25s]
Epoch 1: 7%|▋ | 871/12384 [1:50:59<24:27:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.38s]
Epoch 1: 7%|▋ | 872/12384 [1:50:59<24:24:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.38s]
Epoch 1: 7%|▋ | 872/12384 [1:51:07<24:24:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 7%|▋ | 873/12384 [1:51:07<24:39:25, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 7%|▋ | 873/12384 [1:51:15<24:39:25, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.55s]
Epoch 1: 7%|▋ | 874/12384 [1:51:15<24:34:04, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.55s]
Epoch 1: 7%|▋ | 874/12384 [1:51:22<24:34:04, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 7%|▋ | 875/12384 [1:51:22<24:34:33, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 7%|▋ | 875/12384 [1:51:30<24:34:33, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 7%|▋ | 876/12384 [1:51:30<24:29:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 7%|▋ | 876/12384 [1:51:38<24:29:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 7%|▋ | 877/12384 [1:51:38<24:25:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 7%|▋ | 877/12384 [1:51:45<24:25:57, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 1: 7%|▋ | 878/12384 [1:51:45<24:25:12, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 1: 7%|▋ | 878/12384 [1:51:53<24:25:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 7%|▋ | 879/12384 [1:51:53<24:22:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 7%|▋ | 879/12384 [1:52:01<24:22:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.43s]
Epoch 1: 7%|▋ | 880/12384 [1:52:01<24:27:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.43s]
Epoch 1: 7%|▋ | 880/12384 [1:52:08<24:27:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 7%|▋ | 881/12384 [1:52:08<24:24:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 7%|▋ | 881/12384 [1:52:16<24:24:17, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.59s]
Epoch 1: 7%|▋ | 882/12384 [1:52:16<24:22:31, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.59s]
Epoch 1: 7%|▋ | 882/12384 [1:52:23<24:22:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.56s]
Epoch 1: 7%|▋ | 883/12384 [1:52:23<24:20:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.56s]
Epoch 1: 7%|▋ | 883/12384 [1:52:31<24:20:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 7%|▋ | 884/12384 [1:52:31<24:20:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 7%|▋ | 884/12384 [1:52:39<24:20:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 1: 7%|▋ | 885/12384 [1:52:39<24:25:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 1: 7%|▋ | 885/12384 [1:52:46<24:25:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.64s]
Epoch 1: 7%|▋ | 886/12384 [1:52:46<24:27:43, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.64s]
Epoch 1: 7%|▋ | 886/12384 [1:52:54<24:27:43, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.66s]
Epoch 1: 7%|▋ | 887/12384 [1:52:54<24:26:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.66s]
Epoch 1: 7%|▋ | 887/12384 [1:53:02<24:26:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.61s]
Epoch 1: 7%|▋ | 888/12384 [1:53:02<24:23:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.61s]
Epoch 1: 7%|▋ | 888/12384 [1:53:09<24:23:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 7%|▋ | 889/12384 [1:53:09<24:22:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 7%|▋ | 889/12384 [1:53:17<24:22:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 7%|▋ | 890/12384 [1:53:17<24:21:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 7%|▋ | 890/12384 [1:53:25<24:21:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 7%|▋ | 891/12384 [1:53:25<24:38:01, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 7%|▋ | 891/12384 [1:53:32<24:38:01, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 7%|▋ | 892/12384 [1:53:32<24:31:02, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 7%|▋ | 892/12384 [1:53:40<24:31:02, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 7%|▋ | 893/12384 [1:53:40<24:25:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 7%|▋ | 893/12384 [1:53:48<24:25:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 7%|▋ | 894/12384 [1:53:48<24:23:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 7%|▋ | 894/12384 [1:53:55<24:23:21, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=4.49s]
Epoch 1: 7%|▋ | 895/12384 [1:53:55<24:22:39, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=4.49s]
Epoch 1: 7%|▋ | 895/12384 [1:54:03<24:22:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 1: 7%|▋ | 896/12384 [1:54:03<24:20:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 1: 7%|▋ | 896/12384 [1:54:11<24:20:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 7%|▋ | 897/12384 [1:54:11<24:22:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 7%|▋ | 897/12384 [1:54:18<24:22:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 7%|▋ | 898/12384 [1:54:18<24:20:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 7%|▋ | 898/12384 [1:54:26<24:20:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 1: 7%|▋ | 899/12384 [1:54:26<24:46:17, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 1: 7%|▋ | 899/12384 [1:54:34<24:46:17, 7.76s/it, loss=0.0001, acc=0.9999, iter_time=7.95s]
Epoch 1: 7%|▋ | 900/12384 [1:54:34<24:37:05, 7.72s/it, loss=0.0001, acc=0.9999, iter_time=7.95s]
Epoch 1: 7%|▋ | 900/12384 [1:54:41<24:37:05, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 7%|▋ | 901/12384 [1:54:41<24:29:54, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 7%|▋ | 901/12384 [1:54:49<24:29:54, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.55s]
Epoch 1: 7%|▋ | 902/12384 [1:54:49<24:27:24, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.55s]
Epoch 1: 7%|▋ | 902/12384 [1:54:57<24:27:24, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 1: 7%|▋ | 903/12384 [1:54:57<24:23:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 1: 7%|▋ | 903/12384 [1:55:04<24:23:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 7%|▋ | 904/12384 [1:55:04<24:21:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 7%|▋ | 904/12384 [1:55:12<24:21:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.94s]
Epoch 1: 7%|▋ | 905/12384 [1:55:12<24:20:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.94s]
Epoch 1: 7%|▋ | 905/12384 [1:55:20<24:20:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 1: 7%|▋ | 906/12384 [1:55:20<24:21:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 1: 7%|▋ | 906/12384 [1:55:27<24:21:58, 7.64s/it, loss=0.0002, acc=0.9998, iter_time=5.35s]
Epoch 1: 7%|▋ | 907/12384 [1:55:27<24:20:06, 7.63s/it, loss=0.0002, acc=0.9998, iter_time=5.35s]
Epoch 1: 7%|▋ | 907/12384 [1:55:35<24:20:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 1: 7%|▋ | 908/12384 [1:55:35<24:19:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 1: 7%|▋ | 908/12384 [1:55:42<24:19:15, 7.63s/it, loss=0.0010, acc=0.9957, iter_time=7.61s]
Epoch 1: 7%|▋ | 909/12384 [1:55:42<24:17:25, 7.62s/it, loss=0.0010, acc=0.9957, iter_time=7.61s]
Epoch 1: 7%|▋ | 909/12384 [1:55:50<24:17:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.99s]
Epoch 1: 7%|▋ | 910/12384 [1:55:50<24:17:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.99s]
Epoch 1: 7%|▋ | 910/12384 [1:55:58<24:17:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.10s]
Epoch 1: 7%|▋ | 911/12384 [1:55:58<24:17:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.10s]
Epoch 1: 7%|▋ | 911/12384 [1:56:05<24:17:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.72s]
Epoch 1: 7%|▋ | 912/12384 [1:56:05<24:17:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.72s]
Epoch 1: 7%|▋ | 912/12384 [1:56:13<24:17:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 7%|▋ | 913/12384 [1:56:13<24:15:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 7%|▋ | 913/12384 [1:56:20<24:15:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 1: 7%|▋ | 914/12384 [1:56:20<24:16:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 1: 7%|▋ | 914/12384 [1:56:28<24:16:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.66s]
Epoch 1: 7%|▋ | 915/12384 [1:56:28<24:15:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.66s]
Epoch 1: 7%|▋ | 915/12384 [1:56:36<24:15:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 7%|▋ | 916/12384 [1:56:36<24:15:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 7%|▋ | 916/12384 [1:56:43<24:15:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 1: 7%|▋ | 917/12384 [1:56:43<24:15:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 1: 7%|▋ | 917/12384 [1:56:51<24:15:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.26s]
Epoch 1: 7%|▋ | 918/12384 [1:56:51<24:15:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.26s]
Epoch 1: 7%|▋ | 918/12384 [1:56:59<24:15:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 1: 7%|▋ | 919/12384 [1:56:59<24:14:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 1: 7%|▋ | 919/12384 [1:57:06<24:14:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 7%|▋ | 920/12384 [1:57:06<24:15:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 7%|▋ | 920/12384 [1:57:14<24:15:14, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.21s]
Epoch 1: 7%|▋ | 921/12384 [1:57:14<24:14:00, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.21s]
Epoch 1: 7%|▋ | 921/12384 [1:57:21<24:14:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 7%|▋ | 922/12384 [1:57:21<24:12:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 7%|▋ | 922/12384 [1:57:29<24:12:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 7%|▋ | 923/12384 [1:57:29<24:12:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 7%|▋ | 923/12384 [1:57:37<24:12:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 7%|▋ | 924/12384 [1:57:37<24:12:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 7%|▋ | 924/12384 [1:57:44<24:12:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 1: 7%|▋ | 925/12384 [1:57:44<24:30:41, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 1: 7%|▋ | 925/12384 [1:57:52<24:30:41, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 1: 7%|▋ | 926/12384 [1:57:52<24:25:43, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 1: 7%|▋ | 926/12384 [1:58:00<24:25:43, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 7%|▋ | 927/12384 [1:58:00<24:22:23, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 7%|▋ | 927/12384 [1:58:07<24:22:23, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 7%|▋ | 928/12384 [1:58:07<24:19:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 7%|▋ | 928/12384 [1:58:15<24:19:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 8%|▊ | 929/12384 [1:58:15<24:16:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 8%|▊ | 929/12384 [1:58:23<24:16:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.78s]
Epoch 1: 8%|▊ | 930/12384 [1:58:23<24:15:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.78s]
Epoch 1: 8%|▊ | 930/12384 [1:58:30<24:15:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 1: 8%|▊ | 931/12384 [1:58:30<24:14:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 1: 8%|▊ | 931/12384 [1:58:38<24:14:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 8%|▊ | 932/12384 [1:58:38<24:14:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 8%|▊ | 932/12384 [1:58:45<24:14:00, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 1: 8%|▊ | 933/12384 [1:58:45<24:14:11, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 1: 8%|▊ | 933/12384 [1:58:53<24:14:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 1: 8%|▊ | 934/12384 [1:58:53<24:13:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 1: 8%|▊ | 934/12384 [1:59:01<24:13:49, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.62s]
Epoch 1: 8%|▊ | 935/12384 [1:59:01<24:12:47, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.62s]
Epoch 1: 8%|▊ | 935/12384 [1:59:08<24:12:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 8%|▊ | 936/12384 [1:59:08<24:11:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 8%|▊ | 936/12384 [1:59:16<24:11:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 8%|▊ | 937/12384 [1:59:16<24:11:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 8%|▊ | 937/12384 [1:59:23<24:11:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 8%|▊ | 938/12384 [1:59:23<24:11:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 8%|▊ | 938/12384 [1:59:31<24:11:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 8%|▊ | 939/12384 [1:59:31<24:11:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 8%|▊ | 939/12384 [1:59:39<24:11:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 8%|▊ | 940/12384 [1:59:39<24:16:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 8%|▊ | 940/12384 [1:59:46<24:16:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 8%|▊ | 941/12384 [1:59:46<24:14:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 8%|▊ | 941/12384 [1:59:54<24:14:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.53s]
Epoch 1: 8%|▊ | 942/12384 [1:59:54<24:13:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.53s]
Epoch 1: 8%|▊ | 942/12384 [2:00:02<24:13:19, 7.62s/it, loss=0.0014, acc=0.9950, iter_time=10.65s]
Epoch 1: 8%|▊ | 943/12384 [2:00:02<24:10:53, 7.61s/it, loss=0.0014, acc=0.9950, iter_time=10.65s]
Epoch 1: 8%|▊ | 943/12384 [2:00:09<24:10:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 8%|▊ | 944/12384 [2:00:09<24:09:58, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 8%|▊ | 944/12384 [2:00:17<24:09:58, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 1: 8%|▊ | 945/12384 [2:00:17<24:11:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 1: 8%|▊ | 945/12384 [2:00:24<24:11:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 1: 8%|▊ | 946/12384 [2:00:24<24:09:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 1: 8%|▊ | 946/12384 [2:00:32<24:09:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 1: 8%|▊ | 947/12384 [2:00:32<24:10:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 1: 8%|▊ | 947/12384 [2:00:40<24:10:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 1: 8%|▊ | 948/12384 [2:00:40<24:10:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 1: 8%|▊ | 948/12384 [2:00:47<24:10:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 1: 8%|▊ | 949/12384 [2:00:47<24:08:07, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 1: 8%|▊ | 949/12384 [2:00:55<24:08:07, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.62s]
Epoch 1: 8%|▊ | 950/12384 [2:00:55<24:10:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.62s]
Epoch 1: 8%|▊ | 950/12384 [2:01:02<24:10:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.99s]
Epoch 1: 8%|▊ | 951/12384 [2:01:02<24:10:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.99s]
Epoch 1: 8%|▊ | 951/12384 [2:01:10<24:10:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.67s]
Epoch 1: 8%|▊ | 952/12384 [2:01:10<24:28:35, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=11.67s]
Epoch 1: 8%|▊ | 952/12384 [2:01:18<24:28:35, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.19s]
Epoch 1: 8%|▊ | 953/12384 [2:01:18<24:21:42, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.19s]
Epoch 1: 8%|▊ | 953/12384 [2:01:26<24:21:42, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 8%|▊ | 954/12384 [2:01:26<24:16:58, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 8%|▊ | 954/12384 [2:01:33<24:16:58, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 1: 8%|▊ | 955/12384 [2:01:33<24:14:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 1: 8%|▊ | 955/12384 [2:01:41<24:14:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 8%|▊ | 956/12384 [2:01:41<24:12:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 8%|▊ | 956/12384 [2:01:48<24:12:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 8%|▊ | 957/12384 [2:01:48<24:12:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 8%|▊ | 957/12384 [2:01:56<24:12:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 8%|▊ | 958/12384 [2:01:56<24:10:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 8%|▊ | 958/12384 [2:02:04<24:10:08, 7.61s/it, loss=0.0001, acc=0.9997, iter_time=7.60s]
Epoch 1: 8%|▊ | 959/12384 [2:02:04<24:10:15, 7.62s/it, loss=0.0001, acc=0.9997, iter_time=7.60s]
Epoch 1: 8%|▊ | 959/12384 [2:02:11<24:10:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 8%|▊ | 960/12384 [2:02:11<24:11:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 8%|▊ | 960/12384 [2:02:19<24:11:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 8%|▊ | 961/12384 [2:02:19<24:09:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 8%|▊ | 961/12384 [2:02:26<24:09:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 8%|▊ | 962/12384 [2:02:26<24:08:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 8%|▊ | 962/12384 [2:02:34<24:08:00, 7.61s/it, loss=0.0005, acc=0.9981, iter_time=7.61s]
Epoch 1: 8%|▊ | 963/12384 [2:02:34<24:08:03, 7.61s/it, loss=0.0005, acc=0.9981, iter_time=7.61s]
Epoch 1: 8%|▊ | 963/12384 [2:02:42<24:08:03, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 1: 8%|▊ | 964/12384 [2:02:42<24:07:23, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 1: 8%|▊ | 964/12384 [2:02:49<24:07:23, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 1: 8%|▊ | 965/12384 [2:02:49<24:06:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 1: 8%|▊ | 965/12384 [2:02:57<24:06:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 1: 8%|▊ | 966/12384 [2:02:57<24:12:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 1: 8%|▊ | 966/12384 [2:03:04<24:12:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 8%|▊ | 967/12384 [2:03:04<24:10:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 8%|▊ | 967/12384 [2:03:12<24:10:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 8%|▊ | 968/12384 [2:03:12<24:08:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 8%|▊ | 968/12384 [2:03:20<24:08:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 8%|▊ | 969/12384 [2:03:20<24:13:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 8%|▊ | 969/12384 [2:03:27<24:13:18, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.70s]
Epoch 1: 8%|▊ | 970/12384 [2:03:27<24:13:23, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.70s]
Epoch 1: 8%|▊ | 970/12384 [2:03:35<24:13:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 1: 8%|▊ | 971/12384 [2:03:35<24:28:50, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 1: 8%|▊ | 971/12384 [2:03:43<24:28:50, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 8%|▊ | 972/12384 [2:03:43<24:22:46, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 8%|▊ | 972/12384 [2:03:51<24:22:46, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 8%|▊ | 973/12384 [2:03:51<24:17:17, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 8%|▊ | 973/12384 [2:03:58<24:17:17, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 8%|▊ | 974/12384 [2:03:58<24:14:25, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 8%|▊ | 974/12384 [2:04:06<24:14:25, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 8%|▊ | 975/12384 [2:04:06<24:11:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 8%|▊ | 975/12384 [2:04:13<24:11:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 8%|▊ | 976/12384 [2:04:13<24:10:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 8%|▊ | 976/12384 [2:04:21<24:10:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 8%|▊ | 977/12384 [2:04:21<24:09:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 8%|▊ | 977/12384 [2:04:29<24:09:39, 7.63s/it, loss=0.0002, acc=0.9991, iter_time=7.69s]
Epoch 1: 8%|▊ | 978/12384 [2:04:29<24:28:02, 7.72s/it, loss=0.0002, acc=0.9991, iter_time=7.69s]
Epoch 1: 8%|▊ | 978/12384 [2:04:37<24:28:02, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 8%|▊ | 979/12384 [2:04:37<24:22:01, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 8%|▊ | 979/12384 [2:04:44<24:22:01, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 8%|▊ | 980/12384 [2:04:44<24:16:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 8%|▊ | 980/12384 [2:04:52<24:16:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 1: 8%|▊ | 981/12384 [2:04:52<24:13:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 1: 8%|▊ | 981/12384 [2:04:59<24:13:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.85s]
Epoch 1: 8%|▊ | 982/12384 [2:04:59<24:10:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.85s]
Epoch 1: 8%|▊ | 982/12384 [2:05:07<24:10:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 1: 8%|▊ | 983/12384 [2:05:07<24:09:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 1: 8%|▊ | 983/12384 [2:05:15<24:09:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 1: 8%|▊ | 984/12384 [2:05:15<24:11:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 1: 8%|▊ | 984/12384 [2:05:22<24:11:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 8%|▊ | 985/12384 [2:05:22<24:10:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 8%|▊ | 985/12384 [2:05:30<24:10:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 8%|▊ | 986/12384 [2:05:30<24:08:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 8%|▊ | 986/12384 [2:05:37<24:08:45, 7.63s/it, loss=0.0002, acc=0.9999, iter_time=7.60s]
Epoch 1: 8%|▊ | 987/12384 [2:05:37<24:07:15, 7.62s/it, loss=0.0002, acc=0.9999, iter_time=7.60s]
Epoch 1: 8%|▊ | 987/12384 [2:05:45<24:07:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 8%|▊ | 988/12384 [2:05:45<24:11:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 8%|▊ | 988/12384 [2:05:53<24:11:54, 7.64s/it, loss=0.0004, acc=0.9983, iter_time=7.70s]
Epoch 1: 8%|▊ | 989/12384 [2:05:53<24:10:55, 7.64s/it, loss=0.0004, acc=0.9983, iter_time=7.70s]
Epoch 1: 8%|▊ | 989/12384 [2:06:00<24:10:55, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 1: 8%|▊ | 990/12384 [2:06:00<24:08:02, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 1: 8%|▊ | 990/12384 [2:06:08<24:08:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 8%|▊ | 991/12384 [2:06:08<24:08:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 8%|▊ | 991/12384 [2:06:16<24:08:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 8%|▊ | 992/12384 [2:06:16<24:06:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 8%|▊ | 992/12384 [2:06:23<24:06:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 1: 8%|▊ | 993/12384 [2:06:23<24:07:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 1: 8%|▊ | 993/12384 [2:06:31<24:07:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 1: 8%|▊ | 994/12384 [2:06:31<24:07:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 1: 8%|▊ | 994/12384 [2:06:39<24:07:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 8%|▊ | 995/12384 [2:06:39<24:07:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 8%|▊ | 995/12384 [2:06:46<24:07:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 8%|▊ | 996/12384 [2:06:46<24:09:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 8%|▊ | 996/12384 [2:06:54<24:09:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 8%|▊ | 997/12384 [2:06:54<24:22:56, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 8%|▊ | 997/12384 [2:07:02<24:22:56, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 8%|▊ | 998/12384 [2:07:02<24:17:06, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 8%|▊ | 998/12384 [2:07:09<24:17:06, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 1: 8%|▊ | 999/12384 [2:07:09<24:13:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 1: 8%|▊ | 999/12384 [2:07:17<24:13:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.56s]
Epoch 1: 8%|▊ | 1000/12384 [2:07:17<24:10:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.56s]
Epoch 1: 8%|▊ | 1000/12384 [2:07:25<24:10:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 8%|▊ | 1001/12384 [2:07:25<24:08:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 8%|▊ | 1001/12384 [2:07:32<24:08:06, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=4.26s]
Epoch 1: 8%|▊ | 1002/12384 [2:07:32<24:06:33, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=4.26s]
Epoch 1: 8%|▊ | 1002/12384 [2:07:40<24:06:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.36s]
Epoch 1: 8%|▊ | 1003/12384 [2:07:40<24:05:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.36s]
Epoch 1: 8%|▊ | 1003/12384 [2:07:47<24:05:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 8%|▊ | 1004/12384 [2:07:47<24:05:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 8%|▊ | 1004/12384 [2:07:55<24:05:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.30s]
Epoch 1: 8%|▊ | 1005/12384 [2:07:55<24:22:53, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.30s]
Epoch 1: 8%|▊ | 1005/12384 [2:08:03<24:22:53, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 8%|▊ | 1006/12384 [2:08:03<24:16:44, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 8%|▊ | 1006/12384 [2:08:11<24:16:44, 7.68s/it, loss=0.0001, acc=0.9992, iter_time=7.60s]
Epoch 1: 8%|▊ | 1007/12384 [2:08:11<24:13:11, 7.66s/it, loss=0.0001, acc=0.9992, iter_time=7.60s]
Epoch 1: 8%|▊ | 1007/12384 [2:08:18<24:13:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 8%|▊ | 1008/12384 [2:08:18<24:09:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 8%|▊ | 1008/12384 [2:08:26<24:09:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.40s]
Epoch 1: 8%|▊ | 1009/12384 [2:08:26<24:06:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.40s]
Epoch 1: 8%|▊ | 1009/12384 [2:08:33<24:06:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 1: 8%|▊ | 1010/12384 [2:08:33<24:05:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 1: 8%|▊ | 1010/12384 [2:08:41<24:05:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 8%|▊ | 1011/12384 [2:08:41<24:07:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 8%|▊ | 1011/12384 [2:08:49<24:07:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 8%|▊ | 1012/12384 [2:08:49<24:06:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 8%|▊ | 1012/12384 [2:08:56<24:06:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 8%|▊ | 1013/12384 [2:08:56<24:05:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 8%|▊ | 1013/12384 [2:09:04<24:05:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 8%|▊ | 1014/12384 [2:09:04<24:03:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 8%|▊ | 1014/12384 [2:09:11<24:03:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 8%|▊ | 1015/12384 [2:09:11<24:06:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 8%|▊ | 1015/12384 [2:09:19<24:06:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 1: 8%|▊ | 1016/12384 [2:09:19<24:05:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 1: 8%|▊ | 1016/12384 [2:09:27<24:05:28, 7.63s/it, loss=0.0005, acc=0.9999, iter_time=7.20s]
Epoch 1: 8%|▊ | 1017/12384 [2:09:27<24:04:57, 7.63s/it, loss=0.0005, acc=0.9999, iter_time=7.20s]
Epoch 1: 8%|▊ | 1017/12384 [2:09:34<24:04:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 8%|▊ | 1018/12384 [2:09:34<24:04:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 8%|▊ | 1018/12384 [2:09:42<24:04:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 8%|▊ | 1019/12384 [2:09:42<24:05:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 8%|▊ | 1019/12384 [2:09:50<24:05:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 8%|▊ | 1020/12384 [2:09:50<24:04:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 8%|▊ | 1020/12384 [2:09:57<24:04:32, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.27s]
Epoch 1: 8%|▊ | 1021/12384 [2:09:57<24:02:20, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.27s]
Epoch 1: 8%|▊ | 1021/12384 [2:10:05<24:02:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 1: 8%|▊ | 1022/12384 [2:10:05<24:02:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 1: 8%|▊ | 1022/12384 [2:10:13<24:02:58, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.70s]
Epoch 1: 8%|▊ | 1023/12384 [2:10:13<24:18:09, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=9.70s]
Epoch 1: 8%|▊ | 1023/12384 [2:10:20<24:18:09, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 8%|▊ | 1024/12384 [2:10:20<24:14:15, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 8%|▊ | 1024/12384 [2:10:28<24:14:15, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 1: 8%|▊ | 1025/12384 [2:10:28<24:10:31, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 1: 8%|▊ | 1025/12384 [2:10:36<24:10:31, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 8%|▊ | 1026/12384 [2:10:36<24:07:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 8%|▊ | 1026/12384 [2:10:43<24:07:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 1: 8%|▊ | 1027/12384 [2:10:43<24:05:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 1: 8%|▊ | 1027/12384 [2:10:51<24:05:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 1: 8%|▊ | 1028/12384 [2:10:51<24:02:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 1: 8%|▊ | 1028/12384 [2:10:58<24:02:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 1: 8%|▊ | 1029/12384 [2:10:58<24:02:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 1: 8%|▊ | 1029/12384 [2:11:06<24:02:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 1: 8%|▊ | 1030/12384 [2:11:06<24:02:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 1: 8%|▊ | 1030/12384 [2:11:14<24:02:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 8%|▊ | 1031/12384 [2:11:14<24:21:53, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 8%|▊ | 1031/12384 [2:11:22<24:21:53, 7.73s/it, loss=0.0001, acc=1.0000, iter_time=7.87s]
Epoch 1: 8%|▊ | 1032/12384 [2:11:22<24:14:38, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.87s]
Epoch 1: 8%|▊ | 1032/12384 [2:11:29<24:14:38, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=4.29s]
Epoch 1: 8%|▊ | 1033/12384 [2:11:29<24:11:13, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=4.29s]
Epoch 1: 8%|▊ | 1033/12384 [2:11:37<24:11:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 1: 8%|▊ | 1034/12384 [2:11:37<24:10:48, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 1: 8%|▊ | 1034/12384 [2:11:44<24:10:48, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.48s]
Epoch 1: 8%|▊ | 1035/12384 [2:11:44<24:06:57, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.48s]
Epoch 1: 8%|▊ | 1035/12384 [2:11:52<24:06:57, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 8%|▊ | 1036/12384 [2:11:52<24:04:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 8%|▊ | 1036/12384 [2:12:00<24:04:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 1: 8%|▊ | 1037/12384 [2:12:00<24:03:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 1: 8%|▊ | 1037/12384 [2:12:07<24:03:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 1: 8%|▊ | 1038/12384 [2:12:07<24:00:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 1: 8%|▊ | 1038/12384 [2:12:15<24:00:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 8%|▊ | 1039/12384 [2:12:15<23:59:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 8%|▊ | 1039/12384 [2:12:23<23:59:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 8%|▊ | 1040/12384 [2:12:23<24:01:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 8%|▊ | 1040/12384 [2:12:30<24:01:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 8%|▊ | 1041/12384 [2:12:30<23:59:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 8%|▊ | 1041/12384 [2:12:38<23:59:19, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.54s]
Epoch 1: 8%|▊ | 1042/12384 [2:12:38<24:00:54, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.54s]
Epoch 1: 8%|▊ | 1042/12384 [2:12:45<24:00:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.92s]
Epoch 1: 8%|▊ | 1043/12384 [2:12:45<24:01:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.92s]
Epoch 1: 8%|▊ | 1043/12384 [2:12:53<24:01:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.48s]
Epoch 1: 8%|▊ | 1044/12384 [2:12:53<24:04:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.48s]
Epoch 1: 8%|▊ | 1044/12384 [2:13:01<24:04:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 8%|▊ | 1045/12384 [2:13:01<24:01:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 8%|▊ | 1045/12384 [2:13:08<24:01:24, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.98s]
Epoch 1: 8%|▊ | 1046/12384 [2:13:08<23:58:50, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.98s]
Epoch 1: 8%|▊ | 1046/12384 [2:13:16<23:58:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 8%|▊ | 1047/12384 [2:13:16<23:58:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 8%|▊ | 1047/12384 [2:13:24<23:58:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 1: 8%|▊ | 1048/12384 [2:13:24<23:59:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 1: 8%|▊ | 1048/12384 [2:13:31<23:59:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 8%|▊ | 1049/12384 [2:13:31<24:12:05, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 8%|▊ | 1049/12384 [2:13:39<24:12:05, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 8%|▊ | 1050/12384 [2:13:39<24:06:48, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 8%|▊ | 1050/12384 [2:13:47<24:06:48, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 8%|▊ | 1051/12384 [2:13:47<24:02:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 8%|▊ | 1051/12384 [2:13:54<24:02:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 8%|▊ | 1052/12384 [2:13:54<24:00:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 8%|▊ | 1052/12384 [2:14:02<24:00:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 9%|▊ | 1053/12384 [2:14:02<23:59:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 9%|▊ | 1053/12384 [2:14:09<23:59:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 9%|▊ | 1054/12384 [2:14:09<24:00:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 9%|▊ | 1054/12384 [2:14:17<24:00:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 1: 9%|▊ | 1055/12384 [2:14:17<23:58:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 1: 9%|▊ | 1055/12384 [2:14:25<23:58:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 1: 9%|▊ | 1056/12384 [2:14:25<23:58:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 1: 9%|▊ | 1056/12384 [2:14:33<23:58:10, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.66s]
Epoch 1: 9%|▊ | 1057/12384 [2:14:33<24:17:28, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=6.66s]
Epoch 1: 9%|▊ | 1057/12384 [2:14:40<24:17:28, 7.72s/it, loss=0.0013, acc=0.9983, iter_time=8.51s]
Epoch 1: 9%|▊ | 1058/12384 [2:14:40<24:11:07, 7.69s/it, loss=0.0013, acc=0.9983, iter_time=8.51s]
Epoch 1: 9%|▊ | 1058/12384 [2:14:48<24:11:07, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 1: 9%|▊ | 1059/12384 [2:14:48<24:05:56, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 1: 9%|▊ | 1059/12384 [2:14:55<24:05:56, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.91s]
Epoch 1: 9%|▊ | 1060/12384 [2:14:55<24:03:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.91s]
Epoch 1: 9%|▊ | 1060/12384 [2:15:03<24:03:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 9%|▊ | 1061/12384 [2:15:03<23:59:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 9%|▊ | 1061/12384 [2:15:11<23:59:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 9%|▊ | 1062/12384 [2:15:11<23:58:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 9%|▊ | 1062/12384 [2:15:18<23:58:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 1: 9%|▊ | 1063/12384 [2:15:18<23:58:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 1: 9%|▊ | 1063/12384 [2:15:26<23:58:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 9%|▊ | 1064/12384 [2:15:26<23:58:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 9%|▊ | 1064/12384 [2:15:33<23:58:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 9%|▊ | 1065/12384 [2:15:33<23:57:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 9%|▊ | 1065/12384 [2:15:41<23:57:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 9%|▊ | 1066/12384 [2:15:41<23:56:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 9%|▊ | 1066/12384 [2:15:49<23:56:05, 7.61s/it, loss=0.0007, acc=0.9979, iter_time=7.21s]
Epoch 1: 9%|▊ | 1067/12384 [2:15:49<23:55:49, 7.61s/it, loss=0.0007, acc=0.9979, iter_time=7.21s]
Epoch 1: 9%|▊ | 1067/12384 [2:15:56<23:55:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 9%|▊ | 1068/12384 [2:15:56<23:55:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 9%|▊ | 1068/12384 [2:16:04<23:55:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 9%|▊ | 1069/12384 [2:16:04<23:56:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 9%|▊ | 1069/12384 [2:16:12<23:56:12, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.35s]
Epoch 1: 9%|▊ | 1070/12384 [2:16:12<23:55:49, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.35s]
Epoch 1: 9%|▊ | 1070/12384 [2:16:19<23:55:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 1: 9%|▊ | 1071/12384 [2:16:19<23:56:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 1: 9%|▊ | 1071/12384 [2:16:27<23:56:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.58s]
Epoch 1: 9%|▊ | 1072/12384 [2:16:27<23:57:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.58s]
Epoch 1: 9%|▊ | 1072/12384 [2:16:34<23:57:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 9%|▊ | 1073/12384 [2:16:34<23:56:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 9%|▊ | 1073/12384 [2:16:42<23:56:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 9%|▊ | 1074/12384 [2:16:42<23:56:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 9%|▊ | 1074/12384 [2:16:50<23:56:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 9%|▊ | 1075/12384 [2:16:50<24:10:58, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 9%|▊ | 1075/12384 [2:16:58<24:10:58, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 9%|▊ | 1076/12384 [2:16:58<24:06:07, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 9%|▊ | 1076/12384 [2:17:05<24:06:07, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 9%|▊ | 1077/12384 [2:17:05<24:04:00, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 9%|▊ | 1077/12384 [2:17:13<24:04:00, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 9%|▊ | 1078/12384 [2:17:13<24:00:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 9%|▊ | 1078/12384 [2:17:20<24:00:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 9%|▊ | 1079/12384 [2:17:20<23:59:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 9%|▊ | 1079/12384 [2:17:28<23:59:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 9%|▊ | 1080/12384 [2:17:28<23:58:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 9%|▊ | 1080/12384 [2:17:36<23:58:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 9%|▊ | 1081/12384 [2:17:36<23:57:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 9%|▊ | 1081/12384 [2:17:43<23:57:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 9%|▊ | 1082/12384 [2:17:43<23:55:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 9%|▊ | 1082/12384 [2:17:51<23:55:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.12s]
Epoch 1: 9%|▊ | 1083/12384 [2:17:51<24:16:53, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.12s]
Epoch 1: 9%|▊ | 1083/12384 [2:17:59<24:16:53, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 1: 9%|▉ | 1084/12384 [2:17:59<24:09:51, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 1: 9%|▉ | 1084/12384 [2:18:06<24:09:51, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 1: 9%|▉ | 1085/12384 [2:18:06<24:05:22, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 1: 9%|▉ | 1085/12384 [2:18:14<24:05:22, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 9%|▉ | 1086/12384 [2:18:14<24:03:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 9%|▉ | 1086/12384 [2:18:22<24:03:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 9%|▉ | 1087/12384 [2:18:22<24:00:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 9%|▉ | 1087/12384 [2:18:29<24:00:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 9%|▉ | 1088/12384 [2:18:29<23:58:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 9%|▉ | 1088/12384 [2:18:37<23:58:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 9%|▉ | 1089/12384 [2:18:37<23:55:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 9%|▉ | 1089/12384 [2:18:45<23:55:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 1: 9%|▉ | 1090/12384 [2:18:45<23:56:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 1: 9%|▉ | 1090/12384 [2:18:52<23:56:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.74s]
Epoch 1: 9%|▉ | 1091/12384 [2:18:52<23:55:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.74s]
Epoch 1: 9%|▉ | 1091/12384 [2:19:00<23:55:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 1: 9%|▉ | 1092/12384 [2:19:00<23:56:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 1: 9%|▉ | 1092/12384 [2:19:07<23:56:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 1: 9%|▉ | 1093/12384 [2:19:07<23:54:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 1: 9%|▉ | 1093/12384 [2:19:15<23:54:59, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=11.12s]
Epoch 1: 9%|▉ | 1094/12384 [2:19:15<23:54:21, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=11.12s]
Epoch 1: 9%|▉ | 1094/12384 [2:19:23<23:54:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 9%|▉ | 1095/12384 [2:19:23<23:56:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 9%|▉ | 1095/12384 [2:19:30<23:56:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 9%|▉ | 1096/12384 [2:19:30<23:55:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 9%|▉ | 1096/12384 [2:19:38<23:55:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 9%|▉ | 1097/12384 [2:19:38<23:54:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 9%|▉ | 1097/12384 [2:19:46<23:54:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 9%|▉ | 1098/12384 [2:19:46<23:53:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 9%|▉ | 1098/12384 [2:19:53<23:53:11, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=6.11s]
Epoch 1: 9%|▉ | 1099/12384 [2:19:53<23:53:26, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=6.11s]
Epoch 1: 9%|▉ | 1099/12384 [2:20:01<23:53:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 9%|▉ | 1100/12384 [2:20:01<23:57:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 9%|▉ | 1100/12384 [2:20:08<23:57:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.66s]
Epoch 1: 9%|▉ | 1101/12384 [2:20:08<23:54:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.66s]
Epoch 1: 9%|▉ | 1101/12384 [2:20:16<23:54:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 9%|▉ | 1102/12384 [2:20:16<24:09:05, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 9%|▉ | 1102/12384 [2:20:24<24:09:05, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 9%|▉ | 1103/12384 [2:20:24<24:03:28, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 9%|▉ | 1103/12384 [2:20:32<24:03:28, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 9%|▉ | 1104/12384 [2:20:32<24:00:10, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 9%|▉ | 1104/12384 [2:20:39<24:00:10, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 9%|▉ | 1105/12384 [2:20:39<23:57:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 9%|▉ | 1105/12384 [2:20:47<23:57:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 9%|▉ | 1106/12384 [2:20:47<23:56:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 9%|▉ | 1106/12384 [2:20:54<23:56:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 9%|▉ | 1107/12384 [2:20:54<23:54:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 9%|▉ | 1107/12384 [2:21:02<23:54:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.63s]
Epoch 1: 9%|▉ | 1108/12384 [2:21:02<23:52:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.63s]
Epoch 1: 9%|▉ | 1108/12384 [2:21:10<23:52:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.61s]
Epoch 1: 9%|▉ | 1109/12384 [2:21:10<24:07:42, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.61s]
Epoch 1: 9%|▉ | 1109/12384 [2:21:18<24:07:42, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.77s]
Epoch 1: 9%|▉ | 1110/12384 [2:21:18<24:02:40, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.77s]
Epoch 1: 9%|▉ | 1110/12384 [2:21:25<24:02:40, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 1: 9%|▉ | 1111/12384 [2:21:25<23:59:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 1: 9%|▉ | 1111/12384 [2:21:33<23:59:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=11.32s]
Epoch 1: 9%|▉ | 1112/12384 [2:21:33<23:57:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.32s]
Epoch 1: 9%|▉ | 1112/12384 [2:21:40<23:57:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 9%|▉ | 1113/12384 [2:21:40<23:57:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 9%|▉ | 1113/12384 [2:21:48<23:57:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 9%|▉ | 1114/12384 [2:21:48<23:53:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 9%|▉ | 1114/12384 [2:21:56<23:53:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 9%|▉ | 1115/12384 [2:21:56<23:57:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 9%|▉ | 1115/12384 [2:22:03<23:57:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 1: 9%|▉ | 1116/12384 [2:22:04<24:05:09, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 1: 9%|▉ | 1116/12384 [2:22:11<24:05:09, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.79s]
Epoch 1: 9%|▉ | 1117/12384 [2:22:11<23:58:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.79s]
Epoch 1: 9%|▉ | 1117/12384 [2:22:19<23:58:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.91s]
Epoch 1: 9%|▉ | 1118/12384 [2:22:19<23:55:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.91s]
Epoch 1: 9%|▉ | 1118/12384 [2:22:26<23:55:40, 7.65s/it, loss=0.0003, acc=0.9998, iter_time=10.89s]
Epoch 1: 9%|▉ | 1119/12384 [2:22:26<23:52:50, 7.63s/it, loss=0.0003, acc=0.9998, iter_time=10.89s]
Epoch 1: 9%|▉ | 1119/12384 [2:22:34<23:52:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 9%|▉ | 1120/12384 [2:22:34<23:52:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 9%|▉ | 1120/12384 [2:22:42<23:52:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 9%|▉ | 1121/12384 [2:22:42<23:55:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 9%|▉ | 1121/12384 [2:22:49<23:55:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 9%|▉ | 1122/12384 [2:22:49<23:52:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 9%|▉ | 1122/12384 [2:22:57<23:52:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 1: 9%|▉ | 1123/12384 [2:22:57<24:03:25, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 1: 9%|▉ | 1123/12384 [2:23:05<24:03:25, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.41s]
Epoch 1: 9%|▉ | 1124/12384 [2:23:05<23:58:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.41s]
Epoch 1: 9%|▉ | 1124/12384 [2:23:12<23:58:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 1: 9%|▉ | 1125/12384 [2:23:14<25:03:30, 8.01s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 1: 9%|▉ | 1125/12384 [2:23:21<25:03:30, 8.01s/it, loss=0.0000, acc=1.0000, iter_time=12.18s]
Epoch 1: 9%|▉ | 1126/12384 [2:23:21<24:39:53, 7.89s/it, loss=0.0000, acc=1.0000, iter_time=12.18s]
Epoch 1: 9%|▉ | 1126/12384 [2:23:29<24:39:53, 7.89s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 9%|▉ | 1127/12384 [2:23:29<24:37:45, 7.88s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 9%|▉ | 1127/12384 [2:23:37<24:37:45, 7.88s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 9%|▉ | 1128/12384 [2:23:37<24:23:13, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 9%|▉ | 1128/12384 [2:23:44<24:23:13, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 1: 9%|▉ | 1129/12384 [2:23:44<24:13:02, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 1: 9%|▉ | 1129/12384 [2:23:52<24:13:02, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 1: 9%|▉ | 1130/12384 [2:23:52<24:06:33, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 1: 9%|▉ | 1130/12384 [2:23:59<24:06:33, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 9%|▉ | 1131/12384 [2:23:59<24:01:15, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 9%|▉ | 1131/12384 [2:24:07<24:01:15, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 1: 9%|▉ | 1132/12384 [2:24:07<24:01:02, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 1: 9%|▉ | 1132/12384 [2:24:15<24:01:02, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.65s]
Epoch 1: 9%|▉ | 1133/12384 [2:24:15<23:56:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.65s]
Epoch 1: 9%|▉ | 1133/12384 [2:24:22<23:56:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 1: 9%|▉ | 1134/12384 [2:24:22<23:53:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 1: 9%|▉ | 1134/12384 [2:24:30<23:53:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 9%|▉ | 1135/12384 [2:24:30<23:54:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 9%|▉ | 1135/12384 [2:24:38<23:54:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 1: 9%|▉ | 1136/12384 [2:24:38<24:09:34, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 1: 9%|▉ | 1136/12384 [2:24:46<24:09:34, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.48s]
Epoch 1: 9%|▉ | 1137/12384 [2:24:46<24:03:00, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.48s]
Epoch 1: 9%|▉ | 1137/12384 [2:24:53<24:03:00, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 1: 9%|▉ | 1138/12384 [2:24:53<23:56:43, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 1: 9%|▉ | 1138/12384 [2:25:01<23:56:43, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 1: 9%|▉ | 1139/12384 [2:25:01<23:51:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 1: 9%|▉ | 1139/12384 [2:25:08<23:51:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.36s]
Epoch 1: 9%|▉ | 1140/12384 [2:25:08<23:51:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.36s]
Epoch 1: 9%|▉ | 1140/12384 [2:25:16<23:51:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.87s]
Epoch 1: 9%|▉ | 1141/12384 [2:25:16<23:48:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.87s]
Epoch 1: 9%|▉ | 1141/12384 [2:25:24<23:48:35, 7.62s/it, loss=0.0020, acc=0.9982, iter_time=7.58s]
Epoch 1: 9%|▉ | 1142/12384 [2:25:24<23:47:20, 7.62s/it, loss=0.0020, acc=0.9982, iter_time=7.58s]
Epoch 1: 9%|▉ | 1142/12384 [2:25:31<23:47:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 9%|▉ | 1143/12384 [2:25:31<23:46:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 9%|▉ | 1143/12384 [2:25:39<23:46:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 9%|▉ | 1144/12384 [2:25:39<23:46:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 9%|▉ | 1144/12384 [2:25:46<23:46:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 9%|▉ | 1145/12384 [2:25:46<23:43:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 9%|▉ | 1145/12384 [2:25:54<23:43:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.99s]
Epoch 1: 9%|▉ | 1146/12384 [2:25:54<23:48:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.99s]
Epoch 1: 9%|▉ | 1146/12384 [2:26:02<23:48:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.30s]
Epoch 1: 9%|▉ | 1147/12384 [2:26:02<23:47:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.30s]
Epoch 1: 9%|▉ | 1147/12384 [2:26:09<23:47:08, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.07s]
Epoch 1: 9%|▉ | 1148/12384 [2:26:09<23:46:19, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.07s]
Epoch 1: 9%|▉ | 1148/12384 [2:26:17<23:46:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 1: 9%|▉ | 1149/12384 [2:26:17<23:44:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 1: 9%|▉ | 1149/12384 [2:26:24<23:44:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 9%|▉ | 1150/12384 [2:26:24<23:43:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 9%|▉ | 1150/12384 [2:26:32<23:43:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 1: 9%|▉ | 1151/12384 [2:26:32<23:44:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 1: 9%|▉ | 1151/12384 [2:26:40<23:44:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.81s]
Epoch 1: 9%|▉ | 1152/12384 [2:26:40<23:44:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.81s]
Epoch 1: 9%|▉ | 1152/12384 [2:26:47<23:44:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.10s]
Epoch 1: 9%|▉ | 1153/12384 [2:26:47<23:44:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.10s]
Epoch 1: 9%|▉ | 1153/12384 [2:26:55<23:44:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.02s]
Epoch 1: 9%|▉ | 1154/12384 [2:26:55<23:59:21, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=11.02s]
Epoch 1: 9%|▉ | 1154/12384 [2:27:03<23:59:21, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 9%|▉ | 1155/12384 [2:27:03<23:53:20, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 9%|▉ | 1155/12384 [2:27:10<23:53:20, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 1: 9%|▉ | 1156/12384 [2:27:10<23:51:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 1: 9%|▉ | 1156/12384 [2:27:18<23:51:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 9%|▉ | 1157/12384 [2:27:18<23:50:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 9%|▉ | 1157/12384 [2:27:26<23:50:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 1: 9%|▉ | 1158/12384 [2:27:26<23:51:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 1: 9%|▉ | 1158/12384 [2:27:33<23:51:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.20s]
Epoch 1: 9%|▉ | 1159/12384 [2:27:33<23:48:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.20s]
Epoch 1: 9%|▉ | 1159/12384 [2:27:41<23:48:39, 7.64s/it, loss=0.0002, acc=0.9998, iter_time=7.98s]
Epoch 1: 9%|▉ | 1160/12384 [2:27:41<23:48:01, 7.63s/it, loss=0.0002, acc=0.9998, iter_time=7.98s]
Epoch 1: 9%|▉ | 1160/12384 [2:27:49<23:48:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 9%|▉ | 1161/12384 [2:27:49<23:50:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 9%|▉ | 1161/12384 [2:27:56<23:50:10, 7.65s/it, loss=0.0000, acc=0.9999, iter_time=7.72s]
Epoch 1: 9%|▉ | 1162/12384 [2:27:57<24:07:14, 7.74s/it, loss=0.0000, acc=0.9999, iter_time=7.72s]
Epoch 1: 9%|▉ | 1162/12384 [2:28:04<24:07:14, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 9%|▉ | 1163/12384 [2:28:04<23:59:39, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 9%|▉ | 1163/12384 [2:28:12<23:59:39, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 9%|▉ | 1164/12384 [2:28:12<23:55:25, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 9%|▉ | 1164/12384 [2:28:19<23:55:25, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 1: 9%|▉ | 1165/12384 [2:28:19<23:50:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 1: 9%|▉ | 1165/12384 [2:28:27<23:50:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.47s]
Epoch 1: 9%|▉ | 1166/12384 [2:28:27<23:49:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.47s]
Epoch 1: 9%|▉ | 1166/12384 [2:28:35<23:49:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 9%|▉ | 1167/12384 [2:28:35<23:47:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 9%|▉ | 1167/12384 [2:28:42<23:47:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 9%|▉ | 1168/12384 [2:28:42<23:47:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 9%|▉ | 1168/12384 [2:28:50<23:47:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.91s]
Epoch 1: 9%|▉ | 1169/12384 [2:28:50<23:45:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.91s]
Epoch 1: 9%|▉ | 1169/12384 [2:28:57<23:45:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 1: 9%|▉ | 1170/12384 [2:28:57<23:43:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 1: 9%|▉ | 1170/12384 [2:29:05<23:43:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 1: 9%|▉ | 1171/12384 [2:29:05<23:43:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 1: 9%|▉ | 1171/12384 [2:29:13<23:43:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 1: 9%|▉ | 1172/12384 [2:29:13<23:42:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 1: 9%|▉ | 1172/12384 [2:29:20<23:42:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 9%|▉ | 1173/12384 [2:29:20<23:42:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 9%|▉ | 1173/12384 [2:29:28<23:42:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.16s]
Epoch 1: 9%|▉ | 1174/12384 [2:29:28<23:43:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.16s]
Epoch 1: 9%|▉ | 1174/12384 [2:29:35<23:43:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 1: 9%|▉ | 1175/12384 [2:29:35<23:43:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 1: 9%|▉ | 1175/12384 [2:29:43<23:43:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.45s]
Epoch 1: 9%|▉ | 1176/12384 [2:29:43<23:42:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.45s]
Epoch 1: 9%|▉ | 1176/12384 [2:29:51<23:42:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.97s]
Epoch 1: 10%|▉ | 1177/12384 [2:29:51<23:41:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.97s]
Epoch 1: 10%|▉ | 1177/12384 [2:29:58<23:41:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.86s]
Epoch 1: 10%|▉ | 1178/12384 [2:29:58<23:41:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.86s]
Epoch 1: 10%|▉ | 1178/12384 [2:30:06<23:41:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 1: 10%|▉ | 1179/12384 [2:30:06<23:42:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 1: 10%|▉ | 1179/12384 [2:30:14<23:42:08, 7.62s/it, loss=0.0004, acc=0.9979, iter_time=10.23s]
Epoch 1: 10%|▉ | 1180/12384 [2:30:14<23:56:54, 7.70s/it, loss=0.0004, acc=0.9979, iter_time=10.23s]
Epoch 1: 10%|▉ | 1180/12384 [2:30:21<23:56:54, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 10%|▉ | 1181/12384 [2:30:21<23:55:44, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 10%|▉ | 1181/12384 [2:30:29<23:55:44, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 10%|▉ | 1182/12384 [2:30:29<23:51:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 10%|▉ | 1182/12384 [2:30:37<23:51:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 10%|▉ | 1183/12384 [2:30:37<23:49:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 10%|▉ | 1183/12384 [2:30:44<23:49:05, 7.66s/it, loss=0.0004, acc=0.9973, iter_time=8.79s]
Epoch 1: 10%|▉ | 1184/12384 [2:30:44<23:47:08, 7.65s/it, loss=0.0004, acc=0.9973, iter_time=8.79s]
Epoch 1: 10%|▉ | 1184/12384 [2:30:52<23:47:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 1: 10%|▉ | 1185/12384 [2:30:52<23:45:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 1: 10%|▉ | 1185/12384 [2:31:00<23:45:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.67s]
Epoch 1: 10%|▉ | 1186/12384 [2:31:00<23:42:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.67s]
Epoch 1: 10%|▉ | 1186/12384 [2:31:07<23:42:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 1: 10%|▉ | 1187/12384 [2:31:07<23:41:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 1: 10%|▉ | 1187/12384 [2:31:15<23:41:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.93s]
Epoch 1: 10%|▉ | 1188/12384 [2:31:15<23:39:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.93s]
Epoch 1: 10%|▉ | 1188/12384 [2:31:23<23:39:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 10%|▉ | 1189/12384 [2:31:23<23:56:55, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 10%|▉ | 1189/12384 [2:31:30<23:56:55, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 1: 10%|▉ | 1190/12384 [2:31:30<23:52:09, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 1: 10%|▉ | 1190/12384 [2:31:38<23:52:09, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 10%|▉ | 1191/12384 [2:31:38<23:47:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 10%|▉ | 1191/12384 [2:31:45<23:47:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 10%|▉ | 1192/12384 [2:31:45<23:45:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 10%|▉ | 1192/12384 [2:31:53<23:45:00, 7.64s/it, loss=0.0007, acc=0.9974, iter_time=4.18s]
Epoch 1: 10%|▉ | 1193/12384 [2:31:53<23:42:11, 7.63s/it, loss=0.0007, acc=0.9974, iter_time=4.18s]
Epoch 1: 10%|▉ | 1193/12384 [2:32:01<23:42:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 1: 10%|▉ | 1194/12384 [2:32:01<23:40:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 1: 10%|▉ | 1194/12384 [2:32:08<23:40:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.95s]
Epoch 1: 10%|▉ | 1195/12384 [2:32:08<23:40:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.95s]
Epoch 1: 10%|▉ | 1195/12384 [2:32:16<23:40:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.21s]
Epoch 1: 10%|▉ | 1196/12384 [2:32:16<23:40:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.21s]
Epoch 1: 10%|▉ | 1196/12384 [2:32:24<23:40:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 10%|▉ | 1197/12384 [2:32:24<23:40:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 10%|▉ | 1197/12384 [2:32:31<23:40:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 10%|▉ | 1198/12384 [2:32:31<23:40:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 10%|▉ | 1198/12384 [2:32:39<23:40:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 1: 10%|▉ | 1199/12384 [2:32:39<23:39:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 1: 10%|▉ | 1199/12384 [2:32:46<23:39:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.30s]
Epoch 1: 10%|▉ | 1200/12384 [2:32:46<23:39:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.30s]
Epoch 1: 10%|▉ | 1200/12384 [2:32:54<23:39:27, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.23s]
Epoch 1: 10%|▉ | 1201/12384 [2:32:54<23:38:17, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.23s]
Epoch 1: 10%|▉ | 1201/12384 [2:33:02<23:38:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 1: 10%|▉ | 1202/12384 [2:33:02<23:38:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 1: 10%|▉ | 1202/12384 [2:33:09<23:38:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 1: 10%|▉ | 1203/12384 [2:33:09<23:36:51, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 1: 10%|▉ | 1203/12384 [2:33:17<23:36:51, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 10%|▉ | 1204/12384 [2:33:17<23:37:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 10%|▉ | 1204/12384 [2:33:24<23:37:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 10%|▉ | 1205/12384 [2:33:24<23:37:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 10%|▉ | 1205/12384 [2:33:32<23:37:17, 7.61s/it, loss=0.0004, acc=0.9983, iter_time=7.93s]
Epoch 1: 10%|▉ | 1206/12384 [2:33:32<23:54:49, 7.70s/it, loss=0.0004, acc=0.9983, iter_time=7.93s]
Epoch 1: 10%|▉ | 1206/12384 [2:33:40<23:54:49, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 10%|▉ | 1207/12384 [2:33:40<23:49:33, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 10%|▉ | 1207/12384 [2:33:48<23:49:33, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 10%|▉ | 1208/12384 [2:33:48<23:45:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 10%|▉ | 1208/12384 [2:33:55<23:45:45, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 1: 10%|▉ | 1209/12384 [2:33:55<23:43:45, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 1: 10%|▉ | 1209/12384 [2:34:03<23:43:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.24s]
Epoch 1: 10%|▉ | 1210/12384 [2:34:03<23:42:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.24s]
Epoch 1: 10%|▉ | 1210/12384 [2:34:10<23:42:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 1: 10%|▉ | 1211/12384 [2:34:10<23:40:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 1: 10%|▉ | 1211/12384 [2:34:18<23:40:53, 7.63s/it, loss=0.0010, acc=0.9974, iter_time=7.63s]
Epoch 1: 10%|▉ | 1212/12384 [2:34:18<23:40:25, 7.63s/it, loss=0.0010, acc=0.9974, iter_time=7.63s]
Epoch 1: 10%|▉ | 1212/12384 [2:34:26<23:40:25, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 10%|▉ | 1213/12384 [2:34:26<23:40:23, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 10%|▉ | 1213/12384 [2:34:33<23:40:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 10%|▉ | 1214/12384 [2:34:33<23:39:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 10%|▉ | 1214/12384 [2:34:41<23:39:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 1: 10%|▉ | 1215/12384 [2:34:41<23:58:21, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 1: 10%|▉ | 1215/12384 [2:34:49<23:58:21, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=9.80s]
Epoch 1: 10%|▉ | 1216/12384 [2:34:49<23:51:47, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.80s]
Epoch 1: 10%|▉ | 1216/12384 [2:34:56<23:51:47, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.66s]
Epoch 1: 10%|▉ | 1217/12384 [2:34:56<23:48:01, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.66s]
Epoch 1: 10%|▉ | 1217/12384 [2:35:04<23:48:01, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 1: 10%|▉ | 1218/12384 [2:35:04<23:44:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 1: 10%|▉ | 1218/12384 [2:35:12<23:44:27, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=5.02s]
Epoch 1: 10%|▉ | 1219/12384 [2:35:12<23:42:50, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=5.02s]
Epoch 1: 10%|▉ | 1219/12384 [2:35:19<23:42:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=12.31s]
Epoch 1: 10%|▉ | 1220/12384 [2:35:19<23:41:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=12.31s]
Epoch 1: 10%|▉ | 1220/12384 [2:35:27<23:41:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 1: 10%|▉ | 1221/12384 [2:35:27<23:38:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 1: 10%|▉ | 1221/12384 [2:35:35<23:38:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 1: 10%|▉ | 1222/12384 [2:35:35<23:36:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 1: 10%|▉ | 1222/12384 [2:35:42<23:36:24, 7.61s/it, loss=0.0003, acc=0.9998, iter_time=7.59s]
Epoch 1: 10%|▉ | 1223/12384 [2:35:42<23:38:16, 7.62s/it, loss=0.0003, acc=0.9998, iter_time=7.59s]
Epoch 1: 10%|▉ | 1223/12384 [2:35:50<23:38:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 10%|▉ | 1224/12384 [2:35:50<23:36:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 10%|▉ | 1224/12384 [2:35:57<23:36:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 1: 10%|▉ | 1225/12384 [2:35:57<23:35:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 1: 10%|▉ | 1225/12384 [2:36:05<23:35:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 1: 10%|▉ | 1226/12384 [2:36:05<23:35:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 1: 10%|▉ | 1226/12384 [2:36:13<23:35:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 1: 10%|▉ | 1227/12384 [2:36:13<23:37:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 1: 10%|▉ | 1227/12384 [2:36:20<23:37:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 10%|▉ | 1228/12384 [2:36:20<23:36:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 10%|▉ | 1228/12384 [2:36:28<23:36:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 10%|▉ | 1229/12384 [2:36:28<23:36:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 10%|▉ | 1229/12384 [2:36:35<23:36:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 10%|▉ | 1230/12384 [2:36:35<23:35:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 10%|▉ | 1230/12384 [2:36:43<23:35:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 10%|▉ | 1231/12384 [2:36:43<23:33:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 10%|▉ | 1231/12384 [2:36:51<23:33:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 1: 10%|▉ | 1232/12384 [2:36:51<23:50:02, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 1: 10%|▉ | 1232/12384 [2:36:59<23:50:02, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.18s]
Epoch 1: 10%|▉ | 1233/12384 [2:36:59<23:44:15, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.18s]
Epoch 1: 10%|▉ | 1233/12384 [2:37:06<23:44:15, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.61s]
Epoch 1: 10%|▉ | 1234/12384 [2:37:06<23:41:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.61s]
Epoch 1: 10%|▉ | 1234/12384 [2:37:14<23:41:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 10%|▉ | 1235/12384 [2:37:14<23:38:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 10%|▉ | 1235/12384 [2:37:21<23:38:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 1: 10%|▉ | 1236/12384 [2:37:21<23:38:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 1: 10%|▉ | 1236/12384 [2:37:29<23:38:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 1: 10%|▉ | 1237/12384 [2:37:29<23:36:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 1: 10%|▉ | 1237/12384 [2:37:37<23:36:13, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.05s]
Epoch 1: 10%|▉ | 1238/12384 [2:37:37<23:36:06, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.05s]
Epoch 1: 10%|▉ | 1238/12384 [2:37:44<23:36:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.44s]
Epoch 1: 10%|█ | 1239/12384 [2:37:44<23:35:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.44s]
Epoch 1: 10%|█ | 1239/12384 [2:37:52<23:35:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.01s]
Epoch 1: 10%|█ | 1240/12384 [2:37:52<23:40:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.01s]
Epoch 1: 10%|█ | 1240/12384 [2:38:00<23:40:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 10%|█ | 1241/12384 [2:38:00<23:57:20, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 10%|█ | 1241/12384 [2:38:07<23:57:20, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=5.58s]
Epoch 1: 10%|█ | 1242/12384 [2:38:07<23:49:18, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.58s]
Epoch 1: 10%|█ | 1242/12384 [2:38:15<23:49:18, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 1: 10%|█ | 1243/12384 [2:38:15<23:44:27, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 1: 10%|█ | 1243/12384 [2:38:23<23:44:27, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 1: 10%|█ | 1244/12384 [2:38:23<23:41:49, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 1: 10%|█ | 1244/12384 [2:38:30<23:41:49, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 1: 10%|█ | 1245/12384 [2:38:30<23:39:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 1: 10%|█ | 1245/12384 [2:38:38<23:39:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.05s]
Epoch 1: 10%|█ | 1246/12384 [2:38:38<23:35:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.05s]
Epoch 1: 10%|█ | 1246/12384 [2:38:46<23:35:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.62s]
Epoch 1: 10%|█ | 1247/12384 [2:38:46<23:35:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.62s]
Epoch 1: 10%|█ | 1247/12384 [2:38:53<23:35:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.52s]
Epoch 1: 10%|█ | 1248/12384 [2:38:53<23:35:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.52s]
Epoch 1: 10%|█ | 1248/12384 [2:39:01<23:35:22, 7.63s/it, loss=0.0005, acc=0.9993, iter_time=7.24s]
Epoch 1: 10%|█ | 1249/12384 [2:39:01<23:34:04, 7.62s/it, loss=0.0005, acc=0.9993, iter_time=7.24s]
Epoch 1: 10%|█ | 1249/12384 [2:39:08<23:34:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 10%|█ | 1250/12384 [2:39:08<23:32:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 10%|█ | 1250/12384 [2:39:16<23:32:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=2.95s]
Epoch 1: 10%|█ | 1251/12384 [2:39:16<23:32:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=2.95s]
Epoch 1: 10%|█ | 1251/12384 [2:39:24<23:32:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 1: 10%|█ | 1252/12384 [2:39:24<23:33:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 1: 10%|█ | 1252/12384 [2:39:31<23:33:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.27s]
Epoch 1: 10%|█ | 1253/12384 [2:39:31<23:33:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.27s]
Epoch 1: 10%|█ | 1253/12384 [2:39:39<23:33:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 1: 10%|█ | 1254/12384 [2:39:39<23:31:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 1: 10%|█ | 1254/12384 [2:39:46<23:31:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 10%|█ | 1255/12384 [2:39:46<23:30:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 10%|█ | 1255/12384 [2:39:54<23:30:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 10%|█ | 1256/12384 [2:39:54<23:31:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 10%|█ | 1256/12384 [2:40:02<23:31:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.18s]
Epoch 1: 10%|█ | 1257/12384 [2:40:02<23:29:50, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.18s]
Epoch 1: 10%|█ | 1257/12384 [2:40:09<23:29:50, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 1: 10%|█ | 1258/12384 [2:40:09<23:29:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 1: 10%|█ | 1258/12384 [2:40:17<23:29:21, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=9.06s]
Epoch 1: 10%|█ | 1259/12384 [2:40:17<23:29:09, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=9.06s]
Epoch 1: 10%|█ | 1259/12384 [2:40:24<23:29:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 10%|█ | 1260/12384 [2:40:24<23:30:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 10%|█ | 1260/12384 [2:40:32<23:30:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 10%|█ | 1261/12384 [2:40:32<23:32:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 10%|█ | 1261/12384 [2:40:40<23:32:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 1: 10%|█ | 1262/12384 [2:40:40<23:27:47, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 1: 10%|█ | 1262/12384 [2:40:47<23:27:47, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 1: 10%|█ | 1263/12384 [2:40:47<23:29:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 1: 10%|█ | 1263/12384 [2:40:55<23:29:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 10%|█ | 1264/12384 [2:40:55<23:28:51, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 10%|█ | 1264/12384 [2:41:02<23:28:51, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 10%|█ | 1265/12384 [2:41:02<23:29:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 10%|█ | 1265/12384 [2:41:10<23:29:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 1: 10%|█ | 1266/12384 [2:41:10<23:32:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 1: 10%|█ | 1266/12384 [2:41:18<23:32:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.19s]
Epoch 1: 10%|█ | 1267/12384 [2:41:18<23:51:25, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=4.19s]
Epoch 1: 10%|█ | 1267/12384 [2:41:26<23:51:25, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 1: 10%|█ | 1268/12384 [2:41:26<23:46:17, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 1: 10%|█ | 1268/12384 [2:41:33<23:46:17, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 10%|█ | 1269/12384 [2:41:33<23:40:02, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 10%|█ | 1269/12384 [2:41:41<23:40:02, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 1: 10%|█ | 1270/12384 [2:41:41<23:40:59, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 1: 10%|█ | 1270/12384 [2:41:49<23:40:59, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 10%|█ | 1271/12384 [2:41:49<23:36:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 10%|█ | 1271/12384 [2:41:56<23:36:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 10%|█ | 1272/12384 [2:41:56<23:34:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 10%|█ | 1272/12384 [2:42:04<23:34:15, 7.64s/it, loss=0.0025, acc=0.9979, iter_time=7.64s]
Epoch 1: 10%|█ | 1273/12384 [2:42:04<23:33:44, 7.63s/it, loss=0.0025, acc=0.9979, iter_time=7.64s]
Epoch 1: 10%|█ | 1273/12384 [2:42:11<23:33:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 10%|█ | 1274/12384 [2:42:11<23:32:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 10%|█ | 1274/12384 [2:42:19<23:32:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 10%|█ | 1275/12384 [2:42:19<23:31:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 10%|█ | 1275/12384 [2:42:27<23:31:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 10%|█ | 1276/12384 [2:42:27<23:30:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 10%|█ | 1276/12384 [2:42:34<23:30:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 10%|█ | 1277/12384 [2:42:34<23:30:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 10%|█ | 1277/12384 [2:42:42<23:30:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 1: 10%|█ | 1278/12384 [2:42:42<23:29:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 1: 10%|█ | 1278/12384 [2:42:49<23:29:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 10%|█ | 1279/12384 [2:42:49<23:27:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 10%|█ | 1279/12384 [2:42:57<23:27:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 10%|█ | 1280/12384 [2:42:57<23:28:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 10%|█ | 1280/12384 [2:43:05<23:28:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 10%|█ | 1281/12384 [2:43:05<23:28:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 10%|█ | 1281/12384 [2:43:12<23:28:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 10%|█ | 1282/12384 [2:43:12<23:27:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 10%|█ | 1282/12384 [2:43:20<23:27:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 10%|█ | 1283/12384 [2:43:20<23:32:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 10%|█ | 1283/12384 [2:43:28<23:32:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.46s]
Epoch 1: 10%|█ | 1284/12384 [2:43:28<23:46:59, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.46s]
Epoch 1: 10%|█ | 1284/12384 [2:43:35<23:46:59, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 10%|█ | 1285/12384 [2:43:35<23:37:20, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 10%|█ | 1285/12384 [2:43:43<23:37:20, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 1: 10%|█ | 1286/12384 [2:43:43<23:34:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 1: 10%|█ | 1286/12384 [2:43:51<23:34:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 1: 10%|█ | 1287/12384 [2:43:51<23:30:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 1: 10%|█ | 1287/12384 [2:43:58<23:30:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.85s]
Epoch 1: 10%|█ | 1288/12384 [2:43:58<23:29:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.85s]
Epoch 1: 10%|█ | 1288/12384 [2:44:06<23:29:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 1: 10%|█ | 1289/12384 [2:44:06<23:32:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 1: 10%|█ | 1289/12384 [2:44:14<23:32:51, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.06s]
Epoch 1: 10%|█ | 1290/12384 [2:44:14<23:31:05, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.06s]
Epoch 1: 10%|█ | 1290/12384 [2:44:21<23:31:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 1: 10%|█ | 1291/12384 [2:44:21<23:29:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 1: 10%|█ | 1291/12384 [2:44:29<23:29:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 10%|█ | 1292/12384 [2:44:29<23:30:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 10%|█ | 1292/12384 [2:44:37<23:30:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.43s]
Epoch 1: 10%|█ | 1293/12384 [2:44:37<23:47:45, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.43s]
Epoch 1: 10%|█ | 1293/12384 [2:44:44<23:47:45, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.85s]
Epoch 1: 10%|█ | 1294/12384 [2:44:44<23:41:10, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.85s]
Epoch 1: 10%|█ | 1294/12384 [2:44:52<23:41:10, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 1: 10%|█ | 1295/12384 [2:44:52<23:40:39, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 1: 10%|█ | 1295/12384 [2:45:00<23:40:39, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 10%|█ | 1296/12384 [2:45:00<23:36:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 10%|█ | 1296/12384 [2:45:07<23:36:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 10%|█ | 1297/12384 [2:45:07<23:33:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 10%|█ | 1297/12384 [2:45:15<23:33:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 10%|█ | 1298/12384 [2:45:15<23:31:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 10%|█ | 1298/12384 [2:45:22<23:31:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 10%|█ | 1299/12384 [2:45:22<23:28:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 10%|█ | 1299/12384 [2:45:30<23:28:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 1: 10%|█ | 1300/12384 [2:45:30<23:26:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 1: 10%|█ | 1300/12384 [2:45:38<23:26:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.24s]
Epoch 1: 11%|█ | 1301/12384 [2:45:38<23:27:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.24s]
Epoch 1: 11%|█ | 1301/12384 [2:45:45<23:27:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.24s]
Epoch 1: 11%|█ | 1302/12384 [2:45:45<23:26:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.24s]
Epoch 1: 11%|█ | 1302/12384 [2:45:53<23:26:57, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=8.82s]
Epoch 1: 11%|█ | 1303/12384 [2:45:53<23:25:43, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=8.82s]
Epoch 1: 11%|█ | 1303/12384 [2:46:00<23:25:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 11%|█ | 1304/12384 [2:46:00<23:25:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 11%|█ | 1304/12384 [2:46:08<23:25:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 11%|█ | 1305/12384 [2:46:08<23:28:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 11%|█ | 1305/12384 [2:46:16<23:28:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 11%|█ | 1306/12384 [2:46:16<23:26:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 11%|█ | 1306/12384 [2:46:23<23:26:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 11%|█ | 1307/12384 [2:46:23<23:27:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 11%|█ | 1307/12384 [2:46:31<23:27:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 1: 11%|█ | 1308/12384 [2:46:31<23:27:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 1: 11%|█ | 1308/12384 [2:46:39<23:27:17, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.46s]
Epoch 1: 11%|█ | 1309/12384 [2:46:39<23:24:57, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.46s]
Epoch 1: 11%|█ | 1309/12384 [2:46:46<23:24:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.59s]
Epoch 1: 11%|█ | 1310/12384 [2:46:46<23:24:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.59s]
Epoch 1: 11%|█ | 1310/12384 [2:46:54<23:24:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.60s]
Epoch 1: 11%|█ | 1311/12384 [2:46:54<23:23:14, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.60s]
Epoch 1: 11%|█ | 1311/12384 [2:47:01<23:23:14, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 11%|█ | 1312/12384 [2:47:01<23:22:59, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 11%|█ | 1312/12384 [2:47:09<23:22:59, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 11%|█ | 1313/12384 [2:47:09<23:23:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 11%|█ | 1313/12384 [2:47:17<23:23:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 11%|█ | 1314/12384 [2:47:17<23:23:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 11%|█ | 1314/12384 [2:47:24<23:23:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 1: 11%|█ | 1315/12384 [2:47:24<23:22:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 1: 11%|█ | 1315/12384 [2:47:32<23:22:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.80s]
Epoch 1: 11%|█ | 1316/12384 [2:47:32<23:23:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.80s]
Epoch 1: 11%|█ | 1316/12384 [2:47:39<23:23:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 11%|█ | 1317/12384 [2:47:39<23:22:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 11%|█ | 1317/12384 [2:47:47<23:22:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 1: 11%|█ | 1318/12384 [2:47:47<23:24:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 1: 11%|█ | 1318/12384 [2:47:55<23:24:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 1: 11%|█ | 1319/12384 [2:47:55<23:23:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 1: 11%|█ | 1319/12384 [2:48:03<23:23:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 11%|█ | 1320/12384 [2:48:03<23:39:04, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 11%|█ | 1320/12384 [2:48:10<23:39:04, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.44s]
Epoch 1: 11%|█ | 1321/12384 [2:48:10<23:34:04, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.44s]
Epoch 1: 11%|█ | 1321/12384 [2:48:18<23:34:04, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 1: 11%|█ | 1322/12384 [2:48:18<23:31:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 1: 11%|█ | 1322/12384 [2:48:25<23:31:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 1: 11%|█ | 1323/12384 [2:48:25<23:28:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 1: 11%|█ | 1323/12384 [2:48:33<23:28:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 11%|█ | 1324/12384 [2:48:33<23:26:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 11%|█ | 1324/12384 [2:48:41<23:26:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 11%|█ | 1325/12384 [2:48:41<23:25:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 11%|█ | 1325/12384 [2:48:48<23:25:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 11%|█ | 1326/12384 [2:48:48<23:23:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 11%|█ | 1326/12384 [2:48:56<23:23:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.73s]
Epoch 1: 11%|█ | 1327/12384 [2:48:56<23:22:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.73s]
Epoch 1: 11%|█ | 1327/12384 [2:49:03<23:22:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.84s]
Epoch 1: 11%|█ | 1328/12384 [2:49:03<23:21:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.84s]
Epoch 1: 11%|█ | 1328/12384 [2:49:11<23:21:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 11%|█ | 1329/12384 [2:49:11<23:21:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 11%|█ | 1329/12384 [2:49:19<23:21:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 11%|█ | 1330/12384 [2:49:19<23:22:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 11%|█ | 1330/12384 [2:49:26<23:22:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 11%|█ | 1331/12384 [2:49:26<23:21:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 11%|█ | 1331/12384 [2:49:34<23:21:42, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.30s]
Epoch 1: 11%|█ | 1332/12384 [2:49:34<23:22:20, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.30s]
Epoch 1: 11%|█ | 1332/12384 [2:49:41<23:22:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.92s]
Epoch 1: 11%|█ | 1333/12384 [2:49:41<23:21:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.92s]
Epoch 1: 11%|█ | 1333/12384 [2:49:49<23:21:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 11%|█ | 1334/12384 [2:49:49<23:21:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 11%|█ | 1334/12384 [2:49:57<23:21:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 11%|█ | 1335/12384 [2:49:57<23:20:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 11%|█ | 1335/12384 [2:50:04<23:20:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 11%|█ | 1336/12384 [2:50:04<23:26:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 11%|█ | 1336/12384 [2:50:12<23:26:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 11%|█ | 1337/12384 [2:50:12<23:39:09, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 11%|█ | 1337/12384 [2:50:20<23:39:09, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=6.11s]
Epoch 1: 11%|█ | 1338/12384 [2:50:20<23:32:51, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=6.11s]
Epoch 1: 11%|█ | 1338/12384 [2:50:27<23:32:51, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 1: 11%|█ | 1339/12384 [2:50:27<23:28:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 1: 11%|█ | 1339/12384 [2:50:35<23:28:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 1: 11%|█ | 1340/12384 [2:50:35<23:25:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 1: 11%|█ | 1340/12384 [2:50:43<23:25:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 1: 11%|█ | 1341/12384 [2:50:43<23:24:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 1: 11%|█ | 1341/12384 [2:50:50<23:24:17, 7.63s/it, loss=0.0002, acc=0.9990, iter_time=5.84s]
Epoch 1: 11%|█ | 1342/12384 [2:50:50<23:23:35, 7.63s/it, loss=0.0002, acc=0.9990, iter_time=5.84s]
Epoch 1: 11%|█ | 1342/12384 [2:50:58<23:23:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 11%|█ | 1343/12384 [2:50:58<23:23:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 11%|█ | 1343/12384 [2:51:06<23:23:22, 7.63s/it, loss=0.0000, acc=0.9998, iter_time=7.68s]
Epoch 1: 11%|█ | 1344/12384 [2:51:06<23:28:24, 7.65s/it, loss=0.0000, acc=0.9998, iter_time=7.68s]
Epoch 1: 11%|█ | 1344/12384 [2:51:13<23:28:24, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=6.45s]
Epoch 1: 11%|█ | 1345/12384 [2:51:13<23:26:18, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.45s]
Epoch 1: 11%|█ | 1345/12384 [2:51:21<23:26:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.89s]
Epoch 1: 11%|█ | 1346/12384 [2:51:21<23:44:34, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.89s]
Epoch 1: 11%|█ | 1346/12384 [2:51:29<23:44:34, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 11%|█ | 1347/12384 [2:51:29<23:36:26, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 11%|█ | 1347/12384 [2:51:36<23:36:26, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 1: 11%|█ | 1348/12384 [2:51:36<23:31:31, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 1: 11%|█ | 1348/12384 [2:51:44<23:31:31, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 11%|█ | 1349/12384 [2:51:44<23:27:01, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 11%|█ | 1349/12384 [2:51:52<23:27:01, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 1: 11%|█ | 1350/12384 [2:51:52<23:23:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 1: 11%|█ | 1350/12384 [2:51:59<23:23:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.82s]
Epoch 1: 11%|█ | 1351/12384 [2:51:59<23:22:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.82s]
Epoch 1: 11%|█ | 1351/12384 [2:52:07<23:22:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 11%|█ | 1352/12384 [2:52:07<23:25:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 11%|█ | 1352/12384 [2:52:15<23:25:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 11%|█ | 1353/12384 [2:52:15<23:23:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 11%|█ | 1353/12384 [2:52:22<23:23:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 11%|█ | 1354/12384 [2:52:22<23:23:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 11%|█ | 1354/12384 [2:52:30<23:23:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 11%|█ | 1355/12384 [2:52:30<23:21:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 11%|█ | 1355/12384 [2:52:37<23:21:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 11%|█ | 1356/12384 [2:52:37<23:19:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 11%|█ | 1356/12384 [2:52:45<23:19:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 1: 11%|█ | 1357/12384 [2:52:45<23:21:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 1: 11%|█ | 1357/12384 [2:52:53<23:21:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.61s]
Epoch 1: 11%|█ | 1358/12384 [2:52:53<23:20:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.61s]
Epoch 1: 11%|█ | 1358/12384 [2:53:00<23:20:46, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.52s]
Epoch 1: 11%|█ | 1359/12384 [2:53:00<23:18:21, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.52s]
Epoch 1: 11%|█ | 1359/12384 [2:53:08<23:18:21, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.99s]
Epoch 1: 11%|█ | 1360/12384 [2:53:08<23:18:28, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.99s]
Epoch 1: 11%|█ | 1360/12384 [2:53:15<23:18:28, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.23s]
Epoch 1: 11%|█ | 1361/12384 [2:53:15<23:19:03, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.23s]
Epoch 1: 11%|█ | 1361/12384 [2:53:23<23:19:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 1: 11%|█ | 1362/12384 [2:53:23<23:22:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 1: 11%|█ | 1362/12384 [2:53:31<23:22:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 11%|█ | 1363/12384 [2:53:31<23:21:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 11%|█ | 1363/12384 [2:53:38<23:21:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.19s]
Epoch 1: 11%|█ | 1364/12384 [2:53:38<23:21:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.19s]
Epoch 1: 11%|█ | 1364/12384 [2:53:46<23:21:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 11%|█ | 1365/12384 [2:53:46<23:19:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 11%|█ | 1365/12384 [2:53:54<23:19:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 11%|█ | 1366/12384 [2:53:54<23:20:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 11%|█ | 1366/12384 [2:54:01<23:20:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.98s]
Epoch 1: 11%|█ | 1367/12384 [2:54:01<23:19:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.98s]
Epoch 1: 11%|█ | 1367/12384 [2:54:09<23:19:04, 7.62s/it, loss=0.0001, acc=0.9995, iter_time=9.27s]
Epoch 1: 11%|█ | 1368/12384 [2:54:09<23:20:24, 7.63s/it, loss=0.0001, acc=0.9995, iter_time=9.27s]
Epoch 1: 11%|█ | 1368/12384 [2:54:16<23:20:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.62s]
Epoch 1: 11%|█ | 1369/12384 [2:54:16<23:20:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.62s]
Epoch 1: 11%|█ | 1369/12384 [2:54:24<23:20:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 1: 11%|█ | 1370/12384 [2:54:24<23:19:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 1: 11%|█ | 1370/12384 [2:54:32<23:19:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.14s]
Epoch 1: 11%|█ | 1371/12384 [2:54:32<23:17:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.14s]
Epoch 1: 11%|█ | 1371/12384 [2:54:39<23:17:15, 7.61s/it, loss=0.0010, acc=0.9953, iter_time=7.58s]
Epoch 1: 11%|█ | 1372/12384 [2:54:39<23:16:27, 7.61s/it, loss=0.0010, acc=0.9953, iter_time=7.58s]
Epoch 1: 11%|█ | 1372/12384 [2:54:47<23:16:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.80s]
Epoch 1: 11%|█ | 1373/12384 [2:54:47<23:35:37, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.80s]
Epoch 1: 11%|█ | 1373/12384 [2:54:55<23:35:37, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.77s]
Epoch 1: 11%|█ | 1374/12384 [2:54:55<23:28:49, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.77s]
Epoch 1: 11%|█ | 1374/12384 [2:55:02<23:28:49, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 11%|█ | 1375/12384 [2:55:02<23:25:00, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 11%|█ | 1375/12384 [2:55:10<23:25:00, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 1: 11%|█ | 1376/12384 [2:55:10<23:21:18, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 1: 11%|█ | 1376/12384 [2:55:18<23:21:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.90s]
Epoch 1: 11%|█ | 1377/12384 [2:55:18<23:19:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.90s]
Epoch 1: 11%|█ | 1377/12384 [2:55:25<23:19:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 1: 11%|█ | 1378/12384 [2:55:25<23:18:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 1: 11%|█ | 1378/12384 [2:55:33<23:18:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.77s]
Epoch 1: 11%|█ | 1379/12384 [2:55:33<23:18:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.77s]
Epoch 1: 11%|█ | 1379/12384 [2:55:40<23:18:08, 7.62s/it, loss=0.0001, acc=0.9989, iter_time=7.61s]
Epoch 1: 11%|█ | 1380/12384 [2:55:40<23:17:10, 7.62s/it, loss=0.0001, acc=0.9989, iter_time=7.61s]
Epoch 1: 11%|█ | 1380/12384 [2:55:48<23:17:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 11%|█ | 1381/12384 [2:55:48<23:16:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 11%|█ | 1381/12384 [2:55:56<23:16:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 1: 11%|█ | 1382/12384 [2:55:56<23:16:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 1: 11%|█ | 1382/12384 [2:56:03<23:16:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 11%|█ | 1383/12384 [2:56:03<23:14:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 11%|█ | 1383/12384 [2:56:11<23:14:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.41s]
Epoch 1: 11%|█ | 1384/12384 [2:56:11<23:14:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.41s]
Epoch 1: 11%|█ | 1384/12384 [2:56:18<23:14:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 1: 11%|█ | 1385/12384 [2:56:18<23:15:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 1: 11%|█ | 1385/12384 [2:56:26<23:15:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 1: 11%|█ | 1386/12384 [2:56:26<23:15:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 1: 11%|█ | 1386/12384 [2:56:34<23:15:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.08s]
Epoch 1: 11%|█ | 1387/12384 [2:56:34<23:15:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.08s]
Epoch 1: 11%|█ | 1387/12384 [2:56:41<23:15:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.95s]
Epoch 1: 11%|█ | 1388/12384 [2:56:41<23:17:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.95s]
Epoch 1: 11%|█ | 1388/12384 [2:56:49<23:17:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 11%|█ | 1389/12384 [2:56:49<23:19:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 11%|█ | 1389/12384 [2:56:57<23:19:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 1: 11%|█ | 1390/12384 [2:56:57<23:23:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 1: 11%|█ | 1390/12384 [2:57:04<23:23:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 11%|█ | 1391/12384 [2:57:04<23:20:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 11%|█ | 1391/12384 [2:57:12<23:20:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 11%|█ | 1392/12384 [2:57:12<23:19:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 11%|█ | 1392/12384 [2:57:20<23:19:18, 7.64s/it, loss=0.0019, acc=0.9982, iter_time=7.65s]
Epoch 1: 11%|█ | 1393/12384 [2:57:20<23:17:58, 7.63s/it, loss=0.0019, acc=0.9982, iter_time=7.65s]
Epoch 1: 11%|█ | 1393/12384 [2:57:27<23:17:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 11%|█▏ | 1394/12384 [2:57:27<23:16:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 11%|█▏ | 1394/12384 [2:57:35<23:16:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 1: 11%|█▏ | 1395/12384 [2:57:35<23:14:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 1: 11%|█▏ | 1395/12384 [2:57:42<23:14:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.11s]
Epoch 1: 11%|█▏ | 1396/12384 [2:57:42<23:13:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.11s]
Epoch 1: 11%|█▏ | 1396/12384 [2:57:50<23:13:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 11%|█▏ | 1397/12384 [2:57:50<23:13:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 11%|█▏ | 1397/12384 [2:57:58<23:13:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 11%|█▏ | 1398/12384 [2:57:58<23:13:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 11%|█▏ | 1398/12384 [2:58:06<23:13:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 1: 11%|█▏ | 1399/12384 [2:58:06<23:33:07, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 1: 11%|█▏ | 1399/12384 [2:58:13<23:33:07, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.08s]
Epoch 1: 11%|█▏ | 1400/12384 [2:58:13<23:26:59, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.08s]
Epoch 1: 11%|█▏ | 1400/12384 [2:58:21<23:26:59, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.29s]
Epoch 1: 11%|█▏ | 1401/12384 [2:58:21<23:22:38, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.29s]
Epoch 1: 11%|█▏ | 1401/12384 [2:58:28<23:22:38, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 11%|█▏ | 1402/12384 [2:58:28<23:19:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 11%|█▏ | 1402/12384 [2:58:36<23:19:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 11%|█▏ | 1403/12384 [2:58:36<23:18:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 11%|█▏ | 1403/12384 [2:58:44<23:18:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 1: 11%|█▏ | 1404/12384 [2:58:44<23:15:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 1: 11%|█▏ | 1404/12384 [2:58:51<23:15:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 11%|█▏ | 1405/12384 [2:58:51<23:15:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 11%|█▏ | 1405/12384 [2:58:59<23:15:33, 7.63s/it, loss=0.0005, acc=0.9998, iter_time=7.62s]
Epoch 1: 11%|█▏ | 1406/12384 [2:58:59<23:13:33, 7.62s/it, loss=0.0005, acc=0.9998, iter_time=7.62s]
Epoch 1: 11%|█▏ | 1406/12384 [2:59:06<23:13:33, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 1: 11%|█▏ | 1407/12384 [2:59:06<23:13:57, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 1: 11%|█▏ | 1407/12384 [2:59:14<23:13:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.14s]
Epoch 1: 11%|█▏ | 1408/12384 [2:59:14<23:19:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.14s]
Epoch 1: 11%|█▏ | 1408/12384 [2:59:22<23:19:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.91s]
Epoch 1: 11%|█▏ | 1409/12384 [2:59:22<23:16:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.91s]
Epoch 1: 11%|█▏ | 1409/12384 [2:59:29<23:16:03, 7.63s/it, loss=0.0004, acc=0.9997, iter_time=9.90s]
Epoch 1: 11%|█▏ | 1410/12384 [2:59:29<23:17:21, 7.64s/it, loss=0.0004, acc=0.9997, iter_time=9.90s]
Epoch 1: 11%|█▏ | 1410/12384 [2:59:37<23:17:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 11%|█▏ | 1411/12384 [2:59:37<23:15:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 11%|█▏ | 1411/12384 [2:59:45<23:15:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 11%|█▏ | 1412/12384 [2:59:45<23:14:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 11%|█▏ | 1412/12384 [2:59:52<23:14:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 1: 11%|█▏ | 1413/12384 [2:59:52<23:12:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 1: 11%|█▏ | 1413/12384 [3:00:00<23:12:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.98s]
Epoch 1: 11%|█▏ | 1414/12384 [3:00:00<23:11:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.98s]
Epoch 1: 11%|█▏ | 1414/12384 [3:00:08<23:11:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 1: 11%|█▏ | 1415/12384 [3:00:08<23:26:33, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 1: 11%|█▏ | 1415/12384 [3:00:15<23:26:33, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 11%|█▏ | 1416/12384 [3:00:15<23:23:04, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 11%|█▏ | 1416/12384 [3:00:23<23:23:04, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 11%|█▏ | 1417/12384 [3:00:23<23:19:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 11%|█▏ | 1417/12384 [3:00:31<23:19:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 11%|█▏ | 1418/12384 [3:00:31<23:16:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 11%|█▏ | 1418/12384 [3:00:38<23:16:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 1: 11%|█▏ | 1419/12384 [3:00:38<23:13:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 1: 11%|█▏ | 1419/12384 [3:00:46<23:13:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 11%|█▏ | 1420/12384 [3:00:46<23:13:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 11%|█▏ | 1420/12384 [3:00:53<23:13:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 11%|█▏ | 1421/12384 [3:00:53<23:12:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 11%|█▏ | 1421/12384 [3:01:01<23:12:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 11%|█▏ | 1422/12384 [3:01:01<23:11:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 11%|█▏ | 1422/12384 [3:01:09<23:11:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 11%|█▏ | 1423/12384 [3:01:09<23:10:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 11%|█▏ | 1423/12384 [3:01:16<23:10:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 11%|█▏ | 1424/12384 [3:01:16<23:11:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 11%|█▏ | 1424/12384 [3:01:24<23:11:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 12%|█▏ | 1425/12384 [3:01:24<23:27:31, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 12%|█▏ | 1425/12384 [3:01:32<23:27:31, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.36s]
Epoch 1: 12%|█▏ | 1426/12384 [3:01:32<23:22:12, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.36s]
Epoch 1: 12%|█▏ | 1426/12384 [3:01:39<23:22:12, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.37s]
Epoch 1: 12%|█▏ | 1427/12384 [3:01:39<23:18:18, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.37s]
Epoch 1: 12%|█▏ | 1427/12384 [3:01:47<23:18:18, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.79s]
Epoch 1: 12%|█▏ | 1428/12384 [3:01:47<23:15:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.79s]
Epoch 1: 12%|█▏ | 1428/12384 [3:01:55<23:15:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 1: 12%|█▏ | 1429/12384 [3:01:55<23:13:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 1: 12%|█▏ | 1429/12384 [3:02:02<23:13:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 12%|█▏ | 1430/12384 [3:02:02<23:10:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 12%|█▏ | 1430/12384 [3:02:10<23:10:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 12%|█▏ | 1431/12384 [3:02:10<23:10:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 12%|█▏ | 1431/12384 [3:02:17<23:10:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 12%|█▏ | 1432/12384 [3:02:17<23:10:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 12%|█▏ | 1432/12384 [3:02:25<23:10:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 12%|█▏ | 1433/12384 [3:02:25<23:09:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 12%|█▏ | 1433/12384 [3:02:33<23:09:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 12%|█▏ | 1434/12384 [3:02:33<23:09:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 12%|█▏ | 1434/12384 [3:02:40<23:09:27, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.55s]
Epoch 1: 12%|█▏ | 1435/12384 [3:02:40<23:09:16, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.55s]
Epoch 1: 12%|█▏ | 1435/12384 [3:02:48<23:09:16, 7.61s/it, loss=0.0007, acc=0.9996, iter_time=9.68s]
Epoch 1: 12%|█▏ | 1436/12384 [3:02:48<23:09:00, 7.61s/it, loss=0.0007, acc=0.9996, iter_time=9.68s]
Epoch 1: 12%|█▏ | 1436/12384 [3:02:55<23:09:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 12%|█▏ | 1437/12384 [3:02:55<23:07:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 12%|█▏ | 1437/12384 [3:03:03<23:07:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 12%|█▏ | 1438/12384 [3:03:03<23:07:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 12%|█▏ | 1438/12384 [3:03:11<23:07:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 12%|█▏ | 1439/12384 [3:03:11<23:06:36, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 12%|█▏ | 1439/12384 [3:03:18<23:06:36, 7.60s/it, loss=0.0002, acc=0.9995, iter_time=8.08s]
Epoch 1: 12%|█▏ | 1440/12384 [3:03:18<23:14:19, 7.64s/it, loss=0.0002, acc=0.9995, iter_time=8.08s]
Epoch 1: 12%|█▏ | 1440/12384 [3:03:26<23:14:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 12%|█▏ | 1441/12384 [3:03:26<23:29:46, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 12%|█▏ | 1441/12384 [3:03:34<23:29:46, 7.73s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 1: 12%|█▏ | 1442/12384 [3:03:34<23:23:38, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 1: 12%|█▏ | 1442/12384 [3:03:42<23:23:38, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 1: 12%|█▏ | 1443/12384 [3:03:42<23:18:06, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 1: 12%|█▏ | 1443/12384 [3:03:49<23:18:06, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 1: 12%|█▏ | 1444/12384 [3:03:49<23:13:57, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 1: 12%|█▏ | 1444/12384 [3:03:57<23:13:57, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 1: 12%|█▏ | 1445/12384 [3:03:57<23:11:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 1: 12%|█▏ | 1445/12384 [3:04:04<23:11:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 12%|█▏ | 1446/12384 [3:04:04<23:10:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 12%|█▏ | 1446/12384 [3:04:12<23:10:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 12%|█▏ | 1447/12384 [3:04:12<23:09:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 12%|█▏ | 1447/12384 [3:04:20<23:09:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 12%|█▏ | 1448/12384 [3:04:20<23:08:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 12%|█▏ | 1448/12384 [3:04:27<23:08:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 12%|█▏ | 1449/12384 [3:04:27<23:07:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 12%|█▏ | 1449/12384 [3:04:35<23:07:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 12%|█▏ | 1450/12384 [3:04:35<23:06:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 12%|█▏ | 1450/12384 [3:04:43<23:06:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 12%|█▏ | 1451/12384 [3:04:43<23:24:30, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 12%|█▏ | 1451/12384 [3:04:50<23:24:30, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 1: 12%|█▏ | 1452/12384 [3:04:50<23:17:44, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 1: 12%|█▏ | 1452/12384 [3:04:58<23:17:44, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 1: 12%|█▏ | 1453/12384 [3:04:58<23:14:43, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 1: 12%|█▏ | 1453/12384 [3:05:06<23:14:43, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 12%|█▏ | 1454/12384 [3:05:06<23:15:45, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 12%|█▏ | 1454/12384 [3:05:13<23:15:45, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 1: 12%|█▏ | 1455/12384 [3:05:13<23:10:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 1: 12%|█▏ | 1455/12384 [3:05:21<23:10:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 1: 12%|█▏ | 1456/12384 [3:05:21<23:09:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 1: 12%|█▏ | 1456/12384 [3:05:28<23:09:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 12%|█▏ | 1457/12384 [3:05:28<23:07:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 12%|█▏ | 1457/12384 [3:05:36<23:07:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 12%|█▏ | 1458/12384 [3:05:36<23:06:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 12%|█▏ | 1458/12384 [3:05:44<23:06:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 1: 12%|█▏ | 1459/12384 [3:05:44<23:06:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 1: 12%|█▏ | 1459/12384 [3:05:51<23:06:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 1: 12%|█▏ | 1460/12384 [3:05:51<23:06:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 1: 12%|█▏ | 1460/12384 [3:05:59<23:06:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 1: 12%|█▏ | 1461/12384 [3:05:59<23:09:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 1: 12%|█▏ | 1461/12384 [3:06:07<23:09:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 1: 12%|█▏ | 1462/12384 [3:06:07<23:07:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 1: 12%|█▏ | 1462/12384 [3:06:14<23:07:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 1: 12%|█▏ | 1463/12384 [3:06:14<23:06:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 1: 12%|█▏ | 1463/12384 [3:06:22<23:06:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.20s]
Epoch 1: 12%|█▏ | 1464/12384 [3:06:22<23:07:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.20s]
Epoch 1: 12%|█▏ | 1464/12384 [3:06:29<23:07:00, 7.62s/it, loss=0.0006, acc=0.9998, iter_time=7.22s]
Epoch 1: 12%|█▏ | 1465/12384 [3:06:29<23:05:02, 7.61s/it, loss=0.0006, acc=0.9998, iter_time=7.22s]
Epoch 1: 12%|█▏ | 1465/12384 [3:06:37<23:05:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 1: 12%|█▏ | 1466/12384 [3:06:37<23:08:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 1: 12%|█▏ | 1466/12384 [3:06:45<23:08:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 1: 12%|█▏ | 1467/12384 [3:06:45<23:23:16, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 1: 12%|█▏ | 1467/12384 [3:06:53<23:23:16, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 12%|█▏ | 1468/12384 [3:06:53<23:21:21, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 12%|█▏ | 1468/12384 [3:07:00<23:21:21, 7.70s/it, loss=0.0001, acc=0.9996, iter_time=5.61s]
Epoch 1: 12%|█▏ | 1469/12384 [3:07:00<23:16:05, 7.67s/it, loss=0.0001, acc=0.9996, iter_time=5.61s]
Epoch 1: 12%|█▏ | 1469/12384 [3:07:08<23:16:05, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 1: 12%|█▏ | 1470/12384 [3:07:08<23:13:41, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 1: 12%|█▏ | 1470/12384 [3:07:15<23:13:41, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 12%|█▏ | 1471/12384 [3:07:15<23:13:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 12%|█▏ | 1471/12384 [3:07:23<23:13:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 12%|█▏ | 1472/12384 [3:07:23<23:10:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 12%|█▏ | 1472/12384 [3:07:31<23:10:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 12%|█▏ | 1473/12384 [3:07:31<23:09:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 12%|█▏ | 1473/12384 [3:07:38<23:09:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.35s]
Epoch 1: 12%|█▏ | 1474/12384 [3:07:38<23:06:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.35s]
Epoch 1: 12%|█▏ | 1474/12384 [3:07:46<23:06:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.95s]
Epoch 1: 12%|█▏ | 1475/12384 [3:07:46<23:09:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.95s]
Epoch 1: 12%|█▏ | 1475/12384 [3:07:54<23:09:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 12%|█▏ | 1476/12384 [3:07:54<23:06:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 12%|█▏ | 1476/12384 [3:08:02<23:06:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 1: 12%|█▏ | 1477/12384 [3:08:02<23:22:08, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 1: 12%|█▏ | 1477/12384 [3:08:09<23:22:08, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=6.36s]
Epoch 1: 12%|█▏ | 1478/12384 [3:08:09<23:15:26, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=6.36s]
Epoch 1: 12%|█▏ | 1478/12384 [3:08:17<23:15:26, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 1: 12%|█▏ | 1479/12384 [3:08:17<23:11:44, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 1: 12%|█▏ | 1479/12384 [3:08:24<23:11:44, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.56s]
Epoch 1: 12%|█▏ | 1480/12384 [3:08:24<23:08:46, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.56s]
Epoch 1: 12%|█▏ | 1480/12384 [3:08:32<23:08:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 1: 12%|█▏ | 1481/12384 [3:08:32<23:06:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 1: 12%|█▏ | 1481/12384 [3:08:40<23:06:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 1: 12%|█▏ | 1482/12384 [3:08:40<23:05:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 1: 12%|█▏ | 1482/12384 [3:08:47<23:05:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 12%|█▏ | 1483/12384 [3:08:47<23:05:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 12%|█▏ | 1483/12384 [3:08:55<23:05:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 1: 12%|█▏ | 1484/12384 [3:08:55<23:06:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 1: 12%|█▏ | 1484/12384 [3:09:02<23:06:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 1: 12%|█▏ | 1485/12384 [3:09:02<23:05:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 1: 12%|█▏ | 1485/12384 [3:09:10<23:05:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 1: 12%|█▏ | 1486/12384 [3:09:10<23:03:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 1: 12%|█▏ | 1486/12384 [3:09:18<23:03:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 1: 12%|█▏ | 1487/12384 [3:09:18<23:01:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 1: 12%|█▏ | 1487/12384 [3:09:25<23:01:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 12%|█▏ | 1488/12384 [3:09:25<23:01:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 12%|█▏ | 1488/12384 [3:09:33<23:01:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 1: 12%|█▏ | 1489/12384 [3:09:33<23:00:17, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 1: 12%|█▏ | 1489/12384 [3:09:40<23:00:17, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 1: 12%|█▏ | 1490/12384 [3:09:40<23:01:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 1: 12%|█▏ | 1490/12384 [3:09:48<23:01:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 1: 12%|█▏ | 1491/12384 [3:09:48<23:01:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 1: 12%|█▏ | 1491/12384 [3:09:56<23:01:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 12%|█▏ | 1492/12384 [3:09:56<23:01:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 12%|█▏ | 1492/12384 [3:10:03<23:01:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.25s]
Epoch 1: 12%|█▏ | 1493/12384 [3:10:03<22:59:36, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.25s]
Epoch 1: 12%|█▏ | 1493/12384 [3:10:11<22:59:36, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 1: 12%|█▏ | 1494/12384 [3:10:11<22:59:16, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 1: 12%|█▏ | 1494/12384 [3:10:18<22:59:16, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 1: 12%|█▏ | 1495/12384 [3:10:18<22:59:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 1: 12%|█▏ | 1495/12384 [3:10:26<22:59:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.49s]
Epoch 1: 12%|█▏ | 1496/12384 [3:10:26<22:59:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.49s]
Epoch 1: 12%|█▏ | 1496/12384 [3:10:34<22:59:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 12%|█▏ | 1497/12384 [3:10:34<22:59:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 12%|█▏ | 1497/12384 [3:10:41<22:59:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.23s]
Epoch 1: 12%|█▏ | 1498/12384 [3:10:41<22:59:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.23s]
Epoch 1: 12%|█▏ | 1498/12384 [3:10:49<22:59:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.00s]
Epoch 1: 12%|█▏ | 1499/12384 [3:10:49<23:03:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.00s]
Epoch 1: 12%|█▏ | 1499/12384 [3:10:57<23:03:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 1: 12%|█▏ | 1500/12384 [3:10:57<23:04:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 1: 12%|█▏ | 1500/12384 [3:11:04<23:04:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.87s]
Epoch 1: 12%|█▏ | 1501/12384 [3:11:04<23:02:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.87s]
Epoch 1: 12%|█▏ | 1501/12384 [3:11:12<23:02:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 12%|█▏ | 1502/12384 [3:11:12<23:01:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 12%|█▏ | 1502/12384 [3:11:19<23:01:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 12%|█▏ | 1503/12384 [3:11:19<23:00:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 12%|█▏ | 1503/12384 [3:11:27<23:00:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 12%|█▏ | 1504/12384 [3:11:27<23:18:33, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 12%|█▏ | 1504/12384 [3:11:35<23:18:33, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 1: 12%|█▏ | 1505/12384 [3:11:35<23:18:43, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 1: 12%|█▏ | 1505/12384 [3:11:43<23:18:43, 7.71s/it, loss=0.0003, acc=0.9998, iter_time=10.01s]
Epoch 1: 12%|█▏ | 1506/12384 [3:11:43<23:12:17, 7.68s/it, loss=0.0003, acc=0.9998, iter_time=10.01s]
Epoch 1: 12%|█▏ | 1506/12384 [3:11:50<23:12:17, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 1: 12%|█▏ | 1507/12384 [3:11:50<23:08:23, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 1: 12%|█▏ | 1507/12384 [3:11:58<23:08:23, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.95s]
Epoch 1: 12%|█▏ | 1508/12384 [3:11:58<23:04:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.95s]
Epoch 1: 12%|█▏ | 1508/12384 [3:12:05<23:04:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 12%|█▏ | 1509/12384 [3:12:05<23:04:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 12%|█▏ | 1509/12384 [3:12:13<23:04:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 12%|█▏ | 1510/12384 [3:12:13<23:02:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 12%|█▏ | 1510/12384 [3:12:21<23:02:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 12%|█▏ | 1511/12384 [3:12:21<23:01:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 12%|█▏ | 1511/12384 [3:12:28<23:01:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 12%|█▏ | 1512/12384 [3:12:28<22:59:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 12%|█▏ | 1512/12384 [3:12:36<22:59:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 12%|█▏ | 1513/12384 [3:12:36<23:02:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 12%|█▏ | 1513/12384 [3:12:44<23:02:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.83s]
Epoch 1: 12%|█▏ | 1514/12384 [3:12:44<23:01:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.83s]
Epoch 1: 12%|█▏ | 1514/12384 [3:12:51<23:01:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.48s]
Epoch 1: 12%|█▏ | 1515/12384 [3:12:51<23:01:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.48s]
Epoch 1: 12%|█▏ | 1515/12384 [3:12:59<23:01:15, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=8.00s]
Epoch 1: 12%|█▏ | 1516/12384 [3:12:59<22:59:13, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=8.00s]
Epoch 1: 12%|█▏ | 1516/12384 [3:13:06<22:59:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 1: 12%|█▏ | 1517/12384 [3:13:06<22:57:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 1: 12%|█▏ | 1517/12384 [3:13:14<22:57:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 1: 12%|█▏ | 1518/12384 [3:13:14<23:00:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 1: 12%|█▏ | 1518/12384 [3:13:22<23:00:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 12%|█▏ | 1519/12384 [3:13:22<22:58:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 12%|█▏ | 1519/12384 [3:13:29<22:58:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 12%|█▏ | 1520/12384 [3:13:29<22:59:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 12%|█▏ | 1520/12384 [3:13:37<22:59:26, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=7.52s]
Epoch 1: 12%|█▏ | 1521/12384 [3:13:37<23:12:49, 7.69s/it, loss=0.0001, acc=0.9998, iter_time=7.52s]
Epoch 1: 12%|█▏ | 1521/12384 [3:13:45<23:12:49, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=3.37s]
Epoch 1: 12%|█▏ | 1522/12384 [3:13:45<23:07:41, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=3.37s]
Epoch 1: 12%|█▏ | 1522/12384 [3:13:52<23:07:41, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.30s]
Epoch 1: 12%|█▏ | 1523/12384 [3:13:52<23:03:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.30s]
Epoch 1: 12%|█▏ | 1523/12384 [3:14:00<23:03:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.11s]
Epoch 1: 12%|█▏ | 1524/12384 [3:14:00<23:00:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.11s]
Epoch 1: 12%|█▏ | 1524/12384 [3:14:07<23:00:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.06s]
Epoch 1: 12%|█▏ | 1525/12384 [3:14:07<22:58:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.06s]
Epoch 1: 12%|█▏ | 1525/12384 [3:14:15<22:58:36, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.73s]
Epoch 1: 12%|█▏ | 1526/12384 [3:14:15<22:58:31, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.73s]
Epoch 1: 12%|█▏ | 1526/12384 [3:14:23<22:58:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.02s]
Epoch 1: 12%|█▏ | 1527/12384 [3:14:23<22:59:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.02s]
Epoch 1: 12%|█▏ | 1527/12384 [3:14:30<22:59:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 12%|█▏ | 1528/12384 [3:14:30<22:58:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 12%|█▏ | 1528/12384 [3:14:38<22:58:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.42s]
Epoch 1: 12%|█▏ | 1529/12384 [3:14:38<22:59:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.42s]
Epoch 1: 12%|█▏ | 1529/12384 [3:14:46<22:59:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.49s]
Epoch 1: 12%|█▏ | 1530/12384 [3:14:46<23:17:18, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.49s]
Epoch 1: 12%|█▏ | 1530/12384 [3:14:54<23:17:18, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 12%|█▏ | 1531/12384 [3:14:54<23:10:55, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 12%|█▏ | 1531/12384 [3:15:01<23:10:55, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 12%|█▏ | 1532/12384 [3:15:01<23:06:24, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 12%|█▏ | 1532/12384 [3:15:09<23:06:24, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 1: 12%|█▏ | 1533/12384 [3:15:09<23:03:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 1: 12%|█▏ | 1533/12384 [3:15:16<23:03:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.14s]
Epoch 1: 12%|█▏ | 1534/12384 [3:15:16<23:00:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.14s]
Epoch 1: 12%|█▏ | 1534/12384 [3:15:24<23:00:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 12%|█▏ | 1535/12384 [3:15:24<23:02:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 12%|█▏ | 1535/12384 [3:15:32<23:02:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 1: 12%|█▏ | 1536/12384 [3:15:32<23:01:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 1: 12%|█▏ | 1536/12384 [3:15:39<23:01:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 12%|█▏ | 1537/12384 [3:15:39<22:57:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 12%|█▏ | 1537/12384 [3:15:47<22:57:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 1: 12%|█▏ | 1538/12384 [3:15:47<22:56:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 1: 12%|█▏ | 1538/12384 [3:15:54<22:56:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.11s]
Epoch 1: 12%|█▏ | 1539/12384 [3:15:54<22:55:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.11s]
Epoch 1: 12%|█▏ | 1539/12384 [3:16:02<22:55:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 12%|█▏ | 1540/12384 [3:16:02<22:54:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 12%|█▏ | 1540/12384 [3:16:10<22:54:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 12%|█▏ | 1541/12384 [3:16:10<22:55:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 12%|█▏ | 1541/12384 [3:16:17<22:55:13, 7.61s/it, loss=0.0000, acc=0.9999, iter_time=7.63s]
Epoch 1: 12%|█▏ | 1542/12384 [3:16:17<22:54:29, 7.61s/it, loss=0.0000, acc=0.9999, iter_time=7.63s]
Epoch 1: 12%|█▏ | 1542/12384 [3:16:25<22:54:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 1: 12%|█▏ | 1543/12384 [3:16:25<22:55:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 1: 12%|█▏ | 1543/12384 [3:16:33<22:55:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.20s]
Epoch 1: 12%|█▏ | 1544/12384 [3:16:33<22:55:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.20s]
Epoch 1: 12%|█▏ | 1544/12384 [3:16:40<22:55:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 12%|█▏ | 1545/12384 [3:16:40<22:54:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 12%|█▏ | 1545/12384 [3:16:48<22:54:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 1: 12%|█▏ | 1546/12384 [3:16:48<22:54:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 1: 12%|█▏ | 1546/12384 [3:16:56<22:54:38, 7.61s/it, loss=0.0011, acc=0.9981, iter_time=9.70s]
Epoch 1: 12%|█▏ | 1547/12384 [3:16:56<23:09:46, 7.69s/it, loss=0.0011, acc=0.9981, iter_time=9.70s]
Epoch 1: 12%|█▏ | 1547/12384 [3:17:03<23:09:46, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 1: 12%|█▎ | 1548/12384 [3:17:03<23:05:21, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 1: 12%|█▎ | 1548/12384 [3:17:11<23:05:21, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 1: 13%|█▎ | 1549/12384 [3:17:11<23:04:52, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 1: 13%|█▎ | 1549/12384 [3:17:18<23:04:52, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 1: 13%|█▎ | 1550/12384 [3:17:18<22:59:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 1: 13%|█▎ | 1550/12384 [3:17:26<22:59:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 1: 13%|█▎ | 1551/12384 [3:17:26<23:01:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 1: 13%|█▎ | 1551/12384 [3:17:34<23:01:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 13%|█▎ | 1552/12384 [3:17:34<22:58:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 13%|█▎ | 1552/12384 [3:17:41<22:58:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 13%|█▎ | 1553/12384 [3:17:41<22:56:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 13%|█▎ | 1553/12384 [3:17:49<22:56:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 1: 13%|█▎ | 1554/12384 [3:17:49<22:54:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 1: 13%|█▎ | 1554/12384 [3:17:57<22:54:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.00s]
Epoch 1: 13%|█▎ | 1555/12384 [3:17:57<22:53:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.00s]
Epoch 1: 13%|█▎ | 1555/12384 [3:18:04<22:53:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.46s]
Epoch 1: 13%|█▎ | 1556/12384 [3:18:04<22:53:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.46s]
Epoch 1: 13%|█▎ | 1556/12384 [3:18:12<22:53:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.11s]
Epoch 1: 13%|█▎ | 1557/12384 [3:18:12<23:08:30, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.11s]
Epoch 1: 13%|█▎ | 1557/12384 [3:18:20<23:08:30, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.39s]
Epoch 1: 13%|█▎ | 1558/12384 [3:18:20<23:04:04, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.39s]
Epoch 1: 13%|█▎ | 1558/12384 [3:18:27<23:04:04, 7.67s/it, loss=0.0001, acc=0.9991, iter_time=4.77s]
Epoch 1: 13%|█▎ | 1559/12384 [3:18:27<22:59:53, 7.65s/it, loss=0.0001, acc=0.9991, iter_time=4.77s]
Epoch 1: 13%|█▎ | 1559/12384 [3:18:35<22:59:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.82s]
Epoch 1: 13%|█▎ | 1560/12384 [3:18:35<22:56:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.82s]
Epoch 1: 13%|█▎ | 1560/12384 [3:18:42<22:56:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 13%|█▎ | 1561/12384 [3:18:42<22:55:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 13%|█▎ | 1561/12384 [3:18:50<22:55:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 13%|█▎ | 1562/12384 [3:18:50<22:55:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 13%|█▎ | 1562/12384 [3:18:58<22:55:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 13%|█▎ | 1563/12384 [3:18:58<22:54:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 13%|█▎ | 1563/12384 [3:19:05<22:54:10, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=7.61s]
Epoch 1: 13%|█▎ | 1564/12384 [3:19:05<22:52:51, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=7.61s]
Epoch 1: 13%|█▎ | 1564/12384 [3:19:13<22:52:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 13%|█▎ | 1565/12384 [3:19:13<22:52:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 13%|█▎ | 1565/12384 [3:19:20<22:52:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 13%|█▎ | 1566/12384 [3:19:20<22:52:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 13%|█▎ | 1566/12384 [3:19:28<22:52:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.46s]
Epoch 1: 13%|█▎ | 1567/12384 [3:19:28<22:52:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.46s]
Epoch 1: 13%|█▎ | 1567/12384 [3:19:36<22:52:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.76s]
Epoch 1: 13%|█▎ | 1568/12384 [3:19:36<22:52:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.76s]
Epoch 1: 13%|█▎ | 1568/12384 [3:19:43<22:52:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.61s]
Epoch 1: 13%|█▎ | 1569/12384 [3:19:43<22:51:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.61s]
Epoch 1: 13%|█▎ | 1569/12384 [3:19:51<22:51:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 1: 13%|█▎ | 1570/12384 [3:19:51<22:50:24, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 1: 13%|█▎ | 1570/12384 [3:19:59<22:50:24, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 1: 13%|█▎ | 1571/12384 [3:19:59<22:50:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 1: 13%|█▎ | 1571/12384 [3:20:06<22:50:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.56s]
Epoch 1: 13%|█▎ | 1572/12384 [3:20:06<22:49:50, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.56s]
Epoch 1: 13%|█▎ | 1572/12384 [3:20:14<22:49:50, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.24s]
Epoch 1: 13%|█▎ | 1573/12384 [3:20:14<23:03:46, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=11.24s]
Epoch 1: 13%|█▎ | 1573/12384 [3:20:22<23:03:46, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 13%|█▎ | 1574/12384 [3:20:22<22:58:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 13%|█▎ | 1574/12384 [3:20:29<22:58:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 13%|█▎ | 1575/12384 [3:20:29<22:54:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 13%|█▎ | 1575/12384 [3:20:37<22:54:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 13%|█▎ | 1576/12384 [3:20:37<22:53:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 13%|█▎ | 1576/12384 [3:20:44<22:53:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.40s]
Epoch 1: 13%|█▎ | 1577/12384 [3:20:44<22:52:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.40s]
Epoch 1: 13%|█▎ | 1577/12384 [3:20:52<22:52:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.41s]
Epoch 1: 13%|█▎ | 1578/12384 [3:20:52<22:51:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.41s]
Epoch 1: 13%|█▎ | 1578/12384 [3:21:00<22:51:49, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.55s]
Epoch 1: 13%|█▎ | 1579/12384 [3:21:00<22:50:02, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.55s]
Epoch 1: 13%|█▎ | 1579/12384 [3:21:07<22:50:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.79s]
Epoch 1: 13%|█▎ | 1580/12384 [3:21:07<22:50:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.79s]
Epoch 1: 13%|█▎ | 1580/12384 [3:21:15<22:50:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 1: 13%|█▎ | 1581/12384 [3:21:15<22:49:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 1: 13%|█▎ | 1581/12384 [3:21:22<22:49:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 13%|█▎ | 1582/12384 [3:21:22<22:49:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 13%|█▎ | 1582/12384 [3:21:30<22:49:45, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.10s]
Epoch 1: 13%|█▎ | 1583/12384 [3:21:30<23:08:27, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=5.10s]
Epoch 1: 13%|█▎ | 1583/12384 [3:21:38<23:08:27, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.86s]
Epoch 1: 13%|█▎ | 1584/12384 [3:21:38<23:03:27, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.86s]
Epoch 1: 13%|█▎ | 1584/12384 [3:21:46<23:03:27, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 13%|█▎ | 1585/12384 [3:21:46<22:58:13, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 13%|█▎ | 1585/12384 [3:21:53<22:58:13, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 13%|█▎ | 1586/12384 [3:21:53<23:00:59, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 13%|█▎ | 1586/12384 [3:22:01<23:00:59, 7.67s/it, loss=0.0001, acc=0.9998, iter_time=7.70s]
Epoch 1: 13%|█▎ | 1587/12384 [3:22:01<22:59:04, 7.66s/it, loss=0.0001, acc=0.9998, iter_time=7.70s]
Epoch 1: 13%|█▎ | 1587/12384 [3:22:09<22:59:04, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 13%|█▎ | 1588/12384 [3:22:09<22:56:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 13%|█▎ | 1588/12384 [3:22:16<22:56:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 1: 13%|█▎ | 1589/12384 [3:22:16<22:53:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 1: 13%|█▎ | 1589/12384 [3:22:24<22:53:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 1: 13%|█▎ | 1590/12384 [3:22:24<22:52:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 1: 13%|█▎ | 1590/12384 [3:22:31<22:52:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.10s]
Epoch 1: 13%|█▎ | 1591/12384 [3:22:31<22:51:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.10s]
Epoch 1: 13%|█▎ | 1591/12384 [3:22:39<22:51:13, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=11.52s]
Epoch 1: 13%|█▎ | 1592/12384 [3:22:39<22:51:14, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=11.52s]
Epoch 1: 13%|█▎ | 1592/12384 [3:22:47<22:51:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.17s]
Epoch 1: 13%|█▎ | 1593/12384 [3:22:47<22:51:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.17s]
Epoch 1: 13%|█▎ | 1593/12384 [3:22:54<22:51:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 1: 13%|█▎ | 1594/12384 [3:22:54<22:49:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 1: 13%|█▎ | 1594/12384 [3:23:02<22:49:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 1: 13%|█▎ | 1595/12384 [3:23:02<22:49:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 1: 13%|█▎ | 1595/12384 [3:23:09<22:49:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 1: 13%|█▎ | 1596/12384 [3:23:09<22:50:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 1: 13%|█▎ | 1596/12384 [3:23:17<22:50:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.21s]
Epoch 1: 13%|█▎ | 1597/12384 [3:23:17<22:47:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.21s]
Epoch 1: 13%|█▎ | 1597/12384 [3:23:25<22:47:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 1: 13%|█▎ | 1598/12384 [3:23:25<22:48:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 1: 13%|█▎ | 1598/12384 [3:23:32<22:48:24, 7.61s/it, loss=0.0003, acc=0.9977, iter_time=4.62s]
Epoch 1: 13%|█▎ | 1599/12384 [3:23:32<22:48:27, 7.61s/it, loss=0.0003, acc=0.9977, iter_time=4.62s]
Epoch 1: 13%|█▎ | 1599/12384 [3:23:40<22:48:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.02s]
Epoch 1: 13%|█▎ | 1600/12384 [3:23:40<22:47:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.02s]
Epoch 1: 13%|█▎ | 1600/12384 [3:23:47<22:47:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 13%|█▎ | 1601/12384 [3:23:47<22:48:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 13%|█▎ | 1601/12384 [3:23:55<22:48:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 13%|█▎ | 1602/12384 [3:23:55<22:47:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 13%|█▎ | 1602/12384 [3:24:03<22:47:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 13%|█▎ | 1603/12384 [3:24:03<22:46:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 13%|█▎ | 1603/12384 [3:24:10<22:46:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 13%|█▎ | 1604/12384 [3:24:10<22:46:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 13%|█▎ | 1604/12384 [3:24:18<22:46:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 13%|█▎ | 1605/12384 [3:24:18<22:47:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 13%|█▎ | 1605/12384 [3:24:26<22:47:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 13%|█▎ | 1606/12384 [3:24:26<22:46:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 13%|█▎ | 1606/12384 [3:24:33<22:46:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 13%|█▎ | 1607/12384 [3:24:33<22:46:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 13%|█▎ | 1607/12384 [3:24:41<22:46:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 13%|█▎ | 1608/12384 [3:24:41<22:50:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 13%|█▎ | 1608/12384 [3:24:49<22:50:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 1: 13%|█▎ | 1609/12384 [3:24:49<23:08:11, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 1: 13%|█▎ | 1609/12384 [3:24:56<23:08:11, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 1: 13%|█▎ | 1610/12384 [3:24:56<23:01:32, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 1: 13%|█▎ | 1610/12384 [3:25:04<23:01:32, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 1: 13%|█▎ | 1611/12384 [3:25:04<22:59:09, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 1: 13%|█▎ | 1611/12384 [3:25:12<22:59:09, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 1: 13%|█▎ | 1612/12384 [3:25:12<22:55:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 1: 13%|█▎ | 1612/12384 [3:25:19<22:55:01, 7.66s/it, loss=0.0009, acc=0.9982, iter_time=9.08s]
Epoch 1: 13%|█▎ | 1613/12384 [3:25:19<22:51:34, 7.64s/it, loss=0.0009, acc=0.9982, iter_time=9.08s]
Epoch 1: 13%|█▎ | 1613/12384 [3:25:27<22:51:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 13%|█▎ | 1614/12384 [3:25:27<22:49:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 13%|█▎ | 1614/12384 [3:25:34<22:49:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 13%|█▎ | 1615/12384 [3:25:34<22:49:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 13%|█▎ | 1615/12384 [3:25:42<22:49:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 13%|█▎ | 1616/12384 [3:25:42<22:58:36, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 13%|█▎ | 1616/12384 [3:25:50<22:58:36, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 1: 13%|█▎ | 1617/12384 [3:25:50<22:54:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 1: 13%|█▎ | 1617/12384 [3:25:57<22:54:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 1: 13%|█▎ | 1618/12384 [3:25:57<22:51:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 1: 13%|█▎ | 1618/12384 [3:26:05<22:51:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 1: 13%|█▎ | 1619/12384 [3:26:05<22:50:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 1: 13%|█▎ | 1619/12384 [3:26:12<22:50:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.05s]
Epoch 1: 13%|█▎ | 1620/12384 [3:26:12<22:10:26, 7.42s/it, loss=0.0000, acc=1.0000, iter_time=5.05s]
Epoch 1: 13%|█▎ | 1620/12384 [3:26:20<22:10:26, 7.42s/it, loss=0.0000, acc=1.0000, iter_time=9.80s]
Epoch 1: 13%|█▎ | 1621/12384 [3:26:20<22:20:01, 7.47s/it, loss=0.0000, acc=1.0000, iter_time=9.80s]
Epoch 1: 13%|█▎ | 1621/12384 [3:26:27<22:20:01, 7.47s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 13%|█▎ | 1622/12384 [3:26:27<22:26:50, 7.51s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 13%|█▎ | 1622/12384 [3:26:35<22:26:50, 7.51s/it, loss=0.0000, acc=1.0000, iter_time=4.73s]
Epoch 1: 13%|█▎ | 1623/12384 [3:26:35<22:31:12, 7.53s/it, loss=0.0000, acc=1.0000, iter_time=4.73s]
Epoch 1: 13%|█▎ | 1623/12384 [3:26:42<22:31:12, 7.53s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 1: 13%|█▎ | 1624/12384 [3:26:42<22:37:44, 7.57s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 1: 13%|█▎ | 1624/12384 [3:26:50<22:37:44, 7.57s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 13%|█▎ | 1625/12384 [3:26:50<22:39:11, 7.58s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 13%|█▎ | 1625/12384 [3:26:58<22:39:11, 7.58s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 13%|█▎ | 1626/12384 [3:26:58<22:55:50, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 13%|█▎ | 1626/12384 [3:27:06<22:55:50, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 13%|█▎ | 1627/12384 [3:27:06<22:52:50, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 13%|█▎ | 1627/12384 [3:27:13<22:52:50, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.58s]
Epoch 1: 13%|█▎ | 1628/12384 [3:27:13<22:50:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.58s]
Epoch 1: 13%|█▎ | 1628/12384 [3:27:21<22:50:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 13%|█▎ | 1629/12384 [3:27:21<22:49:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 13%|█▎ | 1629/12384 [3:27:28<22:49:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 1: 13%|█▎ | 1630/12384 [3:27:28<22:47:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 1: 13%|█▎ | 1630/12384 [3:27:36<22:47:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 1: 13%|█▎ | 1631/12384 [3:27:36<22:42:31, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 1: 13%|█▎ | 1631/12384 [3:27:44<22:42:31, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.25s]
Epoch 1: 13%|█▎ | 1632/12384 [3:27:44<22:43:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.25s]
Epoch 1: 13%|█▎ | 1632/12384 [3:27:51<22:43:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 13%|█▎ | 1633/12384 [3:27:51<22:42:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 13%|█▎ | 1633/12384 [3:27:59<22:42:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 13%|█▎ | 1634/12384 [3:27:59<22:44:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 13%|█▎ | 1634/12384 [3:28:07<22:44:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 13%|█▎ | 1635/12384 [3:28:07<23:05:10, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 13%|█▎ | 1635/12384 [3:28:14<23:05:10, 7.73s/it, loss=0.0007, acc=1.0000, iter_time=6.44s]
Epoch 1: 13%|█▎ | 1636/12384 [3:28:14<22:57:58, 7.69s/it, loss=0.0007, acc=1.0000, iter_time=6.44s]
Epoch 1: 13%|█▎ | 1636/12384 [3:28:22<22:57:58, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 13%|█▎ | 1637/12384 [3:28:22<22:53:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 13%|█▎ | 1637/12384 [3:28:30<22:53:15, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=9.68s]
Epoch 1: 13%|█▎ | 1638/12384 [3:28:30<22:50:45, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=9.68s]
Epoch 1: 13%|█▎ | 1638/12384 [3:28:37<22:50:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 13%|█▎ | 1639/12384 [3:28:37<22:49:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 13%|█▎ | 1639/12384 [3:28:45<22:49:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 13%|█▎ | 1640/12384 [3:28:45<22:48:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 13%|█▎ | 1640/12384 [3:28:52<22:48:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 1: 13%|█▎ | 1641/12384 [3:28:52<22:44:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 1: 13%|█▎ | 1641/12384 [3:29:00<22:44:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 1: 13%|█▎ | 1642/12384 [3:29:00<22:43:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 1: 13%|█▎ | 1642/12384 [3:29:08<22:43:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 13%|█▎ | 1643/12384 [3:29:08<22:44:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 13%|█▎ | 1643/12384 [3:29:15<22:44:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.10s]
Epoch 1: 13%|█▎ | 1644/12384 [3:29:15<22:44:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.10s]
Epoch 1: 13%|█▎ | 1644/12384 [3:29:23<22:44:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.14s]
Epoch 1: 13%|█▎ | 1645/12384 [3:29:23<22:44:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.14s]
Epoch 1: 13%|█▎ | 1645/12384 [3:29:31<22:44:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 13%|█▎ | 1646/12384 [3:29:31<22:44:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 13%|█▎ | 1646/12384 [3:29:38<22:44:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 1: 13%|█▎ | 1647/12384 [3:29:38<22:44:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 1: 13%|█▎ | 1647/12384 [3:29:46<22:44:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.14s]
Epoch 1: 13%|█▎ | 1648/12384 [3:29:46<22:43:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.14s]
Epoch 1: 13%|█▎ | 1648/12384 [3:29:53<22:43:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 13%|█▎ | 1649/12384 [3:29:53<22:43:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 13%|█▎ | 1649/12384 [3:30:01<22:43:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 1: 13%|█▎ | 1650/12384 [3:30:01<22:43:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 1: 13%|█▎ | 1650/12384 [3:30:09<22:43:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.19s]
Epoch 1: 13%|█▎ | 1651/12384 [3:30:09<22:41:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.19s]
Epoch 1: 13%|█▎ | 1651/12384 [3:30:16<22:41:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 1: 13%|█▎ | 1652/12384 [3:30:16<22:40:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 1: 13%|█▎ | 1652/12384 [3:30:24<22:40:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 1: 13%|█▎ | 1653/12384 [3:30:24<22:40:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 1: 13%|█▎ | 1653/12384 [3:30:31<22:40:13, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.36s]
Epoch 1: 13%|█▎ | 1654/12384 [3:30:31<22:39:45, 7.60s/it, loss=0.0002, acc=1.0000, iter_time=7.36s]
Epoch 1: 13%|█▎ | 1654/12384 [3:30:39<22:39:45, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.14s]
Epoch 1: 13%|█▎ | 1655/12384 [3:30:39<22:40:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.14s]
Epoch 1: 13%|█▎ | 1655/12384 [3:30:47<22:40:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 13%|█▎ | 1656/12384 [3:30:47<22:40:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 13%|█▎ | 1656/12384 [3:30:54<22:40:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 13%|█▎ | 1657/12384 [3:30:54<22:40:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 13%|█▎ | 1657/12384 [3:31:02<22:40:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 13%|█▎ | 1658/12384 [3:31:02<22:40:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 13%|█▎ | 1658/12384 [3:31:10<22:40:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 13%|█▎ | 1659/12384 [3:31:10<22:39:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 13%|█▎ | 1659/12384 [3:31:17<22:39:09, 7.60s/it, loss=0.0001, acc=0.9992, iter_time=7.59s]
Epoch 1: 13%|█▎ | 1660/12384 [3:31:17<22:38:26, 7.60s/it, loss=0.0001, acc=0.9992, iter_time=7.59s]
Epoch 1: 13%|█▎ | 1660/12384 [3:31:25<22:38:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 1: 13%|█▎ | 1661/12384 [3:31:25<22:54:57, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 1: 13%|█▎ | 1661/12384 [3:31:33<22:54:57, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 13%|█▎ | 1662/12384 [3:31:33<22:50:43, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 13%|█▎ | 1662/12384 [3:31:40<22:50:43, 7.67s/it, loss=0.0007, acc=0.9976, iter_time=7.62s]
Epoch 1: 13%|█▎ | 1663/12384 [3:31:40<22:46:35, 7.65s/it, loss=0.0007, acc=0.9976, iter_time=7.62s]
Epoch 1: 13%|█▎ | 1663/12384 [3:31:48<22:46:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 13%|█▎ | 1664/12384 [3:31:48<22:44:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 13%|█▎ | 1664/12384 [3:31:55<22:44:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 13%|█▎ | 1665/12384 [3:31:55<22:43:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 13%|█▎ | 1665/12384 [3:32:03<22:43:39, 7.63s/it, loss=0.0005, acc=0.9989, iter_time=8.05s]
Epoch 1: 13%|█▎ | 1666/12384 [3:32:03<22:42:53, 7.63s/it, loss=0.0005, acc=0.9989, iter_time=8.05s]
Epoch 1: 13%|█▎ | 1666/12384 [3:32:11<22:42:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.01s]
Epoch 1: 13%|█▎ | 1667/12384 [3:32:11<22:40:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.01s]
Epoch 1: 13%|█▎ | 1667/12384 [3:32:18<22:40:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.92s]
Epoch 1: 13%|█▎ | 1668/12384 [3:32:18<22:43:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.92s]
Epoch 1: 13%|█▎ | 1668/12384 [3:32:26<22:43:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.53s]
Epoch 1: 13%|█▎ | 1669/12384 [3:32:26<22:42:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.53s]
Epoch 1: 13%|█▎ | 1669/12384 [3:32:34<22:42:14, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.61s]
Epoch 1: 13%|█▎ | 1670/12384 [3:32:34<22:39:46, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=7.61s]
Epoch 1: 13%|█▎ | 1670/12384 [3:32:41<22:39:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.20s]
Epoch 1: 13%|█▎ | 1671/12384 [3:32:41<22:39:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.20s]
Epoch 1: 13%|█▎ | 1671/12384 [3:32:49<22:39:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.38s]
Epoch 1: 14%|█▎ | 1672/12384 [3:32:49<22:38:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.38s]
Epoch 1: 14%|█▎ | 1672/12384 [3:32:56<22:38:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.43s]
Epoch 1: 14%|█▎ | 1673/12384 [3:32:56<22:41:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.43s]
Epoch 1: 14%|█▎ | 1673/12384 [3:33:04<22:41:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 1: 14%|█▎ | 1674/12384 [3:33:04<22:40:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 1: 14%|█▎ | 1674/12384 [3:33:12<22:40:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 14%|█▎ | 1675/12384 [3:33:12<22:39:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 14%|█▎ | 1675/12384 [3:33:19<22:39:58, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.38s]
Epoch 1: 14%|█▎ | 1676/12384 [3:33:19<22:38:56, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.38s]
Epoch 1: 14%|█▎ | 1676/12384 [3:33:27<22:38:56, 7.61s/it, loss=0.0035, acc=0.9978, iter_time=8.81s]
Epoch 1: 14%|█▎ | 1677/12384 [3:33:27<22:38:40, 7.61s/it, loss=0.0035, acc=0.9978, iter_time=8.81s]
Epoch 1: 14%|█▎ | 1677/12384 [3:33:34<22:38:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 14%|█▎ | 1678/12384 [3:33:34<22:38:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 14%|█▎ | 1678/12384 [3:33:42<22:38:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 14%|█▎ | 1679/12384 [3:33:42<22:38:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 14%|█▎ | 1679/12384 [3:33:50<22:38:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 14%|█▎ | 1680/12384 [3:33:50<22:38:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 14%|█▎ | 1680/12384 [3:33:57<22:38:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 14%|█▎ | 1681/12384 [3:33:57<22:37:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 14%|█▎ | 1681/12384 [3:34:05<22:37:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 1: 14%|█▎ | 1682/12384 [3:34:05<22:37:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 1: 14%|█▎ | 1682/12384 [3:34:13<22:37:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 1: 14%|█▎ | 1683/12384 [3:34:13<22:37:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 1: 14%|█▎ | 1683/12384 [3:34:20<22:37:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 14%|█▎ | 1684/12384 [3:34:20<22:38:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 14%|█▎ | 1684/12384 [3:34:28<22:38:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 14%|█▎ | 1685/12384 [3:34:28<22:36:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 14%|█▎ | 1685/12384 [3:34:35<22:36:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 1: 14%|█▎ | 1686/12384 [3:34:35<22:36:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 1: 14%|█▎ | 1686/12384 [3:34:43<22:36:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.71s]
Epoch 1: 14%|█▎ | 1687/12384 [3:34:43<22:34:39, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.71s]
Epoch 1: 14%|█▎ | 1687/12384 [3:34:51<22:34:39, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 14%|█▎ | 1688/12384 [3:34:51<22:52:32, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 14%|█▎ | 1688/12384 [3:34:58<22:52:32, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 14%|█▎ | 1689/12384 [3:34:58<22:27:22, 7.56s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 14%|█▎ | 1689/12384 [3:35:06<22:27:22, 7.56s/it, loss=0.0000, acc=1.0000, iter_time=8.44s]
Epoch 1: 14%|█▎ | 1690/12384 [3:35:06<22:28:36, 7.57s/it, loss=0.0000, acc=1.0000, iter_time=8.44s]
Epoch 1: 14%|█▎ | 1690/12384 [3:35:13<22:28:36, 7.57s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 1: 14%|█▎ | 1691/12384 [3:35:13<22:30:03, 7.58s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 1: 14%|█▎ | 1691/12384 [3:35:21<22:30:03, 7.58s/it, loss=0.0001, acc=1.0000, iter_time=7.56s]
Epoch 1: 14%|█▎ | 1692/12384 [3:35:21<22:30:02, 7.58s/it, loss=0.0001, acc=1.0000, iter_time=7.56s]
Epoch 1: 14%|█▎ | 1692/12384 [3:35:28<22:30:02, 7.58s/it, loss=0.0002, acc=0.9989, iter_time=9.38s]
Epoch 1: 14%|█▎ | 1693/12384 [3:35:28<22:30:55, 7.58s/it, loss=0.0002, acc=0.9989, iter_time=9.38s]
Epoch 1: 14%|█▎ | 1693/12384 [3:35:36<22:30:55, 7.58s/it, loss=0.0012, acc=0.9979, iter_time=6.37s]
Epoch 1: 14%|█▎ | 1694/12384 [3:35:36<22:32:05, 7.59s/it, loss=0.0012, acc=0.9979, iter_time=6.37s]
Epoch 1: 14%|█▎ | 1694/12384 [3:35:44<22:32:05, 7.59s/it, loss=0.0002, acc=0.9994, iter_time=5.54s]
Epoch 1: 14%|█▎ | 1695/12384 [3:35:44<22:33:40, 7.60s/it, loss=0.0002, acc=0.9994, iter_time=5.54s]
Epoch 1: 14%|█▎ | 1695/12384 [3:35:51<22:33:40, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.29s]
Epoch 1: 14%|█▎ | 1696/12384 [3:35:51<22:34:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.29s]
Epoch 1: 14%|█▎ | 1696/12384 [3:35:59<22:34:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=3.39s]
Epoch 1: 14%|█▎ | 1697/12384 [3:35:59<22:33:45, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=3.39s]
Epoch 1: 14%|█▎ | 1697/12384 [3:36:06<22:33:45, 7.60s/it, loss=0.0002, acc=1.0000, iter_time=11.45s]
Epoch 1: 14%|█▎ | 1698/12384 [3:36:06<22:33:30, 7.60s/it, loss=0.0002, acc=1.0000, iter_time=11.45s]
Epoch 1: 14%|█▎ | 1698/12384 [3:36:14<22:33:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 14%|█▎ | 1699/12384 [3:36:14<22:35:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 14%|█▎ | 1699/12384 [3:36:22<22:35:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 14%|█▎ | 1700/12384 [3:36:22<22:35:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 14%|█▎ | 1700/12384 [3:36:29<22:35:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.88s]
Epoch 1: 14%|█▎ | 1701/12384 [3:36:29<22:35:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.88s]
Epoch 1: 14%|█▎ | 1701/12384 [3:36:37<22:35:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.36s]
Epoch 1: 14%|█▎ | 1702/12384 [3:36:37<22:35:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.36s]
Epoch 1: 14%|█▎ | 1702/12384 [3:36:45<22:35:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 14%|█▍ | 1703/12384 [3:36:45<22:34:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 14%|█▍ | 1703/12384 [3:36:52<22:34:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 14%|█▍ | 1704/12384 [3:36:52<22:34:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 14%|█▍ | 1704/12384 [3:37:00<22:34:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 14%|█▍ | 1705/12384 [3:37:00<22:34:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 14%|█▍ | 1705/12384 [3:37:08<22:34:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 14%|█▍ | 1706/12384 [3:37:08<22:51:23, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 14%|█▍ | 1706/12384 [3:37:15<22:51:23, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 14%|█▍ | 1707/12384 [3:37:15<22:45:40, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 14%|█▍ | 1707/12384 [3:37:23<22:45:40, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 1: 14%|█▍ | 1708/12384 [3:37:23<22:40:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 1: 14%|█▍ | 1708/12384 [3:37:31<22:40:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 1: 14%|█▍ | 1709/12384 [3:37:31<22:38:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 1: 14%|█▍ | 1709/12384 [3:37:38<22:38:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 14%|█▍ | 1710/12384 [3:37:38<22:36:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 14%|█▍ | 1710/12384 [3:37:46<22:36:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 14%|█▍ | 1711/12384 [3:37:46<22:36:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 14%|█▍ | 1711/12384 [3:37:53<22:36:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 14%|█▍ | 1712/12384 [3:37:53<22:36:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 14%|█▍ | 1712/12384 [3:38:01<22:36:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 1: 14%|█▍ | 1713/12384 [3:38:01<22:35:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 1: 14%|█▍ | 1713/12384 [3:38:09<22:35:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.88s]
Epoch 1: 14%|█▍ | 1714/12384 [3:38:09<22:52:26, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.88s]
Epoch 1: 14%|█▍ | 1714/12384 [3:38:17<22:52:26, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.00s]
Epoch 1: 14%|█▍ | 1715/12384 [3:38:17<22:47:55, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.00s]
Epoch 1: 14%|█▍ | 1715/12384 [3:38:24<22:47:55, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 14%|█▍ | 1716/12384 [3:38:24<22:43:26, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 14%|█▍ | 1716/12384 [3:38:32<22:43:26, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 14%|█▍ | 1717/12384 [3:38:32<22:39:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 14%|█▍ | 1717/12384 [3:38:39<22:39:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 14%|█▍ | 1718/12384 [3:38:39<22:37:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 14%|█▍ | 1718/12384 [3:38:47<22:37:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 14%|█▍ | 1719/12384 [3:38:47<22:35:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 14%|█▍ | 1719/12384 [3:38:55<22:35:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 14%|█▍ | 1720/12384 [3:38:55<22:33:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 14%|█▍ | 1720/12384 [3:39:02<22:33:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.64s]
Epoch 1: 14%|█▍ | 1721/12384 [3:39:02<22:33:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.64s]
Epoch 1: 14%|█▍ | 1721/12384 [3:39:10<22:33:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 14%|█▍ | 1722/12384 [3:39:10<22:33:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 14%|█▍ | 1722/12384 [3:39:17<22:33:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 1: 14%|█▍ | 1723/12384 [3:39:17<22:33:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 1: 14%|█▍ | 1723/12384 [3:39:25<22:33:21, 7.62s/it, loss=0.0001, acc=0.9995, iter_time=7.07s]
Epoch 1: 14%|█▍ | 1724/12384 [3:39:25<22:34:10, 7.62s/it, loss=0.0001, acc=0.9995, iter_time=7.07s]
Epoch 1: 14%|█▍ | 1724/12384 [3:39:33<22:34:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 1: 14%|█▍ | 1725/12384 [3:39:33<22:33:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 1: 14%|█▍ | 1725/12384 [3:39:40<22:33:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 14%|█▍ | 1726/12384 [3:39:40<22:33:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 14%|█▍ | 1726/12384 [3:39:48<22:33:01, 7.62s/it, loss=0.0004, acc=0.9976, iter_time=7.61s]
Epoch 1: 14%|█▍ | 1727/12384 [3:39:48<22:32:35, 7.62s/it, loss=0.0004, acc=0.9976, iter_time=7.61s]
Epoch 1: 14%|█▍ | 1727/12384 [3:39:55<22:32:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 14%|█▍ | 1728/12384 [3:39:55<22:30:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 14%|█▍ | 1728/12384 [3:40:03<22:30:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 14%|█▍ | 1729/12384 [3:40:03<22:30:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 14%|█▍ | 1729/12384 [3:40:11<22:30:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 14%|█▍ | 1730/12384 [3:40:11<22:35:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 14%|█▍ | 1730/12384 [3:40:18<22:35:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 14%|█▍ | 1731/12384 [3:40:18<22:33:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 14%|█▍ | 1731/12384 [3:40:26<22:33:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 1: 14%|█▍ | 1732/12384 [3:40:26<22:34:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 1: 14%|█▍ | 1732/12384 [3:40:34<22:34:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.83s]
Epoch 1: 14%|█▍ | 1733/12384 [3:40:34<22:53:55, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=9.83s]
Epoch 1: 14%|█▍ | 1733/12384 [3:40:42<22:53:55, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 14%|█▍ | 1734/12384 [3:40:42<22:47:02, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 14%|█▍ | 1734/12384 [3:40:49<22:47:02, 7.70s/it, loss=0.0001, acc=0.9998, iter_time=7.60s]
Epoch 1: 14%|█▍ | 1735/12384 [3:40:49<22:42:42, 7.68s/it, loss=0.0001, acc=0.9998, iter_time=7.60s]
Epoch 1: 14%|█▍ | 1735/12384 [3:40:57<22:42:42, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 14%|█▍ | 1736/12384 [3:40:57<22:39:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 14%|█▍ | 1736/12384 [3:41:05<22:39:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.21s]
Epoch 1: 14%|█▍ | 1737/12384 [3:41:05<22:40:26, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.21s]
Epoch 1: 14%|█▍ | 1737/12384 [3:41:12<22:40:26, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 1: 14%|█▍ | 1738/12384 [3:41:12<22:37:57, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 1: 14%|█▍ | 1738/12384 [3:41:20<22:37:57, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 14%|█▍ | 1739/12384 [3:41:20<22:35:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 14%|█▍ | 1739/12384 [3:41:27<22:35:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 14%|█▍ | 1740/12384 [3:41:27<22:33:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 14%|█▍ | 1740/12384 [3:41:35<22:33:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 14%|█▍ | 1741/12384 [3:41:35<22:50:09, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 14%|█▍ | 1741/12384 [3:41:43<22:50:09, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 14%|█▍ | 1742/12384 [3:41:43<22:42:58, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 14%|█▍ | 1742/12384 [3:41:51<22:42:58, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 14%|█▍ | 1743/12384 [3:41:51<22:39:31, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 14%|█▍ | 1743/12384 [3:41:58<22:39:31, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 14%|█▍ | 1744/12384 [3:41:58<22:36:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 14%|█▍ | 1744/12384 [3:42:06<22:36:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 14%|█▍ | 1745/12384 [3:42:06<22:34:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 14%|█▍ | 1745/12384 [3:42:13<22:34:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 14%|█▍ | 1746/12384 [3:42:13<22:35:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 14%|█▍ | 1746/12384 [3:42:21<22:35:09, 7.64s/it, loss=0.0008, acc=1.0000, iter_time=7.63s]
Epoch 1: 14%|█▍ | 1747/12384 [3:42:21<22:39:34, 7.67s/it, loss=0.0008, acc=1.0000, iter_time=7.63s]
Epoch 1: 14%|█▍ | 1747/12384 [3:42:29<22:39:34, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 1: 14%|█▍ | 1748/12384 [3:42:29<22:41:35, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 1: 14%|█▍ | 1748/12384 [3:42:36<22:41:35, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.92s]
Epoch 1: 14%|█▍ | 1749/12384 [3:42:36<22:36:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.92s]
Epoch 1: 14%|█▍ | 1749/12384 [3:42:44<22:36:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 1: 14%|█▍ | 1750/12384 [3:42:44<22:33:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 1: 14%|█▍ | 1750/12384 [3:42:52<22:33:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 1: 14%|█▍ | 1751/12384 [3:42:52<22:31:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 1: 14%|█▍ | 1751/12384 [3:42:59<22:31:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 14%|█▍ | 1752/12384 [3:42:59<22:34:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 14%|█▍ | 1752/12384 [3:43:07<22:34:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 14%|█▍ | 1753/12384 [3:43:07<22:30:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 14%|█▍ | 1753/12384 [3:43:15<22:30:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 14%|█▍ | 1754/12384 [3:43:15<22:29:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 14%|█▍ | 1754/12384 [3:43:22<22:29:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 1: 14%|█▍ | 1755/12384 [3:43:22<22:28:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 1: 14%|█▍ | 1755/12384 [3:43:30<22:28:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 1: 14%|█▍ | 1756/12384 [3:43:30<22:27:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 1: 14%|█▍ | 1756/12384 [3:43:37<22:27:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.88s]
Epoch 1: 14%|█▍ | 1757/12384 [3:43:37<22:26:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.88s]
Epoch 1: 14%|█▍ | 1757/12384 [3:43:45<22:26:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.16s]
Epoch 1: 14%|█▍ | 1758/12384 [3:43:45<22:26:01, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.16s]
Epoch 1: 14%|█▍ | 1758/12384 [3:43:53<22:26:01, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 14%|█▍ | 1759/12384 [3:43:53<22:41:20, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 14%|█▍ | 1759/12384 [3:44:00<22:41:20, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 14%|█▍ | 1760/12384 [3:44:00<22:36:42, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 14%|█▍ | 1760/12384 [3:44:08<22:36:42, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.22s]
Epoch 1: 14%|█▍ | 1761/12384 [3:44:08<22:34:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.22s]
Epoch 1: 14%|█▍ | 1761/12384 [3:44:16<22:34:08, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=9.06s]
Epoch 1: 14%|█▍ | 1762/12384 [3:44:16<22:32:23, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=9.06s]
Epoch 1: 14%|█▍ | 1762/12384 [3:44:23<22:32:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 1: 14%|█▍ | 1763/12384 [3:44:23<22:29:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 1: 14%|█▍ | 1763/12384 [3:44:31<22:29:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 14%|█▍ | 1764/12384 [3:44:31<22:31:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 14%|█▍ | 1764/12384 [3:44:39<22:31:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 14%|█▍ | 1765/12384 [3:44:39<22:30:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 14%|█▍ | 1765/12384 [3:44:46<22:30:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 14%|█▍ | 1766/12384 [3:44:46<22:27:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 14%|█▍ | 1766/12384 [3:44:54<22:27:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 14%|█▍ | 1767/12384 [3:44:54<22:44:10, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 14%|█▍ | 1767/12384 [3:45:02<22:44:10, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 1: 14%|█▍ | 1768/12384 [3:45:02<22:38:04, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 1: 14%|█▍ | 1768/12384 [3:45:09<22:38:04, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 14%|█▍ | 1769/12384 [3:45:09<22:33:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 14%|█▍ | 1769/12384 [3:45:17<22:33:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.01s]
Epoch 1: 14%|█▍ | 1770/12384 [3:45:17<22:31:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.01s]
Epoch 1: 14%|█▍ | 1770/12384 [3:45:24<22:31:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 1: 14%|█▍ | 1771/12384 [3:45:24<22:29:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 1: 14%|█▍ | 1771/12384 [3:45:32<22:29:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 1: 14%|█▍ | 1772/12384 [3:45:32<22:27:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 1: 14%|█▍ | 1772/12384 [3:45:40<22:27:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.85s]
Epoch 1: 14%|█▍ | 1773/12384 [3:45:40<22:27:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.85s]
Epoch 1: 14%|█▍ | 1773/12384 [3:45:47<22:27:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 1: 14%|█▍ | 1774/12384 [3:45:47<22:32:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 1: 14%|█▍ | 1774/12384 [3:45:55<22:32:02, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.49s]
Epoch 1: 14%|█▍ | 1775/12384 [3:45:55<22:30:25, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.49s]
Epoch 1: 14%|█▍ | 1775/12384 [3:46:03<22:30:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.07s]
Epoch 1: 14%|█▍ | 1776/12384 [3:46:03<22:28:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.07s]
Epoch 1: 14%|█▍ | 1776/12384 [3:46:10<22:28:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 14%|█▍ | 1777/12384 [3:46:10<22:29:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 14%|█▍ | 1777/12384 [3:46:18<22:29:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 14%|█▍ | 1778/12384 [3:46:18<22:26:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 14%|█▍ | 1778/12384 [3:46:25<22:26:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 1: 14%|█▍ | 1779/12384 [3:46:25<22:26:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 1: 14%|█▍ | 1779/12384 [3:46:33<22:26:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 14%|█▍ | 1780/12384 [3:46:33<22:24:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 14%|█▍ | 1780/12384 [3:46:41<22:24:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 14%|█▍ | 1781/12384 [3:46:41<22:25:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 14%|█▍ | 1781/12384 [3:46:48<22:25:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 14%|█▍ | 1782/12384 [3:46:48<22:25:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 14%|█▍ | 1782/12384 [3:46:56<22:25:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.58s]
Epoch 1: 14%|█▍ | 1783/12384 [3:46:56<22:25:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.58s]
Epoch 1: 14%|█▍ | 1783/12384 [3:47:03<22:25:02, 7.61s/it, loss=0.0002, acc=0.9985, iter_time=11.58s]
Epoch 1: 14%|█▍ | 1784/12384 [3:47:03<22:24:43, 7.61s/it, loss=0.0002, acc=0.9985, iter_time=11.58s]
Epoch 1: 14%|█▍ | 1784/12384 [3:47:11<22:24:43, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.83s]
Epoch 1: 14%|█▍ | 1785/12384 [3:47:11<22:24:28, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.83s]
Epoch 1: 14%|█▍ | 1785/12384 [3:47:19<22:24:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 1: 14%|█▍ | 1786/12384 [3:47:19<22:25:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 1: 14%|█▍ | 1786/12384 [3:47:26<22:25:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 1: 14%|█▍ | 1787/12384 [3:47:26<22:25:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 1: 14%|█▍ | 1787/12384 [3:47:34<22:25:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 1: 14%|█▍ | 1788/12384 [3:47:34<22:24:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 1: 14%|█▍ | 1788/12384 [3:47:42<22:24:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 14%|█▍ | 1789/12384 [3:47:42<22:30:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 14%|█▍ | 1789/12384 [3:47:49<22:30:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 1: 14%|█▍ | 1790/12384 [3:47:49<22:28:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 1: 14%|█▍ | 1790/12384 [3:47:57<22:28:38, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 14%|█▍ | 1791/12384 [3:47:57<22:26:49, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 14%|█▍ | 1791/12384 [3:48:04<22:26:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 14%|█▍ | 1792/12384 [3:48:04<22:26:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 14%|█▍ | 1792/12384 [3:48:12<22:26:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 14%|█▍ | 1793/12384 [3:48:12<22:41:08, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 14%|█▍ | 1793/12384 [3:48:20<22:41:08, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 14%|█▍ | 1794/12384 [3:48:20<22:34:36, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 14%|█▍ | 1794/12384 [3:48:28<22:34:36, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 1: 14%|█▍ | 1795/12384 [3:48:28<22:30:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 1: 14%|█▍ | 1795/12384 [3:48:35<22:30:29, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 1: 15%|█▍ | 1796/12384 [3:48:35<22:27:39, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 1: 15%|█▍ | 1796/12384 [3:48:43<22:27:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 15%|█▍ | 1797/12384 [3:48:43<22:24:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 15%|█▍ | 1797/12384 [3:48:50<22:24:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 15%|█▍ | 1798/12384 [3:48:50<22:23:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 15%|█▍ | 1798/12384 [3:48:58<22:23:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 1: 15%|█▍ | 1799/12384 [3:48:58<22:23:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 1: 15%|█▍ | 1799/12384 [3:49:06<22:23:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 1: 15%|█▍ | 1800/12384 [3:49:06<22:23:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 1: 15%|█▍ | 1800/12384 [3:49:13<22:23:33, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.71s]
Epoch 1: 15%|█▍ | 1801/12384 [3:49:13<22:23:58, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.71s]
Epoch 1: 15%|█▍ | 1801/12384 [3:49:21<22:23:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 1: 15%|█▍ | 1802/12384 [3:49:21<22:28:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 1: 15%|█▍ | 1802/12384 [3:49:29<22:28:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 15%|█▍ | 1803/12384 [3:49:29<22:26:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 15%|█▍ | 1803/12384 [3:49:36<22:26:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 15%|█▍ | 1804/12384 [3:49:36<22:23:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 15%|█▍ | 1804/12384 [3:49:44<22:23:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 1: 15%|█▍ | 1805/12384 [3:49:44<22:23:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 1: 15%|█▍ | 1805/12384 [3:49:52<22:23:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 15%|█▍ | 1806/12384 [3:49:52<22:29:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 15%|█▍ | 1806/12384 [3:49:59<22:29:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 15%|█▍ | 1807/12384 [3:49:59<22:26:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 15%|█▍ | 1807/12384 [3:50:07<22:26:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 15%|█▍ | 1808/12384 [3:50:07<22:26:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 15%|█▍ | 1808/12384 [3:50:14<22:26:03, 7.64s/it, loss=0.0000, acc=0.9998, iter_time=7.66s]
Epoch 1: 15%|█▍ | 1809/12384 [3:50:14<22:27:10, 7.64s/it, loss=0.0000, acc=0.9998, iter_time=7.66s]
Epoch 1: 15%|█▍ | 1809/12384 [3:50:22<22:27:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 15%|█▍ | 1810/12384 [3:50:22<22:24:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 15%|█▍ | 1810/12384 [3:50:30<22:24:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 15%|█▍ | 1811/12384 [3:50:30<22:39:35, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 15%|█▍ | 1811/12384 [3:50:38<22:39:35, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.49s]
Epoch 1: 15%|█▍ | 1812/12384 [3:50:38<22:35:17, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.49s]
Epoch 1: 15%|█▍ | 1812/12384 [3:50:45<22:35:17, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.36s]
Epoch 1: 15%|█▍ | 1813/12384 [3:50:45<22:30:57, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.36s]
Epoch 1: 15%|█▍ | 1813/12384 [3:50:53<22:30:57, 7.67s/it, loss=0.0008, acc=0.9972, iter_time=8.14s]
Epoch 1: 15%|█▍ | 1814/12384 [3:50:53<22:28:52, 7.66s/it, loss=0.0008, acc=0.9972, iter_time=8.14s]
Epoch 1: 15%|█▍ | 1814/12384 [3:51:00<22:28:52, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.49s]
Epoch 1: 15%|█▍ | 1815/12384 [3:51:00<22:26:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.49s]
Epoch 1: 15%|█▍ | 1815/12384 [3:51:08<22:26:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 15%|█▍ | 1816/12384 [3:51:08<22:24:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 15%|█▍ | 1816/12384 [3:51:16<22:24:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 15%|█▍ | 1817/12384 [3:51:16<22:23:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 15%|█▍ | 1817/12384 [3:51:23<22:23:14, 7.63s/it, loss=0.0003, acc=0.9982, iter_time=7.71s]
Epoch 1: 15%|█▍ | 1818/12384 [3:51:23<22:29:15, 7.66s/it, loss=0.0003, acc=0.9982, iter_time=7.71s]
Epoch 1: 15%|█▍ | 1818/12384 [3:51:31<22:29:15, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.21s]
Epoch 1: 15%|█▍ | 1819/12384 [3:51:31<22:42:02, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=6.21s]
Epoch 1: 15%|█▍ | 1819/12384 [3:51:39<22:42:02, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 1: 15%|█▍ | 1820/12384 [3:51:39<22:34:56, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 1: 15%|█▍ | 1820/12384 [3:51:46<22:34:56, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 15%|█▍ | 1821/12384 [3:51:46<22:30:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 15%|█▍ | 1821/12384 [3:51:54<22:30:13, 7.67s/it, loss=0.0015, acc=0.9954, iter_time=9.90s]
Epoch 1: 15%|█▍ | 1822/12384 [3:51:54<22:27:05, 7.65s/it, loss=0.0015, acc=0.9954, iter_time=9.90s]
Epoch 1: 15%|█▍ | 1822/12384 [3:52:02<22:27:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 1: 15%|█▍ | 1823/12384 [3:52:02<22:24:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 1: 15%|█▍ | 1823/12384 [3:52:09<22:24:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.36s]
Epoch 1: 15%|█▍ | 1824/12384 [3:52:09<22:22:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.36s]
Epoch 1: 15%|█▍ | 1824/12384 [3:52:17<22:22:28, 7.63s/it, loss=0.0001, acc=0.9997, iter_time=7.41s]
Epoch 1: 15%|█▍ | 1825/12384 [3:52:17<22:20:44, 7.62s/it, loss=0.0001, acc=0.9997, iter_time=7.41s]
Epoch 1: 15%|█▍ | 1825/12384 [3:52:25<22:20:44, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=6.92s]
Epoch 1: 15%|█▍ | 1826/12384 [3:52:25<22:19:16, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=6.92s]
Epoch 1: 15%|█▍ | 1826/12384 [3:52:32<22:19:16, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.50s]
Epoch 1: 15%|█▍ | 1827/12384 [3:52:32<22:18:33, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.50s]
Epoch 1: 15%|█▍ | 1827/12384 [3:52:40<22:18:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 15%|█▍ | 1828/12384 [3:52:40<22:22:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 15%|█▍ | 1828/12384 [3:52:47<22:22:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.89s]
Epoch 1: 15%|█▍ | 1829/12384 [3:52:47<22:21:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.89s]
Epoch 1: 15%|█▍ | 1829/12384 [3:52:55<22:21:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 1: 15%|█▍ | 1830/12384 [3:52:55<22:20:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 1: 15%|█▍ | 1830/12384 [3:53:03<22:20:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 15%|█▍ | 1831/12384 [3:53:03<22:20:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 15%|█▍ | 1831/12384 [3:53:10<22:20:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 1: 15%|█▍ | 1832/12384 [3:53:10<22:20:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 1: 15%|█▍ | 1832/12384 [3:53:18<22:20:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 15%|█▍ | 1833/12384 [3:53:18<22:22:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 15%|█▍ | 1833/12384 [3:53:26<22:22:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.14s]
Epoch 1: 15%|█▍ | 1834/12384 [3:53:26<22:24:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.14s]
Epoch 1: 15%|█▍ | 1834/12384 [3:53:33<22:24:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.15s]
Epoch 1: 15%|█▍ | 1835/12384 [3:53:33<22:23:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.15s]
Epoch 1: 15%|█▍ | 1835/12384 [3:53:41<22:23:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 15%|█▍ | 1836/12384 [3:53:41<22:28:03, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 15%|█▍ | 1836/12384 [3:53:49<22:28:03, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 15%|█▍ | 1837/12384 [3:53:49<22:40:00, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 15%|█▍ | 1837/12384 [3:53:57<22:40:00, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 1: 15%|█▍ | 1838/12384 [3:53:57<22:36:19, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 1: 15%|█▍ | 1838/12384 [3:54:04<22:36:19, 7.72s/it, loss=0.0002, acc=0.9990, iter_time=8.22s]
Epoch 1: 15%|█▍ | 1839/12384 [3:54:04<22:30:05, 7.68s/it, loss=0.0002, acc=0.9990, iter_time=8.22s]
Epoch 1: 15%|█▍ | 1839/12384 [3:54:12<22:30:05, 7.68s/it, loss=0.0002, acc=0.9998, iter_time=7.57s]
Epoch 1: 15%|█▍ | 1840/12384 [3:54:12<22:27:12, 7.67s/it, loss=0.0002, acc=0.9998, iter_time=7.57s]
Epoch 1: 15%|█▍ | 1840/12384 [3:54:19<22:27:12, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 15%|█▍ | 1841/12384 [3:54:19<22:26:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 15%|█▍ | 1841/12384 [3:54:27<22:26:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 1: 15%|█▍ | 1842/12384 [3:54:27<22:22:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 1: 15%|█▍ | 1842/12384 [3:54:35<22:22:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 1: 15%|█▍ | 1843/12384 [3:54:35<22:20:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 1: 15%|█▍ | 1843/12384 [3:54:42<22:20:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 15%|█▍ | 1844/12384 [3:54:42<22:18:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 15%|█▍ | 1844/12384 [3:54:50<22:18:46, 7.62s/it, loss=0.0011, acc=0.9990, iter_time=4.05s]
Epoch 1: 15%|█▍ | 1845/12384 [3:54:50<22:35:56, 7.72s/it, loss=0.0011, acc=0.9990, iter_time=4.05s]
Epoch 1: 15%|█▍ | 1845/12384 [3:54:58<22:35:56, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 1: 15%|█▍ | 1846/12384 [3:54:58<22:30:49, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 1: 15%|█▍ | 1846/12384 [3:55:05<22:30:49, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 1: 15%|█▍ | 1847/12384 [3:55:05<22:28:10, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 1: 15%|█▍ | 1847/12384 [3:55:13<22:28:10, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 15%|█▍ | 1848/12384 [3:55:13<22:24:56, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 15%|█▍ | 1848/12384 [3:55:21<22:24:56, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.61s]
Epoch 1: 15%|█▍ | 1849/12384 [3:55:21<22:23:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.61s]
Epoch 1: 15%|█▍ | 1849/12384 [3:55:28<22:23:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.24s]
Epoch 1: 15%|█▍ | 1850/12384 [3:55:28<22:21:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.24s]
Epoch 1: 15%|█▍ | 1850/12384 [3:55:36<22:21:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.57s]
Epoch 1: 15%|█▍ | 1851/12384 [3:55:36<22:18:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.57s]
Epoch 1: 15%|█▍ | 1851/12384 [3:55:43<22:18:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 1: 15%|█▍ | 1852/12384 [3:55:43<22:17:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 1: 15%|█▍ | 1852/12384 [3:55:51<22:17:26, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 1: 15%|█▍ | 1853/12384 [3:55:51<22:15:16, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 1: 15%|█▍ | 1853/12384 [3:55:59<22:15:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.98s]
Epoch 1: 15%|█▍ | 1854/12384 [3:55:59<22:14:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.98s]
Epoch 1: 15%|█▍ | 1854/12384 [3:56:06<22:14:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 1: 15%|█▍ | 1855/12384 [3:56:06<22:14:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 1: 15%|█▍ | 1855/12384 [3:56:14<22:14:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 15%|█▍ | 1856/12384 [3:56:14<22:14:01, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 15%|█▍ | 1856/12384 [3:56:21<22:14:01, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 15%|█▍ | 1857/12384 [3:56:21<22:15:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 15%|█▍ | 1857/12384 [3:56:29<22:15:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.78s]
Epoch 1: 15%|█▌ | 1858/12384 [3:56:29<22:15:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.78s]
Epoch 1: 15%|█▌ | 1858/12384 [3:56:37<22:15:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 1: 15%|█▌ | 1859/12384 [3:56:37<22:13:50, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 1: 15%|█▌ | 1859/12384 [3:56:44<22:13:50, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 15%|█▌ | 1860/12384 [3:56:44<22:14:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 15%|█▌ | 1860/12384 [3:56:52<22:14:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.54s]
Epoch 1: 15%|█▌ | 1861/12384 [3:56:52<22:14:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.54s]
Epoch 1: 15%|█▌ | 1861/12384 [3:57:00<22:14:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.66s]
Epoch 1: 15%|█▌ | 1862/12384 [3:57:00<22:13:01, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.66s]
Epoch 1: 15%|█▌ | 1862/12384 [3:57:07<22:13:01, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 1: 15%|█▌ | 1863/12384 [3:57:07<22:13:16, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 1: 15%|█▌ | 1863/12384 [3:57:15<22:13:16, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.82s]
Epoch 1: 15%|█▌ | 1864/12384 [3:57:15<22:28:57, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.82s]
Epoch 1: 15%|█▌ | 1864/12384 [3:57:23<22:28:57, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 15%|█▌ | 1865/12384 [3:57:23<22:24:29, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 15%|█▌ | 1865/12384 [3:57:30<22:24:29, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 1: 15%|█▌ | 1866/12384 [3:57:30<22:25:43, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 1: 15%|█▌ | 1866/12384 [3:57:38<22:25:43, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 15%|█▌ | 1867/12384 [3:57:38<22:23:28, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 15%|█▌ | 1867/12384 [3:57:46<22:23:28, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 15%|█▌ | 1868/12384 [3:57:46<22:20:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 15%|█▌ | 1868/12384 [3:57:53<22:20:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 15%|█▌ | 1869/12384 [3:57:53<22:18:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 15%|█▌ | 1869/12384 [3:58:01<22:18:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 15%|█▌ | 1870/12384 [3:58:01<22:16:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 15%|█▌ | 1870/12384 [3:58:08<22:16:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 15%|█▌ | 1871/12384 [3:58:08<22:16:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 15%|█▌ | 1871/12384 [3:58:16<22:16:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 1: 15%|█▌ | 1872/12384 [3:58:16<22:32:09, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 1: 15%|█▌ | 1872/12384 [3:58:24<22:32:09, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.45s]
Epoch 1: 15%|█▌ | 1873/12384 [3:58:24<22:25:36, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.45s]
Epoch 1: 15%|█▌ | 1873/12384 [3:58:32<22:25:36, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 15%|█▌ | 1874/12384 [3:58:32<22:24:07, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 15%|█▌ | 1874/12384 [3:58:39<22:24:07, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 15%|█▌ | 1875/12384 [3:58:39<22:20:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 15%|█▌ | 1875/12384 [3:58:47<22:20:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 15%|█▌ | 1876/12384 [3:58:47<22:17:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 15%|█▌ | 1876/12384 [3:58:54<22:17:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 15%|█▌ | 1877/12384 [3:58:54<22:16:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 15%|█▌ | 1877/12384 [3:59:02<22:16:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 15%|█▌ | 1878/12384 [3:59:02<22:15:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 15%|█▌ | 1878/12384 [3:59:10<22:15:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 1: 15%|█▌ | 1879/12384 [3:59:10<22:13:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 1: 15%|█▌ | 1879/12384 [3:59:17<22:13:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.22s]
Epoch 1: 15%|█▌ | 1880/12384 [3:59:17<22:13:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.22s]
Epoch 1: 15%|█▌ | 1880/12384 [3:59:25<22:13:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.15s]
Epoch 1: 15%|█▌ | 1881/12384 [3:59:25<22:12:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.15s]
Epoch 1: 15%|█▌ | 1881/12384 [3:59:32<22:12:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 1: 15%|█▌ | 1882/12384 [3:59:32<22:12:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 1: 15%|█▌ | 1882/12384 [3:59:40<22:12:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 15%|█▌ | 1883/12384 [3:59:40<22:13:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 15%|█▌ | 1883/12384 [3:59:48<22:13:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 15%|█▌ | 1884/12384 [3:59:48<22:11:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 15%|█▌ | 1884/12384 [3:59:55<22:11:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 1: 15%|█▌ | 1885/12384 [3:59:55<22:11:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 1: 15%|█▌ | 1885/12384 [4:00:03<22:11:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.31s]
Epoch 1: 15%|█▌ | 1886/12384 [4:00:03<22:10:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.31s]
Epoch 1: 15%|█▌ | 1886/12384 [4:00:10<22:10:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 1: 15%|█▌ | 1887/12384 [4:00:10<22:09:12, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 1: 15%|█▌ | 1887/12384 [4:00:18<22:09:12, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 15%|█▌ | 1888/12384 [4:00:18<22:09:07, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 15%|█▌ | 1888/12384 [4:00:26<22:09:07, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=4.88s]
Epoch 1: 15%|█▌ | 1889/12384 [4:00:26<22:15:43, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=4.88s]
Epoch 1: 15%|█▌ | 1889/12384 [4:00:33<22:15:43, 7.64s/it, loss=0.0005, acc=0.9998, iter_time=6.95s]
Epoch 1: 15%|█▌ | 1890/12384 [4:00:33<22:13:09, 7.62s/it, loss=0.0005, acc=0.9998, iter_time=6.95s]
Epoch 1: 15%|█▌ | 1890/12384 [4:00:41<22:13:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.68s]
Epoch 1: 15%|█▌ | 1891/12384 [4:00:41<22:11:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.68s]
Epoch 1: 15%|█▌ | 1891/12384 [4:00:49<22:11:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 15%|█▌ | 1892/12384 [4:00:49<22:10:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 15%|█▌ | 1892/12384 [4:00:56<22:10:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 15%|█▌ | 1893/12384 [4:00:56<22:10:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 15%|█▌ | 1893/12384 [4:01:04<22:10:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 1: 15%|█▌ | 1894/12384 [4:01:04<22:09:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 1: 15%|█▌ | 1894/12384 [4:01:11<22:09:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 1: 15%|█▌ | 1895/12384 [4:01:11<22:09:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 1: 15%|█▌ | 1895/12384 [4:01:19<22:09:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 15%|█▌ | 1896/12384 [4:01:19<22:09:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 15%|█▌ | 1896/12384 [4:01:27<22:09:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 15%|█▌ | 1897/12384 [4:01:27<22:09:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 15%|█▌ | 1897/12384 [4:01:35<22:09:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.40s]
Epoch 1: 15%|█▌ | 1898/12384 [4:01:35<22:26:37, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.40s]
Epoch 1: 15%|█▌ | 1898/12384 [4:01:42<22:26:37, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 1: 15%|█▌ | 1899/12384 [4:01:42<22:20:27, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 1: 15%|█▌ | 1899/12384 [4:01:50<22:20:27, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 1: 15%|█▌ | 1900/12384 [4:01:50<22:16:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 1: 15%|█▌ | 1900/12384 [4:01:57<22:16:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 15%|█▌ | 1901/12384 [4:01:57<22:18:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 15%|█▌ | 1901/12384 [4:02:05<22:18:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 1: 15%|█▌ | 1902/12384 [4:02:05<22:14:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 1: 15%|█▌ | 1902/12384 [4:02:13<22:14:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 15%|█▌ | 1903/12384 [4:02:13<22:13:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 15%|█▌ | 1903/12384 [4:02:20<22:13:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 15%|█▌ | 1904/12384 [4:02:20<22:12:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 15%|█▌ | 1904/12384 [4:02:28<22:12:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 15%|█▌ | 1905/12384 [4:02:28<22:11:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 15%|█▌ | 1905/12384 [4:02:35<22:11:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 15%|█▌ | 1906/12384 [4:02:35<22:11:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 15%|█▌ | 1906/12384 [4:02:43<22:11:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.54s]
Epoch 1: 15%|█▌ | 1907/12384 [4:02:43<22:10:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.54s]
Epoch 1: 15%|█▌ | 1907/12384 [4:02:51<22:10:04, 7.62s/it, loss=0.0003, acc=0.9982, iter_time=9.23s]
Epoch 1: 15%|█▌ | 1908/12384 [4:02:51<22:12:13, 7.63s/it, loss=0.0003, acc=0.9982, iter_time=9.23s]
Epoch 1: 15%|█▌ | 1908/12384 [4:02:58<22:12:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 1: 15%|█▌ | 1909/12384 [4:02:58<22:11:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 1: 15%|█▌ | 1909/12384 [4:03:06<22:11:08, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.05s]
Epoch 1: 15%|█▌ | 1910/12384 [4:03:06<22:12:22, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.05s]
Epoch 1: 15%|█▌ | 1910/12384 [4:03:14<22:12:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.41s]
Epoch 1: 15%|█▌ | 1911/12384 [4:03:14<22:10:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.41s]
Epoch 1: 15%|█▌ | 1911/12384 [4:03:21<22:10:25, 7.62s/it, loss=0.0004, acc=0.9994, iter_time=9.78s]
Epoch 1: 15%|█▌ | 1912/12384 [4:03:21<22:10:57, 7.63s/it, loss=0.0004, acc=0.9994, iter_time=9.78s]
Epoch 1: 15%|█▌ | 1912/12384 [4:03:29<22:10:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.05s]
Epoch 1: 15%|█▌ | 1913/12384 [4:03:29<22:10:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.05s]
Epoch 1: 15%|█▌ | 1913/12384 [4:03:36<22:10:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 15%|█▌ | 1914/12384 [4:03:36<22:08:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 15%|█▌ | 1914/12384 [4:03:44<22:08:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 1: 15%|█▌ | 1915/12384 [4:03:44<22:08:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 1: 15%|█▌ | 1915/12384 [4:03:52<22:08:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.80s]
Epoch 1: 15%|█▌ | 1916/12384 [4:03:52<22:08:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.80s]
Epoch 1: 15%|█▌ | 1916/12384 [4:04:00<22:08:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 1: 15%|█▌ | 1917/12384 [4:04:00<22:22:39, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 1: 15%|█▌ | 1917/12384 [4:04:07<22:22:39, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 1: 15%|█▌ | 1918/12384 [4:04:07<22:18:03, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 1: 15%|█▌ | 1918/12384 [4:04:15<22:18:03, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 1: 15%|█▌ | 1919/12384 [4:04:15<22:14:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 1: 15%|█▌ | 1919/12384 [4:04:22<22:14:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 16%|█▌ | 1920/12384 [4:04:22<22:12:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 16%|█▌ | 1920/12384 [4:04:30<22:12:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 1: 16%|█▌ | 1921/12384 [4:04:30<22:11:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 1: 16%|█▌ | 1921/12384 [4:04:38<22:11:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 16%|█▌ | 1922/12384 [4:04:38<22:09:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 16%|█▌ | 1922/12384 [4:04:45<22:09:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 16%|█▌ | 1923/12384 [4:04:45<22:12:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 16%|█▌ | 1923/12384 [4:04:53<22:12:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 1: 16%|█▌ | 1924/12384 [4:04:53<22:10:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 1: 16%|█▌ | 1924/12384 [4:05:01<22:10:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.50s]
Epoch 1: 16%|█▌ | 1925/12384 [4:05:01<22:24:39, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.50s]
Epoch 1: 16%|█▌ | 1925/12384 [4:05:08<22:24:39, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 1: 16%|█▌ | 1926/12384 [4:05:08<22:19:40, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 1: 16%|█▌ | 1926/12384 [4:05:16<22:19:40, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.87s]
Epoch 1: 16%|█▌ | 1927/12384 [4:05:16<22:14:23, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.87s]
Epoch 1: 16%|█▌ | 1927/12384 [4:05:24<22:14:23, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.30s]
Epoch 1: 16%|█▌ | 1928/12384 [4:05:24<22:13:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.30s]
Epoch 1: 16%|█▌ | 1928/12384 [4:05:31<22:13:11, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.26s]
Epoch 1: 16%|█▌ | 1929/12384 [4:05:31<22:11:35, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.26s]
Epoch 1: 16%|█▌ | 1929/12384 [4:05:39<22:11:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 1: 16%|█▌ | 1930/12384 [4:05:39<22:09:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 1: 16%|█▌ | 1930/12384 [4:05:47<22:09:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 1: 16%|█▌ | 1931/12384 [4:05:47<22:10:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 1: 16%|█▌ | 1931/12384 [4:05:54<22:10:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 16%|█▌ | 1932/12384 [4:05:54<22:08:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 16%|█▌ | 1932/12384 [4:06:02<22:08:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 1: 16%|█▌ | 1933/12384 [4:06:02<22:07:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 1: 16%|█▌ | 1933/12384 [4:06:09<22:07:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 1: 16%|█▌ | 1934/12384 [4:06:09<22:07:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 1: 16%|█▌ | 1934/12384 [4:06:17<22:07:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 1: 16%|█▌ | 1935/12384 [4:06:17<22:07:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 1: 16%|█▌ | 1935/12384 [4:06:25<22:07:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 16%|█▌ | 1936/12384 [4:06:25<22:06:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 16%|█▌ | 1936/12384 [4:06:32<22:06:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 1: 16%|█▌ | 1937/12384 [4:06:32<22:06:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 1: 16%|█▌ | 1937/12384 [4:06:40<22:06:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 1: 16%|█▌ | 1938/12384 [4:06:40<22:04:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 1: 16%|█▌ | 1938/12384 [4:06:47<22:04:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 1: 16%|█▌ | 1939/12384 [4:06:47<22:03:45, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 1: 16%|█▌ | 1939/12384 [4:06:55<22:03:45, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.62s]
Epoch 1: 16%|█▌ | 1940/12384 [4:06:55<22:04:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.62s]
Epoch 1: 16%|█▌ | 1940/12384 [4:07:03<22:04:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 1: 16%|█▌ | 1941/12384 [4:07:03<22:03:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 1: 16%|█▌ | 1941/12384 [4:07:10<22:03:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 1: 16%|█▌ | 1942/12384 [4:07:10<22:03:04, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 1: 16%|█▌ | 1942/12384 [4:07:18<22:03:04, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 16%|█▌ | 1943/12384 [4:07:18<22:04:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 16%|█▌ | 1943/12384 [4:07:26<22:04:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 1: 16%|█▌ | 1944/12384 [4:07:26<22:08:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 1: 16%|█▌ | 1944/12384 [4:07:33<22:08:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 16%|█▌ | 1945/12384 [4:07:33<22:08:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 16%|█▌ | 1945/12384 [4:07:41<22:08:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 16%|█▌ | 1946/12384 [4:07:41<22:07:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 16%|█▌ | 1946/12384 [4:07:48<22:07:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 16%|█▌ | 1947/12384 [4:07:48<22:05:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 16%|█▌ | 1947/12384 [4:07:56<22:05:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 16%|█▌ | 1948/12384 [4:07:56<22:04:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 16%|█▌ | 1948/12384 [4:08:04<22:04:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 16%|█▌ | 1949/12384 [4:08:04<22:03:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 16%|█▌ | 1949/12384 [4:08:11<22:03:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 1: 16%|█▌ | 1950/12384 [4:08:11<22:04:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 1: 16%|█▌ | 1950/12384 [4:08:19<22:04:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 16%|█▌ | 1951/12384 [4:08:19<22:22:16, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 16%|█▌ | 1951/12384 [4:08:27<22:22:16, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 1: 16%|█▌ | 1952/12384 [4:08:27<22:17:04, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 1: 16%|█▌ | 1952/12384 [4:08:34<22:17:04, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 16%|█▌ | 1953/12384 [4:08:34<22:12:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 16%|█▌ | 1953/12384 [4:08:42<22:12:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 16%|█▌ | 1954/12384 [4:08:42<22:08:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 16%|█▌ | 1954/12384 [4:08:50<22:08:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 1: 16%|█▌ | 1955/12384 [4:08:50<22:07:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 1: 16%|█▌ | 1955/12384 [4:08:57<22:07:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 1: 16%|█▌ | 1956/12384 [4:08:57<22:04:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 1: 16%|█▌ | 1956/12384 [4:09:05<22:04:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 1: 16%|█▌ | 1957/12384 [4:09:05<22:03:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 1: 16%|█▌ | 1957/12384 [4:09:12<22:03:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 1: 16%|█▌ | 1958/12384 [4:09:12<22:03:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 1: 16%|█▌ | 1958/12384 [4:09:20<22:03:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.00s]
Epoch 1: 16%|█▌ | 1959/12384 [4:09:20<22:03:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.00s]
Epoch 1: 16%|█▌ | 1959/12384 [4:09:28<22:03:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 1: 16%|█▌ | 1960/12384 [4:09:28<22:06:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 1: 16%|█▌ | 1960/12384 [4:09:35<22:06:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 16%|█▌ | 1961/12384 [4:09:35<22:04:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 16%|█▌ | 1961/12384 [4:09:43<22:04:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 16%|█▌ | 1962/12384 [4:09:43<22:03:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 16%|█▌ | 1962/12384 [4:09:51<22:03:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 1: 16%|█▌ | 1963/12384 [4:09:51<22:02:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 1: 16%|█▌ | 1963/12384 [4:09:58<22:02:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.84s]
Epoch 1: 16%|█▌ | 1964/12384 [4:09:58<22:01:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.84s]
Epoch 1: 16%|█▌ | 1964/12384 [4:10:06<22:01:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 16%|█▌ | 1965/12384 [4:10:06<21:59:57, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 16%|█▌ | 1965/12384 [4:10:13<21:59:57, 7.60s/it, loss=0.0003, acc=0.9987, iter_time=8.00s]
Epoch 1: 16%|█▌ | 1966/12384 [4:10:13<22:00:26, 7.60s/it, loss=0.0003, acc=0.9987, iter_time=8.00s]
Epoch 1: 16%|█▌ | 1966/12384 [4:10:21<22:00:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 16%|█▌ | 1967/12384 [4:10:21<22:00:08, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 16%|█▌ | 1967/12384 [4:10:29<22:00:08, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 16%|█▌ | 1968/12384 [4:10:29<22:01:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 16%|█▌ | 1968/12384 [4:10:36<22:01:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 16%|█▌ | 1969/12384 [4:10:36<22:17:06, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 16%|█▌ | 1969/12384 [4:10:44<22:17:06, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=4.83s]
Epoch 1: 16%|█▌ | 1970/12384 [4:10:44<22:12:12, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=4.83s]
Epoch 1: 16%|█▌ | 1970/12384 [4:10:52<22:12:12, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.39s]
Epoch 1: 16%|█▌ | 1971/12384 [4:10:52<22:09:17, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.39s]
Epoch 1: 16%|█▌ | 1971/12384 [4:10:59<22:09:17, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 16%|█▌ | 1972/12384 [4:10:59<22:05:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 16%|█▌ | 1972/12384 [4:11:07<22:05:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 16%|█▌ | 1973/12384 [4:11:07<22:03:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 16%|█▌ | 1973/12384 [4:11:14<22:03:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 16%|█▌ | 1974/12384 [4:11:14<22:02:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 16%|█▌ | 1974/12384 [4:11:22<22:02:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 1: 16%|█▌ | 1975/12384 [4:11:22<22:02:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 1: 16%|█▌ | 1975/12384 [4:11:30<22:02:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.01s]
Epoch 1: 16%|█▌ | 1976/12384 [4:11:30<22:01:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.01s]
Epoch 1: 16%|█▌ | 1976/12384 [4:11:38<22:01:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 1: 16%|█▌ | 1977/12384 [4:11:38<22:15:51, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 1: 16%|█▌ | 1977/12384 [4:11:45<22:15:51, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 1: 16%|█▌ | 1978/12384 [4:11:45<22:10:45, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 1: 16%|█▌ | 1978/12384 [4:11:53<22:10:45, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 16%|█▌ | 1979/12384 [4:11:53<22:08:02, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 16%|█▌ | 1979/12384 [4:12:00<22:08:02, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 16%|█▌ | 1980/12384 [4:12:00<22:05:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 16%|█▌ | 1980/12384 [4:12:08<22:05:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 16%|█▌ | 1981/12384 [4:12:08<22:02:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 16%|█▌ | 1981/12384 [4:12:16<22:02:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 16%|█▌ | 1982/12384 [4:12:16<22:01:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 16%|█▌ | 1982/12384 [4:12:23<22:01:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 16%|█▌ | 1983/12384 [4:12:23<22:01:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 16%|█▌ | 1983/12384 [4:12:31<22:01:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 16%|█▌ | 1984/12384 [4:12:31<21:59:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 16%|█▌ | 1984/12384 [4:12:38<21:59:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 16%|█▌ | 1985/12384 [4:12:38<21:59:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 16%|█▌ | 1985/12384 [4:12:46<21:59:18, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=6.14s]
Epoch 1: 16%|█▌ | 1986/12384 [4:12:46<21:59:29, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=6.14s]
Epoch 1: 16%|█▌ | 1986/12384 [4:12:54<21:59:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 16%|█▌ | 1987/12384 [4:12:54<21:58:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 16%|█▌ | 1987/12384 [4:13:01<21:58:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 16%|█▌ | 1988/12384 [4:13:01<21:59:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 16%|█▌ | 1988/12384 [4:13:09<21:59:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 16%|█▌ | 1989/12384 [4:13:09<21:59:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 16%|█▌ | 1989/12384 [4:13:17<21:59:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 16%|█▌ | 1990/12384 [4:13:17<21:58:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 16%|█▌ | 1990/12384 [4:13:24<21:58:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 1: 16%|█▌ | 1991/12384 [4:13:24<21:57:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 1: 16%|█▌ | 1991/12384 [4:13:32<21:57:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.32s]
Epoch 1: 16%|█▌ | 1992/12384 [4:13:32<21:57:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.32s]
Epoch 1: 16%|█▌ | 1992/12384 [4:13:39<21:57:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 16%|█▌ | 1993/12384 [4:13:39<21:58:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 16%|█▌ | 1993/12384 [4:13:47<21:58:34, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.85s]
Epoch 1: 16%|█▌ | 1994/12384 [4:13:47<21:57:32, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.85s]
Epoch 1: 16%|█▌ | 1994/12384 [4:13:55<21:57:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.78s]
Epoch 1: 16%|█▌ | 1995/12384 [4:13:55<21:57:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.78s]
Epoch 1: 16%|█▌ | 1995/12384 [4:14:02<21:57:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 16%|█▌ | 1996/12384 [4:14:02<21:57:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 16%|█▌ | 1996/12384 [4:14:10<21:57:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.58s]
Epoch 1: 16%|█▌ | 1997/12384 [4:14:10<21:57:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.58s]
Epoch 1: 16%|█▌ | 1997/12384 [4:14:17<21:57:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 1: 16%|█▌ | 1998/12384 [4:14:17<21:58:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 1: 16%|█▌ | 1998/12384 [4:14:25<21:58:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 1: 16%|█▌ | 1999/12384 [4:14:25<21:57:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 1: 16%|█▌ | 1999/12384 [4:14:33<21:57:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 16%|█▌ | 2000/12384 [4:14:33<22:01:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 16%|█▌ | 2000/12384 [4:14:40<22:01:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 16%|█▌ | 2001/12384 [4:14:40<22:00:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 16%|█▌ | 2001/12384 [4:14:48<22:00:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 16%|█▌ | 2002/12384 [4:14:48<22:03:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 16%|█▌ | 2002/12384 [4:14:56<22:03:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.21s]
Epoch 1: 16%|█▌ | 2003/12384 [4:14:56<22:17:32, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=9.21s]
Epoch 1: 16%|█▌ | 2003/12384 [4:15:04<22:17:32, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 1: 16%|█▌ | 2004/12384 [4:15:04<22:10:37, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 1: 16%|█▌ | 2004/12384 [4:15:11<22:10:37, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 1: 16%|█▌ | 2005/12384 [4:15:11<22:05:37, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 1: 16%|█▌ | 2005/12384 [4:15:19<22:05:37, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.29s]
Epoch 1: 16%|█▌ | 2006/12384 [4:15:19<22:03:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.29s]
Epoch 1: 16%|█▌ | 2006/12384 [4:15:26<22:03:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.35s]
Epoch 1: 16%|█▌ | 2007/12384 [4:15:26<22:01:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.35s]
Epoch 1: 16%|█▌ | 2007/12384 [4:15:34<22:01:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.22s]
Epoch 1: 16%|█▌ | 2008/12384 [4:15:34<22:00:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.22s]
Epoch 1: 16%|█▌ | 2008/12384 [4:15:42<22:00:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.02s]
Epoch 1: 16%|█▌ | 2009/12384 [4:15:42<21:58:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.02s]
Epoch 1: 16%|█▌ | 2009/12384 [4:15:49<21:58:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.05s]
Epoch 1: 16%|█▌ | 2010/12384 [4:15:49<22:00:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.05s]
Epoch 1: 16%|█▌ | 2010/12384 [4:15:57<22:00:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 1: 16%|█▌ | 2011/12384 [4:15:57<21:58:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 1: 16%|█▌ | 2011/12384 [4:16:05<21:58:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.06s]
Epoch 1: 16%|█▌ | 2012/12384 [4:16:05<21:56:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.06s]
Epoch 1: 16%|█▌ | 2012/12384 [4:16:12<21:56:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 1: 16%|█▋ | 2013/12384 [4:16:12<21:57:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 1: 16%|█▋ | 2013/12384 [4:16:20<21:57:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 1: 16%|█▋ | 2014/12384 [4:16:20<21:57:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 1: 16%|█▋ | 2014/12384 [4:16:27<21:57:39, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=10.65s]
Epoch 1: 16%|█▋ | 2015/12384 [4:16:27<21:57:45, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=10.65s]
Epoch 1: 16%|█▋ | 2015/12384 [4:16:35<21:57:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 1: 16%|█▋ | 2016/12384 [4:16:35<21:57:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 1: 16%|█▋ | 2016/12384 [4:16:43<21:57:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.97s]
Epoch 1: 16%|█▋ | 2017/12384 [4:16:43<21:57:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.97s]
Epoch 1: 16%|█▋ | 2017/12384 [4:16:50<21:57:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 16%|█▋ | 2018/12384 [4:16:50<21:58:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 16%|█▋ | 2018/12384 [4:16:58<21:58:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 1: 16%|█▋ | 2019/12384 [4:16:58<21:56:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 1: 16%|█▋ | 2019/12384 [4:17:06<21:56:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.11s]
Epoch 1: 16%|█▋ | 2020/12384 [4:17:06<21:57:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.11s]
Epoch 1: 16%|█▋ | 2020/12384 [4:17:13<21:57:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.48s]
Epoch 1: 16%|█▋ | 2021/12384 [4:17:13<21:54:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.48s]
Epoch 1: 16%|█▋ | 2021/12384 [4:17:21<21:54:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 1: 16%|█▋ | 2022/12384 [4:17:21<21:55:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 1: 16%|█▋ | 2022/12384 [4:17:28<21:55:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.97s]
Epoch 1: 16%|█▋ | 2023/12384 [4:17:28<21:55:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.97s]
Epoch 1: 16%|█▋ | 2023/12384 [4:17:36<21:55:34, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=10.87s]
Epoch 1: 16%|█▋ | 2024/12384 [4:17:36<21:54:56, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=10.87s]
Epoch 1: 16%|█▋ | 2024/12384 [4:17:44<21:54:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.84s]
Epoch 1: 16%|█▋ | 2025/12384 [4:17:44<21:55:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.84s]
Epoch 1: 16%|█▋ | 2025/12384 [4:17:51<21:55:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.09s]
Epoch 1: 16%|█▋ | 2026/12384 [4:17:51<21:55:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.09s]
Epoch 1: 16%|█▋ | 2026/12384 [4:17:59<21:55:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 1: 16%|█▋ | 2027/12384 [4:17:59<21:53:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 1: 16%|█▋ | 2027/12384 [4:18:06<21:53:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 16%|█▋ | 2028/12384 [4:18:06<21:52:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 16%|█▋ | 2028/12384 [4:18:14<21:52:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 16%|█▋ | 2029/12384 [4:18:14<22:08:36, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 16%|█▋ | 2029/12384 [4:18:22<22:08:36, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 16%|█▋ | 2030/12384 [4:18:22<22:03:56, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 16%|█▋ | 2030/12384 [4:18:30<22:03:56, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 16%|█▋ | 2031/12384 [4:18:30<22:00:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 16%|█▋ | 2031/12384 [4:18:37<22:00:29, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.00s]
Epoch 1: 16%|█▋ | 2032/12384 [4:18:37<22:04:15, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=8.00s]
Epoch 1: 16%|█▋ | 2032/12384 [4:18:45<22:04:15, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 16%|█▋ | 2033/12384 [4:18:45<21:59:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 16%|█▋ | 2033/12384 [4:18:52<21:59:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 16%|█▋ | 2034/12384 [4:18:52<21:57:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 16%|█▋ | 2034/12384 [4:19:00<21:57:15, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.00s]
Epoch 1: 16%|█▋ | 2035/12384 [4:19:00<21:56:19, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.00s]
Epoch 1: 16%|█▋ | 2035/12384 [4:19:08<21:56:19, 7.63s/it, loss=0.0002, acc=0.9987, iter_time=8.21s]
Epoch 1: 16%|█▋ | 2036/12384 [4:19:08<21:55:37, 7.63s/it, loss=0.0002, acc=0.9987, iter_time=8.21s]
Epoch 1: 16%|█▋ | 2036/12384 [4:19:15<21:55:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 16%|█▋ | 2037/12384 [4:19:15<21:59:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 16%|█▋ | 2037/12384 [4:19:23<21:59:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.90s]
Epoch 1: 16%|█▋ | 2038/12384 [4:19:23<21:57:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.90s]
Epoch 1: 16%|█▋ | 2038/12384 [4:19:31<21:57:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 16%|█▋ | 2039/12384 [4:19:31<21:55:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 16%|█▋ | 2039/12384 [4:19:38<21:55:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 16%|█▋ | 2040/12384 [4:19:38<21:53:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 16%|█▋ | 2040/12384 [4:19:46<21:53:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.86s]
Epoch 1: 16%|█▋ | 2041/12384 [4:19:46<21:54:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.86s]
Epoch 1: 16%|█▋ | 2041/12384 [4:19:53<21:54:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.99s]
Epoch 1: 16%|█▋ | 2042/12384 [4:19:53<21:53:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.99s]
Epoch 1: 16%|█▋ | 2042/12384 [4:20:01<21:53:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 16%|█▋ | 2043/12384 [4:20:01<21:52:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 16%|█▋ | 2043/12384 [4:20:09<21:52:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 17%|█▋ | 2044/12384 [4:20:09<21:51:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 17%|█▋ | 2044/12384 [4:20:16<21:51:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 1: 17%|█▋ | 2045/12384 [4:20:16<21:51:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 1: 17%|█▋ | 2045/12384 [4:20:24<21:51:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 17%|█▋ | 2046/12384 [4:20:24<21:50:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 17%|█▋ | 2046/12384 [4:20:31<21:50:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.62s]
Epoch 1: 17%|█▋ | 2047/12384 [4:20:31<21:50:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.62s]
Epoch 1: 17%|█▋ | 2047/12384 [4:20:39<21:50:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.34s]
Epoch 1: 17%|█▋ | 2048/12384 [4:20:39<22:04:44, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=11.34s]
Epoch 1: 17%|█▋ | 2048/12384 [4:20:47<22:04:44, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 1: 17%|█▋ | 2049/12384 [4:20:47<21:58:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 1: 17%|█▋ | 2049/12384 [4:20:55<21:58:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 1: 17%|█▋ | 2050/12384 [4:20:55<21:55:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 1: 17%|█▋ | 2050/12384 [4:21:02<21:55:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 17%|█▋ | 2051/12384 [4:21:02<21:54:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 17%|█▋ | 2051/12384 [4:21:10<21:54:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 17%|█▋ | 2052/12384 [4:21:10<21:52:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 17%|█▋ | 2052/12384 [4:21:17<21:52:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 17%|█▋ | 2053/12384 [4:21:17<21:51:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 17%|█▋ | 2053/12384 [4:21:25<21:51:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 17%|█▋ | 2054/12384 [4:21:25<21:50:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 17%|█▋ | 2054/12384 [4:21:33<21:50:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 17%|█▋ | 2055/12384 [4:21:33<21:50:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 17%|█▋ | 2055/12384 [4:21:41<21:50:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 1: 17%|█▋ | 2056/12384 [4:21:41<22:06:27, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 1: 17%|█▋ | 2056/12384 [4:21:48<22:06:27, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.16s]
Epoch 1: 17%|█▋ | 2057/12384 [4:21:48<22:02:31, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.16s]
Epoch 1: 17%|█▋ | 2057/12384 [4:21:56<22:02:31, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 1: 17%|█▋ | 2058/12384 [4:21:56<21:57:38, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 1: 17%|█▋ | 2058/12384 [4:22:03<21:57:38, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 1: 17%|█▋ | 2059/12384 [4:22:03<21:54:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 1: 17%|█▋ | 2059/12384 [4:22:11<21:54:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.80s]
Epoch 1: 17%|█▋ | 2060/12384 [4:22:11<21:52:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.80s]
Epoch 1: 17%|█▋ | 2060/12384 [4:22:19<21:52:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 17%|█▋ | 2061/12384 [4:22:19<21:51:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 17%|█▋ | 2061/12384 [4:22:26<21:51:50, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 1: 17%|█▋ | 2062/12384 [4:22:26<21:52:57, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 1: 17%|█▋ | 2062/12384 [4:22:34<21:52:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 17%|█▋ | 2063/12384 [4:22:34<21:51:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 17%|█▋ | 2063/12384 [4:22:41<21:51:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 17%|█▋ | 2064/12384 [4:22:41<21:51:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 17%|█▋ | 2064/12384 [4:22:49<21:51:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 17%|█▋ | 2065/12384 [4:22:49<21:50:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 17%|█▋ | 2065/12384 [4:22:57<21:50:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 17%|█▋ | 2066/12384 [4:22:57<21:50:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 17%|█▋ | 2066/12384 [4:23:04<21:50:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 17%|█▋ | 2067/12384 [4:23:04<21:49:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 17%|█▋ | 2067/12384 [4:23:12<21:49:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 17%|█▋ | 2068/12384 [4:23:12<21:48:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 17%|█▋ | 2068/12384 [4:23:19<21:48:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 17%|█▋ | 2069/12384 [4:23:19<21:48:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 17%|█▋ | 2069/12384 [4:23:27<21:48:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 17%|█▋ | 2070/12384 [4:23:27<21:48:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 17%|█▋ | 2070/12384 [4:23:35<21:48:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.88s]
Epoch 1: 17%|█▋ | 2071/12384 [4:23:35<21:47:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.88s]
Epoch 1: 17%|█▋ | 2071/12384 [4:23:42<21:47:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.75s]
Epoch 1: 17%|█▋ | 2072/12384 [4:23:42<21:49:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.75s]
Epoch 1: 17%|█▋ | 2072/12384 [4:23:50<21:49:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.62s]
Epoch 1: 17%|█▋ | 2073/12384 [4:23:50<21:48:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.62s]
Epoch 1: 17%|█▋ | 2073/12384 [4:23:58<21:48:04, 7.61s/it, loss=0.0005, acc=0.9998, iter_time=8.48s]
Epoch 1: 17%|█▋ | 2074/12384 [4:23:58<22:01:51, 7.69s/it, loss=0.0005, acc=0.9998, iter_time=8.48s]
Epoch 1: 17%|█▋ | 2074/12384 [4:24:05<22:01:51, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 17%|█▋ | 2075/12384 [4:24:05<21:56:32, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 17%|█▋ | 2075/12384 [4:24:13<21:56:32, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 17%|█▋ | 2076/12384 [4:24:13<21:54:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 17%|█▋ | 2076/12384 [4:24:21<21:54:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 1: 17%|█▋ | 2077/12384 [4:24:21<21:55:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 1: 17%|█▋ | 2077/12384 [4:24:28<21:55:29, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=8.83s]
Epoch 1: 17%|█▋ | 2078/12384 [4:24:28<21:51:24, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.83s]
Epoch 1: 17%|█▋ | 2078/12384 [4:24:36<21:51:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 17%|█▋ | 2079/12384 [4:24:36<21:50:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 17%|█▋ | 2079/12384 [4:24:44<21:50:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.93s]
Epoch 1: 17%|█▋ | 2080/12384 [4:24:44<21:49:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.93s]
Epoch 1: 17%|█▋ | 2080/12384 [4:24:51<21:49:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.13s]
Epoch 1: 17%|█▋ | 2081/12384 [4:24:51<21:48:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.13s]
Epoch 1: 17%|█▋ | 2081/12384 [4:24:59<21:48:08, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.16s]
Epoch 1: 17%|█▋ | 2082/12384 [4:24:59<22:04:44, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=7.16s]
Epoch 1: 17%|█▋ | 2082/12384 [4:25:07<22:04:44, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=10.52s]
Epoch 1: 17%|█▋ | 2083/12384 [4:25:07<22:04:47, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=10.52s]
Epoch 1: 17%|█▋ | 2083/12384 [4:25:14<22:04:47, 7.72s/it, loss=0.0002, acc=0.9978, iter_time=4.90s]
Epoch 1: 17%|█▋ | 2084/12384 [4:25:14<21:59:11, 7.68s/it, loss=0.0002, acc=0.9978, iter_time=4.90s]
Epoch 1: 17%|█▋ | 2084/12384 [4:25:22<21:59:11, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 1: 17%|█▋ | 2085/12384 [4:25:22<21:55:08, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 1: 17%|█▋ | 2085/12384 [4:25:30<21:55:08, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 17%|█▋ | 2086/12384 [4:25:30<21:52:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 17%|█▋ | 2086/12384 [4:25:37<21:52:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 1: 17%|█▋ | 2087/12384 [4:25:37<21:51:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 1: 17%|█▋ | 2087/12384 [4:25:45<21:51:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.04s]
Epoch 1: 17%|█▋ | 2088/12384 [4:25:45<21:48:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.04s]
Epoch 1: 17%|█▋ | 2088/12384 [4:25:52<21:48:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 17%|█▋ | 2089/12384 [4:25:52<21:47:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 17%|█▋ | 2089/12384 [4:26:00<21:47:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 17%|█▋ | 2090/12384 [4:26:00<21:45:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 17%|█▋ | 2090/12384 [4:26:08<21:45:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 17%|█▋ | 2091/12384 [4:26:08<21:44:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 17%|█▋ | 2091/12384 [4:26:15<21:44:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 17%|█▋ | 2092/12384 [4:26:15<21:44:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 17%|█▋ | 2092/12384 [4:26:23<21:44:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.98s]
Epoch 1: 17%|█▋ | 2093/12384 [4:26:23<21:43:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.98s]
Epoch 1: 17%|█▋ | 2093/12384 [4:26:30<21:43:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.68s]
Epoch 1: 17%|█▋ | 2094/12384 [4:26:30<21:44:04, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.68s]
Epoch 1: 17%|█▋ | 2094/12384 [4:26:38<21:44:04, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 1: 17%|█▋ | 2095/12384 [4:26:38<21:42:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 1: 17%|█▋ | 2095/12384 [4:26:46<21:42:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.92s]
Epoch 1: 17%|█▋ | 2096/12384 [4:26:46<21:43:24, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.92s]
Epoch 1: 17%|█▋ | 2096/12384 [4:26:53<21:43:24, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=3.92s]
Epoch 1: 17%|█▋ | 2097/12384 [4:26:53<21:43:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=3.92s]
Epoch 1: 17%|█▋ | 2097/12384 [4:27:01<21:43:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 1: 17%|█▋ | 2098/12384 [4:27:01<21:44:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 1: 17%|█▋ | 2098/12384 [4:27:08<21:44:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.02s]
Epoch 1: 17%|█▋ | 2099/12384 [4:27:08<21:45:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.02s]
Epoch 1: 17%|█▋ | 2099/12384 [4:27:16<21:45:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 17%|█▋ | 2100/12384 [4:27:16<21:49:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 17%|█▋ | 2100/12384 [4:27:24<21:49:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.12s]
Epoch 1: 17%|█▋ | 2101/12384 [4:27:24<21:49:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.12s]
Epoch 1: 17%|█▋ | 2101/12384 [4:27:31<21:49:15, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.65s]
Epoch 1: 17%|█▋ | 2102/12384 [4:27:31<21:47:57, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.65s]
Epoch 1: 17%|█▋ | 2102/12384 [4:27:39<21:47:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.19s]
Epoch 1: 17%|█▋ | 2103/12384 [4:27:39<21:47:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.19s]
Epoch 1: 17%|█▋ | 2103/12384 [4:27:47<21:47:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 17%|█▋ | 2104/12384 [4:27:47<21:47:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 17%|█▋ | 2104/12384 [4:27:54<21:47:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.36s]
Epoch 1: 17%|█▋ | 2105/12384 [4:27:54<21:46:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.36s]
Epoch 1: 17%|█▋ | 2105/12384 [4:28:02<21:46:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.91s]
Epoch 1: 17%|█▋ | 2106/12384 [4:28:02<21:46:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.91s]
Epoch 1: 17%|█▋ | 2106/12384 [4:28:10<21:46:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 17%|█▋ | 2107/12384 [4:28:10<21:45:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 17%|█▋ | 2107/12384 [4:28:17<21:45:13, 7.62s/it, loss=0.0006, acc=1.0000, iter_time=6.09s]
Epoch 1: 17%|█▋ | 2108/12384 [4:28:17<21:45:44, 7.62s/it, loss=0.0006, acc=1.0000, iter_time=6.09s]
Epoch 1: 17%|█▋ | 2108/12384 [4:28:25<21:45:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 1: 17%|█▋ | 2109/12384 [4:28:25<22:02:13, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 1: 17%|█▋ | 2109/12384 [4:28:33<22:02:13, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 1: 17%|█▋ | 2110/12384 [4:28:33<21:57:22, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 1: 17%|█▋ | 2110/12384 [4:28:40<21:57:22, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 17%|█▋ | 2111/12384 [4:28:40<21:52:49, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 17%|█▋ | 2111/12384 [4:28:48<21:52:49, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 17%|█▋ | 2112/12384 [4:28:48<21:50:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 17%|█▋ | 2112/12384 [4:28:56<21:50:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 17%|█▋ | 2113/12384 [4:28:56<21:48:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 17%|█▋ | 2113/12384 [4:29:03<21:48:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 1: 17%|█▋ | 2114/12384 [4:29:03<21:47:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 1: 17%|█▋ | 2114/12384 [4:29:11<21:47:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 17%|█▋ | 2115/12384 [4:29:11<21:46:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 17%|█▋ | 2115/12384 [4:29:18<21:46:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 1: 17%|█▋ | 2116/12384 [4:29:19<21:55:42, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 1: 17%|█▋ | 2116/12384 [4:29:26<21:55:42, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 17%|█▋ | 2117/12384 [4:29:26<21:54:05, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 17%|█▋ | 2117/12384 [4:29:34<21:54:05, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.78s]
Epoch 1: 17%|█▋ | 2118/12384 [4:29:34<21:51:13, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.78s]
Epoch 1: 17%|█▋ | 2118/12384 [4:29:42<21:51:13, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 17%|█▋ | 2119/12384 [4:29:42<21:48:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 17%|█▋ | 2119/12384 [4:29:49<21:48:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 17%|█▋ | 2120/12384 [4:29:49<21:46:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 17%|█▋ | 2120/12384 [4:29:57<21:46:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 1: 17%|█▋ | 2121/12384 [4:29:57<21:45:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 1: 17%|█▋ | 2121/12384 [4:30:04<21:45:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 1: 17%|█▋ | 2122/12384 [4:30:04<21:43:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 1: 17%|█▋ | 2122/12384 [4:30:12<21:43:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.86s]
Epoch 1: 17%|█▋ | 2123/12384 [4:30:12<21:41:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.86s]
Epoch 1: 17%|█▋ | 2123/12384 [4:30:20<21:41:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 1: 17%|█▋ | 2124/12384 [4:30:20<21:40:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 1: 17%|█▋ | 2124/12384 [4:30:27<21:40:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 1: 17%|█▋ | 2125/12384 [4:30:27<21:38:50, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 1: 17%|█▋ | 2125/12384 [4:30:35<21:38:50, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 17%|█▋ | 2126/12384 [4:30:35<21:38:59, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 17%|█▋ | 2126/12384 [4:30:43<21:38:59, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 17%|█▋ | 2127/12384 [4:30:43<21:55:55, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 17%|█▋ | 2127/12384 [4:30:50<21:55:55, 7.70s/it, loss=0.0002, acc=1.0000, iter_time=7.98s]
Epoch 1: 17%|█▋ | 2128/12384 [4:30:50<21:50:24, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=7.98s]
Epoch 1: 17%|█▋ | 2128/12384 [4:30:58<21:50:24, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 17%|█▋ | 2129/12384 [4:30:58<21:47:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 17%|█▋ | 2129/12384 [4:31:05<21:47:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 17%|█▋ | 2130/12384 [4:31:05<21:45:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 17%|█▋ | 2130/12384 [4:31:13<21:45:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 17%|█▋ | 2131/12384 [4:31:13<21:42:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 17%|█▋ | 2131/12384 [4:31:21<21:42:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 17%|█▋ | 2132/12384 [4:31:21<21:41:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 17%|█▋ | 2132/12384 [4:31:28<21:41:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.25s]
Epoch 1: 17%|█▋ | 2133/12384 [4:31:28<21:41:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.25s]
Epoch 1: 17%|█▋ | 2133/12384 [4:31:36<21:41:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.49s]
Epoch 1: 17%|█▋ | 2134/12384 [4:31:36<21:40:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.49s]
Epoch 1: 17%|█▋ | 2134/12384 [4:31:44<21:40:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 1: 17%|█▋ | 2135/12384 [4:31:44<21:56:17, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 1: 17%|█▋ | 2135/12384 [4:31:51<21:56:17, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.82s]
Epoch 1: 17%|█▋ | 2136/12384 [4:31:51<21:50:33, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.82s]
Epoch 1: 17%|█▋ | 2136/12384 [4:31:59<21:50:33, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 1: 17%|█▋ | 2137/12384 [4:31:59<21:47:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 1: 17%|█▋ | 2137/12384 [4:32:07<21:47:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 1: 17%|█▋ | 2138/12384 [4:32:07<21:43:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 1: 17%|█▋ | 2138/12384 [4:32:14<21:43:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 17%|█▋ | 2139/12384 [4:32:14<21:42:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 17%|█▋ | 2139/12384 [4:32:22<21:42:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 17%|█▋ | 2140/12384 [4:32:22<21:40:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 17%|█▋ | 2140/12384 [4:32:29<21:40:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 17%|█▋ | 2141/12384 [4:32:29<21:39:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 17%|█▋ | 2141/12384 [4:32:37<21:39:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 17%|█▋ | 2142/12384 [4:32:37<21:38:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 17%|█▋ | 2142/12384 [4:32:45<21:38:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 1: 17%|█▋ | 2143/12384 [4:32:45<21:36:44, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 1: 17%|█▋ | 2143/12384 [4:32:52<21:36:44, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.27s]
Epoch 1: 17%|█▋ | 2144/12384 [4:32:52<21:40:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.27s]
Epoch 1: 17%|█▋ | 2144/12384 [4:33:00<21:40:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 17%|█▋ | 2145/12384 [4:33:00<21:38:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 17%|█▋ | 2145/12384 [4:33:07<21:38:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 17%|█▋ | 2146/12384 [4:33:07<21:38:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 17%|█▋ | 2146/12384 [4:33:15<21:38:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 17%|█▋ | 2147/12384 [4:33:15<21:37:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 17%|█▋ | 2147/12384 [4:33:23<21:37:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 1: 17%|█▋ | 2148/12384 [4:33:23<21:39:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 1: 17%|█▋ | 2148/12384 [4:33:30<21:39:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 1: 17%|█▋ | 2149/12384 [4:33:30<21:39:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 1: 17%|█▋ | 2149/12384 [4:33:38<21:39:17, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.61s]
Epoch 1: 17%|█▋ | 2150/12384 [4:33:38<21:38:38, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.61s]
Epoch 1: 17%|█▋ | 2150/12384 [4:33:46<21:38:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 17%|█▋ | 2151/12384 [4:33:46<21:54:42, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 17%|█▋ | 2151/12384 [4:33:53<21:54:42, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 17%|█▋ | 2152/12384 [4:33:53<21:49:16, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 17%|█▋ | 2152/12384 [4:34:01<21:49:16, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.22s]
Epoch 1: 17%|█▋ | 2153/12384 [4:34:01<21:44:39, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.22s]
Epoch 1: 17%|█▋ | 2153/12384 [4:34:09<21:44:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 17%|█▋ | 2154/12384 [4:34:09<21:42:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 17%|█▋ | 2154/12384 [4:34:16<21:42:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 1: 17%|█▋ | 2155/12384 [4:34:16<21:40:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 1: 17%|█▋ | 2155/12384 [4:34:24<21:40:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 1: 17%|█▋ | 2156/12384 [4:34:24<21:39:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 1: 17%|█▋ | 2156/12384 [4:34:31<21:39:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 17%|█▋ | 2157/12384 [4:34:31<21:39:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 17%|█▋ | 2157/12384 [4:34:39<21:39:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 1: 17%|█▋ | 2158/12384 [4:34:39<21:38:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 1: 17%|█▋ | 2158/12384 [4:34:47<21:38:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 1: 17%|█▋ | 2159/12384 [4:34:47<21:37:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 1: 17%|█▋ | 2159/12384 [4:34:54<21:37:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.95s]
Epoch 1: 17%|█▋ | 2160/12384 [4:34:54<21:37:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.95s]
Epoch 1: 17%|█▋ | 2160/12384 [4:35:02<21:37:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 1: 17%|█▋ | 2161/12384 [4:35:02<21:52:35, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 1: 17%|█▋ | 2161/12384 [4:35:10<21:52:35, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.35s]
Epoch 1: 17%|█▋ | 2162/12384 [4:35:10<21:46:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.35s]
Epoch 1: 17%|█▋ | 2162/12384 [4:35:17<21:46:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 1: 17%|█▋ | 2163/12384 [4:35:17<21:43:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 1: 17%|█▋ | 2163/12384 [4:35:25<21:43:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 1: 17%|█▋ | 2164/12384 [4:35:25<21:39:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 1: 17%|█▋ | 2164/12384 [4:35:33<21:39:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 17%|█▋ | 2165/12384 [4:35:33<21:39:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 17%|█▋ | 2165/12384 [4:35:40<21:39:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 17%|█▋ | 2166/12384 [4:35:40<21:37:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 17%|█▋ | 2166/12384 [4:35:48<21:37:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 17%|█▋ | 2167/12384 [4:35:48<21:38:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 17%|█▋ | 2167/12384 [4:35:56<21:38:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 1: 18%|█▊ | 2168/12384 [4:35:56<21:40:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 1: 18%|█▊ | 2168/12384 [4:36:03<21:40:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 18%|█▊ | 2169/12384 [4:36:03<21:38:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 18%|█▊ | 2169/12384 [4:36:11<21:38:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 18%|█▊ | 2170/12384 [4:36:11<21:37:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 18%|█▊ | 2170/12384 [4:36:18<21:37:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 18%|█▊ | 2171/12384 [4:36:18<21:37:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 18%|█▊ | 2171/12384 [4:36:26<21:37:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 1: 18%|█▊ | 2172/12384 [4:36:26<21:36:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 1: 18%|█▊ | 2172/12384 [4:36:34<21:36:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 1: 18%|█▊ | 2173/12384 [4:36:34<21:33:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 1: 18%|█▊ | 2173/12384 [4:36:41<21:33:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 1: 18%|█▊ | 2174/12384 [4:36:41<21:34:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 1: 18%|█▊ | 2174/12384 [4:36:49<21:34:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 18%|█▊ | 2175/12384 [4:36:49<21:35:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 18%|█▊ | 2175/12384 [4:36:56<21:35:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 18%|█▊ | 2176/12384 [4:36:56<21:33:51, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 18%|█▊ | 2176/12384 [4:37:04<21:33:51, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 18%|█▊ | 2177/12384 [4:37:04<21:49:38, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 18%|█▊ | 2177/12384 [4:37:12<21:49:38, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 18%|█▊ | 2178/12384 [4:37:12<21:45:37, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 18%|█▊ | 2178/12384 [4:37:20<21:45:37, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=3.41s]
Epoch 1: 18%|█▊ | 2179/12384 [4:37:20<21:42:15, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=3.41s]
Epoch 1: 18%|█▊ | 2179/12384 [4:37:27<21:42:15, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=11.50s]
Epoch 1: 18%|█▊ | 2180/12384 [4:37:27<21:39:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.50s]
Epoch 1: 18%|█▊ | 2180/12384 [4:37:35<21:39:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 18%|█▊ | 2181/12384 [4:37:35<21:37:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 18%|█▊ | 2181/12384 [4:37:42<21:37:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 18%|█▊ | 2182/12384 [4:37:42<21:35:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 18%|█▊ | 2182/12384 [4:37:50<21:35:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.78s]
Epoch 1: 18%|█▊ | 2183/12384 [4:37:50<21:33:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.78s]
Epoch 1: 18%|█▊ | 2183/12384 [4:37:58<21:33:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 1: 18%|█▊ | 2184/12384 [4:37:58<21:34:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 1: 18%|█▊ | 2184/12384 [4:38:05<21:34:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 18%|█▊ | 2185/12384 [4:38:05<21:33:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 18%|█▊ | 2185/12384 [4:38:13<21:33:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 18%|█▊ | 2186/12384 [4:38:13<21:32:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 18%|█▊ | 2186/12384 [4:38:21<21:32:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 18%|█▊ | 2187/12384 [4:38:21<21:48:37, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 18%|█▊ | 2187/12384 [4:38:28<21:48:37, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 1: 18%|█▊ | 2188/12384 [4:38:28<21:44:51, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 1: 18%|█▊ | 2188/12384 [4:38:36<21:44:51, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 1: 18%|█▊ | 2189/12384 [4:38:36<21:40:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 1: 18%|█▊ | 2189/12384 [4:38:44<21:40:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 18%|█▊ | 2190/12384 [4:38:44<21:38:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 18%|█▊ | 2190/12384 [4:38:51<21:38:53, 7.65s/it, loss=0.0001, acc=0.9988, iter_time=8.42s]
Epoch 1: 18%|█▊ | 2191/12384 [4:38:51<21:36:59, 7.63s/it, loss=0.0001, acc=0.9988, iter_time=8.42s]
Epoch 1: 18%|█▊ | 2191/12384 [4:38:59<21:36:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.52s]
Epoch 1: 18%|█▊ | 2192/12384 [4:38:59<21:36:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.52s]
Epoch 1: 18%|█▊ | 2192/12384 [4:39:06<21:36:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.03s]
Epoch 1: 18%|█▊ | 2193/12384 [4:39:06<21:34:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.03s]
Epoch 1: 18%|█▊ | 2193/12384 [4:39:14<21:34:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.05s]
Epoch 1: 18%|█▊ | 2194/12384 [4:39:14<21:33:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.05s]
Epoch 1: 18%|█▊ | 2194/12384 [4:39:22<21:33:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.58s]
Epoch 1: 18%|█▊ | 2195/12384 [4:39:22<21:33:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.58s]
Epoch 1: 18%|█▊ | 2195/12384 [4:39:29<21:33:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 18%|█▊ | 2196/12384 [4:39:29<21:31:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 18%|█▊ | 2196/12384 [4:39:37<21:31:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 1: 18%|█▊ | 2197/12384 [4:39:37<21:31:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 1: 18%|█▊ | 2197/12384 [4:39:44<21:31:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 1: 18%|█▊ | 2198/12384 [4:39:44<21:31:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 1: 18%|█▊ | 2198/12384 [4:39:52<21:31:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 18%|█▊ | 2199/12384 [4:39:52<21:30:33, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 18%|█▊ | 2199/12384 [4:40:00<21:30:33, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 18%|█▊ | 2200/12384 [4:40:00<21:30:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 18%|█▊ | 2200/12384 [4:40:07<21:30:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 18%|█▊ | 2201/12384 [4:40:07<21:29:50, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 18%|█▊ | 2201/12384 [4:40:15<21:29:50, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 18%|█▊ | 2202/12384 [4:40:15<21:29:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 18%|█▊ | 2202/12384 [4:40:23<21:29:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 1: 18%|█▊ | 2203/12384 [4:40:23<21:44:28, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 1: 18%|█▊ | 2203/12384 [4:40:30<21:44:28, 7.69s/it, loss=0.0002, acc=1.0000, iter_time=6.46s]
Epoch 1: 18%|█▊ | 2204/12384 [4:40:30<21:41:15, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=6.46s]
Epoch 1: 18%|█▊ | 2204/12384 [4:40:38<21:41:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 18%|█▊ | 2205/12384 [4:40:38<21:37:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 18%|█▊ | 2205/12384 [4:40:45<21:37:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.75s]
Epoch 1: 18%|█▊ | 2206/12384 [4:40:45<21:35:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.75s]
Epoch 1: 18%|█▊ | 2206/12384 [4:40:53<21:35:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 18%|█▊ | 2207/12384 [4:40:53<21:33:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 18%|█▊ | 2207/12384 [4:41:01<21:33:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 18%|█▊ | 2208/12384 [4:41:01<21:31:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 18%|█▊ | 2208/12384 [4:41:08<21:31:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 18%|█▊ | 2209/12384 [4:41:08<21:30:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 18%|█▊ | 2209/12384 [4:41:16<21:30:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 18%|█▊ | 2210/12384 [4:41:16<21:30:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 18%|█▊ | 2210/12384 [4:41:23<21:30:48, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.87s]
Epoch 1: 18%|█▊ | 2211/12384 [4:41:23<21:29:48, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.87s]
Epoch 1: 18%|█▊ | 2211/12384 [4:41:31<21:29:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.32s]
Epoch 1: 18%|█▊ | 2212/12384 [4:41:31<21:28:39, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.32s]
Epoch 1: 18%|█▊ | 2212/12384 [4:41:39<21:28:39, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 18%|█▊ | 2213/12384 [4:41:39<21:45:16, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 18%|█▊ | 2213/12384 [4:41:47<21:45:16, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 18%|█▊ | 2214/12384 [4:41:47<21:41:28, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 18%|█▊ | 2214/12384 [4:41:54<21:41:28, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=5.10s]
Epoch 1: 18%|█▊ | 2215/12384 [4:41:54<21:36:58, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=5.10s]
Epoch 1: 18%|█▊ | 2215/12384 [4:42:02<21:36:58, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.51s]
Epoch 1: 18%|█▊ | 2216/12384 [4:42:02<21:34:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.51s]
Epoch 1: 18%|█▊ | 2216/12384 [4:42:09<21:34:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 18%|█▊ | 2217/12384 [4:42:09<21:32:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 18%|█▊ | 2217/12384 [4:42:17<21:32:52, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=4.26s]
Epoch 1: 18%|█▊ | 2218/12384 [4:42:17<21:31:49, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.26s]
Epoch 1: 18%|█▊ | 2218/12384 [4:42:25<21:31:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.96s]
Epoch 1: 18%|█▊ | 2219/12384 [4:42:25<21:29:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.96s]
Epoch 1: 18%|█▊ | 2219/12384 [4:42:32<21:29:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 18%|█▊ | 2220/12384 [4:42:32<21:29:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 18%|█▊ | 2220/12384 [4:42:40<21:29:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 1: 18%|█▊ | 2221/12384 [4:42:40<21:30:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 1: 18%|█▊ | 2221/12384 [4:42:47<21:30:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.72s]
Epoch 1: 18%|█▊ | 2222/12384 [4:42:47<21:29:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.72s]
Epoch 1: 18%|█▊ | 2222/12384 [4:42:55<21:29:30, 7.61s/it, loss=0.0003, acc=0.9988, iter_time=7.71s]
Epoch 1: 18%|█▊ | 2223/12384 [4:42:55<21:33:49, 7.64s/it, loss=0.0003, acc=0.9988, iter_time=7.71s]
Epoch 1: 18%|█▊ | 2223/12384 [4:43:03<21:33:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 18%|█▊ | 2224/12384 [4:43:03<21:32:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 18%|█▊ | 2224/12384 [4:43:10<21:32:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 18%|█▊ | 2225/12384 [4:43:10<21:30:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 18%|█▊ | 2225/12384 [4:43:18<21:30:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 18%|█▊ | 2226/12384 [4:43:18<21:29:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 18%|█▊ | 2226/12384 [4:43:26<21:29:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 1: 18%|█▊ | 2227/12384 [4:43:26<21:29:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 1: 18%|█▊ | 2227/12384 [4:43:33<21:29:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.87s]
Epoch 1: 18%|█▊ | 2228/12384 [4:43:33<21:33:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.87s]
Epoch 1: 18%|█▊ | 2228/12384 [4:43:41<21:33:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 18%|█▊ | 2229/12384 [4:43:41<21:46:04, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 18%|█▊ | 2229/12384 [4:43:49<21:46:04, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 18%|█▊ | 2230/12384 [4:43:49<21:41:15, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 18%|█▊ | 2230/12384 [4:43:56<21:41:15, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 18%|█▊ | 2231/12384 [4:43:56<21:36:23, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 18%|█▊ | 2231/12384 [4:44:04<21:36:23, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 18%|█▊ | 2232/12384 [4:44:04<21:34:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 18%|█▊ | 2232/12384 [4:44:12<21:34:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 1: 18%|█▊ | 2233/12384 [4:44:12<21:32:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 1: 18%|█▊ | 2233/12384 [4:44:19<21:32:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 1: 18%|█▊ | 2234/12384 [4:44:19<21:30:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 1: 18%|█▊ | 2234/12384 [4:44:27<21:30:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 1: 18%|█▊ | 2235/12384 [4:44:27<21:29:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 1: 18%|█▊ | 2235/12384 [4:44:35<21:29:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.57s]
Epoch 1: 18%|█▊ | 2236/12384 [4:44:35<21:29:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.57s]
Epoch 1: 18%|█▊ | 2236/12384 [4:44:42<21:29:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.40s]
Epoch 1: 18%|█▊ | 2237/12384 [4:44:42<21:30:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.40s]
Epoch 1: 18%|█▊ | 2237/12384 [4:44:50<21:30:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.61s]
Epoch 1: 18%|█▊ | 2238/12384 [4:44:50<21:29:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.61s]
Epoch 1: 18%|█▊ | 2238/12384 [4:44:57<21:29:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 1: 18%|█▊ | 2239/12384 [4:44:57<21:29:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 1: 18%|█▊ | 2239/12384 [4:45:05<21:29:03, 7.62s/it, loss=0.0024, acc=0.9981, iter_time=11.41s]
Epoch 1: 18%|█▊ | 2240/12384 [4:45:05<21:45:50, 7.72s/it, loss=0.0024, acc=0.9981, iter_time=11.41s]
Epoch 1: 18%|█▊ | 2240/12384 [4:45:13<21:45:50, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=4.50s]
Epoch 1: 18%|█▊ | 2241/12384 [4:45:13<21:40:40, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.50s]
Epoch 1: 18%|█▊ | 2241/12384 [4:45:21<21:40:40, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.12s]
Epoch 1: 18%|█▊ | 2242/12384 [4:45:21<21:36:42, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.12s]
Epoch 1: 18%|█▊ | 2242/12384 [4:45:28<21:36:42, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.12s]
Epoch 1: 18%|█▊ | 2243/12384 [4:45:28<21:32:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.12s]
Epoch 1: 18%|█▊ | 2243/12384 [4:45:36<21:32:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 18%|█▊ | 2244/12384 [4:45:36<21:30:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 18%|█▊ | 2244/12384 [4:45:43<21:30:01, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.61s]
Epoch 1: 18%|█▊ | 2245/12384 [4:45:43<21:28:12, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.61s]
Epoch 1: 18%|█▊ | 2245/12384 [4:45:51<21:28:12, 7.62s/it, loss=0.0001, acc=0.9994, iter_time=7.61s]
Epoch 1: 18%|█▊ | 2246/12384 [4:45:51<21:27:08, 7.62s/it, loss=0.0001, acc=0.9994, iter_time=7.61s]
Epoch 1: 18%|█▊ | 2246/12384 [4:45:59<21:27:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 18%|█▊ | 2247/12384 [4:45:59<21:27:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 18%|█▊ | 2247/12384 [4:46:06<21:27:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 18%|█▊ | 2248/12384 [4:46:06<21:25:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 18%|█▊ | 2248/12384 [4:46:14<21:25:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 18%|█▊ | 2249/12384 [4:46:14<21:25:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 18%|█▊ | 2249/12384 [4:46:21<21:25:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 18%|█▊ | 2250/12384 [4:46:21<21:26:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 18%|█▊ | 2250/12384 [4:46:29<21:26:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 18%|█▊ | 2251/12384 [4:46:29<21:24:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 18%|█▊ | 2251/12384 [4:46:37<21:24:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 18%|█▊ | 2252/12384 [4:46:37<21:24:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 18%|█▊ | 2252/12384 [4:46:44<21:24:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 18%|█▊ | 2253/12384 [4:46:44<21:23:40, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 18%|█▊ | 2253/12384 [4:46:52<21:23:40, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 1: 18%|█▊ | 2254/12384 [4:46:52<21:23:33, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 1: 18%|█▊ | 2254/12384 [4:46:59<21:23:33, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 1: 18%|█▊ | 2255/12384 [4:46:59<21:23:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 1: 18%|█▊ | 2255/12384 [4:47:07<21:23:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 1: 18%|█▊ | 2256/12384 [4:47:07<21:38:32, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 1: 18%|█▊ | 2256/12384 [4:47:15<21:38:32, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.44s]
Epoch 1: 18%|█▊ | 2257/12384 [4:47:15<21:34:59, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.44s]
Epoch 1: 18%|█▊ | 2257/12384 [4:47:23<21:34:59, 7.67s/it, loss=0.0004, acc=0.9978, iter_time=9.46s]
Epoch 1: 18%|█▊ | 2258/12384 [4:47:23<21:32:22, 7.66s/it, loss=0.0004, acc=0.9978, iter_time=9.46s]
Epoch 1: 18%|█▊ | 2258/12384 [4:47:30<21:32:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 18%|█▊ | 2259/12384 [4:47:30<21:29:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 18%|█▊ | 2259/12384 [4:47:38<21:29:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 18%|█▊ | 2260/12384 [4:47:38<21:28:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 18%|█▊ | 2260/12384 [4:47:45<21:28:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 18%|█▊ | 2261/12384 [4:47:45<21:27:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 18%|█▊ | 2261/12384 [4:47:53<21:27:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 18%|█▊ | 2262/12384 [4:47:53<21:26:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 18%|█▊ | 2262/12384 [4:48:01<21:26:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.00s]
Epoch 1: 18%|█▊ | 2263/12384 [4:48:01<21:26:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.00s]
Epoch 1: 18%|█▊ | 2263/12384 [4:48:08<21:26:24, 7.63s/it, loss=0.0008, acc=0.9985, iter_time=10.61s]
Epoch 1: 18%|█▊ | 2264/12384 [4:48:08<21:26:53, 7.63s/it, loss=0.0008, acc=0.9985, iter_time=10.61s]
Epoch 1: 18%|█▊ | 2264/12384 [4:48:16<21:26:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.89s]
Epoch 1: 18%|█▊ | 2265/12384 [4:48:16<21:25:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.89s]
Epoch 1: 18%|█▊ | 2265/12384 [4:48:24<21:25:34, 7.62s/it, loss=0.0004, acc=0.9982, iter_time=11.70s]
Epoch 1: 18%|█▊ | 2266/12384 [4:48:24<21:41:00, 7.71s/it, loss=0.0004, acc=0.9982, iter_time=11.70s]
Epoch 1: 18%|█▊ | 2266/12384 [4:48:31<21:41:00, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 18%|█▊ | 2267/12384 [4:48:31<21:36:18, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 18%|█▊ | 2267/12384 [4:48:39<21:36:18, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 18%|█▊ | 2268/12384 [4:48:39<21:32:47, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 18%|█▊ | 2268/12384 [4:48:47<21:32:47, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 18%|█▊ | 2269/12384 [4:48:47<21:30:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 18%|█▊ | 2269/12384 [4:48:54<21:30:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 18%|█▊ | 2270/12384 [4:48:54<21:26:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 18%|█▊ | 2270/12384 [4:49:02<21:26:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 1: 18%|█▊ | 2271/12384 [4:49:02<21:27:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 1: 18%|█▊ | 2271/12384 [4:49:10<21:27:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 1: 18%|█▊ | 2272/12384 [4:49:10<21:26:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 1: 18%|█▊ | 2272/12384 [4:49:17<21:26:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.27s]
Epoch 1: 18%|█▊ | 2273/12384 [4:49:17<21:29:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.27s]
Epoch 1: 18%|█▊ | 2273/12384 [4:49:25<21:29:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 1: 18%|█▊ | 2274/12384 [4:49:25<21:29:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 1: 18%|█▊ | 2274/12384 [4:49:33<21:29:49, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 1: 18%|█▊ | 2275/12384 [4:49:33<21:30:41, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 1: 18%|█▊ | 2275/12384 [4:49:40<21:30:41, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 18%|█▊ | 2276/12384 [4:49:40<21:27:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 18%|█▊ | 2276/12384 [4:49:48<21:27:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 18%|█▊ | 2277/12384 [4:49:48<21:24:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 18%|█▊ | 2277/12384 [4:49:55<21:24:29, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.58s]
Epoch 1: 18%|█▊ | 2278/12384 [4:49:55<21:23:42, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.58s]
Epoch 1: 18%|█▊ | 2278/12384 [4:50:03<21:23:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 18%|█▊ | 2279/12384 [4:50:03<21:22:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 18%|█▊ | 2279/12384 [4:50:11<21:22:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 18%|█▊ | 2280/12384 [4:50:11<21:21:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 18%|█▊ | 2280/12384 [4:50:18<21:21:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 18%|█▊ | 2281/12384 [4:50:18<21:21:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 18%|█▊ | 2281/12384 [4:50:26<21:21:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 18%|█▊ | 2282/12384 [4:50:26<21:35:46, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 18%|█▊ | 2282/12384 [4:50:34<21:35:46, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 18%|█▊ | 2283/12384 [4:50:34<21:30:33, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 18%|█▊ | 2283/12384 [4:50:41<21:30:33, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 18%|█▊ | 2284/12384 [4:50:41<21:26:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 18%|█▊ | 2284/12384 [4:50:49<21:26:50, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 1: 18%|█▊ | 2285/12384 [4:50:49<21:24:08, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 1: 18%|█▊ | 2285/12384 [4:50:56<21:24:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.95s]
Epoch 1: 18%|█▊ | 2286/12384 [4:50:56<21:22:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.95s]
Epoch 1: 18%|█▊ | 2286/12384 [4:51:04<21:22:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 1: 18%|█▊ | 2287/12384 [4:51:04<21:22:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 1: 18%|█▊ | 2287/12384 [4:51:12<21:22:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 18%|█▊ | 2288/12384 [4:51:12<21:21:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 18%|█▊ | 2288/12384 [4:51:19<21:21:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 1: 18%|█▊ | 2289/12384 [4:51:19<21:22:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 1: 18%|█▊ | 2289/12384 [4:51:27<21:22:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 1: 18%|█▊ | 2290/12384 [4:51:27<21:22:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 1: 18%|█▊ | 2290/12384 [4:51:35<21:22:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 18%|█▊ | 2291/12384 [4:51:35<21:21:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 18%|█▊ | 2291/12384 [4:51:42<21:21:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 1: 19%|█▊ | 2292/12384 [4:51:42<21:20:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 1: 19%|█▊ | 2292/12384 [4:51:50<21:20:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.21s]
Epoch 1: 19%|█▊ | 2293/12384 [4:51:50<21:35:35, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.21s]
Epoch 1: 19%|█▊ | 2293/12384 [4:51:58<21:35:35, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 1: 19%|█▊ | 2294/12384 [4:51:58<21:32:02, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 1: 19%|█▊ | 2294/12384 [4:52:05<21:32:02, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 19%|█▊ | 2295/12384 [4:52:05<21:27:20, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 19%|█▊ | 2295/12384 [4:52:13<21:27:20, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 19%|█▊ | 2296/12384 [4:52:13<21:28:55, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 19%|█▊ | 2296/12384 [4:52:21<21:28:55, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 1: 19%|█▊ | 2297/12384 [4:52:21<21:30:39, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 1: 19%|█▊ | 2297/12384 [4:52:28<21:30:39, 7.68s/it, loss=0.0008, acc=0.9988, iter_time=7.62s]
Epoch 1: 19%|█▊ | 2298/12384 [4:52:28<21:26:56, 7.66s/it, loss=0.0008, acc=0.9988, iter_time=7.62s]
Epoch 1: 19%|█▊ | 2298/12384 [4:52:36<21:26:56, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 19%|█▊ | 2299/12384 [4:52:36<21:24:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 19%|█▊ | 2299/12384 [4:52:44<21:24:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 19%|█▊ | 2300/12384 [4:52:44<21:23:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 19%|█▊ | 2300/12384 [4:52:51<21:23:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 19%|█▊ | 2301/12384 [4:52:51<21:22:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 19%|█▊ | 2301/12384 [4:52:59<21:22:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 19%|█▊ | 2302/12384 [4:52:59<21:21:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 19%|█▊ | 2302/12384 [4:53:06<21:21:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 19%|█▊ | 2303/12384 [4:53:06<21:19:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 19%|█▊ | 2303/12384 [4:53:14<21:19:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 19%|█▊ | 2304/12384 [4:53:14<21:19:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 19%|█▊ | 2304/12384 [4:53:22<21:19:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 19%|█▊ | 2305/12384 [4:53:22<21:25:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 19%|█▊ | 2305/12384 [4:53:29<21:25:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.13s]
Epoch 1: 19%|█▊ | 2306/12384 [4:53:29<21:24:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.13s]
Epoch 1: 19%|█▊ | 2306/12384 [4:53:37<21:24:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 1: 19%|█▊ | 2307/12384 [4:53:37<21:22:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 1: 19%|█▊ | 2307/12384 [4:53:45<21:22:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 1: 19%|█▊ | 2308/12384 [4:53:45<21:21:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 1: 19%|█▊ | 2308/12384 [4:53:53<21:21:55, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.96s]
Epoch 1: 19%|█▊ | 2309/12384 [4:53:53<21:36:27, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=7.96s]
Epoch 1: 19%|█▊ | 2309/12384 [4:54:00<21:36:27, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.50s]
Epoch 1: 19%|█▊ | 2310/12384 [4:54:00<21:30:07, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.50s]
Epoch 1: 19%|█▊ | 2310/12384 [4:54:08<21:30:07, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 19%|█▊ | 2311/12384 [4:54:08<21:25:48, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 19%|█▊ | 2311/12384 [4:54:15<21:25:48, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 1: 19%|█▊ | 2312/12384 [4:54:15<21:23:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 1: 19%|█▊ | 2312/12384 [4:54:23<21:23:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.18s]
Epoch 1: 19%|█▊ | 2313/12384 [4:54:23<21:20:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.18s]
Epoch 1: 19%|█▊ | 2313/12384 [4:54:31<21:20:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 1: 19%|█▊ | 2314/12384 [4:54:31<21:19:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 1: 19%|█▊ | 2314/12384 [4:54:38<21:19:46, 7.63s/it, loss=0.0003, acc=0.9991, iter_time=9.13s]
Epoch 1: 19%|█▊ | 2315/12384 [4:54:38<21:18:19, 7.62s/it, loss=0.0003, acc=0.9991, iter_time=9.13s]
Epoch 1: 19%|█▊ | 2315/12384 [4:54:46<21:18:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 19%|█▊ | 2316/12384 [4:54:46<21:17:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 19%|█▊ | 2316/12384 [4:54:53<21:17:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.76s]
Epoch 1: 19%|█▊ | 2317/12384 [4:54:53<21:17:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.76s]
Epoch 1: 19%|█▊ | 2317/12384 [4:55:01<21:17:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.04s]
Epoch 1: 19%|█▊ | 2318/12384 [4:55:01<21:17:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.04s]
Epoch 1: 19%|█▊ | 2318/12384 [4:55:09<21:17:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.63s]
Epoch 1: 19%|█▊ | 2319/12384 [4:55:09<21:36:01, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=4.63s]
Epoch 1: 19%|█▊ | 2319/12384 [4:55:17<21:36:01, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=11.38s]
Epoch 1: 19%|█▊ | 2320/12384 [4:55:17<21:30:35, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=11.38s]
Epoch 1: 19%|█▊ | 2320/12384 [4:55:24<21:30:35, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.22s]
Epoch 1: 19%|█▊ | 2321/12384 [4:55:24<21:25:00, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.22s]
Epoch 1: 19%|█▊ | 2321/12384 [4:55:32<21:25:00, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 1: 19%|█▉ | 2322/12384 [4:55:32<21:21:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 1: 19%|█▉ | 2322/12384 [4:55:39<21:21:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 19%|█▉ | 2323/12384 [4:55:39<21:19:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 19%|█▉ | 2323/12384 [4:55:47<21:19:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 19%|█▉ | 2324/12384 [4:55:47<21:18:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 19%|█▉ | 2324/12384 [4:55:55<21:18:35, 7.63s/it, loss=0.0001, acc=0.9987, iter_time=4.80s]
Epoch 1: 19%|█▉ | 2325/12384 [4:55:55<21:17:34, 7.62s/it, loss=0.0001, acc=0.9987, iter_time=4.80s]
Epoch 1: 19%|█▉ | 2325/12384 [4:56:02<21:17:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 1: 19%|█▉ | 2326/12384 [4:56:02<21:16:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 1: 19%|█▉ | 2326/12384 [4:56:10<21:16:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 19%|█▉ | 2327/12384 [4:56:10<21:15:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 19%|█▉ | 2327/12384 [4:56:17<21:15:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 19%|█▉ | 2328/12384 [4:56:17<21:18:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 19%|█▉ | 2328/12384 [4:56:25<21:18:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 19%|█▉ | 2329/12384 [4:56:25<21:16:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 19%|█▉ | 2329/12384 [4:56:33<21:16:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 19%|█▉ | 2330/12384 [4:56:33<21:16:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 19%|█▉ | 2330/12384 [4:56:40<21:16:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 19%|█▉ | 2331/12384 [4:56:40<21:16:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 19%|█▉ | 2331/12384 [4:56:48<21:16:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 19%|█▉ | 2332/12384 [4:56:48<21:14:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 19%|█▉ | 2332/12384 [4:56:55<21:14:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 1: 19%|█▉ | 2333/12384 [4:56:55<21:14:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 1: 19%|█▉ | 2333/12384 [4:57:03<21:14:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 19%|█▉ | 2334/12384 [4:57:03<21:13:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 19%|█▉ | 2334/12384 [4:57:11<21:13:11, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=9.09s]
Epoch 1: 19%|█▉ | 2335/12384 [4:57:11<21:28:03, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=9.09s]
Epoch 1: 19%|█▉ | 2335/12384 [4:57:19<21:28:03, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 19%|█▉ | 2336/12384 [4:57:19<21:25:04, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 19%|█▉ | 2336/12384 [4:57:26<21:25:04, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 19%|█▉ | 2337/12384 [4:57:26<21:21:01, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 19%|█▉ | 2337/12384 [4:57:34<21:21:01, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 19%|█▉ | 2338/12384 [4:57:34<21:19:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 19%|█▉ | 2338/12384 [4:57:41<21:19:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 19%|█▉ | 2339/12384 [4:57:41<21:17:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 19%|█▉ | 2339/12384 [4:57:49<21:17:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 1: 19%|█▉ | 2340/12384 [4:57:49<21:18:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 1: 19%|█▉ | 2340/12384 [4:57:57<21:18:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 1: 19%|█▉ | 2341/12384 [4:57:57<21:16:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 1: 19%|█▉ | 2341/12384 [4:58:04<21:16:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 19%|█▉ | 2342/12384 [4:58:04<21:14:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 19%|█▉ | 2342/12384 [4:58:12<21:14:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 1: 19%|█▉ | 2343/12384 [4:58:12<21:14:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 1: 19%|█▉ | 2343/12384 [4:58:20<21:14:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.87s]
Epoch 1: 19%|█▉ | 2344/12384 [4:58:20<21:17:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.87s]
Epoch 1: 19%|█▉ | 2344/12384 [4:58:28<21:17:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 19%|█▉ | 2345/12384 [4:58:28<21:33:41, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 19%|█▉ | 2345/12384 [4:58:35<21:33:41, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 19%|█▉ | 2346/12384 [4:58:35<21:27:04, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 19%|█▉ | 2346/12384 [4:58:43<21:27:04, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 1: 19%|█▉ | 2347/12384 [4:58:43<21:25:26, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 1: 19%|█▉ | 2347/12384 [4:58:50<21:25:26, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.46s]
Epoch 1: 19%|█▉ | 2348/12384 [4:58:50<21:20:59, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.46s]
Epoch 1: 19%|█▉ | 2348/12384 [4:58:58<21:20:59, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 1: 19%|█▉ | 2349/12384 [4:58:58<21:18:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 1: 19%|█▉ | 2349/12384 [4:59:06<21:18:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 1: 19%|█▉ | 2350/12384 [4:59:06<21:16:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 1: 19%|█▉ | 2350/12384 [4:59:13<21:16:43, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.86s]
Epoch 1: 19%|█▉ | 2351/12384 [4:59:13<21:15:25, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.86s]
Epoch 1: 19%|█▉ | 2351/12384 [4:59:21<21:15:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.09s]
Epoch 1: 19%|█▉ | 2352/12384 [4:59:21<21:14:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.09s]
Epoch 1: 19%|█▉ | 2352/12384 [4:59:28<21:14:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 19%|█▉ | 2353/12384 [4:59:28<21:12:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 19%|█▉ | 2353/12384 [4:59:36<21:12:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 1: 19%|█▉ | 2354/12384 [4:59:36<21:13:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 1: 19%|█▉ | 2354/12384 [4:59:44<21:13:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 19%|█▉ | 2355/12384 [4:59:44<21:12:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 19%|█▉ | 2355/12384 [4:59:51<21:12:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 19%|█▉ | 2356/12384 [4:59:51<21:11:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 19%|█▉ | 2356/12384 [4:59:59<21:11:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 19%|█▉ | 2357/12384 [4:59:59<21:11:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 19%|█▉ | 2357/12384 [5:00:06<21:11:39, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.54s]
Epoch 1: 19%|█▉ | 2358/12384 [5:00:06<21:11:44, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.54s]
Epoch 1: 19%|█▉ | 2358/12384 [5:00:14<21:11:44, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 19%|█▉ | 2359/12384 [5:00:14<21:12:22, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 19%|█▉ | 2359/12384 [5:00:22<21:12:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 19%|█▉ | 2360/12384 [5:00:22<21:12:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 19%|█▉ | 2360/12384 [5:00:29<21:12:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 1: 19%|█▉ | 2361/12384 [5:00:29<21:11:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 1: 19%|█▉ | 2361/12384 [5:00:37<21:11:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 1: 19%|█▉ | 2362/12384 [5:00:37<21:11:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 1: 19%|█▉ | 2362/12384 [5:00:45<21:11:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 19%|█▉ | 2363/12384 [5:00:45<21:10:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 19%|█▉ | 2363/12384 [5:00:52<21:10:45, 7.61s/it, loss=0.0002, acc=0.9985, iter_time=7.61s]
Epoch 1: 19%|█▉ | 2364/12384 [5:00:52<21:15:12, 7.64s/it, loss=0.0002, acc=0.9985, iter_time=7.61s]
Epoch 1: 19%|█▉ | 2364/12384 [5:01:00<21:15:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 19%|█▉ | 2365/12384 [5:01:00<21:14:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 19%|█▉ | 2365/12384 [5:01:07<21:14:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 19%|█▉ | 2366/12384 [5:01:07<21:13:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 19%|█▉ | 2366/12384 [5:01:15<21:13:55, 7.63s/it, loss=0.0009, acc=0.9978, iter_time=6.01s]
Epoch 1: 19%|█▉ | 2367/12384 [5:01:15<21:12:46, 7.62s/it, loss=0.0009, acc=0.9978, iter_time=6.01s]
Epoch 1: 19%|█▉ | 2367/12384 [5:01:23<21:12:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 1: 19%|█▉ | 2368/12384 [5:01:23<21:12:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 1: 19%|█▉ | 2368/12384 [5:01:30<21:12:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.62s]
Epoch 1: 19%|█▉ | 2369/12384 [5:01:30<21:10:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.62s]
Epoch 1: 19%|█▉ | 2369/12384 [5:01:38<21:10:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 1: 19%|█▉ | 2370/12384 [5:01:38<21:09:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 1: 19%|█▉ | 2370/12384 [5:01:46<21:09:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 1: 19%|█▉ | 2371/12384 [5:01:46<21:25:17, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 1: 19%|█▉ | 2371/12384 [5:01:54<21:25:17, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 1: 19%|█▉ | 2372/12384 [5:01:54<21:24:58, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 1: 19%|█▉ | 2372/12384 [5:02:01<21:24:58, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 19%|█▉ | 2373/12384 [5:02:01<21:19:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 19%|█▉ | 2373/12384 [5:02:09<21:19:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 19%|█▉ | 2374/12384 [5:02:09<21:16:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 19%|█▉ | 2374/12384 [5:02:16<21:16:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 19%|█▉ | 2375/12384 [5:02:16<21:16:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 19%|█▉ | 2375/12384 [5:02:24<21:16:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 19%|█▉ | 2376/12384 [5:02:24<21:13:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 19%|█▉ | 2376/12384 [5:02:32<21:13:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.91s]
Epoch 1: 19%|█▉ | 2377/12384 [5:02:32<21:11:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.91s]
Epoch 1: 19%|█▉ | 2377/12384 [5:02:39<21:11:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 1: 19%|█▉ | 2378/12384 [5:02:39<21:11:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 1: 19%|█▉ | 2378/12384 [5:02:47<21:11:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.26s]
Epoch 1: 19%|█▉ | 2379/12384 [5:02:47<21:10:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.26s]
Epoch 1: 19%|█▉ | 2379/12384 [5:02:54<21:10:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 1: 19%|█▉ | 2380/12384 [5:02:54<21:10:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 1: 19%|█▉ | 2380/12384 [5:03:02<21:10:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 19%|█▉ | 2381/12384 [5:03:02<21:09:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 19%|█▉ | 2381/12384 [5:03:10<21:09:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 1: 19%|█▉ | 2382/12384 [5:03:10<21:08:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 1: 19%|█▉ | 2382/12384 [5:03:17<21:08:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 19%|█▉ | 2383/12384 [5:03:17<21:08:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 19%|█▉ | 2383/12384 [5:03:25<21:08:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 19%|█▉ | 2384/12384 [5:03:25<21:07:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 19%|█▉ | 2384/12384 [5:03:32<21:07:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 19%|█▉ | 2385/12384 [5:03:32<21:07:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 19%|█▉ | 2385/12384 [5:03:40<21:07:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 19%|█▉ | 2386/12384 [5:03:40<21:07:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 19%|█▉ | 2386/12384 [5:03:48<21:07:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 19%|█▉ | 2387/12384 [5:03:48<21:22:34, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 19%|█▉ | 2387/12384 [5:03:56<21:22:34, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 19%|█▉ | 2388/12384 [5:03:56<21:18:25, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 19%|█▉ | 2388/12384 [5:04:03<21:18:25, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 19%|█▉ | 2389/12384 [5:04:03<21:14:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 19%|█▉ | 2389/12384 [5:04:11<21:14:54, 7.65s/it, loss=0.0003, acc=0.9986, iter_time=7.61s]
Epoch 1: 19%|█▉ | 2390/12384 [5:04:11<21:13:21, 7.64s/it, loss=0.0003, acc=0.9986, iter_time=7.61s]
Epoch 1: 19%|█▉ | 2390/12384 [5:04:18<21:13:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 19%|█▉ | 2391/12384 [5:04:18<21:14:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 19%|█▉ | 2391/12384 [5:04:26<21:14:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 19%|█▉ | 2392/12384 [5:04:26<21:11:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 19%|█▉ | 2392/12384 [5:04:34<21:11:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 1: 19%|█▉ | 2393/12384 [5:04:34<21:09:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 1: 19%|█▉ | 2393/12384 [5:04:41<21:09:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 1: 19%|█▉ | 2394/12384 [5:04:41<21:07:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 1: 19%|█▉ | 2394/12384 [5:04:49<21:07:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 1: 19%|█▉ | 2395/12384 [5:04:49<21:06:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 1: 19%|█▉ | 2395/12384 [5:04:56<21:06:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 19%|█▉ | 2396/12384 [5:04:56<21:06:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 19%|█▉ | 2396/12384 [5:05:04<21:06:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 1: 19%|█▉ | 2397/12384 [5:05:04<21:21:06, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 1: 19%|█▉ | 2397/12384 [5:05:12<21:21:06, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 1: 19%|█▉ | 2398/12384 [5:05:12<21:16:06, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 1: 19%|█▉ | 2398/12384 [5:05:20<21:16:06, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 1: 19%|█▉ | 2399/12384 [5:05:20<21:13:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 1: 19%|█▉ | 2399/12384 [5:05:27<21:13:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.86s]
Epoch 1: 19%|█▉ | 2400/12384 [5:05:27<21:11:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.86s]
Epoch 1: 19%|█▉ | 2400/12384 [5:05:35<21:11:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 1: 19%|█▉ | 2401/12384 [5:05:35<21:09:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 1: 19%|█▉ | 2401/12384 [5:05:42<21:09:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.32s]
Epoch 1: 19%|█▉ | 2402/12384 [5:05:42<21:10:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.32s]
Epoch 1: 19%|█▉ | 2402/12384 [5:05:50<21:10:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.04s]
Epoch 1: 19%|█▉ | 2403/12384 [5:05:50<21:09:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.04s]
Epoch 1: 19%|█▉ | 2403/12384 [5:05:58<21:09:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 19%|█▉ | 2404/12384 [5:05:58<21:08:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 19%|█▉ | 2404/12384 [5:06:05<21:08:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 1: 19%|█▉ | 2405/12384 [5:06:05<21:08:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 1: 19%|█▉ | 2405/12384 [5:06:13<21:08:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 1: 19%|█▉ | 2406/12384 [5:06:13<21:06:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 1: 19%|█▉ | 2406/12384 [5:06:21<21:06:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 19%|█▉ | 2407/12384 [5:06:21<21:11:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 19%|█▉ | 2407/12384 [5:06:28<21:11:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 1: 19%|█▉ | 2408/12384 [5:06:28<21:10:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 1: 19%|█▉ | 2408/12384 [5:06:36<21:10:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.47s]
Epoch 1: 19%|█▉ | 2409/12384 [5:06:36<21:09:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.47s]
Epoch 1: 19%|█▉ | 2409/12384 [5:06:43<21:09:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 1: 19%|█▉ | 2410/12384 [5:06:43<21:07:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 1: 19%|█▉ | 2410/12384 [5:06:51<21:07:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 1: 19%|█▉ | 2411/12384 [5:06:51<21:06:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 1: 19%|█▉ | 2411/12384 [5:06:59<21:06:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 1: 19%|█▉ | 2412/12384 [5:06:59<21:06:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 1: 19%|█▉ | 2412/12384 [5:07:07<21:06:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 19%|█▉ | 2413/12384 [5:07:07<21:20:29, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 19%|█▉ | 2413/12384 [5:07:14<21:20:29, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 19%|█▉ | 2414/12384 [5:07:14<21:15:14, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 19%|█▉ | 2414/12384 [5:07:22<21:15:14, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 20%|█▉ | 2415/12384 [5:07:22<21:12:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 20%|█▉ | 2415/12384 [5:07:30<21:12:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 1: 20%|█▉ | 2416/12384 [5:07:30<21:14:36, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 1: 20%|█▉ | 2416/12384 [5:07:37<21:14:36, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.02s]
Epoch 1: 20%|█▉ | 2417/12384 [5:07:37<21:11:38, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.02s]
Epoch 1: 20%|█▉ | 2417/12384 [5:07:45<21:11:38, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 20%|█▉ | 2418/12384 [5:07:45<21:08:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 20%|█▉ | 2418/12384 [5:07:52<21:08:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 1: 20%|█▉ | 2419/12384 [5:07:52<21:07:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 1: 20%|█▉ | 2419/12384 [5:08:00<21:07:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 1: 20%|█▉ | 2420/12384 [5:08:00<21:06:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 1: 20%|█▉ | 2420/12384 [5:08:08<21:06:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 20%|█▉ | 2421/12384 [5:08:08<21:05:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 20%|█▉ | 2421/12384 [5:08:15<21:05:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 20%|█▉ | 2422/12384 [5:08:15<21:04:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 20%|█▉ | 2422/12384 [5:08:23<21:04:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 20%|█▉ | 2423/12384 [5:08:23<21:08:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 20%|█▉ | 2423/12384 [5:08:31<21:08:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 1: 20%|█▉ | 2424/12384 [5:08:31<21:23:44, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 1: 20%|█▉ | 2424/12384 [5:08:38<21:23:44, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.47s]
Epoch 1: 20%|█▉ | 2425/12384 [5:08:38<21:17:45, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.47s]
Epoch 1: 20%|█▉ | 2425/12384 [5:08:46<21:17:45, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 1: 20%|█▉ | 2426/12384 [5:08:46<21:13:25, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 1: 20%|█▉ | 2426/12384 [5:08:54<21:13:25, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 1: 20%|█▉ | 2427/12384 [5:08:54<21:08:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 1: 20%|█▉ | 2427/12384 [5:09:01<21:08:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 20%|█▉ | 2428/12384 [5:09:01<21:07:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 20%|█▉ | 2428/12384 [5:09:09<21:07:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 1: 20%|█▉ | 2429/12384 [5:09:09<21:06:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 1: 20%|█▉ | 2429/12384 [5:09:17<21:06:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 1: 20%|█▉ | 2430/12384 [5:09:17<21:05:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 1: 20%|█▉ | 2430/12384 [5:09:24<21:05:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 20%|█▉ | 2431/12384 [5:09:24<21:04:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 20%|█▉ | 2431/12384 [5:09:32<21:04:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 1: 20%|█▉ | 2432/12384 [5:09:32<21:02:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 1: 20%|█▉ | 2432/12384 [5:09:39<21:02:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 20%|█▉ | 2433/12384 [5:09:39<21:01:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 20%|█▉ | 2433/12384 [5:09:47<21:01:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.79s]
Epoch 1: 20%|█▉ | 2434/12384 [5:09:47<21:01:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=3.79s]
Epoch 1: 20%|█▉ | 2434/12384 [5:09:54<21:01:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.40s]
Epoch 1: 20%|█▉ | 2435/12384 [5:09:54<21:00:08, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.40s]
Epoch 1: 20%|█▉ | 2435/12384 [5:10:02<21:00:08, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 1: 20%|█▉ | 2436/12384 [5:10:02<21:01:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 1: 20%|█▉ | 2436/12384 [5:10:10<21:01:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 1: 20%|█▉ | 2437/12384 [5:10:10<21:06:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 1: 20%|█▉ | 2437/12384 [5:10:17<21:06:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.44s]
Epoch 1: 20%|█▉ | 2438/12384 [5:10:17<21:05:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.44s]
Epoch 1: 20%|█▉ | 2438/12384 [5:10:25<21:05:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 1: 20%|█▉ | 2439/12384 [5:10:25<21:04:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 1: 20%|█▉ | 2439/12384 [5:10:33<21:04:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 1: 20%|█▉ | 2440/12384 [5:10:33<21:20:21, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 1: 20%|█▉ | 2440/12384 [5:10:41<21:20:21, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 20%|█▉ | 2441/12384 [5:10:41<21:13:53, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 20%|█▉ | 2441/12384 [5:10:48<21:13:53, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 20%|█▉ | 2442/12384 [5:10:48<21:13:11, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 20%|█▉ | 2442/12384 [5:10:56<21:13:11, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 20%|█▉ | 2443/12384 [5:10:56<21:08:37, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 20%|█▉ | 2443/12384 [5:11:03<21:08:37, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 1: 20%|█▉ | 2444/12384 [5:11:03<21:05:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 1: 20%|█▉ | 2444/12384 [5:11:11<21:05:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 1: 20%|█▉ | 2445/12384 [5:11:11<21:03:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 1: 20%|█▉ | 2445/12384 [5:11:19<21:03:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.75s]
Epoch 1: 20%|█▉ | 2446/12384 [5:11:19<21:03:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.75s]
Epoch 1: 20%|█▉ | 2446/12384 [5:11:26<21:03:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 20%|█▉ | 2447/12384 [5:11:26<21:05:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 20%|█▉ | 2447/12384 [5:11:34<21:05:57, 7.64s/it, loss=0.0000, acc=0.9999, iter_time=8.09s]
Epoch 1: 20%|█▉ | 2448/12384 [5:11:34<21:04:30, 7.64s/it, loss=0.0000, acc=0.9999, iter_time=8.09s]
Epoch 1: 20%|█▉ | 2448/12384 [5:11:42<21:04:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 20%|█▉ | 2449/12384 [5:11:42<21:03:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 20%|█▉ | 2449/12384 [5:11:50<21:03:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.63s]
Epoch 1: 20%|█▉ | 2450/12384 [5:11:50<21:19:29, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=5.63s]
Epoch 1: 20%|█▉ | 2450/12384 [5:11:57<21:19:29, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 1: 20%|█▉ | 2451/12384 [5:11:57<21:12:28, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 1: 20%|█▉ | 2451/12384 [5:12:05<21:12:28, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 20%|█▉ | 2452/12384 [5:12:05<21:07:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 20%|█▉ | 2452/12384 [5:12:12<21:07:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 20%|█▉ | 2453/12384 [5:12:12<21:05:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 20%|█▉ | 2453/12384 [5:12:20<21:05:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 1: 20%|█▉ | 2454/12384 [5:12:20<21:03:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 1: 20%|█▉ | 2454/12384 [5:12:28<21:03:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 1: 20%|█▉ | 2455/12384 [5:12:28<21:02:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 1: 20%|█▉ | 2455/12384 [5:12:35<21:02:43, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=8.02s]
Epoch 1: 20%|█▉ | 2456/12384 [5:12:35<21:02:11, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=8.02s]
Epoch 1: 20%|█▉ | 2456/12384 [5:12:43<21:02:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.92s]
Epoch 1: 20%|█▉ | 2457/12384 [5:12:43<20:59:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.92s]
Epoch 1: 20%|█▉ | 2457/12384 [5:12:50<20:59:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.88s]
Epoch 1: 20%|█▉ | 2458/12384 [5:12:50<20:59:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.88s]
Epoch 1: 20%|█▉ | 2458/12384 [5:12:58<20:59:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 1: 20%|█▉ | 2459/12384 [5:12:58<20:58:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 1: 20%|█▉ | 2459/12384 [5:13:06<20:58:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.99s]
Epoch 1: 20%|█▉ | 2460/12384 [5:13:06<20:59:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.99s]
Epoch 1: 20%|█▉ | 2460/12384 [5:13:13<20:59:14, 7.61s/it, loss=0.0007, acc=0.9977, iter_time=9.08s]
Epoch 1: 20%|█▉ | 2461/12384 [5:13:13<20:57:54, 7.61s/it, loss=0.0007, acc=0.9977, iter_time=9.08s]
Epoch 1: 20%|█▉ | 2461/12384 [5:13:21<20:57:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 20%|█▉ | 2462/12384 [5:13:21<20:58:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 20%|█▉ | 2462/12384 [5:13:28<20:58:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 1: 20%|█▉ | 2463/12384 [5:13:28<20:58:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 1: 20%|█▉ | 2463/12384 [5:13:36<20:58:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.79s]
Epoch 1: 20%|█▉ | 2464/12384 [5:13:36<20:58:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.79s]
Epoch 1: 20%|█▉ | 2464/12384 [5:13:44<20:58:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 20%|█▉ | 2465/12384 [5:13:44<20:58:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 20%|█▉ | 2465/12384 [5:13:52<20:58:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.37s]
Epoch 1: 20%|█▉ | 2466/12384 [5:13:52<21:15:16, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.37s]
Epoch 1: 20%|█▉ | 2466/12384 [5:13:59<21:15:16, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=3.89s]
Epoch 1: 20%|█▉ | 2467/12384 [5:13:59<21:10:11, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=3.89s]
Epoch 1: 20%|█▉ | 2467/12384 [5:14:07<21:10:11, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 1: 20%|█▉ | 2468/12384 [5:14:07<21:09:39, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 1: 20%|█▉ | 2468/12384 [5:14:15<21:09:39, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=11.52s]
Epoch 1: 20%|█▉ | 2469/12384 [5:14:15<21:06:37, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=11.52s]
Epoch 1: 20%|█▉ | 2469/12384 [5:14:22<21:06:37, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 20%|█▉ | 2470/12384 [5:14:22<21:04:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 20%|█▉ | 2470/12384 [5:14:30<21:04:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 1: 20%|█▉ | 2471/12384 [5:14:30<21:02:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 1: 20%|█▉ | 2471/12384 [5:14:37<21:02:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 20%|█▉ | 2472/12384 [5:14:37<21:01:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 20%|█▉ | 2472/12384 [5:14:45<21:01:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.96s]
Epoch 1: 20%|█▉ | 2473/12384 [5:14:45<21:01:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.96s]
Epoch 1: 20%|█▉ | 2473/12384 [5:14:53<21:01:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.31s]
Epoch 1: 20%|█▉ | 2474/12384 [5:14:53<20:59:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.31s]
Epoch 1: 20%|█▉ | 2474/12384 [5:15:00<20:59:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 1: 20%|█▉ | 2475/12384 [5:15:00<20:59:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 1: 20%|█▉ | 2475/12384 [5:15:08<20:59:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 20%|█▉ | 2476/12384 [5:15:08<20:58:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 20%|█▉ | 2476/12384 [5:15:16<20:58:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 1: 20%|██ | 2477/12384 [5:15:16<21:19:15, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 1: 20%|██ | 2477/12384 [5:15:24<21:19:15, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 1: 20%|██ | 2478/12384 [5:15:24<21:12:56, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 1: 20%|██ | 2478/12384 [5:15:31<21:12:56, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.37s]
Epoch 1: 20%|██ | 2479/12384 [5:15:31<21:08:56, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.37s]
Epoch 1: 20%|██ | 2479/12384 [5:15:39<21:08:56, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 1: 20%|██ | 2480/12384 [5:15:39<21:05:08, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 1: 20%|██ | 2480/12384 [5:15:46<21:05:08, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 20%|██ | 2481/12384 [5:15:46<21:04:25, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 20%|██ | 2481/12384 [5:15:54<21:04:25, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 1: 20%|██ | 2482/12384 [5:15:54<21:04:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 1: 20%|██ | 2482/12384 [5:16:02<21:04:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.59s]
Epoch 1: 20%|██ | 2483/12384 [5:16:02<21:01:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.59s]
Epoch 1: 20%|██ | 2483/12384 [5:16:09<21:01:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 20%|██ | 2484/12384 [5:16:09<20:59:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 20%|██ | 2484/12384 [5:16:17<20:59:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 20%|██ | 2485/12384 [5:16:17<20:58:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 20%|██ | 2485/12384 [5:16:25<20:58:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.99s]
Epoch 1: 20%|██ | 2486/12384 [5:16:25<20:57:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.99s]
Epoch 1: 20%|██ | 2486/12384 [5:16:32<20:57:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 1: 20%|██ | 2487/12384 [5:16:32<20:56:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 1: 20%|██ | 2487/12384 [5:16:40<20:56:40, 7.62s/it, loss=0.0008, acc=0.9973, iter_time=8.02s]
Epoch 1: 20%|██ | 2488/12384 [5:16:40<20:57:16, 7.62s/it, loss=0.0008, acc=0.9973, iter_time=8.02s]
Epoch 1: 20%|██ | 2488/12384 [5:16:48<20:57:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 20%|██ | 2489/12384 [5:16:48<21:00:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 20%|██ | 2489/12384 [5:16:55<21:00:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 20%|██ | 2490/12384 [5:16:55<21:03:43, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 20%|██ | 2490/12384 [5:17:03<21:03:43, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.72s]
Epoch 1: 20%|██ | 2491/12384 [5:17:03<21:01:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.72s]
Epoch 1: 20%|██ | 2491/12384 [5:17:10<21:01:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.60s]
Epoch 1: 20%|██ | 2492/12384 [5:17:10<20:58:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.60s]
Epoch 1: 20%|██ | 2492/12384 [5:17:18<20:58:09, 7.63s/it, loss=0.0004, acc=0.9987, iter_time=7.89s]
Epoch 1: 20%|██ | 2493/12384 [5:17:18<21:10:41, 7.71s/it, loss=0.0004, acc=0.9987, iter_time=7.89s]
Epoch 1: 20%|██ | 2493/12384 [5:17:26<21:10:41, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 20%|██ | 2494/12384 [5:17:26<21:09:44, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 20%|██ | 2494/12384 [5:17:34<21:09:44, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 1: 20%|██ | 2495/12384 [5:17:34<21:06:52, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 1: 20%|██ | 2495/12384 [5:17:41<21:06:52, 7.69s/it, loss=0.0003, acc=0.9994, iter_time=7.57s]
Epoch 1: 20%|██ | 2496/12384 [5:17:41<21:03:44, 7.67s/it, loss=0.0003, acc=0.9994, iter_time=7.57s]
Epoch 1: 20%|██ | 2496/12384 [5:17:49<21:03:44, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 20%|██ | 2497/12384 [5:17:49<21:00:58, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 20%|██ | 2497/12384 [5:17:57<21:00:58, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 20%|██ | 2498/12384 [5:17:57<20:59:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 20%|██ | 2498/12384 [5:18:04<20:59:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 1: 20%|██ | 2499/12384 [5:18:04<20:58:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 1: 20%|██ | 2499/12384 [5:18:12<20:58:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 1: 20%|██ | 2500/12384 [5:18:12<20:58:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 1: 20%|██ | 2500/12384 [5:18:19<20:58:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 1: 20%|██ | 2501/12384 [5:18:19<20:58:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 1: 20%|██ | 2501/12384 [5:18:27<20:58:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 20%|██ | 2502/12384 [5:18:27<20:56:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 20%|██ | 2502/12384 [5:18:35<20:56:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 20%|██ | 2503/12384 [5:18:35<21:13:34, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 20%|██ | 2503/12384 [5:18:43<21:13:34, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 1: 20%|██ | 2504/12384 [5:18:43<21:08:31, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 1: 20%|██ | 2504/12384 [5:18:50<21:08:31, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 20%|██ | 2505/12384 [5:18:50<21:04:25, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 20%|██ | 2505/12384 [5:18:58<21:04:25, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 20%|██ | 2506/12384 [5:18:58<21:00:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 20%|██ | 2506/12384 [5:19:05<21:00:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 20%|██ | 2507/12384 [5:19:05<20:57:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 20%|██ | 2507/12384 [5:19:13<20:57:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 20%|██ | 2508/12384 [5:19:13<20:55:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 20%|██ | 2508/12384 [5:19:21<20:55:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 20%|██ | 2509/12384 [5:19:21<20:54:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 20%|██ | 2509/12384 [5:19:28<20:54:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 20%|██ | 2510/12384 [5:19:28<20:54:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 20%|██ | 2510/12384 [5:19:36<20:54:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 20%|██ | 2511/12384 [5:19:36<20:52:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 20%|██ | 2511/12384 [5:19:43<20:52:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 20%|██ | 2512/12384 [5:19:43<20:52:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 20%|██ | 2512/12384 [5:19:51<20:52:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 20%|██ | 2513/12384 [5:19:51<20:52:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 20%|██ | 2513/12384 [5:19:59<20:52:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 1: 20%|██ | 2514/12384 [5:19:59<20:51:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 1: 20%|██ | 2514/12384 [5:20:06<20:51:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 1: 20%|██ | 2515/12384 [5:20:06<20:51:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 1: 20%|██ | 2515/12384 [5:20:14<20:51:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 20%|██ | 2516/12384 [5:20:14<20:51:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 20%|██ | 2516/12384 [5:20:22<20:51:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 20%|██ | 2517/12384 [5:20:22<20:52:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 20%|██ | 2517/12384 [5:20:29<20:52:02, 7.61s/it, loss=0.0013, acc=0.9987, iter_time=7.63s]
Epoch 1: 20%|██ | 2518/12384 [5:20:29<20:52:12, 7.62s/it, loss=0.0013, acc=0.9987, iter_time=7.63s]
Epoch 1: 20%|██ | 2518/12384 [5:20:37<20:52:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 1: 20%|██ | 2519/12384 [5:20:37<20:52:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 1: 20%|██ | 2519/12384 [5:20:44<20:52:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 1: 20%|██ | 2520/12384 [5:20:44<20:52:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 1: 20%|██ | 2520/12384 [5:20:52<20:52:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 20%|██ | 2521/12384 [5:20:52<20:50:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 20%|██ | 2521/12384 [5:21:00<20:50:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 20%|██ | 2522/12384 [5:21:00<20:50:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 20%|██ | 2522/12384 [5:21:07<20:50:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 20%|██ | 2523/12384 [5:21:07<20:49:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 20%|██ | 2523/12384 [5:21:15<20:49:55, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 1: 20%|██ | 2524/12384 [5:21:15<20:49:33, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 1: 20%|██ | 2524/12384 [5:21:22<20:49:33, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 20%|██ | 2525/12384 [5:21:22<20:48:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 20%|██ | 2525/12384 [5:21:30<20:48:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.20s]
Epoch 1: 20%|██ | 2526/12384 [5:21:30<20:49:12, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.20s]
Epoch 1: 20%|██ | 2526/12384 [5:21:38<20:49:12, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 1: 20%|██ | 2527/12384 [5:21:38<20:49:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 1: 20%|██ | 2527/12384 [5:21:45<20:49:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 20%|██ | 2528/12384 [5:21:45<20:53:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 20%|██ | 2528/12384 [5:21:53<20:53:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 1: 20%|██ | 2529/12384 [5:21:53<21:09:46, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 1: 20%|██ | 2529/12384 [5:22:01<21:09:46, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 20%|██ | 2530/12384 [5:22:01<21:03:50, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 20%|██ | 2530/12384 [5:22:09<21:03:50, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 20%|██ | 2531/12384 [5:22:09<21:00:28, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 20%|██ | 2531/12384 [5:22:16<21:00:28, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 20%|██ | 2532/12384 [5:22:16<20:57:43, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 20%|██ | 2532/12384 [5:22:24<20:57:43, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 20%|██ | 2533/12384 [5:22:24<20:54:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 20%|██ | 2533/12384 [5:22:31<20:54:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 1: 20%|██ | 2534/12384 [5:22:31<20:52:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 1: 20%|██ | 2534/12384 [5:22:39<20:52:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 20%|██ | 2535/12384 [5:22:39<20:51:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 20%|██ | 2535/12384 [5:22:47<20:51:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.61s]
Epoch 1: 20%|██ | 2536/12384 [5:22:47<20:50:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.61s]
Epoch 1: 20%|██ | 2536/12384 [5:22:54<20:50:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.60s]
Epoch 1: 20%|██ | 2537/12384 [5:22:54<20:50:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.60s]
Epoch 1: 20%|██ | 2537/12384 [5:23:02<20:50:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.23s]
Epoch 1: 20%|██ | 2538/12384 [5:23:02<20:49:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.23s]
Epoch 1: 20%|██ | 2538/12384 [5:23:09<20:49:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 1: 21%|██ | 2539/12384 [5:23:09<20:49:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 1: 21%|██ | 2539/12384 [5:23:17<20:49:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.62s]
Epoch 1: 21%|██ | 2540/12384 [5:23:17<20:48:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.62s]
Epoch 1: 21%|██ | 2540/12384 [5:23:25<20:48:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 1: 21%|██ | 2541/12384 [5:23:25<20:53:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 1: 21%|██ | 2541/12384 [5:23:32<20:53:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 21%|██ | 2542/12384 [5:23:32<20:50:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 21%|██ | 2542/12384 [5:23:40<20:50:38, 7.62s/it, loss=0.0003, acc=0.9994, iter_time=9.13s]
Epoch 1: 21%|██ | 2543/12384 [5:23:40<20:50:07, 7.62s/it, loss=0.0003, acc=0.9994, iter_time=9.13s]
Epoch 1: 21%|██ | 2543/12384 [5:23:48<20:50:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 1: 21%|██ | 2544/12384 [5:23:48<20:50:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 1: 21%|██ | 2544/12384 [5:23:55<20:50:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 21%|██ | 2545/12384 [5:23:55<21:03:51, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 21%|██ | 2545/12384 [5:24:03<21:03:51, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 21%|██ | 2546/12384 [5:24:03<20:59:03, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 21%|██ | 2546/12384 [5:24:11<20:59:03, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 21%|██ | 2547/12384 [5:24:11<20:55:31, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 21%|██ | 2547/12384 [5:24:18<20:55:31, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 1: 21%|██ | 2548/12384 [5:24:18<20:53:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 1: 21%|██ | 2548/12384 [5:24:26<20:53:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 1: 21%|██ | 2549/12384 [5:24:26<20:51:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 1: 21%|██ | 2549/12384 [5:24:33<20:51:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.32s]
Epoch 1: 21%|██ | 2550/12384 [5:24:33<20:49:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.32s]
Epoch 1: 21%|██ | 2550/12384 [5:24:41<20:49:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 21%|██ | 2551/12384 [5:24:41<20:47:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 21%|██ | 2551/12384 [5:24:49<20:47:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 21%|██ | 2552/12384 [5:24:49<20:46:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 21%|██ | 2552/12384 [5:24:56<20:46:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 21%|██ | 2553/12384 [5:24:56<20:47:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 21%|██ | 2553/12384 [5:25:04<20:47:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 21%|██ | 2554/12384 [5:25:04<20:46:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 21%|██ | 2554/12384 [5:25:12<20:46:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 1: 21%|██ | 2555/12384 [5:25:12<21:02:02, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 1: 21%|██ | 2555/12384 [5:25:19<21:02:02, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.14s]
Epoch 1: 21%|██ | 2556/12384 [5:25:19<20:57:19, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.14s]
Epoch 1: 21%|██ | 2556/12384 [5:25:27<20:57:19, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.27s]
Epoch 1: 21%|██ | 2557/12384 [5:25:27<20:53:53, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.27s]
Epoch 1: 21%|██ | 2557/12384 [5:25:35<20:53:53, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.21s]
Epoch 1: 21%|██ | 2558/12384 [5:25:35<20:50:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.21s]
Epoch 1: 21%|██ | 2558/12384 [5:25:42<20:50:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 1: 21%|██ | 2559/12384 [5:25:42<20:48:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 1: 21%|██ | 2559/12384 [5:25:50<20:48:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 21%|██ | 2560/12384 [5:25:50<20:46:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 21%|██ | 2560/12384 [5:25:57<20:46:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 21%|██ | 2561/12384 [5:25:57<20:46:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 21%|██ | 2561/12384 [5:26:05<20:46:07, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.48s]
Epoch 1: 21%|██ | 2562/12384 [5:26:05<20:46:29, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.48s]
Epoch 1: 21%|██ | 2562/12384 [5:26:13<20:46:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 1: 21%|██ | 2563/12384 [5:26:13<20:45:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 1: 21%|██ | 2563/12384 [5:26:20<20:45:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.24s]
Epoch 1: 21%|██ | 2564/12384 [5:26:20<20:44:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.24s]
Epoch 1: 21%|██ | 2564/12384 [5:26:28<20:44:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.94s]
Epoch 1: 21%|██ | 2565/12384 [5:26:28<20:43:50, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.94s]
Epoch 1: 21%|██ | 2565/12384 [5:26:35<20:43:50, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 21%|██ | 2566/12384 [5:26:35<20:43:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 21%|██ | 2566/12384 [5:26:43<20:43:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.67s]
Epoch 1: 21%|██ | 2567/12384 [5:26:43<20:44:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.67s]
Epoch 1: 21%|██ | 2567/12384 [5:26:51<20:44:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.54s]
Epoch 1: 21%|██ | 2568/12384 [5:26:51<20:45:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.54s]
Epoch 1: 21%|██ | 2568/12384 [5:26:58<20:45:23, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.24s]
Epoch 1: 21%|██ | 2569/12384 [5:26:58<20:45:25, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.24s]
Epoch 1: 21%|██ | 2569/12384 [5:27:06<20:45:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 21%|██ | 2570/12384 [5:27:06<20:45:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 21%|██ | 2570/12384 [5:27:14<20:45:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 21%|██ | 2571/12384 [5:27:14<20:58:50, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 21%|██ | 2571/12384 [5:27:21<20:58:50, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 1: 21%|██ | 2572/12384 [5:27:21<20:54:49, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 1: 21%|██ | 2572/12384 [5:27:29<20:54:49, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=11.15s]
Epoch 1: 21%|██ | 2573/12384 [5:27:29<20:51:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.15s]
Epoch 1: 21%|██ | 2573/12384 [5:27:37<20:51:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 21%|██ | 2574/12384 [5:27:37<20:49:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 21%|██ | 2574/12384 [5:27:44<20:49:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 21%|██ | 2575/12384 [5:27:44<20:47:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 21%|██ | 2575/12384 [5:27:52<20:47:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 21%|██ | 2576/12384 [5:27:52<20:47:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 21%|██ | 2576/12384 [5:27:59<20:47:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 21%|██ | 2577/12384 [5:27:59<20:46:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 21%|██ | 2577/12384 [5:28:07<20:46:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 21%|██ | 2578/12384 [5:28:07<20:45:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 21%|██ | 2578/12384 [5:28:15<20:45:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 1: 21%|██ | 2579/12384 [5:28:15<20:45:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 1: 21%|██ | 2579/12384 [5:28:22<20:45:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.46s]
Epoch 1: 21%|██ | 2580/12384 [5:28:22<20:44:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.46s]
Epoch 1: 21%|██ | 2580/12384 [5:28:30<20:44:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 21%|██ | 2581/12384 [5:28:30<21:00:04, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 21%|██ | 2581/12384 [5:28:38<21:00:04, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 21%|██ | 2582/12384 [5:28:38<20:55:14, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 21%|██ | 2582/12384 [5:28:46<20:55:14, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 21%|██ | 2583/12384 [5:28:46<20:56:17, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 21%|██ | 2583/12384 [5:28:53<20:56:17, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 21%|██ | 2584/12384 [5:28:53<20:51:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 21%|██ | 2584/12384 [5:29:01<20:51:36, 7.66s/it, loss=0.0003, acc=0.9991, iter_time=7.21s]
Epoch 1: 21%|██ | 2585/12384 [5:29:01<20:48:33, 7.64s/it, loss=0.0003, acc=0.9991, iter_time=7.21s]
Epoch 1: 21%|██ | 2585/12384 [5:29:08<20:48:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 1: 21%|██ | 2586/12384 [5:29:08<20:46:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 1: 21%|██ | 2586/12384 [5:29:16<20:46:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 1: 21%|██ | 2587/12384 [5:29:16<20:46:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 1: 21%|██ | 2587/12384 [5:29:24<20:46:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 21%|██ | 2588/12384 [5:29:24<20:46:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 21%|██ | 2588/12384 [5:29:31<20:46:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 1: 21%|██ | 2589/12384 [5:29:31<20:44:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 1: 21%|██ | 2589/12384 [5:29:39<20:44:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.83s]
Epoch 1: 21%|██ | 2590/12384 [5:29:39<20:43:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.83s]
Epoch 1: 21%|██ | 2590/12384 [5:29:46<20:43:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 1: 21%|██ | 2591/12384 [5:29:46<20:43:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 1: 21%|██ | 2591/12384 [5:29:54<20:43:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 21%|██ | 2592/12384 [5:29:54<20:41:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 21%|██ | 2592/12384 [5:30:02<20:41:52, 7.61s/it, loss=0.0013, acc=0.9966, iter_time=4.36s]
Epoch 1: 21%|██ | 2593/12384 [5:30:02<20:43:19, 7.62s/it, loss=0.0013, acc=0.9966, iter_time=4.36s]
Epoch 1: 21%|██ | 2593/12384 [5:30:09<20:43:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 21%|██ | 2594/12384 [5:30:09<20:43:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 21%|██ | 2594/12384 [5:30:17<20:43:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.94s]
Epoch 1: 21%|██ | 2595/12384 [5:30:17<20:45:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.94s]
Epoch 1: 21%|██ | 2595/12384 [5:30:25<20:45:22, 7.63s/it, loss=0.0001, acc=0.9994, iter_time=7.65s]
Epoch 1: 21%|██ | 2596/12384 [5:30:25<20:44:35, 7.63s/it, loss=0.0001, acc=0.9994, iter_time=7.65s]
Epoch 1: 21%|██ | 2596/12384 [5:30:33<20:44:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 21%|██ | 2597/12384 [5:30:33<20:57:38, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 21%|██ | 2597/12384 [5:30:40<20:57:38, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 21%|██ | 2598/12384 [5:30:40<20:51:52, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 21%|██ | 2598/12384 [5:30:48<20:51:52, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 21%|██ | 2599/12384 [5:30:48<20:50:33, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 21%|██ | 2599/12384 [5:30:55<20:50:33, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 21%|██ | 2600/12384 [5:30:55<20:46:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 21%|██ | 2600/12384 [5:31:03<20:46:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 21%|██ | 2601/12384 [5:31:03<20:44:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 21%|██ | 2601/12384 [5:31:11<20:44:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 21%|██ | 2602/12384 [5:31:11<20:42:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 21%|██ | 2602/12384 [5:31:18<20:42:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 21%|██ | 2603/12384 [5:31:18<20:42:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 21%|██ | 2603/12384 [5:31:26<20:42:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 1: 21%|██ | 2604/12384 [5:31:26<20:40:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 1: 21%|██ | 2604/12384 [5:31:33<20:40:40, 7.61s/it, loss=0.0001, acc=0.9988, iter_time=9.89s]
Epoch 1: 21%|██ | 2605/12384 [5:31:33<20:40:14, 7.61s/it, loss=0.0001, acc=0.9988, iter_time=9.89s]
Epoch 1: 21%|██ | 2605/12384 [5:31:41<20:40:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 21%|██ | 2606/12384 [5:31:41<20:39:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 21%|██ | 2606/12384 [5:31:49<20:39:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 21%|██ | 2607/12384 [5:31:49<20:39:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 21%|██ | 2607/12384 [5:31:56<20:39:23, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=8.05s]
Epoch 1: 21%|██ | 2608/12384 [5:31:56<20:54:56, 7.70s/it, loss=0.0002, acc=1.0000, iter_time=8.05s]
Epoch 1: 21%|██ | 2608/12384 [5:32:04<20:54:56, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.87s]
Epoch 1: 21%|██ | 2609/12384 [5:32:04<20:50:02, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.87s]
Epoch 1: 21%|██ | 2609/12384 [5:32:12<20:50:02, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.08s]
Epoch 1: 21%|██ | 2610/12384 [5:32:12<20:46:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.08s]
Epoch 1: 21%|██ | 2610/12384 [5:32:19<20:46:48, 7.65s/it, loss=0.0007, acc=0.9995, iter_time=10.73s]
Epoch 1: 21%|██ | 2611/12384 [5:32:19<20:48:23, 7.66s/it, loss=0.0007, acc=0.9995, iter_time=10.73s]
Epoch 1: 21%|██ | 2611/12384 [5:32:27<20:48:23, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 1: 21%|██ | 2612/12384 [5:32:27<20:46:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 1: 21%|██ | 2612/12384 [5:32:35<20:46:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.47s]
Epoch 1: 21%|██ | 2613/12384 [5:32:35<20:43:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.47s]
Epoch 1: 21%|██ | 2613/12384 [5:32:42<20:43:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 21%|██ | 2614/12384 [5:32:42<20:42:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 21%|██ | 2614/12384 [5:32:50<20:42:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.38s]
Epoch 1: 21%|██ | 2615/12384 [5:32:50<20:40:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.38s]
Epoch 1: 21%|██ | 2615/12384 [5:32:57<20:40:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 21%|██ | 2616/12384 [5:32:58<20:49:26, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 21%|██ | 2616/12384 [5:33:05<20:49:26, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.95s]
Epoch 1: 21%|██ | 2617/12384 [5:33:05<20:44:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.95s]
Epoch 1: 21%|██ | 2617/12384 [5:33:13<20:44:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 1: 21%|██ | 2618/12384 [5:33:13<20:41:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 1: 21%|██ | 2618/12384 [5:33:20<20:41:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 21%|██ | 2619/12384 [5:33:20<20:40:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 21%|██ | 2619/12384 [5:33:28<20:40:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 1: 21%|██ | 2620/12384 [5:33:28<20:43:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 1: 21%|██ | 2620/12384 [5:33:36<20:43:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 1: 21%|██ | 2621/12384 [5:33:36<20:42:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 1: 21%|██ | 2621/12384 [5:33:43<20:42:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.91s]
Epoch 1: 21%|██ | 2622/12384 [5:33:43<20:41:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.91s]
Epoch 1: 21%|██ | 2622/12384 [5:33:51<20:41:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 1: 21%|██ | 2623/12384 [5:33:51<20:38:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 1: 21%|██ | 2623/12384 [5:33:59<20:38:56, 7.62s/it, loss=0.0000, acc=0.9996, iter_time=7.99s]
Epoch 1: 21%|██ | 2624/12384 [5:33:59<20:39:26, 7.62s/it, loss=0.0000, acc=0.9996, iter_time=7.99s]
Epoch 1: 21%|██ | 2624/12384 [5:34:06<20:39:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.16s]
Epoch 1: 21%|██ | 2625/12384 [5:34:06<20:39:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.16s]
Epoch 1: 21%|██ | 2625/12384 [5:34:14<20:39:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 1: 21%|██ | 2626/12384 [5:34:14<20:38:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 1: 21%|██ | 2626/12384 [5:34:21<20:38:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.00s]
Epoch 1: 21%|██ | 2627/12384 [5:34:21<20:38:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.00s]
Epoch 1: 21%|██ | 2627/12384 [5:34:29<20:38:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 1: 21%|██ | 2628/12384 [5:34:29<20:38:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 1: 21%|██ | 2628/12384 [5:34:37<20:38:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 21%|██ | 2629/12384 [5:34:37<20:36:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 21%|██ | 2629/12384 [5:34:44<20:36:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 1: 21%|██ | 2630/12384 [5:34:44<20:40:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 1: 21%|██ | 2630/12384 [5:34:52<20:40:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.82s]
Epoch 1: 21%|██ | 2631/12384 [5:34:52<20:40:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.82s]
Epoch 1: 21%|██ | 2631/12384 [5:35:00<20:40:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 21%|██▏ | 2632/12384 [5:35:00<20:39:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 21%|██▏ | 2632/12384 [5:35:07<20:39:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 21%|██▏ | 2633/12384 [5:35:07<20:39:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 21%|██▏ | 2633/12384 [5:35:15<20:39:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.95s]
Epoch 1: 21%|██▏ | 2634/12384 [5:35:15<20:55:17, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=3.95s]
Epoch 1: 21%|██▏ | 2634/12384 [5:35:23<20:55:17, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.55s]
Epoch 1: 21%|██▏ | 2635/12384 [5:35:23<20:50:07, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.55s]
Epoch 1: 21%|██▏ | 2635/12384 [5:35:30<20:50:07, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.92s]
Epoch 1: 21%|██▏ | 2636/12384 [5:35:30<20:45:11, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.92s]
Epoch 1: 21%|██▏ | 2636/12384 [5:35:38<20:45:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.86s]
Epoch 1: 21%|██▏ | 2637/12384 [5:35:38<20:41:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.86s]
Epoch 1: 21%|██▏ | 2637/12384 [5:35:46<20:41:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.12s]
Epoch 1: 21%|██▏ | 2638/12384 [5:35:46<20:38:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.12s]
Epoch 1: 21%|██▏ | 2638/12384 [5:35:53<20:38:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 1: 21%|██▏ | 2639/12384 [5:35:53<20:38:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 1: 21%|██▏ | 2639/12384 [5:36:01<20:38:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 1: 21%|██▏ | 2640/12384 [5:36:01<20:36:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 1: 21%|██▏ | 2640/12384 [5:36:08<20:36:47, 7.62s/it, loss=0.0002, acc=0.9995, iter_time=3.63s]
Epoch 1: 21%|██▏ | 2641/12384 [5:36:08<20:37:03, 7.62s/it, loss=0.0002, acc=0.9995, iter_time=3.63s]
Epoch 1: 21%|██▏ | 2641/12384 [5:36:16<20:37:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.20s]
Epoch 1: 21%|██▏ | 2642/12384 [5:36:16<20:36:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.20s]
Epoch 1: 21%|██▏ | 2642/12384 [5:36:24<20:36:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 21%|██▏ | 2643/12384 [5:36:24<20:36:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 21%|██▏ | 2643/12384 [5:36:31<20:36:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 1: 21%|██▏ | 2644/12384 [5:36:31<20:36:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 1: 21%|██▏ | 2644/12384 [5:36:39<20:36:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 1: 21%|██▏ | 2645/12384 [5:36:39<20:37:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 1: 21%|██▏ | 2645/12384 [5:36:46<20:37:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 21%|██▏ | 2646/12384 [5:36:46<20:36:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 21%|██▏ | 2646/12384 [5:36:54<20:36:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 21%|██▏ | 2647/12384 [5:36:54<20:35:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 21%|██▏ | 2647/12384 [5:37:02<20:35:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 21%|██▏ | 2648/12384 [5:37:02<20:34:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 21%|██▏ | 2648/12384 [5:37:10<20:34:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 21%|██▏ | 2649/12384 [5:37:10<20:48:09, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 21%|██▏ | 2649/12384 [5:37:17<20:48:09, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 1: 21%|██▏ | 2650/12384 [5:37:17<20:44:24, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 1: 21%|██▏ | 2650/12384 [5:37:25<20:44:24, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.55s]
Epoch 1: 21%|██▏ | 2651/12384 [5:37:25<20:39:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.55s]
Epoch 1: 21%|██▏ | 2651/12384 [5:37:32<20:39:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 21%|██▏ | 2652/12384 [5:37:32<20:36:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 21%|██▏ | 2652/12384 [5:37:40<20:36:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 21%|██▏ | 2653/12384 [5:37:40<20:35:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 21%|██▏ | 2653/12384 [5:37:48<20:35:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 21%|██▏ | 2654/12384 [5:37:48<20:35:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 21%|██▏ | 2654/12384 [5:37:55<20:35:58, 7.62s/it, loss=0.0036, acc=0.9978, iter_time=6.51s]
Epoch 1: 21%|██▏ | 2655/12384 [5:37:55<20:38:50, 7.64s/it, loss=0.0036, acc=0.9978, iter_time=6.51s]
Epoch 1: 21%|██▏ | 2655/12384 [5:38:03<20:38:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.20s]
Epoch 1: 21%|██▏ | 2656/12384 [5:38:03<20:36:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.20s]
Epoch 1: 21%|██▏ | 2656/12384 [5:38:10<20:36:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.58s]
Epoch 1: 21%|██▏ | 2657/12384 [5:38:10<20:37:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.58s]
Epoch 1: 21%|██▏ | 2657/12384 [5:38:18<20:37:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 1: 21%|██▏ | 2658/12384 [5:38:18<20:37:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 1: 21%|██▏ | 2658/12384 [5:38:26<20:37:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 21%|██▏ | 2659/12384 [5:38:26<20:36:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 21%|██▏ | 2659/12384 [5:38:33<20:36:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 1: 21%|██▏ | 2660/12384 [5:38:33<20:35:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 1: 21%|██▏ | 2660/12384 [5:38:41<20:35:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 1: 21%|██▏ | 2661/12384 [5:38:41<20:51:12, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 1: 21%|██▏ | 2661/12384 [5:38:49<20:51:12, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=7.88s]
Epoch 1: 21%|██▏ | 2662/12384 [5:38:49<20:44:36, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.88s]
Epoch 1: 21%|██▏ | 2662/12384 [5:38:56<20:44:36, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 22%|██▏ | 2663/12384 [5:38:56<20:39:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 22%|██▏ | 2663/12384 [5:39:04<20:39:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 22%|██▏ | 2664/12384 [5:39:04<20:37:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 22%|██▏ | 2664/12384 [5:39:12<20:37:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 22%|██▏ | 2665/12384 [5:39:12<20:36:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 22%|██▏ | 2665/12384 [5:39:19<20:36:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 1: 22%|██▏ | 2666/12384 [5:39:19<20:35:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 1: 22%|██▏ | 2666/12384 [5:39:27<20:35:50, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.20s]
Epoch 1: 22%|██▏ | 2667/12384 [5:39:27<20:35:10, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.20s]
Epoch 1: 22%|██▏ | 2667/12384 [5:39:35<20:35:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 22%|██▏ | 2668/12384 [5:39:35<20:33:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 22%|██▏ | 2668/12384 [5:39:42<20:33:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 1: 22%|██▏ | 2669/12384 [5:39:42<20:33:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 1: 22%|██▏ | 2669/12384 [5:39:50<20:33:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 1: 22%|██▏ | 2670/12384 [5:39:50<20:32:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 1: 22%|██▏ | 2670/12384 [5:39:57<20:32:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 22%|██▏ | 2671/12384 [5:39:57<20:32:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 22%|██▏ | 2671/12384 [5:40:05<20:32:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 22%|██▏ | 2672/12384 [5:40:05<20:32:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 22%|██▏ | 2672/12384 [5:40:13<20:32:28, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.20s]
Epoch 1: 22%|██▏ | 2673/12384 [5:40:13<20:31:26, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.20s]
Epoch 1: 22%|██▏ | 2673/12384 [5:40:20<20:31:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.03s]
Epoch 1: 22%|██▏ | 2674/12384 [5:40:20<20:30:12, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.03s]
Epoch 1: 22%|██▏ | 2674/12384 [5:40:28<20:30:12, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.17s]
Epoch 1: 22%|██▏ | 2675/12384 [5:40:28<20:30:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.17s]
Epoch 1: 22%|██▏ | 2675/12384 [5:40:36<20:30:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 22%|██▏ | 2676/12384 [5:40:36<20:45:28, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 22%|██▏ | 2676/12384 [5:40:43<20:45:28, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 22%|██▏ | 2677/12384 [5:40:43<20:41:01, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 22%|██▏ | 2677/12384 [5:40:51<20:41:01, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.03s]
Epoch 1: 22%|██▏ | 2678/12384 [5:40:51<20:37:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.03s]
Epoch 1: 22%|██▏ | 2678/12384 [5:40:58<20:37:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.26s]
Epoch 1: 22%|██▏ | 2679/12384 [5:40:58<20:34:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.26s]
Epoch 1: 22%|██▏ | 2679/12384 [5:41:06<20:34:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 1: 22%|██▏ | 2680/12384 [5:41:06<20:33:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 1: 22%|██▏ | 2680/12384 [5:41:14<20:33:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 22%|██▏ | 2681/12384 [5:41:14<20:34:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 22%|██▏ | 2681/12384 [5:41:21<20:34:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 22%|██▏ | 2682/12384 [5:41:21<20:37:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 22%|██▏ | 2682/12384 [5:41:29<20:37:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 1: 22%|██▏ | 2683/12384 [5:41:29<20:35:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 1: 22%|██▏ | 2683/12384 [5:41:37<20:35:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 22%|██▏ | 2684/12384 [5:41:37<20:33:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 22%|██▏ | 2684/12384 [5:41:44<20:33:54, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 1: 22%|██▏ | 2685/12384 [5:41:44<20:33:31, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 1: 22%|██▏ | 2685/12384 [5:41:52<20:33:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 22%|██▏ | 2686/12384 [5:41:52<20:35:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 22%|██▏ | 2686/12384 [5:42:00<20:35:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.92s]
Epoch 1: 22%|██▏ | 2687/12384 [5:42:00<20:48:59, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=5.92s]
Epoch 1: 22%|██▏ | 2687/12384 [5:42:08<20:48:59, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=9.58s]
Epoch 1: 22%|██▏ | 2688/12384 [5:42:08<20:44:08, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.58s]
Epoch 1: 22%|██▏ | 2688/12384 [5:42:15<20:44:08, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 22%|██▏ | 2689/12384 [5:42:15<20:43:37, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 22%|██▏ | 2689/12384 [5:42:23<20:43:37, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 22%|██▏ | 2690/12384 [5:42:23<20:41:19, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 22%|██▏ | 2690/12384 [5:42:30<20:41:19, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 22%|██▏ | 2691/12384 [5:42:30<20:37:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 22%|██▏ | 2691/12384 [5:42:38<20:37:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 1: 22%|██▏ | 2692/12384 [5:42:38<20:35:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 1: 22%|██▏ | 2692/12384 [5:42:46<20:35:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.58s]
Epoch 1: 22%|██▏ | 2693/12384 [5:42:46<20:32:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.58s]
Epoch 1: 22%|██▏ | 2693/12384 [5:42:53<20:32:45, 7.63s/it, loss=0.0002, acc=0.9980, iter_time=7.62s]
Epoch 1: 22%|██▏ | 2694/12384 [5:42:53<20:31:01, 7.62s/it, loss=0.0002, acc=0.9980, iter_time=7.62s]
Epoch 1: 22%|██▏ | 2694/12384 [5:43:01<20:31:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 1: 22%|██▏ | 2695/12384 [5:43:01<20:30:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 1: 22%|██▏ | 2695/12384 [5:43:08<20:30:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 1: 22%|██▏ | 2696/12384 [5:43:08<20:28:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 1: 22%|██▏ | 2696/12384 [5:43:16<20:28:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.35s]
Epoch 1: 22%|██▏ | 2697/12384 [5:43:16<20:28:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.35s]
Epoch 1: 22%|██▏ | 2697/12384 [5:43:24<20:28:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.46s]
Epoch 1: 22%|██▏ | 2698/12384 [5:43:24<20:27:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.46s]
Epoch 1: 22%|██▏ | 2698/12384 [5:43:31<20:27:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 22%|██▏ | 2699/12384 [5:43:31<20:28:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 22%|██▏ | 2699/12384 [5:43:39<20:28:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 22%|██▏ | 2700/12384 [5:43:39<20:29:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 22%|██▏ | 2700/12384 [5:43:47<20:29:15, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 1: 22%|██▏ | 2701/12384 [5:43:47<20:29:09, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 1: 22%|██▏ | 2701/12384 [5:43:54<20:29:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 22%|██▏ | 2702/12384 [5:43:54<20:27:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 22%|██▏ | 2702/12384 [5:44:02<20:27:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 22%|██▏ | 2703/12384 [5:44:02<20:41:10, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 22%|██▏ | 2703/12384 [5:44:10<20:41:10, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 22%|██▏ | 2704/12384 [5:44:10<20:37:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 22%|██▏ | 2704/12384 [5:44:17<20:37:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.26s]
Epoch 1: 22%|██▏ | 2705/12384 [5:44:17<20:33:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.26s]
Epoch 1: 22%|██▏ | 2705/12384 [5:44:25<20:33:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 22%|██▏ | 2706/12384 [5:44:25<20:30:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 22%|██▏ | 2706/12384 [5:44:32<20:30:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 1: 22%|██▏ | 2707/12384 [5:44:32<20:28:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 1: 22%|██▏ | 2707/12384 [5:44:40<20:28:49, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=8.85s]
Epoch 1: 22%|██▏ | 2708/12384 [5:44:40<20:30:26, 7.63s/it, loss=0.0001, acc=0.9999, iter_time=8.85s]
Epoch 1: 22%|██▏ | 2708/12384 [5:44:48<20:30:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 1: 22%|██▏ | 2709/12384 [5:44:48<20:28:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 1: 22%|██▏ | 2709/12384 [5:44:55<20:28:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 1: 22%|██▏ | 2710/12384 [5:44:55<20:29:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 1: 22%|██▏ | 2710/12384 [5:45:03<20:29:23, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.92s]
Epoch 1: 22%|██▏ | 2711/12384 [5:45:03<20:28:28, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.92s]
Epoch 1: 22%|██▏ | 2711/12384 [5:45:11<20:28:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.30s]
Epoch 1: 22%|██▏ | 2712/12384 [5:45:11<20:28:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.30s]
Epoch 1: 22%|██▏ | 2712/12384 [5:45:19<20:28:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 22%|██▏ | 2713/12384 [5:45:19<20:44:43, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 22%|██▏ | 2713/12384 [5:45:26<20:44:43, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 22%|██▏ | 2714/12384 [5:45:26<20:42:01, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 22%|██▏ | 2714/12384 [5:45:34<20:42:01, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 22%|██▏ | 2715/12384 [5:45:34<20:36:58, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 22%|██▏ | 2715/12384 [5:45:41<20:36:58, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 22%|██▏ | 2716/12384 [5:45:41<20:34:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 22%|██▏ | 2716/12384 [5:45:49<20:34:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 22%|██▏ | 2717/12384 [5:45:49<20:31:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 22%|██▏ | 2717/12384 [5:45:57<20:31:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 22%|██▏ | 2718/12384 [5:45:57<20:29:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 22%|██▏ | 2718/12384 [5:46:04<20:29:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 22%|██▏ | 2719/12384 [5:46:04<20:27:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 22%|██▏ | 2719/12384 [5:46:12<20:27:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 1: 22%|██▏ | 2720/12384 [5:46:12<20:25:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 1: 22%|██▏ | 2720/12384 [5:46:19<20:25:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.68s]
Epoch 1: 22%|██▏ | 2721/12384 [5:46:19<20:24:35, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=3.68s]
Epoch 1: 22%|██▏ | 2721/12384 [5:46:27<20:24:35, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.11s]
Epoch 1: 22%|██▏ | 2722/12384 [5:46:27<20:23:54, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.11s]
Epoch 1: 22%|██▏ | 2722/12384 [5:46:35<20:23:54, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 22%|██▏ | 2723/12384 [5:46:35<20:23:17, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 22%|██▏ | 2723/12384 [5:46:42<20:23:17, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 22%|██▏ | 2724/12384 [5:46:42<20:22:57, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 22%|██▏ | 2724/12384 [5:46:50<20:22:57, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 1: 22%|██▏ | 2725/12384 [5:46:50<20:22:46, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 1: 22%|██▏ | 2725/12384 [5:46:57<20:22:46, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.85s]
Epoch 1: 22%|██▏ | 2726/12384 [5:46:57<20:22:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.85s]
Epoch 1: 22%|██▏ | 2726/12384 [5:47:05<20:22:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 22%|██▏ | 2727/12384 [5:47:05<20:22:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 22%|██▏ | 2727/12384 [5:47:13<20:22:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 1: 22%|██▏ | 2728/12384 [5:47:13<20:37:22, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 1: 22%|██▏ | 2728/12384 [5:47:20<20:37:22, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.88s]
Epoch 1: 22%|██▏ | 2729/12384 [5:47:20<20:32:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.88s]
Epoch 1: 22%|██▏ | 2729/12384 [5:47:28<20:32:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 1: 22%|██▏ | 2730/12384 [5:47:28<20:30:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 1: 22%|██▏ | 2730/12384 [5:47:36<20:30:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 1: 22%|██▏ | 2731/12384 [5:47:36<20:28:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 1: 22%|██▏ | 2731/12384 [5:47:43<20:28:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 22%|██▏ | 2732/12384 [5:47:43<20:25:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 22%|██▏ | 2732/12384 [5:47:51<20:25:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 1: 22%|██▏ | 2733/12384 [5:47:51<20:24:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 1: 22%|██▏ | 2733/12384 [5:47:58<20:24:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.02s]
Epoch 1: 22%|██▏ | 2734/12384 [5:47:58<20:24:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.02s]
Epoch 1: 22%|██▏ | 2734/12384 [5:48:06<20:24:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 22%|██▏ | 2735/12384 [5:48:06<20:23:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 22%|██▏ | 2735/12384 [5:48:14<20:23:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 22%|██▏ | 2736/12384 [5:48:14<20:25:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 22%|██▏ | 2736/12384 [5:48:21<20:25:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 22%|██▏ | 2737/12384 [5:48:21<20:24:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 22%|██▏ | 2737/12384 [5:48:29<20:24:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 1: 22%|██▏ | 2738/12384 [5:48:29<20:24:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 1: 22%|██▏ | 2738/12384 [5:48:37<20:24:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 1: 22%|██▏ | 2739/12384 [5:48:37<20:41:43, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 1: 22%|██▏ | 2739/12384 [5:48:45<20:41:43, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 22%|██▏ | 2740/12384 [5:48:45<20:35:54, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 22%|██▏ | 2740/12384 [5:48:52<20:35:54, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 1: 22%|██▏ | 2741/12384 [5:48:52<20:31:02, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 1: 22%|██▏ | 2741/12384 [5:49:00<20:31:02, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 1: 22%|██▏ | 2742/12384 [5:49:00<20:28:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 1: 22%|██▏ | 2742/12384 [5:49:07<20:28:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 22%|██▏ | 2743/12384 [5:49:07<20:27:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 22%|██▏ | 2743/12384 [5:49:15<20:27:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 22%|██▏ | 2744/12384 [5:49:15<20:26:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 22%|██▏ | 2744/12384 [5:49:23<20:26:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 22%|██▏ | 2745/12384 [5:49:23<20:25:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 22%|██▏ | 2745/12384 [5:49:30<20:25:18, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.62s]
Epoch 1: 22%|██▏ | 2746/12384 [5:49:30<20:24:50, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.62s]
Epoch 1: 22%|██▏ | 2746/12384 [5:49:38<20:24:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 22%|██▏ | 2747/12384 [5:49:38<20:23:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 22%|██▏ | 2747/12384 [5:49:45<20:23:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 22%|██▏ | 2748/12384 [5:49:45<20:21:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 22%|██▏ | 2748/12384 [5:49:53<20:21:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 22%|██▏ | 2749/12384 [5:49:53<20:21:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 22%|██▏ | 2749/12384 [5:50:01<20:21:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 1: 22%|██▏ | 2750/12384 [5:50:01<20:21:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 1: 22%|██▏ | 2750/12384 [5:50:08<20:21:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 22%|██▏ | 2751/12384 [5:50:08<20:20:46, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 22%|██▏ | 2751/12384 [5:50:16<20:20:46, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 22%|██▏ | 2752/12384 [5:50:16<20:26:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 22%|██▏ | 2752/12384 [5:50:24<20:26:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 22%|██▏ | 2753/12384 [5:50:24<20:24:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 22%|██▏ | 2753/12384 [5:50:31<20:24:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 22%|██▏ | 2754/12384 [5:50:31<20:35:28, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 22%|██▏ | 2754/12384 [5:50:39<20:35:28, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 22%|██▏ | 2755/12384 [5:50:39<20:30:12, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 22%|██▏ | 2755/12384 [5:50:47<20:30:12, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 22%|██▏ | 2756/12384 [5:50:47<20:27:01, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 22%|██▏ | 2756/12384 [5:50:54<20:27:01, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 1: 22%|██▏ | 2757/12384 [5:50:54<20:24:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 1: 22%|██▏ | 2757/12384 [5:51:02<20:24:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 22%|██▏ | 2758/12384 [5:51:02<20:27:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 22%|██▏ | 2758/12384 [5:51:09<20:27:34, 7.65s/it, loss=0.0002, acc=0.9983, iter_time=7.68s]
Epoch 1: 22%|██▏ | 2759/12384 [5:51:09<20:24:21, 7.63s/it, loss=0.0002, acc=0.9983, iter_time=7.68s]
Epoch 1: 22%|██▏ | 2759/12384 [5:51:17<20:24:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 22%|██▏ | 2760/12384 [5:51:17<20:22:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 22%|██▏ | 2760/12384 [5:51:25<20:22:07, 7.62s/it, loss=0.0001, acc=0.9992, iter_time=6.21s]
Epoch 1: 22%|██▏ | 2761/12384 [5:51:25<20:20:57, 7.61s/it, loss=0.0001, acc=0.9992, iter_time=6.21s]
Epoch 1: 22%|██▏ | 2761/12384 [5:51:32<20:20:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 1: 22%|██▏ | 2762/12384 [5:51:32<20:21:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 1: 22%|██▏ | 2762/12384 [5:51:40<20:21:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 1: 22%|██▏ | 2763/12384 [5:51:40<20:23:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 1: 22%|██▏ | 2763/12384 [5:51:47<20:23:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.44s]
Epoch 1: 22%|██▏ | 2764/12384 [5:51:47<20:19:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.44s]
Epoch 1: 22%|██▏ | 2764/12384 [5:51:55<20:19:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 22%|██▏ | 2765/12384 [5:51:55<20:32:47, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 22%|██▏ | 2765/12384 [5:52:03<20:32:47, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.00s]
Epoch 1: 22%|██▏ | 2766/12384 [5:52:03<20:29:33, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.00s]
Epoch 1: 22%|██▏ | 2766/12384 [5:52:11<20:29:33, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 22%|██▏ | 2767/12384 [5:52:11<20:26:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 22%|██▏ | 2767/12384 [5:52:18<20:26:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 22%|██▏ | 2768/12384 [5:52:18<20:24:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 22%|██▏ | 2768/12384 [5:52:26<20:24:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 22%|██▏ | 2769/12384 [5:52:26<20:21:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 22%|██▏ | 2769/12384 [5:52:33<20:21:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 22%|██▏ | 2770/12384 [5:52:33<20:20:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 22%|██▏ | 2770/12384 [5:52:41<20:20:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 22%|██▏ | 2771/12384 [5:52:41<20:19:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 22%|██▏ | 2771/12384 [5:52:49<20:19:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 22%|██▏ | 2772/12384 [5:52:49<20:20:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 22%|██▏ | 2772/12384 [5:52:56<20:20:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 22%|██▏ | 2773/12384 [5:52:56<20:19:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 22%|██▏ | 2773/12384 [5:53:04<20:19:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.29s]
Epoch 1: 22%|██▏ | 2774/12384 [5:53:04<20:23:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.29s]
Epoch 1: 22%|██▏ | 2774/12384 [5:53:12<20:23:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.97s]
Epoch 1: 22%|██▏ | 2775/12384 [5:53:12<20:20:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.97s]
Epoch 1: 22%|██▏ | 2775/12384 [5:53:19<20:20:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 22%|██▏ | 2776/12384 [5:53:19<20:20:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 22%|██▏ | 2776/12384 [5:53:27<20:20:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 22%|██▏ | 2777/12384 [5:53:27<20:17:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 22%|██▏ | 2777/12384 [5:53:34<20:17:59, 7.61s/it, loss=0.0009, acc=0.9986, iter_time=7.60s]
Epoch 1: 22%|██▏ | 2778/12384 [5:53:34<20:20:20, 7.62s/it, loss=0.0009, acc=0.9986, iter_time=7.60s]
Epoch 1: 22%|██▏ | 2778/12384 [5:53:42<20:20:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 1: 22%|██▏ | 2779/12384 [5:53:42<20:20:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 1: 22%|██▏ | 2779/12384 [5:53:50<20:20:27, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=5.38s]
Epoch 1: 22%|██▏ | 2780/12384 [5:53:50<20:25:11, 7.65s/it, loss=0.0001, acc=0.9998, iter_time=5.38s]
Epoch 1: 22%|██▏ | 2780/12384 [5:53:57<20:25:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.98s]
Epoch 1: 22%|██▏ | 2781/12384 [5:53:57<20:22:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.98s]
Epoch 1: 22%|██▏ | 2781/12384 [5:54:05<20:22:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.50s]
Epoch 1: 22%|██▏ | 2782/12384 [5:54:05<20:22:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.50s]
Epoch 1: 22%|██▏ | 2782/12384 [5:54:13<20:22:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.23s]
Epoch 1: 22%|██▏ | 2783/12384 [5:54:13<20:21:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.23s]
Epoch 1: 22%|██▏ | 2783/12384 [5:54:20<20:21:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 22%|██▏ | 2784/12384 [5:54:20<20:19:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 22%|██▏ | 2784/12384 [5:54:28<20:19:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.59s]
Epoch 1: 22%|██▏ | 2785/12384 [5:54:28<20:18:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.59s]
Epoch 1: 22%|██▏ | 2785/12384 [5:54:35<20:18:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 1: 22%|██▏ | 2786/12384 [5:54:35<20:17:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 1: 22%|██▏ | 2786/12384 [5:54:43<20:17:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.15s]
Epoch 1: 23%|██▎ | 2787/12384 [5:54:43<20:17:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.15s]
Epoch 1: 23%|██▎ | 2787/12384 [5:54:51<20:17:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 1: 23%|██▎ | 2788/12384 [5:54:51<20:17:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 1: 23%|██▎ | 2788/12384 [5:54:58<20:17:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 1: 23%|██▎ | 2789/12384 [5:54:58<20:16:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 1: 23%|██▎ | 2789/12384 [5:55:06<20:16:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 23%|██▎ | 2790/12384 [5:55:06<20:18:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 23%|██▎ | 2790/12384 [5:55:13<20:18:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 23%|██▎ | 2791/12384 [5:55:13<20:18:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 23%|██▎ | 2791/12384 [5:55:21<20:18:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 1: 23%|██▎ | 2792/12384 [5:55:21<20:32:11, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 1: 23%|██▎ | 2792/12384 [5:55:29<20:32:11, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.45s]
Epoch 1: 23%|██▎ | 2793/12384 [5:55:29<20:27:05, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.45s]
Epoch 1: 23%|██▎ | 2793/12384 [5:55:37<20:27:05, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 23%|██▎ | 2794/12384 [5:55:37<20:23:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 23%|██▎ | 2794/12384 [5:55:44<20:23:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 23%|██▎ | 2795/12384 [5:55:44<20:21:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 23%|██▎ | 2795/12384 [5:55:52<20:21:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 23%|██▎ | 2796/12384 [5:55:52<20:19:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 23%|██▎ | 2796/12384 [5:55:59<20:19:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 23%|██▎ | 2797/12384 [5:55:59<20:17:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 23%|██▎ | 2797/12384 [5:56:07<20:17:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 1: 23%|██▎ | 2798/12384 [5:56:07<20:17:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 1: 23%|██▎ | 2798/12384 [5:56:15<20:17:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.46s]
Epoch 1: 23%|██▎ | 2799/12384 [5:56:15<20:17:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.46s]
Epoch 1: 23%|██▎ | 2799/12384 [5:56:22<20:17:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 23%|██▎ | 2800/12384 [5:56:22<20:16:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 23%|██▎ | 2800/12384 [5:56:30<20:16:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.35s]
Epoch 1: 23%|██▎ | 2801/12384 [5:56:30<20:16:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.35s]
Epoch 1: 23%|██▎ | 2801/12384 [5:56:37<20:16:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 1: 23%|██▎ | 2802/12384 [5:56:37<20:17:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 1: 23%|██▎ | 2802/12384 [5:56:45<20:17:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 23%|██▎ | 2803/12384 [5:56:45<20:17:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 23%|██▎ | 2803/12384 [5:56:53<20:17:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 23%|██▎ | 2804/12384 [5:56:53<20:16:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 23%|██▎ | 2804/12384 [5:57:00<20:16:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 23%|██▎ | 2805/12384 [5:57:00<20:15:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 23%|██▎ | 2805/12384 [5:57:08<20:15:33, 7.61s/it, loss=0.0002, acc=0.9991, iter_time=7.88s]
Epoch 1: 23%|██▎ | 2806/12384 [5:57:08<20:28:12, 7.69s/it, loss=0.0002, acc=0.9991, iter_time=7.88s]
Epoch 1: 23%|██▎ | 2806/12384 [5:57:16<20:28:12, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 1: 23%|██▎ | 2807/12384 [5:57:16<20:22:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 1: 23%|██▎ | 2807/12384 [5:57:23<20:22:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.87s]
Epoch 1: 23%|██▎ | 2808/12384 [5:57:23<20:19:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.87s]
Epoch 1: 23%|██▎ | 2808/12384 [5:57:31<20:19:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.90s]
Epoch 1: 23%|██▎ | 2809/12384 [5:57:31<20:18:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.90s]
Epoch 1: 23%|██▎ | 2809/12384 [5:57:39<20:18:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.95s]
Epoch 1: 23%|██▎ | 2810/12384 [5:57:39<20:22:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.95s]
Epoch 1: 23%|██▎ | 2810/12384 [5:57:46<20:22:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 23%|██▎ | 2811/12384 [5:57:46<20:20:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 23%|██▎ | 2811/12384 [5:57:54<20:20:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 23%|██▎ | 2812/12384 [5:57:54<20:18:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 23%|██▎ | 2812/12384 [5:58:02<20:18:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 23%|██▎ | 2813/12384 [5:58:02<20:17:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 23%|██▎ | 2813/12384 [5:58:09<20:17:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 23%|██▎ | 2814/12384 [5:58:09<20:17:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 23%|██▎ | 2814/12384 [5:58:17<20:17:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 1: 23%|██▎ | 2815/12384 [5:58:17<20:16:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 1: 23%|██▎ | 2815/12384 [5:58:24<20:16:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 1: 23%|██▎ | 2816/12384 [5:58:24<20:15:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 1: 23%|██▎ | 2816/12384 [5:58:32<20:15:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 23%|██▎ | 2817/12384 [5:58:32<20:17:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 23%|██▎ | 2817/12384 [5:58:40<20:17:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 1: 23%|██▎ | 2818/12384 [5:58:40<20:32:11, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 1: 23%|██▎ | 2818/12384 [5:58:48<20:32:11, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 23%|██▎ | 2819/12384 [5:58:48<20:26:22, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 23%|██▎ | 2819/12384 [5:58:55<20:26:22, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 23%|██▎ | 2820/12384 [5:58:55<20:23:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 23%|██▎ | 2820/12384 [5:59:03<20:23:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 23%|██▎ | 2821/12384 [5:59:03<20:20:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 23%|██▎ | 2821/12384 [5:59:11<20:20:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.58s]
Epoch 1: 23%|██▎ | 2822/12384 [5:59:11<20:18:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.58s]
Epoch 1: 23%|██▎ | 2822/12384 [5:59:18<20:18:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 1: 23%|██▎ | 2823/12384 [5:59:18<20:15:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 1: 23%|██▎ | 2823/12384 [5:59:26<20:15:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 23%|██▎ | 2824/12384 [5:59:26<20:16:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 23%|██▎ | 2824/12384 [5:59:33<20:16:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 1: 23%|██▎ | 2825/12384 [5:59:33<20:14:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 1: 23%|██▎ | 2825/12384 [5:59:41<20:14:21, 7.62s/it, loss=0.0000, acc=0.9996, iter_time=9.65s]
Epoch 1: 23%|██▎ | 2826/12384 [5:59:41<20:12:46, 7.61s/it, loss=0.0000, acc=0.9996, iter_time=9.65s]
Epoch 1: 23%|██▎ | 2826/12384 [5:59:49<20:12:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 23%|██▎ | 2827/12384 [5:59:49<20:12:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 23%|██▎ | 2827/12384 [5:59:56<20:12:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 1: 23%|██▎ | 2828/12384 [5:59:56<20:10:44, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 1: 23%|██▎ | 2828/12384 [6:00:04<20:10:44, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 1: 23%|██▎ | 2829/12384 [6:00:04<20:11:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 1: 23%|██▎ | 2829/12384 [6:00:11<20:11:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 1: 23%|██▎ | 2830/12384 [6:00:11<20:10:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 1: 23%|██▎ | 2830/12384 [6:00:19<20:10:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 23%|██▎ | 2831/12384 [6:00:19<20:15:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 23%|██▎ | 2831/12384 [6:00:27<20:15:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 23%|██▎ | 2832/12384 [6:00:27<20:14:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 23%|██▎ | 2832/12384 [6:00:35<20:14:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 23%|██▎ | 2833/12384 [6:00:35<20:27:04, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 23%|██▎ | 2833/12384 [6:00:42<20:27:04, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 1: 23%|██▎ | 2834/12384 [6:00:42<20:20:53, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 1: 23%|██▎ | 2834/12384 [6:00:50<20:20:53, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 1: 23%|██▎ | 2835/12384 [6:00:50<20:17:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 1: 23%|██▎ | 2835/12384 [6:00:57<20:17:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 23%|██▎ | 2836/12384 [6:00:57<20:14:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 23%|██▎ | 2836/12384 [6:01:05<20:14:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 23%|██▎ | 2837/12384 [6:01:05<20:13:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 23%|██▎ | 2837/12384 [6:01:13<20:13:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 23%|██▎ | 2838/12384 [6:01:13<20:12:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 23%|██▎ | 2838/12384 [6:01:20<20:12:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 1: 23%|██▎ | 2839/12384 [6:01:20<20:11:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 1: 23%|██▎ | 2839/12384 [6:01:28<20:11:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 23%|██▎ | 2840/12384 [6:01:28<20:15:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 23%|██▎ | 2840/12384 [6:01:35<20:15:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 23%|██▎ | 2841/12384 [6:01:35<20:13:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 23%|██▎ | 2841/12384 [6:01:43<20:13:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 23%|██▎ | 2842/12384 [6:01:43<20:11:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 23%|██▎ | 2842/12384 [6:01:51<20:11:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.06s]
Epoch 1: 23%|██▎ | 2843/12384 [6:01:51<20:11:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.06s]
Epoch 1: 23%|██▎ | 2843/12384 [6:01:58<20:11:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.14s]
Epoch 1: 23%|██▎ | 2844/12384 [6:01:58<20:10:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.14s]
Epoch 1: 23%|██▎ | 2844/12384 [6:02:06<20:10:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 23%|██▎ | 2845/12384 [6:02:06<20:26:10, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 23%|██▎ | 2845/12384 [6:02:14<20:26:10, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 23%|██▎ | 2846/12384 [6:02:14<20:21:10, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 23%|██▎ | 2846/12384 [6:02:21<20:21:10, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 23%|██▎ | 2847/12384 [6:02:21<20:17:34, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 23%|██▎ | 2847/12384 [6:02:29<20:17:34, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 23%|██▎ | 2848/12384 [6:02:29<20:15:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 23%|██▎ | 2848/12384 [6:02:37<20:15:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 23%|██▎ | 2849/12384 [6:02:37<20:12:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 23%|██▎ | 2849/12384 [6:02:44<20:12:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 1: 23%|██▎ | 2850/12384 [6:02:44<20:12:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 1: 23%|██▎ | 2850/12384 [6:02:52<20:12:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 1: 23%|██▎ | 2851/12384 [6:02:52<20:10:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 1: 23%|██▎ | 2851/12384 [6:02:59<20:10:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 23%|██▎ | 2852/12384 [6:02:59<20:10:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 23%|██▎ | 2852/12384 [6:03:07<20:10:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.56s]
Epoch 1: 23%|██▎ | 2853/12384 [6:03:07<20:12:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.56s]
Epoch 1: 23%|██▎ | 2853/12384 [6:03:15<20:12:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.44s]
Epoch 1: 23%|██▎ | 2854/12384 [6:03:15<20:11:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.44s]
Epoch 1: 23%|██▎ | 2854/12384 [6:03:22<20:11:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.90s]
Epoch 1: 23%|██▎ | 2855/12384 [6:03:22<20:10:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.90s]
Epoch 1: 23%|██▎ | 2855/12384 [6:03:30<20:10:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 1: 23%|██▎ | 2856/12384 [6:03:30<20:14:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 1: 23%|██▎ | 2856/12384 [6:03:38<20:14:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 23%|██▎ | 2857/12384 [6:03:38<20:11:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 23%|██▎ | 2857/12384 [6:03:45<20:11:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 23%|██▎ | 2858/12384 [6:03:45<20:09:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 23%|██▎ | 2858/12384 [6:03:53<20:09:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.91s]
Epoch 1: 23%|██▎ | 2859/12384 [6:03:53<20:08:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.91s]
Epoch 1: 23%|██▎ | 2859/12384 [6:04:01<20:08:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.87s]
Epoch 1: 23%|██▎ | 2860/12384 [6:04:01<20:21:25, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=11.87s]
Epoch 1: 23%|██▎ | 2860/12384 [6:04:08<20:21:25, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=3.57s]
Epoch 1: 23%|██▎ | 2861/12384 [6:04:08<20:17:41, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=3.57s]
Epoch 1: 23%|██▎ | 2861/12384 [6:04:16<20:17:41, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=11.61s]
Epoch 1: 23%|██▎ | 2862/12384 [6:04:16<20:13:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.61s]
Epoch 1: 23%|██▎ | 2862/12384 [6:04:24<20:13:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 1: 23%|██▎ | 2863/12384 [6:04:24<20:10:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 1: 23%|██▎ | 2863/12384 [6:04:31<20:10:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 1: 23%|██▎ | 2864/12384 [6:04:31<20:10:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 1: 23%|██▎ | 2864/12384 [6:04:39<20:10:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.24s]
Epoch 1: 23%|██▎ | 2865/12384 [6:04:39<20:07:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.24s]
Epoch 1: 23%|██▎ | 2865/12384 [6:04:46<20:07:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.02s]
Epoch 1: 23%|██▎ | 2866/12384 [6:04:46<20:08:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.02s]
Epoch 1: 23%|██▎ | 2866/12384 [6:04:54<20:08:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.46s]
Epoch 1: 23%|██▎ | 2867/12384 [6:04:54<20:08:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.46s]
Epoch 1: 23%|██▎ | 2867/12384 [6:05:02<20:08:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 23%|██▎ | 2868/12384 [6:05:02<20:09:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 23%|██▎ | 2868/12384 [6:05:09<20:09:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 23%|██▎ | 2869/12384 [6:05:09<20:08:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 23%|██▎ | 2869/12384 [6:05:17<20:08:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 23%|██▎ | 2870/12384 [6:05:17<20:07:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 23%|██▎ | 2870/12384 [6:05:25<20:07:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 23%|██▎ | 2871/12384 [6:05:25<20:24:18, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 23%|██▎ | 2871/12384 [6:05:32<20:24:18, 7.72s/it, loss=0.0003, acc=1.0000, iter_time=8.30s]
Epoch 1: 23%|██▎ | 2872/12384 [6:05:32<20:18:33, 7.69s/it, loss=0.0003, acc=1.0000, iter_time=8.30s]
Epoch 1: 23%|██▎ | 2872/12384 [6:05:40<20:18:33, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.92s]
Epoch 1: 23%|██▎ | 2873/12384 [6:05:40<20:14:42, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.92s]
Epoch 1: 23%|██▎ | 2873/12384 [6:05:48<20:14:42, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.58s]
Epoch 1: 23%|██▎ | 2874/12384 [6:05:48<20:12:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.58s]
Epoch 1: 23%|██▎ | 2874/12384 [6:05:55<20:12:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 23%|██▎ | 2875/12384 [6:05:55<20:10:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 23%|██▎ | 2875/12384 [6:06:03<20:10:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 1: 23%|██▎ | 2876/12384 [6:06:03<20:08:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 1: 23%|██▎ | 2876/12384 [6:06:10<20:08:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.06s]
Epoch 1: 23%|██▎ | 2877/12384 [6:06:10<20:07:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.06s]
Epoch 1: 23%|██▎ | 2877/12384 [6:06:18<20:07:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 1: 23%|██▎ | 2878/12384 [6:06:18<20:07:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 1: 23%|██▎ | 2878/12384 [6:06:26<20:07:37, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.92s]
Epoch 1: 23%|██▎ | 2879/12384 [6:06:26<20:06:26, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.92s]
Epoch 1: 23%|██▎ | 2879/12384 [6:06:33<20:06:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 23%|██▎ | 2880/12384 [6:06:33<20:06:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 23%|██▎ | 2880/12384 [6:06:41<20:06:43, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.22s]
Epoch 1: 23%|██▎ | 2881/12384 [6:06:41<20:06:31, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.22s]
Epoch 1: 23%|██▎ | 2881/12384 [6:06:49<20:06:31, 7.62s/it, loss=0.0002, acc=0.9989, iter_time=7.64s]
Epoch 1: 23%|██▎ | 2882/12384 [6:06:49<20:06:04, 7.62s/it, loss=0.0002, acc=0.9989, iter_time=7.64s]
Epoch 1: 23%|██▎ | 2882/12384 [6:06:56<20:06:04, 7.62s/it, loss=0.0001, acc=0.9984, iter_time=7.60s]
Epoch 1: 23%|██▎ | 2883/12384 [6:06:56<20:08:18, 7.63s/it, loss=0.0001, acc=0.9984, iter_time=7.60s]
Epoch 1: 23%|██▎ | 2883/12384 [6:07:04<20:08:18, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 1: 23%|██▎ | 2884/12384 [6:07:04<20:07:55, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 1: 23%|██▎ | 2884/12384 [6:07:11<20:07:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 23%|██▎ | 2885/12384 [6:07:11<20:06:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 23%|██▎ | 2885/12384 [6:07:19<20:06:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 1: 23%|██▎ | 2886/12384 [6:07:19<20:05:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 1: 23%|██▎ | 2886/12384 [6:07:27<20:05:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.63s]
Epoch 1: 23%|██▎ | 2887/12384 [6:07:27<20:08:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.63s]
Epoch 1: 23%|██▎ | 2887/12384 [6:07:34<20:08:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.63s]
Epoch 1: 23%|██▎ | 2888/12384 [6:07:34<20:07:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.63s]
Epoch 1: 23%|██▎ | 2888/12384 [6:07:42<20:07:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 23%|██▎ | 2889/12384 [6:07:42<20:08:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 23%|██▎ | 2889/12384 [6:07:50<20:08:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 1: 23%|██▎ | 2890/12384 [6:07:50<20:07:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 1: 23%|██▎ | 2890/12384 [6:07:57<20:07:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 1: 23%|██▎ | 2891/12384 [6:07:57<20:06:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 1: 23%|██▎ | 2891/12384 [6:08:05<20:06:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 1: 23%|██▎ | 2892/12384 [6:08:05<20:06:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 1: 23%|██▎ | 2892/12384 [6:08:12<20:06:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 1: 23%|██▎ | 2893/12384 [6:08:12<20:04:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 1: 23%|██▎ | 2893/12384 [6:08:20<20:04:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 1: 23%|██▎ | 2894/12384 [6:08:20<20:04:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 1: 23%|██▎ | 2894/12384 [6:08:28<20:04:52, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.08s]
Epoch 1: 23%|██▎ | 2895/12384 [6:08:28<20:04:27, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.08s]
Epoch 1: 23%|██▎ | 2895/12384 [6:08:35<20:04:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 23%|██▎ | 2896/12384 [6:08:35<20:03:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 23%|██▎ | 2896/12384 [6:08:43<20:03:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 1: 23%|██▎ | 2897/12384 [6:08:43<20:18:50, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 1: 23%|██▎ | 2897/12384 [6:08:51<20:18:50, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 23%|██▎ | 2898/12384 [6:08:51<20:13:25, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 23%|██▎ | 2898/12384 [6:08:58<20:13:25, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 23%|██▎ | 2899/12384 [6:08:58<20:10:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 23%|██▎ | 2899/12384 [6:09:06<20:10:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 23%|██▎ | 2900/12384 [6:09:06<20:07:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 23%|██▎ | 2900/12384 [6:09:14<20:07:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 23%|██▎ | 2901/12384 [6:09:14<20:06:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 23%|██▎ | 2901/12384 [6:09:21<20:06:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 23%|██▎ | 2902/12384 [6:09:21<20:04:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 23%|██▎ | 2902/12384 [6:09:29<20:04:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 23%|██▎ | 2903/12384 [6:09:29<20:04:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 23%|██▎ | 2903/12384 [6:09:37<20:04:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 23%|██▎ | 2904/12384 [6:09:37<20:04:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 23%|██▎ | 2904/12384 [6:09:44<20:04:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 23%|██▎ | 2905/12384 [6:09:44<20:04:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 23%|██▎ | 2905/12384 [6:09:52<20:04:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 23%|██▎ | 2906/12384 [6:09:52<20:04:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 23%|██▎ | 2906/12384 [6:09:59<20:04:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.89s]
Epoch 1: 23%|██▎ | 2907/12384 [6:09:59<20:01:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.89s]
Epoch 1: 23%|██▎ | 2907/12384 [6:10:07<20:01:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.28s]
Epoch 1: 23%|██▎ | 2908/12384 [6:10:07<20:00:32, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.28s]
Epoch 1: 23%|██▎ | 2908/12384 [6:10:15<20:00:32, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 23%|██▎ | 2909/12384 [6:10:15<20:00:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 23%|██▎ | 2909/12384 [6:10:22<20:00:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.98s]
Epoch 1: 23%|██▎ | 2910/12384 [6:10:22<20:00:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.98s]
Epoch 1: 23%|██▎ | 2910/12384 [6:10:30<20:00:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 1: 24%|██▎ | 2911/12384 [6:10:30<20:01:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 1: 24%|██▎ | 2911/12384 [6:10:37<20:01:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 24%|██▎ | 2912/12384 [6:10:37<20:00:05, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 24%|██▎ | 2912/12384 [6:10:45<20:00:05, 7.60s/it, loss=0.0002, acc=0.9998, iter_time=6.72s]
Epoch 1: 24%|██▎ | 2913/12384 [6:10:45<20:00:34, 7.61s/it, loss=0.0002, acc=0.9998, iter_time=6.72s]
Epoch 1: 24%|██▎ | 2913/12384 [6:10:53<20:00:34, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.44s]
Epoch 1: 24%|██▎ | 2914/12384 [6:10:53<20:00:16, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.44s]
Epoch 1: 24%|██▎ | 2914/12384 [6:11:00<20:00:16, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 1: 24%|██▎ | 2915/12384 [6:11:00<20:00:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 1: 24%|██▎ | 2915/12384 [6:11:08<20:00:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 24%|██▎ | 2916/12384 [6:11:08<20:00:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 24%|██▎ | 2916/12384 [6:11:15<20:00:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.43s]
Epoch 1: 24%|██▎ | 2917/12384 [6:11:15<20:04:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.43s]
Epoch 1: 24%|██▎ | 2917/12384 [6:11:23<20:04:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 1: 24%|██▎ | 2918/12384 [6:11:23<20:03:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 1: 24%|██▎ | 2918/12384 [6:11:31<20:03:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 24%|██▎ | 2919/12384 [6:11:31<20:06:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 24%|██▎ | 2919/12384 [6:11:38<20:06:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 1: 24%|██▎ | 2920/12384 [6:11:38<20:04:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 1: 24%|██▎ | 2920/12384 [6:11:46<20:04:28, 7.64s/it, loss=0.0003, acc=0.9972, iter_time=4.20s]
Epoch 1: 24%|██▎ | 2921/12384 [6:11:46<20:02:50, 7.63s/it, loss=0.0003, acc=0.9972, iter_time=4.20s]
Epoch 1: 24%|██▎ | 2921/12384 [6:11:54<20:02:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 1: 24%|██▎ | 2922/12384 [6:11:54<20:02:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 1: 24%|██▎ | 2922/12384 [6:12:02<20:02:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 24%|██▎ | 2923/12384 [6:12:02<20:15:37, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 24%|██▎ | 2923/12384 [6:12:09<20:15:37, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 1: 24%|██▎ | 2924/12384 [6:12:09<20:10:04, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 1: 24%|██▎ | 2924/12384 [6:12:17<20:10:04, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 24%|██▎ | 2925/12384 [6:12:17<20:06:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 24%|██▎ | 2925/12384 [6:12:24<20:06:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 24%|██▎ | 2926/12384 [6:12:24<20:08:39, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 24%|██▎ | 2926/12384 [6:12:32<20:08:39, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.13s]
Epoch 1: 24%|██▎ | 2927/12384 [6:12:32<20:08:32, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.13s]
Epoch 1: 24%|██▎ | 2927/12384 [6:12:40<20:08:32, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.66s]
Epoch 1: 24%|██▎ | 2928/12384 [6:12:40<20:05:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.66s]
Epoch 1: 24%|██▎ | 2928/12384 [6:12:47<20:05:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 24%|██▎ | 2929/12384 [6:12:47<20:07:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 24%|██▎ | 2929/12384 [6:12:55<20:07:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 24%|██▎ | 2930/12384 [6:12:55<20:05:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 24%|██▎ | 2930/12384 [6:13:03<20:05:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 24%|██▎ | 2931/12384 [6:13:03<20:03:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 24%|██▎ | 2931/12384 [6:13:10<20:03:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 24%|██▎ | 2932/12384 [6:13:10<20:00:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 24%|██▎ | 2932/12384 [6:13:18<20:00:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 24%|██▎ | 2933/12384 [6:13:18<20:00:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 24%|██▎ | 2933/12384 [6:13:25<20:00:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 1: 24%|██▎ | 2934/12384 [6:13:25<19:59:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 1: 24%|██▎ | 2934/12384 [6:13:33<19:59:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 1: 24%|██▎ | 2935/12384 [6:13:33<19:59:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 1: 24%|██▎ | 2935/12384 [6:13:41<19:59:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 24%|██▎ | 2936/12384 [6:13:41<19:58:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 24%|██▎ | 2936/12384 [6:13:48<19:58:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 1: 24%|██▎ | 2937/12384 [6:13:48<19:57:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 1: 24%|██▎ | 2937/12384 [6:13:56<19:57:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.56s]
Epoch 1: 24%|██▎ | 2938/12384 [6:13:56<19:56:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.56s]
Epoch 1: 24%|██▎ | 2938/12384 [6:14:03<19:56:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.38s]
Epoch 1: 24%|██▎ | 2939/12384 [6:14:03<19:57:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.38s]
Epoch 1: 24%|██▎ | 2939/12384 [6:14:11<19:57:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 24%|██▎ | 2940/12384 [6:14:11<19:57:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 24%|██▎ | 2940/12384 [6:14:19<19:57:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 24%|██▎ | 2941/12384 [6:14:19<19:57:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 24%|██▎ | 2941/12384 [6:14:26<19:57:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 24%|██▍ | 2942/12384 [6:14:26<19:55:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 24%|██▍ | 2942/12384 [6:14:34<19:55:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 24%|██▍ | 2943/12384 [6:14:34<19:56:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 24%|██▍ | 2943/12384 [6:14:42<19:56:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 1: 24%|██▍ | 2944/12384 [6:14:42<20:00:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 1: 24%|██▍ | 2944/12384 [6:14:49<20:00:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 24%|██▍ | 2945/12384 [6:14:49<19:59:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 24%|██▍ | 2945/12384 [6:14:57<19:59:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 24%|██▍ | 2946/12384 [6:14:57<19:59:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 24%|██▍ | 2946/12384 [6:15:04<19:59:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 24%|██▍ | 2947/12384 [6:15:04<19:57:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 24%|██▍ | 2947/12384 [6:15:12<19:57:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 24%|██▍ | 2948/12384 [6:15:12<19:57:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 24%|██▍ | 2948/12384 [6:15:20<19:57:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 24%|██▍ | 2949/12384 [6:15:20<20:13:24, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 24%|██▍ | 2949/12384 [6:15:28<20:13:24, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 24%|██▍ | 2950/12384 [6:15:28<20:08:01, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 24%|██▍ | 2950/12384 [6:15:35<20:08:01, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 24%|██▍ | 2951/12384 [6:15:35<20:04:10, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 24%|██▍ | 2951/12384 [6:15:43<20:04:10, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 24%|██▍ | 2952/12384 [6:15:43<20:01:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 24%|██▍ | 2952/12384 [6:15:50<20:01:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 1: 24%|██▍ | 2953/12384 [6:15:50<19:59:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 1: 24%|██▍ | 2953/12384 [6:15:58<19:59:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 1: 24%|██▍ | 2954/12384 [6:15:58<19:58:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 1: 24%|██▍ | 2954/12384 [6:16:06<19:58:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 24%|██▍ | 2955/12384 [6:16:06<19:57:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 24%|██▍ | 2955/12384 [6:16:13<19:57:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 24%|██▍ | 2956/12384 [6:16:13<19:56:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 24%|██▍ | 2956/12384 [6:16:21<19:56:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 24%|██▍ | 2957/12384 [6:16:21<19:56:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 24%|██▍ | 2957/12384 [6:16:28<19:56:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 24%|██▍ | 2958/12384 [6:16:28<19:56:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 24%|██▍ | 2958/12384 [6:16:36<19:56:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 24%|██▍ | 2959/12384 [6:16:36<19:55:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 24%|██▍ | 2959/12384 [6:16:44<19:55:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 24%|██▍ | 2960/12384 [6:16:44<19:54:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 24%|██▍ | 2960/12384 [6:16:51<19:54:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 24%|██▍ | 2961/12384 [6:16:51<19:54:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 24%|██▍ | 2961/12384 [6:16:59<19:54:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 24%|██▍ | 2962/12384 [6:16:59<19:54:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 24%|██▍ | 2962/12384 [6:17:06<19:54:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 24%|██▍ | 2963/12384 [6:17:06<19:54:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 24%|██▍ | 2963/12384 [6:17:14<19:54:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 24%|██▍ | 2964/12384 [6:17:14<19:54:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 24%|██▍ | 2964/12384 [6:17:22<19:54:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 1: 24%|██▍ | 2965/12384 [6:17:22<20:06:32, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 1: 24%|██▍ | 2965/12384 [6:17:29<20:06:32, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 24%|██▍ | 2966/12384 [6:17:29<20:02:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 24%|██▍ | 2966/12384 [6:17:37<20:02:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 24%|██▍ | 2967/12384 [6:17:37<19:58:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 24%|██▍ | 2967/12384 [6:17:45<19:58:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 24%|██▍ | 2968/12384 [6:17:45<19:57:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 24%|██▍ | 2968/12384 [6:17:52<19:57:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=2.69s]
Epoch 1: 24%|██▍ | 2969/12384 [6:17:52<19:56:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=2.69s]
Epoch 1: 24%|██▍ | 2969/12384 [6:18:00<19:56:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=12.55s]
Epoch 1: 24%|██▍ | 2970/12384 [6:18:00<19:54:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=12.55s]
Epoch 1: 24%|██▍ | 2970/12384 [6:18:08<19:54:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 24%|██▍ | 2971/12384 [6:18:08<19:54:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 24%|██▍ | 2971/12384 [6:18:15<19:54:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 24%|██▍ | 2972/12384 [6:18:15<19:54:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 24%|██▍ | 2972/12384 [6:18:23<19:54:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 24%|██▍ | 2973/12384 [6:18:23<19:56:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 24%|██▍ | 2973/12384 [6:18:30<19:56:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 24%|██▍ | 2974/12384 [6:18:30<19:56:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 24%|██▍ | 2974/12384 [6:18:38<19:56:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 1: 24%|██▍ | 2975/12384 [6:18:38<19:54:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 1: 24%|██▍ | 2975/12384 [6:18:46<19:54:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.97s]
Epoch 1: 24%|██▍ | 2976/12384 [6:18:46<20:08:04, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.97s]
Epoch 1: 24%|██▍ | 2976/12384 [6:18:54<20:08:04, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.33s]
Epoch 1: 24%|██▍ | 2977/12384 [6:18:54<20:03:53, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.33s]
Epoch 1: 24%|██▍ | 2977/12384 [6:19:01<20:03:53, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 24%|██▍ | 2978/12384 [6:19:01<20:00:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 24%|██▍ | 2978/12384 [6:19:09<20:00:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.68s]
Epoch 1: 24%|██▍ | 2979/12384 [6:19:09<19:58:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.68s]
Epoch 1: 24%|██▍ | 2979/12384 [6:19:16<19:58:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 24%|██▍ | 2980/12384 [6:19:16<19:56:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 24%|██▍ | 2980/12384 [6:19:24<19:56:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 24%|██▍ | 2981/12384 [6:19:24<19:54:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 24%|██▍ | 2981/12384 [6:19:32<19:54:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 24%|██▍ | 2982/12384 [6:19:32<19:53:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 24%|██▍ | 2982/12384 [6:19:39<19:53:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 1: 24%|██▍ | 2983/12384 [6:19:39<19:53:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 1: 24%|██▍ | 2983/12384 [6:19:47<19:53:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 1: 24%|██▍ | 2984/12384 [6:19:47<19:54:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 1: 24%|██▍ | 2984/12384 [6:19:54<19:54:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 24%|██▍ | 2985/12384 [6:19:54<19:52:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 24%|██▍ | 2985/12384 [6:20:02<19:52:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 24%|██▍ | 2986/12384 [6:20:02<19:53:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 24%|██▍ | 2986/12384 [6:20:10<19:53:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.15s]
Epoch 1: 24%|██▍ | 2987/12384 [6:20:10<19:54:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.15s]
Epoch 1: 24%|██▍ | 2987/12384 [6:20:17<19:54:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.02s]
Epoch 1: 24%|██▍ | 2988/12384 [6:20:17<19:53:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.02s]
Epoch 1: 24%|██▍ | 2988/12384 [6:20:25<19:53:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.33s]
Epoch 1: 24%|██▍ | 2989/12384 [6:20:25<19:53:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.33s]
Epoch 1: 24%|██▍ | 2989/12384 [6:20:33<19:53:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.19s]
Epoch 1: 24%|██▍ | 2990/12384 [6:20:33<20:04:43, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=11.19s]
Epoch 1: 24%|██▍ | 2990/12384 [6:20:40<20:04:43, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 1: 24%|██▍ | 2991/12384 [6:20:40<19:58:34, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 1: 24%|██▍ | 2991/12384 [6:20:48<19:58:34, 7.66s/it, loss=0.0001, acc=0.9994, iter_time=10.50s]
Epoch 1: 24%|██▍ | 2992/12384 [6:20:48<19:56:01, 7.64s/it, loss=0.0001, acc=0.9994, iter_time=10.50s]
Epoch 1: 24%|██▍ | 2992/12384 [6:20:56<19:56:01, 7.64s/it, loss=0.0011, acc=0.9976, iter_time=7.22s]
Epoch 1: 24%|██▍ | 2993/12384 [6:20:56<19:54:31, 7.63s/it, loss=0.0011, acc=0.9976, iter_time=7.22s]
Epoch 1: 24%|██▍ | 2993/12384 [6:21:03<19:54:31, 7.63s/it, loss=0.0002, acc=0.9986, iter_time=7.62s]
Epoch 1: 24%|██▍ | 2994/12384 [6:21:03<19:53:24, 7.63s/it, loss=0.0002, acc=0.9986, iter_time=7.62s]
Epoch 1: 24%|██▍ | 2994/12384 [6:21:11<19:53:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 24%|██▍ | 2995/12384 [6:21:11<19:53:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 24%|██▍ | 2995/12384 [6:21:18<19:53:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 24%|██▍ | 2996/12384 [6:21:18<19:51:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 24%|██▍ | 2996/12384 [6:21:26<19:51:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 24%|██▍ | 2997/12384 [6:21:26<19:51:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 24%|██▍ | 2997/12384 [6:21:34<19:51:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 24%|██▍ | 2998/12384 [6:21:34<19:51:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 24%|██▍ | 2998/12384 [6:21:41<19:51:15, 7.62s/it, loss=0.0004, acc=0.9980, iter_time=7.00s]
Epoch 1: 24%|██▍ | 2999/12384 [6:21:41<19:50:30, 7.61s/it, loss=0.0004, acc=0.9980, iter_time=7.00s]
Epoch 1: 24%|██▍ | 2999/12384 [6:21:49<19:50:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.63s]
Epoch 1: 24%|██▍ | 3000/12384 [6:21:49<19:51:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.63s]
Epoch 1: 24%|██▍ | 3000/12384 [6:21:56<19:51:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 24%|██▍ | 3001/12384 [6:21:56<19:51:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 24%|██▍ | 3001/12384 [6:22:04<19:51:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 1: 24%|██▍ | 3002/12384 [6:22:04<20:06:08, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 1: 24%|██▍ | 3002/12384 [6:22:12<20:06:08, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 1: 24%|██▍ | 3003/12384 [6:22:12<20:01:47, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 1: 24%|██▍ | 3003/12384 [6:22:20<20:01:47, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 1: 24%|██▍ | 3004/12384 [6:22:20<19:57:58, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 1: 24%|██▍ | 3004/12384 [6:22:27<19:57:58, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 24%|██▍ | 3005/12384 [6:22:27<19:56:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 24%|██▍ | 3005/12384 [6:22:35<19:56:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 1: 24%|██▍ | 3006/12384 [6:22:35<19:53:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 1: 24%|██▍ | 3006/12384 [6:22:42<19:53:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 24%|██▍ | 3007/12384 [6:22:42<19:52:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 24%|██▍ | 3007/12384 [6:22:50<19:52:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 24%|██▍ | 3008/12384 [6:22:50<19:51:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 24%|██▍ | 3008/12384 [6:22:58<19:51:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 24%|██▍ | 3009/12384 [6:22:58<19:51:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 24%|██▍ | 3009/12384 [6:23:05<19:51:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.20s]
Epoch 1: 24%|██▍ | 3010/12384 [6:23:05<19:50:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.20s]
Epoch 1: 24%|██▍ | 3010/12384 [6:23:13<19:50:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 1: 24%|██▍ | 3011/12384 [6:23:13<19:49:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 1: 24%|██▍ | 3011/12384 [6:23:21<19:49:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 24%|██▍ | 3012/12384 [6:23:21<19:49:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 24%|██▍ | 3012/12384 [6:23:28<19:49:54, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=7.62s]
Epoch 1: 24%|██▍ | 3013/12384 [6:23:28<19:49:03, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=7.62s]
Epoch 1: 24%|██▍ | 3013/12384 [6:23:36<19:49:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 24%|██▍ | 3014/12384 [6:23:36<19:49:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 24%|██▍ | 3014/12384 [6:23:43<19:49:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 1: 24%|██▍ | 3015/12384 [6:23:43<19:48:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 1: 24%|██▍ | 3015/12384 [6:23:51<19:48:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.87s]
Epoch 1: 24%|██▍ | 3016/12384 [6:23:51<19:48:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.87s]
Epoch 1: 24%|██▍ | 3016/12384 [6:23:59<19:48:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 1: 24%|██▍ | 3017/12384 [6:23:59<20:02:11, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 1: 24%|██▍ | 3017/12384 [6:24:07<20:02:11, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 24%|██▍ | 3018/12384 [6:24:07<20:04:43, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 24%|██▍ | 3018/12384 [6:24:14<20:04:43, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 1: 24%|██▍ | 3019/12384 [6:24:14<20:01:45, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 1: 24%|██▍ | 3019/12384 [6:24:22<20:01:45, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 24%|██▍ | 3020/12384 [6:24:22<19:58:23, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 24%|██▍ | 3020/12384 [6:24:30<19:58:23, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 24%|██▍ | 3021/12384 [6:24:30<19:55:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 24%|██▍ | 3021/12384 [6:24:37<19:55:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 24%|██▍ | 3022/12384 [6:24:37<19:51:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 24%|██▍ | 3022/12384 [6:24:45<19:51:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 24%|██▍ | 3023/12384 [6:24:45<19:50:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 24%|██▍ | 3023/12384 [6:24:52<19:50:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 24%|██▍ | 3024/12384 [6:24:52<19:49:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 24%|██▍ | 3024/12384 [6:25:00<19:49:18, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 1: 24%|██▍ | 3025/12384 [6:25:00<19:47:17, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 1: 24%|██▍ | 3025/12384 [6:25:08<19:47:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 1: 24%|██▍ | 3026/12384 [6:25:08<19:47:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 1: 24%|██▍ | 3026/12384 [6:25:15<19:47:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 24%|██▍ | 3027/12384 [6:25:15<19:46:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 24%|██▍ | 3027/12384 [6:25:23<19:46:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 24%|██▍ | 3028/12384 [6:25:23<19:45:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 24%|██▍ | 3028/12384 [6:25:31<19:45:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 1: 24%|██▍ | 3029/12384 [6:25:31<20:01:28, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 1: 24%|██▍ | 3029/12384 [6:25:38<20:01:28, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.44s]
Epoch 1: 24%|██▍ | 3030/12384 [6:25:38<19:56:43, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.44s]
Epoch 1: 24%|██▍ | 3030/12384 [6:25:46<19:56:43, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 1: 24%|██▍ | 3031/12384 [6:25:46<19:53:18, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 1: 24%|██▍ | 3031/12384 [6:25:54<19:53:18, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.83s]
Epoch 1: 24%|██▍ | 3032/12384 [6:25:54<19:51:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.83s]
Epoch 1: 24%|██▍ | 3032/12384 [6:26:01<19:51:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 1: 24%|██▍ | 3033/12384 [6:26:01<19:50:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 1: 24%|██▍ | 3033/12384 [6:26:09<19:50:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 1: 24%|██▍ | 3034/12384 [6:26:09<19:48:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 1: 24%|██▍ | 3034/12384 [6:26:16<19:48:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 25%|██▍ | 3035/12384 [6:26:16<19:47:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 25%|██▍ | 3035/12384 [6:26:24<19:47:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 25%|██▍ | 3036/12384 [6:26:24<19:46:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 25%|██▍ | 3036/12384 [6:26:32<19:46:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 25%|██▍ | 3037/12384 [6:26:32<19:45:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 25%|██▍ | 3037/12384 [6:26:39<19:45:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.59s]
Epoch 1: 25%|██▍ | 3038/12384 [6:26:39<19:46:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.59s]
Epoch 1: 25%|██▍ | 3038/12384 [6:26:47<19:46:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.63s]
Epoch 1: 25%|██▍ | 3039/12384 [6:26:47<19:45:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.63s]
Epoch 1: 25%|██▍ | 3039/12384 [6:26:54<19:45:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 25%|██▍ | 3040/12384 [6:26:54<19:44:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 25%|██▍ | 3040/12384 [6:27:02<19:44:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.74s]
Epoch 1: 25%|██▍ | 3041/12384 [6:27:02<19:45:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.74s]
Epoch 1: 25%|██▍ | 3041/12384 [6:27:10<19:45:13, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.76s]
Epoch 1: 25%|██▍ | 3042/12384 [6:27:10<19:45:02, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.76s]
Epoch 1: 25%|██▍ | 3042/12384 [6:27:17<19:45:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 25%|██▍ | 3043/12384 [6:27:17<19:51:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 25%|██▍ | 3043/12384 [6:27:25<19:51:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 25%|██▍ | 3044/12384 [6:27:25<20:03:06, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 25%|██▍ | 3044/12384 [6:27:33<20:03:06, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 1: 25%|██▍ | 3045/12384 [6:27:33<19:57:06, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 1: 25%|██▍ | 3045/12384 [6:27:41<19:57:06, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 1: 25%|██▍ | 3046/12384 [6:27:41<19:53:26, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 1: 25%|██▍ | 3046/12384 [6:27:48<19:53:26, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=10.03s]
Epoch 1: 25%|██▍ | 3047/12384 [6:27:48<19:49:55, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=10.03s]
Epoch 1: 25%|██▍ | 3047/12384 [6:27:56<19:49:55, 7.65s/it, loss=0.0001, acc=0.9997, iter_time=8.91s]
Epoch 1: 25%|██▍ | 3048/12384 [6:27:56<19:47:53, 7.63s/it, loss=0.0001, acc=0.9997, iter_time=8.91s]
Epoch 1: 25%|██▍ | 3048/12384 [6:28:03<19:47:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 25%|██▍ | 3049/12384 [6:28:03<19:45:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 25%|██▍ | 3049/12384 [6:28:11<19:45:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 25%|██▍ | 3050/12384 [6:28:11<19:49:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 25%|██▍ | 3050/12384 [6:28:19<19:49:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 1: 25%|██▍ | 3051/12384 [6:28:19<19:47:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 1: 25%|██▍ | 3051/12384 [6:28:26<19:47:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 1: 25%|██▍ | 3052/12384 [6:28:26<19:45:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 1: 25%|██▍ | 3052/12384 [6:28:34<19:45:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 25%|██▍ | 3053/12384 [6:28:34<19:45:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 25%|██▍ | 3053/12384 [6:28:41<19:45:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 25%|██▍ | 3054/12384 [6:28:41<19:44:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 25%|██▍ | 3054/12384 [6:28:49<19:44:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 25%|██▍ | 3055/12384 [6:28:49<19:59:56, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 25%|██▍ | 3055/12384 [6:28:57<19:59:56, 7.72s/it, loss=0.0000, acc=0.9994, iter_time=8.33s]
Epoch 1: 25%|██▍ | 3056/12384 [6:28:57<19:55:38, 7.69s/it, loss=0.0000, acc=0.9994, iter_time=8.33s]
Epoch 1: 25%|██▍ | 3056/12384 [6:29:05<19:55:38, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 25%|██▍ | 3057/12384 [6:29:05<19:53:33, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 25%|██▍ | 3057/12384 [6:29:12<19:53:33, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 25%|██▍ | 3058/12384 [6:29:12<19:50:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 25%|██▍ | 3058/12384 [6:29:20<19:50:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 25%|██▍ | 3059/12384 [6:29:20<19:47:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 25%|██▍ | 3059/12384 [6:29:27<19:47:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 1: 25%|██▍ | 3060/12384 [6:29:27<19:44:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 1: 25%|██▍ | 3060/12384 [6:29:35<19:44:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 25%|██▍ | 3061/12384 [6:29:35<19:43:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 25%|██▍ | 3061/12384 [6:29:43<19:43:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 1: 25%|██▍ | 3062/12384 [6:29:43<19:46:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 1: 25%|██▍ | 3062/12384 [6:29:50<19:46:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 1: 25%|██▍ | 3063/12384 [6:29:50<19:45:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 1: 25%|██▍ | 3063/12384 [6:29:58<19:45:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 25%|██▍ | 3064/12384 [6:29:58<19:44:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 25%|██▍ | 3064/12384 [6:30:06<19:44:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 1: 25%|██▍ | 3065/12384 [6:30:06<19:43:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 1: 25%|██▍ | 3065/12384 [6:30:13<19:43:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 1: 25%|██▍ | 3066/12384 [6:30:13<19:43:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 1: 25%|██▍ | 3066/12384 [6:30:21<19:43:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 25%|██▍ | 3067/12384 [6:30:21<19:42:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 25%|██▍ | 3067/12384 [6:30:28<19:42:22, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.43s]
Epoch 1: 25%|██▍ | 3068/12384 [6:30:28<19:42:14, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.43s]
Epoch 1: 25%|██▍ | 3068/12384 [6:30:36<19:42:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 1: 25%|██▍ | 3069/12384 [6:30:36<19:41:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 1: 25%|██▍ | 3069/12384 [6:30:44<19:41:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 25%|██▍ | 3070/12384 [6:30:44<19:45:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 25%|██▍ | 3070/12384 [6:30:52<19:45:46, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.88s]
Epoch 1: 25%|██▍ | 3071/12384 [6:30:52<19:56:19, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.88s]
Epoch 1: 25%|██▍ | 3071/12384 [6:30:59<19:56:19, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 25%|██▍ | 3072/12384 [6:30:59<19:51:34, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 25%|██▍ | 3072/12384 [6:31:07<19:51:34, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 25%|██▍ | 3073/12384 [6:31:07<19:47:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 25%|██▍ | 3073/12384 [6:31:14<19:47:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 25%|██▍ | 3074/12384 [6:31:14<19:45:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 25%|██▍ | 3074/12384 [6:31:22<19:45:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 1: 25%|██▍ | 3075/12384 [6:31:22<19:42:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 1: 25%|██▍ | 3075/12384 [6:31:30<19:42:53, 7.62s/it, loss=0.0004, acc=0.9974, iter_time=10.10s]
Epoch 1: 25%|██▍ | 3076/12384 [6:31:30<19:42:01, 7.62s/it, loss=0.0004, acc=0.9974, iter_time=10.10s]
Epoch 1: 25%|██▍ | 3076/12384 [6:31:37<19:42:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 25%|██▍ | 3077/12384 [6:31:37<19:42:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 25%|██▍ | 3077/12384 [6:31:45<19:42:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 25%|██▍ | 3078/12384 [6:31:45<19:41:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 25%|██▍ | 3078/12384 [6:31:53<19:41:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 1: 25%|██▍ | 3079/12384 [6:31:53<19:45:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 1: 25%|██▍ | 3079/12384 [6:32:00<19:45:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 25%|██▍ | 3080/12384 [6:32:00<19:44:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 25%|██▍ | 3080/12384 [6:32:08<19:44:35, 7.64s/it, loss=0.0001, acc=0.9984, iter_time=5.16s]
Epoch 1: 25%|██▍ | 3081/12384 [6:32:08<19:59:09, 7.73s/it, loss=0.0001, acc=0.9984, iter_time=5.16s]
Epoch 1: 25%|██▍ | 3081/12384 [6:32:16<19:59:09, 7.73s/it, loss=0.0001, acc=1.0000, iter_time=8.52s]
Epoch 1: 25%|██▍ | 3082/12384 [6:32:16<19:52:05, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=8.52s]
Epoch 1: 25%|██▍ | 3082/12384 [6:32:23<19:52:05, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 1: 25%|██▍ | 3083/12384 [6:32:23<19:47:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 1: 25%|██▍ | 3083/12384 [6:32:31<19:47:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 25%|██▍ | 3084/12384 [6:32:31<19:49:54, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 25%|██▍ | 3084/12384 [6:32:39<19:49:54, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 1: 25%|██▍ | 3085/12384 [6:32:39<19:47:31, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 1: 25%|██▍ | 3085/12384 [6:32:46<19:47:31, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 25%|██▍ | 3086/12384 [6:32:46<19:47:31, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 25%|██▍ | 3086/12384 [6:32:54<19:47:31, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 25%|██▍ | 3087/12384 [6:32:54<19:45:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 25%|██▍ | 3087/12384 [6:33:02<19:45:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 25%|██▍ | 3088/12384 [6:33:02<19:44:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 25%|██▍ | 3088/12384 [6:33:09<19:44:56, 7.65s/it, loss=0.0004, acc=0.9990, iter_time=7.24s]
Epoch 1: 25%|██▍ | 3089/12384 [6:33:09<19:43:07, 7.64s/it, loss=0.0004, acc=0.9990, iter_time=7.24s]
Epoch 1: 25%|██▍ | 3089/12384 [6:33:17<19:43:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 1: 25%|██▍ | 3090/12384 [6:33:17<19:41:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 1: 25%|██▍ | 3090/12384 [6:33:24<19:41:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 25%|██▍ | 3091/12384 [6:33:24<19:43:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 25%|██▍ | 3091/12384 [6:33:32<19:43:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.27s]
Epoch 1: 25%|██▍ | 3092/12384 [6:33:32<19:41:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.27s]
Epoch 1: 25%|██▍ | 3092/12384 [6:33:40<19:41:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 25%|██▍ | 3093/12384 [6:33:40<19:40:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 25%|██▍ | 3093/12384 [6:33:47<19:40:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 25%|██▍ | 3094/12384 [6:33:47<19:39:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 25%|██▍ | 3094/12384 [6:33:55<19:39:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 25%|██▍ | 3095/12384 [6:33:55<19:38:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 25%|██▍ | 3095/12384 [6:34:03<19:38:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 1: 25%|██▌ | 3096/12384 [6:34:03<19:50:38, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 1: 25%|██▌ | 3096/12384 [6:34:10<19:50:38, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 25%|██▌ | 3097/12384 [6:34:10<19:47:36, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 25%|██▌ | 3097/12384 [6:34:18<19:47:36, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 25%|██▌ | 3098/12384 [6:34:18<19:46:22, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 25%|██▌ | 3098/12384 [6:34:26<19:46:22, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 1: 25%|██▌ | 3099/12384 [6:34:26<19:44:37, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 1: 25%|██▌ | 3099/12384 [6:34:33<19:44:37, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 1: 25%|██▌ | 3100/12384 [6:34:33<19:42:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 1: 25%|██▌ | 3100/12384 [6:34:41<19:42:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 1: 25%|██▌ | 3101/12384 [6:34:41<19:39:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 1: 25%|██▌ | 3101/12384 [6:34:48<19:39:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 1: 25%|██▌ | 3102/12384 [6:34:48<19:38:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 1: 25%|██▌ | 3102/12384 [6:34:56<19:38:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 1: 25%|██▌ | 3103/12384 [6:34:56<19:37:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 1: 25%|██▌ | 3103/12384 [6:35:04<19:37:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 1: 25%|██▌ | 3104/12384 [6:35:04<19:40:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 1: 25%|██▌ | 3104/12384 [6:35:11<19:40:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 1: 25%|██▌ | 3105/12384 [6:35:11<19:37:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 1: 25%|██▌ | 3105/12384 [6:35:19<19:37:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.25s]
Epoch 1: 25%|██▌ | 3106/12384 [6:35:19<19:39:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.25s]
Epoch 1: 25%|██▌ | 3106/12384 [6:35:27<19:39:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.41s]
Epoch 1: 25%|██▌ | 3107/12384 [6:35:27<19:53:30, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.41s]
Epoch 1: 25%|██▌ | 3107/12384 [6:35:35<19:53:30, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=7.18s]
Epoch 1: 25%|██▌ | 3108/12384 [6:35:35<19:48:21, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.18s]
Epoch 1: 25%|██▌ | 3108/12384 [6:35:42<19:48:21, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 1: 25%|██▌ | 3109/12384 [6:35:42<19:44:13, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 1: 25%|██▌ | 3109/12384 [6:35:50<19:44:13, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 25%|██▌ | 3110/12384 [6:35:50<19:42:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 25%|██▌ | 3110/12384 [6:35:57<19:42:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 25%|██▌ | 3111/12384 [6:35:57<19:43:45, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 25%|██▌ | 3111/12384 [6:36:05<19:43:45, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 1: 25%|██▌ | 3112/12384 [6:36:05<19:41:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 1: 25%|██▌ | 3112/12384 [6:36:13<19:41:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 25%|██▌ | 3113/12384 [6:36:13<19:40:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 25%|██▌ | 3113/12384 [6:36:20<19:40:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 25%|██▌ | 3114/12384 [6:36:20<19:41:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 25%|██▌ | 3114/12384 [6:36:28<19:41:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 25%|██▌ | 3115/12384 [6:36:28<19:38:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 25%|██▌ | 3115/12384 [6:36:36<19:38:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.53s]
Epoch 1: 25%|██▌ | 3116/12384 [6:36:36<19:47:45, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.53s]
Epoch 1: 25%|██▌ | 3116/12384 [6:36:43<19:47:45, 7.69s/it, loss=0.0009, acc=0.9980, iter_time=4.63s]
Epoch 1: 25%|██▌ | 3117/12384 [6:36:43<19:44:16, 7.67s/it, loss=0.0009, acc=0.9980, iter_time=4.63s]
Epoch 1: 25%|██▌ | 3117/12384 [6:36:51<19:44:16, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.38s]
Epoch 1: 25%|██▌ | 3118/12384 [6:36:51<19:40:57, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.38s]
Epoch 1: 25%|██▌ | 3118/12384 [6:36:59<19:40:57, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 1: 25%|██▌ | 3119/12384 [6:36:59<19:38:29, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 1: 25%|██▌ | 3119/12384 [6:37:06<19:38:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 25%|██▌ | 3120/12384 [6:37:06<19:36:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 25%|██▌ | 3120/12384 [6:37:14<19:36:27, 7.62s/it, loss=0.0001, acc=0.9995, iter_time=7.64s]
Epoch 1: 25%|██▌ | 3121/12384 [6:37:14<19:34:40, 7.61s/it, loss=0.0001, acc=0.9995, iter_time=7.64s]
Epoch 1: 25%|██▌ | 3121/12384 [6:37:21<19:34:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 25%|██▌ | 3122/12384 [6:37:21<19:38:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 25%|██▌ | 3122/12384 [6:37:29<19:38:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 1: 25%|██▌ | 3123/12384 [6:37:29<19:49:31, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 1: 25%|██▌ | 3123/12384 [6:37:37<19:49:31, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 25%|██▌ | 3124/12384 [6:37:37<19:45:17, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 25%|██▌ | 3124/12384 [6:37:45<19:45:17, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 25%|██▌ | 3125/12384 [6:37:45<19:42:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 25%|██▌ | 3125/12384 [6:37:52<19:42:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=3.62s]
Epoch 1: 25%|██▌ | 3126/12384 [6:37:52<19:38:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.62s]
Epoch 1: 25%|██▌ | 3126/12384 [6:38:00<19:38:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.57s]
Epoch 1: 25%|██▌ | 3127/12384 [6:38:00<19:37:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.57s]
Epoch 1: 25%|██▌ | 3127/12384 [6:38:07<19:37:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 25%|██▌ | 3128/12384 [6:38:07<19:38:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 25%|██▌ | 3128/12384 [6:38:15<19:38:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 1: 25%|██▌ | 3129/12384 [6:38:15<19:36:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 1: 25%|██▌ | 3129/12384 [6:38:23<19:36:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 1: 25%|██▌ | 3130/12384 [6:38:23<19:36:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 1: 25%|██▌ | 3130/12384 [6:38:30<19:36:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 25%|██▌ | 3131/12384 [6:38:30<19:35:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 25%|██▌ | 3131/12384 [6:38:38<19:35:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 25%|██▌ | 3132/12384 [6:38:38<19:35:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 25%|██▌ | 3132/12384 [6:38:46<19:35:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 1: 25%|██▌ | 3133/12384 [6:38:46<19:52:11, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 1: 25%|██▌ | 3133/12384 [6:38:53<19:52:11, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 25%|██▌ | 3134/12384 [6:38:53<19:46:14, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 25%|██▌ | 3134/12384 [6:39:01<19:46:14, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 1: 25%|██▌ | 3135/12384 [6:39:01<19:40:56, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 1: 25%|██▌ | 3135/12384 [6:39:09<19:40:56, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 25%|██▌ | 3136/12384 [6:39:09<19:38:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 25%|██▌ | 3136/12384 [6:39:16<19:38:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.16s]
Epoch 1: 25%|██▌ | 3137/12384 [6:39:16<19:36:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.16s]
Epoch 1: 25%|██▌ | 3137/12384 [6:39:24<19:36:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.67s]
Epoch 1: 25%|██▌ | 3138/12384 [6:39:24<19:34:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.67s]
Epoch 1: 25%|██▌ | 3138/12384 [6:39:31<19:34:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 25%|██▌ | 3139/12384 [6:39:31<19:33:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 25%|██▌ | 3139/12384 [6:39:39<19:33:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 25%|██▌ | 3140/12384 [6:39:39<19:32:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 25%|██▌ | 3140/12384 [6:39:47<19:32:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 25%|██▌ | 3141/12384 [6:39:47<19:32:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 25%|██▌ | 3141/12384 [6:39:54<19:32:54, 7.61s/it, loss=0.0002, acc=0.9981, iter_time=5.87s]
Epoch 1: 25%|██▌ | 3142/12384 [6:39:54<19:31:45, 7.61s/it, loss=0.0002, acc=0.9981, iter_time=5.87s]
Epoch 1: 25%|██▌ | 3142/12384 [6:40:02<19:31:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.40s]
Epoch 1: 25%|██▌ | 3143/12384 [6:40:02<19:32:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.40s]
Epoch 1: 25%|██▌ | 3143/12384 [6:40:10<19:32:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.54s]
Epoch 1: 25%|██▌ | 3144/12384 [6:40:10<19:32:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.54s]
Epoch 1: 25%|██▌ | 3144/12384 [6:40:17<19:32:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.71s]
Epoch 1: 25%|██▌ | 3145/12384 [6:40:17<19:32:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.71s]
Epoch 1: 25%|██▌ | 3145/12384 [6:40:25<19:32:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 1: 25%|██▌ | 3146/12384 [6:40:25<19:32:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 1: 25%|██▌ | 3146/12384 [6:40:32<19:32:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 25%|██▌ | 3147/12384 [6:40:32<19:32:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 25%|██▌ | 3147/12384 [6:40:40<19:32:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 25%|██▌ | 3148/12384 [6:40:40<19:31:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 25%|██▌ | 3148/12384 [6:40:48<19:31:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 1: 25%|██▌ | 3149/12384 [6:40:48<19:31:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 1: 25%|██▌ | 3149/12384 [6:40:55<19:31:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 1: 25%|██▌ | 3150/12384 [6:40:55<19:30:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 1: 25%|██▌ | 3150/12384 [6:41:03<19:30:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 25%|██▌ | 3151/12384 [6:41:03<19:29:40, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 25%|██▌ | 3151/12384 [6:41:10<19:29:40, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 25%|██▌ | 3152/12384 [6:41:10<19:30:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 25%|██▌ | 3152/12384 [6:41:18<19:30:29, 7.61s/it, loss=0.0002, acc=0.9988, iter_time=7.53s]
Epoch 1: 25%|██▌ | 3153/12384 [6:41:18<19:30:31, 7.61s/it, loss=0.0002, acc=0.9988, iter_time=7.53s]
Epoch 1: 25%|██▌ | 3153/12384 [6:41:26<19:30:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 25%|██▌ | 3154/12384 [6:41:26<19:30:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 25%|██▌ | 3154/12384 [6:41:33<19:30:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 25%|██▌ | 3155/12384 [6:41:33<19:30:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 25%|██▌ | 3155/12384 [6:41:41<19:30:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 25%|██▌ | 3156/12384 [6:41:41<19:30:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 25%|██▌ | 3156/12384 [6:41:48<19:30:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.11s]
Epoch 1: 25%|██▌ | 3157/12384 [6:41:48<19:30:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.11s]
Epoch 1: 25%|██▌ | 3157/12384 [6:41:56<19:30:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.89s]
Epoch 1: 26%|██▌ | 3158/12384 [6:41:56<19:31:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.89s]
Epoch 1: 26%|██▌ | 3158/12384 [6:42:04<19:31:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 26%|██▌ | 3159/12384 [6:42:04<19:31:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 26%|██▌ | 3159/12384 [6:42:12<19:31:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.68s]
Epoch 1: 26%|██▌ | 3160/12384 [6:42:12<19:46:57, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.68s]
Epoch 1: 26%|██▌ | 3160/12384 [6:42:19<19:46:57, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=4.97s]
Epoch 1: 26%|██▌ | 3161/12384 [6:42:19<19:40:43, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.97s]
Epoch 1: 26%|██▌ | 3161/12384 [6:42:27<19:40:43, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.11s]
Epoch 1: 26%|██▌ | 3162/12384 [6:42:27<19:37:13, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.11s]
Epoch 1: 26%|██▌ | 3162/12384 [6:42:34<19:37:13, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 1: 26%|██▌ | 3163/12384 [6:42:34<19:34:45, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 1: 26%|██▌ | 3163/12384 [6:42:42<19:34:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 26%|██▌ | 3164/12384 [6:42:42<19:33:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 26%|██▌ | 3164/12384 [6:42:50<19:33:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 26%|██▌ | 3165/12384 [6:42:50<19:31:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 26%|██▌ | 3165/12384 [6:42:57<19:31:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 1: 26%|██▌ | 3166/12384 [6:42:57<19:35:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 1: 26%|██▌ | 3166/12384 [6:43:05<19:35:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 26%|██▌ | 3167/12384 [6:43:05<19:34:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 26%|██▌ | 3167/12384 [6:43:13<19:34:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 26%|██▌ | 3168/12384 [6:43:13<19:32:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 26%|██▌ | 3168/12384 [6:43:20<19:32:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 1: 26%|██▌ | 3169/12384 [6:43:20<19:30:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 1: 26%|██▌ | 3169/12384 [6:43:28<19:30:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 26%|██▌ | 3170/12384 [6:43:28<19:27:46, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 26%|██▌ | 3170/12384 [6:43:35<19:27:46, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 1: 26%|██▌ | 3171/12384 [6:43:35<19:27:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 1: 26%|██▌ | 3171/12384 [6:43:43<19:27:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 1: 26%|██▌ | 3172/12384 [6:43:43<19:28:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 1: 26%|██▌ | 3172/12384 [6:43:51<19:28:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 1: 26%|██▌ | 3173/12384 [6:43:51<19:27:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 1: 26%|██▌ | 3173/12384 [6:43:58<19:27:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=3.85s]
Epoch 1: 26%|██▌ | 3174/12384 [6:43:58<19:28:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.85s]
Epoch 1: 26%|██▌ | 3174/12384 [6:44:06<19:28:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.35s]
Epoch 1: 26%|██▌ | 3175/12384 [6:44:06<19:28:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.35s]
Epoch 1: 26%|██▌ | 3175/12384 [6:44:14<19:28:06, 7.61s/it, loss=0.0005, acc=0.9980, iter_time=8.34s]
Epoch 1: 26%|██▌ | 3176/12384 [6:44:14<19:42:29, 7.71s/it, loss=0.0005, acc=0.9980, iter_time=8.34s]
Epoch 1: 26%|██▌ | 3176/12384 [6:44:21<19:42:29, 7.71s/it, loss=0.0002, acc=0.9986, iter_time=7.22s]
Epoch 1: 26%|██▌ | 3177/12384 [6:44:21<19:38:17, 7.68s/it, loss=0.0002, acc=0.9986, iter_time=7.22s]
Epoch 1: 26%|██▌ | 3177/12384 [6:44:29<19:38:17, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 1: 26%|██▌ | 3178/12384 [6:44:29<19:33:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 1: 26%|██▌ | 3178/12384 [6:44:37<19:33:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 1: 26%|██▌ | 3179/12384 [6:44:37<19:32:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 1: 26%|██▌ | 3179/12384 [6:44:44<19:32:02, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.23s]
Epoch 1: 26%|██▌ | 3180/12384 [6:44:44<19:30:56, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.23s]
Epoch 1: 26%|██▌ | 3180/12384 [6:44:52<19:30:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 26%|██▌ | 3181/12384 [6:44:52<19:29:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 26%|██▌ | 3181/12384 [6:44:59<19:29:47, 7.63s/it, loss=0.0007, acc=0.9982, iter_time=7.62s]
Epoch 1: 26%|██▌ | 3182/12384 [6:44:59<19:28:32, 7.62s/it, loss=0.0007, acc=0.9982, iter_time=7.62s]
Epoch 1: 26%|██▌ | 3182/12384 [6:45:07<19:28:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 26%|██▌ | 3183/12384 [6:45:07<19:27:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 26%|██▌ | 3183/12384 [6:45:15<19:27:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 26%|██▌ | 3184/12384 [6:45:15<19:26:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 26%|██▌ | 3184/12384 [6:45:22<19:26:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 26%|██▌ | 3185/12384 [6:45:22<19:26:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 26%|██▌ | 3185/12384 [6:45:30<19:26:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 26%|██▌ | 3186/12384 [6:45:30<19:46:08, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 26%|██▌ | 3186/12384 [6:45:38<19:46:08, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 26%|██▌ | 3187/12384 [6:45:38<19:41:14, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 26%|██▌ | 3187/12384 [6:45:46<19:41:14, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 26%|██▌ | 3188/12384 [6:45:46<19:37:57, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 26%|██▌ | 3188/12384 [6:45:53<19:37:57, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 1: 26%|██▌ | 3189/12384 [6:45:53<19:32:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 1: 26%|██▌ | 3189/12384 [6:46:01<19:32:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 1: 26%|██▌ | 3190/12384 [6:46:01<19:30:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 1: 26%|██▌ | 3190/12384 [6:46:08<19:30:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.26s]
Epoch 1: 26%|██▌ | 3191/12384 [6:46:08<19:29:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.26s]
Epoch 1: 26%|██▌ | 3191/12384 [6:46:16<19:29:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.36s]
Epoch 1: 26%|██▌ | 3192/12384 [6:46:16<19:28:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.36s]
Epoch 1: 26%|██▌ | 3192/12384 [6:46:24<19:28:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 26%|██▌ | 3193/12384 [6:46:24<19:26:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 26%|██▌ | 3193/12384 [6:46:31<19:26:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 26%|██▌ | 3194/12384 [6:46:31<19:25:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 26%|██▌ | 3194/12384 [6:46:39<19:25:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 26%|██▌ | 3195/12384 [6:46:39<19:25:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 26%|██▌ | 3195/12384 [6:46:46<19:25:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.11s]
Epoch 1: 26%|██▌ | 3196/12384 [6:46:46<19:24:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.11s]
Epoch 1: 26%|██▌ | 3196/12384 [6:46:54<19:24:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 1: 26%|██▌ | 3197/12384 [6:46:54<19:24:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 1: 26%|██▌ | 3197/12384 [6:47:02<19:24:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 26%|██▌ | 3198/12384 [6:47:02<19:24:14, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 26%|██▌ | 3198/12384 [6:47:09<19:24:14, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 26%|██▌ | 3199/12384 [6:47:09<19:24:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 26%|██▌ | 3199/12384 [6:47:17<19:24:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 26%|██▌ | 3200/12384 [6:47:17<19:24:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 26%|██▌ | 3200/12384 [6:47:24<19:24:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.89s]
Epoch 1: 26%|██▌ | 3201/12384 [6:47:24<19:24:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.89s]
Epoch 1: 26%|██▌ | 3201/12384 [6:47:32<19:24:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 1: 26%|██▌ | 3202/12384 [6:47:32<19:25:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 1: 26%|██▌ | 3202/12384 [6:47:40<19:25:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 1: 26%|██▌ | 3203/12384 [6:47:40<19:24:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 1: 26%|██▌ | 3203/12384 [6:47:47<19:24:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 1: 26%|██▌ | 3204/12384 [6:47:47<19:29:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 1: 26%|██▌ | 3204/12384 [6:47:55<19:29:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.32s]
Epoch 1: 26%|██▌ | 3205/12384 [6:47:55<19:27:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.32s]
Epoch 1: 26%|██▌ | 3205/12384 [6:48:03<19:27:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 1: 26%|██▌ | 3206/12384 [6:48:03<19:26:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 1: 26%|██▌ | 3206/12384 [6:48:10<19:26:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 1: 26%|██▌ | 3207/12384 [6:48:10<19:24:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 1: 26%|██▌ | 3207/12384 [6:48:18<19:24:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 26%|██▌ | 3208/12384 [6:48:18<19:24:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 26%|██▌ | 3208/12384 [6:48:25<19:24:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 1: 26%|██▌ | 3209/12384 [6:48:25<19:28:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 1: 26%|██▌ | 3209/12384 [6:48:33<19:28:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 26%|██▌ | 3210/12384 [6:48:33<19:29:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 26%|██▌ | 3210/12384 [6:48:41<19:29:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 26%|██▌ | 3211/12384 [6:48:41<19:28:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 26%|██▌ | 3211/12384 [6:48:48<19:28:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 1: 26%|██▌ | 3212/12384 [6:48:48<19:26:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 1: 26%|██▌ | 3212/12384 [6:48:56<19:26:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.46s]
Epoch 1: 26%|██▌ | 3213/12384 [6:48:56<19:41:01, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=9.46s]
Epoch 1: 26%|██▌ | 3213/12384 [6:49:04<19:41:01, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.46s]
Epoch 1: 26%|██▌ | 3214/12384 [6:49:04<19:35:43, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.46s]
Epoch 1: 26%|██▌ | 3214/12384 [6:49:11<19:35:43, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 1: 26%|██▌ | 3215/12384 [6:49:11<19:32:01, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 1: 26%|██▌ | 3215/12384 [6:49:19<19:32:01, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 26%|██▌ | 3216/12384 [6:49:19<19:28:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 26%|██▌ | 3216/12384 [6:49:27<19:28:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 26%|██▌ | 3217/12384 [6:49:27<19:26:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 26%|██▌ | 3217/12384 [6:49:34<19:26:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 26%|██▌ | 3218/12384 [6:49:34<19:25:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 26%|██▌ | 3218/12384 [6:49:42<19:25:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 26%|██▌ | 3219/12384 [6:49:42<19:24:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 26%|██▌ | 3219/12384 [6:49:50<19:24:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.95s]
Epoch 1: 26%|██▌ | 3220/12384 [6:49:50<19:25:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.95s]
Epoch 1: 26%|██▌ | 3220/12384 [6:49:57<19:25:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 26%|██▌ | 3221/12384 [6:49:57<19:24:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 26%|██▌ | 3221/12384 [6:50:05<19:24:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.33s]
Epoch 1: 26%|██▌ | 3222/12384 [6:50:05<19:29:13, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.33s]
Epoch 1: 26%|██▌ | 3222/12384 [6:50:13<19:29:13, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.02s]
Epoch 1: 26%|██▌ | 3223/12384 [6:50:13<19:27:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.02s]
Epoch 1: 26%|██▌ | 3223/12384 [6:50:20<19:27:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.00s]
Epoch 1: 26%|██▌ | 3224/12384 [6:50:20<19:26:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.00s]
Epoch 1: 26%|██▌ | 3224/12384 [6:50:28<19:26:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.24s]
Epoch 1: 26%|██▌ | 3225/12384 [6:50:28<19:23:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.24s]
Epoch 1: 26%|██▌ | 3225/12384 [6:50:35<19:23:33, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.57s]
Epoch 1: 26%|██▌ | 3226/12384 [6:50:35<19:23:08, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.57s]
Epoch 1: 26%|██▌ | 3226/12384 [6:50:43<19:23:08, 7.62s/it, loss=0.0019, acc=0.9958, iter_time=6.09s]
Epoch 1: 26%|██▌ | 3227/12384 [6:50:43<19:23:02, 7.62s/it, loss=0.0019, acc=0.9958, iter_time=6.09s]
Epoch 1: 26%|██▌ | 3227/12384 [6:50:51<19:23:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.91s]
Epoch 1: 26%|██▌ | 3228/12384 [6:50:51<19:20:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.91s]
Epoch 1: 26%|██▌ | 3228/12384 [6:50:58<19:20:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 1: 26%|██▌ | 3229/12384 [6:50:58<19:33:54, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 1: 26%|██▌ | 3229/12384 [6:51:06<19:33:54, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 26%|██▌ | 3230/12384 [6:51:06<19:29:38, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 26%|██▌ | 3230/12384 [6:51:14<19:29:38, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 26%|██▌ | 3231/12384 [6:51:14<19:25:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 26%|██▌ | 3231/12384 [6:51:21<19:25:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 1: 26%|██▌ | 3232/12384 [6:51:21<19:23:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 1: 26%|██▌ | 3232/12384 [6:51:29<19:23:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 26%|██▌ | 3233/12384 [6:51:29<19:23:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 26%|██▌ | 3233/12384 [6:51:36<19:23:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 26%|██▌ | 3234/12384 [6:51:36<19:21:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 26%|██▌ | 3234/12384 [6:51:44<19:21:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 1: 26%|██▌ | 3235/12384 [6:51:44<19:20:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 1: 26%|██▌ | 3235/12384 [6:51:52<19:20:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.30s]
Epoch 1: 26%|██▌ | 3236/12384 [6:51:52<19:19:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.30s]
Epoch 1: 26%|██▌ | 3236/12384 [6:51:59<19:19:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 1: 26%|██▌ | 3237/12384 [6:51:59<19:18:58, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 1: 26%|██▌ | 3237/12384 [6:52:07<19:18:58, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 26%|██▌ | 3238/12384 [6:52:07<19:18:07, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 26%|██▌ | 3238/12384 [6:52:15<19:18:07, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 26%|██▌ | 3239/12384 [6:52:15<19:34:18, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 26%|██▌ | 3239/12384 [6:52:22<19:34:18, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 26%|██▌ | 3240/12384 [6:52:22<19:30:29, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 26%|██▌ | 3240/12384 [6:52:30<19:30:29, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 26%|██▌ | 3241/12384 [6:52:30<19:27:27, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 26%|██▌ | 3241/12384 [6:52:38<19:27:27, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 26%|██▌ | 3242/12384 [6:52:38<19:25:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 26%|██▌ | 3242/12384 [6:52:45<19:25:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 26%|██▌ | 3243/12384 [6:52:45<19:24:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 26%|██▌ | 3243/12384 [6:52:53<19:24:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 26%|██▌ | 3244/12384 [6:52:53<19:22:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 26%|██▌ | 3244/12384 [6:53:00<19:22:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 26%|██▌ | 3245/12384 [6:53:00<19:21:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 26%|██▌ | 3245/12384 [6:53:08<19:21:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 1: 26%|██▌ | 3246/12384 [6:53:08<19:20:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 1: 26%|██▌ | 3246/12384 [6:53:16<19:20:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 26%|██▌ | 3247/12384 [6:53:16<19:19:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 26%|██▌ | 3247/12384 [6:53:23<19:19:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 26%|██▌ | 3248/12384 [6:53:23<19:19:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 26%|██▌ | 3248/12384 [6:53:31<19:19:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 26%|██▌ | 3249/12384 [6:53:31<19:18:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 26%|██▌ | 3249/12384 [6:53:39<19:18:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 1: 26%|██▌ | 3250/12384 [6:53:39<19:21:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 1: 26%|██▌ | 3250/12384 [6:53:46<19:21:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 26%|██▋ | 3251/12384 [6:53:46<19:19:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 26%|██▋ | 3251/12384 [6:53:54<19:19:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 1: 26%|██▋ | 3252/12384 [6:53:54<19:19:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 1: 26%|██▋ | 3252/12384 [6:54:01<19:19:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 26%|██▋ | 3253/12384 [6:54:01<19:18:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 26%|██▋ | 3253/12384 [6:54:09<19:18:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 26%|██▋ | 3254/12384 [6:54:09<19:18:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 26%|██▋ | 3254/12384 [6:54:17<19:18:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 1: 26%|██▋ | 3255/12384 [6:54:17<19:29:50, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 1: 26%|██▋ | 3255/12384 [6:54:24<19:29:50, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 26%|██▋ | 3256/12384 [6:54:24<19:26:20, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 26%|██▋ | 3256/12384 [6:54:32<19:26:20, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=2.47s]
Epoch 1: 26%|██▋ | 3257/12384 [6:54:32<19:23:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=2.47s]
Epoch 1: 26%|██▋ | 3257/12384 [6:54:40<19:23:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 1: 26%|██▋ | 3258/12384 [6:54:40<19:25:13, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 1: 26%|██▋ | 3258/12384 [6:54:47<19:25:13, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.05s]
Epoch 1: 26%|██▋ | 3259/12384 [6:54:47<19:22:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.05s]
Epoch 1: 26%|██▋ | 3259/12384 [6:54:55<19:22:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 26%|██▋ | 3260/12384 [6:54:55<19:19:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 26%|██▋ | 3260/12384 [6:55:03<19:19:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 1: 26%|██▋ | 3261/12384 [6:55:03<19:18:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 1: 26%|██▋ | 3261/12384 [6:55:10<19:18:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 1: 26%|██▋ | 3262/12384 [6:55:10<19:17:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 1: 26%|██▋ | 3262/12384 [6:55:18<19:17:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 1: 26%|██▋ | 3263/12384 [6:55:18<19:16:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 1: 26%|██▋ | 3263/12384 [6:55:25<19:16:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 1: 26%|██▋ | 3264/12384 [6:55:25<19:16:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 1: 26%|██▋ | 3264/12384 [6:55:33<19:16:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 26%|██▋ | 3265/12384 [6:55:33<19:32:02, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 26%|██▋ | 3265/12384 [6:55:41<19:32:02, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.38s]
Epoch 1: 26%|██▋ | 3266/12384 [6:55:41<19:30:44, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.38s]
Epoch 1: 26%|██▋ | 3266/12384 [6:55:49<19:30:44, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.73s]
Epoch 1: 26%|██▋ | 3267/12384 [6:55:49<19:26:29, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.73s]
Epoch 1: 26%|██▋ | 3267/12384 [6:55:56<19:26:29, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 1: 26%|██▋ | 3268/12384 [6:55:56<19:22:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 1: 26%|██▋ | 3268/12384 [6:56:04<19:22:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 26%|██▋ | 3269/12384 [6:56:04<19:20:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 26%|██▋ | 3269/12384 [6:56:11<19:20:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 26%|██▋ | 3270/12384 [6:56:11<19:18:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 26%|██▋ | 3270/12384 [6:56:19<19:18:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 26%|██▋ | 3271/12384 [6:56:19<19:21:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 26%|██▋ | 3271/12384 [6:56:27<19:21:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 26%|██▋ | 3272/12384 [6:56:27<19:20:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 26%|██▋ | 3272/12384 [6:56:34<19:20:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 26%|██▋ | 3273/12384 [6:56:34<19:18:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 26%|██▋ | 3273/12384 [6:56:42<19:18:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.55s]
Epoch 1: 26%|██▋ | 3274/12384 [6:56:42<19:21:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.55s]
Epoch 1: 26%|██▋ | 3274/12384 [6:56:50<19:21:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.77s]
Epoch 1: 26%|██▋ | 3275/12384 [6:56:50<19:19:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.77s]
Epoch 1: 26%|██▋ | 3275/12384 [6:56:57<19:19:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.00s]
Epoch 1: 26%|██▋ | 3276/12384 [6:56:57<19:18:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.00s]
Epoch 1: 26%|██▋ | 3276/12384 [6:57:05<19:18:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 1: 26%|██▋ | 3277/12384 [6:57:05<19:19:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 1: 26%|██▋ | 3277/12384 [6:57:13<19:19:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 26%|██▋ | 3278/12384 [6:57:13<19:16:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 26%|██▋ | 3278/12384 [6:57:20<19:16:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 26%|██▋ | 3279/12384 [6:57:20<19:16:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 26%|██▋ | 3279/12384 [6:57:28<19:16:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 26%|██▋ | 3280/12384 [6:57:28<19:16:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 26%|██▋ | 3280/12384 [6:57:36<19:16:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.47s]
Epoch 1: 26%|██▋ | 3281/12384 [6:57:36<19:27:05, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.47s]
Epoch 1: 26%|██▋ | 3281/12384 [6:57:43<19:27:05, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 27%|██▋ | 3282/12384 [6:57:43<19:23:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 27%|██▋ | 3282/12384 [6:57:51<19:23:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 27%|██▋ | 3283/12384 [6:57:51<19:19:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 27%|██▋ | 3283/12384 [6:57:58<19:19:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 27%|██▋ | 3284/12384 [6:57:58<19:17:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 27%|██▋ | 3284/12384 [6:58:06<19:17:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 27%|██▋ | 3285/12384 [6:58:06<19:16:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 27%|██▋ | 3285/12384 [6:58:14<19:16:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 1: 27%|██▋ | 3286/12384 [6:58:14<19:16:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 1: 27%|██▋ | 3286/12384 [6:58:21<19:16:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 1: 27%|██▋ | 3287/12384 [6:58:21<19:20:51, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 1: 27%|██▋ | 3287/12384 [6:58:29<19:20:51, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=8.13s]
Epoch 1: 27%|██▋ | 3288/12384 [6:58:29<19:18:42, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=8.13s]
Epoch 1: 27%|██▋ | 3288/12384 [6:58:37<19:18:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 27%|██▋ | 3289/12384 [6:58:37<19:17:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 27%|██▋ | 3289/12384 [6:58:44<19:17:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 27%|██▋ | 3290/12384 [6:58:44<19:16:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 27%|██▋ | 3290/12384 [6:58:52<19:16:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 27%|██▋ | 3291/12384 [6:58:52<19:29:56, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 27%|██▋ | 3291/12384 [6:59:00<19:29:56, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 1: 27%|██▋ | 3292/12384 [6:59:00<19:24:52, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 1: 27%|██▋ | 3292/12384 [6:59:07<19:24:52, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.47s]
Epoch 1: 27%|██▋ | 3293/12384 [6:59:07<19:21:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.47s]
Epoch 1: 27%|██▋ | 3293/12384 [6:59:15<19:21:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 1: 27%|██▋ | 3294/12384 [6:59:15<19:19:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 1: 27%|██▋ | 3294/12384 [6:59:23<19:19:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 27%|██▋ | 3295/12384 [6:59:23<19:16:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 27%|██▋ | 3295/12384 [6:59:30<19:16:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 27%|██▋ | 3296/12384 [6:59:30<19:16:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 27%|██▋ | 3296/12384 [6:59:38<19:16:16, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.38s]
Epoch 1: 27%|██▋ | 3297/12384 [6:59:38<19:16:55, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.38s]
Epoch 1: 27%|██▋ | 3297/12384 [6:59:46<19:16:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 1: 27%|██▋ | 3298/12384 [6:59:46<19:15:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 1: 27%|██▋ | 3298/12384 [6:59:53<19:15:38, 7.63s/it, loss=0.0002, acc=0.9998, iter_time=7.06s]
Epoch 1: 27%|██▋ | 3299/12384 [6:59:53<19:13:31, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=7.06s]
Epoch 1: 27%|██▋ | 3299/12384 [7:00:01<19:13:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 1: 27%|██▋ | 3300/12384 [7:00:01<19:13:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 1: 27%|██▋ | 3300/12384 [7:00:08<19:13:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 1: 27%|██▋ | 3301/12384 [7:00:08<19:13:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 1: 27%|██▋ | 3301/12384 [7:00:16<19:13:39, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 27%|██▋ | 3302/12384 [7:00:16<19:13:06, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 27%|██▋ | 3302/12384 [7:00:24<19:13:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 27%|██▋ | 3303/12384 [7:00:24<19:13:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 27%|██▋ | 3303/12384 [7:00:31<19:13:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 27%|██▋ | 3304/12384 [7:00:31<19:12:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 27%|██▋ | 3304/12384 [7:00:39<19:12:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 27%|██▋ | 3305/12384 [7:00:39<19:11:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 27%|██▋ | 3305/12384 [7:00:46<19:11:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 27%|██▋ | 3306/12384 [7:00:46<19:10:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 27%|██▋ | 3306/12384 [7:00:54<19:10:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 1: 27%|██▋ | 3307/12384 [7:00:54<19:11:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 1: 27%|██▋ | 3307/12384 [7:01:02<19:11:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 1: 27%|██▋ | 3308/12384 [7:01:02<19:09:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 1: 27%|██▋ | 3308/12384 [7:01:09<19:09:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.86s]
Epoch 1: 27%|██▋ | 3309/12384 [7:01:09<19:10:05, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.86s]
Epoch 1: 27%|██▋ | 3309/12384 [7:01:17<19:10:05, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 27%|██▋ | 3310/12384 [7:01:17<19:09:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 27%|██▋ | 3310/12384 [7:01:24<19:09:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 27%|██▋ | 3311/12384 [7:01:24<19:09:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 27%|██▋ | 3311/12384 [7:01:32<19:09:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 27%|██▋ | 3312/12384 [7:01:32<19:09:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 27%|██▋ | 3312/12384 [7:01:40<19:09:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 27%|██▋ | 3313/12384 [7:01:40<19:09:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 27%|██▋ | 3313/12384 [7:01:47<19:09:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 27%|██▋ | 3314/12384 [7:01:47<19:10:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 27%|██▋ | 3314/12384 [7:01:55<19:10:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 27%|██▋ | 3315/12384 [7:01:55<19:09:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 27%|██▋ | 3315/12384 [7:02:02<19:09:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 1: 27%|██▋ | 3316/12384 [7:02:02<19:12:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 1: 27%|██▋ | 3316/12384 [7:02:10<19:12:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 27%|██▋ | 3317/12384 [7:02:10<19:26:09, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 27%|██▋ | 3317/12384 [7:02:18<19:26:09, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 1: 27%|██▋ | 3318/12384 [7:02:18<19:21:33, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 1: 27%|██▋ | 3318/12384 [7:02:26<19:21:33, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.53s]
Epoch 1: 27%|██▋ | 3319/12384 [7:02:26<19:18:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.53s]
Epoch 1: 27%|██▋ | 3319/12384 [7:02:33<19:18:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.95s]
Epoch 1: 27%|██▋ | 3320/12384 [7:02:33<19:15:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.95s]
Epoch 1: 27%|██▋ | 3320/12384 [7:02:41<19:15:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 27%|██▋ | 3321/12384 [7:02:41<19:13:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 27%|██▋ | 3321/12384 [7:02:48<19:13:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 27%|██▋ | 3322/12384 [7:02:48<19:12:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 27%|██▋ | 3322/12384 [7:02:56<19:12:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 27%|██▋ | 3323/12384 [7:02:56<19:10:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 27%|██▋ | 3323/12384 [7:03:04<19:10:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 27%|██▋ | 3324/12384 [7:03:04<19:09:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 27%|██▋ | 3324/12384 [7:03:11<19:09:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 27%|██▋ | 3325/12384 [7:03:11<19:08:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 27%|██▋ | 3325/12384 [7:03:19<19:08:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 1: 27%|██▋ | 3326/12384 [7:03:19<19:08:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 1: 27%|██▋ | 3326/12384 [7:03:26<19:08:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.41s]
Epoch 1: 27%|██▋ | 3327/12384 [7:03:26<19:08:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.41s]
Epoch 1: 27%|██▋ | 3327/12384 [7:03:34<19:08:20, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.54s]
Epoch 1: 27%|██▋ | 3328/12384 [7:03:34<19:06:57, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=9.54s]
Epoch 1: 27%|██▋ | 3328/12384 [7:03:42<19:06:57, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 27%|██▋ | 3329/12384 [7:03:42<19:07:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 27%|██▋ | 3329/12384 [7:03:49<19:07:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.60s]
Epoch 1: 27%|██▋ | 3330/12384 [7:03:49<19:08:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.60s]
Epoch 1: 27%|██▋ | 3330/12384 [7:03:57<19:08:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.66s]
Epoch 1: 27%|██▋ | 3331/12384 [7:03:57<19:07:23, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.66s]
Epoch 1: 27%|██▋ | 3331/12384 [7:04:05<19:07:23, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 1: 27%|██▋ | 3332/12384 [7:04:05<19:07:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 1: 27%|██▋ | 3332/12384 [7:04:12<19:07:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 1: 27%|██▋ | 3333/12384 [7:04:12<19:19:22, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 1: 27%|██▋ | 3333/12384 [7:04:20<19:19:22, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 27%|██▋ | 3334/12384 [7:04:20<19:15:28, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 27%|██▋ | 3334/12384 [7:04:28<19:15:28, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 1: 27%|██▋ | 3335/12384 [7:04:28<19:13:15, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 1: 27%|██▋ | 3335/12384 [7:04:35<19:13:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 27%|██▋ | 3336/12384 [7:04:35<19:11:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 27%|██▋ | 3336/12384 [7:04:43<19:11:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 27%|██▋ | 3337/12384 [7:04:43<19:10:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 27%|██▋ | 3337/12384 [7:04:50<19:10:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 27%|██▋ | 3338/12384 [7:04:50<19:09:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 27%|██▋ | 3338/12384 [7:04:58<19:09:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 1: 27%|██▋ | 3339/12384 [7:04:58<19:08:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 1: 27%|██▋ | 3339/12384 [7:05:06<19:08:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 1: 27%|██▋ | 3340/12384 [7:05:06<19:12:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 1: 27%|██▋ | 3340/12384 [7:05:13<19:12:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 1: 27%|██▋ | 3341/12384 [7:05:13<19:10:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 1: 27%|██▋ | 3341/12384 [7:05:21<19:10:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 1: 27%|██▋ | 3342/12384 [7:05:21<19:10:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 1: 27%|██▋ | 3342/12384 [7:05:29<19:10:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.15s]
Epoch 1: 27%|██▋ | 3343/12384 [7:05:29<19:09:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.15s]
Epoch 1: 27%|██▋ | 3343/12384 [7:05:37<19:09:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 1: 27%|██▋ | 3344/12384 [7:05:37<19:23:36, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 1: 27%|██▋ | 3344/12384 [7:05:44<19:23:36, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 1: 27%|██▋ | 3345/12384 [7:05:44<19:18:25, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 1: 27%|██▋ | 3345/12384 [7:05:52<19:18:25, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 1: 27%|██▋ | 3346/12384 [7:05:52<19:13:50, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 1: 27%|██▋ | 3346/12384 [7:05:59<19:13:50, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 1: 27%|██▋ | 3347/12384 [7:05:59<19:10:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 1: 27%|██▋ | 3347/12384 [7:06:07<19:10:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 27%|██▋ | 3348/12384 [7:06:07<19:09:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 27%|██▋ | 3348/12384 [7:06:15<19:09:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 27%|██▋ | 3349/12384 [7:06:15<19:08:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 27%|██▋ | 3349/12384 [7:06:22<19:08:25, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.61s]
Epoch 1: 27%|██▋ | 3350/12384 [7:06:22<19:08:38, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.61s]
Epoch 1: 27%|██▋ | 3350/12384 [7:06:30<19:08:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.88s]
Epoch 1: 27%|██▋ | 3351/12384 [7:06:30<19:08:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.88s]
Epoch 1: 27%|██▋ | 3351/12384 [7:06:37<19:08:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.29s]
Epoch 1: 27%|██▋ | 3352/12384 [7:06:37<19:06:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.29s]
Epoch 1: 27%|██▋ | 3352/12384 [7:06:45<19:06:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 1: 27%|██▋ | 3353/12384 [7:06:45<19:05:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 1: 27%|██▋ | 3353/12384 [7:06:53<19:05:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 1: 27%|██▋ | 3354/12384 [7:06:53<19:03:43, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 1: 27%|██▋ | 3354/12384 [7:07:00<19:03:43, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.29s]
Epoch 1: 27%|██▋ | 3355/12384 [7:07:00<19:04:17, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.29s]
Epoch 1: 27%|██▋ | 3355/12384 [7:07:08<19:04:17, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 1: 27%|██▋ | 3356/12384 [7:07:08<19:03:43, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 1: 27%|██▋ | 3356/12384 [7:07:15<19:03:43, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 27%|██▋ | 3357/12384 [7:07:15<19:03:05, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 27%|██▋ | 3357/12384 [7:07:23<19:03:05, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 27%|██▋ | 3358/12384 [7:07:23<19:03:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 27%|██▋ | 3358/12384 [7:07:31<19:03:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 1: 27%|██▋ | 3359/12384 [7:07:31<19:03:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 1: 27%|██▋ | 3359/12384 [7:07:39<19:03:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.81s]
Epoch 1: 27%|██▋ | 3360/12384 [7:07:39<19:17:33, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.81s]
Epoch 1: 27%|██▋ | 3360/12384 [7:07:46<19:17:33, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 27%|██▋ | 3361/12384 [7:07:46<19:13:47, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 27%|██▋ | 3361/12384 [7:07:54<19:13:47, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 27%|██▋ | 3362/12384 [7:07:54<19:10:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 27%|██▋ | 3362/12384 [7:08:01<19:10:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 27%|██▋ | 3363/12384 [7:08:01<19:11:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 27%|██▋ | 3363/12384 [7:08:09<19:11:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 27%|██▋ | 3364/12384 [7:08:09<19:08:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 27%|██▋ | 3364/12384 [7:08:17<19:08:51, 7.64s/it, loss=0.0001, acc=0.9989, iter_time=7.61s]
Epoch 1: 27%|██▋ | 3365/12384 [7:08:17<19:07:10, 7.63s/it, loss=0.0001, acc=0.9989, iter_time=7.61s]
Epoch 1: 27%|██▋ | 3365/12384 [7:08:24<19:07:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 27%|██▋ | 3366/12384 [7:08:24<19:06:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 27%|██▋ | 3366/12384 [7:08:32<19:06:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 27%|██▋ | 3367/12384 [7:08:32<19:05:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 27%|██▋ | 3367/12384 [7:08:39<19:05:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 27%|██▋ | 3368/12384 [7:08:39<19:05:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 27%|██▋ | 3368/12384 [7:08:47<19:05:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.29s]
Epoch 1: 27%|██▋ | 3369/12384 [7:08:47<19:03:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.29s]
Epoch 1: 27%|██▋ | 3369/12384 [7:08:55<19:03:55, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.37s]
Epoch 1: 27%|██▋ | 3370/12384 [7:08:55<19:18:52, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=10.37s]
Epoch 1: 27%|██▋ | 3370/12384 [7:09:03<19:18:52, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 1: 27%|██▋ | 3371/12384 [7:09:03<19:14:14, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 1: 27%|██▋ | 3371/12384 [7:09:10<19:14:14, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.02s]
Epoch 1: 27%|██▋ | 3372/12384 [7:09:10<19:10:28, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.02s]
Epoch 1: 27%|██▋ | 3372/12384 [7:09:18<19:10:28, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 1: 27%|██▋ | 3373/12384 [7:09:18<19:08:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 1: 27%|██▋ | 3373/12384 [7:09:25<19:08:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 1: 27%|██▋ | 3374/12384 [7:09:25<19:07:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 1: 27%|██▋ | 3374/12384 [7:09:33<19:07:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 27%|██▋ | 3375/12384 [7:09:33<19:05:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 27%|██▋ | 3375/12384 [7:09:41<19:05:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 1: 27%|██▋ | 3376/12384 [7:09:41<19:05:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 1: 27%|██▋ | 3376/12384 [7:09:48<19:05:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 27%|██▋ | 3377/12384 [7:09:48<19:03:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 27%|██▋ | 3377/12384 [7:09:56<19:03:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 27%|██▋ | 3378/12384 [7:09:56<19:03:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 27%|██▋ | 3378/12384 [7:10:04<19:03:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 27%|██▋ | 3379/12384 [7:10:04<19:02:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 27%|██▋ | 3379/12384 [7:10:11<19:02:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 27%|██▋ | 3380/12384 [7:10:11<19:02:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 27%|██▋ | 3380/12384 [7:10:19<19:02:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 27%|██▋ | 3381/12384 [7:10:19<19:01:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 27%|██▋ | 3381/12384 [7:10:26<19:01:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 27%|██▋ | 3382/12384 [7:10:26<19:01:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 27%|██▋ | 3382/12384 [7:10:34<19:01:48, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.61s]
Epoch 1: 27%|██▋ | 3383/12384 [7:10:34<19:00:41, 7.60s/it, loss=0.0002, acc=1.0000, iter_time=7.61s]
Epoch 1: 27%|██▋ | 3383/12384 [7:10:42<19:00:41, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 27%|██▋ | 3384/12384 [7:10:42<19:00:02, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 27%|██▋ | 3384/12384 [7:10:49<19:00:02, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 1: 27%|██▋ | 3385/12384 [7:10:49<18:59:31, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 1: 27%|██▋ | 3385/12384 [7:10:57<18:59:31, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.01s]
Epoch 1: 27%|██▋ | 3386/12384 [7:10:57<19:13:21, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.01s]
Epoch 1: 27%|██▋ | 3386/12384 [7:11:05<19:13:21, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 27%|██▋ | 3387/12384 [7:11:05<19:09:15, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 27%|██▋ | 3387/12384 [7:11:12<19:09:15, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 27%|██▋ | 3388/12384 [7:11:12<19:06:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 27%|██▋ | 3388/12384 [7:11:20<19:06:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 27%|██▋ | 3389/12384 [7:11:20<19:12:17, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 27%|██▋ | 3389/12384 [7:11:28<19:12:17, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.55s]
Epoch 1: 27%|██▋ | 3390/12384 [7:11:28<19:09:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.55s]
Epoch 1: 27%|██▋ | 3390/12384 [7:11:35<19:09:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.75s]
Epoch 1: 27%|██▋ | 3391/12384 [7:11:35<19:07:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.75s]
Epoch 1: 27%|██▋ | 3391/12384 [7:11:43<19:07:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 1: 27%|██▋ | 3392/12384 [7:11:43<19:04:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 1: 27%|██▋ | 3392/12384 [7:11:51<19:04:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.70s]
Epoch 1: 27%|██▋ | 3393/12384 [7:11:51<19:06:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.70s]
Epoch 1: 27%|██▋ | 3393/12384 [7:11:58<19:06:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 1: 27%|██▋ | 3394/12384 [7:11:58<19:03:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 1: 27%|██▋ | 3394/12384 [7:12:06<19:03:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 27%|██▋ | 3395/12384 [7:12:06<19:06:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 27%|██▋ | 3395/12384 [7:12:13<19:06:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 27%|██▋ | 3396/12384 [7:12:13<19:04:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 27%|██▋ | 3396/12384 [7:12:21<19:04:50, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=7.68s]
Epoch 1: 27%|██▋ | 3397/12384 [7:12:21<19:17:13, 7.73s/it, loss=0.0001, acc=0.9998, iter_time=7.68s]
Epoch 1: 27%|██▋ | 3397/12384 [7:12:29<19:17:13, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 1: 27%|██▋ | 3398/12384 [7:12:29<19:10:48, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 1: 27%|██▋ | 3398/12384 [7:12:37<19:10:48, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 27%|██▋ | 3399/12384 [7:12:37<19:07:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 27%|██▋ | 3399/12384 [7:12:44<19:07:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 27%|██▋ | 3400/12384 [7:12:44<19:05:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 27%|██▋ | 3400/12384 [7:12:52<19:05:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 27%|██▋ | 3401/12384 [7:12:52<19:02:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 27%|██▋ | 3401/12384 [7:12:59<19:02:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 1: 27%|██▋ | 3402/12384 [7:12:59<19:01:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 1: 27%|██▋ | 3402/12384 [7:13:07<19:01:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 1: 27%|██▋ | 3403/12384 [7:13:07<19:01:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 1: 27%|██▋ | 3403/12384 [7:13:15<19:01:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 27%|██▋ | 3404/12384 [7:13:15<19:00:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 27%|██▋ | 3404/12384 [7:13:22<19:00:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 27%|██▋ | 3405/12384 [7:13:22<19:00:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 27%|██▋ | 3405/12384 [7:13:30<19:00:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 28%|██▊ | 3406/12384 [7:13:30<19:00:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 28%|██▊ | 3406/12384 [7:13:37<19:00:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 1: 28%|██▊ | 3407/12384 [7:13:37<18:59:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 1: 28%|██▊ | 3407/12384 [7:13:45<18:59:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.33s]
Epoch 1: 28%|██▊ | 3408/12384 [7:13:45<18:59:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.33s]
Epoch 1: 28%|██▊ | 3408/12384 [7:13:53<18:59:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 1: 28%|██▊ | 3409/12384 [7:13:53<18:58:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 1: 28%|██▊ | 3409/12384 [7:14:00<18:58:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 28%|██▊ | 3410/12384 [7:14:00<18:57:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 28%|██▊ | 3410/12384 [7:14:08<18:57:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 1: 28%|██▊ | 3411/12384 [7:14:08<18:57:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 1: 28%|██▊ | 3411/12384 [7:14:16<18:57:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 1: 28%|██▊ | 3412/12384 [7:14:16<18:58:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 1: 28%|██▊ | 3412/12384 [7:14:23<18:58:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 1: 28%|██▊ | 3413/12384 [7:14:23<18:57:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 1: 28%|██▊ | 3413/12384 [7:14:31<18:57:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 28%|██▊ | 3414/12384 [7:14:31<18:57:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 28%|██▊ | 3414/12384 [7:14:38<18:57:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 28%|██▊ | 3415/12384 [7:14:38<18:56:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 28%|██▊ | 3415/12384 [7:14:46<18:56:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.21s]
Epoch 1: 28%|██▊ | 3416/12384 [7:14:46<18:56:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.21s]
Epoch 1: 28%|██▊ | 3416/12384 [7:14:54<18:56:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 28%|██▊ | 3417/12384 [7:14:54<18:56:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 28%|██▊ | 3417/12384 [7:15:01<18:56:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 28%|██▊ | 3418/12384 [7:15:01<18:56:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 28%|██▊ | 3418/12384 [7:15:09<18:56:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 28%|██▊ | 3419/12384 [7:15:09<18:56:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 28%|██▊ | 3419/12384 [7:15:16<18:56:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 28%|██▊ | 3420/12384 [7:15:16<18:56:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 28%|██▊ | 3420/12384 [7:15:24<18:56:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 28%|██▊ | 3421/12384 [7:15:24<18:56:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 28%|██▊ | 3421/12384 [7:15:32<18:56:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 1: 28%|██▊ | 3422/12384 [7:15:32<18:58:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 1: 28%|██▊ | 3422/12384 [7:15:40<18:58:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 28%|██▊ | 3423/12384 [7:15:40<19:13:05, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 28%|██▊ | 3423/12384 [7:15:47<19:13:05, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 1: 28%|██▊ | 3424/12384 [7:15:47<19:06:49, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 1: 28%|██▊ | 3424/12384 [7:15:55<19:06:49, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 1: 28%|██▊ | 3425/12384 [7:15:55<19:03:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 1: 28%|██▊ | 3425/12384 [7:16:02<19:03:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 1: 28%|██▊ | 3426/12384 [7:16:02<19:01:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 1: 28%|██▊ | 3426/12384 [7:16:10<19:01:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 28%|██▊ | 3427/12384 [7:16:10<19:00:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 28%|██▊ | 3427/12384 [7:16:18<19:00:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 1: 28%|██▊ | 3428/12384 [7:16:18<18:59:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 1: 28%|██▊ | 3428/12384 [7:16:25<18:59:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 1: 28%|██▊ | 3429/12384 [7:16:25<18:57:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 1: 28%|██▊ | 3429/12384 [7:16:33<18:57:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.56s]
Epoch 1: 28%|██▊ | 3430/12384 [7:16:33<18:55:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.56s]
Epoch 1: 28%|██▊ | 3430/12384 [7:16:40<18:55:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.60s]
Epoch 1: 28%|██▊ | 3431/12384 [7:16:40<18:56:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.60s]
Epoch 1: 28%|██▊ | 3431/12384 [7:16:48<18:56:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 28%|██▊ | 3432/12384 [7:16:48<18:55:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 28%|██▊ | 3432/12384 [7:16:56<18:55:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.47s]
Epoch 1: 28%|██▊ | 3433/12384 [7:16:56<18:55:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.47s]
Epoch 1: 28%|██▊ | 3433/12384 [7:17:03<18:55:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 1: 28%|██▊ | 3434/12384 [7:17:03<18:58:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 1: 28%|██▊ | 3434/12384 [7:17:11<18:58:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 28%|██▊ | 3435/12384 [7:17:11<18:57:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 28%|██▊ | 3435/12384 [7:17:19<18:57:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 1: 28%|██▊ | 3436/12384 [7:17:19<18:57:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 1: 28%|██▊ | 3436/12384 [7:17:26<18:57:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 1: 28%|██▊ | 3437/12384 [7:17:26<18:58:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 1: 28%|██▊ | 3437/12384 [7:17:34<18:58:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 28%|██▊ | 3438/12384 [7:17:34<18:57:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 28%|██▊ | 3438/12384 [7:17:42<18:57:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 1: 28%|██▊ | 3439/12384 [7:17:42<19:09:05, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 1: 28%|██▊ | 3439/12384 [7:17:49<19:09:05, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 28%|██▊ | 3440/12384 [7:17:49<19:03:59, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 28%|██▊ | 3440/12384 [7:17:57<19:03:59, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=5.21s]
Epoch 1: 28%|██▊ | 3441/12384 [7:17:57<19:00:14, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=5.21s]
Epoch 1: 28%|██▊ | 3441/12384 [7:18:05<19:00:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 1: 28%|██▊ | 3442/12384 [7:18:05<18:58:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 1: 28%|██▊ | 3442/12384 [7:18:12<18:58:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 28%|██▊ | 3443/12384 [7:18:12<18:57:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 28%|██▊ | 3443/12384 [7:18:20<18:57:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 1: 28%|██▊ | 3444/12384 [7:18:20<18:54:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 1: 28%|██▊ | 3444/12384 [7:18:27<18:54:56, 7.62s/it, loss=0.0019, acc=0.9948, iter_time=10.87s]
Epoch 1: 28%|██▊ | 3445/12384 [7:18:27<18:53:49, 7.61s/it, loss=0.0019, acc=0.9948, iter_time=10.87s]
Epoch 1: 28%|██▊ | 3445/12384 [7:18:35<18:53:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 1: 28%|██▊ | 3446/12384 [7:18:35<18:52:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 1: 28%|██▊ | 3446/12384 [7:18:43<18:52:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 1: 28%|██▊ | 3447/12384 [7:18:43<18:52:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 1: 28%|██▊ | 3447/12384 [7:18:50<18:52:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 28%|██▊ | 3448/12384 [7:18:50<18:52:08, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 28%|██▊ | 3448/12384 [7:18:58<18:52:08, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 28%|██▊ | 3449/12384 [7:18:58<19:07:25, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 28%|██▊ | 3449/12384 [7:19:06<19:07:25, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 28%|██▊ | 3450/12384 [7:19:06<19:02:16, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 28%|██▊ | 3450/12384 [7:19:13<19:02:16, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 28%|██▊ | 3451/12384 [7:19:13<18:58:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 28%|██▊ | 3451/12384 [7:19:21<18:58:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 1: 28%|██▊ | 3452/12384 [7:19:21<18:56:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 1: 28%|██▊ | 3452/12384 [7:19:29<18:56:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 1: 28%|██▊ | 3453/12384 [7:19:29<19:00:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 1: 28%|██▊ | 3453/12384 [7:19:36<19:00:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.08s]
Epoch 1: 28%|██▊ | 3454/12384 [7:19:36<18:59:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.08s]
Epoch 1: 28%|██▊ | 3454/12384 [7:19:44<18:59:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 28%|██▊ | 3455/12384 [7:19:44<18:59:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 28%|██▊ | 3455/12384 [7:19:52<18:59:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 28%|██▊ | 3456/12384 [7:19:52<18:57:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 28%|██▊ | 3456/12384 [7:19:59<18:57:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.37s]
Epoch 1: 28%|██▊ | 3457/12384 [7:19:59<18:56:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.37s]
Epoch 1: 28%|██▊ | 3457/12384 [7:20:07<18:56:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 1: 28%|██▊ | 3458/12384 [7:20:07<19:00:27, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 1: 28%|██▊ | 3458/12384 [7:20:15<19:00:27, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 1: 28%|██▊ | 3459/12384 [7:20:15<18:59:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 1: 28%|██▊ | 3459/12384 [7:20:22<18:59:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 28%|██▊ | 3460/12384 [7:20:22<18:56:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 28%|██▊ | 3460/12384 [7:20:30<18:56:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 1: 28%|██▊ | 3461/12384 [7:20:30<18:57:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 1: 28%|██▊ | 3461/12384 [7:20:37<18:57:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 28%|██▊ | 3462/12384 [7:20:37<18:56:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 28%|██▊ | 3462/12384 [7:20:45<18:56:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 1: 28%|██▊ | 3463/12384 [7:20:45<18:55:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 1: 28%|██▊ | 3463/12384 [7:20:53<18:55:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 28%|██▊ | 3464/12384 [7:20:53<18:56:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 28%|██▊ | 3464/12384 [7:21:00<18:56:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.69s]
Epoch 1: 28%|██▊ | 3465/12384 [7:21:00<18:57:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.69s]
Epoch 1: 28%|██▊ | 3465/12384 [7:21:08<18:57:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 1: 28%|██▊ | 3466/12384 [7:21:08<18:59:22, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 1: 28%|██▊ | 3466/12384 [7:21:16<18:59:22, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.19s]
Epoch 1: 28%|██▊ | 3467/12384 [7:21:16<18:57:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.19s]
Epoch 1: 28%|██▊ | 3467/12384 [7:21:23<18:57:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 1: 28%|██▊ | 3468/12384 [7:21:23<18:57:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 1: 28%|██▊ | 3468/12384 [7:21:31<18:57:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 28%|██▊ | 3469/12384 [7:21:31<18:53:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 28%|██▊ | 3469/12384 [7:21:39<18:53:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 28%|██▊ | 3470/12384 [7:21:39<18:53:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 28%|██▊ | 3470/12384 [7:21:46<18:53:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 28%|██▊ | 3471/12384 [7:21:46<18:52:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 28%|██▊ | 3471/12384 [7:21:54<18:52:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 28%|██▊ | 3472/12384 [7:21:54<18:52:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 28%|██▊ | 3472/12384 [7:22:01<18:52:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 28%|██▊ | 3473/12384 [7:22:01<18:51:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 28%|██▊ | 3473/12384 [7:22:09<18:51:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 1: 28%|██▊ | 3474/12384 [7:22:09<18:51:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 1: 28%|██▊ | 3474/12384 [7:22:17<18:51:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 28%|██▊ | 3475/12384 [7:22:17<19:06:16, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 28%|██▊ | 3475/12384 [7:22:25<19:06:16, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 28%|██▊ | 3476/12384 [7:22:25<19:01:41, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 28%|██▊ | 3476/12384 [7:22:32<19:01:41, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 1: 28%|██▊ | 3477/12384 [7:22:32<18:56:44, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 1: 28%|██▊ | 3477/12384 [7:22:40<18:56:44, 7.66s/it, loss=0.0002, acc=0.9988, iter_time=8.45s]
Epoch 1: 28%|██▊ | 3478/12384 [7:22:40<18:54:22, 7.64s/it, loss=0.0002, acc=0.9988, iter_time=8.45s]
Epoch 1: 28%|██▊ | 3478/12384 [7:22:47<18:54:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 1: 28%|██▊ | 3479/12384 [7:22:47<18:52:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 1: 28%|██▊ | 3479/12384 [7:22:55<18:52:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 28%|██▊ | 3480/12384 [7:22:55<18:51:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 28%|██▊ | 3480/12384 [7:23:03<18:51:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.92s]
Epoch 1: 28%|██▊ | 3481/12384 [7:23:03<18:53:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.92s]
Epoch 1: 28%|██▊ | 3481/12384 [7:23:10<18:53:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.00s]
Epoch 1: 28%|██▊ | 3482/12384 [7:23:10<18:59:52, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=11.00s]
Epoch 1: 28%|██▊ | 3482/12384 [7:23:18<18:59:52, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.76s]
Epoch 1: 28%|██▊ | 3483/12384 [7:23:18<18:56:23, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.76s]
Epoch 1: 28%|██▊ | 3483/12384 [7:23:26<18:56:23, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 1: 28%|██▊ | 3484/12384 [7:23:26<18:53:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 1: 28%|██▊ | 3484/12384 [7:23:33<18:53:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.72s]
Epoch 1: 28%|██▊ | 3485/12384 [7:23:33<18:52:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.72s]
Epoch 1: 28%|██▊ | 3485/12384 [7:23:41<18:52:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 28%|██▊ | 3486/12384 [7:23:41<18:51:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 28%|██▊ | 3486/12384 [7:23:49<18:51:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 1: 28%|██▊ | 3487/12384 [7:23:49<18:53:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 1: 28%|██▊ | 3487/12384 [7:23:56<18:53:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.66s]
Epoch 1: 28%|██▊ | 3488/12384 [7:23:56<18:53:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.66s]
Epoch 1: 28%|██▊ | 3488/12384 [7:24:04<18:53:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.47s]
Epoch 1: 28%|██▊ | 3489/12384 [7:24:04<18:52:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.47s]
Epoch 1: 28%|██▊ | 3489/12384 [7:24:11<18:52:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 1: 28%|██▊ | 3490/12384 [7:24:11<18:51:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 1: 28%|██▊ | 3490/12384 [7:24:19<18:51:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.94s]
Epoch 1: 28%|██▊ | 3491/12384 [7:24:19<18:52:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.94s]
Epoch 1: 28%|██▊ | 3491/12384 [7:24:27<18:52:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 28%|██▊ | 3492/12384 [7:24:27<18:50:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 28%|██▊ | 3492/12384 [7:24:34<18:50:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 28%|██▊ | 3493/12384 [7:24:34<18:49:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 28%|██▊ | 3493/12384 [7:24:42<18:49:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.85s]
Epoch 1: 28%|██▊ | 3494/12384 [7:24:42<18:52:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.85s]
Epoch 1: 28%|██▊ | 3494/12384 [7:24:50<18:52:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.32s]
Epoch 1: 28%|██▊ | 3495/12384 [7:24:50<18:53:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.32s]
Epoch 1: 28%|██▊ | 3495/12384 [7:24:57<18:53:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 1: 28%|██▊ | 3496/12384 [7:24:57<18:51:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 1: 28%|██▊ | 3496/12384 [7:25:05<18:51:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.16s]
Epoch 1: 28%|██▊ | 3497/12384 [7:25:05<18:58:29, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.16s]
Epoch 1: 28%|██▊ | 3497/12384 [7:25:13<18:58:29, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.31s]
Epoch 1: 28%|██▊ | 3498/12384 [7:25:13<18:57:22, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.31s]
Epoch 1: 28%|██▊ | 3498/12384 [7:25:20<18:57:22, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 1: 28%|██▊ | 3499/12384 [7:25:20<18:55:03, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 1: 28%|██▊ | 3499/12384 [7:25:28<18:55:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 28%|██▊ | 3500/12384 [7:25:28<18:57:53, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 28%|██▊ | 3500/12384 [7:25:36<18:57:53, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.77s]
Epoch 1: 28%|██▊ | 3501/12384 [7:25:36<19:10:36, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=7.77s]
Epoch 1: 28%|██▊ | 3501/12384 [7:25:44<19:10:36, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 1: 28%|██▊ | 3502/12384 [7:25:44<19:05:53, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 1: 28%|██▊ | 3502/12384 [7:25:51<19:05:53, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.86s]
Epoch 1: 28%|██▊ | 3503/12384 [7:25:51<19:00:10, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.86s]
Epoch 1: 28%|██▊ | 3503/12384 [7:25:59<19:00:10, 7.70s/it, loss=0.0002, acc=0.9987, iter_time=8.00s]
Epoch 1: 28%|██▊ | 3504/12384 [7:25:59<18:55:11, 7.67s/it, loss=0.0002, acc=0.9987, iter_time=8.00s]
Epoch 1: 28%|██▊ | 3504/12384 [7:26:07<18:55:11, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.00s]
Epoch 1: 28%|██▊ | 3505/12384 [7:26:07<18:52:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.00s]
Epoch 1: 28%|██▊ | 3505/12384 [7:26:14<18:52:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 28%|██▊ | 3506/12384 [7:26:14<18:49:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 28%|██▊ | 3506/12384 [7:26:22<18:49:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 28%|██▊ | 3507/12384 [7:26:22<18:47:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 28%|██▊ | 3507/12384 [7:26:29<18:47:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 1: 28%|██▊ | 3508/12384 [7:26:29<18:47:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 1: 28%|██▊ | 3508/12384 [7:26:37<18:47:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 1: 28%|██▊ | 3509/12384 [7:26:37<18:49:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 1: 28%|██▊ | 3509/12384 [7:26:45<18:49:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 28%|██▊ | 3510/12384 [7:26:45<18:47:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 28%|██▊ | 3510/12384 [7:26:52<18:47:58, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 28%|██▊ | 3511/12384 [7:26:52<18:47:14, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 28%|██▊ | 3511/12384 [7:27:00<18:47:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 28%|██▊ | 3512/12384 [7:27:00<18:46:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 28%|██▊ | 3512/12384 [7:27:08<18:46:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 28%|██▊ | 3513/12384 [7:27:08<18:47:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 28%|██▊ | 3513/12384 [7:27:15<18:47:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.20s]
Epoch 1: 28%|██▊ | 3514/12384 [7:27:15<18:47:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.20s]
Epoch 1: 28%|██▊ | 3514/12384 [7:27:23<18:47:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 1: 28%|██▊ | 3515/12384 [7:27:23<18:46:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 1: 28%|██▊ | 3515/12384 [7:27:30<18:46:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.11s]
Epoch 1: 28%|██▊ | 3516/12384 [7:27:30<18:48:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.11s]
Epoch 1: 28%|██▊ | 3516/12384 [7:27:38<18:48:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.22s]
Epoch 1: 28%|██▊ | 3517/12384 [7:27:38<18:47:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.22s]
Epoch 1: 28%|██▊ | 3517/12384 [7:27:46<18:47:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 1: 28%|██▊ | 3518/12384 [7:27:46<18:45:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 1: 28%|██▊ | 3518/12384 [7:27:53<18:45:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.49s]
Epoch 1: 28%|██▊ | 3519/12384 [7:27:53<18:50:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.49s]
Epoch 1: 28%|██▊ | 3519/12384 [7:28:01<18:50:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 1: 28%|██▊ | 3520/12384 [7:28:01<18:50:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 1: 28%|██▊ | 3520/12384 [7:28:09<18:50:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.01s]
Epoch 1: 28%|██▊ | 3521/12384 [7:28:09<18:47:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.01s]
Epoch 1: 28%|██▊ | 3521/12384 [7:28:16<18:47:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 1: 28%|██▊ | 3522/12384 [7:28:16<18:45:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 1: 28%|██▊ | 3522/12384 [7:28:24<18:45:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 28%|██▊ | 3523/12384 [7:28:24<18:45:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 28%|██▊ | 3523/12384 [7:28:31<18:45:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 28%|██▊ | 3524/12384 [7:28:31<18:45:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 28%|██▊ | 3524/12384 [7:28:39<18:45:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.18s]
Epoch 1: 28%|██▊ | 3525/12384 [7:28:39<18:45:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.18s]
Epoch 1: 28%|██▊ | 3525/12384 [7:28:47<18:45:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=12.03s]
Epoch 1: 28%|██▊ | 3526/12384 [7:28:47<18:43:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=12.03s]
Epoch 1: 28%|██▊ | 3526/12384 [7:28:54<18:43:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 28%|██▊ | 3527/12384 [7:28:54<18:43:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 28%|██▊ | 3527/12384 [7:29:02<18:43:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.99s]
Epoch 1: 28%|██▊ | 3528/12384 [7:29:02<18:58:05, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.99s]
Epoch 1: 28%|██▊ | 3528/12384 [7:29:10<18:58:05, 7.71s/it, loss=0.0002, acc=1.0000, iter_time=7.18s]
Epoch 1: 28%|██▊ | 3529/12384 [7:29:10<18:52:31, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=7.18s]
Epoch 1: 28%|██▊ | 3529/12384 [7:29:17<18:52:31, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 29%|██▊ | 3530/12384 [7:29:17<18:49:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 29%|██▊ | 3530/12384 [7:29:25<18:49:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 29%|██▊ | 3531/12384 [7:29:25<18:47:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 29%|██▊ | 3531/12384 [7:29:33<18:47:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 1: 29%|██▊ | 3532/12384 [7:29:33<18:46:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 1: 29%|██▊ | 3532/12384 [7:29:40<18:46:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 1: 29%|██▊ | 3533/12384 [7:29:40<18:45:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 1: 29%|██▊ | 3533/12384 [7:29:48<18:45:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 29%|██▊ | 3534/12384 [7:29:48<18:43:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 29%|██▊ | 3534/12384 [7:29:55<18:43:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 1: 29%|██▊ | 3535/12384 [7:29:55<18:42:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 1: 29%|██▊ | 3535/12384 [7:30:03<18:42:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.08s]
Epoch 1: 29%|██▊ | 3536/12384 [7:30:03<18:43:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.08s]
Epoch 1: 29%|██▊ | 3536/12384 [7:30:11<18:43:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 29%|██▊ | 3537/12384 [7:30:11<18:42:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 29%|██▊ | 3537/12384 [7:30:18<18:42:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 29%|██▊ | 3538/12384 [7:30:18<18:42:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 29%|██▊ | 3538/12384 [7:30:26<18:42:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 29%|██▊ | 3539/12384 [7:30:26<18:42:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 29%|██▊ | 3539/12384 [7:30:34<18:42:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 29%|██▊ | 3540/12384 [7:30:34<18:42:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 29%|██▊ | 3540/12384 [7:30:41<18:42:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.62s]
Epoch 1: 29%|██▊ | 3541/12384 [7:30:41<18:44:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.62s]
Epoch 1: 29%|██▊ | 3541/12384 [7:30:49<18:44:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.63s]
Epoch 1: 29%|██▊ | 3542/12384 [7:30:49<18:43:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.63s]
Epoch 1: 29%|██▊ | 3542/12384 [7:30:56<18:43:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 29%|██▊ | 3543/12384 [7:30:56<18:43:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 29%|██▊ | 3543/12384 [7:31:04<18:43:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 29%|██▊ | 3544/12384 [7:31:04<18:41:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 29%|██▊ | 3544/12384 [7:31:12<18:41:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 29%|██▊ | 3545/12384 [7:31:12<18:42:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 29%|██▊ | 3545/12384 [7:31:19<18:42:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 29%|██▊ | 3546/12384 [7:31:19<18:41:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 29%|██▊ | 3546/12384 [7:31:27<18:41:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 29%|██▊ | 3547/12384 [7:31:27<18:41:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 29%|██▊ | 3547/12384 [7:31:34<18:41:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 1: 29%|██▊ | 3548/12384 [7:31:34<18:40:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 1: 29%|██▊ | 3548/12384 [7:31:42<18:40:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 1: 29%|██▊ | 3549/12384 [7:31:42<18:41:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 1: 29%|██▊ | 3549/12384 [7:31:50<18:41:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 29%|██▊ | 3550/12384 [7:31:50<18:40:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 29%|██▊ | 3550/12384 [7:31:57<18:40:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 29%|██▊ | 3551/12384 [7:31:57<18:39:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 29%|██▊ | 3551/12384 [7:32:05<18:39:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 29%|██▊ | 3552/12384 [7:32:05<18:39:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 29%|██▊ | 3552/12384 [7:32:12<18:39:42, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 1: 29%|██▊ | 3553/12384 [7:32:12<18:40:03, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 1: 29%|██▊ | 3553/12384 [7:32:20<18:40:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 29%|██▊ | 3554/12384 [7:32:20<18:54:08, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 29%|██▊ | 3554/12384 [7:32:28<18:54:08, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 29%|██▊ | 3555/12384 [7:32:28<18:53:42, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 29%|██▊ | 3555/12384 [7:32:36<18:53:42, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 1: 29%|██▊ | 3556/12384 [7:32:36<18:50:49, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 1: 29%|██▊ | 3556/12384 [7:32:43<18:50:49, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.89s]
Epoch 1: 29%|██▊ | 3557/12384 [7:32:43<18:48:09, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.89s]
Epoch 1: 29%|██▊ | 3557/12384 [7:32:51<18:48:09, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=12.51s]
Epoch 1: 29%|██▊ | 3558/12384 [7:32:51<18:45:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=12.51s]
Epoch 1: 29%|██▊ | 3558/12384 [7:32:59<18:45:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.56s]
Epoch 1: 29%|██▊ | 3559/12384 [7:32:59<18:43:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.56s]
Epoch 1: 29%|██▊ | 3559/12384 [7:33:06<18:43:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 1: 29%|██▊ | 3560/12384 [7:33:06<18:45:50, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 1: 29%|██▊ | 3560/12384 [7:33:14<18:45:50, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 1: 29%|██▉ | 3561/12384 [7:33:14<18:46:31, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 1: 29%|██▉ | 3561/12384 [7:33:22<18:46:31, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=8.49s]
Epoch 1: 29%|██▉ | 3562/12384 [7:33:22<18:43:27, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.49s]
Epoch 1: 29%|██▉ | 3562/12384 [7:33:29<18:43:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 1: 29%|██▉ | 3563/12384 [7:33:29<18:41:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 1: 29%|██▉ | 3563/12384 [7:33:37<18:41:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 29%|██▉ | 3564/12384 [7:33:37<18:41:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 29%|██▉ | 3564/12384 [7:33:44<18:41:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 29%|██▉ | 3565/12384 [7:33:44<18:40:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 29%|██▉ | 3565/12384 [7:33:52<18:40:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 29%|██▉ | 3566/12384 [7:33:52<18:39:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 29%|██▉ | 3566/12384 [7:34:00<18:39:32, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=7.21s]
Epoch 1: 29%|██▉ | 3567/12384 [7:34:00<18:39:36, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=7.21s]
Epoch 1: 29%|██▉ | 3567/12384 [7:34:07<18:39:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 29%|██▉ | 3568/12384 [7:34:07<18:38:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 29%|██▉ | 3568/12384 [7:34:15<18:38:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 1: 29%|██▉ | 3569/12384 [7:34:15<18:38:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 1: 29%|██▉ | 3569/12384 [7:34:23<18:38:06, 7.61s/it, loss=0.0002, acc=0.9996, iter_time=10.23s]
Epoch 1: 29%|██▉ | 3570/12384 [7:34:23<18:50:35, 7.70s/it, loss=0.0002, acc=0.9996, iter_time=10.23s]
Epoch 1: 29%|██▉ | 3570/12384 [7:34:30<18:50:35, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 1: 29%|██▉ | 3571/12384 [7:34:30<18:46:50, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 1: 29%|██▉ | 3571/12384 [7:34:38<18:46:50, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 1: 29%|██▉ | 3572/12384 [7:34:38<18:44:46, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 1: 29%|██▉ | 3572/12384 [7:34:46<18:44:46, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.85s]
Epoch 1: 29%|██▉ | 3573/12384 [7:34:46<18:43:01, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.85s]
Epoch 1: 29%|██▉ | 3573/12384 [7:34:53<18:43:01, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 1: 29%|██▉ | 3574/12384 [7:34:53<18:41:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 1: 29%|██▉ | 3574/12384 [7:35:01<18:41:48, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=10.65s]
Epoch 1: 29%|██▉ | 3575/12384 [7:35:01<18:40:47, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=10.65s]
Epoch 1: 29%|██▉ | 3575/12384 [7:35:08<18:40:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 29%|██▉ | 3576/12384 [7:35:08<18:39:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 29%|██▉ | 3576/12384 [7:35:16<18:39:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 29%|██▉ | 3577/12384 [7:35:16<18:37:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 29%|██▉ | 3577/12384 [7:35:24<18:37:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.72s]
Epoch 1: 29%|██▉ | 3578/12384 [7:35:24<18:37:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.72s]
Epoch 1: 29%|██▉ | 3578/12384 [7:35:31<18:37:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 29%|██▉ | 3579/12384 [7:35:31<18:36:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 29%|██▉ | 3579/12384 [7:35:39<18:36:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 29%|██▉ | 3580/12384 [7:35:39<18:36:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 29%|██▉ | 3580/12384 [7:35:47<18:36:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 29%|██▉ | 3581/12384 [7:35:47<18:50:26, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 29%|██▉ | 3581/12384 [7:35:54<18:50:26, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 29%|██▉ | 3582/12384 [7:35:54<18:46:04, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 29%|██▉ | 3582/12384 [7:36:02<18:46:04, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 29%|██▉ | 3583/12384 [7:36:02<18:42:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 29%|██▉ | 3583/12384 [7:36:10<18:42:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 29%|██▉ | 3584/12384 [7:36:10<18:40:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 29%|██▉ | 3584/12384 [7:36:17<18:40:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 29%|██▉ | 3585/12384 [7:36:17<18:38:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 29%|██▉ | 3585/12384 [7:36:25<18:38:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.00s]
Epoch 1: 29%|██▉ | 3586/12384 [7:36:25<18:37:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.00s]
Epoch 1: 29%|██▉ | 3586/12384 [7:36:32<18:37:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 1: 29%|██▉ | 3587/12384 [7:36:32<18:37:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 1: 29%|██▉ | 3587/12384 [7:36:40<18:37:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 29%|██▉ | 3588/12384 [7:36:40<18:37:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 29%|██▉ | 3588/12384 [7:36:48<18:37:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 29%|██▉ | 3589/12384 [7:36:48<18:37:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 29%|██▉ | 3589/12384 [7:36:55<18:37:17, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 1: 29%|██▉ | 3590/12384 [7:36:55<18:39:07, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 1: 29%|██▉ | 3590/12384 [7:37:03<18:39:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 29%|██▉ | 3591/12384 [7:37:03<18:38:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 29%|██▉ | 3591/12384 [7:37:11<18:38:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 29%|██▉ | 3592/12384 [7:37:11<18:44:02, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 29%|██▉ | 3592/12384 [7:37:18<18:44:02, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 1: 29%|██▉ | 3593/12384 [7:37:18<18:41:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 1: 29%|██▉ | 3593/12384 [7:37:26<18:41:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 1: 29%|██▉ | 3594/12384 [7:37:26<18:39:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 1: 29%|██▉ | 3594/12384 [7:37:34<18:39:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 1: 29%|██▉ | 3595/12384 [7:37:34<18:37:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 1: 29%|██▉ | 3595/12384 [7:37:41<18:37:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 1: 29%|██▉ | 3596/12384 [7:37:41<18:35:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 1: 29%|██▉ | 3596/12384 [7:37:49<18:35:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 1: 29%|██▉ | 3597/12384 [7:37:49<18:47:04, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 1: 29%|██▉ | 3597/12384 [7:37:57<18:47:04, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 29%|██▉ | 3598/12384 [7:37:57<18:43:09, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 29%|██▉ | 3598/12384 [7:38:04<18:43:09, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 29%|██▉ | 3599/12384 [7:38:04<18:40:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 29%|██▉ | 3599/12384 [7:38:12<18:40:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 29%|██▉ | 3600/12384 [7:38:12<18:38:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 29%|██▉ | 3600/12384 [7:38:19<18:38:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 29%|██▉ | 3601/12384 [7:38:19<18:36:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 29%|██▉ | 3601/12384 [7:38:27<18:36:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 29%|██▉ | 3602/12384 [7:38:27<18:35:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 29%|██▉ | 3602/12384 [7:38:35<18:35:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 29%|██▉ | 3603/12384 [7:38:35<18:34:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 29%|██▉ | 3603/12384 [7:38:42<18:34:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.23s]
Epoch 1: 29%|██▉ | 3604/12384 [7:38:42<18:33:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.23s]
Epoch 1: 29%|██▉ | 3604/12384 [7:38:50<18:33:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 1: 29%|██▉ | 3605/12384 [7:38:50<18:34:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 1: 29%|██▉ | 3605/12384 [7:38:58<18:34:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 29%|██▉ | 3606/12384 [7:38:58<18:34:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 29%|██▉ | 3606/12384 [7:39:06<18:34:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 29%|██▉ | 3607/12384 [7:39:06<18:51:49, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 29%|██▉ | 3607/12384 [7:39:13<18:51:49, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 29%|██▉ | 3608/12384 [7:39:13<18:46:53, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 29%|██▉ | 3608/12384 [7:39:21<18:46:53, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 29%|██▉ | 3609/12384 [7:39:21<18:42:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 29%|██▉ | 3609/12384 [7:39:28<18:42:19, 7.67s/it, loss=0.0011, acc=0.9969, iter_time=7.61s]
Epoch 1: 29%|██▉ | 3610/12384 [7:39:28<18:38:57, 7.65s/it, loss=0.0011, acc=0.9969, iter_time=7.61s]
Epoch 1: 29%|██▉ | 3610/12384 [7:39:36<18:38:57, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 29%|██▉ | 3611/12384 [7:39:36<18:38:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 29%|██▉ | 3611/12384 [7:39:44<18:38:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 29%|██▉ | 3612/12384 [7:39:44<18:36:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 29%|██▉ | 3612/12384 [7:39:51<18:36:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 1: 29%|██▉ | 3613/12384 [7:39:51<18:34:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 1: 29%|██▉ | 3613/12384 [7:39:59<18:34:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 1: 29%|██▉ | 3614/12384 [7:39:59<18:34:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 1: 29%|██▉ | 3614/12384 [7:40:06<18:34:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 1: 29%|██▉ | 3615/12384 [7:40:06<18:34:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 1: 29%|██▉ | 3615/12384 [7:40:14<18:34:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.82s]
Epoch 1: 29%|██▉ | 3616/12384 [7:40:14<18:42:29, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.82s]
Epoch 1: 29%|██▉ | 3616/12384 [7:40:22<18:42:29, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 1: 29%|██▉ | 3617/12384 [7:40:22<18:38:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 1: 29%|██▉ | 3617/12384 [7:40:29<18:38:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 29%|██▉ | 3618/12384 [7:40:29<18:35:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 29%|██▉ | 3618/12384 [7:40:37<18:35:44, 7.64s/it, loss=0.0007, acc=0.9981, iter_time=7.59s]
Epoch 1: 29%|██▉ | 3619/12384 [7:40:37<18:34:38, 7.63s/it, loss=0.0007, acc=0.9981, iter_time=7.59s]
Epoch 1: 29%|██▉ | 3619/12384 [7:40:45<18:34:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 29%|██▉ | 3620/12384 [7:40:45<18:33:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 29%|██▉ | 3620/12384 [7:40:52<18:33:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 29%|██▉ | 3621/12384 [7:40:52<18:36:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 29%|██▉ | 3621/12384 [7:41:00<18:36:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 29%|██▉ | 3622/12384 [7:41:00<18:35:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 29%|██▉ | 3622/12384 [7:41:08<18:35:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 29%|██▉ | 3623/12384 [7:41:08<18:33:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 29%|██▉ | 3623/12384 [7:41:15<18:33:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 29%|██▉ | 3624/12384 [7:41:15<18:32:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 29%|██▉ | 3624/12384 [7:41:23<18:32:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 29%|██▉ | 3625/12384 [7:41:23<18:30:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 29%|██▉ | 3625/12384 [7:41:30<18:30:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 29%|██▉ | 3626/12384 [7:41:30<18:35:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 29%|██▉ | 3626/12384 [7:41:38<18:35:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.85s]
Epoch 1: 29%|██▉ | 3627/12384 [7:41:38<18:32:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.85s]
Epoch 1: 29%|██▉ | 3627/12384 [7:41:46<18:32:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.43s]
Epoch 1: 29%|██▉ | 3628/12384 [7:41:46<18:31:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.43s]
Epoch 1: 29%|██▉ | 3628/12384 [7:41:53<18:31:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 29%|██▉ | 3629/12384 [7:41:53<18:30:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 29%|██▉ | 3629/12384 [7:42:01<18:30:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 29%|██▉ | 3630/12384 [7:42:01<18:29:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 29%|██▉ | 3630/12384 [7:42:08<18:29:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 1: 29%|██▉ | 3631/12384 [7:42:08<18:28:42, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 1: 29%|██▉ | 3631/12384 [7:42:16<18:28:42, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 1: 29%|██▉ | 3632/12384 [7:42:16<18:28:40, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 1: 29%|██▉ | 3632/12384 [7:42:24<18:28:40, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 29%|██▉ | 3633/12384 [7:42:24<18:43:01, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 29%|██▉ | 3633/12384 [7:42:32<18:43:01, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.28s]
Epoch 1: 29%|██▉ | 3634/12384 [7:42:32<18:39:17, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.28s]
Epoch 1: 29%|██▉ | 3634/12384 [7:42:39<18:39:17, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=11.23s]
Epoch 1: 29%|██▉ | 3635/12384 [7:42:39<18:35:57, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.23s]
Epoch 1: 29%|██▉ | 3635/12384 [7:42:47<18:35:57, 7.65s/it, loss=0.0003, acc=0.9979, iter_time=4.49s]
Epoch 1: 29%|██▉ | 3636/12384 [7:42:47<18:31:27, 7.62s/it, loss=0.0003, acc=0.9979, iter_time=4.49s]
Epoch 1: 29%|██▉ | 3636/12384 [7:42:54<18:31:27, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.66s]
Epoch 1: 29%|██▉ | 3637/12384 [7:42:54<18:31:22, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.66s]
Epoch 1: 29%|██▉ | 3637/12384 [7:43:02<18:31:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 1: 29%|██▉ | 3638/12384 [7:43:02<18:31:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 1: 29%|██▉ | 3638/12384 [7:43:10<18:31:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 1: 29%|██▉ | 3639/12384 [7:43:10<18:30:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 1: 29%|██▉ | 3639/12384 [7:43:17<18:30:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 29%|██▉ | 3640/12384 [7:43:17<18:29:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 29%|██▉ | 3640/12384 [7:43:25<18:29:48, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.24s]
Epoch 1: 29%|██▉ | 3641/12384 [7:43:25<18:30:01, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.24s]
Epoch 1: 29%|██▉ | 3641/12384 [7:43:32<18:30:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 29%|██▉ | 3642/12384 [7:43:32<18:30:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 29%|██▉ | 3642/12384 [7:43:40<18:30:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 29%|██▉ | 3643/12384 [7:43:40<18:30:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 29%|██▉ | 3643/12384 [7:43:48<18:30:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 29%|██▉ | 3644/12384 [7:43:48<18:29:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 29%|██▉ | 3644/12384 [7:43:55<18:29:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 29%|██▉ | 3645/12384 [7:43:55<18:29:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 29%|██▉ | 3645/12384 [7:44:03<18:29:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 1: 29%|██▉ | 3646/12384 [7:44:03<18:29:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 1: 29%|██▉ | 3646/12384 [7:44:11<18:29:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 1: 29%|██▉ | 3647/12384 [7:44:11<18:29:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 1: 29%|██▉ | 3647/12384 [7:44:18<18:29:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 1: 29%|██▉ | 3648/12384 [7:44:18<18:41:29, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 1: 29%|██▉ | 3648/12384 [7:44:26<18:41:29, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.61s]
Epoch 1: 29%|██▉ | 3649/12384 [7:44:26<18:37:54, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.61s]
Epoch 1: 29%|██▉ | 3649/12384 [7:44:34<18:37:54, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 1: 29%|██▉ | 3650/12384 [7:44:34<18:34:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 1: 29%|██▉ | 3650/12384 [7:44:41<18:34:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 1: 29%|██▉ | 3651/12384 [7:44:41<18:35:18, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 1: 29%|██▉ | 3651/12384 [7:44:49<18:35:18, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.25s]
Epoch 1: 29%|██▉ | 3652/12384 [7:44:49<18:33:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.25s]
Epoch 1: 29%|██▉ | 3652/12384 [7:44:57<18:33:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 1: 29%|██▉ | 3653/12384 [7:44:57<18:32:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 1: 29%|██▉ | 3653/12384 [7:45:04<18:32:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 1: 30%|██▉ | 3654/12384 [7:45:04<18:30:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 1: 30%|██▉ | 3654/12384 [7:45:12<18:30:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 30%|██▉ | 3655/12384 [7:45:12<18:28:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 30%|██▉ | 3655/12384 [7:45:19<18:28:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 30%|██▉ | 3656/12384 [7:45:19<18:28:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 30%|██▉ | 3656/12384 [7:45:27<18:28:38, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.22s]
Epoch 1: 30%|██▉ | 3657/12384 [7:45:27<18:27:42, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.22s]
Epoch 1: 30%|██▉ | 3657/12384 [7:45:35<18:27:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 30%|██▉ | 3658/12384 [7:45:35<18:28:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 30%|██▉ | 3658/12384 [7:45:43<18:28:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 30%|██▉ | 3659/12384 [7:45:43<18:43:14, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 30%|██▉ | 3659/12384 [7:45:50<18:43:14, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 1: 30%|██▉ | 3660/12384 [7:45:50<18:38:51, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 1: 30%|██▉ | 3660/12384 [7:45:58<18:38:51, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 30%|██▉ | 3661/12384 [7:45:58<18:34:30, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 30%|██▉ | 3661/12384 [7:46:05<18:34:30, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 1: 30%|██▉ | 3662/12384 [7:46:05<18:32:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 1: 30%|██▉ | 3662/12384 [7:46:13<18:32:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.13s]
Epoch 1: 30%|██▉ | 3663/12384 [7:46:13<18:30:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.13s]
Epoch 1: 30%|██▉ | 3663/12384 [7:46:21<18:30:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.66s]
Epoch 1: 30%|██▉ | 3664/12384 [7:46:21<18:28:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.66s]
Epoch 1: 30%|██▉ | 3664/12384 [7:46:28<18:28:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 1: 30%|██▉ | 3665/12384 [7:46:28<18:27:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 1: 30%|██▉ | 3665/12384 [7:46:36<18:27:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.24s]
Epoch 1: 30%|██▉ | 3666/12384 [7:46:36<18:26:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.24s]
Epoch 1: 30%|██▉ | 3666/12384 [7:46:43<18:26:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.59s]
Epoch 1: 30%|██▉ | 3667/12384 [7:46:43<18:25:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.59s]
Epoch 1: 30%|██▉ | 3667/12384 [7:46:51<18:25:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 1: 30%|██▉ | 3668/12384 [7:46:51<18:25:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 1: 30%|██▉ | 3668/12384 [7:46:59<18:25:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 30%|██▉ | 3669/12384 [7:46:59<18:25:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 30%|██▉ | 3669/12384 [7:47:06<18:25:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 30%|██▉ | 3670/12384 [7:47:06<18:26:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 30%|██▉ | 3670/12384 [7:47:14<18:26:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 1: 30%|██▉ | 3671/12384 [7:47:14<18:26:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 1: 30%|██▉ | 3671/12384 [7:47:22<18:26:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.05s]
Epoch 1: 30%|██▉ | 3672/12384 [7:47:22<18:25:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.05s]
Epoch 1: 30%|██▉ | 3672/12384 [7:47:29<18:25:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.14s]
Epoch 1: 30%|██▉ | 3673/12384 [7:47:29<18:24:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.14s]
Epoch 1: 30%|██▉ | 3673/12384 [7:47:37<18:24:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 1: 30%|██▉ | 3674/12384 [7:47:37<18:23:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 1: 30%|██▉ | 3674/12384 [7:47:45<18:23:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 30%|██▉ | 3675/12384 [7:47:45<18:36:23, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 30%|██▉ | 3675/12384 [7:47:52<18:36:23, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 1: 30%|██▉ | 3676/12384 [7:47:52<18:32:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 1: 30%|██▉ | 3676/12384 [7:48:00<18:32:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 1: 30%|██▉ | 3677/12384 [7:48:00<18:29:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 1: 30%|██▉ | 3677/12384 [7:48:07<18:29:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 30%|██▉ | 3678/12384 [7:48:07<18:27:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 30%|██▉ | 3678/12384 [7:48:15<18:27:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 30%|██▉ | 3679/12384 [7:48:15<18:26:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 30%|██▉ | 3679/12384 [7:48:23<18:26:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 30%|██▉ | 3680/12384 [7:48:23<18:25:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 30%|██▉ | 3680/12384 [7:48:30<18:25:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 1: 30%|██▉ | 3681/12384 [7:48:30<18:25:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 1: 30%|██▉ | 3681/12384 [7:48:38<18:25:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 1: 30%|██▉ | 3682/12384 [7:48:38<18:25:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 1: 30%|██▉ | 3682/12384 [7:48:46<18:25:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 1: 30%|██▉ | 3683/12384 [7:48:46<18:24:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 1: 30%|██▉ | 3683/12384 [7:48:53<18:24:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 1: 30%|██▉ | 3684/12384 [7:48:53<18:23:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 1: 30%|██▉ | 3684/12384 [7:49:01<18:23:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 30%|██▉ | 3685/12384 [7:49:01<18:36:13, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 30%|██▉ | 3685/12384 [7:49:09<18:36:13, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 30%|██▉ | 3686/12384 [7:49:09<18:32:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 30%|██▉ | 3686/12384 [7:49:16<18:32:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 1: 30%|██▉ | 3687/12384 [7:49:16<18:31:00, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 1: 30%|██▉ | 3687/12384 [7:49:24<18:31:00, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.85s]
Epoch 1: 30%|██▉ | 3688/12384 [7:49:24<18:28:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.85s]
Epoch 1: 30%|██▉ | 3688/12384 [7:49:31<18:28:19, 7.65s/it, loss=0.0014, acc=0.9987, iter_time=7.65s]
Epoch 1: 30%|██▉ | 3689/12384 [7:49:31<18:25:44, 7.63s/it, loss=0.0014, acc=0.9987, iter_time=7.65s]
Epoch 1: 30%|██▉ | 3689/12384 [7:49:39<18:25:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 30%|██▉ | 3690/12384 [7:49:39<18:24:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 30%|██▉ | 3690/12384 [7:49:47<18:24:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 30%|██▉ | 3691/12384 [7:49:47<18:27:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 30%|██▉ | 3691/12384 [7:49:54<18:27:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 30%|██▉ | 3692/12384 [7:49:54<18:25:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 30%|██▉ | 3692/12384 [7:50:02<18:25:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 30%|██▉ | 3693/12384 [7:50:02<18:24:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 30%|██▉ | 3693/12384 [7:50:10<18:24:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 30%|██▉ | 3694/12384 [7:50:10<18:23:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 30%|██▉ | 3694/12384 [7:50:17<18:23:42, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 1: 30%|██▉ | 3695/12384 [7:50:17<18:22:52, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 1: 30%|██▉ | 3695/12384 [7:50:25<18:22:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 30%|██▉ | 3696/12384 [7:50:25<18:22:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 30%|██▉ | 3696/12384 [7:50:32<18:22:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 1: 30%|██▉ | 3697/12384 [7:50:32<18:24:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 1: 30%|██▉ | 3697/12384 [7:50:40<18:24:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.46s]
Epoch 1: 30%|██▉ | 3698/12384 [7:50:40<18:23:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.46s]
Epoch 1: 30%|██▉ | 3698/12384 [7:50:48<18:23:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 30%|██▉ | 3699/12384 [7:50:48<18:23:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 30%|██▉ | 3699/12384 [7:50:55<18:23:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 30%|██▉ | 3700/12384 [7:50:55<18:21:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 30%|██▉ | 3700/12384 [7:51:03<18:21:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.75s]
Epoch 1: 30%|██▉ | 3701/12384 [7:51:03<18:19:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.75s]
Epoch 1: 30%|██▉ | 3701/12384 [7:51:10<18:19:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 1: 30%|██▉ | 3702/12384 [7:51:10<18:18:55, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 1: 30%|██▉ | 3702/12384 [7:51:18<18:18:55, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 1: 30%|██▉ | 3703/12384 [7:51:18<18:19:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 1: 30%|██▉ | 3703/12384 [7:51:26<18:19:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 1: 30%|██▉ | 3704/12384 [7:51:26<18:21:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 1: 30%|██▉ | 3704/12384 [7:51:33<18:21:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 30%|██▉ | 3705/12384 [7:51:33<18:21:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 30%|██▉ | 3705/12384 [7:51:41<18:21:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 30%|██▉ | 3706/12384 [7:51:41<18:21:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 30%|██▉ | 3706/12384 [7:51:49<18:21:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 30%|██▉ | 3707/12384 [7:51:49<18:21:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 30%|██▉ | 3707/12384 [7:51:56<18:21:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 1: 30%|██▉ | 3708/12384 [7:51:56<18:21:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 1: 30%|██▉ | 3708/12384 [7:52:04<18:21:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 1: 30%|██▉ | 3709/12384 [7:52:04<18:20:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 1: 30%|██▉ | 3709/12384 [7:52:11<18:20:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 30%|██▉ | 3710/12384 [7:52:11<18:19:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 30%|██▉ | 3710/12384 [7:52:19<18:19:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 30%|██▉ | 3711/12384 [7:52:19<18:20:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 30%|██▉ | 3711/12384 [7:52:27<18:20:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 1: 30%|██▉ | 3712/12384 [7:52:27<18:32:26, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 1: 30%|██▉ | 3712/12384 [7:52:35<18:32:26, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 30%|██▉ | 3713/12384 [7:52:35<18:28:41, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 30%|██▉ | 3713/12384 [7:52:42<18:28:41, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 30%|██▉ | 3714/12384 [7:52:42<18:26:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 30%|██▉ | 3714/12384 [7:52:50<18:26:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 30%|██▉ | 3715/12384 [7:52:50<18:24:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 30%|██▉ | 3715/12384 [7:52:57<18:24:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 30%|███ | 3716/12384 [7:52:57<18:22:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 30%|███ | 3716/12384 [7:53:05<18:22:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.60s]
Epoch 1: 30%|███ | 3717/12384 [7:53:05<18:21:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.60s]
Epoch 1: 30%|███ | 3717/12384 [7:53:13<18:21:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 30%|███ | 3718/12384 [7:53:13<18:20:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 30%|███ | 3718/12384 [7:53:20<18:20:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 1: 30%|███ | 3719/12384 [7:53:20<18:20:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 1: 30%|███ | 3719/12384 [7:53:28<18:20:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 30%|███ | 3720/12384 [7:53:28<18:19:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 30%|███ | 3720/12384 [7:53:35<18:19:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 30%|███ | 3721/12384 [7:53:35<18:18:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 30%|███ | 3721/12384 [7:53:43<18:18:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 30%|███ | 3722/12384 [7:53:43<18:18:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 30%|███ | 3722/12384 [7:53:51<18:18:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 1: 30%|███ | 3723/12384 [7:53:51<18:18:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 1: 30%|███ | 3723/12384 [7:53:58<18:18:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 1: 30%|███ | 3724/12384 [7:53:58<18:17:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 1: 30%|███ | 3724/12384 [7:54:06<18:17:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 30%|███ | 3725/12384 [7:54:06<18:17:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 30%|███ | 3725/12384 [7:54:13<18:17:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 1: 30%|███ | 3726/12384 [7:54:13<18:16:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 1: 30%|███ | 3726/12384 [7:54:21<18:16:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 1: 30%|███ | 3727/12384 [7:54:21<18:17:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 1: 30%|███ | 3727/12384 [7:54:29<18:17:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.47s]
Epoch 1: 30%|███ | 3728/12384 [7:54:29<18:17:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.47s]
Epoch 1: 30%|███ | 3728/12384 [7:54:36<18:17:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 30%|███ | 3729/12384 [7:54:36<18:17:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 30%|███ | 3729/12384 [7:54:44<18:17:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 30%|███ | 3730/12384 [7:54:44<18:18:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 30%|███ | 3730/12384 [7:54:51<18:18:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 30%|███ | 3731/12384 [7:54:51<18:17:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 30%|███ | 3731/12384 [7:54:59<18:17:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 30%|███ | 3732/12384 [7:54:59<18:20:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 30%|███ | 3732/12384 [7:55:07<18:20:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 1: 30%|███ | 3733/12384 [7:55:07<18:20:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 1: 30%|███ | 3733/12384 [7:55:14<18:20:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.82s]
Epoch 1: 30%|███ | 3734/12384 [7:55:14<18:19:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.82s]
Epoch 1: 30%|███ | 3734/12384 [7:55:22<18:19:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 1: 30%|███ | 3735/12384 [7:55:22<18:18:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 1: 30%|███ | 3735/12384 [7:55:30<18:18:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 30%|███ | 3736/12384 [7:55:30<18:18:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 30%|███ | 3736/12384 [7:55:37<18:18:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 30%|███ | 3737/12384 [7:55:37<18:18:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 30%|███ | 3737/12384 [7:55:45<18:18:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 1: 30%|███ | 3738/12384 [7:55:45<18:29:53, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 1: 30%|███ | 3738/12384 [7:55:53<18:29:53, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 30%|███ | 3739/12384 [7:55:53<18:25:18, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 30%|███ | 3739/12384 [7:56:00<18:25:18, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 1: 30%|███ | 3740/12384 [7:56:00<18:22:53, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 1: 30%|███ | 3740/12384 [7:56:08<18:22:53, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 1: 30%|███ | 3741/12384 [7:56:08<18:20:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 1: 30%|███ | 3741/12384 [7:56:16<18:20:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 30%|███ | 3742/12384 [7:56:16<18:19:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 30%|███ | 3742/12384 [7:56:23<18:19:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 1: 30%|███ | 3743/12384 [7:56:23<18:19:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 1: 30%|███ | 3743/12384 [7:56:31<18:19:08, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=10.35s]
Epoch 1: 30%|███ | 3744/12384 [7:56:31<18:18:29, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=10.35s]
Epoch 1: 30%|███ | 3744/12384 [7:56:38<18:18:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 30%|███ | 3745/12384 [7:56:38<18:16:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 30%|███ | 3745/12384 [7:56:46<18:16:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 30%|███ | 3746/12384 [7:56:46<18:16:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 30%|███ | 3746/12384 [7:56:54<18:16:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 1: 30%|███ | 3747/12384 [7:56:54<18:15:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 1: 30%|███ | 3747/12384 [7:57:01<18:15:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 1: 30%|███ | 3748/12384 [7:57:01<18:14:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 1: 30%|███ | 3748/12384 [7:57:09<18:14:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 1: 30%|███ | 3749/12384 [7:57:09<18:14:08, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 1: 30%|███ | 3749/12384 [7:57:16<18:14:08, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 1: 30%|███ | 3750/12384 [7:57:16<18:13:46, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 1: 30%|███ | 3750/12384 [7:57:24<18:13:46, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 30%|███ | 3751/12384 [7:57:24<18:15:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 30%|███ | 3751/12384 [7:57:32<18:15:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 30%|███ | 3752/12384 [7:57:32<18:15:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 30%|███ | 3752/12384 [7:57:39<18:15:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 30%|███ | 3753/12384 [7:57:39<18:14:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 30%|███ | 3753/12384 [7:57:47<18:14:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.88s]
Epoch 1: 30%|███ | 3754/12384 [7:57:47<18:16:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.88s]
Epoch 1: 30%|███ | 3754/12384 [7:57:55<18:16:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.37s]
Epoch 1: 30%|███ | 3755/12384 [7:57:55<18:17:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.37s]
Epoch 1: 30%|███ | 3755/12384 [7:58:02<18:17:07, 7.63s/it, loss=0.0004, acc=0.9987, iter_time=4.79s]
Epoch 1: 30%|███ | 3756/12384 [7:58:02<18:16:32, 7.63s/it, loss=0.0004, acc=0.9987, iter_time=4.79s]
Epoch 1: 30%|███ | 3756/12384 [7:58:10<18:16:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 1: 30%|███ | 3757/12384 [7:58:10<18:14:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 1: 30%|███ | 3757/12384 [7:58:17<18:14:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 1: 30%|███ | 3758/12384 [7:58:17<18:14:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 1: 30%|███ | 3758/12384 [7:58:25<18:14:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.77s]
Epoch 1: 30%|███ | 3759/12384 [7:58:25<18:17:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.77s]
Epoch 1: 30%|███ | 3759/12384 [7:58:33<18:17:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 30%|███ | 3760/12384 [7:58:33<18:16:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 30%|███ | 3760/12384 [7:58:40<18:16:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 30%|███ | 3761/12384 [7:58:40<18:16:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 30%|███ | 3761/12384 [7:58:48<18:16:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 30%|███ | 3762/12384 [7:58:48<18:14:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 30%|███ | 3762/12384 [7:58:56<18:14:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 30%|███ | 3763/12384 [7:58:56<18:16:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 30%|███ | 3763/12384 [7:59:03<18:16:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 30%|███ | 3764/12384 [7:59:03<18:16:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 30%|███ | 3764/12384 [7:59:11<18:16:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 1: 30%|███ | 3765/12384 [7:59:11<18:28:34, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 1: 30%|███ | 3765/12384 [7:59:19<18:28:34, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 1: 30%|███ | 3766/12384 [7:59:19<18:24:25, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 1: 30%|███ | 3766/12384 [7:59:26<18:24:25, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 30%|███ | 3767/12384 [7:59:26<18:20:49, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 30%|███ | 3767/12384 [7:59:34<18:20:49, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 30%|███ | 3768/12384 [7:59:34<18:18:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 30%|███ | 3768/12384 [7:59:42<18:18:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 30%|███ | 3769/12384 [7:59:42<18:16:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 30%|███ | 3769/12384 [7:59:49<18:16:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 30%|███ | 3770/12384 [7:59:49<18:15:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 30%|███ | 3770/12384 [7:59:57<18:15:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 1: 30%|███ | 3771/12384 [7:59:57<18:14:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 1: 30%|███ | 3771/12384 [8:00:04<18:14:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 1: 30%|███ | 3772/12384 [8:00:04<18:13:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 1: 30%|███ | 3772/12384 [8:00:12<18:13:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 1: 30%|███ | 3773/12384 [8:00:12<18:13:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 1: 30%|███ | 3773/12384 [8:00:20<18:13:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 1: 30%|███ | 3774/12384 [8:00:20<18:12:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 1: 30%|███ | 3774/12384 [8:00:27<18:12:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 1: 30%|███ | 3775/12384 [8:00:27<18:12:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 1: 30%|███ | 3775/12384 [8:00:35<18:12:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 30%|███ | 3776/12384 [8:00:35<18:12:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 30%|███ | 3776/12384 [8:00:42<18:12:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 30%|███ | 3777/12384 [8:00:42<18:12:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 30%|███ | 3777/12384 [8:00:50<18:12:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 31%|███ | 3778/12384 [8:00:50<18:15:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 31%|███ | 3778/12384 [8:00:58<18:15:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.36s]
Epoch 1: 31%|███ | 3779/12384 [8:00:58<18:15:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.36s]
Epoch 1: 31%|███ | 3779/12384 [8:01:05<18:15:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.95s]
Epoch 1: 31%|███ | 3780/12384 [8:01:05<18:14:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.95s]
Epoch 1: 31%|███ | 3780/12384 [8:01:13<18:14:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 31%|███ | 3781/12384 [8:01:13<18:12:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 31%|███ | 3781/12384 [8:01:21<18:12:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 31%|███ | 3782/12384 [8:01:21<18:11:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 31%|███ | 3782/12384 [8:01:28<18:11:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 31%|███ | 3783/12384 [8:01:28<18:10:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 31%|███ | 3783/12384 [8:01:36<18:10:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 31%|███ | 3784/12384 [8:01:36<18:10:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 31%|███ | 3784/12384 [8:01:43<18:10:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.35s]
Epoch 1: 31%|███ | 3785/12384 [8:01:43<18:10:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.35s]
Epoch 1: 31%|███ | 3785/12384 [8:01:51<18:10:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 1: 31%|███ | 3786/12384 [8:01:51<18:09:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 1: 31%|███ | 3786/12384 [8:01:59<18:09:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 31%|███ | 3787/12384 [8:01:59<18:10:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 31%|███ | 3787/12384 [8:02:06<18:10:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 31%|███ | 3788/12384 [8:02:06<18:09:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 31%|███ | 3788/12384 [8:02:14<18:09:41, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.49s]
Epoch 1: 31%|███ | 3789/12384 [8:02:14<18:09:46, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.49s]
Epoch 1: 31%|███ | 3789/12384 [8:02:21<18:09:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 1: 31%|███ | 3790/12384 [8:02:21<18:09:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 1: 31%|███ | 3790/12384 [8:02:29<18:09:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 31%|███ | 3791/12384 [8:02:29<18:24:31, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 31%|███ | 3791/12384 [8:02:37<18:24:31, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 31%|███ | 3792/12384 [8:02:37<18:23:32, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 31%|███ | 3792/12384 [8:02:45<18:23:32, 7.71s/it, loss=0.0003, acc=0.9983, iter_time=7.75s]
Epoch 1: 31%|███ | 3793/12384 [8:02:45<18:22:34, 7.70s/it, loss=0.0003, acc=0.9983, iter_time=7.75s]
Epoch 1: 31%|███ | 3793/12384 [8:02:52<18:22:34, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 31%|███ | 3794/12384 [8:02:52<18:17:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 31%|███ | 3794/12384 [8:03:00<18:17:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 1: 31%|███ | 3795/12384 [8:03:00<18:14:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 1: 31%|███ | 3795/12384 [8:03:08<18:14:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 1: 31%|███ | 3796/12384 [8:03:08<18:13:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 1: 31%|███ | 3796/12384 [8:03:15<18:13:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 1: 31%|███ | 3797/12384 [8:03:15<18:12:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 1: 31%|███ | 3797/12384 [8:03:23<18:12:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 1: 31%|███ | 3798/12384 [8:03:23<18:12:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 1: 31%|███ | 3798/12384 [8:03:30<18:12:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 31%|███ | 3799/12384 [8:03:30<18:10:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 31%|███ | 3799/12384 [8:03:38<18:10:55, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.74s]
Epoch 1: 31%|███ | 3800/12384 [8:03:38<18:09:46, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.74s]
Epoch 1: 31%|███ | 3800/12384 [8:03:46<18:09:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 31%|███ | 3801/12384 [8:03:46<18:09:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 31%|███ | 3801/12384 [8:03:53<18:09:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 31%|███ | 3802/12384 [8:03:53<18:11:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 31%|███ | 3802/12384 [8:04:01<18:11:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 1: 31%|███ | 3803/12384 [8:04:01<18:09:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 1: 31%|███ | 3803/12384 [8:04:09<18:09:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 1: 31%|███ | 3804/12384 [8:04:09<18:10:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 1: 31%|███ | 3804/12384 [8:04:16<18:10:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.24s]
Epoch 1: 31%|███ | 3805/12384 [8:04:16<18:11:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.24s]
Epoch 1: 31%|███ | 3805/12384 [8:04:24<18:11:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 31%|███ | 3806/12384 [8:04:24<18:23:42, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 31%|███ | 3806/12384 [8:04:32<18:23:42, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 31%|███ | 3807/12384 [8:04:32<18:19:27, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 31%|███ | 3807/12384 [8:04:39<18:19:27, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 1: 31%|███ | 3808/12384 [8:04:39<18:15:52, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 1: 31%|███ | 3808/12384 [8:04:47<18:15:52, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 1: 31%|███ | 3809/12384 [8:04:47<18:16:25, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 1: 31%|███ | 3809/12384 [8:04:55<18:16:25, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.02s]
Epoch 1: 31%|███ | 3810/12384 [8:04:55<18:14:12, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.02s]
Epoch 1: 31%|███ | 3810/12384 [8:05:02<18:14:12, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 31%|███ | 3811/12384 [8:05:02<18:11:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 31%|███ | 3811/12384 [8:05:10<18:11:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.57s]
Epoch 1: 31%|███ | 3812/12384 [8:05:10<18:08:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.57s]
Epoch 1: 31%|███ | 3812/12384 [8:05:17<18:08:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.75s]
Epoch 1: 31%|███ | 3813/12384 [8:05:17<18:08:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.75s]
Epoch 1: 31%|███ | 3813/12384 [8:05:25<18:08:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.66s]
Epoch 1: 31%|███ | 3814/12384 [8:05:25<18:12:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.66s]
Epoch 1: 31%|███ | 3814/12384 [8:05:33<18:12:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.52s]
Epoch 1: 31%|███ | 3815/12384 [8:05:33<18:10:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.52s]
Epoch 1: 31%|███ | 3815/12384 [8:05:40<18:10:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 31%|███ | 3816/12384 [8:05:40<18:10:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 31%|███ | 3816/12384 [8:05:48<18:10:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 31%|███ | 3817/12384 [8:05:48<18:23:50, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 31%|███ | 3817/12384 [8:05:56<18:23:50, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 31%|███ | 3818/12384 [8:05:56<18:17:47, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 31%|███ | 3818/12384 [8:06:04<18:17:47, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 31%|███ | 3819/12384 [8:06:04<18:14:49, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 31%|███ | 3819/12384 [8:06:11<18:14:49, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.63s]
Epoch 1: 31%|███ | 3820/12384 [8:06:11<18:12:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.63s]
Epoch 1: 31%|███ | 3820/12384 [8:06:19<18:12:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 1: 31%|███ | 3821/12384 [8:06:19<18:10:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 1: 31%|███ | 3821/12384 [8:06:26<18:10:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.32s]
Epoch 1: 31%|███ | 3822/12384 [8:06:26<18:09:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.32s]
Epoch 1: 31%|███ | 3822/12384 [8:06:34<18:09:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 1: 31%|███ | 3823/12384 [8:06:34<18:08:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 1: 31%|███ | 3823/12384 [8:06:42<18:08:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.34s]
Epoch 1: 31%|███ | 3824/12384 [8:06:42<18:07:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.34s]
Epoch 1: 31%|███ | 3824/12384 [8:06:49<18:07:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 1: 31%|███ | 3825/12384 [8:06:49<18:07:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 1: 31%|███ | 3825/12384 [8:06:57<18:07:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 31%|███ | 3826/12384 [8:06:57<18:09:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 31%|███ | 3826/12384 [8:07:05<18:09:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 31%|███ | 3827/12384 [8:07:05<18:07:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 31%|███ | 3827/12384 [8:07:12<18:07:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 31%|███ | 3828/12384 [8:07:12<18:07:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 31%|███ | 3828/12384 [8:07:20<18:07:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 31%|███ | 3829/12384 [8:07:20<18:06:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 31%|███ | 3829/12384 [8:07:27<18:06:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 31%|███ | 3830/12384 [8:07:27<18:06:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 31%|███ | 3830/12384 [8:07:35<18:06:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 31%|███ | 3831/12384 [8:07:35<18:06:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 31%|███ | 3831/12384 [8:07:43<18:06:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.24s]
Epoch 1: 31%|███ | 3832/12384 [8:07:43<18:06:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.24s]
Epoch 1: 31%|███ | 3832/12384 [8:07:50<18:06:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 31%|███ | 3833/12384 [8:07:50<18:05:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 31%|███ | 3833/12384 [8:07:58<18:05:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 31%|███ | 3834/12384 [8:07:58<18:05:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 31%|███ | 3834/12384 [8:08:06<18:05:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 31%|███ | 3835/12384 [8:08:06<18:05:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 31%|███ | 3835/12384 [8:08:13<18:05:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 1: 31%|███ | 3836/12384 [8:08:13<18:04:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 1: 31%|███ | 3836/12384 [8:08:21<18:04:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 1: 31%|███ | 3837/12384 [8:08:21<18:04:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 1: 31%|███ | 3837/12384 [8:08:28<18:04:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 31%|███ | 3838/12384 [8:08:28<18:05:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 31%|███ | 3838/12384 [8:08:36<18:05:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.89s]
Epoch 1: 31%|███ | 3839/12384 [8:08:36<18:06:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.89s]
Epoch 1: 31%|███ | 3839/12384 [8:08:44<18:06:49, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.01s]
Epoch 1: 31%|███ | 3840/12384 [8:08:44<18:06:01, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.01s]
Epoch 1: 31%|███ | 3840/12384 [8:08:51<18:06:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 31%|███ | 3841/12384 [8:08:51<18:08:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 31%|███ | 3841/12384 [8:08:59<18:08:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 31%|███ | 3842/12384 [8:08:59<18:06:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 31%|███ | 3842/12384 [8:09:07<18:06:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 31%|███ | 3843/12384 [8:09:07<18:19:13, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 31%|███ | 3843/12384 [8:09:15<18:19:13, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 31%|███ | 3844/12384 [8:09:15<18:14:59, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 31%|███ | 3844/12384 [8:09:22<18:14:59, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 31%|███ | 3845/12384 [8:09:22<18:10:46, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 31%|███ | 3845/12384 [8:09:30<18:10:46, 7.66s/it, loss=0.0006, acc=0.9967, iter_time=7.60s]
Epoch 1: 31%|███ | 3846/12384 [8:09:30<18:08:41, 7.65s/it, loss=0.0006, acc=0.9967, iter_time=7.60s]
Epoch 1: 31%|███ | 3846/12384 [8:09:37<18:08:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 1: 31%|███ | 3847/12384 [8:09:37<18:05:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 1: 31%|███ | 3847/12384 [8:09:45<18:05:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 1: 31%|███ | 3848/12384 [8:09:45<18:05:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 1: 31%|███ | 3848/12384 [8:09:53<18:05:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.21s]
Epoch 1: 31%|███ | 3849/12384 [8:09:53<18:04:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.21s]
Epoch 1: 31%|███ | 3849/12384 [8:10:00<18:04:29, 7.62s/it, loss=0.0002, acc=0.9990, iter_time=8.83s]
Epoch 1: 31%|███ | 3850/12384 [8:10:00<18:03:38, 7.62s/it, loss=0.0002, acc=0.9990, iter_time=8.83s]
Epoch 1: 31%|███ | 3850/12384 [8:10:08<18:03:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 1: 31%|███ | 3851/12384 [8:10:08<18:02:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 1: 31%|███ | 3851/12384 [8:10:15<18:02:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 31%|███ | 3852/12384 [8:10:15<18:03:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 31%|███ | 3852/12384 [8:10:23<18:03:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 31%|███ | 3853/12384 [8:10:23<18:02:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 31%|███ | 3853/12384 [8:10:31<18:02:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 1: 31%|███ | 3854/12384 [8:10:31<18:02:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 1: 31%|███ | 3854/12384 [8:10:38<18:02:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.25s]
Epoch 1: 31%|███ | 3855/12384 [8:10:38<18:02:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.25s]
Epoch 1: 31%|███ | 3855/12384 [8:10:46<18:02:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.84s]
Epoch 1: 31%|███ | 3856/12384 [8:10:46<18:02:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.84s]
Epoch 1: 31%|███ | 3856/12384 [8:10:54<18:02:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.49s]
Epoch 1: 31%|███ | 3857/12384 [8:10:54<18:13:20, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.49s]
Epoch 1: 31%|███ | 3857/12384 [8:11:01<18:13:20, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 31%|███ | 3858/12384 [8:11:01<18:10:22, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 31%|███ | 3858/12384 [8:11:09<18:10:22, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 31%|███ | 3859/12384 [8:11:09<18:07:25, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 31%|███ | 3859/12384 [8:11:17<18:07:25, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 31%|███ | 3860/12384 [8:11:17<18:05:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 31%|███ | 3860/12384 [8:11:24<18:05:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 1: 31%|███ | 3861/12384 [8:11:24<18:04:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 1: 31%|███ | 3861/12384 [8:11:32<18:04:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.43s]
Epoch 1: 31%|███ | 3862/12384 [8:11:32<18:03:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.43s]
Epoch 1: 31%|███ | 3862/12384 [8:11:39<18:03:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 1: 31%|███ | 3863/12384 [8:11:39<18:02:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 1: 31%|███ | 3863/12384 [8:11:47<18:02:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 31%|███ | 3864/12384 [8:11:47<18:01:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 31%|███ | 3864/12384 [8:11:55<18:01:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 31%|███ | 3865/12384 [8:11:55<18:00:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 31%|███ | 3865/12384 [8:12:02<18:00:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 31%|███ | 3866/12384 [8:12:02<18:00:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 31%|███ | 3866/12384 [8:12:10<18:00:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.99s]
Epoch 1: 31%|███ | 3867/12384 [8:12:10<17:59:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.99s]
Epoch 1: 31%|███ | 3867/12384 [8:12:17<17:59:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.75s]
Epoch 1: 31%|███ | 3868/12384 [8:12:17<17:59:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.75s]
Epoch 1: 31%|███ | 3868/12384 [8:12:25<17:59:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.72s]
Epoch 1: 31%|███ | 3869/12384 [8:12:25<18:13:35, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.72s]
Epoch 1: 31%|███ | 3869/12384 [8:12:33<18:13:35, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.89s]
Epoch 1: 31%|███▏ | 3870/12384 [8:12:33<18:08:48, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.89s]
Epoch 1: 31%|███▏ | 3870/12384 [8:12:41<18:08:48, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 1: 31%|███▏ | 3871/12384 [8:12:41<18:05:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 1: 31%|███▏ | 3871/12384 [8:12:48<18:05:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.26s]
Epoch 1: 31%|███▏ | 3872/12384 [8:12:48<18:04:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.26s]
Epoch 1: 31%|███▏ | 3872/12384 [8:12:56<18:04:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.40s]
Epoch 1: 31%|███▏ | 3873/12384 [8:12:56<18:01:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.40s]
Epoch 1: 31%|███▏ | 3873/12384 [8:13:03<18:01:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.38s]
Epoch 1: 31%|███▏ | 3874/12384 [8:13:03<18:00:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.38s]
Epoch 1: 31%|███▏ | 3874/12384 [8:13:11<18:00:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 1: 31%|███▏ | 3875/12384 [8:13:11<18:00:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 1: 31%|███▏ | 3875/12384 [8:13:19<18:00:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 1: 31%|███▏ | 3876/12384 [8:13:19<18:00:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 1: 31%|███▏ | 3876/12384 [8:13:26<18:00:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 1: 31%|███▏ | 3877/12384 [8:13:26<18:01:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 1: 31%|███▏ | 3877/12384 [8:13:34<18:01:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 31%|███▏ | 3878/12384 [8:13:34<17:59:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 31%|███▏ | 3878/12384 [8:13:41<17:59:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 31%|███▏ | 3879/12384 [8:13:41<17:58:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 31%|███▏ | 3879/12384 [8:13:49<17:58:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.26s]
Epoch 1: 31%|███▏ | 3880/12384 [8:13:49<17:59:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.26s]
Epoch 1: 31%|███▏ | 3880/12384 [8:13:57<17:59:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 31%|███▏ | 3881/12384 [8:13:57<17:59:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 31%|███▏ | 3881/12384 [8:14:04<17:59:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 1: 31%|███▏ | 3882/12384 [8:14:04<17:59:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 1: 31%|███▏ | 3882/12384 [8:14:12<17:59:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 31%|███▏ | 3883/12384 [8:14:12<18:11:27, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 31%|███▏ | 3883/12384 [8:14:20<18:11:27, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 31%|███▏ | 3884/12384 [8:14:20<18:07:48, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 31%|███▏ | 3884/12384 [8:14:27<18:07:48, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 31%|███▏ | 3885/12384 [8:14:27<18:03:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 31%|███▏ | 3885/12384 [8:14:35<18:03:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 1: 31%|███▏ | 3886/12384 [8:14:35<18:01:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 1: 31%|███▏ | 3886/12384 [8:14:43<18:01:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 31%|███▏ | 3887/12384 [8:14:43<18:02:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 31%|███▏ | 3887/12384 [8:14:50<18:02:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.04s]
Epoch 1: 31%|███▏ | 3888/12384 [8:14:50<17:59:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.04s]
Epoch 1: 31%|███▏ | 3888/12384 [8:14:58<17:59:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 31%|███▏ | 3889/12384 [8:14:58<17:59:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 31%|███▏ | 3889/12384 [8:15:06<17:59:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 1: 31%|███▏ | 3890/12384 [8:15:06<18:02:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 1: 31%|███▏ | 3890/12384 [8:15:13<18:02:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.16s]
Epoch 1: 31%|███▏ | 3891/12384 [8:15:13<18:00:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.16s]
Epoch 1: 31%|███▏ | 3891/12384 [8:15:21<18:00:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 1: 31%|███▏ | 3892/12384 [8:15:21<17:58:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 1: 31%|███▏ | 3892/12384 [8:15:28<17:58:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 1: 31%|███▏ | 3893/12384 [8:15:28<17:58:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 1: 31%|███▏ | 3893/12384 [8:15:36<17:58:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 31%|███▏ | 3894/12384 [8:15:36<17:57:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 31%|███▏ | 3894/12384 [8:15:44<17:57:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 1: 31%|███▏ | 3895/12384 [8:15:44<17:57:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 1: 31%|███▏ | 3895/12384 [8:15:52<17:57:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 1: 31%|███▏ | 3896/12384 [8:15:52<18:12:21, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 1: 31%|███▏ | 3896/12384 [8:15:59<18:12:21, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 1: 31%|███▏ | 3897/12384 [8:15:59<18:06:41, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 1: 31%|███▏ | 3897/12384 [8:16:07<18:06:41, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 1: 31%|███▏ | 3898/12384 [8:16:07<18:04:22, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 1: 31%|███▏ | 3898/12384 [8:16:14<18:04:22, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.75s]
Epoch 1: 31%|███▏ | 3899/12384 [8:16:14<18:02:49, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.75s]
Epoch 1: 31%|███▏ | 3899/12384 [8:16:22<18:02:49, 7.66s/it, loss=0.0006, acc=0.9982, iter_time=4.61s]
Epoch 1: 31%|███▏ | 3900/12384 [8:16:22<18:01:50, 7.65s/it, loss=0.0006, acc=0.9982, iter_time=4.61s]
Epoch 1: 31%|███▏ | 3900/12384 [8:16:30<18:01:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.66s]
Epoch 1: 32%|███▏ | 3901/12384 [8:16:30<18:00:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.66s]
Epoch 1: 32%|███▏ | 3901/12384 [8:16:37<18:00:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 32%|███▏ | 3902/12384 [8:16:37<17:59:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 32%|███▏ | 3902/12384 [8:16:45<17:59:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 32%|███▏ | 3903/12384 [8:16:45<17:57:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 32%|███▏ | 3903/12384 [8:16:53<17:57:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 32%|███▏ | 3904/12384 [8:16:53<17:57:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 32%|███▏ | 3904/12384 [8:17:00<17:57:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.79s]
Epoch 1: 32%|███▏ | 3905/12384 [8:17:00<17:56:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.79s]
Epoch 1: 32%|███▏ | 3905/12384 [8:17:08<17:56:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 1: 32%|███▏ | 3906/12384 [8:17:08<17:56:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 1: 32%|███▏ | 3906/12384 [8:17:15<17:56:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 32%|███▏ | 3907/12384 [8:17:15<17:55:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 32%|███▏ | 3907/12384 [8:17:23<17:55:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.49s]
Epoch 1: 32%|███▏ | 3908/12384 [8:17:23<17:53:14, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.49s]
Epoch 1: 32%|███▏ | 3908/12384 [8:17:31<17:53:14, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 1: 32%|███▏ | 3909/12384 [8:17:31<18:04:21, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 1: 32%|███▏ | 3909/12384 [8:17:38<18:04:21, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=5.51s]
Epoch 1: 32%|███▏ | 3910/12384 [8:17:38<18:03:39, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=5.51s]
Epoch 1: 32%|███▏ | 3910/12384 [8:17:46<18:03:39, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.74s]
Epoch 1: 32%|███▏ | 3911/12384 [8:17:46<18:01:18, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.74s]
Epoch 1: 32%|███▏ | 3911/12384 [8:17:54<18:01:18, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 32%|███▏ | 3912/12384 [8:17:54<17:58:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 32%|███▏ | 3912/12384 [8:18:01<17:58:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 1: 32%|███▏ | 3913/12384 [8:18:01<17:57:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 1: 32%|███▏ | 3913/12384 [8:18:09<17:57:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 1: 32%|███▏ | 3914/12384 [8:18:09<18:00:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 1: 32%|███▏ | 3914/12384 [8:18:17<18:00:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 32%|███▏ | 3915/12384 [8:18:17<17:58:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 32%|███▏ | 3915/12384 [8:18:24<17:58:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 1: 32%|███▏ | 3916/12384 [8:18:24<18:00:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 1: 32%|███▏ | 3916/12384 [8:18:32<18:00:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.61s]
Epoch 1: 32%|███▏ | 3917/12384 [8:18:32<18:00:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.61s]
Epoch 1: 32%|███▏ | 3917/12384 [8:18:40<18:00:16, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=5.64s]
Epoch 1: 32%|███▏ | 3918/12384 [8:18:40<17:58:59, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=5.64s]
Epoch 1: 32%|███▏ | 3918/12384 [8:18:47<17:58:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.25s]
Epoch 1: 32%|███▏ | 3919/12384 [8:18:47<17:56:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.25s]
Epoch 1: 32%|███▏ | 3919/12384 [8:18:55<17:56:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 1: 32%|███▏ | 3920/12384 [8:18:55<17:58:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 1: 32%|███▏ | 3920/12384 [8:19:02<17:58:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.15s]
Epoch 1: 32%|███▏ | 3921/12384 [8:19:02<17:56:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.15s]
Epoch 1: 32%|███▏ | 3921/12384 [8:19:10<17:56:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.71s]
Epoch 1: 32%|███▏ | 3922/12384 [8:19:10<18:10:31, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=10.71s]
Epoch 1: 32%|███▏ | 3922/12384 [8:19:18<18:10:31, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 1: 32%|███▏ | 3923/12384 [8:19:18<18:05:13, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 1: 32%|███▏ | 3923/12384 [8:19:26<18:05:13, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 1: 32%|███▏ | 3924/12384 [8:19:26<18:02:36, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 1: 32%|███▏ | 3924/12384 [8:19:33<18:02:36, 7.68s/it, loss=0.0003, acc=0.9992, iter_time=4.72s]
Epoch 1: 32%|███▏ | 3925/12384 [8:19:33<17:59:18, 7.66s/it, loss=0.0003, acc=0.9992, iter_time=4.72s]
Epoch 1: 32%|███▏ | 3925/12384 [8:19:41<17:59:18, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 1: 32%|███▏ | 3926/12384 [8:19:41<17:58:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 1: 32%|███▏ | 3926/12384 [8:19:48<17:58:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 32%|███▏ | 3927/12384 [8:19:48<17:55:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 32%|███▏ | 3927/12384 [8:19:56<17:55:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 32%|███▏ | 3928/12384 [8:19:56<17:58:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 32%|███▏ | 3928/12384 [8:20:04<17:58:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.68s]
Epoch 1: 32%|███▏ | 3929/12384 [8:20:04<17:56:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.68s]
Epoch 1: 32%|███▏ | 3929/12384 [8:20:11<17:56:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 1: 32%|███▏ | 3930/12384 [8:20:11<17:56:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 1: 32%|███▏ | 3930/12384 [8:20:19<17:56:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 1: 32%|███▏ | 3931/12384 [8:20:19<17:54:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 1: 32%|███▏ | 3931/12384 [8:20:27<17:54:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.14s]
Epoch 1: 32%|███▏ | 3932/12384 [8:20:27<17:53:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.14s]
Epoch 1: 32%|███▏ | 3932/12384 [8:20:34<17:53:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 32%|███▏ | 3933/12384 [8:20:34<17:53:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 32%|███▏ | 3933/12384 [8:20:42<17:53:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 32%|███▏ | 3934/12384 [8:20:42<17:52:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 32%|███▏ | 3934/12384 [8:20:49<17:52:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 1: 32%|███▏ | 3935/12384 [8:20:49<17:52:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 1: 32%|███▏ | 3935/12384 [8:20:57<17:52:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 32%|███▏ | 3936/12384 [8:20:57<18:03:46, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 32%|███▏ | 3936/12384 [8:21:05<18:03:46, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 32%|███▏ | 3937/12384 [8:21:05<17:59:59, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 32%|███▏ | 3937/12384 [8:21:13<17:59:59, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 32%|███▏ | 3938/12384 [8:21:13<17:57:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 32%|███▏ | 3938/12384 [8:21:20<17:57:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 32%|███▏ | 3939/12384 [8:21:20<17:54:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 32%|███▏ | 3939/12384 [8:21:28<17:54:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 32%|███▏ | 3940/12384 [8:21:28<17:55:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 32%|███▏ | 3940/12384 [8:21:35<17:55:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 32%|███▏ | 3941/12384 [8:21:35<17:53:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 32%|███▏ | 3941/12384 [8:21:43<17:53:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 32%|███▏ | 3942/12384 [8:21:43<17:52:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 32%|███▏ | 3942/12384 [8:21:51<17:52:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 32%|███▏ | 3943/12384 [8:21:51<17:53:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 32%|███▏ | 3943/12384 [8:21:58<17:53:09, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.03s]
Epoch 1: 32%|███▏ | 3944/12384 [8:21:58<17:52:35, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.03s]
Epoch 1: 32%|███▏ | 3944/12384 [8:22:06<17:52:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 32%|███▏ | 3945/12384 [8:22:06<17:52:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 32%|███▏ | 3945/12384 [8:22:13<17:52:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 1: 32%|███▏ | 3946/12384 [8:22:13<17:50:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 1: 32%|███▏ | 3946/12384 [8:22:21<17:50:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.92s]
Epoch 1: 32%|███▏ | 3947/12384 [8:22:21<17:50:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.92s]
Epoch 1: 32%|███▏ | 3947/12384 [8:22:29<17:50:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 32%|███▏ | 3948/12384 [8:22:29<17:49:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 32%|███▏ | 3948/12384 [8:22:37<17:49:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.28s]
Epoch 1: 32%|███▏ | 3949/12384 [8:22:37<18:03:57, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.28s]
Epoch 1: 32%|███▏ | 3949/12384 [8:22:44<18:03:57, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 1: 32%|███▏ | 3950/12384 [8:22:44<17:58:28, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 1: 32%|███▏ | 3950/12384 [8:22:52<17:58:28, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.39s]
Epoch 1: 32%|███▏ | 3951/12384 [8:22:52<17:54:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.39s]
Epoch 1: 32%|███▏ | 3951/12384 [8:22:59<17:54:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 32%|███▏ | 3952/12384 [8:22:59<17:55:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 32%|███▏ | 3952/12384 [8:23:07<17:55:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 32%|███▏ | 3953/12384 [8:23:07<17:53:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 32%|███▏ | 3953/12384 [8:23:15<17:53:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 32%|███▏ | 3954/12384 [8:23:15<17:51:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 32%|███▏ | 3954/12384 [8:23:22<17:51:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.57s]
Epoch 1: 32%|███▏ | 3955/12384 [8:23:22<17:51:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.57s]
Epoch 1: 32%|███▏ | 3955/12384 [8:23:30<17:51:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 1: 32%|███▏ | 3956/12384 [8:23:30<17:49:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 1: 32%|███▏ | 3956/12384 [8:23:38<17:49:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.97s]
Epoch 1: 32%|███▏ | 3957/12384 [8:23:38<17:52:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.97s]
Epoch 1: 32%|███▏ | 3957/12384 [8:23:45<17:52:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 32%|███▏ | 3958/12384 [8:23:45<17:50:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 32%|███▏ | 3958/12384 [8:23:53<17:50:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 32%|███▏ | 3959/12384 [8:23:53<17:49:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 32%|███▏ | 3959/12384 [8:24:00<17:49:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 32%|███▏ | 3960/12384 [8:24:00<17:48:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 32%|███▏ | 3960/12384 [8:24:08<17:48:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 32%|███▏ | 3961/12384 [8:24:08<17:48:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 32%|███▏ | 3961/12384 [8:24:16<17:48:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 1: 32%|███▏ | 3962/12384 [8:24:16<17:48:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 1: 32%|███▏ | 3962/12384 [8:24:23<17:48:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.18s]
Epoch 1: 32%|███▏ | 3963/12384 [8:24:23<17:48:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.18s]
Epoch 1: 32%|███▏ | 3963/12384 [8:24:31<17:48:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.90s]
Epoch 1: 32%|███▏ | 3964/12384 [8:24:31<17:48:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.90s]
Epoch 1: 32%|███▏ | 3964/12384 [8:24:38<17:48:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.03s]
Epoch 1: 32%|███▏ | 3965/12384 [8:24:38<17:48:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.03s]
Epoch 1: 32%|███▏ | 3965/12384 [8:24:46<17:48:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.63s]
Epoch 1: 32%|███▏ | 3966/12384 [8:24:46<17:48:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.63s]
Epoch 1: 32%|███▏ | 3966/12384 [8:24:54<17:48:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 32%|███▏ | 3967/12384 [8:24:54<17:47:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 32%|███▏ | 3967/12384 [8:25:01<17:47:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 32%|███▏ | 3968/12384 [8:25:01<17:46:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 32%|███▏ | 3968/12384 [8:25:09<17:46:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 32%|███▏ | 3969/12384 [8:25:09<17:46:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 32%|███▏ | 3969/12384 [8:25:16<17:46:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.61s]
Epoch 1: 32%|███▏ | 3970/12384 [8:25:16<17:46:12, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=3.61s]
Epoch 1: 32%|███▏ | 3970/12384 [8:25:24<17:46:12, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.59s]
Epoch 1: 32%|███▏ | 3971/12384 [8:25:24<17:45:52, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.59s]
Epoch 1: 32%|███▏ | 3971/12384 [8:25:32<17:45:52, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 32%|███▏ | 3972/12384 [8:25:32<17:46:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 32%|███▏ | 3972/12384 [8:25:39<17:46:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 32%|███▏ | 3973/12384 [8:25:39<17:46:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 32%|███▏ | 3973/12384 [8:25:47<17:46:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 32%|███▏ | 3974/12384 [8:25:47<17:49:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 32%|███▏ | 3974/12384 [8:25:55<17:49:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 1: 32%|███▏ | 3975/12384 [8:25:55<18:01:43, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 1: 32%|███▏ | 3975/12384 [8:26:03<18:01:43, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 1: 32%|███▏ | 3976/12384 [8:26:03<17:57:23, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 1: 32%|███▏ | 3976/12384 [8:26:10<17:57:23, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 32%|███▏ | 3977/12384 [8:26:10<17:53:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 32%|███▏ | 3977/12384 [8:26:18<17:53:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 1: 32%|███▏ | 3978/12384 [8:26:18<17:52:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 1: 32%|███▏ | 3978/12384 [8:26:25<17:52:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 32%|███▏ | 3979/12384 [8:26:25<17:50:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 32%|███▏ | 3979/12384 [8:26:33<17:50:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 32%|███▏ | 3980/12384 [8:26:33<17:52:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 32%|███▏ | 3980/12384 [8:26:41<17:52:00, 7.65s/it, loss=0.0011, acc=0.9991, iter_time=10.58s]
Epoch 1: 32%|███▏ | 3981/12384 [8:26:41<17:50:55, 7.65s/it, loss=0.0011, acc=0.9991, iter_time=10.58s]
Epoch 1: 32%|███▏ | 3981/12384 [8:26:48<17:50:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 32%|███▏ | 3982/12384 [8:26:48<17:52:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 32%|███▏ | 3982/12384 [8:26:56<17:52:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 32%|███▏ | 3983/12384 [8:26:56<17:50:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 32%|███▏ | 3983/12384 [8:27:04<17:50:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 32%|███▏ | 3984/12384 [8:27:04<17:49:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 32%|███▏ | 3984/12384 [8:27:11<17:49:14, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.26s]
Epoch 1: 32%|███▏ | 3985/12384 [8:27:11<17:48:12, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.26s]
Epoch 1: 32%|███▏ | 3985/12384 [8:27:19<17:48:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 1: 32%|███▏ | 3986/12384 [8:27:19<17:47:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 1: 32%|███▏ | 3986/12384 [8:27:26<17:47:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.52s]
Epoch 1: 32%|███▏ | 3987/12384 [8:27:26<17:48:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.52s]
Epoch 1: 32%|███▏ | 3987/12384 [8:27:34<17:48:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.04s]
Epoch 1: 32%|███▏ | 3988/12384 [8:27:34<17:46:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.04s]
Epoch 1: 32%|███▏ | 3988/12384 [8:27:42<17:46:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.66s]
Epoch 1: 32%|███▏ | 3989/12384 [8:27:42<17:44:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.66s]
Epoch 1: 32%|███▏ | 3989/12384 [8:27:49<17:44:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.70s]
Epoch 1: 32%|███▏ | 3990/12384 [8:27:49<17:44:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.70s]
Epoch 1: 32%|███▏ | 3990/12384 [8:27:57<17:44:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 1: 32%|███▏ | 3991/12384 [8:27:57<17:44:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 1: 32%|███▏ | 3991/12384 [8:28:05<17:44:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 32%|███▏ | 3992/12384 [8:28:05<17:47:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 32%|███▏ | 3992/12384 [8:28:12<17:47:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.42s]
Epoch 1: 32%|███▏ | 3993/12384 [8:28:12<17:46:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.42s]
Epoch 1: 32%|███▏ | 3993/12384 [8:28:20<17:46:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 1: 32%|███▏ | 3994/12384 [8:28:20<17:45:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 1: 32%|███▏ | 3994/12384 [8:28:27<17:45:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 32%|███▏ | 3995/12384 [8:28:27<17:43:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 32%|███▏ | 3995/12384 [8:28:35<17:43:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 1: 32%|███▏ | 3996/12384 [8:28:35<17:43:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 1: 32%|███▏ | 3996/12384 [8:28:43<17:43:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 1: 32%|███▏ | 3997/12384 [8:28:43<17:43:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 1: 32%|███▏ | 3997/12384 [8:28:50<17:43:10, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=7.61s]
Epoch 1: 32%|███▏ | 3998/12384 [8:28:50<17:42:53, 7.60s/it, loss=0.0001, acc=0.9999, iter_time=7.61s]
Epoch 1: 32%|███▏ | 3998/12384 [8:28:58<17:42:53, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 32%|███▏ | 3999/12384 [8:28:58<17:42:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 32%|███▏ | 3999/12384 [8:29:05<17:42:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 32%|███▏ | 4000/12384 [8:29:05<17:42:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 32%|███▏ | 4000/12384 [8:29:13<17:42:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 32%|███▏ | 4001/12384 [8:29:13<17:56:13, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 32%|███▏ | 4001/12384 [8:29:21<17:56:13, 7.70s/it, loss=0.0002, acc=1.0000, iter_time=5.81s]
Epoch 1: 32%|███▏ | 4002/12384 [8:29:21<17:52:16, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=5.81s]
Epoch 1: 32%|███▏ | 4002/12384 [8:29:29<17:52:16, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 32%|███▏ | 4003/12384 [8:29:29<17:53:35, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 32%|███▏ | 4003/12384 [8:29:36<17:53:35, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 1: 32%|███▏ | 4004/12384 [8:29:36<17:49:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 1: 32%|███▏ | 4004/12384 [8:29:44<17:49:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 32%|███▏ | 4005/12384 [8:29:44<17:47:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 32%|███▏ | 4005/12384 [8:29:51<17:47:26, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.13s]
Epoch 1: 32%|███▏ | 4006/12384 [8:29:51<17:46:04, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.13s]
Epoch 1: 32%|███▏ | 4006/12384 [8:29:59<17:46:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 1: 32%|███▏ | 4007/12384 [8:29:59<17:44:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 1: 32%|███▏ | 4007/12384 [8:30:07<17:44:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 32%|███▏ | 4008/12384 [8:30:07<17:44:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 32%|███▏ | 4008/12384 [8:30:14<17:44:30, 7.63s/it, loss=0.0005, acc=0.9983, iter_time=5.55s]
Epoch 1: 32%|███▏ | 4009/12384 [8:30:14<17:43:36, 7.62s/it, loss=0.0005, acc=0.9983, iter_time=5.55s]
Epoch 1: 32%|███▏ | 4009/12384 [8:30:22<17:43:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 1: 32%|███▏ | 4010/12384 [8:30:22<17:43:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 1: 32%|███▏ | 4010/12384 [8:30:29<17:43:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 1: 32%|███▏ | 4011/12384 [8:30:29<17:41:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 1: 32%|███▏ | 4011/12384 [8:30:37<17:41:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 1: 32%|███▏ | 4012/12384 [8:30:37<17:42:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 1: 32%|███▏ | 4012/12384 [8:30:45<17:42:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.31s]
Epoch 1: 32%|███▏ | 4013/12384 [8:30:45<17:42:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.31s]
Epoch 1: 32%|███▏ | 4013/12384 [8:30:52<17:42:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 1: 32%|███▏ | 4014/12384 [8:30:52<17:41:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 1: 32%|███▏ | 4014/12384 [8:31:00<17:41:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 32%|███▏ | 4015/12384 [8:31:00<17:41:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 32%|███▏ | 4015/12384 [8:31:08<17:41:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 1: 32%|███▏ | 4016/12384 [8:31:08<17:43:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 1: 32%|███▏ | 4016/12384 [8:31:15<17:43:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 32%|███▏ | 4017/12384 [8:31:15<17:43:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 32%|███▏ | 4017/12384 [8:31:23<17:43:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 1: 32%|███▏ | 4018/12384 [8:31:23<17:41:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 1: 32%|███▏ | 4018/12384 [8:31:30<17:41:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 32%|███▏ | 4019/12384 [8:31:30<17:40:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 32%|███▏ | 4019/12384 [8:31:38<17:40:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 32%|███▏ | 4020/12384 [8:31:38<17:39:52, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 32%|███▏ | 4020/12384 [8:31:46<17:39:52, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 32%|███▏ | 4021/12384 [8:31:46<17:41:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 32%|███▏ | 4021/12384 [8:31:53<17:41:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 32%|███▏ | 4022/12384 [8:31:53<17:42:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 32%|███▏ | 4022/12384 [8:32:01<17:42:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 1: 32%|███▏ | 4023/12384 [8:32:01<17:41:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 1: 32%|███▏ | 4023/12384 [8:32:08<17:41:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 1: 32%|███▏ | 4024/12384 [8:32:08<17:40:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 1: 32%|███▏ | 4024/12384 [8:32:16<17:40:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 33%|███▎ | 4025/12384 [8:32:16<17:40:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 33%|███▎ | 4025/12384 [8:32:24<17:40:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 33%|███▎ | 4026/12384 [8:32:24<17:39:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 33%|███▎ | 4026/12384 [8:32:32<17:39:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 33%|███▎ | 4027/12384 [8:32:32<17:54:11, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 33%|███▎ | 4027/12384 [8:32:39<17:54:11, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 33%|███▎ | 4028/12384 [8:32:39<17:50:11, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 33%|███▎ | 4028/12384 [8:32:47<17:50:11, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 33%|███▎ | 4029/12384 [8:32:47<17:46:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 33%|███▎ | 4029/12384 [8:32:54<17:46:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 33%|███▎ | 4030/12384 [8:32:54<17:44:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 33%|███▎ | 4030/12384 [8:33:02<17:44:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 33%|███▎ | 4031/12384 [8:33:02<17:44:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 33%|███▎ | 4031/12384 [8:33:10<17:44:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 33%|███▎ | 4032/12384 [8:33:10<17:42:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 33%|███▎ | 4032/12384 [8:33:17<17:42:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.43s]
Epoch 1: 33%|███▎ | 4033/12384 [8:33:17<17:41:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.43s]
Epoch 1: 33%|███▎ | 4033/12384 [8:33:25<17:41:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 33%|███▎ | 4034/12384 [8:33:25<17:41:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 33%|███▎ | 4034/12384 [8:33:33<17:41:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 33%|███▎ | 4035/12384 [8:33:33<17:40:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 33%|███▎ | 4035/12384 [8:33:40<17:40:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 33%|███▎ | 4036/12384 [8:33:40<17:40:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 33%|███▎ | 4036/12384 [8:33:48<17:40:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 33%|███▎ | 4037/12384 [8:33:48<17:40:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 33%|███▎ | 4037/12384 [8:33:55<17:40:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 33%|███▎ | 4038/12384 [8:33:55<17:39:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 33%|███▎ | 4038/12384 [8:34:03<17:39:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 33%|███▎ | 4039/12384 [8:34:03<17:38:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 33%|███▎ | 4039/12384 [8:34:11<17:38:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 33%|███▎ | 4040/12384 [8:34:11<17:38:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 33%|███▎ | 4040/12384 [8:34:18<17:38:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 1: 33%|███▎ | 4041/12384 [8:34:18<17:38:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 1: 33%|███▎ | 4041/12384 [8:34:26<17:38:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.30s]
Epoch 1: 33%|███▎ | 4042/12384 [8:34:26<17:38:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.30s]
Epoch 1: 33%|███▎ | 4042/12384 [8:34:33<17:38:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.84s]
Epoch 1: 33%|███▎ | 4043/12384 [8:34:33<17:38:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.84s]
Epoch 1: 33%|███▎ | 4043/12384 [8:34:41<17:38:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.39s]
Epoch 1: 33%|███▎ | 4044/12384 [8:34:41<17:40:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.39s]
Epoch 1: 33%|███▎ | 4044/12384 [8:34:49<17:40:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 33%|███▎ | 4045/12384 [8:34:49<17:40:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 33%|███▎ | 4045/12384 [8:34:56<17:40:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 33%|███▎ | 4046/12384 [8:34:56<17:38:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 33%|███▎ | 4046/12384 [8:35:04<17:38:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 33%|███▎ | 4047/12384 [8:35:04<17:37:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 33%|███▎ | 4047/12384 [8:35:12<17:37:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 33%|███▎ | 4048/12384 [8:35:12<17:38:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 33%|███▎ | 4048/12384 [8:35:19<17:38:03, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=7.22s]
Epoch 1: 33%|███▎ | 4049/12384 [8:35:19<17:37:02, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=7.22s]
Epoch 1: 33%|███▎ | 4049/12384 [8:35:27<17:37:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 33%|███▎ | 4050/12384 [8:35:27<17:37:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 33%|███▎ | 4050/12384 [8:35:34<17:37:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 33%|███▎ | 4051/12384 [8:35:34<17:36:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 33%|███▎ | 4051/12384 [8:35:42<17:36:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 33%|███▎ | 4052/12384 [8:35:42<17:38:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 33%|███▎ | 4052/12384 [8:35:50<17:38:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 33%|███▎ | 4053/12384 [8:35:50<17:53:42, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 33%|███▎ | 4053/12384 [8:35:58<17:53:42, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 1: 33%|███▎ | 4054/12384 [8:35:58<17:49:06, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 1: 33%|███▎ | 4054/12384 [8:36:05<17:49:06, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 1: 33%|███▎ | 4055/12384 [8:36:05<17:44:03, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 1: 33%|███▎ | 4055/12384 [8:36:13<17:44:03, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 1: 33%|███▎ | 4056/12384 [8:36:13<17:45:10, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 1: 33%|███▎ | 4056/12384 [8:36:21<17:45:10, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 33%|███▎ | 4057/12384 [8:36:21<17:43:39, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 33%|███▎ | 4057/12384 [8:36:28<17:43:39, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 33%|███▎ | 4058/12384 [8:36:28<17:41:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 33%|███▎ | 4058/12384 [8:36:36<17:41:18, 7.65s/it, loss=0.0006, acc=1.0000, iter_time=5.05s]
Epoch 1: 33%|███▎ | 4059/12384 [8:36:36<17:39:37, 7.64s/it, loss=0.0006, acc=1.0000, iter_time=5.05s]
Epoch 1: 33%|███▎ | 4059/12384 [8:36:43<17:39:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 1: 33%|███▎ | 4060/12384 [8:36:43<17:37:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 1: 33%|███▎ | 4060/12384 [8:36:51<17:37:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 33%|███▎ | 4061/12384 [8:36:51<17:36:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 33%|███▎ | 4061/12384 [8:36:59<17:36:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 33%|███▎ | 4062/12384 [8:36:59<17:36:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 33%|███▎ | 4062/12384 [8:37:06<17:36:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 33%|███▎ | 4063/12384 [8:37:06<17:36:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 33%|███▎ | 4063/12384 [8:37:14<17:36:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 33%|███▎ | 4064/12384 [8:37:14<17:37:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 33%|███▎ | 4064/12384 [8:37:21<17:37:43, 7.63s/it, loss=0.0002, acc=0.9995, iter_time=7.27s]
Epoch 1: 33%|███▎ | 4065/12384 [8:37:21<17:36:47, 7.62s/it, loss=0.0002, acc=0.9995, iter_time=7.27s]
Epoch 1: 33%|███▎ | 4065/12384 [8:37:29<17:36:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 33%|███▎ | 4066/12384 [8:37:29<17:35:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 33%|███▎ | 4066/12384 [8:37:37<17:35:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 33%|███▎ | 4067/12384 [8:37:37<17:35:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 33%|███▎ | 4067/12384 [8:37:44<17:35:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 33%|███▎ | 4068/12384 [8:37:44<17:36:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 33%|███▎ | 4068/12384 [8:37:52<17:36:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.85s]
Epoch 1: 33%|███▎ | 4069/12384 [8:37:52<17:36:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.85s]
Epoch 1: 33%|███▎ | 4069/12384 [8:38:00<17:36:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.12s]
Epoch 1: 33%|███▎ | 4070/12384 [8:38:00<17:35:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.12s]
Epoch 1: 33%|███▎ | 4070/12384 [8:38:07<17:35:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 1: 33%|███▎ | 4071/12384 [8:38:07<17:34:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 1: 33%|███▎ | 4071/12384 [8:38:15<17:34:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 33%|███▎ | 4072/12384 [8:38:15<17:35:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 33%|███▎ | 4072/12384 [8:38:22<17:35:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.70s]
Epoch 1: 33%|███▎ | 4073/12384 [8:38:22<17:34:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.70s]
Epoch 1: 33%|███▎ | 4073/12384 [8:38:30<17:34:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 1: 33%|███▎ | 4074/12384 [8:38:30<17:35:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 1: 33%|███▎ | 4074/12384 [8:38:38<17:35:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 1: 33%|███▎ | 4075/12384 [8:38:38<17:34:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 1: 33%|███▎ | 4075/12384 [8:38:45<17:34:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 33%|███▎ | 4076/12384 [8:38:45<17:33:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 33%|███▎ | 4076/12384 [8:38:53<17:33:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 33%|███▎ | 4077/12384 [8:38:53<17:35:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 33%|███▎ | 4077/12384 [8:39:01<17:35:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 1: 33%|███▎ | 4078/12384 [8:39:01<17:35:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 1: 33%|███▎ | 4078/12384 [8:39:08<17:35:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 1: 33%|███▎ | 4079/12384 [8:39:08<17:35:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 1: 33%|███▎ | 4079/12384 [8:39:16<17:35:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 1: 33%|███▎ | 4080/12384 [8:39:16<17:49:13, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 1: 33%|███▎ | 4080/12384 [8:39:24<17:49:13, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=3.47s]
Epoch 1: 33%|███▎ | 4081/12384 [8:39:24<17:42:42, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=3.47s]
Epoch 1: 33%|███▎ | 4081/12384 [8:39:31<17:42:42, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 1: 33%|███▎ | 4082/12384 [8:39:31<17:39:42, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 1: 33%|███▎ | 4082/12384 [8:39:39<17:39:42, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 1: 33%|███▎ | 4083/12384 [8:39:39<17:37:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 1: 33%|███▎ | 4083/12384 [8:39:47<17:37:07, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=9.23s]
Epoch 1: 33%|███▎ | 4084/12384 [8:39:47<17:36:12, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=9.23s]
Epoch 1: 33%|███▎ | 4084/12384 [8:39:54<17:36:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 1: 33%|███▎ | 4085/12384 [8:39:54<17:34:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 1: 33%|███▎ | 4085/12384 [8:40:02<17:34:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 1: 33%|███▎ | 4086/12384 [8:40:02<17:33:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 1: 33%|███▎ | 4086/12384 [8:40:09<17:33:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 1: 33%|███▎ | 4087/12384 [8:40:09<17:33:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 1: 33%|███▎ | 4087/12384 [8:40:17<17:33:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 1: 33%|███▎ | 4088/12384 [8:40:17<17:32:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 1: 33%|███▎ | 4088/12384 [8:40:25<17:32:52, 7.61s/it, loss=0.0002, acc=0.9980, iter_time=7.66s]
Epoch 1: 33%|███▎ | 4089/12384 [8:40:25<17:32:37, 7.61s/it, loss=0.0002, acc=0.9980, iter_time=7.66s]
Epoch 1: 33%|███▎ | 4089/12384 [8:40:32<17:32:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 1: 33%|███▎ | 4090/12384 [8:40:32<17:32:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 1: 33%|███▎ | 4090/12384 [8:40:40<17:32:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.11s]
Epoch 1: 33%|███▎ | 4091/12384 [8:40:40<17:31:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.11s]
Epoch 1: 33%|███▎ | 4091/12384 [8:40:47<17:31:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 1: 33%|███▎ | 4092/12384 [8:40:47<17:31:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 1: 33%|███▎ | 4092/12384 [8:40:55<17:31:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.46s]
Epoch 1: 33%|███▎ | 4093/12384 [8:40:55<17:30:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.46s]
Epoch 1: 33%|███▎ | 4093/12384 [8:41:03<17:30:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 1: 33%|███▎ | 4094/12384 [8:41:03<17:32:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 1: 33%|███▎ | 4094/12384 [8:41:10<17:32:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.61s]
Epoch 1: 33%|███▎ | 4095/12384 [8:41:10<17:31:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.61s]
Epoch 1: 33%|███▎ | 4095/12384 [8:41:18<17:31:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.32s]
Epoch 1: 33%|███▎ | 4096/12384 [8:41:18<17:31:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.32s]
Epoch 1: 33%|███▎ | 4096/12384 [8:41:25<17:31:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 33%|███▎ | 4097/12384 [8:41:25<17:31:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 33%|███▎ | 4097/12384 [8:41:33<17:31:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 33%|███▎ | 4098/12384 [8:41:33<17:31:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 33%|███▎ | 4098/12384 [8:41:41<17:31:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 33%|███▎ | 4099/12384 [8:41:41<17:31:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 33%|███▎ | 4099/12384 [8:41:48<17:31:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 33%|███▎ | 4100/12384 [8:41:48<17:31:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 33%|███▎ | 4100/12384 [8:41:56<17:31:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 33%|███▎ | 4101/12384 [8:41:56<17:31:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 33%|███▎ | 4101/12384 [8:42:04<17:31:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 33%|███▎ | 4102/12384 [8:42:04<17:31:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 33%|███▎ | 4102/12384 [8:42:11<17:31:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 33%|███▎ | 4103/12384 [8:42:11<17:30:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 33%|███▎ | 4103/12384 [8:42:19<17:30:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 33%|███▎ | 4104/12384 [8:42:19<17:30:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 33%|███▎ | 4104/12384 [8:42:26<17:30:51, 7.61s/it, loss=0.0011, acc=0.9990, iter_time=7.22s]
Epoch 1: 33%|███▎ | 4105/12384 [8:42:26<17:31:13, 7.62s/it, loss=0.0011, acc=0.9990, iter_time=7.22s]
Epoch 1: 33%|███▎ | 4105/12384 [8:42:34<17:31:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 33%|███▎ | 4106/12384 [8:42:34<17:43:10, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 33%|███▎ | 4106/12384 [8:42:42<17:43:10, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 33%|███▎ | 4107/12384 [8:42:42<17:39:22, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 33%|███▎ | 4107/12384 [8:42:50<17:39:22, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 1: 33%|███▎ | 4108/12384 [8:42:50<17:36:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 1: 33%|███▎ | 4108/12384 [8:42:57<17:36:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 33%|███▎ | 4109/12384 [8:42:57<17:33:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 33%|███▎ | 4109/12384 [8:43:05<17:33:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.69s]
Epoch 1: 33%|███▎ | 4110/12384 [8:43:05<17:34:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.69s]
Epoch 1: 33%|███▎ | 4110/12384 [8:43:12<17:34:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.61s]
Epoch 1: 33%|███▎ | 4111/12384 [8:43:12<17:33:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.61s]
Epoch 1: 33%|███▎ | 4111/12384 [8:43:20<17:33:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 1: 33%|███▎ | 4112/12384 [8:43:20<17:33:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 1: 33%|███▎ | 4112/12384 [8:43:28<17:33:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 33%|███▎ | 4113/12384 [8:43:28<17:31:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 33%|███▎ | 4113/12384 [8:43:35<17:31:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 33%|███▎ | 4114/12384 [8:43:35<17:30:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 33%|███▎ | 4114/12384 [8:43:43<17:30:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 33%|███▎ | 4115/12384 [8:43:43<17:29:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 33%|███▎ | 4115/12384 [8:43:50<17:29:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 33%|███▎ | 4116/12384 [8:43:51<17:38:21, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 33%|███▎ | 4116/12384 [8:43:58<17:38:21, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.44s]
Epoch 1: 33%|███▎ | 4117/12384 [8:43:58<17:34:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.44s]
Epoch 1: 33%|███▎ | 4117/12384 [8:44:06<17:34:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 33%|███▎ | 4118/12384 [8:44:06<17:32:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 33%|███▎ | 4118/12384 [8:44:13<17:32:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 1: 33%|███▎ | 4119/12384 [8:44:13<17:30:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 1: 33%|███▎ | 4119/12384 [8:44:21<17:30:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 1: 33%|███▎ | 4120/12384 [8:44:21<17:42:17, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 1: 33%|███▎ | 4120/12384 [8:44:29<17:42:17, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 1: 33%|███▎ | 4121/12384 [8:44:29<17:37:26, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 1: 33%|███▎ | 4121/12384 [8:44:37<17:37:26, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 1: 33%|███▎ | 4122/12384 [8:44:37<17:34:06, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 1: 33%|███▎ | 4122/12384 [8:44:44<17:34:06, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 33%|███▎ | 4123/12384 [8:44:44<17:31:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 33%|███▎ | 4123/12384 [8:44:52<17:31:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 33%|███▎ | 4124/12384 [8:44:52<17:29:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 33%|███▎ | 4124/12384 [8:44:59<17:29:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 33%|███▎ | 4125/12384 [8:44:59<17:28:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 33%|███▎ | 4125/12384 [8:45:07<17:28:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 1: 33%|███▎ | 4126/12384 [8:45:07<17:28:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 1: 33%|███▎ | 4126/12384 [8:45:15<17:28:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 1: 33%|███▎ | 4127/12384 [8:45:15<17:27:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 1: 33%|███▎ | 4127/12384 [8:45:22<17:27:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 33%|███▎ | 4128/12384 [8:45:22<17:26:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 33%|███▎ | 4128/12384 [8:45:30<17:26:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 33%|███▎ | 4129/12384 [8:45:30<17:27:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 33%|███▎ | 4129/12384 [8:45:37<17:27:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 33%|███▎ | 4130/12384 [8:45:37<17:27:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 33%|███▎ | 4130/12384 [8:45:45<17:27:02, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.31s]
Epoch 1: 33%|███▎ | 4131/12384 [8:45:45<17:26:43, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.31s]
Epoch 1: 33%|███▎ | 4131/12384 [8:45:53<17:26:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 33%|███▎ | 4132/12384 [8:45:53<17:26:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 33%|███▎ | 4132/12384 [8:46:01<17:26:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 1: 33%|███▎ | 4133/12384 [8:46:01<17:37:45, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 1: 33%|███▎ | 4133/12384 [8:46:08<17:37:45, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 33%|███▎ | 4134/12384 [8:46:08<17:34:45, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 33%|███▎ | 4134/12384 [8:46:16<17:34:45, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 1: 33%|███▎ | 4135/12384 [8:46:16<17:32:32, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 1: 33%|███▎ | 4135/12384 [8:46:23<17:32:32, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 33%|███▎ | 4136/12384 [8:46:23<17:31:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 33%|███▎ | 4136/12384 [8:46:31<17:31:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 33%|███▎ | 4137/12384 [8:46:31<17:29:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 33%|███▎ | 4137/12384 [8:46:39<17:29:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.25s]
Epoch 1: 33%|███▎ | 4138/12384 [8:46:39<17:27:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.25s]
Epoch 1: 33%|███▎ | 4138/12384 [8:46:46<17:27:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.92s]
Epoch 1: 33%|███▎ | 4139/12384 [8:46:46<17:25:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.92s]
Epoch 1: 33%|███▎ | 4139/12384 [8:46:54<17:25:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 33%|███▎ | 4140/12384 [8:46:54<17:24:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 33%|███▎ | 4140/12384 [8:47:01<17:24:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 33%|███▎ | 4141/12384 [8:47:01<17:25:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 33%|███▎ | 4141/12384 [8:47:09<17:25:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.14s]
Epoch 1: 33%|███▎ | 4142/12384 [8:47:09<17:25:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.14s]
Epoch 1: 33%|███▎ | 4142/12384 [8:47:17<17:25:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 1: 33%|███▎ | 4143/12384 [8:47:17<17:26:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 1: 33%|███▎ | 4143/12384 [8:47:24<17:26:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 1: 33%|███▎ | 4144/12384 [8:47:24<17:25:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 1: 33%|███▎ | 4144/12384 [8:47:32<17:25:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 33%|███▎ | 4145/12384 [8:47:32<17:28:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 33%|███▎ | 4145/12384 [8:47:40<17:28:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 1: 33%|███▎ | 4146/12384 [8:47:40<17:27:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 1: 33%|███▎ | 4146/12384 [8:47:47<17:27:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 1: 33%|███▎ | 4147/12384 [8:47:47<17:26:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 1: 33%|███▎ | 4147/12384 [8:47:55<17:26:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 1: 33%|███▎ | 4148/12384 [8:47:55<17:25:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 1: 33%|███▎ | 4148/12384 [8:48:02<17:25:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.20s]
Epoch 1: 34%|███▎ | 4149/12384 [8:48:02<17:25:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.20s]
Epoch 1: 34%|███▎ | 4149/12384 [8:48:10<17:25:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.65s]
Epoch 1: 34%|███▎ | 4150/12384 [8:48:10<17:24:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.65s]
Epoch 1: 34%|███▎ | 4150/12384 [8:48:18<17:24:43, 7.61s/it, loss=0.0009, acc=0.9983, iter_time=5.31s]
Epoch 1: 34%|███▎ | 4151/12384 [8:48:18<17:23:37, 7.61s/it, loss=0.0009, acc=0.9983, iter_time=5.31s]
Epoch 1: 34%|███▎ | 4151/12384 [8:48:25<17:23:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.28s]
Epoch 1: 34%|███▎ | 4152/12384 [8:48:25<17:24:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.28s]
Epoch 1: 34%|███▎ | 4152/12384 [8:48:33<17:24:41, 7.61s/it, loss=0.0002, acc=0.9986, iter_time=7.25s]
Epoch 1: 34%|███▎ | 4153/12384 [8:48:33<17:24:47, 7.62s/it, loss=0.0002, acc=0.9986, iter_time=7.25s]
Epoch 1: 34%|███▎ | 4153/12384 [8:48:40<17:24:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.87s]
Epoch 1: 34%|███▎ | 4154/12384 [8:48:40<17:24:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.87s]
Epoch 1: 34%|███▎ | 4154/12384 [8:48:48<17:24:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.03s]
Epoch 1: 34%|███▎ | 4155/12384 [8:48:48<17:24:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.03s]
Epoch 1: 34%|███▎ | 4155/12384 [8:48:56<17:24:45, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.01s]
Epoch 1: 34%|███▎ | 4156/12384 [8:48:56<17:23:47, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.01s]
Epoch 1: 34%|███▎ | 4156/12384 [8:49:03<17:23:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 34%|███▎ | 4157/12384 [8:49:03<17:23:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 34%|███▎ | 4157/12384 [8:49:11<17:23:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 34%|███▎ | 4158/12384 [8:49:11<17:23:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 34%|███▎ | 4158/12384 [8:49:19<17:23:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 34%|███▎ | 4159/12384 [8:49:19<17:37:05, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 34%|███▎ | 4159/12384 [8:49:26<17:37:05, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 1: 34%|███▎ | 4160/12384 [8:49:26<17:32:00, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 1: 34%|███▎ | 4160/12384 [8:49:34<17:32:00, 7.68s/it, loss=0.0014, acc=0.9956, iter_time=7.19s]
Epoch 1: 34%|███▎ | 4161/12384 [8:49:34<17:29:16, 7.66s/it, loss=0.0014, acc=0.9956, iter_time=7.19s]
Epoch 1: 34%|███▎ | 4161/12384 [8:49:42<17:29:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 34%|███▎ | 4162/12384 [8:49:42<17:26:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 34%|███▎ | 4162/12384 [8:49:49<17:26:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 34%|███▎ | 4163/12384 [8:49:49<17:25:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 34%|███▎ | 4163/12384 [8:49:57<17:25:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 34%|███▎ | 4164/12384 [8:49:57<17:25:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 34%|███▎ | 4164/12384 [8:50:04<17:25:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 1: 34%|███▎ | 4165/12384 [8:50:04<17:24:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 1: 34%|███▎ | 4165/12384 [8:50:12<17:24:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.01s]
Epoch 1: 34%|███▎ | 4166/12384 [8:50:12<17:23:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.01s]
Epoch 1: 34%|███▎ | 4166/12384 [8:50:20<17:23:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.28s]
Epoch 1: 34%|███▎ | 4167/12384 [8:50:20<17:22:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.28s]
Epoch 1: 34%|███▎ | 4167/12384 [8:50:27<17:22:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.90s]
Epoch 1: 34%|███▎ | 4168/12384 [8:50:27<17:22:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.90s]
Epoch 1: 34%|███▎ | 4168/12384 [8:50:35<17:22:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 34%|███▎ | 4169/12384 [8:50:35<17:25:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 34%|███▎ | 4169/12384 [8:50:43<17:25:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.96s]
Epoch 1: 34%|███▎ | 4170/12384 [8:50:43<17:24:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.96s]
Epoch 1: 34%|███▎ | 4170/12384 [8:50:50<17:24:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 1: 34%|███▎ | 4171/12384 [8:50:50<17:23:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 1: 34%|███▎ | 4171/12384 [8:50:58<17:23:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.12s]
Epoch 1: 34%|███▎ | 4172/12384 [8:50:58<17:23:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.12s]
Epoch 1: 34%|███▎ | 4172/12384 [8:51:05<17:23:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.09s]
Epoch 1: 34%|███▎ | 4173/12384 [8:51:05<17:22:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.09s]
Epoch 1: 34%|███▎ | 4173/12384 [8:51:13<17:22:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 34%|███▎ | 4174/12384 [8:51:13<17:21:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 34%|███▎ | 4174/12384 [8:51:21<17:21:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 34%|███▎ | 4175/12384 [8:51:21<17:21:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 34%|███▎ | 4175/12384 [8:51:28<17:21:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 34%|███▎ | 4176/12384 [8:51:28<17:21:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 34%|███▎ | 4176/12384 [8:51:36<17:21:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 34%|███▎ | 4177/12384 [8:51:36<17:21:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 34%|███▎ | 4177/12384 [8:51:43<17:21:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 34%|███▎ | 4178/12384 [8:51:43<17:20:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 34%|███▎ | 4178/12384 [8:51:51<17:20:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 34%|███▎ | 4179/12384 [8:51:51<17:19:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 34%|███▎ | 4179/12384 [8:51:59<17:19:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 34%|███▍ | 4180/12384 [8:51:59<17:19:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 34%|███▍ | 4180/12384 [8:52:06<17:19:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 34%|███▍ | 4181/12384 [8:52:06<17:18:29, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 34%|███▍ | 4181/12384 [8:52:14<17:18:29, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 34%|███▍ | 4182/12384 [8:52:14<17:18:42, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 34%|███▍ | 4182/12384 [8:52:21<17:18:42, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 34%|███▍ | 4183/12384 [8:52:21<17:18:52, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 34%|███▍ | 4183/12384 [8:52:29<17:18:52, 7.60s/it, loss=0.0003, acc=0.9999, iter_time=7.98s]
Epoch 1: 34%|███▍ | 4184/12384 [8:52:29<17:19:36, 7.61s/it, loss=0.0003, acc=0.9999, iter_time=7.98s]
Epoch 1: 34%|███▍ | 4184/12384 [8:52:37<17:19:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 34%|███▍ | 4185/12384 [8:52:37<17:31:55, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 34%|███▍ | 4185/12384 [8:52:45<17:31:55, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 34%|███▍ | 4186/12384 [8:52:45<17:28:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 34%|███▍ | 4186/12384 [8:52:52<17:28:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 1: 34%|███▍ | 4187/12384 [8:52:52<17:25:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 1: 34%|███▍ | 4187/12384 [8:53:00<17:25:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 34%|███▍ | 4188/12384 [8:53:00<17:23:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 34%|███▍ | 4188/12384 [8:53:07<17:23:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 34%|███▍ | 4189/12384 [8:53:07<17:21:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 34%|███▍ | 4189/12384 [8:53:15<17:21:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 34%|███▍ | 4190/12384 [8:53:15<17:20:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 34%|███▍ | 4190/12384 [8:53:23<17:20:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 34%|███▍ | 4191/12384 [8:53:23<17:20:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 34%|███▍ | 4191/12384 [8:53:30<17:20:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 34%|███▍ | 4192/12384 [8:53:30<17:19:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 34%|███▍ | 4192/12384 [8:53:38<17:19:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 34%|███▍ | 4193/12384 [8:53:38<17:18:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 34%|███▍ | 4193/12384 [8:53:46<17:18:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 1: 34%|███▍ | 4194/12384 [8:53:46<17:23:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 1: 34%|███▍ | 4194/12384 [8:53:53<17:23:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 1: 34%|███▍ | 4195/12384 [8:53:53<17:25:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 1: 34%|███▍ | 4195/12384 [8:54:01<17:25:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 1: 34%|███▍ | 4196/12384 [8:54:01<17:23:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 1: 34%|███▍ | 4196/12384 [8:54:08<17:23:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 34%|███▍ | 4197/12384 [8:54:08<17:22:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 34%|███▍ | 4197/12384 [8:54:16<17:22:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 34%|███▍ | 4198/12384 [8:54:16<17:21:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 34%|███▍ | 4198/12384 [8:54:24<17:21:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 34%|███▍ | 4199/12384 [8:54:24<17:32:04, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 34%|███▍ | 4199/12384 [8:54:32<17:32:04, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 34%|███▍ | 4200/12384 [8:54:32<17:27:41, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 34%|███▍ | 4200/12384 [8:54:39<17:27:41, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 34%|███▍ | 4201/12384 [8:54:39<17:24:20, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 34%|███▍ | 4201/12384 [8:54:47<17:24:20, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 1: 34%|███▍ | 4202/12384 [8:54:47<17:21:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 1: 34%|███▍ | 4202/12384 [8:54:54<17:21:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 1: 34%|███▍ | 4203/12384 [8:54:54<17:19:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 1: 34%|███▍ | 4203/12384 [8:55:02<17:19:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 1: 34%|███▍ | 4204/12384 [8:55:02<17:18:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 1: 34%|███▍ | 4204/12384 [8:55:10<17:18:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 1: 34%|███▍ | 4205/12384 [8:55:10<17:21:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 1: 34%|███▍ | 4205/12384 [8:55:17<17:21:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 34%|███▍ | 4206/12384 [8:55:17<17:18:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 34%|███▍ | 4206/12384 [8:55:25<17:18:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 1: 34%|███▍ | 4207/12384 [8:55:25<17:17:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 1: 34%|███▍ | 4207/12384 [8:55:32<17:17:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 1: 34%|███▍ | 4208/12384 [8:55:32<17:17:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 1: 34%|███▍ | 4208/12384 [8:55:40<17:17:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 34%|███▍ | 4209/12384 [8:55:40<17:16:10, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 34%|███▍ | 4209/12384 [8:55:48<17:16:10, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 34%|███▍ | 4210/12384 [8:55:48<17:16:02, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 34%|███▍ | 4210/12384 [8:55:56<17:16:02, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 34%|███▍ | 4211/12384 [8:55:56<17:27:56, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 34%|███▍ | 4211/12384 [8:56:03<17:27:56, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.85s]
Epoch 1: 34%|███▍ | 4212/12384 [8:56:03<17:23:57, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.85s]
Epoch 1: 34%|███▍ | 4212/12384 [8:56:11<17:23:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 1: 34%|███▍ | 4213/12384 [8:56:11<17:22:31, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 1: 34%|███▍ | 4213/12384 [8:56:18<17:22:31, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=6.70s]
Epoch 1: 34%|███▍ | 4214/12384 [8:56:18<17:20:27, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.70s]
Epoch 1: 34%|███▍ | 4214/12384 [8:56:26<17:20:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 1: 34%|███▍ | 4215/12384 [8:56:26<17:22:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 1: 34%|███▍ | 4215/12384 [8:56:34<17:22:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.12s]
Epoch 1: 34%|███▍ | 4216/12384 [8:56:34<17:20:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.12s]
Epoch 1: 34%|███▍ | 4216/12384 [8:56:41<17:20:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 34%|███▍ | 4217/12384 [8:56:41<17:23:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 34%|███▍ | 4217/12384 [8:56:49<17:23:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 1: 34%|███▍ | 4218/12384 [8:56:49<17:19:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 1: 34%|███▍ | 4218/12384 [8:56:57<17:19:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 34%|███▍ | 4219/12384 [8:56:57<17:21:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 34%|███▍ | 4219/12384 [8:57:04<17:21:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 34%|███▍ | 4220/12384 [8:57:04<17:19:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 34%|███▍ | 4220/12384 [8:57:12<17:19:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 1: 34%|███▍ | 4221/12384 [8:57:12<17:16:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 1: 34%|███▍ | 4221/12384 [8:57:20<17:16:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 1: 34%|███▍ | 4222/12384 [8:57:20<17:17:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 1: 34%|███▍ | 4222/12384 [8:57:27<17:17:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 34%|███▍ | 4223/12384 [8:57:27<17:17:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 34%|███▍ | 4223/12384 [8:57:35<17:17:31, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.55s]
Epoch 1: 34%|███▍ | 4224/12384 [8:57:35<17:15:44, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.55s]
Epoch 1: 34%|███▍ | 4224/12384 [8:57:43<17:15:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 1: 34%|███▍ | 4225/12384 [8:57:43<17:27:16, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 1: 34%|███▍ | 4225/12384 [8:57:50<17:27:16, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 1: 34%|███▍ | 4226/12384 [8:57:50<17:22:53, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 1: 34%|███▍ | 4226/12384 [8:57:58<17:22:53, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 1: 34%|███▍ | 4227/12384 [8:57:58<17:20:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 1: 34%|███▍ | 4227/12384 [8:58:06<17:20:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 34%|███▍ | 4228/12384 [8:58:06<17:20:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 34%|███▍ | 4228/12384 [8:58:13<17:20:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 1: 34%|███▍ | 4229/12384 [8:58:13<17:17:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 1: 34%|███▍ | 4229/12384 [8:58:21<17:17:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 1: 34%|███▍ | 4230/12384 [8:58:21<17:17:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 1: 34%|███▍ | 4230/12384 [8:58:28<17:17:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 1: 34%|███▍ | 4231/12384 [8:58:28<17:16:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 1: 34%|███▍ | 4231/12384 [8:58:36<17:16:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 34%|███▍ | 4232/12384 [8:58:36<17:14:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 34%|███▍ | 4232/12384 [8:58:44<17:14:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.16s]
Epoch 1: 34%|███▍ | 4233/12384 [8:58:44<17:13:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.16s]
Epoch 1: 34%|███▍ | 4233/12384 [8:58:51<17:13:21, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.64s]
Epoch 1: 34%|███▍ | 4234/12384 [8:58:51<17:13:23, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.64s]
Epoch 1: 34%|███▍ | 4234/12384 [8:58:59<17:13:23, 7.61s/it, loss=0.0002, acc=0.9993, iter_time=7.64s]
Epoch 1: 34%|███▍ | 4235/12384 [8:58:59<17:14:05, 7.61s/it, loss=0.0002, acc=0.9993, iter_time=7.64s]
Epoch 1: 34%|███▍ | 4235/12384 [8:59:06<17:14:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 1: 34%|███▍ | 4236/12384 [8:59:06<17:15:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 1: 34%|███▍ | 4236/12384 [8:59:14<17:15:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 1: 34%|███▍ | 4237/12384 [8:59:14<17:27:22, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 1: 34%|███▍ | 4237/12384 [8:59:22<17:27:22, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 1: 34%|███▍ | 4238/12384 [8:59:22<17:24:21, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 1: 34%|███▍ | 4238/12384 [8:59:30<17:24:21, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 1: 34%|███▍ | 4239/12384 [8:59:30<17:21:14, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 1: 34%|███▍ | 4239/12384 [8:59:37<17:21:14, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.86s]
Epoch 1: 34%|███▍ | 4240/12384 [8:59:37<17:20:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.86s]
Epoch 1: 34%|███▍ | 4240/12384 [8:59:45<17:20:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.43s]
Epoch 1: 34%|███▍ | 4241/12384 [8:59:45<17:18:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.43s]
Epoch 1: 34%|███▍ | 4241/12384 [8:59:52<17:18:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.11s]
Epoch 1: 34%|███▍ | 4242/12384 [8:59:52<17:15:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.11s]
Epoch 1: 34%|███▍ | 4242/12384 [9:00:00<17:15:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 1: 34%|███▍ | 4243/12384 [9:00:00<17:13:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 1: 34%|███▍ | 4243/12384 [9:00:08<17:13:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 34%|███▍ | 4244/12384 [9:00:08<17:12:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 34%|███▍ | 4244/12384 [9:00:15<17:12:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.57s]
Epoch 1: 34%|███▍ | 4245/12384 [9:00:15<17:12:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.57s]
Epoch 1: 34%|███▍ | 4245/12384 [9:00:23<17:12:39, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.65s]
Epoch 1: 34%|███▍ | 4246/12384 [9:00:23<17:13:07, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.65s]
Epoch 1: 34%|███▍ | 4246/12384 [9:00:30<17:13:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 1: 34%|███▍ | 4247/12384 [9:00:30<17:11:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 1: 34%|███▍ | 4247/12384 [9:00:38<17:11:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 1: 34%|███▍ | 4248/12384 [9:00:38<17:11:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 1: 34%|███▍ | 4248/12384 [9:00:46<17:11:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.47s]
Epoch 1: 34%|███▍ | 4249/12384 [9:00:46<17:10:32, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.47s]
Epoch 1: 34%|███▍ | 4249/12384 [9:00:53<17:10:32, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 34%|███▍ | 4250/12384 [9:00:53<17:10:23, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 34%|███▍ | 4250/12384 [9:01:01<17:10:23, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 34%|███▍ | 4251/12384 [9:01:01<17:10:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 34%|███▍ | 4251/12384 [9:01:08<17:10:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.75s]
Epoch 1: 34%|███▍ | 4252/12384 [9:01:08<17:10:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.75s]
Epoch 1: 34%|███▍ | 4252/12384 [9:01:16<17:10:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.44s]
Epoch 1: 34%|███▍ | 4253/12384 [9:01:16<17:10:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.44s]
Epoch 1: 34%|███▍ | 4253/12384 [9:01:24<17:10:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.33s]
Epoch 1: 34%|███▍ | 4254/12384 [9:01:24<17:11:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.33s]
Epoch 1: 34%|███▍ | 4254/12384 [9:01:31<17:11:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 1: 34%|███▍ | 4255/12384 [9:01:31<17:13:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 1: 34%|███▍ | 4255/12384 [9:01:39<17:13:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.27s]
Epoch 1: 34%|███▍ | 4256/12384 [9:01:39<17:14:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.27s]
Epoch 1: 34%|███▍ | 4256/12384 [9:01:47<17:14:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 34%|███▍ | 4257/12384 [9:01:47<17:12:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 34%|███▍ | 4257/12384 [9:01:54<17:12:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 34%|███▍ | 4258/12384 [9:01:54<17:12:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 34%|███▍ | 4258/12384 [9:02:02<17:12:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 1: 34%|███▍ | 4259/12384 [9:02:02<17:10:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 1: 34%|███▍ | 4259/12384 [9:02:09<17:10:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 1: 34%|███▍ | 4260/12384 [9:02:09<17:10:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 1: 34%|███▍ | 4260/12384 [9:02:17<17:10:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 1: 34%|███▍ | 4261/12384 [9:02:17<17:09:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 1: 34%|███▍ | 4261/12384 [9:02:25<17:09:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 1: 34%|███▍ | 4262/12384 [9:02:25<17:09:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 1: 34%|███▍ | 4262/12384 [9:02:32<17:09:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 1: 34%|███▍ | 4263/12384 [9:02:32<17:09:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 1: 34%|███▍ | 4263/12384 [9:02:40<17:09:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.58s]
Epoch 1: 34%|███▍ | 4264/12384 [9:02:40<17:21:41, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.58s]
Epoch 1: 34%|███▍ | 4264/12384 [9:02:48<17:21:41, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.42s]
Epoch 1: 34%|███▍ | 4265/12384 [9:02:48<17:17:14, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.42s]
Epoch 1: 34%|███▍ | 4265/12384 [9:02:55<17:17:14, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 34%|███▍ | 4266/12384 [9:02:55<17:14:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 34%|███▍ | 4266/12384 [9:03:03<17:14:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.47s]
Epoch 1: 34%|███▍ | 4267/12384 [9:03:03<17:12:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.47s]
Epoch 1: 34%|███▍ | 4267/12384 [9:03:11<17:12:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 1: 34%|███▍ | 4268/12384 [9:03:11<17:11:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 1: 34%|███▍ | 4268/12384 [9:03:18<17:11:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 34%|███▍ | 4269/12384 [9:03:18<17:11:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 34%|███▍ | 4269/12384 [9:03:26<17:11:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 1: 34%|███▍ | 4270/12384 [9:03:26<17:10:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 1: 34%|███▍ | 4270/12384 [9:03:33<17:10:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.08s]
Epoch 1: 34%|███▍ | 4271/12384 [9:03:33<17:10:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.08s]
Epoch 1: 34%|███▍ | 4271/12384 [9:03:41<17:10:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 1: 34%|███▍ | 4272/12384 [9:03:41<17:09:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 1: 34%|███▍ | 4272/12384 [9:03:49<17:09:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.13s]
Epoch 1: 35%|███▍ | 4273/12384 [9:03:49<17:10:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.13s]
Epoch 1: 35%|███▍ | 4273/12384 [9:03:56<17:10:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 1: 35%|███▍ | 4274/12384 [9:03:56<17:09:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 1: 35%|███▍ | 4274/12384 [9:04:04<17:09:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 35%|███▍ | 4275/12384 [9:04:04<17:08:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 35%|███▍ | 4275/12384 [9:04:11<17:08:45, 7.61s/it, loss=0.0011, acc=0.9977, iter_time=6.77s]
Epoch 1: 35%|███▍ | 4276/12384 [9:04:11<17:07:00, 7.60s/it, loss=0.0011, acc=0.9977, iter_time=6.77s]
Epoch 1: 35%|███▍ | 4276/12384 [9:04:19<17:07:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.12s]
Epoch 1: 35%|███▍ | 4277/12384 [9:04:19<17:07:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.12s]
Epoch 1: 35%|███▍ | 4277/12384 [9:04:27<17:07:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 1: 35%|███▍ | 4278/12384 [9:04:27<17:19:12, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 1: 35%|███▍ | 4278/12384 [9:04:35<17:19:12, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 35%|███▍ | 4279/12384 [9:04:35<17:15:15, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 35%|███▍ | 4279/12384 [9:04:42<17:15:15, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 35%|███▍ | 4280/12384 [9:04:42<17:13:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 35%|███▍ | 4280/12384 [9:04:50<17:13:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 1: 35%|███▍ | 4281/12384 [9:04:50<17:12:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 1: 35%|███▍ | 4281/12384 [9:04:57<17:12:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 1: 35%|███▍ | 4282/12384 [9:04:57<17:11:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 1: 35%|███▍ | 4282/12384 [9:05:05<17:11:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 1: 35%|███▍ | 4283/12384 [9:05:05<17:10:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 1: 35%|███▍ | 4283/12384 [9:05:13<17:10:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.44s]
Epoch 1: 35%|███▍ | 4284/12384 [9:05:13<17:10:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.44s]
Epoch 1: 35%|███▍ | 4284/12384 [9:05:20<17:10:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 1: 35%|███▍ | 4285/12384 [9:05:20<17:09:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 1: 35%|███▍ | 4285/12384 [9:05:28<17:09:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 35%|███▍ | 4286/12384 [9:05:28<17:09:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 35%|███▍ | 4286/12384 [9:05:35<17:09:24, 7.63s/it, loss=0.0006, acc=0.9996, iter_time=7.62s]
Epoch 1: 35%|███▍ | 4287/12384 [9:05:35<17:08:14, 7.62s/it, loss=0.0006, acc=0.9996, iter_time=7.62s]
Epoch 1: 35%|███▍ | 4287/12384 [9:05:43<17:08:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 35%|███▍ | 4288/12384 [9:05:43<17:07:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 35%|███▍ | 4288/12384 [9:05:51<17:07:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 1: 35%|███▍ | 4289/12384 [9:05:51<17:06:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 1: 35%|███▍ | 4289/12384 [9:05:59<17:06:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 1: 35%|███▍ | 4290/12384 [9:05:59<17:18:54, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 1: 35%|███▍ | 4290/12384 [9:06:06<17:18:54, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 35%|███▍ | 4291/12384 [9:06:06<17:15:05, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 35%|███▍ | 4291/12384 [9:06:14<17:15:05, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 1: 35%|███▍ | 4292/12384 [9:06:14<17:15:22, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 1: 35%|███▍ | 4292/12384 [9:06:22<17:15:22, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.96s]
Epoch 1: 35%|███▍ | 4293/12384 [9:06:22<17:13:12, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.96s]
Epoch 1: 35%|███▍ | 4293/12384 [9:06:29<17:13:12, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 1: 35%|███▍ | 4294/12384 [9:06:29<17:10:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 1: 35%|███▍ | 4294/12384 [9:06:37<17:10:35, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=7.60s]
Epoch 1: 35%|███▍ | 4295/12384 [9:06:37<17:08:54, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.60s]
Epoch 1: 35%|███▍ | 4295/12384 [9:06:44<17:08:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 35%|███▍ | 4296/12384 [9:06:44<17:08:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 35%|███▍ | 4296/12384 [9:06:52<17:08:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.70s]
Epoch 1: 35%|███▍ | 4297/12384 [9:06:52<17:06:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.70s]
Epoch 1: 35%|███▍ | 4297/12384 [9:07:00<17:06:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 35%|███▍ | 4298/12384 [9:07:00<17:05:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 35%|███▍ | 4298/12384 [9:07:07<17:05:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 1: 35%|███▍ | 4299/12384 [9:07:07<17:05:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 1: 35%|███▍ | 4299/12384 [9:07:15<17:05:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.73s]
Epoch 1: 35%|███▍ | 4300/12384 [9:07:15<17:05:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.73s]
Epoch 1: 35%|███▍ | 4300/12384 [9:07:22<17:05:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.49s]
Epoch 1: 35%|███▍ | 4301/12384 [9:07:22<17:05:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.49s]
Epoch 1: 35%|███▍ | 4301/12384 [9:07:30<17:05:25, 7.61s/it, loss=0.0002, acc=0.9998, iter_time=7.62s]
Epoch 1: 35%|███▍ | 4302/12384 [9:07:30<17:06:07, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=7.62s]
Epoch 1: 35%|███▍ | 4302/12384 [9:07:38<17:06:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 35%|███▍ | 4303/12384 [9:07:38<17:05:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 35%|███▍ | 4303/12384 [9:07:46<17:05:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 1: 35%|███▍ | 4304/12384 [9:07:46<17:16:27, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 1: 35%|███▍ | 4304/12384 [9:07:53<17:16:27, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 35%|███▍ | 4305/12384 [9:07:53<17:12:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 35%|███▍ | 4305/12384 [9:08:01<17:12:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 35%|███▍ | 4306/12384 [9:08:01<17:09:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 35%|███▍ | 4306/12384 [9:08:08<17:09:40, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 1: 35%|███▍ | 4307/12384 [9:08:08<17:07:13, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 1: 35%|███▍ | 4307/12384 [9:08:16<17:07:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 35%|███▍ | 4308/12384 [9:08:16<17:06:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 35%|███▍ | 4308/12384 [9:08:24<17:06:15, 7.62s/it, loss=0.0017, acc=0.9964, iter_time=7.62s]
Epoch 1: 35%|███▍ | 4309/12384 [9:08:24<17:05:38, 7.62s/it, loss=0.0017, acc=0.9964, iter_time=7.62s]
Epoch 1: 35%|███▍ | 4309/12384 [9:08:31<17:05:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.24s]
Epoch 1: 35%|███▍ | 4310/12384 [9:08:31<17:04:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.24s]
Epoch 1: 35%|███▍ | 4310/12384 [9:08:39<17:04:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 1: 35%|███▍ | 4311/12384 [9:08:39<17:03:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 1: 35%|███▍ | 4311/12384 [9:08:46<17:03:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 35%|███▍ | 4312/12384 [9:08:46<17:03:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 35%|███▍ | 4312/12384 [9:08:54<17:03:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 35%|███▍ | 4313/12384 [9:08:54<17:03:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 35%|███▍ | 4313/12384 [9:09:02<17:03:14, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=7.62s]
Epoch 1: 35%|███▍ | 4314/12384 [9:09:02<17:02:55, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=7.62s]
Epoch 1: 35%|███▍ | 4314/12384 [9:09:09<17:02:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 35%|███▍ | 4315/12384 [9:09:09<17:03:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 35%|███▍ | 4315/12384 [9:09:17<17:03:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 1: 35%|███▍ | 4316/12384 [9:09:17<17:06:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 1: 35%|███▍ | 4316/12384 [9:09:25<17:06:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.62s]
Epoch 1: 35%|███▍ | 4317/12384 [9:09:25<17:18:16, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.62s]
Epoch 1: 35%|███▍ | 4317/12384 [9:09:32<17:18:16, 7.72s/it, loss=0.0001, acc=0.9994, iter_time=8.51s]
Epoch 1: 35%|███▍ | 4318/12384 [9:09:32<17:13:24, 7.69s/it, loss=0.0001, acc=0.9994, iter_time=8.51s]
Epoch 1: 35%|███▍ | 4318/12384 [9:09:40<17:13:24, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 35%|███▍ | 4319/12384 [9:09:40<17:09:39, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 35%|███▍ | 4319/12384 [9:09:48<17:09:39, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 35%|███▍ | 4320/12384 [9:09:48<17:07:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 35%|███▍ | 4320/12384 [9:09:55<17:07:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 35%|███▍ | 4321/12384 [9:09:55<17:07:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 35%|███▍ | 4321/12384 [9:10:03<17:07:43, 7.65s/it, loss=0.0004, acc=1.0000, iter_time=7.69s]
Epoch 1: 35%|███▍ | 4322/12384 [9:10:03<17:06:50, 7.64s/it, loss=0.0004, acc=1.0000, iter_time=7.69s]
Epoch 1: 35%|███▍ | 4322/12384 [9:10:10<17:06:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 35%|███▍ | 4323/12384 [9:10:10<17:05:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 35%|███▍ | 4323/12384 [9:10:18<17:05:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 1: 35%|███▍ | 4324/12384 [9:10:18<17:03:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 1: 35%|███▍ | 4324/12384 [9:10:26<17:03:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 35%|███▍ | 4325/12384 [9:10:26<17:03:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 35%|███▍ | 4325/12384 [9:10:33<17:03:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 1: 35%|███▍ | 4326/12384 [9:10:33<17:03:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 1: 35%|███▍ | 4326/12384 [9:10:41<17:03:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 35%|███▍ | 4327/12384 [9:10:41<17:03:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 35%|███▍ | 4327/12384 [9:10:49<17:03:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 35%|███▍ | 4328/12384 [9:10:49<17:02:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 35%|███▍ | 4328/12384 [9:10:56<17:02:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 1: 35%|███▍ | 4329/12384 [9:10:56<17:01:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 1: 35%|███▍ | 4329/12384 [9:11:04<17:01:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 1: 35%|███▍ | 4330/12384 [9:11:04<17:05:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 1: 35%|███▍ | 4330/12384 [9:11:11<17:05:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 1: 35%|███▍ | 4331/12384 [9:11:11<17:04:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 1: 35%|███▍ | 4331/12384 [9:11:19<17:04:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 1: 35%|███▍ | 4332/12384 [9:11:19<17:04:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 1: 35%|███▍ | 4332/12384 [9:11:27<17:04:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 1: 35%|███▍ | 4333/12384 [9:11:27<17:03:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 1: 35%|███▍ | 4333/12384 [9:11:34<17:03:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 1: 35%|███▍ | 4334/12384 [9:11:34<17:02:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 1: 35%|███▍ | 4334/12384 [9:11:42<17:02:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 35%|███▌ | 4335/12384 [9:11:42<17:01:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 35%|███▌ | 4335/12384 [9:11:50<17:01:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 35%|███▌ | 4336/12384 [9:11:50<17:01:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 35%|███▌ | 4336/12384 [9:11:57<17:01:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.93s]
Epoch 1: 35%|███▌ | 4337/12384 [9:11:57<16:59:51, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.93s]
Epoch 1: 35%|███▌ | 4337/12384 [9:12:05<16:59:51, 7.60s/it, loss=0.0002, acc=1.0000, iter_time=9.90s]
Epoch 1: 35%|███▌ | 4338/12384 [9:12:05<16:59:19, 7.60s/it, loss=0.0002, acc=1.0000, iter_time=9.90s]
Epoch 1: 35%|███▌ | 4338/12384 [9:12:12<16:59:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 35%|███▌ | 4339/12384 [9:12:12<16:59:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 35%|███▌ | 4339/12384 [9:12:20<16:59:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 35%|███▌ | 4340/12384 [9:12:20<16:58:58, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 35%|███▌ | 4340/12384 [9:12:27<16:58:58, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 35%|███▌ | 4341/12384 [9:12:27<16:59:02, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 35%|███▌ | 4341/12384 [9:12:35<16:59:02, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.78s]
Epoch 1: 35%|███▌ | 4342/12384 [9:12:35<16:59:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.78s]
Epoch 1: 35%|███▌ | 4342/12384 [9:12:43<16:59:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.33s]
Epoch 1: 35%|███▌ | 4343/12384 [9:12:43<17:13:51, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.33s]
Epoch 1: 35%|███▌ | 4343/12384 [9:12:51<17:13:51, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=11.44s]
Epoch 1: 35%|███▌ | 4344/12384 [9:12:51<17:10:10, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=11.44s]
Epoch 1: 35%|███▌ | 4344/12384 [9:12:58<17:10:10, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 35%|███▌ | 4345/12384 [9:12:58<17:05:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 35%|███▌ | 4345/12384 [9:13:06<17:05:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 35%|███▌ | 4346/12384 [9:13:06<17:03:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 35%|███▌ | 4346/12384 [9:13:13<17:03:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.53s]
Epoch 1: 35%|███▌ | 4347/12384 [9:13:13<17:01:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.53s]
Epoch 1: 35%|███▌ | 4347/12384 [9:13:21<17:01:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.67s]
Epoch 1: 35%|███▌ | 4348/12384 [9:13:21<17:01:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.67s]
Epoch 1: 35%|███▌ | 4348/12384 [9:13:29<17:01:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 35%|███▌ | 4349/12384 [9:13:29<17:00:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 35%|███▌ | 4349/12384 [9:13:36<17:00:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 35%|███▌ | 4350/12384 [9:13:36<16:59:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 35%|███▌ | 4350/12384 [9:13:44<16:59:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.73s]
Epoch 1: 35%|███▌ | 4351/12384 [9:13:44<16:59:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.73s]
Epoch 1: 35%|███▌ | 4351/12384 [9:13:52<16:59:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.87s]
Epoch 1: 35%|███▌ | 4352/12384 [9:13:52<16:59:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.87s]
Epoch 1: 35%|███▌ | 4352/12384 [9:13:59<16:59:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 35%|███▌ | 4353/12384 [9:13:59<16:59:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 35%|███▌ | 4353/12384 [9:14:07<16:59:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 35%|███▌ | 4354/12384 [9:14:07<16:59:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 35%|███▌ | 4354/12384 [9:14:14<16:59:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 35%|███▌ | 4355/12384 [9:14:14<16:59:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 35%|███▌ | 4355/12384 [9:14:22<16:59:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 35%|███▌ | 4356/12384 [9:14:22<17:10:23, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 35%|███▌ | 4356/12384 [9:14:30<17:10:23, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 35%|███▌ | 4357/12384 [9:14:30<17:07:13, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 35%|███▌ | 4357/12384 [9:14:38<17:07:13, 7.68s/it, loss=0.0001, acc=0.9992, iter_time=6.70s]
Epoch 1: 35%|███▌ | 4358/12384 [9:14:38<17:04:49, 7.66s/it, loss=0.0001, acc=0.9992, iter_time=6.70s]
Epoch 1: 35%|███▌ | 4358/12384 [9:14:45<17:04:49, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 1: 35%|███▌ | 4359/12384 [9:14:45<17:02:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 1: 35%|███▌ | 4359/12384 [9:14:53<17:02:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 35%|███▌ | 4360/12384 [9:14:53<17:01:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 35%|███▌ | 4360/12384 [9:15:00<17:01:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 35%|███▌ | 4361/12384 [9:15:00<16:59:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 35%|███▌ | 4361/12384 [9:15:08<16:59:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 35%|███▌ | 4362/12384 [9:15:08<16:58:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 35%|███▌ | 4362/12384 [9:15:16<16:58:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 35%|███▌ | 4363/12384 [9:15:16<16:57:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 35%|███▌ | 4363/12384 [9:15:23<16:57:34, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=5.86s]
Epoch 1: 35%|███▌ | 4364/12384 [9:15:23<16:56:36, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=5.86s]
Epoch 1: 35%|███▌ | 4364/12384 [9:15:31<16:56:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.31s]
Epoch 1: 35%|███▌ | 4365/12384 [9:15:31<16:56:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.31s]
Epoch 1: 35%|███▌ | 4365/12384 [9:15:38<16:56:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 35%|███▌ | 4366/12384 [9:15:38<16:57:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 35%|███▌ | 4366/12384 [9:15:46<16:57:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.40s]
Epoch 1: 35%|███▌ | 4367/12384 [9:15:46<16:56:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.40s]
Epoch 1: 35%|███▌ | 4367/12384 [9:15:54<16:56:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.78s]
Epoch 1: 35%|███▌ | 4368/12384 [9:15:54<16:56:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.78s]
Epoch 1: 35%|███▌ | 4368/12384 [9:16:02<16:56:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 35%|███▌ | 4369/12384 [9:16:02<17:09:31, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 35%|███▌ | 4369/12384 [9:16:09<17:09:31, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 35%|███▌ | 4370/12384 [9:16:09<17:06:27, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 35%|███▌ | 4370/12384 [9:16:17<17:06:27, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 35%|███▌ | 4371/12384 [9:16:17<17:03:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 35%|███▌ | 4371/12384 [9:16:24<17:03:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 1: 35%|███▌ | 4372/12384 [9:16:24<17:02:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 1: 35%|███▌ | 4372/12384 [9:16:32<17:02:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 35%|███▌ | 4373/12384 [9:16:32<17:00:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 35%|███▌ | 4373/12384 [9:16:40<17:00:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 35%|███▌ | 4374/12384 [9:16:40<16:58:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 35%|███▌ | 4374/12384 [9:16:47<16:58:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 35%|███▌ | 4375/12384 [9:16:47<16:57:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 35%|███▌ | 4375/12384 [9:16:55<16:57:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 35%|███▌ | 4376/12384 [9:16:55<16:57:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 35%|███▌ | 4376/12384 [9:17:02<16:57:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 35%|███▌ | 4377/12384 [9:17:02<16:57:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 35%|███▌ | 4377/12384 [9:17:10<16:57:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 35%|███▌ | 4378/12384 [9:17:10<16:57:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 35%|███▌ | 4378/12384 [9:17:18<16:57:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 1: 35%|███▌ | 4379/12384 [9:17:18<16:56:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 1: 35%|███▌ | 4379/12384 [9:17:25<16:56:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 1: 35%|███▌ | 4380/12384 [9:17:25<16:55:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 1: 35%|███▌ | 4380/12384 [9:17:33<16:55:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 1: 35%|███▌ | 4381/12384 [9:17:33<16:55:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 1: 35%|███▌ | 4381/12384 [9:17:41<16:55:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 1: 35%|███▌ | 4382/12384 [9:17:41<16:55:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 1: 35%|███▌ | 4382/12384 [9:17:48<16:55:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.65s]
Epoch 1: 35%|███▌ | 4383/12384 [9:17:48<16:54:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.65s]
Epoch 1: 35%|███▌ | 4383/12384 [9:17:56<16:54:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 1: 35%|███▌ | 4384/12384 [9:17:56<16:55:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 1: 35%|███▌ | 4384/12384 [9:18:03<16:55:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 35%|███▌ | 4385/12384 [9:18:03<16:55:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 35%|███▌ | 4385/12384 [9:18:11<16:55:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 35%|███▌ | 4386/12384 [9:18:11<16:55:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 35%|███▌ | 4386/12384 [9:18:19<16:55:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 35%|███▌ | 4387/12384 [9:18:19<16:55:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 35%|███▌ | 4387/12384 [9:18:26<16:55:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 1: 35%|███▌ | 4388/12384 [9:18:26<16:55:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 1: 35%|███▌ | 4388/12384 [9:18:34<16:55:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 1: 35%|███▌ | 4389/12384 [9:18:34<16:55:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 1: 35%|███▌ | 4389/12384 [9:18:42<16:55:09, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.35s]
Epoch 1: 35%|███▌ | 4390/12384 [9:18:42<16:56:29, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.35s]
Epoch 1: 35%|███▌ | 4390/12384 [9:18:49<16:56:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 1: 35%|███▌ | 4391/12384 [9:18:49<16:56:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 1: 35%|███▌ | 4391/12384 [9:18:57<16:56:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 35%|███▌ | 4392/12384 [9:18:57<16:59:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 35%|███▌ | 4392/12384 [9:19:04<16:59:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.77s]
Epoch 1: 35%|███▌ | 4393/12384 [9:19:04<16:57:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.77s]
Epoch 1: 35%|███▌ | 4393/12384 [9:19:12<16:57:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 1: 35%|███▌ | 4394/12384 [9:19:12<16:57:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 1: 35%|███▌ | 4394/12384 [9:19:20<16:57:27, 7.64s/it, loss=0.0001, acc=0.9995, iter_time=7.37s]
Epoch 1: 35%|███▌ | 4395/12384 [9:19:20<17:10:52, 7.74s/it, loss=0.0001, acc=0.9995, iter_time=7.37s]
Epoch 1: 35%|███▌ | 4395/12384 [9:19:28<17:10:52, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 1: 35%|███▌ | 4396/12384 [9:19:28<17:05:15, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 1: 35%|███▌ | 4396/12384 [9:19:35<17:05:15, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 36%|███▌ | 4397/12384 [9:19:35<17:01:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 36%|███▌ | 4397/12384 [9:19:43<17:01:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 1: 36%|███▌ | 4398/12384 [9:19:43<16:59:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 1: 36%|███▌ | 4398/12384 [9:19:51<16:59:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 1: 36%|███▌ | 4399/12384 [9:19:51<16:58:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 1: 36%|███▌ | 4399/12384 [9:19:58<16:58:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 36%|███▌ | 4400/12384 [9:19:58<16:56:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 36%|███▌ | 4400/12384 [9:20:06<16:56:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.00s]
Epoch 1: 36%|███▌ | 4401/12384 [9:20:06<16:55:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.00s]
Epoch 1: 36%|███▌ | 4401/12384 [9:20:13<16:55:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.39s]
Epoch 1: 36%|███▌ | 4402/12384 [9:20:13<16:53:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.39s]
Epoch 1: 36%|███▌ | 4402/12384 [9:20:21<16:53:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 1: 36%|███▌ | 4403/12384 [9:20:21<16:51:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 1: 36%|███▌ | 4403/12384 [9:20:29<16:51:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 36%|███▌ | 4404/12384 [9:20:29<16:51:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 36%|███▌ | 4404/12384 [9:20:36<16:51:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.26s]
Epoch 1: 36%|███▌ | 4405/12384 [9:20:36<16:51:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.26s]
Epoch 1: 36%|███▌ | 4405/12384 [9:20:44<16:51:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.11s]
Epoch 1: 36%|███▌ | 4406/12384 [9:20:44<16:50:54, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.11s]
Epoch 1: 36%|███▌ | 4406/12384 [9:20:51<16:50:54, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 1: 36%|███▌ | 4407/12384 [9:20:51<16:50:52, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 1: 36%|███▌ | 4407/12384 [9:20:59<16:50:52, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 36%|███▌ | 4408/12384 [9:20:59<16:51:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 36%|███▌ | 4408/12384 [9:21:07<16:51:46, 7.61s/it, loss=0.0008, acc=0.9975, iter_time=7.27s]
Epoch 1: 36%|███▌ | 4409/12384 [9:21:07<16:55:08, 7.64s/it, loss=0.0008, acc=0.9975, iter_time=7.27s]
Epoch 1: 36%|███▌ | 4409/12384 [9:21:14<16:55:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.56s]
Epoch 1: 36%|███▌ | 4410/12384 [9:21:14<16:54:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.56s]
Epoch 1: 36%|███▌ | 4410/12384 [9:21:22<16:54:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 1: 36%|███▌ | 4411/12384 [9:21:22<16:53:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 1: 36%|███▌ | 4411/12384 [9:21:30<16:53:06, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=6.84s]
Epoch 1: 36%|███▌ | 4412/12384 [9:21:30<16:52:39, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=6.84s]
Epoch 1: 36%|███▌ | 4412/12384 [9:21:37<16:52:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 1: 36%|███▌ | 4413/12384 [9:21:37<16:53:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 1: 36%|███▌ | 4413/12384 [9:21:45<16:53:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 1: 36%|███▌ | 4414/12384 [9:21:45<16:53:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 1: 36%|███▌ | 4414/12384 [9:21:52<16:53:33, 7.63s/it, loss=0.0004, acc=0.9979, iter_time=8.56s]
Epoch 1: 36%|███▌ | 4415/12384 [9:21:52<16:53:02, 7.63s/it, loss=0.0004, acc=0.9979, iter_time=8.56s]
Epoch 1: 36%|███▌ | 4415/12384 [9:22:00<16:53:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.16s]
Epoch 1: 36%|███▌ | 4416/12384 [9:22:00<16:52:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.16s]
Epoch 1: 36%|███▌ | 4416/12384 [9:22:08<16:52:43, 7.63s/it, loss=0.0009, acc=0.9952, iter_time=7.19s]
Epoch 1: 36%|███▌ | 4417/12384 [9:22:08<16:50:58, 7.61s/it, loss=0.0009, acc=0.9952, iter_time=7.19s]
Epoch 1: 36%|███▌ | 4417/12384 [9:22:15<16:50:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 36%|███▌ | 4418/12384 [9:22:15<16:50:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 36%|███▌ | 4418/12384 [9:22:23<16:50:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 36%|███▌ | 4419/12384 [9:22:23<16:49:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 36%|███▌ | 4419/12384 [9:22:30<16:49:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 36%|███▌ | 4420/12384 [9:22:30<16:50:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 36%|███▌ | 4420/12384 [9:22:38<16:50:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.16s]
Epoch 1: 36%|███▌ | 4421/12384 [9:22:38<17:04:13, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.16s]
Epoch 1: 36%|███▌ | 4421/12384 [9:22:46<17:04:13, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 1: 36%|███▌ | 4422/12384 [9:22:46<16:59:48, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 1: 36%|███▌ | 4422/12384 [9:22:54<16:59:48, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 1: 36%|███▌ | 4423/12384 [9:22:54<16:56:17, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 1: 36%|███▌ | 4423/12384 [9:23:01<16:56:17, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.04s]
Epoch 1: 36%|███▌ | 4424/12384 [9:23:01<16:55:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.04s]
Epoch 1: 36%|███▌ | 4424/12384 [9:23:09<16:55:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 36%|███▌ | 4425/12384 [9:23:09<16:53:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 36%|███▌ | 4425/12384 [9:23:16<16:53:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 1: 36%|███▌ | 4426/12384 [9:23:16<16:52:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 1: 36%|███▌ | 4426/12384 [9:23:24<16:52:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 1: 36%|███▌ | 4427/12384 [9:23:24<16:52:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 1: 36%|███▌ | 4427/12384 [9:23:32<16:52:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 36%|███▌ | 4428/12384 [9:23:32<16:51:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 36%|███▌ | 4428/12384 [9:23:39<16:51:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 36%|███▌ | 4429/12384 [9:23:39<16:50:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 36%|███▌ | 4429/12384 [9:23:47<16:50:51, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 36%|███▌ | 4430/12384 [9:23:47<16:50:40, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 36%|███▌ | 4430/12384 [9:23:55<16:50:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 1: 36%|███▌ | 4431/12384 [9:23:55<16:49:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 1: 36%|███▌ | 4431/12384 [9:24:02<16:49:53, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=8.11s]
Epoch 1: 36%|███▌ | 4432/12384 [9:24:02<16:48:06, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=8.11s]
Epoch 1: 36%|███▌ | 4432/12384 [9:24:10<16:48:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 36%|███▌ | 4433/12384 [9:24:10<16:47:43, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 36%|███▌ | 4433/12384 [9:24:17<16:47:43, 7.60s/it, loss=0.0001, acc=0.9996, iter_time=9.11s]
Epoch 1: 36%|███▌ | 4434/12384 [9:24:17<16:48:06, 7.61s/it, loss=0.0001, acc=0.9996, iter_time=9.11s]
Epoch 1: 36%|███▌ | 4434/12384 [9:24:25<16:48:06, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.40s]
Epoch 1: 36%|███▌ | 4435/12384 [9:24:25<16:48:36, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.40s]
Epoch 1: 36%|███▌ | 4435/12384 [9:24:33<16:48:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 1: 36%|███▌ | 4436/12384 [9:24:33<16:58:40, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 1: 36%|███▌ | 4436/12384 [9:24:40<16:58:40, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 36%|███▌ | 4437/12384 [9:24:40<16:55:55, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 36%|███▌ | 4437/12384 [9:24:48<16:55:55, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 1: 36%|███▌ | 4438/12384 [9:24:48<16:53:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 1: 36%|███▌ | 4438/12384 [9:24:56<16:53:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 1: 36%|███▌ | 4439/12384 [9:24:56<16:51:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 1: 36%|███▌ | 4439/12384 [9:25:03<16:51:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 36%|███▌ | 4440/12384 [9:25:03<16:50:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 36%|███▌ | 4440/12384 [9:25:11<16:50:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.98s]
Epoch 1: 36%|███▌ | 4441/12384 [9:25:11<16:48:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.98s]
Epoch 1: 36%|███▌ | 4441/12384 [9:25:19<16:48:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 1: 36%|███▌ | 4442/12384 [9:25:19<16:49:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 1: 36%|███▌ | 4442/12384 [9:25:26<16:49:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 36%|███▌ | 4443/12384 [9:25:26<16:47:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 36%|███▌ | 4443/12384 [9:25:34<16:47:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 36%|███▌ | 4444/12384 [9:25:34<16:47:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 36%|███▌ | 4444/12384 [9:25:41<16:47:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 36%|███▌ | 4445/12384 [9:25:41<16:46:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 36%|███▌ | 4445/12384 [9:25:49<16:46:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 36%|███▌ | 4446/12384 [9:25:49<16:46:02, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 36%|███▌ | 4446/12384 [9:25:57<16:46:02, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 36%|███▌ | 4447/12384 [9:25:57<16:46:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 36%|███▌ | 4447/12384 [9:26:05<16:46:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 1: 36%|███▌ | 4448/12384 [9:26:05<17:00:32, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 1: 36%|███▌ | 4448/12384 [9:26:12<17:00:32, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=4.92s]
Epoch 1: 36%|███▌ | 4449/12384 [9:26:12<16:55:28, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.92s]
Epoch 1: 36%|███▌ | 4449/12384 [9:26:20<16:55:28, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 1: 36%|███▌ | 4450/12384 [9:26:20<16:53:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 1: 36%|███▌ | 4450/12384 [9:26:27<16:53:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 36%|███▌ | 4451/12384 [9:26:27<16:51:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 36%|███▌ | 4451/12384 [9:26:35<16:51:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 36%|███▌ | 4452/12384 [9:26:35<16:49:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 36%|███▌ | 4452/12384 [9:26:43<16:49:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 36%|███▌ | 4453/12384 [9:26:43<16:49:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 36%|███▌ | 4453/12384 [9:26:50<16:49:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 36%|███▌ | 4454/12384 [9:26:50<16:47:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 36%|███▌ | 4454/12384 [9:26:58<16:47:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 36%|███▌ | 4455/12384 [9:26:58<16:48:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 36%|███▌ | 4455/12384 [9:27:05<16:48:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 36%|███▌ | 4456/12384 [9:27:05<16:47:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 36%|███▌ | 4456/12384 [9:27:13<16:47:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 36%|███▌ | 4457/12384 [9:27:13<16:46:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 36%|███▌ | 4457/12384 [9:27:21<16:46:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 36%|███▌ | 4458/12384 [9:27:21<16:46:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 36%|███▌ | 4458/12384 [9:27:28<16:46:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 36%|███▌ | 4459/12384 [9:27:28<16:45:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 36%|███▌ | 4459/12384 [9:27:36<16:45:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 1: 36%|███▌ | 4460/12384 [9:27:36<16:44:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 1: 36%|███▌ | 4460/12384 [9:27:43<16:44:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 1: 36%|███▌ | 4461/12384 [9:27:43<16:43:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 1: 36%|███▌ | 4461/12384 [9:27:51<16:43:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.06s]
Epoch 1: 36%|███▌ | 4462/12384 [9:27:51<16:43:51, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.06s]
Epoch 1: 36%|███▌ | 4462/12384 [9:27:59<16:43:51, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.89s]
Epoch 1: 36%|███▌ | 4463/12384 [9:27:59<16:44:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.89s]
Epoch 1: 36%|███▌ | 4463/12384 [9:28:06<16:44:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 1: 36%|███▌ | 4464/12384 [9:28:06<16:43:45, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 1: 36%|███▌ | 4464/12384 [9:28:14<16:43:45, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.66s]
Epoch 1: 36%|███▌ | 4465/12384 [9:28:14<16:43:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.66s]
Epoch 1: 36%|███▌ | 4465/12384 [9:28:21<16:43:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.99s]
Epoch 1: 36%|███▌ | 4466/12384 [9:28:21<16:42:54, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.99s]
Epoch 1: 36%|███▌ | 4466/12384 [9:28:29<16:42:54, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 36%|███▌ | 4467/12384 [9:28:29<16:42:53, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 36%|███▌ | 4467/12384 [9:28:37<16:42:53, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 1: 36%|███▌ | 4468/12384 [9:28:37<16:42:27, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 1: 36%|███▌ | 4468/12384 [9:28:44<16:42:27, 7.60s/it, loss=0.0001, acc=0.9990, iter_time=9.68s]
Epoch 1: 36%|███▌ | 4469/12384 [9:28:44<16:43:21, 7.61s/it, loss=0.0001, acc=0.9990, iter_time=9.68s]
Epoch 1: 36%|███▌ | 4469/12384 [9:28:52<16:43:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.02s]
Epoch 1: 36%|███▌ | 4470/12384 [9:28:52<16:43:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.02s]
Epoch 1: 36%|███▌ | 4470/12384 [9:29:00<16:43:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.21s]
Epoch 1: 36%|███▌ | 4471/12384 [9:29:00<16:43:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.21s]
Epoch 1: 36%|███▌ | 4471/12384 [9:29:07<16:43:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 36%|███▌ | 4472/12384 [9:29:07<16:45:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 36%|███▌ | 4472/12384 [9:29:15<16:45:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 36%|███▌ | 4473/12384 [9:29:15<16:45:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 36%|███▌ | 4473/12384 [9:29:23<16:45:25, 7.63s/it, loss=0.0006, acc=0.9958, iter_time=6.82s]
Epoch 1: 36%|███▌ | 4474/12384 [9:29:23<16:58:12, 7.72s/it, loss=0.0006, acc=0.9958, iter_time=6.82s]
Epoch 1: 36%|███▌ | 4474/12384 [9:29:30<16:58:12, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.71s]
Epoch 1: 36%|███▌ | 4475/12384 [9:29:30<16:53:44, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.71s]
Epoch 1: 36%|███▌ | 4475/12384 [9:29:38<16:53:44, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 1: 36%|███▌ | 4476/12384 [9:29:38<16:49:58, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 1: 36%|███▌ | 4476/12384 [9:29:46<16:49:58, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 36%|███▌ | 4477/12384 [9:29:46<16:47:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 36%|███▌ | 4477/12384 [9:29:53<16:47:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 36%|███▌ | 4478/12384 [9:29:53<16:46:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 36%|███▌ | 4478/12384 [9:30:01<16:46:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 1: 36%|███▌ | 4479/12384 [9:30:01<16:44:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 1: 36%|███▌ | 4479/12384 [9:30:08<16:44:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 36%|███▌ | 4480/12384 [9:30:08<16:43:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 36%|███▌ | 4480/12384 [9:30:16<16:43:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 36%|███▌ | 4481/12384 [9:30:16<16:42:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 36%|███▌ | 4481/12384 [9:30:24<16:42:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 36%|███▌ | 4482/12384 [9:30:24<16:42:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 36%|███▌ | 4482/12384 [9:30:31<16:42:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 36%|███▌ | 4483/12384 [9:30:31<16:42:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 36%|███▌ | 4483/12384 [9:30:39<16:42:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 36%|███▌ | 4484/12384 [9:30:39<16:42:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 36%|███▌ | 4484/12384 [9:30:46<16:42:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 36%|███▌ | 4485/12384 [9:30:46<16:42:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 36%|███▌ | 4485/12384 [9:30:54<16:42:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 36%|███▌ | 4486/12384 [9:30:54<16:42:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 36%|███▌ | 4486/12384 [9:31:02<16:42:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 1: 36%|███▌ | 4487/12384 [9:31:02<16:41:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 1: 36%|███▌ | 4487/12384 [9:31:09<16:41:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 1: 36%|███▌ | 4488/12384 [9:31:09<16:42:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 1: 36%|███▌ | 4488/12384 [9:31:17<16:42:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 36%|███▌ | 4489/12384 [9:31:17<16:41:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 36%|███▌ | 4489/12384 [9:31:25<16:41:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 1: 36%|███▋ | 4490/12384 [9:31:25<16:41:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 1: 36%|███▋ | 4490/12384 [9:31:32<16:41:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 36%|███▋ | 4491/12384 [9:31:32<16:40:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 36%|███▋ | 4491/12384 [9:31:40<16:40:29, 7.61s/it, loss=0.0003, acc=0.9979, iter_time=7.65s]
Epoch 1: 36%|███▋ | 4492/12384 [9:31:40<16:42:01, 7.62s/it, loss=0.0003, acc=0.9979, iter_time=7.65s]
Epoch 1: 36%|███▋ | 4492/12384 [9:31:47<16:42:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 36%|███▋ | 4493/12384 [9:31:47<16:41:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 36%|███▋ | 4493/12384 [9:31:55<16:41:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 1: 36%|███▋ | 4494/12384 [9:31:55<16:40:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 1: 36%|███▋ | 4494/12384 [9:32:03<16:40:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 1: 36%|███▋ | 4495/12384 [9:32:03<16:40:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 1: 36%|███▋ | 4495/12384 [9:32:10<16:40:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.57s]
Epoch 1: 36%|███▋ | 4496/12384 [9:32:10<16:41:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.57s]
Epoch 1: 36%|███▋ | 4496/12384 [9:32:18<16:41:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 36%|███▋ | 4497/12384 [9:32:18<16:41:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 36%|███▋ | 4497/12384 [9:32:25<16:41:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 1: 36%|███▋ | 4498/12384 [9:32:25<16:40:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 1: 36%|███▋ | 4498/12384 [9:32:33<16:40:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 1: 36%|███▋ | 4499/12384 [9:32:33<16:40:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 1: 36%|███▋ | 4499/12384 [9:32:41<16:40:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 36%|███▋ | 4500/12384 [9:32:41<16:40:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 36%|███▋ | 4500/12384 [9:32:49<16:40:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 36%|███▋ | 4501/12384 [9:32:49<16:54:53, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 36%|███▋ | 4501/12384 [9:32:56<16:54:53, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 36%|███▋ | 4502/12384 [9:32:56<16:50:20, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 36%|███▋ | 4502/12384 [9:33:04<16:50:20, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 36%|███▋ | 4503/12384 [9:33:04<16:46:41, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 36%|███▋ | 4503/12384 [9:33:12<16:46:41, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 36%|███▋ | 4504/12384 [9:33:12<16:46:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 36%|███▋ | 4504/12384 [9:33:19<16:46:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.35s]
Epoch 1: 36%|███▋ | 4505/12384 [9:33:19<16:44:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.35s]
Epoch 1: 36%|███▋ | 4505/12384 [9:33:27<16:44:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 1: 36%|███▋ | 4506/12384 [9:33:27<16:42:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 1: 36%|███▋ | 4506/12384 [9:33:34<16:42:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 36%|███▋ | 4507/12384 [9:33:34<16:42:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 36%|███▋ | 4507/12384 [9:33:42<16:42:58, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=7.62s]
Epoch 1: 36%|███▋ | 4508/12384 [9:33:42<16:41:00, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=7.62s]
Epoch 1: 36%|███▋ | 4508/12384 [9:33:50<16:41:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.24s]
Epoch 1: 36%|███▋ | 4509/12384 [9:33:50<16:40:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.24s]
Epoch 1: 36%|███▋ | 4509/12384 [9:33:57<16:40:26, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.75s]
Epoch 1: 36%|███▋ | 4510/12384 [9:33:57<16:39:33, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.75s]
Epoch 1: 36%|███▋ | 4510/12384 [9:34:05<16:39:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 36%|███▋ | 4511/12384 [9:34:05<16:39:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 36%|███▋ | 4511/12384 [9:34:12<16:39:13, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.85s]
Epoch 1: 36%|███▋ | 4512/12384 [9:34:12<16:39:55, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.85s]
Epoch 1: 36%|███▋ | 4512/12384 [9:34:20<16:39:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 36%|███▋ | 4513/12384 [9:34:20<16:38:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 36%|███▋ | 4513/12384 [9:34:28<16:38:30, 7.61s/it, loss=0.0005, acc=0.9988, iter_time=6.05s]
Epoch 1: 36%|███▋ | 4514/12384 [9:34:28<16:38:32, 7.61s/it, loss=0.0005, acc=0.9988, iter_time=6.05s]
Epoch 1: 36%|███▋ | 4514/12384 [9:34:35<16:38:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 1: 36%|███▋ | 4515/12384 [9:34:35<16:39:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 1: 36%|███▋ | 4515/12384 [9:34:43<16:39:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 36%|███▋ | 4516/12384 [9:34:43<16:38:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 36%|███▋ | 4516/12384 [9:34:51<16:38:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 36%|███▋ | 4517/12384 [9:34:51<16:39:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 36%|███▋ | 4517/12384 [9:34:58<16:39:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.89s]
Epoch 1: 36%|███▋ | 4518/12384 [9:34:58<16:37:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.89s]
Epoch 1: 36%|███▋ | 4518/12384 [9:35:06<16:37:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.33s]
Epoch 1: 36%|███▋ | 4519/12384 [9:35:06<16:37:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.33s]
Epoch 1: 36%|███▋ | 4519/12384 [9:35:13<16:37:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 36%|███▋ | 4520/12384 [9:35:13<16:37:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 36%|███▋ | 4520/12384 [9:35:21<16:37:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.01s]
Epoch 1: 37%|███▋ | 4521/12384 [9:35:21<16:36:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.01s]
Epoch 1: 37%|███▋ | 4521/12384 [9:35:29<16:36:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 37%|███▋ | 4522/12384 [9:35:29<16:37:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 37%|███▋ | 4522/12384 [9:35:36<16:37:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 1: 37%|███▋ | 4523/12384 [9:35:36<16:36:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 1: 37%|███▋ | 4523/12384 [9:35:44<16:36:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 37%|███▋ | 4524/12384 [9:35:44<16:36:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 37%|███▋ | 4524/12384 [9:35:51<16:36:38, 7.61s/it, loss=0.0015, acc=0.9969, iter_time=4.72s]
Epoch 1: 37%|███▋ | 4525/12384 [9:35:51<16:37:25, 7.61s/it, loss=0.0015, acc=0.9969, iter_time=4.72s]
Epoch 1: 37%|███▋ | 4525/12384 [9:35:59<16:37:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 37%|███▋ | 4526/12384 [9:35:59<16:37:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 37%|███▋ | 4526/12384 [9:36:07<16:37:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.94s]
Epoch 1: 37%|███▋ | 4527/12384 [9:36:07<16:50:33, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.94s]
Epoch 1: 37%|███▋ | 4527/12384 [9:36:15<16:50:33, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 1: 37%|███▋ | 4528/12384 [9:36:15<16:46:35, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 1: 37%|███▋ | 4528/12384 [9:36:22<16:46:35, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 37%|███▋ | 4529/12384 [9:36:22<16:42:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 37%|███▋ | 4529/12384 [9:36:30<16:42:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 1: 37%|███▋ | 4530/12384 [9:36:30<16:40:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 1: 37%|███▋ | 4530/12384 [9:36:37<16:40:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.69s]
Epoch 1: 37%|███▋ | 4531/12384 [9:36:37<16:42:52, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.69s]
Epoch 1: 37%|███▋ | 4531/12384 [9:36:45<16:42:52, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 1: 37%|███▋ | 4532/12384 [9:36:45<16:44:51, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 1: 37%|███▋ | 4532/12384 [9:36:53<16:44:51, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.75s]
Epoch 1: 37%|███▋ | 4533/12384 [9:36:53<16:45:50, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.75s]
Epoch 1: 37%|███▋ | 4533/12384 [9:37:01<16:45:50, 7.69s/it, loss=0.0023, acc=0.9978, iter_time=10.26s]
Epoch 1: 37%|███▋ | 4534/12384 [9:37:01<16:43:01, 7.67s/it, loss=0.0023, acc=0.9978, iter_time=10.26s]
Epoch 1: 37%|███▋ | 4534/12384 [9:37:08<16:43:01, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 37%|███▋ | 4535/12384 [9:37:08<16:39:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 37%|███▋ | 4535/12384 [9:37:16<16:39:45, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.54s]
Epoch 1: 37%|███▋ | 4536/12384 [9:37:16<16:38:13, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.54s]
Epoch 1: 37%|███▋ | 4536/12384 [9:37:23<16:38:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.37s]
Epoch 1: 37%|███▋ | 4537/12384 [9:37:23<16:36:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.37s]
Epoch 1: 37%|███▋ | 4537/12384 [9:37:31<16:36:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.88s]
Epoch 1: 37%|███▋ | 4538/12384 [9:37:31<16:37:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.88s]
Epoch 1: 37%|███▋ | 4538/12384 [9:37:39<16:37:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 37%|███▋ | 4539/12384 [9:37:39<16:36:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 37%|███▋ | 4539/12384 [9:37:46<16:36:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 37%|███▋ | 4540/12384 [9:37:46<16:47:33, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 37%|███▋ | 4540/12384 [9:37:54<16:47:33, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 1: 37%|███▋ | 4541/12384 [9:37:54<16:43:14, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 1: 37%|███▋ | 4541/12384 [9:38:02<16:43:14, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 1: 37%|███▋ | 4542/12384 [9:38:02<16:40:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 1: 37%|███▋ | 4542/12384 [9:38:09<16:40:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 1: 37%|███▋ | 4543/12384 [9:38:09<16:38:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 1: 37%|███▋ | 4543/12384 [9:38:17<16:38:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 1: 37%|███▋ | 4544/12384 [9:38:17<16:37:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 1: 37%|███▋ | 4544/12384 [9:38:24<16:37:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.42s]
Epoch 1: 37%|███▋ | 4545/12384 [9:38:24<16:35:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.42s]
Epoch 1: 37%|███▋ | 4545/12384 [9:38:32<16:35:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 1: 37%|███▋ | 4546/12384 [9:38:32<16:34:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 1: 37%|███▋ | 4546/12384 [9:38:40<16:34:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 37%|███▋ | 4547/12384 [9:38:40<16:34:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 37%|███▋ | 4547/12384 [9:38:47<16:34:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 1: 37%|███▋ | 4548/12384 [9:38:47<16:33:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 1: 37%|███▋ | 4548/12384 [9:38:55<16:33:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 1: 37%|███▋ | 4549/12384 [9:38:55<16:36:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 1: 37%|███▋ | 4549/12384 [9:39:03<16:36:30, 7.63s/it, loss=0.0002, acc=0.9983, iter_time=5.06s]
Epoch 1: 37%|███▋ | 4550/12384 [9:39:03<16:34:59, 7.62s/it, loss=0.0002, acc=0.9983, iter_time=5.06s]
Epoch 1: 37%|███▋ | 4550/12384 [9:39:10<16:34:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 1: 37%|███▋ | 4551/12384 [9:39:10<16:33:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 1: 37%|███▋ | 4551/12384 [9:39:18<16:33:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 37%|███▋ | 4552/12384 [9:39:18<16:33:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 37%|███▋ | 4552/12384 [9:39:26<16:33:26, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=7.26s]
Epoch 1: 37%|███▋ | 4553/12384 [9:39:26<16:45:46, 7.71s/it, loss=0.0001, acc=0.9999, iter_time=7.26s]
Epoch 1: 37%|███▋ | 4553/12384 [9:39:33<16:45:46, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 1: 37%|███▋ | 4554/12384 [9:39:33<16:42:51, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 1: 37%|███▋ | 4554/12384 [9:39:41<16:42:51, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.45s]
Epoch 1: 37%|███▋ | 4555/12384 [9:39:41<16:39:15, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.45s]
Epoch 1: 37%|███▋ | 4555/12384 [9:39:49<16:39:15, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 37%|███▋ | 4556/12384 [9:39:49<16:36:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 37%|███▋ | 4556/12384 [9:39:56<16:36:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 37%|███▋ | 4557/12384 [9:39:56<16:35:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 37%|███▋ | 4557/12384 [9:40:04<16:35:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 37%|███▋ | 4558/12384 [9:40:04<16:34:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 37%|███▋ | 4558/12384 [9:40:11<16:34:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 37%|███▋ | 4559/12384 [9:40:11<16:37:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 37%|███▋ | 4559/12384 [9:40:19<16:37:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 1: 37%|███▋ | 4560/12384 [9:40:19<16:35:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 1: 37%|███▋ | 4560/12384 [9:40:27<16:35:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 37%|███▋ | 4561/12384 [9:40:27<16:34:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 37%|███▋ | 4561/12384 [9:40:34<16:34:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 37%|███▋ | 4562/12384 [9:40:34<16:32:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 37%|███▋ | 4562/12384 [9:40:42<16:32:50, 7.62s/it, loss=0.0005, acc=0.9985, iter_time=7.66s]
Epoch 1: 37%|███▋ | 4563/12384 [9:40:42<16:34:29, 7.63s/it, loss=0.0005, acc=0.9985, iter_time=7.66s]
Epoch 1: 37%|███▋ | 4563/12384 [9:40:50<16:34:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 37%|███▋ | 4564/12384 [9:40:50<16:33:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 37%|███▋ | 4564/12384 [9:40:57<16:33:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 1: 37%|███▋ | 4565/12384 [9:40:57<16:32:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 1: 37%|███▋ | 4565/12384 [9:41:05<16:32:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.14s]
Epoch 1: 37%|███▋ | 4566/12384 [9:41:05<16:31:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.14s]
Epoch 1: 37%|███▋ | 4566/12384 [9:41:12<16:31:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.62s]
Epoch 1: 37%|███▋ | 4567/12384 [9:41:12<16:30:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.62s]
Epoch 1: 37%|███▋ | 4567/12384 [9:41:20<16:30:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.58s]
Epoch 1: 37%|███▋ | 4568/12384 [9:41:20<16:31:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.58s]
Epoch 1: 37%|███▋ | 4568/12384 [9:41:28<16:31:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.71s]
Epoch 1: 37%|███▋ | 4569/12384 [9:41:28<16:32:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.71s]
Epoch 1: 37%|███▋ | 4569/12384 [9:41:35<16:32:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.16s]
Epoch 1: 37%|███▋ | 4570/12384 [9:41:35<16:32:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.16s]
Epoch 1: 37%|███▋ | 4570/12384 [9:41:43<16:32:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 1: 37%|███▋ | 4571/12384 [9:41:43<16:32:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 1: 37%|███▋ | 4571/12384 [9:41:50<16:32:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.72s]
Epoch 1: 37%|███▋ | 4572/12384 [9:41:50<16:32:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.72s]
Epoch 1: 37%|███▋ | 4572/12384 [9:41:58<16:32:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 37%|███▋ | 4573/12384 [9:41:58<16:31:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 37%|███▋ | 4573/12384 [9:42:06<16:31:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 37%|███▋ | 4574/12384 [9:42:06<16:30:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 37%|███▋ | 4574/12384 [9:42:13<16:30:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 37%|███▋ | 4575/12384 [9:42:13<16:30:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 37%|███▋ | 4575/12384 [9:42:21<16:30:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.91s]
Epoch 1: 37%|███▋ | 4576/12384 [9:42:21<16:30:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.91s]
Epoch 1: 37%|███▋ | 4576/12384 [9:42:28<16:30:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 37%|███▋ | 4577/12384 [9:42:28<16:30:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 37%|███▋ | 4577/12384 [9:42:36<16:30:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 37%|███▋ | 4578/12384 [9:42:36<16:30:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 37%|███▋ | 4578/12384 [9:42:44<16:30:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 37%|███▋ | 4579/12384 [9:42:44<16:42:50, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 37%|███▋ | 4579/12384 [9:42:52<16:42:50, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=6.59s]
Epoch 1: 37%|███▋ | 4580/12384 [9:42:52<16:38:42, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=6.59s]
Epoch 1: 37%|███▋ | 4580/12384 [9:42:59<16:38:42, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.87s]
Epoch 1: 37%|███▋ | 4581/12384 [9:42:59<16:36:27, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.87s]
Epoch 1: 37%|███▋ | 4581/12384 [9:43:07<16:36:27, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 1: 37%|███▋ | 4582/12384 [9:43:07<16:33:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 1: 37%|███▋ | 4582/12384 [9:43:14<16:33:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 37%|███▋ | 4583/12384 [9:43:14<16:32:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 37%|███▋ | 4583/12384 [9:43:22<16:32:29, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=7.56s]
Epoch 1: 37%|███▋ | 4584/12384 [9:43:22<16:30:38, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=7.56s]
Epoch 1: 37%|███▋ | 4584/12384 [9:43:30<16:30:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 37%|███▋ | 4585/12384 [9:43:30<16:30:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 37%|███▋ | 4585/12384 [9:43:37<16:30:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 37%|███▋ | 4586/12384 [9:43:37<16:30:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 37%|███▋ | 4586/12384 [9:43:45<16:30:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 37%|███▋ | 4587/12384 [9:43:45<16:29:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 37%|███▋ | 4587/12384 [9:43:52<16:29:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 1: 37%|███▋ | 4588/12384 [9:43:52<16:28:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 1: 37%|███▋ | 4588/12384 [9:44:00<16:28:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 37%|███▋ | 4589/12384 [9:44:00<16:28:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 37%|███▋ | 4589/12384 [9:44:08<16:28:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 37%|███▋ | 4590/12384 [9:44:08<16:28:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 37%|███▋ | 4590/12384 [9:44:15<16:28:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 1: 37%|███▋ | 4591/12384 [9:44:15<16:28:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 1: 37%|███▋ | 4591/12384 [9:44:23<16:28:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 1: 37%|███▋ | 4592/12384 [9:44:23<16:29:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 1: 37%|███▋ | 4592/12384 [9:44:31<16:29:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 37%|███▋ | 4593/12384 [9:44:31<16:39:50, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 37%|███▋ | 4593/12384 [9:44:38<16:39:50, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 37%|███▋ | 4594/12384 [9:44:38<16:36:10, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 37%|███▋ | 4594/12384 [9:44:46<16:36:10, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 37%|███▋ | 4595/12384 [9:44:46<16:34:20, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 37%|███▋ | 4595/12384 [9:44:54<16:34:20, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 37%|███▋ | 4596/12384 [9:44:54<16:32:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 37%|███▋ | 4596/12384 [9:45:01<16:32:45, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.91s]
Epoch 1: 37%|███▋ | 4597/12384 [9:45:01<16:30:05, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.91s]
Epoch 1: 37%|███▋ | 4597/12384 [9:45:09<16:30:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 37%|███▋ | 4598/12384 [9:45:09<16:29:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 37%|███▋ | 4598/12384 [9:45:17<16:29:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 1: 37%|███▋ | 4599/12384 [9:45:17<16:28:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 1: 37%|███▋ | 4599/12384 [9:45:24<16:28:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 37%|███▋ | 4600/12384 [9:45:24<16:27:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 37%|███▋ | 4600/12384 [9:45:32<16:27:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 37%|███▋ | 4601/12384 [9:45:32<16:27:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 37%|███▋ | 4601/12384 [9:45:39<16:27:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 37%|███▋ | 4602/12384 [9:45:39<16:27:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 37%|███▋ | 4602/12384 [9:45:47<16:27:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 1: 37%|███▋ | 4603/12384 [9:45:47<16:27:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 1: 37%|███▋ | 4603/12384 [9:45:55<16:27:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.23s]
Epoch 1: 37%|███▋ | 4604/12384 [9:45:55<16:26:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.23s]
Epoch 1: 37%|███▋ | 4604/12384 [9:46:02<16:26:44, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.56s]
Epoch 1: 37%|███▋ | 4605/12384 [9:46:02<16:38:21, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=5.56s]
Epoch 1: 37%|███▋ | 4605/12384 [9:46:10<16:38:21, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.90s]
Epoch 1: 37%|███▋ | 4606/12384 [9:46:10<16:34:47, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.90s]
Epoch 1: 37%|███▋ | 4606/12384 [9:46:18<16:34:47, 7.67s/it, loss=0.0003, acc=0.9980, iter_time=7.64s]
Epoch 1: 37%|███▋ | 4607/12384 [9:46:18<16:36:21, 7.69s/it, loss=0.0003, acc=0.9980, iter_time=7.64s]
Epoch 1: 37%|███▋ | 4607/12384 [9:46:25<16:36:21, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=11.14s]
Epoch 1: 37%|███▋ | 4608/12384 [9:46:25<16:33:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=11.14s]
Epoch 1: 37%|███▋ | 4608/12384 [9:46:33<16:33:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 37%|███▋ | 4609/12384 [9:46:33<16:30:57, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 37%|███▋ | 4609/12384 [9:46:41<16:30:57, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 1: 37%|███▋ | 4610/12384 [9:46:41<16:28:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 1: 37%|███▋ | 4610/12384 [9:46:48<16:28:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 1: 37%|███▋ | 4611/12384 [9:46:48<16:27:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 1: 37%|███▋ | 4611/12384 [9:46:56<16:27:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 37%|███▋ | 4612/12384 [9:46:56<16:26:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 37%|███▋ | 4612/12384 [9:47:03<16:26:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.28s]
Epoch 1: 37%|███▋ | 4613/12384 [9:47:03<16:27:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.28s]
Epoch 1: 37%|███▋ | 4613/12384 [9:47:11<16:27:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.96s]
Epoch 1: 37%|███▋ | 4614/12384 [9:47:11<16:26:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.96s]
Epoch 1: 37%|███▋ | 4614/12384 [9:47:19<16:26:34, 7.62s/it, loss=0.0012, acc=0.9980, iter_time=7.60s]
Epoch 1: 37%|███▋ | 4615/12384 [9:47:19<16:25:48, 7.61s/it, loss=0.0012, acc=0.9980, iter_time=7.60s]
Epoch 1: 37%|███▋ | 4615/12384 [9:47:26<16:25:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 37%|███▋ | 4616/12384 [9:47:26<16:33:10, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 37%|███▋ | 4616/12384 [9:47:34<16:33:10, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 1: 37%|███▋ | 4617/12384 [9:47:34<16:30:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 1: 37%|███▋ | 4617/12384 [9:47:42<16:30:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 1: 37%|███▋ | 4618/12384 [9:47:42<16:28:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 1: 37%|███▋ | 4618/12384 [9:47:49<16:28:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 1: 37%|███▋ | 4619/12384 [9:47:49<16:27:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 1: 37%|███▋ | 4619/12384 [9:47:57<16:27:07, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.90s]
Epoch 1: 37%|███▋ | 4620/12384 [9:47:57<16:36:55, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.90s]
Epoch 1: 37%|███▋ | 4620/12384 [9:48:05<16:36:55, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 1: 37%|███▋ | 4621/12384 [9:48:05<16:33:27, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 1: 37%|███▋ | 4621/12384 [9:48:12<16:33:27, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.58s]
Epoch 1: 37%|███▋ | 4622/12384 [9:48:12<16:30:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.58s]
Epoch 1: 37%|███▋ | 4622/12384 [9:48:20<16:30:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 1: 37%|███▋ | 4623/12384 [9:48:20<16:28:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 1: 37%|███▋ | 4623/12384 [9:48:28<16:28:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.39s]
Epoch 1: 37%|███▋ | 4624/12384 [9:48:28<16:27:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.39s]
Epoch 1: 37%|███▋ | 4624/12384 [9:48:35<16:27:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 37%|███▋ | 4625/12384 [9:48:35<16:27:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 37%|███▋ | 4625/12384 [9:48:43<16:27:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 37%|███▋ | 4626/12384 [9:48:43<16:26:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 37%|███▋ | 4626/12384 [9:48:50<16:26:16, 7.63s/it, loss=0.0001, acc=0.9997, iter_time=5.81s]
Epoch 1: 37%|███▋ | 4627/12384 [9:48:50<16:25:30, 7.62s/it, loss=0.0001, acc=0.9997, iter_time=5.81s]
Epoch 1: 37%|███▋ | 4627/12384 [9:48:58<16:25:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 1: 37%|███▋ | 4628/12384 [9:48:58<16:24:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 1: 37%|███▋ | 4628/12384 [9:49:06<16:24:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.73s]
Epoch 1: 37%|███▋ | 4629/12384 [9:49:06<16:23:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.73s]
Epoch 1: 37%|███▋ | 4629/12384 [9:49:13<16:23:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.76s]
Epoch 1: 37%|███▋ | 4630/12384 [9:49:13<16:22:32, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.76s]
Epoch 1: 37%|███▋ | 4630/12384 [9:49:21<16:22:32, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.46s]
Epoch 1: 37%|███▋ | 4631/12384 [9:49:21<16:21:14, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=6.46s]
Epoch 1: 37%|███▋ | 4631/12384 [9:49:29<16:21:14, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=9.79s]
Epoch 1: 37%|███▋ | 4632/12384 [9:49:29<16:34:42, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.79s]
Epoch 1: 37%|███▋ | 4632/12384 [9:49:36<16:34:42, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.48s]
Epoch 1: 37%|███▋ | 4633/12384 [9:49:36<16:31:11, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.48s]
Epoch 1: 37%|███▋ | 4633/12384 [9:49:44<16:31:11, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 37%|███▋ | 4634/12384 [9:49:44<16:27:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 37%|███▋ | 4634/12384 [9:49:52<16:27:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 37%|███▋ | 4635/12384 [9:49:52<16:26:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 37%|███▋ | 4635/12384 [9:49:59<16:26:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 37%|███▋ | 4636/12384 [9:49:59<16:25:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 37%|███▋ | 4636/12384 [9:50:07<16:25:05, 7.63s/it, loss=0.0003, acc=0.9983, iter_time=7.61s]
Epoch 1: 37%|███▋ | 4637/12384 [9:50:07<16:24:14, 7.62s/it, loss=0.0003, acc=0.9983, iter_time=7.61s]
Epoch 1: 37%|███▋ | 4637/12384 [9:50:14<16:24:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 37%|███▋ | 4638/12384 [9:50:14<16:22:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 37%|███▋ | 4638/12384 [9:50:22<16:22:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 1: 37%|███▋ | 4639/12384 [9:50:22<16:21:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 1: 37%|███▋ | 4639/12384 [9:50:30<16:21:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 1: 37%|███▋ | 4640/12384 [9:50:30<16:21:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 1: 37%|███▋ | 4640/12384 [9:50:37<16:21:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 1: 37%|███▋ | 4641/12384 [9:50:37<16:21:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 1: 37%|███▋ | 4641/12384 [9:50:45<16:21:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 37%|███▋ | 4642/12384 [9:50:45<16:20:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 37%|███▋ | 4642/12384 [9:50:52<16:20:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 37%|███▋ | 4643/12384 [9:50:52<16:20:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 37%|███▋ | 4643/12384 [9:51:00<16:20:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 1: 38%|███▊ | 4644/12384 [9:51:00<16:21:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 1: 38%|███▊ | 4644/12384 [9:51:08<16:21:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 1: 38%|███▊ | 4645/12384 [9:51:08<16:21:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 1: 38%|███▊ | 4645/12384 [9:51:16<16:21:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 38%|███▊ | 4646/12384 [9:51:16<16:32:08, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 38%|███▊ | 4646/12384 [9:51:23<16:32:08, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 38%|███▊ | 4647/12384 [9:51:23<16:29:16, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 38%|███▊ | 4647/12384 [9:51:31<16:29:16, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 38%|███▊ | 4648/12384 [9:51:31<16:27:10, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 38%|███▊ | 4648/12384 [9:51:38<16:27:10, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 38%|███▊ | 4649/12384 [9:51:38<16:24:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 38%|███▊ | 4649/12384 [9:51:46<16:24:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 1: 38%|███▊ | 4650/12384 [9:51:46<16:23:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 1: 38%|███▊ | 4650/12384 [9:51:54<16:23:30, 7.63s/it, loss=0.0002, acc=0.9988, iter_time=8.47s]
Epoch 1: 38%|███▊ | 4651/12384 [9:51:54<16:23:44, 7.63s/it, loss=0.0002, acc=0.9988, iter_time=8.47s]
Epoch 1: 38%|███▊ | 4651/12384 [9:52:01<16:23:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 1: 38%|███▊ | 4652/12384 [9:52:01<16:22:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 1: 38%|███▊ | 4652/12384 [9:52:09<16:22:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 1: 38%|███▊ | 4653/12384 [9:52:09<16:22:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 1: 38%|███▊ | 4653/12384 [9:52:16<16:22:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 1: 38%|███▊ | 4654/12384 [9:52:16<16:21:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 1: 38%|███▊ | 4654/12384 [9:52:24<16:21:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.64s]
Epoch 1: 38%|███▊ | 4655/12384 [9:52:24<16:20:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.64s]
Epoch 1: 38%|███▊ | 4655/12384 [9:52:32<16:20:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.10s]
Epoch 1: 38%|███▊ | 4656/12384 [9:52:32<16:22:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.10s]
Epoch 1: 38%|███▊ | 4656/12384 [9:52:39<16:22:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.69s]
Epoch 1: 38%|███▊ | 4657/12384 [9:52:39<16:21:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.69s]
Epoch 1: 38%|███▊ | 4657/12384 [9:52:47<16:21:48, 7.62s/it, loss=0.0002, acc=0.9988, iter_time=10.24s]
Epoch 1: 38%|███▊ | 4658/12384 [9:52:47<16:32:35, 7.71s/it, loss=0.0002, acc=0.9988, iter_time=10.24s]
Epoch 1: 38%|███▊ | 4658/12384 [9:52:55<16:32:35, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 1: 38%|███▊ | 4659/12384 [9:52:55<16:28:56, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 1: 38%|███▊ | 4659/12384 [9:53:02<16:28:56, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 1: 38%|███▊ | 4660/12384 [9:53:02<16:26:00, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 1: 38%|███▊ | 4660/12384 [9:53:10<16:26:00, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 1: 38%|███▊ | 4661/12384 [9:53:10<16:27:21, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 1: 38%|███▊ | 4661/12384 [9:53:18<16:27:21, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.75s]
Epoch 1: 38%|███▊ | 4662/12384 [9:53:18<16:24:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.75s]
Epoch 1: 38%|███▊ | 4662/12384 [9:53:25<16:24:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 38%|███▊ | 4663/12384 [9:53:25<16:22:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 38%|███▊ | 4663/12384 [9:53:33<16:22:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 38%|███▊ | 4664/12384 [9:53:33<16:21:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 38%|███▊ | 4664/12384 [9:53:41<16:21:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 38%|███▊ | 4665/12384 [9:53:41<16:19:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 38%|███▊ | 4665/12384 [9:53:48<16:19:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 38%|███▊ | 4666/12384 [9:53:48<16:19:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 38%|███▊ | 4666/12384 [9:53:56<16:19:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 38%|███▊ | 4667/12384 [9:53:56<16:19:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 38%|███▊ | 4667/12384 [9:54:03<16:19:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 38%|███▊ | 4668/12384 [9:54:03<16:18:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 38%|███▊ | 4668/12384 [9:54:11<16:18:59, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.29s]
Epoch 1: 38%|███▊ | 4669/12384 [9:54:11<16:17:58, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.29s]
Epoch 1: 38%|███▊ | 4669/12384 [9:54:19<16:17:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 1: 38%|███▊ | 4670/12384 [9:54:19<16:17:04, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 1: 38%|███▊ | 4670/12384 [9:54:26<16:17:04, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 38%|███▊ | 4671/12384 [9:54:26<16:17:27, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 38%|███▊ | 4671/12384 [9:54:34<16:17:27, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 38%|███▊ | 4672/12384 [9:54:34<16:16:54, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 38%|███▊ | 4672/12384 [9:54:42<16:16:54, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.47s]
Epoch 1: 38%|███▊ | 4673/12384 [9:54:42<16:26:49, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.47s]
Epoch 1: 38%|███▊ | 4673/12384 [9:54:49<16:26:49, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 38%|███▊ | 4674/12384 [9:54:49<16:23:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 38%|███▊ | 4674/12384 [9:54:57<16:23:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.26s]
Epoch 1: 38%|███▊ | 4675/12384 [9:54:57<16:23:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.26s]
Epoch 1: 38%|███▊ | 4675/12384 [9:55:05<16:23:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.02s]
Epoch 1: 38%|███▊ | 4676/12384 [9:55:05<16:23:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.02s]
Epoch 1: 38%|███▊ | 4676/12384 [9:55:12<16:23:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 1: 38%|███▊ | 4677/12384 [9:55:12<16:20:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 1: 38%|███▊ | 4677/12384 [9:55:20<16:20:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 1: 38%|███▊ | 4678/12384 [9:55:20<16:20:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 1: 38%|███▊ | 4678/12384 [9:55:27<16:20:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 1: 38%|███▊ | 4679/12384 [9:55:27<16:20:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 1: 38%|███▊ | 4679/12384 [9:55:35<16:20:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 38%|███▊ | 4680/12384 [9:55:35<16:19:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 38%|███▊ | 4680/12384 [9:55:43<16:19:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 1: 38%|███▊ | 4681/12384 [9:55:43<16:17:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 1: 38%|███▊ | 4681/12384 [9:55:50<16:17:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.95s]
Epoch 1: 38%|███▊ | 4682/12384 [9:55:50<16:17:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.95s]
Epoch 1: 38%|███▊ | 4682/12384 [9:55:58<16:17:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 1: 38%|███▊ | 4683/12384 [9:55:58<16:16:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 1: 38%|███▊ | 4683/12384 [9:56:06<16:16:25, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=9.70s]
Epoch 1: 38%|███▊ | 4684/12384 [9:56:06<16:21:15, 7.65s/it, loss=0.0001, acc=0.9998, iter_time=9.70s]
Epoch 1: 38%|███▊ | 4684/12384 [9:56:13<16:21:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.77s]
Epoch 1: 38%|███▊ | 4685/12384 [9:56:13<16:32:21, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.77s]
Epoch 1: 38%|███▊ | 4685/12384 [9:56:21<16:32:21, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 38%|███▊ | 4686/12384 [9:56:21<16:27:28, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 38%|███▊ | 4686/12384 [9:56:29<16:27:28, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 38%|███▊ | 4687/12384 [9:56:29<16:24:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 38%|███▊ | 4687/12384 [9:56:36<16:24:13, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 1: 38%|███▊ | 4688/12384 [9:56:36<16:21:42, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 1: 38%|███▊ | 4688/12384 [9:56:44<16:21:42, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=4.88s]
Epoch 1: 38%|███▊ | 4689/12384 [9:56:44<16:19:46, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=4.88s]
Epoch 1: 38%|███▊ | 4689/12384 [9:56:52<16:19:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.95s]
Epoch 1: 38%|███▊ | 4690/12384 [9:56:52<16:19:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.95s]
Epoch 1: 38%|███▊ | 4690/12384 [9:56:59<16:19:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.37s]
Epoch 1: 38%|███▊ | 4691/12384 [9:56:59<16:17:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.37s]
Epoch 1: 38%|███▊ | 4691/12384 [9:57:07<16:17:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 1: 38%|███▊ | 4692/12384 [9:57:07<16:18:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 1: 38%|███▊ | 4692/12384 [9:57:14<16:18:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 38%|███▊ | 4693/12384 [9:57:14<16:16:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 38%|███▊ | 4693/12384 [9:57:22<16:16:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 1: 38%|███▊ | 4694/12384 [9:57:22<16:16:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 1: 38%|███▊ | 4694/12384 [9:57:30<16:16:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.32s]
Epoch 1: 38%|███▊ | 4695/12384 [9:57:30<16:15:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.32s]
Epoch 1: 38%|███▊ | 4695/12384 [9:57:37<16:15:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 38%|███▊ | 4696/12384 [9:57:37<16:15:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 38%|███▊ | 4696/12384 [9:57:45<16:15:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 1: 38%|███▊ | 4697/12384 [9:57:45<16:15:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 1: 38%|███▊ | 4697/12384 [9:57:53<16:15:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 1: 38%|███▊ | 4698/12384 [9:57:53<16:17:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 1: 38%|███▊ | 4698/12384 [9:58:00<16:17:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.88s]
Epoch 1: 38%|███▊ | 4699/12384 [9:58:00<16:17:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.88s]
Epoch 1: 38%|███▊ | 4699/12384 [9:58:08<16:17:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 38%|███▊ | 4700/12384 [9:58:08<16:16:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 38%|███▊ | 4700/12384 [9:58:15<16:16:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 1: 38%|███▊ | 4701/12384 [9:58:15<16:16:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 1: 38%|███▊ | 4701/12384 [9:58:23<16:16:00, 7.62s/it, loss=0.0011, acc=0.9985, iter_time=9.90s]
Epoch 1: 38%|███▊ | 4702/12384 [9:58:23<16:15:24, 7.62s/it, loss=0.0011, acc=0.9985, iter_time=9.90s]
Epoch 1: 38%|███▊ | 4702/12384 [9:58:31<16:15:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 38%|███▊ | 4703/12384 [9:58:31<16:14:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 38%|███▊ | 4703/12384 [9:58:38<16:14:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 38%|███▊ | 4704/12384 [9:58:38<16:13:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 38%|███▊ | 4704/12384 [9:58:46<16:13:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 1: 38%|███▊ | 4705/12384 [9:58:46<16:15:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 1: 38%|███▊ | 4705/12384 [9:58:53<16:15:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 38%|███▊ | 4706/12384 [9:58:53<16:15:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 38%|███▊ | 4706/12384 [9:59:01<16:15:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.62s]
Epoch 1: 38%|███▊ | 4707/12384 [9:59:01<16:15:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.62s]
Epoch 1: 38%|███▊ | 4707/12384 [9:59:09<16:15:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 1: 38%|███▊ | 4708/12384 [9:59:09<16:15:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 1: 38%|███▊ | 4708/12384 [9:59:16<16:15:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 38%|███▊ | 4709/12384 [9:59:16<16:13:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 38%|███▊ | 4709/12384 [9:59:24<16:13:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.17s]
Epoch 1: 38%|███▊ | 4710/12384 [9:59:24<16:12:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.17s]
Epoch 1: 38%|███▊ | 4710/12384 [9:59:32<16:12:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.92s]
Epoch 1: 38%|███▊ | 4711/12384 [9:59:32<16:25:29, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.92s]
Epoch 1: 38%|███▊ | 4711/12384 [9:59:39<16:25:29, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 1: 38%|███▊ | 4712/12384 [9:59:39<16:22:28, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 1: 38%|███▊ | 4712/12384 [9:59:47<16:22:28, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 38%|███▊ | 4713/12384 [9:59:47<16:19:42, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 38%|███▊ | 4713/12384 [9:59:55<16:19:42, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.52s]
Epoch 1: 38%|███▊ | 4714/12384 [9:59:55<16:16:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.52s]
Epoch 1: 38%|███▊ | 4714/12384 [10:00:02<16:16:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.71s]
Epoch 1: 38%|███▊ | 4715/12384 [10:00:02<16:15:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.71s]
Epoch 1: 38%|███▊ | 4715/12384 [10:00:10<16:15:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 38%|███▊ | 4716/12384 [10:00:10<16:14:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 38%|███▊ | 4716/12384 [10:00:17<16:14:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 38%|███▊ | 4717/12384 [10:00:17<16:12:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 38%|███▊ | 4717/12384 [10:00:25<16:12:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 38%|███▊ | 4718/12384 [10:00:25<16:13:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 38%|███▊ | 4718/12384 [10:00:33<16:13:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 38%|███▊ | 4719/12384 [10:00:33<16:11:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 38%|███▊ | 4719/12384 [10:00:40<16:11:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 38%|███▊ | 4720/12384 [10:00:40<16:11:02, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 38%|███▊ | 4720/12384 [10:00:48<16:11:02, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 38%|███▊ | 4721/12384 [10:00:48<16:10:45, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 38%|███▊ | 4721/12384 [10:00:56<16:10:45, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 38%|███▊ | 4722/12384 [10:00:56<16:14:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 38%|███▊ | 4722/12384 [10:01:03<16:14:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 1: 38%|███▊ | 4723/12384 [10:01:03<16:15:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 1: 38%|███▊ | 4723/12384 [10:01:11<16:15:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 1: 38%|███▊ | 4724/12384 [10:01:11<16:13:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 1: 38%|███▊ | 4724/12384 [10:01:19<16:13:17, 7.62s/it, loss=0.0005, acc=0.9998, iter_time=7.87s]
Epoch 1: 38%|███▊ | 4725/12384 [10:01:19<16:22:31, 7.70s/it, loss=0.0005, acc=0.9998, iter_time=7.87s]
Epoch 1: 38%|███▊ | 4725/12384 [10:01:26<16:22:31, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 38%|███▊ | 4726/12384 [10:01:26<16:19:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 38%|███▊ | 4726/12384 [10:01:34<16:19:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 38%|███▊ | 4727/12384 [10:01:34<16:16:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 38%|███▊ | 4727/12384 [10:01:41<16:16:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 38%|███▊ | 4728/12384 [10:01:41<16:14:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 38%|███▊ | 4728/12384 [10:01:49<16:14:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.62s]
Epoch 1: 38%|███▊ | 4729/12384 [10:01:49<16:13:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.62s]
Epoch 1: 38%|███▊ | 4729/12384 [10:01:57<16:13:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 1: 38%|███▊ | 4730/12384 [10:01:57<16:12:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 1: 38%|███▊ | 4730/12384 [10:02:04<16:12:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 1: 38%|███▊ | 4731/12384 [10:02:04<16:12:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 1: 38%|███▊ | 4731/12384 [10:02:12<16:12:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 1: 38%|███▊ | 4732/12384 [10:02:12<16:11:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 1: 38%|███▊ | 4732/12384 [10:02:20<16:11:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 38%|███▊ | 4733/12384 [10:02:20<16:10:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 38%|███▊ | 4733/12384 [10:02:27<16:10:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 1: 38%|███▊ | 4734/12384 [10:02:27<16:10:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 1: 38%|███▊ | 4734/12384 [10:02:35<16:10:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 1: 38%|███▊ | 4735/12384 [10:02:35<16:09:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 1: 38%|███▊ | 4735/12384 [10:02:42<16:09:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.55s]
Epoch 1: 38%|███▊ | 4736/12384 [10:02:42<16:09:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.55s]
Epoch 1: 38%|███▊ | 4736/12384 [10:02:50<16:09:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 38%|███▊ | 4737/12384 [10:02:50<16:19:14, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 38%|███▊ | 4737/12384 [10:02:58<16:19:14, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.91s]
Epoch 1: 38%|███▊ | 4738/12384 [10:02:58<16:16:50, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.91s]
Epoch 1: 38%|███▊ | 4738/12384 [10:03:05<16:16:50, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 1: 38%|███▊ | 4739/12384 [10:03:05<16:14:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 1: 38%|███▊ | 4739/12384 [10:03:13<16:14:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 1: 38%|███▊ | 4740/12384 [10:03:13<16:13:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 1: 38%|███▊ | 4740/12384 [10:03:21<16:13:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 1: 38%|███▊ | 4741/12384 [10:03:21<16:12:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 1: 38%|███▊ | 4741/12384 [10:03:28<16:12:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 38%|███▊ | 4742/12384 [10:03:28<16:12:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 38%|███▊ | 4742/12384 [10:03:36<16:12:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 38%|███▊ | 4743/12384 [10:03:36<16:10:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 38%|███▊ | 4743/12384 [10:03:44<16:10:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 38%|███▊ | 4744/12384 [10:03:44<16:10:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 38%|███▊ | 4744/12384 [10:03:51<16:10:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 38%|███▊ | 4745/12384 [10:03:51<16:09:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 38%|███▊ | 4745/12384 [10:03:59<16:09:39, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=7.61s]
Epoch 1: 38%|███▊ | 4746/12384 [10:03:59<16:09:27, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=7.61s]
Epoch 1: 38%|███▊ | 4746/12384 [10:04:06<16:09:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 1: 38%|███▊ | 4747/12384 [10:04:06<16:07:43, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 1: 38%|███▊ | 4747/12384 [10:04:14<16:07:43, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 1: 38%|███▊ | 4748/12384 [10:04:14<16:10:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 1: 38%|███▊ | 4748/12384 [10:04:22<16:10:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 38%|███▊ | 4749/12384 [10:04:22<16:10:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 38%|███▊ | 4749/12384 [10:04:29<16:10:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 38%|███▊ | 4750/12384 [10:04:29<16:10:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 38%|███▊ | 4750/12384 [10:04:37<16:10:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 1: 38%|███▊ | 4751/12384 [10:04:37<16:09:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 1: 38%|███▊ | 4751/12384 [10:04:44<16:09:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 1: 38%|███▊ | 4752/12384 [10:04:44<16:08:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 1: 38%|███▊ | 4752/12384 [10:04:52<16:08:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 38%|███▊ | 4753/12384 [10:04:52<16:07:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 38%|███▊ | 4753/12384 [10:05:00<16:07:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 1: 38%|███▊ | 4754/12384 [10:05:00<16:09:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 1: 38%|███▊ | 4754/12384 [10:05:07<16:09:02, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=10.51s]
Epoch 1: 38%|███▊ | 4755/12384 [10:05:07<16:11:43, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=10.51s]
Epoch 1: 38%|███▊ | 4755/12384 [10:05:15<16:11:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 38%|███▊ | 4756/12384 [10:05:15<16:11:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 38%|███▊ | 4756/12384 [10:05:23<16:11:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.46s]
Epoch 1: 38%|███▊ | 4757/12384 [10:05:23<16:09:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.46s]
Epoch 1: 38%|███▊ | 4757/12384 [10:05:31<16:09:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.49s]
Epoch 1: 38%|███▊ | 4758/12384 [10:05:31<16:35:08, 7.83s/it, loss=0.0000, acc=1.0000, iter_time=9.49s]
Epoch 1: 38%|███▊ | 4758/12384 [10:05:39<16:35:08, 7.83s/it, loss=0.0001, acc=0.9994, iter_time=8.20s]
Epoch 1: 38%|███▊ | 4759/12384 [10:05:39<16:49:08, 7.94s/it, loss=0.0001, acc=0.9994, iter_time=8.20s]
Epoch 1: 38%|███▊ | 4759/12384 [10:05:48<16:49:08, 7.94s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 38%|███▊ | 4760/12384 [10:05:48<17:18:04, 8.17s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 38%|███▊ | 4760/12384 [10:05:56<17:18:04, 8.17s/it, loss=0.0001, acc=1.0000, iter_time=4.87s]
Epoch 1: 38%|███▊ | 4761/12384 [10:05:56<17:13:48, 8.14s/it, loss=0.0001, acc=1.0000, iter_time=4.87s]
Epoch 1: 38%|███▊ | 4761/12384 [10:06:04<17:13:48, 8.14s/it, loss=0.0000, acc=1.0000, iter_time=10.43s]
Epoch 1: 38%|███▊ | 4762/12384 [10:06:04<16:54:32, 7.99s/it, loss=0.0000, acc=1.0000, iter_time=10.43s]
Epoch 1: 38%|███▊ | 4762/12384 [10:06:12<16:54:32, 7.99s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 1: 38%|███▊ | 4763/12384 [10:06:12<16:55:58, 8.00s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 1: 38%|███▊ | 4763/12384 [10:06:19<16:55:58, 8.00s/it, loss=0.0004, acc=0.9998, iter_time=8.28s]
Epoch 1: 38%|███▊ | 4764/12384 [10:06:19<16:45:18, 7.92s/it, loss=0.0004, acc=0.9998, iter_time=8.28s]
Epoch 1: 38%|███▊ | 4764/12384 [10:06:27<16:45:18, 7.92s/it, loss=0.0000, acc=1.0000, iter_time=6.54s]
Epoch 1: 38%|███▊ | 4765/12384 [10:06:27<16:47:02, 7.93s/it, loss=0.0000, acc=1.0000, iter_time=6.54s]
Epoch 1: 38%|███▊ | 4765/12384 [10:06:35<16:47:02, 7.93s/it, loss=0.0000, acc=1.0000, iter_time=9.83s]
Epoch 1: 38%|███▊ | 4766/12384 [10:06:35<16:36:03, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=9.83s]
Epoch 1: 38%|███▊ | 4766/12384 [10:06:43<16:36:03, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 38%|███▊ | 4767/12384 [10:06:43<16:29:15, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 38%|███▊ | 4767/12384 [10:06:50<16:29:15, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 39%|███▊ | 4768/12384 [10:06:50<16:24:46, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 39%|███▊ | 4768/12384 [10:06:58<16:24:46, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 39%|███▊ | 4769/12384 [10:06:58<16:20:28, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 39%|███▊ | 4769/12384 [10:07:06<16:20:28, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 39%|███▊ | 4770/12384 [10:07:06<16:15:21, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 39%|███▊ | 4770/12384 [10:07:13<16:15:21, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 1: 39%|███▊ | 4771/12384 [10:07:13<16:13:16, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 1: 39%|███▊ | 4771/12384 [10:07:21<16:13:16, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.44s]
Epoch 1: 39%|███▊ | 4772/12384 [10:07:21<16:14:49, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.44s]
Epoch 1: 39%|███▊ | 4772/12384 [10:07:28<16:14:49, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.02s]
Epoch 1: 39%|███▊ | 4773/12384 [10:07:28<16:11:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.02s]
Epoch 1: 39%|███▊ | 4773/12384 [10:07:36<16:11:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 39%|███▊ | 4774/12384 [10:07:36<16:10:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 39%|███▊ | 4774/12384 [10:07:44<16:10:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 1: 39%|███▊ | 4775/12384 [10:07:44<16:11:49, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 1: 39%|███▊ | 4775/12384 [10:07:51<16:11:49, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 1: 39%|███▊ | 4776/12384 [10:07:51<16:10:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 1: 39%|███▊ | 4776/12384 [10:07:59<16:10:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 39%|███▊ | 4777/12384 [10:07:59<16:21:04, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 39%|███▊ | 4777/12384 [10:08:07<16:21:04, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 39%|███▊ | 4778/12384 [10:08:07<16:16:42, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 39%|███▊ | 4778/12384 [10:08:15<16:16:42, 7.70s/it, loss=0.0002, acc=0.9993, iter_time=4.60s]
Epoch 1: 39%|███▊ | 4779/12384 [10:08:15<16:14:47, 7.69s/it, loss=0.0002, acc=0.9993, iter_time=4.60s]
Epoch 1: 39%|███▊ | 4779/12384 [10:08:22<16:14:47, 7.69s/it, loss=0.0005, acc=0.9973, iter_time=10.70s]
Epoch 1: 39%|███▊ | 4780/12384 [10:08:22<16:14:00, 7.69s/it, loss=0.0005, acc=0.9973, iter_time=10.70s]
Epoch 1: 39%|███▊ | 4780/12384 [10:08:30<16:14:00, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 39%|███▊ | 4781/12384 [10:08:30<16:10:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 39%|███▊ | 4781/12384 [10:08:38<16:10:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 39%|███▊ | 4782/12384 [10:08:38<16:09:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 39%|███▊ | 4782/12384 [10:08:45<16:09:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 39%|███▊ | 4783/12384 [10:08:45<16:08:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 39%|███▊ | 4783/12384 [10:08:53<16:08:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 39%|███▊ | 4784/12384 [10:08:53<16:08:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 39%|███▊ | 4784/12384 [10:09:00<16:08:17, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=5.20s]
Epoch 1: 39%|███▊ | 4785/12384 [10:09:00<16:05:25, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=5.20s]
Epoch 1: 39%|███▊ | 4785/12384 [10:09:08<16:05:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 1: 39%|███▊ | 4786/12384 [10:09:08<16:05:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 1: 39%|███▊ | 4786/12384 [10:09:16<16:05:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 1: 39%|███▊ | 4787/12384 [10:09:16<16:06:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 1: 39%|███▊ | 4787/12384 [10:09:23<16:06:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 1: 39%|███▊ | 4788/12384 [10:09:23<16:04:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 1: 39%|███▊ | 4788/12384 [10:09:31<16:04:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 39%|███▊ | 4789/12384 [10:09:31<16:18:05, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 39%|███▊ | 4789/12384 [10:09:39<16:18:05, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 39%|███▊ | 4790/12384 [10:09:39<16:13:21, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 39%|███▊ | 4790/12384 [10:09:46<16:13:21, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 39%|███▊ | 4791/12384 [10:09:46<16:11:37, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 39%|███▊ | 4791/12384 [10:09:54<16:11:37, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 39%|███▊ | 4792/12384 [10:09:54<16:09:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 39%|███▊ | 4792/12384 [10:10:02<16:09:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.40s]
Epoch 1: 39%|███▊ | 4793/12384 [10:10:02<16:07:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.40s]
Epoch 1: 39%|███▊ | 4793/12384 [10:10:09<16:07:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 1: 39%|███▊ | 4794/12384 [10:10:09<16:05:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 1: 39%|███▊ | 4794/12384 [10:10:17<16:05:52, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=5.57s]
Epoch 1: 39%|███▊ | 4795/12384 [10:10:17<16:04:17, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.57s]
Epoch 1: 39%|███▊ | 4795/12384 [10:10:25<16:04:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 39%|███▊ | 4796/12384 [10:10:25<16:03:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 39%|███▊ | 4796/12384 [10:10:32<16:03:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.42s]
Epoch 1: 39%|███▊ | 4797/12384 [10:10:32<16:02:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.42s]
Epoch 1: 39%|███▊ | 4797/12384 [10:10:40<16:02:39, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.16s]
Epoch 1: 39%|███▊ | 4798/12384 [10:10:40<16:03:08, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.16s]
Epoch 1: 39%|███▊ | 4798/12384 [10:10:47<16:03:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 1: 39%|███▉ | 4799/12384 [10:10:47<16:03:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 1: 39%|███▉ | 4799/12384 [10:10:55<16:03:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 39%|███▉ | 4800/12384 [10:10:55<16:03:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 39%|███▉ | 4800/12384 [10:11:03<16:03:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 39%|███▉ | 4801/12384 [10:11:03<16:02:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 39%|███▉ | 4801/12384 [10:11:10<16:02:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 39%|███▉ | 4802/12384 [10:11:10<16:01:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 39%|███▉ | 4802/12384 [10:11:18<16:01:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 39%|███▉ | 4803/12384 [10:11:18<16:13:07, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 39%|███▉ | 4803/12384 [10:11:26<16:13:07, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 39%|███▉ | 4804/12384 [10:11:26<16:09:28, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 39%|███▉ | 4804/12384 [10:11:33<16:09:28, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 39%|███▉ | 4805/12384 [10:11:33<16:06:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 39%|███▉ | 4805/12384 [10:11:41<16:06:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 1: 39%|███▉ | 4806/12384 [10:11:41<16:05:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 1: 39%|███▉ | 4806/12384 [10:11:49<16:05:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 1: 39%|███▉ | 4807/12384 [10:11:49<16:03:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 1: 39%|███▉ | 4807/12384 [10:11:56<16:03:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 1: 39%|███▉ | 4808/12384 [10:11:56<16:03:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 1: 39%|███▉ | 4808/12384 [10:12:04<16:03:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 1: 39%|███▉ | 4809/12384 [10:12:04<16:01:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 1: 39%|███▉ | 4809/12384 [10:12:11<16:01:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 1: 39%|███▉ | 4810/12384 [10:12:11<16:00:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 1: 39%|███▉ | 4810/12384 [10:12:19<16:00:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 39%|███▉ | 4811/12384 [10:12:19<15:59:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 39%|███▉ | 4811/12384 [10:12:27<15:59:49, 7.60s/it, loss=0.0001, acc=0.9998, iter_time=5.81s]
Epoch 1: 39%|███▉ | 4812/12384 [10:12:27<16:01:58, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=5.81s]
Epoch 1: 39%|███▉ | 4812/12384 [10:12:34<16:01:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.86s]
Epoch 1: 39%|███▉ | 4813/12384 [10:12:34<16:02:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.86s]
Epoch 1: 39%|███▉ | 4813/12384 [10:12:42<16:02:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.27s]
Epoch 1: 39%|███▉ | 4814/12384 [10:12:42<16:02:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.27s]
Epoch 1: 39%|███▉ | 4814/12384 [10:12:50<16:02:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 39%|███▉ | 4815/12384 [10:12:50<16:01:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 39%|███▉ | 4815/12384 [10:12:57<16:01:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.37s]
Epoch 1: 39%|███▉ | 4816/12384 [10:12:57<16:14:30, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.37s]
Epoch 1: 39%|███▉ | 4816/12384 [10:13:05<16:14:30, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=3.91s]
Epoch 1: 39%|███▉ | 4817/12384 [10:13:05<16:11:39, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=3.91s]
Epoch 1: 39%|███▉ | 4817/12384 [10:13:13<16:11:39, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.95s]
Epoch 1: 39%|███▉ | 4818/12384 [10:13:13<16:08:12, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.95s]
Epoch 1: 39%|███▉ | 4818/12384 [10:13:20<16:08:12, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 39%|███▉ | 4819/12384 [10:13:20<16:04:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 39%|███▉ | 4819/12384 [10:13:28<16:04:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 39%|███▉ | 4820/12384 [10:13:28<16:02:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 39%|███▉ | 4820/12384 [10:13:36<16:02:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 39%|███▉ | 4821/12384 [10:13:36<16:01:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 39%|███▉ | 4821/12384 [10:13:43<16:01:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 39%|███▉ | 4822/12384 [10:13:43<16:00:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 39%|███▉ | 4822/12384 [10:13:51<16:00:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 39%|███▉ | 4823/12384 [10:13:51<15:59:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 39%|███▉ | 4823/12384 [10:13:58<15:59:44, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.55s]
Epoch 1: 39%|███▉ | 4824/12384 [10:13:58<15:59:41, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.55s]
Epoch 1: 39%|███▉ | 4824/12384 [10:14:06<15:59:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 39%|███▉ | 4825/12384 [10:14:06<15:59:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 39%|███▉ | 4825/12384 [10:14:14<15:59:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 39%|███▉ | 4826/12384 [10:14:14<15:59:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 39%|███▉ | 4826/12384 [10:14:21<15:59:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 39%|███▉ | 4827/12384 [10:14:21<15:59:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 39%|███▉ | 4827/12384 [10:14:29<15:59:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 1: 39%|███▉ | 4828/12384 [10:14:29<15:59:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 1: 39%|███▉ | 4828/12384 [10:14:37<15:59:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 1: 39%|███▉ | 4829/12384 [10:14:37<16:01:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 1: 39%|███▉ | 4829/12384 [10:14:44<16:01:27, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.98s]
Epoch 1: 39%|███▉ | 4830/12384 [10:14:44<16:11:25, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=7.98s]
Epoch 1: 39%|███▉ | 4830/12384 [10:14:52<16:11:25, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 1: 39%|███▉ | 4831/12384 [10:14:52<16:07:29, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 1: 39%|███▉ | 4831/12384 [10:15:00<16:07:29, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=10.30s]
Epoch 1: 39%|███▉ | 4832/12384 [10:15:00<16:04:38, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=10.30s]
Epoch 1: 39%|███▉ | 4832/12384 [10:15:07<16:04:38, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.78s]
Epoch 1: 39%|███▉ | 4833/12384 [10:15:07<16:01:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.78s]
Epoch 1: 39%|███▉ | 4833/12384 [10:15:15<16:01:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 1: 39%|███▉ | 4834/12384 [10:15:15<16:03:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 1: 39%|███▉ | 4834/12384 [10:15:23<16:03:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.02s]
Epoch 1: 39%|███▉ | 4835/12384 [10:15:23<16:03:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.02s]
Epoch 1: 39%|███▉ | 4835/12384 [10:15:30<16:03:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 39%|███▉ | 4836/12384 [10:15:30<16:01:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 39%|███▉ | 4836/12384 [10:15:38<16:01:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 1: 39%|███▉ | 4837/12384 [10:15:38<16:02:52, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 1: 39%|███▉ | 4837/12384 [10:15:45<16:02:52, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 1: 39%|███▉ | 4838/12384 [10:15:45<16:00:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 1: 39%|███▉ | 4838/12384 [10:15:53<16:00:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 1: 39%|███▉ | 4839/12384 [10:15:53<15:59:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 1: 39%|███▉ | 4839/12384 [10:16:01<15:59:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 39%|███▉ | 4840/12384 [10:16:01<15:58:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 39%|███▉ | 4840/12384 [10:16:08<15:58:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.87s]
Epoch 1: 39%|███▉ | 4841/12384 [10:16:08<15:57:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.87s]
Epoch 1: 39%|███▉ | 4841/12384 [10:16:16<15:57:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.75s]
Epoch 1: 39%|███▉ | 4842/12384 [10:16:16<16:09:06, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.75s]
Epoch 1: 39%|███▉ | 4842/12384 [10:16:24<16:09:06, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 1: 39%|███▉ | 4843/12384 [10:16:24<16:05:03, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 1: 39%|███▉ | 4843/12384 [10:16:31<16:05:03, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 39%|███▉ | 4844/12384 [10:16:31<16:02:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 39%|███▉ | 4844/12384 [10:16:39<16:02:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 39%|███▉ | 4845/12384 [10:16:39<15:59:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 39%|███▉ | 4845/12384 [10:16:47<15:59:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 39%|███▉ | 4846/12384 [10:16:47<15:58:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 39%|███▉ | 4846/12384 [10:16:54<15:58:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 1: 39%|███▉ | 4847/12384 [10:16:54<15:57:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 1: 39%|███▉ | 4847/12384 [10:17:02<15:57:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 1: 39%|███▉ | 4848/12384 [10:17:02<15:58:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 1: 39%|███▉ | 4848/12384 [10:17:10<15:58:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 1: 39%|███▉ | 4849/12384 [10:17:10<15:57:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 1: 39%|███▉ | 4849/12384 [10:17:17<15:57:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 1: 39%|███▉ | 4850/12384 [10:17:17<15:57:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 1: 39%|███▉ | 4850/12384 [10:17:25<15:57:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 1: 39%|███▉ | 4851/12384 [10:17:25<15:56:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 1: 39%|███▉ | 4851/12384 [10:17:32<15:56:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 1: 39%|███▉ | 4852/12384 [10:17:32<15:56:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 1: 39%|███▉ | 4852/12384 [10:17:40<15:56:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 1: 39%|███▉ | 4853/12384 [10:17:40<15:56:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 1: 39%|███▉ | 4853/12384 [10:17:48<15:56:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 1: 39%|███▉ | 4854/12384 [10:17:48<15:55:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 1: 39%|███▉ | 4854/12384 [10:17:55<15:55:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 39%|███▉ | 4855/12384 [10:17:55<15:55:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 39%|███▉ | 4855/12384 [10:18:03<15:55:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 39%|███▉ | 4856/12384 [10:18:03<15:54:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 39%|███▉ | 4856/12384 [10:18:11<15:54:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 1: 39%|███▉ | 4857/12384 [10:18:11<16:05:21, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 1: 39%|███▉ | 4857/12384 [10:18:18<16:05:21, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 39%|███▉ | 4858/12384 [10:18:18<16:02:24, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 39%|███▉ | 4858/12384 [10:18:26<16:02:24, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 39%|███▉ | 4859/12384 [10:18:26<16:00:13, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 39%|███▉ | 4859/12384 [10:18:34<16:00:13, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 1: 39%|███▉ | 4860/12384 [10:18:34<15:57:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 1: 39%|███▉ | 4860/12384 [10:18:41<15:57:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 1: 39%|███▉ | 4861/12384 [10:18:41<15:56:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 1: 39%|███▉ | 4861/12384 [10:18:49<15:56:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 39%|███▉ | 4862/12384 [10:18:49<15:58:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 39%|███▉ | 4862/12384 [10:18:56<15:58:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 39%|███▉ | 4863/12384 [10:18:56<15:57:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 39%|███▉ | 4863/12384 [10:19:04<15:57:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 39%|███▉ | 4864/12384 [10:19:04<15:56:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 39%|███▉ | 4864/12384 [10:19:12<15:56:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.47s]
Epoch 1: 39%|███▉ | 4865/12384 [10:19:12<15:55:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.47s]
Epoch 1: 39%|███▉ | 4865/12384 [10:19:19<15:55:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.74s]
Epoch 1: 39%|███▉ | 4866/12384 [10:19:19<15:54:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.74s]
Epoch 1: 39%|███▉ | 4866/12384 [10:19:27<15:54:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 39%|███▉ | 4867/12384 [10:19:27<15:54:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 39%|███▉ | 4867/12384 [10:19:35<15:54:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 1: 39%|███▉ | 4868/12384 [10:19:35<15:53:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 1: 39%|███▉ | 4868/12384 [10:19:42<15:53:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 39%|███▉ | 4869/12384 [10:19:42<16:05:42, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 39%|███▉ | 4869/12384 [10:19:50<16:05:42, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.44s]
Epoch 1: 39%|███▉ | 4870/12384 [10:19:50<16:01:11, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.44s]
Epoch 1: 39%|███▉ | 4870/12384 [10:19:58<16:01:11, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 1: 39%|███▉ | 4871/12384 [10:19:58<15:58:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 1: 39%|███▉ | 4871/12384 [10:20:05<15:58:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.07s]
Epoch 1: 39%|███▉ | 4872/12384 [10:20:05<15:56:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.07s]
Epoch 1: 39%|███▉ | 4872/12384 [10:20:13<15:56:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 39%|███▉ | 4873/12384 [10:20:13<15:54:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 39%|███▉ | 4873/12384 [10:20:20<15:54:56, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 39%|███▉ | 4874/12384 [10:20:20<15:54:28, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 39%|███▉ | 4874/12384 [10:20:28<15:54:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 39%|███▉ | 4875/12384 [10:20:28<15:54:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 39%|███▉ | 4875/12384 [10:20:36<15:54:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 39%|███▉ | 4876/12384 [10:20:36<15:53:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 39%|███▉ | 4876/12384 [10:20:43<15:53:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 39%|███▉ | 4877/12384 [10:20:43<15:52:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 39%|███▉ | 4877/12384 [10:20:51<15:52:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 39%|███▉ | 4878/12384 [10:20:51<15:52:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 39%|███▉ | 4878/12384 [10:20:59<15:52:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 39%|███▉ | 4879/12384 [10:20:59<15:52:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 39%|███▉ | 4879/12384 [10:21:06<15:52:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 39%|███▉ | 4880/12384 [10:21:06<15:52:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 39%|███▉ | 4880/12384 [10:21:14<15:52:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 39%|███▉ | 4881/12384 [10:21:14<15:52:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 39%|███▉ | 4881/12384 [10:21:21<15:52:32, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 39%|███▉ | 4882/12384 [10:21:21<15:51:43, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 39%|███▉ | 4882/12384 [10:21:29<15:51:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 39%|███▉ | 4883/12384 [10:21:29<16:01:58, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 39%|███▉ | 4883/12384 [10:21:37<16:01:58, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 1: 39%|███▉ | 4884/12384 [10:21:37<15:58:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 1: 39%|███▉ | 4884/12384 [10:21:44<15:58:19, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=9.69s]
Epoch 1: 39%|███▉ | 4885/12384 [10:21:44<15:56:14, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=9.69s]
Epoch 1: 39%|███▉ | 4885/12384 [10:21:52<15:56:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 39%|███▉ | 4886/12384 [10:21:52<15:57:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 39%|███▉ | 4886/12384 [10:22:00<15:57:14, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.69s]
Epoch 1: 39%|███▉ | 4887/12384 [10:22:00<15:55:26, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.69s]
Epoch 1: 39%|███▉ | 4887/12384 [10:22:07<15:55:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 39%|███▉ | 4888/12384 [10:22:07<15:54:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 39%|███▉ | 4888/12384 [10:22:15<15:54:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.37s]
Epoch 1: 39%|███▉ | 4889/12384 [10:22:15<15:53:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.37s]
Epoch 1: 39%|███▉ | 4889/12384 [10:22:23<15:53:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.91s]
Epoch 1: 39%|███▉ | 4890/12384 [10:22:23<15:52:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.91s]
Epoch 1: 39%|███▉ | 4890/12384 [10:22:30<15:52:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 39%|███▉ | 4891/12384 [10:22:30<15:51:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 39%|███▉ | 4891/12384 [10:22:38<15:51:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 40%|███▉ | 4892/12384 [10:22:38<15:51:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 40%|███▉ | 4892/12384 [10:22:46<15:51:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 40%|███▉ | 4893/12384 [10:22:46<15:52:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 40%|███▉ | 4893/12384 [10:22:53<15:52:46, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.96s]
Epoch 1: 40%|███▉ | 4894/12384 [10:22:53<15:51:55, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.96s]
Epoch 1: 40%|███▉ | 4894/12384 [10:23:01<15:51:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 40%|███▉ | 4895/12384 [10:23:01<16:03:24, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 40%|███▉ | 4895/12384 [10:23:09<16:03:24, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=8.28s]
Epoch 1: 40%|███▉ | 4896/12384 [10:23:09<15:59:33, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=8.28s]
Epoch 1: 40%|███▉ | 4896/12384 [10:23:16<15:59:33, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 40%|███▉ | 4897/12384 [10:23:16<15:55:38, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 40%|███▉ | 4897/12384 [10:23:24<15:55:38, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 40%|███▉ | 4898/12384 [10:23:24<15:54:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 40%|███▉ | 4898/12384 [10:23:31<15:54:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 1: 40%|███▉ | 4899/12384 [10:23:31<15:51:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 1: 40%|███▉ | 4899/12384 [10:23:39<15:51:46, 7.63s/it, loss=0.0001, acc=0.9999, iter_time=8.13s]
Epoch 1: 40%|███▉ | 4900/12384 [10:23:39<15:50:11, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=8.13s]
Epoch 1: 40%|███▉ | 4900/12384 [10:23:47<15:50:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 40%|███▉ | 4901/12384 [10:23:47<15:49:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 40%|███▉ | 4901/12384 [10:23:54<15:49:15, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.99s]
Epoch 1: 40%|███▉ | 4902/12384 [10:23:54<15:48:25, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.99s]
Epoch 1: 40%|███▉ | 4902/12384 [10:24:02<15:48:25, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.59s]
Epoch 1: 40%|███▉ | 4903/12384 [10:24:02<15:47:26, 7.60s/it, loss=0.0002, acc=1.0000, iter_time=7.59s]
Epoch 1: 40%|███▉ | 4903/12384 [10:24:09<15:47:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.59s]
Epoch 1: 40%|███▉ | 4904/12384 [10:24:09<15:48:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.59s]
Epoch 1: 40%|███▉ | 4904/12384 [10:24:17<15:48:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 40%|███▉ | 4905/12384 [10:24:17<15:48:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 40%|███▉ | 4905/12384 [10:24:25<15:48:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 40%|███▉ | 4906/12384 [10:24:25<15:48:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 40%|███▉ | 4906/12384 [10:24:32<15:48:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 40%|███▉ | 4907/12384 [10:24:32<15:48:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 40%|███▉ | 4907/12384 [10:24:40<15:48:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 40%|███▉ | 4908/12384 [10:24:40<15:49:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 40%|███▉ | 4908/12384 [10:24:48<15:49:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 40%|███▉ | 4909/12384 [10:24:48<15:58:32, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 40%|███▉ | 4909/12384 [10:24:55<15:58:32, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 40%|███▉ | 4910/12384 [10:24:55<15:54:52, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 40%|███▉ | 4910/12384 [10:25:03<15:54:52, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 40%|███▉ | 4911/12384 [10:25:03<15:52:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 40%|███▉ | 4911/12384 [10:25:11<15:52:37, 7.65s/it, loss=0.0000, acc=0.9999, iter_time=7.99s]
Epoch 1: 40%|███▉ | 4912/12384 [10:25:11<15:51:35, 7.64s/it, loss=0.0000, acc=0.9999, iter_time=7.99s]
Epoch 1: 40%|███▉ | 4912/12384 [10:25:18<15:51:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 40%|███▉ | 4913/12384 [10:25:18<15:49:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 40%|███▉ | 4913/12384 [10:25:26<15:49:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 40%|███▉ | 4914/12384 [10:25:26<15:49:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 40%|███▉ | 4914/12384 [10:25:33<15:49:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 40%|███▉ | 4915/12384 [10:25:33<15:48:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 40%|███▉ | 4915/12384 [10:25:41<15:48:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 40%|███▉ | 4916/12384 [10:25:41<15:48:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 40%|███▉ | 4916/12384 [10:25:49<15:48:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 40%|███▉ | 4917/12384 [10:25:49<15:50:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 40%|███▉ | 4917/12384 [10:25:56<15:50:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 40%|███▉ | 4918/12384 [10:25:56<15:49:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 40%|███▉ | 4918/12384 [10:26:04<15:49:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 40%|███▉ | 4919/12384 [10:26:04<15:47:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 40%|███▉ | 4919/12384 [10:26:12<15:47:58, 7.62s/it, loss=0.0004, acc=0.9973, iter_time=7.61s]
Epoch 1: 40%|███▉ | 4920/12384 [10:26:12<15:50:03, 7.64s/it, loss=0.0004, acc=0.9973, iter_time=7.61s]
Epoch 1: 40%|███▉ | 4920/12384 [10:26:20<15:50:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 40%|███▉ | 4921/12384 [10:26:20<15:59:39, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 40%|███▉ | 4921/12384 [10:26:27<15:59:39, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 1: 40%|███▉ | 4922/12384 [10:26:27<15:57:23, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 1: 40%|███▉ | 4922/12384 [10:26:35<15:57:23, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 1: 40%|███▉ | 4923/12384 [10:26:35<15:54:29, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 1: 40%|███▉ | 4923/12384 [10:26:42<15:54:29, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 1: 40%|███▉ | 4924/12384 [10:26:42<15:53:54, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 1: 40%|███▉ | 4924/12384 [10:26:50<15:53:54, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=7.93s]
Epoch 1: 40%|███▉ | 4925/12384 [10:26:50<15:51:11, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.93s]
Epoch 1: 40%|███▉ | 4925/12384 [10:26:58<15:51:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.24s]
Epoch 1: 40%|███▉ | 4926/12384 [10:26:58<15:49:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.24s]
Epoch 1: 40%|███▉ | 4926/12384 [10:27:05<15:49:16, 7.64s/it, loss=0.0001, acc=0.9996, iter_time=10.99s]
Epoch 1: 40%|███▉ | 4927/12384 [10:27:05<15:48:35, 7.63s/it, loss=0.0001, acc=0.9996, iter_time=10.99s]
Epoch 1: 40%|███▉ | 4927/12384 [10:27:13<15:48:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 40%|███▉ | 4928/12384 [10:27:13<15:48:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 40%|███▉ | 4928/12384 [10:27:21<15:48:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 40%|███▉ | 4929/12384 [10:27:21<15:46:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 40%|███▉ | 4929/12384 [10:27:28<15:46:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 1: 40%|███▉ | 4930/12384 [10:27:28<15:47:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 1: 40%|███▉ | 4930/12384 [10:27:36<15:47:12, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.37s]
Epoch 1: 40%|███▉ | 4931/12384 [10:27:36<15:46:31, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.37s]
Epoch 1: 40%|███▉ | 4931/12384 [10:27:43<15:46:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.67s]
Epoch 1: 40%|███▉ | 4932/12384 [10:27:43<15:46:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.67s]
Epoch 1: 40%|███▉ | 4932/12384 [10:27:51<15:46:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 40%|███▉ | 4933/12384 [10:27:51<15:47:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 40%|███▉ | 4933/12384 [10:27:59<15:47:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 1: 40%|███▉ | 4934/12384 [10:27:59<15:46:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 1: 40%|███▉ | 4934/12384 [10:28:06<15:46:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 1: 40%|███▉ | 4935/12384 [10:28:06<15:45:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 1: 40%|███▉ | 4935/12384 [10:28:14<15:45:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 40%|███▉ | 4936/12384 [10:28:14<15:45:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 40%|███▉ | 4936/12384 [10:28:22<15:45:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 40%|███▉ | 4937/12384 [10:28:22<15:47:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 40%|███▉ | 4937/12384 [10:28:29<15:47:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 1: 40%|███▉ | 4938/12384 [10:28:29<15:46:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 1: 40%|███▉ | 4938/12384 [10:28:37<15:46:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 1: 40%|███▉ | 4939/12384 [10:28:37<15:45:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 1: 40%|███▉ | 4939/12384 [10:28:44<15:45:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 40%|███▉ | 4940/12384 [10:28:44<15:45:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 40%|███▉ | 4940/12384 [10:28:52<15:45:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 40%|███▉ | 4941/12384 [10:28:52<15:45:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 40%|███▉ | 4941/12384 [10:29:00<15:45:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 40%|███▉ | 4942/12384 [10:29:00<15:44:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 40%|███▉ | 4942/12384 [10:29:07<15:44:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 40%|███▉ | 4943/12384 [10:29:07<15:44:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 40%|███▉ | 4943/12384 [10:29:15<15:44:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 40%|███▉ | 4944/12384 [10:29:15<15:44:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 40%|███▉ | 4944/12384 [10:29:23<15:44:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 40%|███▉ | 4945/12384 [10:29:23<15:47:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 40%|███▉ | 4945/12384 [10:29:30<15:47:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 40%|███▉ | 4946/12384 [10:29:30<15:47:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 40%|███▉ | 4946/12384 [10:29:38<15:47:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 40%|███▉ | 4947/12384 [10:29:38<15:57:46, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 40%|███▉ | 4947/12384 [10:29:46<15:57:46, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=4.56s]
Epoch 1: 40%|███▉ | 4948/12384 [10:29:46<15:52:35, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.56s]
Epoch 1: 40%|███▉ | 4948/12384 [10:29:53<15:52:35, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.90s]
Epoch 1: 40%|███▉ | 4949/12384 [10:29:53<15:49:37, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.90s]
Epoch 1: 40%|███▉ | 4949/12384 [10:30:01<15:49:37, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 1: 40%|███▉ | 4950/12384 [10:30:01<15:47:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 1: 40%|███▉ | 4950/12384 [10:30:08<15:47:06, 7.64s/it, loss=0.0006, acc=0.9978, iter_time=9.75s]
Epoch 1: 40%|███▉ | 4951/12384 [10:30:08<15:44:32, 7.62s/it, loss=0.0006, acc=0.9978, iter_time=9.75s]
Epoch 1: 40%|███▉ | 4951/12384 [10:30:16<15:44:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.59s]
Epoch 1: 40%|███▉ | 4952/12384 [10:30:16<15:43:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.59s]
Epoch 1: 40%|███▉ | 4952/12384 [10:30:24<15:43:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 40%|███▉ | 4953/12384 [10:30:24<15:42:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 40%|███▉ | 4953/12384 [10:30:31<15:42:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 40%|████ | 4954/12384 [10:30:31<15:42:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 40%|████ | 4954/12384 [10:30:39<15:42:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 40%|████ | 4955/12384 [10:30:39<15:42:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 40%|████ | 4955/12384 [10:30:47<15:42:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 40%|████ | 4956/12384 [10:30:47<15:42:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 40%|████ | 4956/12384 [10:30:54<15:42:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 40%|████ | 4957/12384 [10:30:54<15:42:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 40%|████ | 4957/12384 [10:31:02<15:42:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 40%|████ | 4958/12384 [10:31:02<15:41:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 40%|████ | 4958/12384 [10:31:09<15:41:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 1: 40%|████ | 4959/12384 [10:31:09<15:41:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 1: 40%|████ | 4959/12384 [10:31:17<15:41:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.35s]
Epoch 1: 40%|████ | 4960/12384 [10:31:17<15:42:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.35s]
Epoch 1: 40%|████ | 4960/12384 [10:31:25<15:42:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 1: 40%|████ | 4961/12384 [10:31:25<15:51:42, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 1: 40%|████ | 4961/12384 [10:31:32<15:51:42, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 40%|████ | 4962/12384 [10:31:32<15:49:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 40%|████ | 4962/12384 [10:31:40<15:49:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 40%|████ | 4963/12384 [10:31:40<15:47:10, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 40%|████ | 4963/12384 [10:31:48<15:47:10, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 40%|████ | 4964/12384 [10:31:48<15:45:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 40%|████ | 4964/12384 [10:31:55<15:45:38, 7.65s/it, loss=0.0007, acc=0.9958, iter_time=7.62s]
Epoch 1: 40%|████ | 4965/12384 [10:31:55<15:43:32, 7.63s/it, loss=0.0007, acc=0.9958, iter_time=7.62s]
Epoch 1: 40%|████ | 4965/12384 [10:32:03<15:43:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 40%|████ | 4966/12384 [10:32:03<15:43:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 40%|████ | 4966/12384 [10:32:11<15:43:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 40%|████ | 4967/12384 [10:32:11<15:41:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 40%|████ | 4967/12384 [10:32:18<15:41:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 40%|████ | 4968/12384 [10:32:18<15:41:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 40%|████ | 4968/12384 [10:32:26<15:41:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.54s]
Epoch 1: 40%|████ | 4969/12384 [10:32:26<15:45:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.54s]
Epoch 1: 40%|████ | 4969/12384 [10:32:34<15:45:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.30s]
Epoch 1: 40%|████ | 4970/12384 [10:32:34<15:46:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.30s]
Epoch 1: 40%|████ | 4970/12384 [10:32:41<15:46:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 1: 40%|████ | 4971/12384 [10:32:41<15:44:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 1: 40%|████ | 4971/12384 [10:32:49<15:44:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 1: 40%|████ | 4972/12384 [10:32:49<15:44:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 1: 40%|████ | 4972/12384 [10:32:57<15:44:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.24s]
Epoch 1: 40%|████ | 4973/12384 [10:32:57<15:56:24, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=10.24s]
Epoch 1: 40%|████ | 4973/12384 [10:33:04<15:56:24, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 40%|████ | 4974/12384 [10:33:04<15:51:25, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 40%|████ | 4974/12384 [10:33:12<15:51:25, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 40%|████ | 4975/12384 [10:33:12<15:48:37, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 40%|████ | 4975/12384 [10:33:20<15:48:37, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 40%|████ | 4976/12384 [10:33:20<15:46:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 40%|████ | 4976/12384 [10:33:27<15:46:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.94s]
Epoch 1: 40%|████ | 4977/12384 [10:33:27<15:44:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.94s]
Epoch 1: 40%|████ | 4977/12384 [10:33:35<15:44:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 1: 40%|████ | 4978/12384 [10:33:35<15:42:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 1: 40%|████ | 4978/12384 [10:33:42<15:42:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.36s]
Epoch 1: 40%|████ | 4979/12384 [10:33:42<15:41:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.36s]
Epoch 1: 40%|████ | 4979/12384 [10:33:50<15:41:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 40%|████ | 4980/12384 [10:33:50<15:40:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 40%|████ | 4980/12384 [10:33:58<15:40:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 40%|████ | 4981/12384 [10:33:58<15:40:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 40%|████ | 4981/12384 [10:34:05<15:40:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 40%|████ | 4982/12384 [10:34:05<15:39:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 40%|████ | 4982/12384 [10:34:13<15:39:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 40%|████ | 4983/12384 [10:34:13<15:38:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 40%|████ | 4983/12384 [10:34:21<15:38:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 40%|████ | 4984/12384 [10:34:21<15:38:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 40%|████ | 4984/12384 [10:34:28<15:38:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 40%|████ | 4985/12384 [10:34:28<15:38:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 40%|████ | 4985/12384 [10:34:36<15:38:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 40%|████ | 4986/12384 [10:34:36<15:38:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 40%|████ | 4986/12384 [10:34:43<15:38:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.93s]
Epoch 1: 40%|████ | 4987/12384 [10:34:43<15:38:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.93s]
Epoch 1: 40%|████ | 4987/12384 [10:34:51<15:38:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 1: 40%|████ | 4988/12384 [10:34:51<15:38:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 1: 40%|████ | 4988/12384 [10:34:59<15:38:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 40%|████ | 4989/12384 [10:34:59<15:38:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 40%|████ | 4989/12384 [10:35:06<15:38:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 40%|████ | 4990/12384 [10:35:06<15:38:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 40%|████ | 4990/12384 [10:35:14<15:38:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 40%|████ | 4991/12384 [10:35:14<15:40:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 40%|████ | 4991/12384 [10:35:21<15:40:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 40%|████ | 4992/12384 [10:35:21<15:39:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 40%|████ | 4992/12384 [10:35:29<15:39:56, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.73s]
Epoch 1: 40%|████ | 4993/12384 [10:35:29<15:41:46, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.73s]
Epoch 1: 40%|████ | 4993/12384 [10:35:37<15:41:46, 7.65s/it, loss=0.0013, acc=0.9951, iter_time=5.51s]
Epoch 1: 40%|████ | 4994/12384 [10:35:37<15:40:33, 7.64s/it, loss=0.0013, acc=0.9951, iter_time=5.51s]
Epoch 1: 40%|████ | 4994/12384 [10:35:44<15:40:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 1: 40%|████ | 4995/12384 [10:35:44<15:39:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 1: 40%|████ | 4995/12384 [10:35:52<15:39:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.04s]
Epoch 1: 40%|████ | 4996/12384 [10:35:52<15:39:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.04s]
Epoch 1: 40%|████ | 4996/12384 [10:36:00<15:39:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.19s]
Epoch 1: 40%|████ | 4997/12384 [10:36:00<15:38:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.19s]
Epoch 1: 40%|████ | 4997/12384 [10:36:07<15:38:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 40%|████ | 4998/12384 [10:36:07<15:38:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 40%|████ | 4998/12384 [10:36:15<15:38:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 40%|████ | 4999/12384 [10:36:15<15:38:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 40%|████ | 4999/12384 [10:36:23<15:38:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 40%|████ | 5000/12384 [10:36:23<15:53:35, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 40%|████ | 5000/12384 [10:36:31<15:53:35, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 40%|████ | 5001/12384 [10:36:31<15:48:29, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 40%|████ | 5001/12384 [10:36:38<15:48:29, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 40%|████ | 5002/12384 [10:36:38<15:44:55, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 40%|████ | 5002/12384 [10:36:46<15:44:55, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 40%|████ | 5003/12384 [10:36:46<15:42:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 40%|████ | 5003/12384 [10:36:53<15:42:33, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.05s]
Epoch 1: 40%|████ | 5004/12384 [10:36:53<15:40:03, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.05s]
Epoch 1: 40%|████ | 5004/12384 [10:37:01<15:40:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 1: 40%|████ | 5005/12384 [10:37:01<15:41:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 1: 40%|████ | 5005/12384 [10:37:09<15:41:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 40%|████ | 5006/12384 [10:37:09<15:39:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 40%|████ | 5006/12384 [10:37:16<15:39:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 1: 40%|████ | 5007/12384 [10:37:16<15:37:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 1: 40%|████ | 5007/12384 [10:37:24<15:37:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.39s]
Epoch 1: 40%|████ | 5008/12384 [10:37:24<15:37:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.39s]
Epoch 1: 40%|████ | 5008/12384 [10:37:32<15:37:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 1: 40%|████ | 5009/12384 [10:37:32<15:36:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 1: 40%|████ | 5009/12384 [10:37:39<15:36:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.05s]
Epoch 1: 40%|████ | 5010/12384 [10:37:39<15:36:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.05s]
Epoch 1: 40%|████ | 5010/12384 [10:37:47<15:36:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 1: 40%|████ | 5011/12384 [10:37:47<15:35:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 1: 40%|████ | 5011/12384 [10:37:54<15:35:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 1: 40%|████ | 5012/12384 [10:37:54<15:35:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 1: 40%|████ | 5012/12384 [10:38:02<15:35:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 40%|████ | 5013/12384 [10:38:02<15:34:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 40%|████ | 5013/12384 [10:38:10<15:34:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 1: 40%|████ | 5014/12384 [10:38:10<15:45:55, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 1: 40%|████ | 5014/12384 [10:38:17<15:45:55, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 40%|████ | 5015/12384 [10:38:17<15:42:00, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 40%|████ | 5015/12384 [10:38:25<15:42:00, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 41%|████ | 5016/12384 [10:38:25<15:40:01, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 41%|████ | 5016/12384 [10:38:33<15:40:01, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 1: 41%|████ | 5017/12384 [10:38:33<15:38:24, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 1: 41%|████ | 5017/12384 [10:38:40<15:38:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 1: 41%|████ | 5018/12384 [10:38:40<15:36:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 1: 41%|████ | 5018/12384 [10:38:48<15:36:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.00s]
Epoch 1: 41%|████ | 5019/12384 [10:38:48<15:36:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.00s]
Epoch 1: 41%|████ | 5019/12384 [10:38:55<15:36:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.41s]
Epoch 1: 41%|████ | 5020/12384 [10:38:55<15:34:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.41s]
Epoch 1: 41%|████ | 5020/12384 [10:39:03<15:34:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 41%|████ | 5021/12384 [10:39:03<15:35:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 41%|████ | 5021/12384 [10:39:11<15:35:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 41%|████ | 5022/12384 [10:39:11<15:34:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 41%|████ | 5022/12384 [10:39:18<15:34:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 41%|████ | 5023/12384 [10:39:18<15:33:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 41%|████ | 5023/12384 [10:39:26<15:33:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 41%|████ | 5024/12384 [10:39:26<15:33:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 41%|████ | 5024/12384 [10:39:34<15:33:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 41%|████ | 5025/12384 [10:39:34<15:32:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 41%|████ | 5025/12384 [10:39:41<15:32:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 41%|████ | 5026/12384 [10:39:41<15:45:47, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 41%|████ | 5026/12384 [10:39:49<15:45:47, 7.71s/it, loss=0.0007, acc=0.9973, iter_time=9.43s]
Epoch 1: 41%|████ | 5027/12384 [10:39:49<15:41:52, 7.68s/it, loss=0.0007, acc=0.9973, iter_time=9.43s]
Epoch 1: 41%|████ | 5027/12384 [10:39:57<15:41:52, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 41%|████ | 5028/12384 [10:39:57<15:41:11, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 41%|████ | 5028/12384 [10:40:04<15:41:11, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 41%|████ | 5029/12384 [10:40:04<15:38:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 41%|████ | 5029/12384 [10:40:12<15:38:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 41%|████ | 5030/12384 [10:40:12<15:36:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 41%|████ | 5030/12384 [10:40:20<15:36:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 41%|████ | 5031/12384 [10:40:20<15:35:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 41%|████ | 5031/12384 [10:40:27<15:35:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 41%|████ | 5032/12384 [10:40:27<15:34:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 41%|████ | 5032/12384 [10:40:35<15:34:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 41%|████ | 5033/12384 [10:40:35<15:33:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 41%|████ | 5033/12384 [10:40:42<15:33:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 41%|████ | 5034/12384 [10:40:42<15:33:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 41%|████ | 5034/12384 [10:40:50<15:33:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.43s]
Epoch 1: 41%|████ | 5035/12384 [10:40:50<15:33:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.43s]
Epoch 1: 41%|████ | 5035/12384 [10:40:58<15:33:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.95s]
Epoch 1: 41%|████ | 5036/12384 [10:40:58<15:31:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.95s]
Epoch 1: 41%|████ | 5036/12384 [10:41:05<15:31:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.41s]
Epoch 1: 41%|████ | 5037/12384 [10:41:05<15:30:59, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.41s]
Epoch 1: 41%|████ | 5037/12384 [10:41:13<15:30:59, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 1: 41%|████ | 5038/12384 [10:41:13<15:31:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 1: 41%|████ | 5038/12384 [10:41:20<15:31:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 1: 41%|████ | 5039/12384 [10:41:20<15:32:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 1: 41%|████ | 5039/12384 [10:41:28<15:32:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 41%|████ | 5040/12384 [10:41:28<15:31:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 41%|████ | 5040/12384 [10:41:36<15:31:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 41%|████ | 5041/12384 [10:41:36<15:40:54, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 41%|████ | 5041/12384 [10:41:44<15:40:54, 7.69s/it, loss=0.0002, acc=0.9999, iter_time=7.61s]
Epoch 1: 41%|████ | 5042/12384 [10:41:44<15:38:23, 7.67s/it, loss=0.0002, acc=0.9999, iter_time=7.61s]
Epoch 1: 41%|████ | 5042/12384 [10:41:51<15:38:23, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 41%|████ | 5043/12384 [10:41:51<15:37:49, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 41%|████ | 5043/12384 [10:41:59<15:37:49, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 41%|████ | 5044/12384 [10:41:59<15:35:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 41%|████ | 5044/12384 [10:42:07<15:35:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 1: 41%|████ | 5045/12384 [10:42:07<15:38:11, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 1: 41%|████ | 5045/12384 [10:42:14<15:38:11, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 41%|████ | 5046/12384 [10:42:14<15:35:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 41%|████ | 5046/12384 [10:42:22<15:35:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 1: 41%|████ | 5047/12384 [10:42:22<15:33:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 1: 41%|████ | 5047/12384 [10:42:29<15:33:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.61s]
Epoch 1: 41%|████ | 5048/12384 [10:42:29<15:31:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.61s]
Epoch 1: 41%|████ | 5048/12384 [10:42:37<15:31:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.69s]
Epoch 1: 41%|████ | 5049/12384 [10:42:37<15:31:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.69s]
Epoch 1: 41%|████ | 5049/12384 [10:42:45<15:31:22, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.03s]
Epoch 1: 41%|████ | 5050/12384 [10:42:45<15:30:59, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.03s]
Epoch 1: 41%|████ | 5050/12384 [10:42:52<15:30:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 1: 41%|████ | 5051/12384 [10:42:52<15:29:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 1: 41%|████ | 5051/12384 [10:43:00<15:29:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 1: 41%|████ | 5052/12384 [10:43:00<15:29:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 1: 41%|████ | 5052/12384 [10:43:08<15:29:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.35s]
Epoch 1: 41%|████ | 5053/12384 [10:43:08<15:41:18, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.35s]
Epoch 1: 41%|████ | 5053/12384 [10:43:15<15:41:18, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.63s]
Epoch 1: 41%|████ | 5054/12384 [10:43:15<15:38:03, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.63s]
Epoch 1: 41%|████ | 5054/12384 [10:43:23<15:38:03, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 1: 41%|████ | 5055/12384 [10:43:23<15:37:27, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 1: 41%|████ | 5055/12384 [10:43:31<15:37:27, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 41%|████ | 5056/12384 [10:43:31<15:34:58, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 41%|████ | 5056/12384 [10:43:38<15:34:58, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=6.45s]
Epoch 1: 41%|████ | 5057/12384 [10:43:38<15:32:53, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.45s]
Epoch 1: 41%|████ | 5057/12384 [10:43:46<15:32:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 1: 41%|████ | 5058/12384 [10:43:46<15:32:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 1: 41%|████ | 5058/12384 [10:43:53<15:32:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.78s]
Epoch 1: 41%|████ | 5059/12384 [10:43:53<15:29:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.78s]
Epoch 1: 41%|████ | 5059/12384 [10:44:01<15:29:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 1: 41%|████ | 5060/12384 [10:44:01<15:29:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 1: 41%|████ | 5060/12384 [10:44:09<15:29:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 41%|████ | 5061/12384 [10:44:09<15:28:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 41%|████ | 5061/12384 [10:44:16<15:28:31, 7.61s/it, loss=0.0003, acc=0.9982, iter_time=7.71s]
Epoch 1: 41%|████ | 5062/12384 [10:44:16<15:32:07, 7.64s/it, loss=0.0003, acc=0.9982, iter_time=7.71s]
Epoch 1: 41%|████ | 5062/12384 [10:44:24<15:32:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 1: 41%|████ | 5063/12384 [10:44:24<15:31:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 1: 41%|████ | 5063/12384 [10:44:32<15:31:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.63s]
Epoch 1: 41%|████ | 5064/12384 [10:44:32<15:30:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.63s]
Epoch 1: 41%|████ | 5064/12384 [10:44:39<15:30:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 41%|████ | 5065/12384 [10:44:39<15:29:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 41%|████ | 5065/12384 [10:44:47<15:29:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 41%|████ | 5066/12384 [10:44:47<15:28:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 41%|████ | 5066/12384 [10:44:54<15:28:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 1: 41%|████ | 5067/12384 [10:44:54<15:29:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 1: 41%|████ | 5067/12384 [10:45:02<15:29:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 1: 41%|████ | 5068/12384 [10:45:02<15:28:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 1: 41%|████ | 5068/12384 [10:45:10<15:28:59, 7.62s/it, loss=0.0004, acc=0.9990, iter_time=6.76s]
Epoch 1: 41%|████ | 5069/12384 [10:45:10<15:28:36, 7.62s/it, loss=0.0004, acc=0.9990, iter_time=6.76s]
Epoch 1: 41%|████ | 5069/12384 [10:45:17<15:28:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 1: 41%|████ | 5070/12384 [10:45:17<15:28:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 1: 41%|████ | 5070/12384 [10:45:25<15:28:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.87s]
Epoch 1: 41%|████ | 5071/12384 [10:45:25<15:27:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.87s]
Epoch 1: 41%|████ | 5071/12384 [10:45:33<15:27:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.73s]
Epoch 1: 41%|████ | 5072/12384 [10:45:33<15:31:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.73s]
Epoch 1: 41%|████ | 5072/12384 [10:45:40<15:31:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.08s]
Epoch 1: 41%|████ | 5073/12384 [10:45:40<15:29:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.08s]
Epoch 1: 41%|████ | 5073/12384 [10:45:48<15:29:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.35s]
Epoch 1: 41%|████ | 5074/12384 [10:45:48<15:30:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.35s]
Epoch 1: 41%|████ | 5074/12384 [10:45:55<15:30:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 41%|████ | 5075/12384 [10:45:55<15:28:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 41%|████ | 5075/12384 [10:46:03<15:28:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.82s]
Epoch 1: 41%|████ | 5076/12384 [10:46:03<15:27:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.82s]
Epoch 1: 41%|████ | 5076/12384 [10:46:11<15:27:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 1: 41%|████ | 5077/12384 [10:46:11<15:27:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 1: 41%|████ | 5077/12384 [10:46:18<15:27:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 1: 41%|████ | 5078/12384 [10:46:18<15:26:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 1: 41%|████ | 5078/12384 [10:46:26<15:26:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 1: 41%|████ | 5079/12384 [10:46:26<15:38:37, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 1: 41%|████ | 5079/12384 [10:46:34<15:38:37, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.84s]
Epoch 1: 41%|████ | 5080/12384 [10:46:34<15:34:38, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.84s]
Epoch 1: 41%|████ | 5080/12384 [10:46:41<15:34:38, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 1: 41%|████ | 5081/12384 [10:46:41<15:31:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 1: 41%|████ | 5081/12384 [10:46:49<15:31:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 1: 41%|████ | 5082/12384 [10:46:49<15:29:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 1: 41%|████ | 5082/12384 [10:46:57<15:29:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 1: 41%|████ | 5083/12384 [10:46:57<15:28:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 1: 41%|████ | 5083/12384 [10:47:04<15:28:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 1: 41%|████ | 5084/12384 [10:47:04<15:27:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 1: 41%|████ | 5084/12384 [10:47:12<15:27:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 41%|████ | 5085/12384 [10:47:12<15:26:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 41%|████ | 5085/12384 [10:47:19<15:26:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 1: 41%|████ | 5086/12384 [10:47:19<15:27:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 1: 41%|████ | 5086/12384 [10:47:27<15:27:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 1: 41%|████ | 5087/12384 [10:47:27<15:26:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 1: 41%|████ | 5087/12384 [10:47:35<15:26:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 41%|████ | 5088/12384 [10:47:35<15:25:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 41%|████ | 5088/12384 [10:47:42<15:25:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.84s]
Epoch 1: 41%|████ | 5089/12384 [10:47:42<15:26:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.84s]
Epoch 1: 41%|████ | 5089/12384 [10:47:50<15:26:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.00s]
Epoch 1: 41%|████ | 5090/12384 [10:47:50<15:25:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.00s]
Epoch 1: 41%|████ | 5090/12384 [10:47:57<15:25:41, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.29s]
Epoch 1: 41%|████ | 5091/12384 [10:47:57<15:24:25, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.29s]
Epoch 1: 41%|████ | 5091/12384 [10:48:05<15:24:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 1: 41%|████ | 5092/12384 [10:48:05<15:24:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 1: 41%|████ | 5092/12384 [10:48:13<15:24:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 1: 41%|████ | 5093/12384 [10:48:13<15:25:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 1: 41%|████ | 5093/12384 [10:48:20<15:25:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 1: 41%|████ | 5094/12384 [10:48:20<15:25:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 1: 41%|████ | 5094/12384 [10:48:28<15:25:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 1: 41%|████ | 5095/12384 [10:48:28<15:24:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 1: 41%|████ | 5095/12384 [10:48:35<15:24:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 41%|████ | 5096/12384 [10:48:35<15:24:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 41%|████ | 5096/12384 [10:48:43<15:24:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.26s]
Epoch 1: 41%|████ | 5097/12384 [10:48:43<15:24:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.26s]
Epoch 1: 41%|████ | 5097/12384 [10:48:51<15:24:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.57s]
Epoch 1: 41%|████ | 5098/12384 [10:48:51<15:24:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.57s]
Epoch 1: 41%|████ | 5098/12384 [10:48:58<15:24:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 1: 41%|████ | 5099/12384 [10:48:58<15:24:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 1: 41%|████ | 5099/12384 [10:49:06<15:24:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 1: 41%|████ | 5100/12384 [10:49:06<15:24:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 1: 41%|████ | 5100/12384 [10:49:14<15:24:23, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=5.32s]
Epoch 1: 41%|████ | 5101/12384 [10:49:14<15:24:28, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=5.32s]
Epoch 1: 41%|████ | 5101/12384 [10:49:21<15:24:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 1: 41%|████ | 5102/12384 [10:49:21<15:24:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 1: 41%|████ | 5102/12384 [10:49:29<15:24:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 41%|████ | 5103/12384 [10:49:29<15:26:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 41%|████ | 5103/12384 [10:49:37<15:26:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 41%|████ | 5104/12384 [10:49:37<15:26:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 41%|████ | 5104/12384 [10:49:44<15:26:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 41%|████ | 5105/12384 [10:49:44<15:38:52, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 41%|████ | 5105/12384 [10:49:52<15:38:52, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 41%|████ | 5106/12384 [10:49:52<15:33:33, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 41%|████ | 5106/12384 [10:50:00<15:33:33, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 41%|████ | 5107/12384 [10:50:00<15:29:54, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 41%|████ | 5107/12384 [10:50:07<15:29:54, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 41%|████ | 5108/12384 [10:50:07<15:27:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 41%|████ | 5108/12384 [10:50:15<15:27:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 1: 41%|████▏ | 5109/12384 [10:50:15<15:26:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 1: 41%|████▏ | 5109/12384 [10:50:23<15:26:46, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=9.40s]
Epoch 1: 41%|████▏ | 5110/12384 [10:50:23<15:25:27, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.40s]
Epoch 1: 41%|████▏ | 5110/12384 [10:50:30<15:25:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 41%|████▏ | 5111/12384 [10:50:30<15:24:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 41%|████▏ | 5111/12384 [10:50:38<15:24:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 41%|████▏ | 5112/12384 [10:50:38<15:24:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 41%|████▏ | 5112/12384 [10:50:45<15:24:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 41%|████▏ | 5113/12384 [10:50:45<15:23:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 41%|████▏ | 5113/12384 [10:50:53<15:23:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 1: 41%|████▏ | 5114/12384 [10:50:53<15:22:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 1: 41%|████▏ | 5114/12384 [10:51:01<15:22:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 41%|████▏ | 5115/12384 [10:51:01<15:21:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 41%|████▏ | 5115/12384 [10:51:08<15:21:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 41%|████▏ | 5116/12384 [10:51:08<15:28:51, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 41%|████▏ | 5116/12384 [10:51:16<15:28:51, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=6.47s]
Epoch 1: 41%|████▏ | 5117/12384 [10:51:16<15:26:48, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=6.47s]
Epoch 1: 41%|████▏ | 5117/12384 [10:51:24<15:26:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 1: 41%|████▏ | 5118/12384 [10:51:24<15:24:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 1: 41%|████▏ | 5118/12384 [10:51:31<15:24:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 1: 41%|████▏ | 5119/12384 [10:51:31<15:24:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 1: 41%|████▏ | 5119/12384 [10:51:39<15:24:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 41%|████▏ | 5120/12384 [10:51:39<15:23:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 41%|████▏ | 5120/12384 [10:51:46<15:23:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 41%|████▏ | 5121/12384 [10:51:46<15:22:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 41%|████▏ | 5121/12384 [10:51:54<15:22:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 41%|████▏ | 5122/12384 [10:51:54<15:21:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 41%|████▏ | 5122/12384 [10:52:02<15:21:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 1: 41%|████▏ | 5123/12384 [10:52:02<15:21:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 1: 41%|████▏ | 5123/12384 [10:52:09<15:21:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 41%|████▏ | 5124/12384 [10:52:09<15:21:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 41%|████▏ | 5124/12384 [10:52:17<15:21:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 1: 41%|████▏ | 5125/12384 [10:52:17<15:21:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 1: 41%|████▏ | 5125/12384 [10:52:24<15:21:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.20s]
Epoch 1: 41%|████▏ | 5126/12384 [10:52:24<15:21:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.20s]
Epoch 1: 41%|████▏ | 5126/12384 [10:52:32<15:21:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.48s]
Epoch 1: 41%|████▏ | 5127/12384 [10:52:32<15:21:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.48s]
Epoch 1: 41%|████▏ | 5127/12384 [10:52:40<15:21:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 41%|████▏ | 5128/12384 [10:52:40<15:22:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 41%|████▏ | 5128/12384 [10:52:47<15:22:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 41%|████▏ | 5129/12384 [10:52:47<15:22:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 41%|████▏ | 5129/12384 [10:52:55<15:22:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 41%|████▏ | 5130/12384 [10:52:55<15:21:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 41%|████▏ | 5130/12384 [10:53:03<15:21:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 41%|████▏ | 5131/12384 [10:53:03<15:33:09, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 41%|████▏ | 5131/12384 [10:53:11<15:33:09, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 41%|████▏ | 5132/12384 [10:53:11<15:28:34, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 41%|████▏ | 5132/12384 [10:53:18<15:28:34, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 1: 41%|████▏ | 5133/12384 [10:53:18<15:26:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 1: 41%|████▏ | 5133/12384 [10:53:26<15:26:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 1: 41%|████▏ | 5134/12384 [10:53:26<15:24:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 1: 41%|████▏ | 5134/12384 [10:53:33<15:24:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 41%|████▏ | 5135/12384 [10:53:33<15:24:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 41%|████▏ | 5135/12384 [10:53:41<15:24:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.47s]
Epoch 1: 41%|████▏ | 5136/12384 [10:53:41<15:22:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.47s]
Epoch 1: 41%|████▏ | 5136/12384 [10:53:49<15:22:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 41%|████▏ | 5137/12384 [10:53:49<15:21:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 41%|████▏ | 5137/12384 [10:53:56<15:21:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 41%|████▏ | 5138/12384 [10:53:56<15:23:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 41%|████▏ | 5138/12384 [10:54:04<15:23:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 41%|████▏ | 5139/12384 [10:54:04<15:21:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 41%|████▏ | 5139/12384 [10:54:12<15:21:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 42%|████▏ | 5140/12384 [10:54:12<15:21:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 42%|████▏ | 5140/12384 [10:54:19<15:21:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 1: 42%|████▏ | 5141/12384 [10:54:19<15:22:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 1: 42%|████▏ | 5141/12384 [10:54:27<15:22:01, 7.64s/it, loss=0.0004, acc=0.9999, iter_time=9.19s]
Epoch 1: 42%|████▏ | 5142/12384 [10:54:27<15:21:05, 7.63s/it, loss=0.0004, acc=0.9999, iter_time=9.19s]
Epoch 1: 42%|████▏ | 5142/12384 [10:54:34<15:21:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 1: 42%|████▏ | 5143/12384 [10:54:34<15:20:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 1: 42%|████▏ | 5143/12384 [10:54:42<15:20:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.70s]
Epoch 1: 42%|████▏ | 5144/12384 [10:54:42<15:20:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.70s]
Epoch 1: 42%|████▏ | 5144/12384 [10:54:50<15:20:02, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=6.45s]
Epoch 1: 42%|████▏ | 5145/12384 [10:54:50<15:19:36, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=6.45s]
Epoch 1: 42%|████▏ | 5145/12384 [10:54:57<15:19:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 42%|████▏ | 5146/12384 [10:54:57<15:19:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 42%|████▏ | 5146/12384 [10:55:05<15:19:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.19s]
Epoch 1: 42%|████▏ | 5147/12384 [10:55:05<15:20:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.19s]
Epoch 1: 42%|████▏ | 5147/12384 [10:55:13<15:20:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 1: 42%|████▏ | 5148/12384 [10:55:13<15:20:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 1: 42%|████▏ | 5148/12384 [10:55:20<15:20:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 42%|████▏ | 5149/12384 [10:55:20<15:19:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 42%|████▏ | 5149/12384 [10:55:28<15:19:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 1: 42%|████▏ | 5150/12384 [10:55:28<15:19:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 1: 42%|████▏ | 5150/12384 [10:55:35<15:19:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 1: 42%|████▏ | 5151/12384 [10:55:35<15:18:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 1: 42%|████▏ | 5151/12384 [10:55:43<15:18:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 42%|████▏ | 5152/12384 [10:55:43<15:18:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 42%|████▏ | 5152/12384 [10:55:51<15:18:22, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.23s]
Epoch 1: 42%|████▏ | 5153/12384 [10:55:51<15:17:21, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.23s]
Epoch 1: 42%|████▏ | 5153/12384 [10:55:58<15:17:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 1: 42%|████▏ | 5154/12384 [10:55:58<15:16:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 1: 42%|████▏ | 5154/12384 [10:56:06<15:16:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 1: 42%|████▏ | 5155/12384 [10:56:06<15:16:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 1: 42%|████▏ | 5155/12384 [10:56:13<15:16:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 1: 42%|████▏ | 5156/12384 [10:56:13<15:16:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 1: 42%|████▏ | 5156/12384 [10:56:21<15:16:14, 7.61s/it, loss=0.0022, acc=0.9957, iter_time=7.64s]
Epoch 1: 42%|████▏ | 5157/12384 [10:56:21<15:27:52, 7.70s/it, loss=0.0022, acc=0.9957, iter_time=7.64s]
Epoch 1: 42%|████▏ | 5157/12384 [10:56:29<15:27:52, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 42%|████▏ | 5158/12384 [10:56:29<15:24:28, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 42%|████▏ | 5158/12384 [10:56:37<15:24:28, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 42%|████▏ | 5159/12384 [10:56:37<15:21:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 42%|████▏ | 5159/12384 [10:56:44<15:21:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 42%|████▏ | 5160/12384 [10:56:44<15:22:15, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 42%|████▏ | 5160/12384 [10:56:52<15:22:15, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 1: 42%|████▏ | 5161/12384 [10:56:52<15:20:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 1: 42%|████▏ | 5161/12384 [10:56:59<15:20:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 1: 42%|████▏ | 5162/12384 [10:56:59<15:19:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 1: 42%|████▏ | 5162/12384 [10:57:07<15:19:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 42%|████▏ | 5163/12384 [10:57:07<15:20:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 42%|████▏ | 5163/12384 [10:57:15<15:20:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.88s]
Epoch 1: 42%|████▏ | 5164/12384 [10:57:15<15:19:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.88s]
Epoch 1: 42%|████▏ | 5164/12384 [10:57:22<15:19:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.41s]
Epoch 1: 42%|████▏ | 5165/12384 [10:57:22<15:17:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.41s]
Epoch 1: 42%|████▏ | 5165/12384 [10:57:30<15:17:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 42%|████▏ | 5166/12384 [10:57:30<15:17:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 42%|████▏ | 5166/12384 [10:57:38<15:17:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.43s]
Epoch 1: 42%|████▏ | 5167/12384 [10:57:38<15:17:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.43s]
Epoch 1: 42%|████▏ | 5167/12384 [10:57:45<15:17:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.77s]
Epoch 1: 42%|████▏ | 5168/12384 [10:57:45<15:16:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.77s]
Epoch 1: 42%|████▏ | 5168/12384 [10:57:53<15:16:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 1: 42%|████▏ | 5169/12384 [10:57:53<15:18:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 1: 42%|████▏ | 5169/12384 [10:58:01<15:18:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.09s]
Epoch 1: 42%|████▏ | 5170/12384 [10:58:01<15:27:25, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.09s]
Epoch 1: 42%|████▏ | 5170/12384 [10:58:08<15:27:25, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 1: 42%|████▏ | 5171/12384 [10:58:08<15:24:28, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 1: 42%|████▏ | 5171/12384 [10:58:16<15:24:28, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.86s]
Epoch 1: 42%|████▏ | 5172/12384 [10:58:16<15:21:15, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.86s]
Epoch 1: 42%|████▏ | 5172/12384 [10:58:24<15:21:15, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 1: 42%|████▏ | 5173/12384 [10:58:24<15:18:46, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 1: 42%|████▏ | 5173/12384 [10:58:31<15:18:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 42%|████▏ | 5174/12384 [10:58:31<15:16:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 42%|████▏ | 5174/12384 [10:58:39<15:16:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 42%|████▏ | 5175/12384 [10:58:39<15:16:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 42%|████▏ | 5175/12384 [10:58:46<15:16:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 42%|████▏ | 5176/12384 [10:58:46<15:15:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 42%|████▏ | 5176/12384 [10:58:54<15:15:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.17s]
Epoch 1: 42%|████▏ | 5177/12384 [10:58:54<15:15:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.17s]
Epoch 1: 42%|████▏ | 5177/12384 [10:59:02<15:15:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 1: 42%|████▏ | 5178/12384 [10:59:02<15:15:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 1: 42%|████▏ | 5178/12384 [10:59:09<15:15:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 42%|████▏ | 5179/12384 [10:59:09<15:14:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 42%|████▏ | 5179/12384 [10:59:17<15:14:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 42%|████▏ | 5180/12384 [10:59:17<15:14:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 42%|████▏ | 5180/12384 [10:59:25<15:14:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 42%|████▏ | 5181/12384 [10:59:25<15:16:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 42%|████▏ | 5181/12384 [10:59:32<15:16:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 42%|████▏ | 5182/12384 [10:59:32<15:14:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 42%|████▏ | 5182/12384 [10:59:40<15:14:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 1: 42%|████▏ | 5183/12384 [10:59:40<15:13:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 1: 42%|████▏ | 5183/12384 [10:59:48<15:13:33, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.90s]
Epoch 1: 42%|████▏ | 5184/12384 [10:59:48<15:24:04, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=8.90s]
Epoch 1: 42%|████▏ | 5184/12384 [10:59:55<15:24:04, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.46s]
Epoch 1: 42%|████▏ | 5185/12384 [10:59:55<15:20:16, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.46s]
Epoch 1: 42%|████▏ | 5185/12384 [11:00:03<15:20:16, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 1: 42%|████▏ | 5186/12384 [11:00:03<15:18:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 1: 42%|████▏ | 5186/12384 [11:00:11<15:18:24, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=9.92s]
Epoch 1: 42%|████▏ | 5187/12384 [11:00:11<15:17:00, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=9.92s]
Epoch 1: 42%|████▏ | 5187/12384 [11:00:18<15:17:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 42%|████▏ | 5188/12384 [11:00:18<15:15:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 42%|████▏ | 5188/12384 [11:00:26<15:15:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 1: 42%|████▏ | 5189/12384 [11:00:26<15:14:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 1: 42%|████▏ | 5189/12384 [11:00:33<15:14:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 1: 42%|████▏ | 5190/12384 [11:00:33<15:13:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 1: 42%|████▏ | 5190/12384 [11:00:41<15:13:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 42%|████▏ | 5191/12384 [11:00:41<15:12:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 42%|████▏ | 5191/12384 [11:00:49<15:12:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 42%|████▏ | 5192/12384 [11:00:49<15:12:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 42%|████▏ | 5192/12384 [11:00:56<15:12:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.52s]
Epoch 1: 42%|████▏ | 5193/12384 [11:00:56<15:11:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.52s]
Epoch 1: 42%|████▏ | 5193/12384 [11:01:04<15:11:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 1: 42%|████▏ | 5194/12384 [11:01:04<15:11:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 1: 42%|████▏ | 5194/12384 [11:01:11<15:11:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 42%|████▏ | 5195/12384 [11:01:11<15:11:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 42%|████▏ | 5195/12384 [11:01:19<15:11:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 1: 42%|████▏ | 5196/12384 [11:01:19<15:11:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 1: 42%|████▏ | 5196/12384 [11:01:27<15:11:08, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=10.10s]
Epoch 1: 42%|████▏ | 5197/12384 [11:01:27<15:11:14, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=10.10s]
Epoch 1: 42%|████▏ | 5197/12384 [11:01:34<15:11:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 42%|████▏ | 5198/12384 [11:01:34<15:11:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 42%|████▏ | 5198/12384 [11:01:42<15:11:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 1: 42%|████▏ | 5199/12384 [11:01:42<15:11:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 1: 42%|████▏ | 5199/12384 [11:01:49<15:11:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.81s]
Epoch 1: 42%|████▏ | 5200/12384 [11:01:49<15:11:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.81s]
Epoch 1: 42%|████▏ | 5200/12384 [11:01:57<15:11:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 42%|████▏ | 5201/12384 [11:01:57<15:11:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 42%|████▏ | 5201/12384 [11:02:05<15:11:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 42%|████▏ | 5202/12384 [11:02:05<15:11:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 42%|████▏ | 5202/12384 [11:02:12<15:11:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 1: 42%|████▏ | 5203/12384 [11:02:12<15:11:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 1: 42%|████▏ | 5203/12384 [11:02:20<15:11:19, 7.61s/it, loss=0.0002, acc=0.9984, iter_time=8.23s]
Epoch 1: 42%|████▏ | 5204/12384 [11:02:20<15:10:48, 7.61s/it, loss=0.0002, acc=0.9984, iter_time=8.23s]
Epoch 1: 42%|████▏ | 5204/12384 [11:02:28<15:10:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 42%|████▏ | 5205/12384 [11:02:28<15:11:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 42%|████▏ | 5205/12384 [11:02:35<15:11:17, 7.62s/it, loss=0.0007, acc=0.9988, iter_time=8.85s]
Epoch 1: 42%|████▏ | 5206/12384 [11:02:35<15:11:15, 7.62s/it, loss=0.0007, acc=0.9988, iter_time=8.85s]
Epoch 1: 42%|████▏ | 5206/12384 [11:02:43<15:11:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 42%|████▏ | 5207/12384 [11:02:43<15:10:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 42%|████▏ | 5207/12384 [11:02:50<15:10:50, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.00s]
Epoch 1: 42%|████▏ | 5208/12384 [11:02:50<15:11:42, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.00s]
Epoch 1: 42%|████▏ | 5208/12384 [11:02:58<15:11:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 1: 42%|████▏ | 5209/12384 [11:02:58<15:10:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 1: 42%|████▏ | 5209/12384 [11:03:06<15:10:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 1: 42%|████▏ | 5210/12384 [11:03:06<15:23:46, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 1: 42%|████▏ | 5210/12384 [11:03:14<15:23:46, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=9.16s]
Epoch 1: 42%|████▏ | 5211/12384 [11:03:14<15:19:11, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.16s]
Epoch 1: 42%|████▏ | 5211/12384 [11:03:21<15:19:11, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 42%|████▏ | 5212/12384 [11:03:21<15:15:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 42%|████▏ | 5212/12384 [11:03:29<15:15:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 42%|████▏ | 5213/12384 [11:03:29<15:13:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 42%|████▏ | 5213/12384 [11:03:36<15:13:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 1: 42%|████▏ | 5214/12384 [11:03:36<15:11:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 1: 42%|████▏ | 5214/12384 [11:03:44<15:11:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 1: 42%|████▏ | 5215/12384 [11:03:44<15:11:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 1: 42%|████▏ | 5215/12384 [11:03:52<15:11:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 1: 42%|████▏ | 5216/12384 [11:03:52<15:12:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 1: 42%|████▏ | 5216/12384 [11:03:59<15:12:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 42%|████▏ | 5217/12384 [11:03:59<15:11:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 42%|████▏ | 5217/12384 [11:04:07<15:11:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 1: 42%|████▏ | 5218/12384 [11:04:07<15:09:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 1: 42%|████▏ | 5218/12384 [11:04:15<15:09:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 1: 42%|████▏ | 5219/12384 [11:04:15<15:13:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 1: 42%|████▏ | 5219/12384 [11:04:22<15:13:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.56s]
Epoch 1: 42%|████▏ | 5220/12384 [11:04:22<15:12:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.56s]
Epoch 1: 42%|████▏ | 5220/12384 [11:04:30<15:12:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 1: 42%|████▏ | 5221/12384 [11:04:30<15:10:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 1: 42%|████▏ | 5221/12384 [11:04:38<15:10:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 42%|████▏ | 5222/12384 [11:04:38<15:19:55, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 42%|████▏ | 5222/12384 [11:04:45<15:19:55, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 1: 42%|████▏ | 5223/12384 [11:04:45<15:15:56, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 1: 42%|████▏ | 5223/12384 [11:04:53<15:15:56, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.03s]
Epoch 1: 42%|████▏ | 5224/12384 [11:04:53<15:13:37, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.03s]
Epoch 1: 42%|████▏ | 5224/12384 [11:05:00<15:13:37, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 42%|████▏ | 5225/12384 [11:05:00<15:12:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 42%|████▏ | 5225/12384 [11:05:08<15:12:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 42%|████▏ | 5226/12384 [11:05:08<15:10:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 42%|████▏ | 5226/12384 [11:05:16<15:10:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.22s]
Epoch 1: 42%|████▏ | 5227/12384 [11:05:16<15:09:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.22s]
Epoch 1: 42%|████▏ | 5227/12384 [11:05:23<15:09:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 1: 42%|████▏ | 5228/12384 [11:05:23<15:08:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 1: 42%|████▏ | 5228/12384 [11:05:31<15:08:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 42%|████▏ | 5229/12384 [11:05:31<15:08:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 42%|████▏ | 5229/12384 [11:05:39<15:08:31, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 42%|████▏ | 5230/12384 [11:05:39<15:07:57, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 42%|████▏ | 5230/12384 [11:05:46<15:07:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 42%|████▏ | 5231/12384 [11:05:46<15:09:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 42%|████▏ | 5231/12384 [11:05:54<15:09:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.34s]
Epoch 1: 42%|████▏ | 5232/12384 [11:05:54<15:08:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.34s]
Epoch 1: 42%|████▏ | 5232/12384 [11:06:01<15:08:44, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.58s]
Epoch 1: 42%|████▏ | 5233/12384 [11:06:01<15:08:30, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.58s]
Epoch 1: 42%|████▏ | 5233/12384 [11:06:09<15:08:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 1: 42%|████▏ | 5234/12384 [11:06:09<15:08:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 1: 42%|████▏ | 5234/12384 [11:06:17<15:08:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 1: 42%|████▏ | 5235/12384 [11:06:17<15:08:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 1: 42%|████▏ | 5235/12384 [11:06:24<15:08:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 1: 42%|████▏ | 5236/12384 [11:06:24<15:07:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 1: 42%|████▏ | 5236/12384 [11:06:32<15:07:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 42%|████▏ | 5237/12384 [11:06:32<15:18:30, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 42%|████▏ | 5237/12384 [11:06:40<15:18:30, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.36s]
Epoch 1: 42%|████▏ | 5238/12384 [11:06:40<15:14:32, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.36s]
Epoch 1: 42%|████▏ | 5238/12384 [11:06:47<15:14:32, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 42%|████▏ | 5239/12384 [11:06:47<15:12:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 42%|████▏ | 5239/12384 [11:06:55<15:12:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.26s]
Epoch 1: 42%|████▏ | 5240/12384 [11:06:55<15:11:31, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.26s]
Epoch 1: 42%|████▏ | 5240/12384 [11:07:03<15:11:31, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.36s]
Epoch 1: 42%|████▏ | 5241/12384 [11:07:03<15:10:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.36s]
Epoch 1: 42%|████▏ | 5241/12384 [11:07:10<15:10:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.48s]
Epoch 1: 42%|████▏ | 5242/12384 [11:07:10<15:09:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.48s]
Epoch 1: 42%|████▏ | 5242/12384 [11:07:18<15:09:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 42%|████▏ | 5243/12384 [11:07:18<15:07:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 42%|████▏ | 5243/12384 [11:07:25<15:07:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 1: 42%|████▏ | 5244/12384 [11:07:25<15:05:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 1: 42%|████▏ | 5244/12384 [11:07:33<15:05:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.69s]
Epoch 1: 42%|████▏ | 5245/12384 [11:07:33<15:05:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.69s]
Epoch 1: 42%|████▏ | 5245/12384 [11:07:41<15:05:12, 7.61s/it, loss=0.0007, acc=0.9985, iter_time=9.27s]
Epoch 1: 42%|████▏ | 5246/12384 [11:07:41<15:05:14, 7.61s/it, loss=0.0007, acc=0.9985, iter_time=9.27s]
Epoch 1: 42%|████▏ | 5246/12384 [11:07:48<15:05:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.93s]
Epoch 1: 42%|████▏ | 5247/12384 [11:07:48<15:04:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.93s]
Epoch 1: 42%|████▏ | 5247/12384 [11:07:56<15:04:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.71s]
Epoch 1: 42%|████▏ | 5248/12384 [11:07:56<15:05:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.71s]
Epoch 1: 42%|████▏ | 5248/12384 [11:08:04<15:05:38, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.66s]
Epoch 1: 42%|████▏ | 5249/12384 [11:08:04<15:05:57, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.66s]
Epoch 1: 42%|████▏ | 5249/12384 [11:08:11<15:05:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.62s]
Epoch 1: 42%|████▏ | 5250/12384 [11:08:11<15:05:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.62s]
Epoch 1: 42%|████▏ | 5250/12384 [11:08:19<15:05:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 42%|████▏ | 5251/12384 [11:08:19<15:05:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 42%|████▏ | 5251/12384 [11:08:26<15:05:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 42%|████▏ | 5252/12384 [11:08:26<15:05:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 42%|████▏ | 5252/12384 [11:08:34<15:05:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 42%|████▏ | 5253/12384 [11:08:34<15:04:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 42%|████▏ | 5253/12384 [11:08:42<15:04:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 42%|████▏ | 5254/12384 [11:08:42<15:04:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 42%|████▏ | 5254/12384 [11:08:49<15:04:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 42%|████▏ | 5255/12384 [11:08:49<15:04:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 42%|████▏ | 5255/12384 [11:08:57<15:04:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 1: 42%|████▏ | 5256/12384 [11:08:57<15:04:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 1: 42%|████▏ | 5256/12384 [11:09:04<15:04:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 1: 42%|████▏ | 5257/12384 [11:09:04<15:03:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 1: 42%|████▏ | 5257/12384 [11:09:12<15:03:54, 7.61s/it, loss=0.0004, acc=0.9965, iter_time=8.21s]
Epoch 1: 42%|████▏ | 5258/12384 [11:09:12<15:04:11, 7.61s/it, loss=0.0004, acc=0.9965, iter_time=8.21s]
Epoch 1: 42%|████▏ | 5258/12384 [11:09:20<15:04:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 42%|████▏ | 5259/12384 [11:09:20<15:02:39, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 42%|████▏ | 5259/12384 [11:09:27<15:02:39, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 1: 42%|████▏ | 5260/12384 [11:09:27<15:02:27, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 1: 42%|████▏ | 5260/12384 [11:09:35<15:02:27, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 42%|████▏ | 5261/12384 [11:09:35<15:02:31, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 42%|████▏ | 5261/12384 [11:09:42<15:02:31, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 42%|████▏ | 5262/12384 [11:09:42<15:02:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 42%|████▏ | 5262/12384 [11:09:50<15:02:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 1: 42%|████▏ | 5263/12384 [11:09:50<15:14:49, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 1: 42%|████▏ | 5263/12384 [11:09:58<15:14:49, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 1: 43%|████▎ | 5264/12384 [11:09:58<15:11:12, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 1: 43%|████▎ | 5264/12384 [11:10:06<15:11:12, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 1: 43%|████▎ | 5265/12384 [11:10:06<15:08:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 1: 43%|████▎ | 5265/12384 [11:10:13<15:08:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 1: 43%|████▎ | 5266/12384 [11:10:13<15:07:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 1: 43%|████▎ | 5266/12384 [11:10:21<15:07:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.48s]
Epoch 1: 43%|████▎ | 5267/12384 [11:10:21<15:06:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.48s]
Epoch 1: 43%|████▎ | 5267/12384 [11:10:28<15:06:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.21s]
Epoch 1: 43%|████▎ | 5268/12384 [11:10:28<15:04:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.21s]
Epoch 1: 43%|████▎ | 5268/12384 [11:10:36<15:04:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 1: 43%|████▎ | 5269/12384 [11:10:36<15:03:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 1: 43%|████▎ | 5269/12384 [11:10:44<15:03:18, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 1: 43%|████▎ | 5270/12384 [11:10:44<15:02:57, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 1: 43%|████▎ | 5270/12384 [11:10:51<15:02:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 43%|████▎ | 5271/12384 [11:10:51<15:01:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 43%|████▎ | 5271/12384 [11:10:59<15:01:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 1: 43%|████▎ | 5272/12384 [11:10:59<15:01:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 1: 43%|████▎ | 5272/12384 [11:11:06<15:01:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 43%|████▎ | 5273/12384 [11:11:06<15:01:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 43%|████▎ | 5273/12384 [11:11:14<15:01:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 43%|████▎ | 5274/12384 [11:11:14<15:01:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 43%|████▎ | 5274/12384 [11:11:22<15:01:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 1: 43%|████▎ | 5275/12384 [11:11:22<15:12:25, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 1: 43%|████▎ | 5275/12384 [11:11:30<15:12:25, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 43%|████▎ | 5276/12384 [11:11:30<15:09:25, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 43%|████▎ | 5276/12384 [11:11:37<15:09:25, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 43%|████▎ | 5277/12384 [11:11:37<15:07:00, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 43%|████▎ | 5277/12384 [11:11:45<15:07:00, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 43%|████▎ | 5278/12384 [11:11:45<15:04:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 43%|████▎ | 5278/12384 [11:11:52<15:04:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 43%|████▎ | 5279/12384 [11:11:52<15:03:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 43%|████▎ | 5279/12384 [11:12:00<15:03:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 43%|████▎ | 5280/12384 [11:12:00<15:02:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 43%|████▎ | 5280/12384 [11:12:08<15:02:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 1: 43%|████▎ | 5281/12384 [11:12:08<15:01:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 1: 43%|████▎ | 5281/12384 [11:12:15<15:01:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.72s]
Epoch 1: 43%|████▎ | 5282/12384 [11:12:15<15:01:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.72s]
Epoch 1: 43%|████▎ | 5282/12384 [11:12:23<15:01:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 43%|████▎ | 5283/12384 [11:12:23<15:00:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 43%|████▎ | 5283/12384 [11:12:30<15:00:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 43%|████▎ | 5284/12384 [11:12:30<15:00:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 43%|████▎ | 5284/12384 [11:12:38<15:00:55, 7.61s/it, loss=0.0006, acc=0.9988, iter_time=7.61s]
Epoch 1: 43%|████▎ | 5285/12384 [11:12:38<15:00:30, 7.61s/it, loss=0.0006, acc=0.9988, iter_time=7.61s]
Epoch 1: 43%|████▎ | 5285/12384 [11:12:46<15:00:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 1: 43%|████▎ | 5286/12384 [11:12:46<15:00:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 1: 43%|████▎ | 5286/12384 [11:12:53<15:00:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 1: 43%|████▎ | 5287/12384 [11:12:53<15:00:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 1: 43%|████▎ | 5287/12384 [11:13:01<15:00:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 1: 43%|████▎ | 5288/12384 [11:13:01<15:00:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 1: 43%|████▎ | 5288/12384 [11:13:09<15:00:58, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.70s]
Epoch 1: 43%|████▎ | 5289/12384 [11:13:09<15:12:02, 7.71s/it, loss=0.0002, acc=1.0000, iter_time=7.70s]
Epoch 1: 43%|████▎ | 5289/12384 [11:13:17<15:12:02, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.64s]
Epoch 1: 43%|████▎ | 5290/12384 [11:13:17<15:08:36, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.64s]
Epoch 1: 43%|████▎ | 5290/12384 [11:13:24<15:08:36, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.87s]
Epoch 1: 43%|████▎ | 5291/12384 [11:13:24<15:05:46, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.87s]
Epoch 1: 43%|████▎ | 5291/12384 [11:13:32<15:05:46, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 43%|████▎ | 5292/12384 [11:13:32<15:03:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 43%|████▎ | 5292/12384 [11:13:39<15:03:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.29s]
Epoch 1: 43%|████▎ | 5293/12384 [11:13:39<15:02:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.29s]
Epoch 1: 43%|████▎ | 5293/12384 [11:13:47<15:02:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.92s]
Epoch 1: 43%|████▎ | 5294/12384 [11:13:47<15:00:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.92s]
Epoch 1: 43%|████▎ | 5294/12384 [11:13:55<15:00:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 43%|████▎ | 5295/12384 [11:13:55<15:00:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 43%|████▎ | 5295/12384 [11:14:02<15:00:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 43%|████▎ | 5296/12384 [11:14:02<15:00:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 43%|████▎ | 5296/12384 [11:14:10<15:00:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.60s]
Epoch 1: 43%|████▎ | 5297/12384 [11:14:10<14:59:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.60s]
Epoch 1: 43%|████▎ | 5297/12384 [11:14:17<14:59:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 1: 43%|████▎ | 5298/12384 [11:14:17<14:59:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 1: 43%|████▎ | 5298/12384 [11:14:25<14:59:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 43%|████▎ | 5299/12384 [11:14:25<14:58:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 43%|████▎ | 5299/12384 [11:14:33<14:58:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 43%|████▎ | 5300/12384 [11:14:33<14:59:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 43%|████▎ | 5300/12384 [11:14:40<14:59:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 1: 43%|████▎ | 5301/12384 [11:14:40<15:01:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 1: 43%|████▎ | 5301/12384 [11:14:48<15:01:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.04s]
Epoch 1: 43%|████▎ | 5302/12384 [11:14:48<15:01:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.04s]
Epoch 1: 43%|████▎ | 5302/12384 [11:14:56<15:01:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 43%|████▎ | 5303/12384 [11:14:56<15:00:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 43%|████▎ | 5303/12384 [11:15:03<15:00:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 43%|████▎ | 5304/12384 [11:15:03<14:59:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 43%|████▎ | 5304/12384 [11:15:11<14:59:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 43%|████▎ | 5305/12384 [11:15:11<15:00:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 43%|████▎ | 5305/12384 [11:15:18<15:00:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 43%|████▎ | 5306/12384 [11:15:18<14:59:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 43%|████▎ | 5306/12384 [11:15:26<14:59:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 43%|████▎ | 5307/12384 [11:15:26<14:59:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 43%|████▎ | 5307/12384 [11:15:34<14:59:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 43%|████▎ | 5308/12384 [11:15:34<14:58:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 43%|████▎ | 5308/12384 [11:15:41<14:58:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.60s]
Epoch 1: 43%|████▎ | 5309/12384 [11:15:41<14:58:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.60s]
Epoch 1: 43%|████▎ | 5309/12384 [11:15:49<14:58:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 1: 43%|████▎ | 5310/12384 [11:15:49<14:58:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 1: 43%|████▎ | 5310/12384 [11:15:57<14:58:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 43%|████▎ | 5311/12384 [11:15:57<14:58:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 43%|████▎ | 5311/12384 [11:16:04<14:58:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 43%|████▎ | 5312/12384 [11:16:04<14:57:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 43%|████▎ | 5312/12384 [11:16:12<14:57:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.79s]
Epoch 1: 43%|████▎ | 5313/12384 [11:16:12<14:56:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.79s]
Epoch 1: 43%|████▎ | 5313/12384 [11:16:19<14:56:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 1: 43%|████▎ | 5314/12384 [11:16:19<14:57:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 1: 43%|████▎ | 5314/12384 [11:16:27<14:57:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.29s]
Epoch 1: 43%|████▎ | 5315/12384 [11:16:27<15:09:13, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.29s]
Epoch 1: 43%|████▎ | 5315/12384 [11:16:35<15:09:13, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.35s]
Epoch 1: 43%|████▎ | 5316/12384 [11:16:35<15:06:59, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.35s]
Epoch 1: 43%|████▎ | 5316/12384 [11:16:43<15:06:59, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=3.90s]
Epoch 1: 43%|████▎ | 5317/12384 [11:16:43<15:04:09, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=3.90s]
Epoch 1: 43%|████▎ | 5317/12384 [11:16:50<15:04:09, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.92s]
Epoch 1: 43%|████▎ | 5318/12384 [11:16:50<15:01:37, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.92s]
Epoch 1: 43%|████▎ | 5318/12384 [11:16:58<15:01:37, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 43%|████▎ | 5319/12384 [11:16:58<15:00:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 43%|████▎ | 5319/12384 [11:17:05<15:00:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 43%|████▎ | 5320/12384 [11:17:05<14:58:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 43%|████▎ | 5320/12384 [11:17:13<14:58:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 1: 43%|████▎ | 5321/12384 [11:17:13<14:58:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 1: 43%|████▎ | 5321/12384 [11:17:21<14:58:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 43%|████▎ | 5322/12384 [11:17:21<14:57:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 43%|████▎ | 5322/12384 [11:17:28<14:57:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 1: 43%|████▎ | 5323/12384 [11:17:28<14:55:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 1: 43%|████▎ | 5323/12384 [11:17:36<14:55:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 1: 43%|████▎ | 5324/12384 [11:17:36<14:55:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 1: 43%|████▎ | 5324/12384 [11:17:43<14:55:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 1: 43%|████▎ | 5325/12384 [11:17:43<14:55:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 1: 43%|████▎ | 5325/12384 [11:17:51<14:55:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 43%|████▎ | 5326/12384 [11:17:51<14:55:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 43%|████▎ | 5326/12384 [11:17:59<14:55:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 43%|████▎ | 5327/12384 [11:17:59<15:04:41, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 43%|████▎ | 5327/12384 [11:18:07<15:04:41, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 43%|████▎ | 5328/12384 [11:18:07<15:01:36, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 43%|████▎ | 5328/12384 [11:18:14<15:01:36, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.14s]
Epoch 1: 43%|████▎ | 5329/12384 [11:18:14<14:59:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.14s]
Epoch 1: 43%|████▎ | 5329/12384 [11:18:22<14:59:48, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=11.13s]
Epoch 1: 43%|████▎ | 5330/12384 [11:18:22<15:01:20, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=11.13s]
Epoch 1: 43%|████▎ | 5330/12384 [11:18:30<15:01:20, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 1: 43%|████▎ | 5331/12384 [11:18:30<15:02:30, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 1: 43%|████▎ | 5331/12384 [11:18:37<15:02:30, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.13s]
Epoch 1: 43%|████▎ | 5332/12384 [11:18:37<15:04:12, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.13s]
Epoch 1: 43%|████▎ | 5332/12384 [11:18:45<15:04:12, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.63s]
Epoch 1: 43%|████▎ | 5333/12384 [11:18:45<15:01:40, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.63s]
Epoch 1: 43%|████▎ | 5333/12384 [11:18:52<15:01:40, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=10.48s]
Epoch 1: 43%|████▎ | 5334/12384 [11:18:52<14:58:36, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=10.48s]
Epoch 1: 43%|████▎ | 5334/12384 [11:19:00<14:58:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 43%|████▎ | 5335/12384 [11:19:00<14:56:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 43%|████▎ | 5335/12384 [11:19:08<14:56:38, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.09s]
Epoch 1: 43%|████▎ | 5336/12384 [11:19:08<14:56:54, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=9.09s]
Epoch 1: 43%|████▎ | 5336/12384 [11:19:15<14:56:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 1: 43%|████▎ | 5337/12384 [11:19:15<14:55:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 1: 43%|████▎ | 5337/12384 [11:19:23<14:55:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.33s]
Epoch 1: 43%|████▎ | 5338/12384 [11:19:23<14:54:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.33s]
Epoch 1: 43%|████▎ | 5338/12384 [11:19:31<14:54:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 43%|████▎ | 5339/12384 [11:19:31<14:54:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 43%|████▎ | 5339/12384 [11:19:38<14:54:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 43%|████▎ | 5340/12384 [11:19:38<14:53:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 43%|████▎ | 5340/12384 [11:19:46<14:53:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 43%|████▎ | 5341/12384 [11:19:46<15:05:39, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 43%|████▎ | 5341/12384 [11:19:54<15:05:39, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 43%|████▎ | 5342/12384 [11:19:54<15:01:31, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 43%|████▎ | 5342/12384 [11:20:01<15:01:31, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 1: 43%|████▎ | 5343/12384 [11:20:01<14:59:12, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 1: 43%|████▎ | 5343/12384 [11:20:09<14:59:12, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 1: 43%|████▎ | 5344/12384 [11:20:09<14:57:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 1: 43%|████▎ | 5344/12384 [11:20:17<14:57:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 43%|████▎ | 5345/12384 [11:20:17<14:57:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 43%|████▎ | 5345/12384 [11:20:24<14:57:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 43%|████▎ | 5346/12384 [11:20:24<14:54:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 43%|████▎ | 5346/12384 [11:20:32<14:54:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 43%|████▎ | 5347/12384 [11:20:32<14:53:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 43%|████▎ | 5347/12384 [11:20:39<14:53:27, 7.62s/it, loss=0.0037, acc=0.9909, iter_time=7.60s]
Epoch 1: 43%|████▎ | 5348/12384 [11:20:39<14:53:17, 7.62s/it, loss=0.0037, acc=0.9909, iter_time=7.60s]
Epoch 1: 43%|████▎ | 5348/12384 [11:20:47<14:53:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 43%|████▎ | 5349/12384 [11:20:47<14:52:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 43%|████▎ | 5349/12384 [11:20:55<14:52:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 1: 43%|████▎ | 5350/12384 [11:20:55<14:51:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 1: 43%|████▎ | 5350/12384 [11:21:02<14:51:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 1: 43%|████▎ | 5351/12384 [11:21:02<14:51:16, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 1: 43%|████▎ | 5351/12384 [11:21:10<14:51:16, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 43%|████▎ | 5352/12384 [11:21:10<14:52:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 43%|████▎ | 5352/12384 [11:21:18<14:52:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 43%|████▎ | 5353/12384 [11:21:18<15:01:36, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 43%|████▎ | 5353/12384 [11:21:25<15:01:36, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 43%|████▎ | 5354/12384 [11:21:25<14:58:23, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 43%|████▎ | 5354/12384 [11:21:33<14:58:23, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 43%|████▎ | 5355/12384 [11:21:33<14:56:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 43%|████▎ | 5355/12384 [11:21:41<14:56:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 1: 43%|████▎ | 5356/12384 [11:21:41<14:54:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 1: 43%|████▎ | 5356/12384 [11:21:48<14:54:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 43%|████▎ | 5357/12384 [11:21:48<14:53:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 43%|████▎ | 5357/12384 [11:21:56<14:53:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 43%|████▎ | 5358/12384 [11:21:56<14:52:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 43%|████▎ | 5358/12384 [11:22:03<14:52:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 1: 43%|████▎ | 5359/12384 [11:22:03<14:51:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 1: 43%|████▎ | 5359/12384 [11:22:11<14:51:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 1: 43%|████▎ | 5360/12384 [11:22:11<14:51:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 1: 43%|████▎ | 5360/12384 [11:22:19<14:51:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 43%|████▎ | 5361/12384 [11:22:19<14:49:52, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 43%|████▎ | 5361/12384 [11:22:26<14:49:52, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 43%|████▎ | 5362/12384 [11:22:26<14:49:42, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 43%|████▎ | 5362/12384 [11:22:34<14:49:42, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 43%|████▎ | 5363/12384 [11:22:34<14:49:27, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 43%|████▎ | 5363/12384 [11:22:41<14:49:27, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 43%|████▎ | 5364/12384 [11:22:41<14:49:02, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 43%|████▎ | 5364/12384 [11:22:49<14:49:02, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=4.21s]
Epoch 1: 43%|████▎ | 5365/12384 [11:22:49<14:49:13, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=4.21s]
Epoch 1: 43%|████▎ | 5365/12384 [11:22:56<14:49:13, 7.60s/it, loss=0.0003, acc=0.9981, iter_time=11.37s]
Epoch 1: 43%|████▎ | 5366/12384 [11:22:56<14:48:28, 7.60s/it, loss=0.0003, acc=0.9981, iter_time=11.37s]
Epoch 1: 43%|████▎ | 5366/12384 [11:23:04<14:48:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 43%|████▎ | 5367/12384 [11:23:04<14:48:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 43%|████▎ | 5367/12384 [11:23:12<14:48:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 43%|████▎ | 5368/12384 [11:23:12<15:01:05, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 43%|████▎ | 5368/12384 [11:23:20<15:01:05, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 43%|████▎ | 5369/12384 [11:23:20<14:58:01, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 43%|████▎ | 5369/12384 [11:23:27<14:58:01, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 43%|████▎ | 5370/12384 [11:23:27<14:57:46, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 43%|████▎ | 5370/12384 [11:23:35<14:57:46, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 43%|████▎ | 5371/12384 [11:23:35<14:54:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 43%|████▎ | 5371/12384 [11:23:43<14:54:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 1: 43%|████▎ | 5372/12384 [11:23:43<14:52:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 1: 43%|████▎ | 5372/12384 [11:23:50<14:52:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.51s]
Epoch 1: 43%|████▎ | 5373/12384 [11:23:50<14:53:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.51s]
Epoch 1: 43%|████▎ | 5373/12384 [11:23:58<14:53:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.93s]
Epoch 1: 43%|████▎ | 5374/12384 [11:23:58<14:51:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.93s]
Epoch 1: 43%|████▎ | 5374/12384 [11:24:05<14:51:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 43%|████▎ | 5375/12384 [11:24:05<14:49:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 43%|████▎ | 5375/12384 [11:24:13<14:49:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 43%|████▎ | 5376/12384 [11:24:13<14:49:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 43%|████▎ | 5376/12384 [11:24:21<14:49:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 43%|████▎ | 5377/12384 [11:24:21<14:51:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 43%|████▎ | 5377/12384 [11:24:28<14:51:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 43%|████▎ | 5378/12384 [11:24:28<14:50:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 43%|████▎ | 5378/12384 [11:24:36<14:50:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 43%|████▎ | 5379/12384 [11:24:36<14:49:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 43%|████▎ | 5379/12384 [11:24:44<14:49:29, 7.62s/it, loss=0.0003, acc=0.9977, iter_time=7.62s]
Epoch 1: 43%|████▎ | 5380/12384 [11:24:44<14:49:09, 7.62s/it, loss=0.0003, acc=0.9977, iter_time=7.62s]
Epoch 1: 43%|████▎ | 5380/12384 [11:24:51<14:49:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 43%|████▎ | 5381/12384 [11:24:51<14:50:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 43%|████▎ | 5381/12384 [11:24:59<14:50:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 1: 43%|████▎ | 5382/12384 [11:24:59<14:49:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 1: 43%|████▎ | 5382/12384 [11:25:06<14:49:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.52s]
Epoch 1: 43%|████▎ | 5383/12384 [11:25:06<14:50:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.52s]
Epoch 1: 43%|████▎ | 5383/12384 [11:25:14<14:50:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.32s]
Epoch 1: 43%|████▎ | 5384/12384 [11:25:14<14:49:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.32s]
Epoch 1: 43%|████▎ | 5384/12384 [11:25:22<14:49:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 43%|████▎ | 5385/12384 [11:25:22<14:48:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 43%|████▎ | 5385/12384 [11:25:29<14:48:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 43%|████▎ | 5386/12384 [11:25:29<14:47:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 43%|████▎ | 5386/12384 [11:25:37<14:47:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 43%|████▎ | 5387/12384 [11:25:37<14:48:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 43%|████▎ | 5387/12384 [11:25:44<14:48:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 1: 44%|████▎ | 5388/12384 [11:25:44<14:48:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 1: 44%|████▎ | 5388/12384 [11:25:52<14:48:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.37s]
Epoch 1: 44%|████▎ | 5389/12384 [11:25:52<14:48:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.37s]
Epoch 1: 44%|████▎ | 5389/12384 [11:26:00<14:48:25, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.48s]
Epoch 1: 44%|████▎ | 5390/12384 [11:26:00<14:48:09, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.48s]
Epoch 1: 44%|████▎ | 5390/12384 [11:26:07<14:48:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 44%|████▎ | 5391/12384 [11:26:07<14:48:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 44%|████▎ | 5391/12384 [11:26:15<14:48:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 44%|████▎ | 5392/12384 [11:26:15<14:49:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 44%|████▎ | 5392/12384 [11:26:23<14:49:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 1: 44%|████▎ | 5393/12384 [11:26:23<14:47:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 1: 44%|████▎ | 5393/12384 [11:26:31<14:47:43, 7.62s/it, loss=0.0004, acc=0.9986, iter_time=8.23s]
Epoch 1: 44%|████▎ | 5394/12384 [11:26:31<14:57:39, 7.71s/it, loss=0.0004, acc=0.9986, iter_time=8.23s]
Epoch 1: 44%|████▎ | 5394/12384 [11:26:38<14:57:39, 7.71s/it, loss=0.0013, acc=0.9974, iter_time=7.86s]
Epoch 1: 44%|████▎ | 5395/12384 [11:26:38<14:54:15, 7.68s/it, loss=0.0013, acc=0.9974, iter_time=7.86s]
Epoch 1: 44%|████▎ | 5395/12384 [11:26:46<14:54:15, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 1: 44%|████▎ | 5396/12384 [11:26:46<14:51:48, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 1: 44%|████▎ | 5396/12384 [11:26:53<14:51:48, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 1: 44%|████▎ | 5397/12384 [11:26:53<14:50:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 1: 44%|████▎ | 5397/12384 [11:27:01<14:50:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 44%|████▎ | 5398/12384 [11:27:01<14:49:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 44%|████▎ | 5398/12384 [11:27:09<14:49:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 1: 44%|████▎ | 5399/12384 [11:27:09<14:48:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 1: 44%|████▎ | 5399/12384 [11:27:16<14:48:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 1: 44%|████▎ | 5400/12384 [11:27:16<14:47:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 1: 44%|████▎ | 5400/12384 [11:27:24<14:47:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 44%|████▎ | 5401/12384 [11:27:24<14:47:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 44%|████▎ | 5401/12384 [11:27:31<14:47:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 1: 44%|████▎ | 5402/12384 [11:27:31<14:46:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 1: 44%|████▎ | 5402/12384 [11:27:39<14:46:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 1: 44%|████▎ | 5403/12384 [11:27:39<14:45:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 1: 44%|████▎ | 5403/12384 [11:27:47<14:45:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.10s]
Epoch 1: 44%|████▎ | 5404/12384 [11:27:47<14:46:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.10s]
Epoch 1: 44%|████▎ | 5404/12384 [11:27:54<14:46:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 44%|████▎ | 5405/12384 [11:27:54<14:46:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 44%|████▎ | 5405/12384 [11:28:02<14:46:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 1: 44%|████▎ | 5406/12384 [11:28:02<14:46:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 1: 44%|████▎ | 5406/12384 [11:28:09<14:46:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 1: 44%|████▎ | 5407/12384 [11:28:09<14:45:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 1: 44%|████▎ | 5407/12384 [11:28:17<14:45:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 44%|████▎ | 5408/12384 [11:28:17<14:45:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 44%|████▎ | 5408/12384 [11:28:25<14:45:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 44%|████▎ | 5409/12384 [11:28:25<14:44:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 44%|████▎ | 5409/12384 [11:28:32<14:44:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 44%|████▎ | 5410/12384 [11:28:32<14:43:48, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 44%|████▎ | 5410/12384 [11:28:40<14:43:48, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.05s]
Epoch 1: 44%|████▎ | 5411/12384 [11:28:40<14:44:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.05s]
Epoch 1: 44%|████▎ | 5411/12384 [11:28:48<14:44:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 1: 44%|████▎ | 5412/12384 [11:28:48<14:44:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 1: 44%|████▎ | 5412/12384 [11:28:55<14:44:51, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=5.81s]
Epoch 1: 44%|████▎ | 5413/12384 [11:28:55<14:48:11, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=5.81s]
Epoch 1: 44%|████▎ | 5413/12384 [11:29:03<14:48:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.52s]
Epoch 1: 44%|████▎ | 5414/12384 [11:29:03<14:47:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.52s]
Epoch 1: 44%|████▎ | 5414/12384 [11:29:10<14:47:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 44%|████▎ | 5415/12384 [11:29:10<14:46:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 44%|████▎ | 5415/12384 [11:29:18<14:46:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 44%|████▎ | 5416/12384 [11:29:18<14:44:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 44%|████▎ | 5416/12384 [11:29:26<14:44:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 44%|████▎ | 5417/12384 [11:29:26<14:44:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 44%|████▎ | 5417/12384 [11:29:33<14:44:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 44%|████▍ | 5418/12384 [11:29:33<14:43:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 44%|████▍ | 5418/12384 [11:29:41<14:43:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 44%|████▍ | 5419/12384 [11:29:41<14:45:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 44%|████▍ | 5419/12384 [11:29:49<14:45:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 1: 44%|████▍ | 5420/12384 [11:29:49<14:44:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 1: 44%|████▍ | 5420/12384 [11:29:56<14:44:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 1: 44%|████▍ | 5421/12384 [11:29:56<14:54:48, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 1: 44%|████▍ | 5421/12384 [11:30:04<14:54:48, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 1: 44%|████▍ | 5422/12384 [11:30:04<14:51:09, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 1: 44%|████▍ | 5422/12384 [11:30:12<14:51:09, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 1: 44%|████▍ | 5423/12384 [11:30:12<14:49:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 1: 44%|████▍ | 5423/12384 [11:30:19<14:49:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 44%|████▍ | 5424/12384 [11:30:19<14:46:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 44%|████▍ | 5424/12384 [11:30:27<14:46:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 1: 44%|████▍ | 5425/12384 [11:30:27<14:48:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 1: 44%|████▍ | 5425/12384 [11:30:35<14:48:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 44%|████▍ | 5426/12384 [11:30:35<14:50:00, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 44%|████▍ | 5426/12384 [11:30:42<14:50:00, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 44%|████▍ | 5427/12384 [11:30:42<14:47:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 44%|████▍ | 5427/12384 [11:30:50<14:47:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 44%|████▍ | 5428/12384 [11:30:50<14:45:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 44%|████▍ | 5428/12384 [11:30:58<14:45:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 44%|████▍ | 5429/12384 [11:30:58<14:44:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 44%|████▍ | 5429/12384 [11:31:05<14:44:25, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.55s]
Epoch 1: 44%|████▍ | 5430/12384 [11:31:05<14:44:01, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.55s]
Epoch 1: 44%|████▍ | 5430/12384 [11:31:13<14:44:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 1: 44%|████▍ | 5431/12384 [11:31:13<14:43:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 1: 44%|████▍ | 5431/12384 [11:31:20<14:43:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.30s]
Epoch 1: 44%|████▍ | 5432/12384 [11:31:20<14:43:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.30s]
Epoch 1: 44%|████▍ | 5432/12384 [11:31:28<14:43:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 44%|████▍ | 5433/12384 [11:31:28<14:45:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 44%|████▍ | 5433/12384 [11:31:36<14:45:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.11s]
Epoch 1: 44%|████▍ | 5434/12384 [11:31:36<14:43:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.11s]
Epoch 1: 44%|████▍ | 5434/12384 [11:31:43<14:43:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 1: 44%|████▍ | 5435/12384 [11:31:43<14:42:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 1: 44%|████▍ | 5435/12384 [11:31:51<14:42:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 1: 44%|████▍ | 5436/12384 [11:31:51<14:41:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 1: 44%|████▍ | 5436/12384 [11:31:59<14:41:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 1: 44%|████▍ | 5437/12384 [11:31:59<14:42:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 1: 44%|████▍ | 5437/12384 [11:32:06<14:42:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 1: 44%|████▍ | 5438/12384 [11:32:06<14:43:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 1: 44%|████▍ | 5438/12384 [11:32:14<14:43:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 1: 44%|████▍ | 5439/12384 [11:32:14<14:43:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 1: 44%|████▍ | 5439/12384 [11:32:21<14:43:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 44%|████▍ | 5440/12384 [11:32:21<14:43:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 44%|████▍ | 5440/12384 [11:32:29<14:43:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 44%|████▍ | 5441/12384 [11:32:29<14:42:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 44%|████▍ | 5441/12384 [11:32:37<14:42:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 44%|████▍ | 5442/12384 [11:32:37<14:44:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 44%|████▍ | 5442/12384 [11:32:44<14:44:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 44%|████▍ | 5443/12384 [11:32:44<14:42:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 44%|████▍ | 5443/12384 [11:32:52<14:42:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 1: 44%|████▍ | 5444/12384 [11:32:52<14:42:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 1: 44%|████▍ | 5444/12384 [11:33:00<14:42:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 1: 44%|████▍ | 5445/12384 [11:33:00<14:41:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 1: 44%|████▍ | 5445/12384 [11:33:07<14:41:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 44%|████▍ | 5446/12384 [11:33:07<14:40:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 44%|████▍ | 5446/12384 [11:33:15<14:40:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.52s]
Epoch 1: 44%|████▍ | 5447/12384 [11:33:15<14:52:57, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=4.52s]
Epoch 1: 44%|████▍ | 5447/12384 [11:33:23<14:52:57, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=11.43s]
Epoch 1: 44%|████▍ | 5448/12384 [11:33:23<14:49:05, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=11.43s]
Epoch 1: 44%|████▍ | 5448/12384 [11:33:30<14:49:05, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=3.94s]
Epoch 1: 44%|████▍ | 5449/12384 [11:33:30<14:48:05, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=3.94s]
Epoch 1: 44%|████▍ | 5449/12384 [11:33:38<14:48:05, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.96s]
Epoch 1: 44%|████▍ | 5450/12384 [11:33:38<14:45:59, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.96s]
Epoch 1: 44%|████▍ | 5450/12384 [11:33:46<14:45:59, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 44%|████▍ | 5451/12384 [11:33:46<14:43:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 44%|████▍ | 5451/12384 [11:33:53<14:43:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 1: 44%|████▍ | 5452/12384 [11:33:53<14:41:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 1: 44%|████▍ | 5452/12384 [11:34:01<14:41:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 1: 44%|████▍ | 5453/12384 [11:34:01<14:40:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 1: 44%|████▍ | 5453/12384 [11:34:08<14:40:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 1: 44%|████▍ | 5454/12384 [11:34:08<14:40:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 1: 44%|████▍ | 5454/12384 [11:34:16<14:40:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 1: 44%|████▍ | 5455/12384 [11:34:16<14:40:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 1: 44%|████▍ | 5455/12384 [11:34:24<14:40:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 44%|████▍ | 5456/12384 [11:34:24<14:38:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 44%|████▍ | 5456/12384 [11:34:31<14:38:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 44%|████▍ | 5457/12384 [11:34:31<14:38:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 44%|████▍ | 5457/12384 [11:34:39<14:38:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 1: 44%|████▍ | 5458/12384 [11:34:39<14:39:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 1: 44%|████▍ | 5458/12384 [11:34:47<14:39:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 44%|████▍ | 5459/12384 [11:34:47<14:50:40, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 44%|████▍ | 5459/12384 [11:34:54<14:50:40, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 1: 44%|████▍ | 5460/12384 [11:34:54<14:46:38, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 1: 44%|████▍ | 5460/12384 [11:35:02<14:46:38, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 44%|████▍ | 5461/12384 [11:35:02<14:43:40, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 44%|████▍ | 5461/12384 [11:35:10<14:43:40, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 1: 44%|████▍ | 5462/12384 [11:35:10<14:41:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 1: 44%|████▍ | 5462/12384 [11:35:17<14:41:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 44%|████▍ | 5463/12384 [11:35:17<14:41:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 44%|████▍ | 5463/12384 [11:35:25<14:41:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.34s]
Epoch 1: 44%|████▍ | 5464/12384 [11:35:25<14:40:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.34s]
Epoch 1: 44%|████▍ | 5464/12384 [11:35:33<14:40:11, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.23s]
Epoch 1: 44%|████▍ | 5465/12384 [11:35:33<14:39:22, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.23s]
Epoch 1: 44%|████▍ | 5465/12384 [11:35:40<14:39:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 44%|████▍ | 5466/12384 [11:35:40<14:38:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 44%|████▍ | 5466/12384 [11:35:48<14:38:51, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.20s]
Epoch 1: 44%|████▍ | 5467/12384 [11:35:48<14:38:16, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.20s]
Epoch 1: 44%|████▍ | 5467/12384 [11:35:55<14:38:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 1: 44%|████▍ | 5468/12384 [11:35:55<14:37:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 1: 44%|████▍ | 5468/12384 [11:36:03<14:37:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.60s]
Epoch 1: 44%|████▍ | 5469/12384 [11:36:03<14:37:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.60s]
Epoch 1: 44%|████▍ | 5469/12384 [11:36:11<14:37:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.12s]
Epoch 1: 44%|████▍ | 5470/12384 [11:36:11<14:36:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.12s]
Epoch 1: 44%|████▍ | 5470/12384 [11:36:18<14:36:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.41s]
Epoch 1: 44%|████▍ | 5471/12384 [11:36:18<14:36:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.41s]
Epoch 1: 44%|████▍ | 5471/12384 [11:36:26<14:36:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 44%|████▍ | 5472/12384 [11:36:26<14:37:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 44%|████▍ | 5472/12384 [11:36:34<14:37:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.00s]
Epoch 1: 44%|████▍ | 5473/12384 [11:36:34<14:48:42, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.00s]
Epoch 1: 44%|████▍ | 5473/12384 [11:36:41<14:48:42, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 1: 44%|████▍ | 5474/12384 [11:36:41<14:46:09, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 1: 44%|████▍ | 5474/12384 [11:36:49<14:46:09, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 44%|████▍ | 5475/12384 [11:36:49<14:43:20, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 44%|████▍ | 5475/12384 [11:36:57<14:43:20, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 1: 44%|████▍ | 5476/12384 [11:36:57<14:40:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 1: 44%|████▍ | 5476/12384 [11:37:04<14:40:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 44%|████▍ | 5477/12384 [11:37:04<14:38:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 44%|████▍ | 5477/12384 [11:37:12<14:38:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 1: 44%|████▍ | 5478/12384 [11:37:12<14:40:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 1: 44%|████▍ | 5478/12384 [11:37:20<14:40:20, 7.65s/it, loss=0.0011, acc=1.0000, iter_time=9.11s]
Epoch 1: 44%|████▍ | 5479/12384 [11:37:20<14:39:25, 7.64s/it, loss=0.0011, acc=1.0000, iter_time=9.11s]
Epoch 1: 44%|████▍ | 5479/12384 [11:37:27<14:39:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 44%|████▍ | 5480/12384 [11:37:27<14:38:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 44%|████▍ | 5480/12384 [11:37:35<14:38:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 1: 44%|████▍ | 5481/12384 [11:37:35<14:37:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 1: 44%|████▍ | 5481/12384 [11:37:42<14:37:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 1: 44%|████▍ | 5482/12384 [11:37:42<14:37:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 1: 44%|████▍ | 5482/12384 [11:37:50<14:37:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 1: 44%|████▍ | 5483/12384 [11:37:50<14:37:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 1: 44%|████▍ | 5483/12384 [11:37:58<14:37:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.62s]
Epoch 1: 44%|████▍ | 5484/12384 [11:37:58<14:36:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.62s]
Epoch 1: 44%|████▍ | 5484/12384 [11:38:06<14:36:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 44%|████▍ | 5485/12384 [11:38:06<14:45:06, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 44%|████▍ | 5485/12384 [11:38:13<14:45:06, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 44%|████▍ | 5486/12384 [11:38:13<14:41:33, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 44%|████▍ | 5486/12384 [11:38:21<14:41:33, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 1: 44%|████▍ | 5487/12384 [11:38:21<14:39:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 1: 44%|████▍ | 5487/12384 [11:38:28<14:39:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.21s]
Epoch 1: 44%|████▍ | 5488/12384 [11:38:28<14:37:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.21s]
Epoch 1: 44%|████▍ | 5488/12384 [11:38:36<14:37:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.43s]
Epoch 1: 44%|████▍ | 5489/12384 [11:38:36<14:36:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.43s]
Epoch 1: 44%|████▍ | 5489/12384 [11:38:44<14:36:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 44%|████▍ | 5490/12384 [11:38:44<14:36:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 44%|████▍ | 5490/12384 [11:38:51<14:36:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 1: 44%|████▍ | 5491/12384 [11:38:51<14:36:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 1: 44%|████▍ | 5491/12384 [11:38:59<14:36:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 44%|████▍ | 5492/12384 [11:38:59<14:34:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 44%|████▍ | 5492/12384 [11:39:06<14:34:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 44%|████▍ | 5493/12384 [11:39:06<14:33:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 44%|████▍ | 5493/12384 [11:39:14<14:33:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 1: 44%|████▍ | 5494/12384 [11:39:14<14:34:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 1: 44%|████▍ | 5494/12384 [11:39:22<14:34:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 1: 44%|████▍ | 5495/12384 [11:39:22<14:34:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 1: 44%|████▍ | 5495/12384 [11:39:29<14:34:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 44%|████▍ | 5496/12384 [11:39:29<14:33:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 44%|████▍ | 5496/12384 [11:39:37<14:33:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 1: 44%|████▍ | 5497/12384 [11:39:37<14:34:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 1: 44%|████▍ | 5497/12384 [11:39:44<14:34:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 1: 44%|████▍ | 5498/12384 [11:39:44<14:33:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 1: 44%|████▍ | 5498/12384 [11:39:52<14:33:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 1: 44%|████▍ | 5499/12384 [11:39:52<14:44:19, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 1: 44%|████▍ | 5499/12384 [11:40:00<14:44:19, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 44%|████▍ | 5500/12384 [11:40:00<14:41:13, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 44%|████▍ | 5500/12384 [11:40:08<14:41:13, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 44%|████▍ | 5501/12384 [11:40:08<14:37:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 44%|████▍ | 5501/12384 [11:40:15<14:37:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 44%|████▍ | 5502/12384 [11:40:15<14:35:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 44%|████▍ | 5502/12384 [11:40:23<14:35:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 1: 44%|████▍ | 5503/12384 [11:40:23<14:33:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 1: 44%|████▍ | 5503/12384 [11:40:30<14:33:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.75s]
Epoch 1: 44%|████▍ | 5504/12384 [11:40:30<14:33:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.75s]
Epoch 1: 44%|████▍ | 5504/12384 [11:40:38<14:33:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.68s]
Epoch 1: 44%|████▍ | 5505/12384 [11:40:38<14:32:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.68s]
Epoch 1: 44%|████▍ | 5505/12384 [11:40:46<14:32:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 1: 44%|████▍ | 5506/12384 [11:40:46<14:31:41, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 1: 44%|████▍ | 5506/12384 [11:40:53<14:31:41, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 1: 44%|████▍ | 5507/12384 [11:40:53<14:31:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 1: 44%|████▍ | 5507/12384 [11:41:01<14:31:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 44%|████▍ | 5508/12384 [11:41:01<14:31:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 44%|████▍ | 5508/12384 [11:41:08<14:31:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 1: 44%|████▍ | 5509/12384 [11:41:08<14:33:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 1: 44%|████▍ | 5509/12384 [11:41:16<14:33:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 44%|████▍ | 5510/12384 [11:41:16<14:32:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 44%|████▍ | 5510/12384 [11:41:24<14:32:24, 7.61s/it, loss=0.0018, acc=0.9974, iter_time=7.92s]
Epoch 1: 45%|████▍ | 5511/12384 [11:41:24<14:42:41, 7.71s/it, loss=0.0018, acc=0.9974, iter_time=7.92s]
Epoch 1: 45%|████▍ | 5511/12384 [11:41:32<14:42:41, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 45%|████▍ | 5512/12384 [11:41:32<14:40:10, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 45%|████▍ | 5512/12384 [11:41:39<14:40:10, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 45%|████▍ | 5513/12384 [11:41:39<14:36:50, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 45%|████▍ | 5513/12384 [11:41:47<14:36:50, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=5.83s]
Epoch 1: 45%|████▍ | 5514/12384 [11:41:47<14:35:31, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=5.83s]
Epoch 1: 45%|████▍ | 5514/12384 [11:41:54<14:35:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 45%|████▍ | 5515/12384 [11:41:54<14:34:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 45%|████▍ | 5515/12384 [11:42:02<14:34:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 45%|████▍ | 5516/12384 [11:42:02<14:33:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 45%|████▍ | 5516/12384 [11:42:10<14:33:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 45%|████▍ | 5517/12384 [11:42:10<14:33:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 45%|████▍ | 5517/12384 [11:42:17<14:33:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 45%|████▍ | 5518/12384 [11:42:17<14:31:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 45%|████▍ | 5518/12384 [11:42:25<14:31:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 45%|████▍ | 5519/12384 [11:42:25<14:30:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 45%|████▍ | 5519/12384 [11:42:32<14:30:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 45%|████▍ | 5520/12384 [11:42:32<14:30:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 45%|████▍ | 5520/12384 [11:42:40<14:30:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 45%|████▍ | 5521/12384 [11:42:40<14:30:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 45%|████▍ | 5521/12384 [11:42:48<14:30:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 45%|████▍ | 5522/12384 [11:42:48<14:30:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 45%|████▍ | 5522/12384 [11:42:55<14:30:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 1: 45%|████▍ | 5523/12384 [11:42:55<14:30:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 1: 45%|████▍ | 5523/12384 [11:43:03<14:30:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 1: 45%|████▍ | 5524/12384 [11:43:03<14:31:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 1: 45%|████▍ | 5524/12384 [11:43:11<14:31:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 45%|████▍ | 5525/12384 [11:43:11<14:42:53, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 45%|████▍ | 5525/12384 [11:43:18<14:42:53, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 45%|████▍ | 5526/12384 [11:43:18<14:38:20, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 45%|████▍ | 5526/12384 [11:43:26<14:38:20, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 45%|████▍ | 5527/12384 [11:43:26<14:36:10, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 45%|████▍ | 5527/12384 [11:43:34<14:36:10, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 45%|████▍ | 5528/12384 [11:43:34<14:34:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 45%|████▍ | 5528/12384 [11:43:41<14:34:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=3.94s]
Epoch 1: 45%|████▍ | 5529/12384 [11:43:41<14:33:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.94s]
Epoch 1: 45%|████▍ | 5529/12384 [11:43:49<14:33:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.92s]
Epoch 1: 45%|████▍ | 5530/12384 [11:43:49<14:32:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.92s]
Epoch 1: 45%|████▍ | 5530/12384 [11:43:57<14:32:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 45%|████▍ | 5531/12384 [11:43:57<14:31:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 45%|████▍ | 5531/12384 [11:44:04<14:31:35, 7.63s/it, loss=0.0013, acc=0.9949, iter_time=7.61s]
Epoch 1: 45%|████▍ | 5532/12384 [11:44:04<14:29:58, 7.62s/it, loss=0.0013, acc=0.9949, iter_time=7.61s]
Epoch 1: 45%|████▍ | 5532/12384 [11:44:12<14:29:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 45%|████▍ | 5533/12384 [11:44:12<14:29:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 45%|████▍ | 5533/12384 [11:44:19<14:29:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 45%|████▍ | 5534/12384 [11:44:19<14:31:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 45%|████▍ | 5534/12384 [11:44:27<14:31:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 45%|████▍ | 5535/12384 [11:44:27<14:31:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 45%|████▍ | 5535/12384 [11:44:35<14:31:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 45%|████▍ | 5536/12384 [11:44:35<14:30:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 45%|████▍ | 5536/12384 [11:44:42<14:30:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 1: 45%|████▍ | 5537/12384 [11:44:42<14:33:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 1: 45%|████▍ | 5537/12384 [11:44:50<14:33:02, 7.65s/it, loss=0.0030, acc=0.9907, iter_time=6.92s]
Epoch 1: 45%|████▍ | 5538/12384 [11:44:50<14:31:11, 7.64s/it, loss=0.0030, acc=0.9907, iter_time=6.92s]
Epoch 1: 45%|████▍ | 5538/12384 [11:44:58<14:31:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.58s]
Epoch 1: 45%|████▍ | 5539/12384 [11:44:58<14:29:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.58s]
Epoch 1: 45%|████▍ | 5539/12384 [11:45:05<14:29:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.62s]
Epoch 1: 45%|████▍ | 5540/12384 [11:45:05<14:28:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.62s]
Epoch 1: 45%|████▍ | 5540/12384 [11:45:13<14:28:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.05s]
Epoch 1: 45%|████▍ | 5541/12384 [11:45:13<14:28:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.05s]
Epoch 1: 45%|████▍ | 5541/12384 [11:45:20<14:28:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 1: 45%|████▍ | 5542/12384 [11:45:20<14:29:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 1: 45%|████▍ | 5542/12384 [11:45:28<14:29:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 1: 45%|████▍ | 5543/12384 [11:45:28<14:28:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 1: 45%|████▍ | 5543/12384 [11:45:36<14:28:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.64s]
Epoch 1: 45%|████▍ | 5544/12384 [11:45:36<14:30:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.64s]
Epoch 1: 45%|████▍ | 5544/12384 [11:45:43<14:30:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 45%|████▍ | 5545/12384 [11:45:43<14:28:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 45%|████▍ | 5545/12384 [11:45:51<14:28:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 45%|████▍ | 5546/12384 [11:45:51<14:28:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 45%|████▍ | 5546/12384 [11:45:59<14:28:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 45%|████▍ | 5547/12384 [11:45:59<14:27:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 45%|████▍ | 5547/12384 [11:46:06<14:27:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 1: 45%|████▍ | 5548/12384 [11:46:06<14:26:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 1: 45%|████▍ | 5548/12384 [11:46:14<14:26:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 1: 45%|████▍ | 5549/12384 [11:46:14<14:26:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 1: 45%|████▍ | 5549/12384 [11:46:21<14:26:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 45%|████▍ | 5550/12384 [11:46:21<14:25:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 45%|████▍ | 5550/12384 [11:46:29<14:25:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 1: 45%|████▍ | 5551/12384 [11:46:29<14:24:23, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 1: 45%|████▍ | 5551/12384 [11:46:37<14:24:23, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 1: 45%|████▍ | 5552/12384 [11:46:37<14:36:03, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 1: 45%|████▍ | 5552/12384 [11:46:45<14:36:03, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 45%|████▍ | 5553/12384 [11:46:45<14:36:26, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 45%|████▍ | 5553/12384 [11:46:52<14:36:26, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.72s]
Epoch 1: 45%|████▍ | 5554/12384 [11:46:52<14:33:50, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.72s]
Epoch 1: 45%|████▍ | 5554/12384 [11:47:00<14:33:50, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 45%|████▍ | 5555/12384 [11:47:00<14:30:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 45%|████▍ | 5555/12384 [11:47:07<14:30:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 45%|████▍ | 5556/12384 [11:47:07<14:28:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 45%|████▍ | 5556/12384 [11:47:15<14:28:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 1: 45%|████▍ | 5557/12384 [11:47:15<14:27:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 1: 45%|████▍ | 5557/12384 [11:47:23<14:27:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.75s]
Epoch 1: 45%|████▍ | 5558/12384 [11:47:23<14:26:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.75s]
Epoch 1: 45%|████▍ | 5558/12384 [11:47:30<14:26:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 1: 45%|████▍ | 5559/12384 [11:47:30<14:25:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 1: 45%|████▍ | 5559/12384 [11:47:38<14:25:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.89s]
Epoch 1: 45%|████▍ | 5560/12384 [11:47:38<14:24:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.89s]
Epoch 1: 45%|████▍ | 5560/12384 [11:47:45<14:24:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 45%|████▍ | 5561/12384 [11:47:45<14:24:23, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 45%|████▍ | 5561/12384 [11:47:53<14:24:23, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 1: 45%|████▍ | 5562/12384 [11:47:53<14:24:27, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 1: 45%|████▍ | 5562/12384 [11:48:01<14:24:27, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 1: 45%|████▍ | 5563/12384 [11:48:01<14:24:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 1: 45%|████▍ | 5563/12384 [11:48:08<14:24:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 45%|████▍ | 5564/12384 [11:48:08<14:27:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 45%|████▍ | 5564/12384 [11:48:16<14:27:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.30s]
Epoch 1: 45%|████▍ | 5565/12384 [11:48:16<14:26:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.30s]
Epoch 1: 45%|████▍ | 5565/12384 [11:48:23<14:26:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 45%|████▍ | 5566/12384 [11:48:23<14:25:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 45%|████▍ | 5566/12384 [11:48:31<14:25:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.40s]
Epoch 1: 45%|████▍ | 5567/12384 [11:48:31<14:25:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.40s]
Epoch 1: 45%|████▍ | 5567/12384 [11:48:39<14:25:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 1: 45%|████▍ | 5568/12384 [11:48:39<14:25:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 1: 45%|████▍ | 5568/12384 [11:48:46<14:25:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 45%|████▍ | 5569/12384 [11:48:46<14:25:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 45%|████▍ | 5569/12384 [11:48:54<14:25:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 45%|████▍ | 5570/12384 [11:48:54<14:25:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 45%|████▍ | 5570/12384 [11:49:02<14:25:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 45%|████▍ | 5571/12384 [11:49:02<14:24:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 45%|████▍ | 5571/12384 [11:49:09<14:24:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 1: 45%|████▍ | 5572/12384 [11:49:09<14:24:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 1: 45%|████▍ | 5572/12384 [11:49:17<14:24:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 1: 45%|████▌ | 5573/12384 [11:49:17<14:24:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 1: 45%|████▌ | 5573/12384 [11:49:24<14:24:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 45%|████▌ | 5574/12384 [11:49:24<14:23:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 45%|████▌ | 5574/12384 [11:49:32<14:23:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 45%|████▌ | 5575/12384 [11:49:32<14:23:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 45%|████▌ | 5575/12384 [11:49:40<14:23:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 1: 45%|████▌ | 5576/12384 [11:49:40<14:26:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 1: 45%|████▌ | 5576/12384 [11:49:47<14:26:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 45%|████▌ | 5577/12384 [11:49:47<14:26:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 45%|████▌ | 5577/12384 [11:49:55<14:26:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 45%|████▌ | 5578/12384 [11:49:55<14:36:46, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 45%|████▌ | 5578/12384 [11:50:03<14:36:46, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 45%|████▌ | 5579/12384 [11:50:03<14:32:58, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 45%|████▌ | 5579/12384 [11:50:10<14:32:58, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 45%|████▌ | 5580/12384 [11:50:10<14:30:10, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 45%|████▌ | 5580/12384 [11:50:18<14:30:10, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 45%|████▌ | 5581/12384 [11:50:18<14:27:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 45%|████▌ | 5581/12384 [11:50:26<14:27:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 45%|████▌ | 5582/12384 [11:50:26<14:26:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 45%|████▌ | 5582/12384 [11:50:33<14:26:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 1: 45%|████▌ | 5583/12384 [11:50:33<14:25:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 1: 45%|████▌ | 5583/12384 [11:50:41<14:25:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.52s]
Epoch 1: 45%|████▌ | 5584/12384 [11:50:41<14:23:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.52s]
Epoch 1: 45%|████▌ | 5584/12384 [11:50:49<14:23:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.59s]
Epoch 1: 45%|████▌ | 5585/12384 [11:50:49<14:22:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.59s]
Epoch 1: 45%|████▌ | 5585/12384 [11:50:56<14:22:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 1: 45%|████▌ | 5586/12384 [11:50:56<14:23:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 1: 45%|████▌ | 5586/12384 [11:51:04<14:23:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 45%|████▌ | 5587/12384 [11:51:04<14:22:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 45%|████▌ | 5587/12384 [11:51:11<14:22:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 45%|████▌ | 5588/12384 [11:51:11<14:22:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 45%|████▌ | 5588/12384 [11:51:19<14:22:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 45%|████▌ | 5589/12384 [11:51:19<14:23:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 45%|████▌ | 5589/12384 [11:51:27<14:23:17, 7.62s/it, loss=0.0005, acc=0.9987, iter_time=7.93s]
Epoch 1: 45%|████▌ | 5590/12384 [11:51:27<14:31:57, 7.70s/it, loss=0.0005, acc=0.9987, iter_time=7.93s]
Epoch 1: 45%|████▌ | 5590/12384 [11:51:35<14:31:57, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 1: 45%|████▌ | 5591/12384 [11:51:35<14:28:41, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 1: 45%|████▌ | 5591/12384 [11:51:42<14:28:41, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.67s]
Epoch 1: 45%|████▌ | 5592/12384 [11:51:42<14:26:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.67s]
Epoch 1: 45%|████▌ | 5592/12384 [11:51:50<14:26:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 1: 45%|████▌ | 5593/12384 [11:51:50<14:23:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 1: 45%|████▌ | 5593/12384 [11:51:57<14:23:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 1: 45%|████▌ | 5594/12384 [11:51:57<14:23:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 1: 45%|████▌ | 5594/12384 [11:52:05<14:23:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 1: 45%|████▌ | 5595/12384 [11:52:05<14:22:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 1: 45%|████▌ | 5595/12384 [11:52:13<14:22:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 45%|████▌ | 5596/12384 [11:52:13<14:21:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 45%|████▌ | 5596/12384 [11:52:20<14:21:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 45%|████▌ | 5597/12384 [11:52:20<14:20:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 45%|████▌ | 5597/12384 [11:52:28<14:20:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 1: 45%|████▌ | 5598/12384 [11:52:28<14:20:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 1: 45%|████▌ | 5598/12384 [11:52:35<14:20:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.37s]
Epoch 1: 45%|████▌ | 5599/12384 [11:52:35<14:20:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.37s]
Epoch 1: 45%|████▌ | 5599/12384 [11:52:43<14:20:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 45%|████▌ | 5600/12384 [11:52:43<14:21:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 45%|████▌ | 5600/12384 [11:52:51<14:21:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.92s]
Epoch 1: 45%|████▌ | 5601/12384 [11:52:51<14:21:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.92s]
Epoch 1: 45%|████▌ | 5601/12384 [11:52:58<14:21:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 1: 45%|████▌ | 5602/12384 [11:52:58<14:19:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 1: 45%|████▌ | 5602/12384 [11:53:06<14:19:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 1: 45%|████▌ | 5603/12384 [11:53:06<14:19:27, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 1: 45%|████▌ | 5603/12384 [11:53:13<14:19:27, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.80s]
Epoch 1: 45%|████▌ | 5604/12384 [11:53:13<14:19:10, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.80s]
Epoch 1: 45%|████▌ | 5604/12384 [11:53:21<14:19:10, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 1: 45%|████▌ | 5605/12384 [11:53:21<14:30:55, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 1: 45%|████▌ | 5605/12384 [11:53:29<14:30:55, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 45%|████▌ | 5606/12384 [11:53:29<14:28:29, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 45%|████▌ | 5606/12384 [11:53:37<14:28:29, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 45%|████▌ | 5607/12384 [11:53:37<14:26:00, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 45%|████▌ | 5607/12384 [11:53:44<14:26:00, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 45%|████▌ | 5608/12384 [11:53:44<14:23:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 45%|████▌ | 5608/12384 [11:53:52<14:23:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 45%|████▌ | 5609/12384 [11:53:52<14:23:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 45%|████▌ | 5609/12384 [11:53:59<14:23:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 1: 45%|████▌ | 5610/12384 [11:53:59<14:22:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 1: 45%|████▌ | 5610/12384 [11:54:07<14:22:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 1: 45%|████▌ | 5611/12384 [11:54:07<14:21:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 1: 45%|████▌ | 5611/12384 [11:54:15<14:21:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 45%|████▌ | 5612/12384 [11:54:15<14:20:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 45%|████▌ | 5612/12384 [11:54:22<14:20:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 45%|████▌ | 5613/12384 [11:54:22<14:19:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 45%|████▌ | 5613/12384 [11:54:30<14:19:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 1: 45%|████▌ | 5614/12384 [11:54:30<14:19:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 1: 45%|████▌ | 5614/12384 [11:54:37<14:19:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 1: 45%|████▌ | 5615/12384 [11:54:37<14:19:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 1: 45%|████▌ | 5615/12384 [11:54:45<14:19:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.05s]
Epoch 1: 45%|████▌ | 5616/12384 [11:54:45<14:26:20, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.05s]
Epoch 1: 45%|████▌ | 5616/12384 [11:54:53<14:26:20, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 1: 45%|████▌ | 5617/12384 [11:54:53<14:23:40, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 1: 45%|████▌ | 5617/12384 [11:55:01<14:23:40, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.45s]
Epoch 1: 45%|████▌ | 5618/12384 [11:55:01<14:21:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.45s]
Epoch 1: 45%|████▌ | 5618/12384 [11:55:08<14:21:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 45%|████▌ | 5619/12384 [11:55:08<14:21:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 45%|████▌ | 5619/12384 [11:55:16<14:21:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 1: 45%|████▌ | 5620/12384 [11:55:16<14:20:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 1: 45%|████▌ | 5620/12384 [11:55:23<14:20:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 1: 45%|████▌ | 5621/12384 [11:55:23<14:19:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 1: 45%|████▌ | 5621/12384 [11:55:31<14:19:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 45%|████▌ | 5622/12384 [11:55:31<14:19:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 45%|████▌ | 5622/12384 [11:55:39<14:19:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 45%|████▌ | 5623/12384 [11:55:39<14:18:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 45%|████▌ | 5623/12384 [11:55:46<14:18:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 45%|████▌ | 5624/12384 [11:55:46<14:19:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 45%|████▌ | 5624/12384 [11:55:54<14:19:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 45%|████▌ | 5625/12384 [11:55:54<14:18:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 45%|████▌ | 5625/12384 [11:56:01<14:18:57, 7.63s/it, loss=0.0001, acc=0.9992, iter_time=7.65s]
Epoch 1: 45%|████▌ | 5626/12384 [11:56:01<14:18:36, 7.62s/it, loss=0.0001, acc=0.9992, iter_time=7.65s]
Epoch 1: 45%|████▌ | 5626/12384 [11:56:09<14:18:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 1: 45%|████▌ | 5627/12384 [11:56:09<14:17:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 1: 45%|████▌ | 5627/12384 [11:56:17<14:17:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 1: 45%|████▌ | 5628/12384 [11:56:17<14:17:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 1: 45%|████▌ | 5628/12384 [11:56:24<14:17:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 45%|████▌ | 5629/12384 [11:56:24<14:16:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 45%|████▌ | 5629/12384 [11:56:32<14:16:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 45%|████▌ | 5630/12384 [11:56:32<14:17:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 45%|████▌ | 5630/12384 [11:56:40<14:17:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 45%|████▌ | 5631/12384 [11:56:40<14:27:11, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 45%|████▌ | 5631/12384 [11:56:47<14:27:11, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 45%|████▌ | 5632/12384 [11:56:47<14:23:31, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 45%|████▌ | 5632/12384 [11:56:55<14:23:31, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 45%|████▌ | 5633/12384 [11:56:55<14:20:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 45%|████▌ | 5633/12384 [11:57:03<14:20:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 45%|████▌ | 5634/12384 [11:57:03<14:18:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 45%|████▌ | 5634/12384 [11:57:10<14:18:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 46%|████▌ | 5635/12384 [11:57:10<14:18:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 46%|████▌ | 5635/12384 [11:57:18<14:18:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 1: 46%|████▌ | 5636/12384 [11:57:18<14:16:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 1: 46%|████▌ | 5636/12384 [11:57:25<14:16:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 1: 46%|████▌ | 5637/12384 [11:57:25<14:15:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 1: 46%|████▌ | 5637/12384 [11:57:33<14:15:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 46%|████▌ | 5638/12384 [11:57:33<14:16:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 46%|████▌ | 5638/12384 [11:57:41<14:16:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 1: 46%|████▌ | 5639/12384 [11:57:41<14:15:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 1: 46%|████▌ | 5639/12384 [11:57:48<14:15:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 1: 46%|████▌ | 5640/12384 [11:57:48<14:15:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 1: 46%|████▌ | 5640/12384 [11:57:56<14:15:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 46%|████▌ | 5641/12384 [11:57:56<14:16:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 46%|████▌ | 5641/12384 [11:58:04<14:16:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 46%|████▌ | 5642/12384 [11:58:04<14:15:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 46%|████▌ | 5642/12384 [11:58:11<14:15:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 46%|████▌ | 5643/12384 [11:58:11<14:15:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 46%|████▌ | 5643/12384 [11:58:19<14:15:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 46%|████▌ | 5644/12384 [11:58:19<14:25:00, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 46%|████▌ | 5644/12384 [11:58:27<14:25:00, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 46%|████▌ | 5645/12384 [11:58:27<14:21:38, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 46%|████▌ | 5645/12384 [11:58:34<14:21:38, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 46%|████▌ | 5646/12384 [11:58:34<14:19:40, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 46%|████▌ | 5646/12384 [11:58:42<14:19:40, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 46%|████▌ | 5647/12384 [11:58:42<14:18:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 46%|████▌ | 5647/12384 [11:58:50<14:18:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 46%|████▌ | 5648/12384 [11:58:50<14:17:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 46%|████▌ | 5648/12384 [11:58:57<14:17:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 46%|████▌ | 5649/12384 [11:58:57<14:15:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 46%|████▌ | 5649/12384 [11:59:05<14:15:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 46%|████▌ | 5650/12384 [11:59:05<14:14:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 46%|████▌ | 5650/12384 [11:59:12<14:14:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 46%|████▌ | 5651/12384 [11:59:12<14:14:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 46%|████▌ | 5651/12384 [11:59:20<14:14:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 46%|████▌ | 5652/12384 [11:59:20<14:14:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 46%|████▌ | 5652/12384 [11:59:28<14:14:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 46%|████▌ | 5653/12384 [11:59:28<14:14:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 46%|████▌ | 5653/12384 [11:59:35<14:14:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 46%|████▌ | 5654/12384 [11:59:35<14:14:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 46%|████▌ | 5654/12384 [11:59:43<14:14:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 46%|████▌ | 5655/12384 [11:59:43<14:15:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 46%|████▌ | 5655/12384 [11:59:50<14:15:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 46%|████▌ | 5656/12384 [11:59:50<14:14:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 46%|████▌ | 5656/12384 [11:59:58<14:14:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 1: 46%|████▌ | 5657/12384 [11:59:58<14:25:17, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 1: 46%|████▌ | 5657/12384 [12:00:06<14:25:17, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.86s]
Epoch 1: 46%|████▌ | 5658/12384 [12:00:06<14:21:30, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.86s]
Epoch 1: 46%|████▌ | 5658/12384 [12:00:14<14:21:30, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 1: 46%|████▌ | 5659/12384 [12:00:14<14:19:11, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 1: 46%|████▌ | 5659/12384 [12:00:21<14:19:11, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 46%|████▌ | 5660/12384 [12:00:21<14:17:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 46%|████▌ | 5660/12384 [12:00:29<14:17:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 1: 46%|████▌ | 5661/12384 [12:00:29<14:15:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 1: 46%|████▌ | 5661/12384 [12:00:36<14:15:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.34s]
Epoch 1: 46%|████▌ | 5662/12384 [12:00:36<14:15:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.34s]
Epoch 1: 46%|████▌ | 5662/12384 [12:00:44<14:15:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.01s]
Epoch 1: 46%|████▌ | 5663/12384 [12:00:44<14:14:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.01s]
Epoch 1: 46%|████▌ | 5663/12384 [12:00:52<14:14:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.48s]
Epoch 1: 46%|████▌ | 5664/12384 [12:00:52<14:12:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.48s]
Epoch 1: 46%|████▌ | 5664/12384 [12:00:59<14:12:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 46%|████▌ | 5665/12384 [12:00:59<14:11:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 46%|████▌ | 5665/12384 [12:01:07<14:11:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 46%|████▌ | 5666/12384 [12:01:07<14:11:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 46%|████▌ | 5666/12384 [12:01:14<14:11:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 46%|████▌ | 5667/12384 [12:01:14<14:11:02, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 46%|████▌ | 5667/12384 [12:01:22<14:11:02, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 46%|████▌ | 5668/12384 [12:01:22<14:13:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 46%|████▌ | 5668/12384 [12:01:30<14:13:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 46%|████▌ | 5669/12384 [12:01:30<14:12:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 46%|████▌ | 5669/12384 [12:01:37<14:12:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.44s]
Epoch 1: 46%|████▌ | 5670/12384 [12:01:37<14:12:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.44s]
Epoch 1: 46%|████▌ | 5670/12384 [12:01:45<14:12:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.08s]
Epoch 1: 46%|████▌ | 5671/12384 [12:01:45<14:11:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.08s]
Epoch 1: 46%|████▌ | 5671/12384 [12:01:53<14:11:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 46%|████▌ | 5672/12384 [12:01:53<14:11:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 46%|████▌ | 5672/12384 [12:02:00<14:11:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 1: 46%|████▌ | 5673/12384 [12:02:00<14:12:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 1: 46%|████▌ | 5673/12384 [12:02:08<14:12:02, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 46%|████▌ | 5674/12384 [12:02:08<14:11:30, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 46%|████▌ | 5674/12384 [12:02:15<14:11:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 46%|████▌ | 5675/12384 [12:02:15<14:12:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 46%|████▌ | 5675/12384 [12:02:23<14:12:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 1: 46%|████▌ | 5676/12384 [12:02:23<14:12:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 1: 46%|████▌ | 5676/12384 [12:02:31<14:12:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 46%|████▌ | 5677/12384 [12:02:31<14:10:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 46%|████▌ | 5677/12384 [12:02:38<14:10:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 46%|████▌ | 5678/12384 [12:02:38<14:11:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 46%|████▌ | 5678/12384 [12:02:46<14:11:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 1: 46%|████▌ | 5679/12384 [12:02:46<14:11:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 1: 46%|████▌ | 5679/12384 [12:02:53<14:11:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 1: 46%|████▌ | 5680/12384 [12:02:53<14:11:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 1: 46%|████▌ | 5680/12384 [12:03:01<14:11:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 46%|████▌ | 5681/12384 [12:03:01<14:11:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 46%|████▌ | 5681/12384 [12:03:09<14:11:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 46%|████▌ | 5682/12384 [12:03:09<14:10:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 46%|████▌ | 5682/12384 [12:03:17<14:10:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 1: 46%|████▌ | 5683/12384 [12:03:17<14:21:49, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 1: 46%|████▌ | 5683/12384 [12:03:24<14:21:49, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 1: 46%|████▌ | 5684/12384 [12:03:24<14:18:36, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 1: 46%|████▌ | 5684/12384 [12:03:32<14:18:36, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 46%|████▌ | 5685/12384 [12:03:32<14:16:11, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 46%|████▌ | 5685/12384 [12:03:40<14:16:11, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 46%|████▌ | 5686/12384 [12:03:40<14:13:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 46%|████▌ | 5686/12384 [12:03:47<14:13:36, 7.65s/it, loss=0.0007, acc=0.9948, iter_time=6.47s]
Epoch 1: 46%|████▌ | 5687/12384 [12:03:47<14:11:44, 7.63s/it, loss=0.0007, acc=0.9948, iter_time=6.47s]
Epoch 1: 46%|████▌ | 5687/12384 [12:03:55<14:11:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 1: 46%|████▌ | 5688/12384 [12:03:55<14:11:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 1: 46%|████▌ | 5688/12384 [12:04:02<14:11:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 46%|████▌ | 5689/12384 [12:04:02<14:10:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 46%|████▌ | 5689/12384 [12:04:10<14:10:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 46%|████▌ | 5690/12384 [12:04:10<14:10:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 46%|████▌ | 5690/12384 [12:04:18<14:10:46, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 46%|████▌ | 5691/12384 [12:04:18<14:11:56, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 46%|████▌ | 5691/12384 [12:04:25<14:11:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.43s]
Epoch 1: 46%|████▌ | 5692/12384 [12:04:25<14:12:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.43s]
Epoch 1: 46%|████▌ | 5692/12384 [12:04:33<14:12:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 46%|████▌ | 5693/12384 [12:04:33<14:11:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 46%|████▌ | 5693/12384 [12:04:41<14:11:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 46%|████▌ | 5694/12384 [12:04:41<14:11:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 46%|████▌ | 5694/12384 [12:04:48<14:11:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.76s]
Epoch 1: 46%|████▌ | 5695/12384 [12:04:48<14:14:18, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.76s]
Epoch 1: 46%|████▌ | 5695/12384 [12:04:56<14:14:18, 7.66s/it, loss=0.0002, acc=0.9998, iter_time=8.39s]
Epoch 1: 46%|████▌ | 5696/12384 [12:04:56<14:25:46, 7.77s/it, loss=0.0002, acc=0.9998, iter_time=8.39s]
Epoch 1: 46%|████▌ | 5696/12384 [12:05:04<14:25:46, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 46%|████▌ | 5697/12384 [12:05:04<14:20:38, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 46%|████▌ | 5697/12384 [12:05:12<14:20:38, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 46%|████▌ | 5698/12384 [12:05:12<14:16:40, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 46%|████▌ | 5698/12384 [12:05:19<14:16:40, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 46%|████▌ | 5699/12384 [12:05:19<14:13:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 46%|████▌ | 5699/12384 [12:05:27<14:13:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 46%|████▌ | 5700/12384 [12:05:27<14:11:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 46%|████▌ | 5700/12384 [12:05:34<14:11:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 46%|████▌ | 5701/12384 [12:05:34<14:09:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 46%|████▌ | 5701/12384 [12:05:42<14:09:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 46%|████▌ | 5702/12384 [12:05:42<14:09:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 46%|████▌ | 5702/12384 [12:05:50<14:09:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 1: 46%|████▌ | 5703/12384 [12:05:50<14:08:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 1: 46%|████▌ | 5703/12384 [12:05:57<14:08:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.04s]
Epoch 1: 46%|████▌ | 5704/12384 [12:05:57<14:07:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.04s]
Epoch 1: 46%|████▌ | 5704/12384 [12:06:05<14:07:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 46%|████▌ | 5705/12384 [12:06:05<14:06:27, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 46%|████▌ | 5705/12384 [12:06:12<14:06:27, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 1: 46%|████▌ | 5706/12384 [12:06:12<14:06:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 1: 46%|████▌ | 5706/12384 [12:06:20<14:06:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 46%|████▌ | 5707/12384 [12:06:20<14:06:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 46%|████▌ | 5707/12384 [12:06:28<14:06:32, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=4.83s]
Epoch 1: 46%|████▌ | 5708/12384 [12:06:28<14:05:42, 7.60s/it, loss=0.0002, acc=1.0000, iter_time=4.83s]
Epoch 1: 46%|████▌ | 5708/12384 [12:06:35<14:05:42, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.28s]
Epoch 1: 46%|████▌ | 5709/12384 [12:06:35<14:17:29, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.28s]
Epoch 1: 46%|████▌ | 5709/12384 [12:06:43<14:17:29, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 1: 46%|████▌ | 5710/12384 [12:06:43<14:14:38, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 1: 46%|████▌ | 5710/12384 [12:06:51<14:14:38, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 46%|████▌ | 5711/12384 [12:06:51<14:12:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 46%|████▌ | 5711/12384 [12:06:58<14:12:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 46%|████▌ | 5712/12384 [12:06:58<14:10:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 46%|████▌ | 5712/12384 [12:07:06<14:10:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 46%|████▌ | 5713/12384 [12:07:06<14:08:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 46%|████▌ | 5713/12384 [12:07:14<14:08:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.98s]
Epoch 1: 46%|████▌ | 5714/12384 [12:07:14<14:07:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.98s]
Epoch 1: 46%|████▌ | 5714/12384 [12:07:21<14:07:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.98s]
Epoch 1: 46%|████▌ | 5715/12384 [12:07:21<14:06:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.98s]
Epoch 1: 46%|████▌ | 5715/12384 [12:07:29<14:06:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 46%|████▌ | 5716/12384 [12:07:29<14:06:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 46%|████▌ | 5716/12384 [12:07:36<14:06:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 46%|████▌ | 5717/12384 [12:07:36<14:06:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 46%|████▌ | 5717/12384 [12:07:44<14:06:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 1: 46%|████▌ | 5718/12384 [12:07:44<14:06:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 1: 46%|████▌ | 5718/12384 [12:07:52<14:06:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 1: 46%|████▌ | 5719/12384 [12:07:52<14:05:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 1: 46%|████▌ | 5719/12384 [12:07:59<14:05:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 46%|████▌ | 5720/12384 [12:07:59<14:05:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 46%|████▌ | 5720/12384 [12:08:07<14:05:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 46%|████▌ | 5721/12384 [12:08:07<14:14:14, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 46%|████▌ | 5721/12384 [12:08:15<14:14:14, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 46%|████▌ | 5722/12384 [12:08:15<14:10:47, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 46%|████▌ | 5722/12384 [12:08:22<14:10:47, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 46%|████▌ | 5723/12384 [12:08:22<14:08:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 46%|████▌ | 5723/12384 [12:08:30<14:08:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 46%|████▌ | 5724/12384 [12:08:30<14:08:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 46%|████▌ | 5724/12384 [12:08:38<14:08:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 1: 46%|████▌ | 5725/12384 [12:08:38<14:08:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 1: 46%|████▌ | 5725/12384 [12:08:45<14:08:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 1: 46%|████▌ | 5726/12384 [12:08:45<14:06:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 1: 46%|████▌ | 5726/12384 [12:08:53<14:06:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 46%|████▌ | 5727/12384 [12:08:53<14:05:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 46%|████▌ | 5727/12384 [12:09:00<14:05:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 46%|████▋ | 5728/12384 [12:09:00<14:04:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 46%|████▋ | 5728/12384 [12:09:08<14:04:31, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.38s]
Epoch 1: 46%|████▋ | 5729/12384 [12:09:08<14:03:43, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.38s]
Epoch 1: 46%|████▋ | 5729/12384 [12:09:16<14:03:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 1: 46%|████▋ | 5730/12384 [12:09:16<14:02:53, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 1: 46%|████▋ | 5730/12384 [12:09:23<14:02:53, 7.60s/it, loss=0.0002, acc=0.9988, iter_time=7.84s]
Epoch 1: 46%|████▋ | 5731/12384 [12:09:23<14:02:23, 7.60s/it, loss=0.0002, acc=0.9988, iter_time=7.84s]
Epoch 1: 46%|████▋ | 5731/12384 [12:09:31<14:02:23, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 1: 46%|████▋ | 5732/12384 [12:09:31<14:01:55, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 1: 46%|████▋ | 5732/12384 [12:09:38<14:01:55, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 1: 46%|████▋ | 5733/12384 [12:09:38<14:03:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 1: 46%|████▋ | 5733/12384 [12:09:46<14:03:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 1: 46%|████▋ | 5734/12384 [12:09:46<14:02:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 1: 46%|████▋ | 5734/12384 [12:09:54<14:02:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 1: 46%|████▋ | 5735/12384 [12:09:54<14:02:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 1: 46%|████▋ | 5735/12384 [12:10:01<14:02:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.88s]
Epoch 1: 46%|████▋ | 5736/12384 [12:10:01<14:13:29, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.88s]
Epoch 1: 46%|████▋ | 5736/12384 [12:10:09<14:13:29, 7.70s/it, loss=0.0014, acc=0.9976, iter_time=5.67s]
Epoch 1: 46%|████▋ | 5737/12384 [12:10:09<14:10:12, 7.67s/it, loss=0.0014, acc=0.9976, iter_time=5.67s]
Epoch 1: 46%|████▋ | 5737/12384 [12:10:17<14:10:12, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 1: 46%|████▋ | 5738/12384 [12:10:17<14:08:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 1: 46%|████▋ | 5738/12384 [12:10:24<14:08:21, 7.66s/it, loss=0.0003, acc=0.9980, iter_time=6.78s]
Epoch 1: 46%|████▋ | 5739/12384 [12:10:24<14:07:07, 7.65s/it, loss=0.0003, acc=0.9980, iter_time=6.78s]
Epoch 1: 46%|████▋ | 5739/12384 [12:10:32<14:07:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=3.79s]
Epoch 1: 46%|████▋ | 5740/12384 [12:10:32<14:04:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.79s]
Epoch 1: 46%|████▋ | 5740/12384 [12:10:40<14:04:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=12.27s]
Epoch 1: 46%|████▋ | 5741/12384 [12:10:40<14:03:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=12.27s]
Epoch 1: 46%|████▋ | 5741/12384 [12:10:47<14:03:48, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=6.11s]
Epoch 1: 46%|████▋ | 5742/12384 [12:10:47<14:03:28, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=6.11s]
Epoch 1: 46%|████▋ | 5742/12384 [12:10:55<14:03:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 1: 46%|████▋ | 5743/12384 [12:10:55<14:03:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 1: 46%|████▋ | 5743/12384 [12:11:02<14:03:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 46%|████▋ | 5744/12384 [12:11:02<14:02:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 46%|████▋ | 5744/12384 [12:11:10<14:02:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 46%|████▋ | 5745/12384 [12:11:10<14:03:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 46%|████▋ | 5745/12384 [12:11:18<14:03:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 46%|████▋ | 5746/12384 [12:11:18<14:13:51, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 46%|████▋ | 5746/12384 [12:11:26<14:13:51, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 1: 46%|████▋ | 5747/12384 [12:11:26<14:10:45, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 1: 46%|████▋ | 5747/12384 [12:11:33<14:10:45, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 1: 46%|████▋ | 5748/12384 [12:11:33<14:07:39, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 1: 46%|████▋ | 5748/12384 [12:11:41<14:07:39, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.27s]
Epoch 1: 46%|████▋ | 5749/12384 [12:11:41<14:05:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.27s]
Epoch 1: 46%|████▋ | 5749/12384 [12:11:48<14:05:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.95s]
Epoch 1: 46%|████▋ | 5750/12384 [12:11:48<14:04:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.95s]
Epoch 1: 46%|████▋ | 5750/12384 [12:11:56<14:04:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 1: 46%|████▋ | 5751/12384 [12:11:56<14:02:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 1: 46%|████▋ | 5751/12384 [12:12:04<14:02:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 1: 46%|████▋ | 5752/12384 [12:12:04<14:02:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 1: 46%|████▋ | 5752/12384 [12:12:11<14:02:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 46%|████▋ | 5753/12384 [12:12:11<14:01:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 46%|████▋ | 5753/12384 [12:12:19<14:01:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 46%|████▋ | 5754/12384 [12:12:19<14:01:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 46%|████▋ | 5754/12384 [12:12:26<14:01:31, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 1: 46%|████▋ | 5755/12384 [12:12:26<14:00:42, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 1: 46%|████▋ | 5755/12384 [12:12:34<14:00:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 46%|████▋ | 5756/12384 [12:12:34<14:00:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 46%|████▋ | 5756/12384 [12:12:42<14:00:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 46%|████▋ | 5757/12384 [12:12:42<13:59:54, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 46%|████▋ | 5757/12384 [12:12:49<13:59:54, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 46%|████▋ | 5758/12384 [12:12:49<14:00:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 46%|████▋ | 5758/12384 [12:12:57<14:00:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 47%|████▋ | 5759/12384 [12:12:57<13:59:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 47%|████▋ | 5759/12384 [12:13:04<13:59:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.04s]
Epoch 1: 47%|████▋ | 5760/12384 [12:13:04<14:00:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.04s]
Epoch 1: 47%|████▋ | 5760/12384 [12:13:12<14:00:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 47%|████▋ | 5761/12384 [12:13:12<13:59:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 47%|████▋ | 5761/12384 [12:13:20<13:59:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 47%|████▋ | 5762/12384 [12:13:20<14:11:17, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 47%|████▋ | 5762/12384 [12:13:28<14:11:17, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 47%|████▋ | 5763/12384 [12:13:28<14:07:29, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 47%|████▋ | 5763/12384 [12:13:35<14:07:29, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 1: 47%|████▋ | 5764/12384 [12:13:35<14:05:06, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 1: 47%|████▋ | 5764/12384 [12:13:43<14:05:06, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.86s]
Epoch 1: 47%|████▋ | 5765/12384 [12:13:43<14:03:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.86s]
Epoch 1: 47%|████▋ | 5765/12384 [12:13:50<14:03:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 47%|████▋ | 5766/12384 [12:13:50<14:00:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 47%|████▋ | 5766/12384 [12:13:58<14:00:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.58s]
Epoch 1: 47%|████▋ | 5767/12384 [12:13:58<14:00:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.58s]
Epoch 1: 47%|████▋ | 5767/12384 [12:14:06<14:00:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.65s]
Epoch 1: 47%|████▋ | 5768/12384 [12:14:06<14:00:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.65s]
Epoch 1: 47%|████▋ | 5768/12384 [12:14:13<14:00:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.03s]
Epoch 1: 47%|████▋ | 5769/12384 [12:14:13<13:59:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.03s]
Epoch 1: 47%|████▋ | 5769/12384 [12:14:21<13:59:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 47%|████▋ | 5770/12384 [12:14:21<13:59:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 47%|████▋ | 5770/12384 [12:14:29<13:59:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.85s]
Epoch 1: 47%|████▋ | 5771/12384 [12:14:29<13:59:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.85s]
Epoch 1: 47%|████▋ | 5771/12384 [12:14:36<13:59:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.37s]
Epoch 1: 47%|████▋ | 5772/12384 [12:14:36<13:59:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.37s]
Epoch 1: 47%|████▋ | 5772/12384 [12:14:44<13:59:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 47%|████▋ | 5773/12384 [12:14:44<13:59:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 47%|████▋ | 5773/12384 [12:14:51<13:59:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 47%|████▋ | 5774/12384 [12:14:51<13:58:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 47%|████▋ | 5774/12384 [12:14:59<13:58:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 47%|████▋ | 5775/12384 [12:14:59<13:58:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 47%|████▋ | 5775/12384 [12:15:07<13:58:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 1: 47%|████▋ | 5776/12384 [12:15:07<13:58:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 1: 47%|████▋ | 5776/12384 [12:15:14<13:58:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.52s]
Epoch 1: 47%|████▋ | 5777/12384 [12:15:14<13:58:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.52s]
Epoch 1: 47%|████▋ | 5777/12384 [12:15:22<13:58:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 1: 47%|████▋ | 5778/12384 [12:15:22<13:59:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 1: 47%|████▋ | 5778/12384 [12:15:29<13:59:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 1: 47%|████▋ | 5779/12384 [12:15:29<13:59:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 1: 47%|████▋ | 5779/12384 [12:15:37<13:59:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 47%|████▋ | 5780/12384 [12:15:37<13:59:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 47%|████▋ | 5780/12384 [12:15:45<13:59:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 47%|████▋ | 5781/12384 [12:15:45<14:01:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 47%|████▋ | 5781/12384 [12:15:52<14:01:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 47%|████▋ | 5782/12384 [12:15:52<14:01:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 47%|████▋ | 5782/12384 [12:16:00<14:01:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 47%|████▋ | 5783/12384 [12:16:00<14:00:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 47%|████▋ | 5783/12384 [12:16:08<14:00:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 47%|████▋ | 5784/12384 [12:16:08<13:59:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 47%|████▋ | 5784/12384 [12:16:15<13:59:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 47%|████▋ | 5785/12384 [12:16:15<13:58:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 47%|████▋ | 5785/12384 [12:16:23<13:58:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 47%|████▋ | 5786/12384 [12:16:23<13:57:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 47%|████▋ | 5786/12384 [12:16:30<13:57:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 47%|████▋ | 5787/12384 [12:16:30<13:57:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 47%|████▋ | 5787/12384 [12:16:38<13:57:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 47%|████▋ | 5788/12384 [12:16:38<13:57:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 47%|████▋ | 5788/12384 [12:16:46<13:57:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 47%|████▋ | 5789/12384 [12:16:46<14:06:12, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 47%|████▋ | 5789/12384 [12:16:54<14:06:12, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 47%|████▋ | 5790/12384 [12:16:54<14:03:24, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 47%|████▋ | 5790/12384 [12:17:01<14:03:24, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 47%|████▋ | 5791/12384 [12:17:01<14:01:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 47%|████▋ | 5791/12384 [12:17:09<14:01:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 47%|████▋ | 5792/12384 [12:17:09<13:58:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 47%|████▋ | 5792/12384 [12:17:16<13:58:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.89s]
Epoch 1: 47%|████▋ | 5793/12384 [12:17:16<13:58:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.89s]
Epoch 1: 47%|████▋ | 5793/12384 [12:17:24<13:58:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 47%|████▋ | 5794/12384 [12:17:24<13:57:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 47%|████▋ | 5794/12384 [12:17:32<13:57:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 47%|████▋ | 5795/12384 [12:17:32<13:56:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 47%|████▋ | 5795/12384 [12:17:39<13:56:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 47%|████▋ | 5796/12384 [12:17:39<13:56:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 47%|████▋ | 5796/12384 [12:17:47<13:56:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.22s]
Epoch 1: 47%|████▋ | 5797/12384 [12:17:47<13:55:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.22s]
Epoch 1: 47%|████▋ | 5797/12384 [12:17:55<13:55:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.26s]
Epoch 1: 47%|████▋ | 5798/12384 [12:17:55<14:04:15, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=11.26s]
Epoch 1: 47%|████▋ | 5798/12384 [12:18:02<14:04:15, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 47%|████▋ | 5799/12384 [12:18:02<14:01:28, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 47%|████▋ | 5799/12384 [12:18:10<14:01:28, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 47%|████▋ | 5800/12384 [12:18:10<13:59:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 47%|████▋ | 5800/12384 [12:18:18<13:59:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 47%|████▋ | 5801/12384 [12:18:18<13:56:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 47%|████▋ | 5801/12384 [12:18:25<13:56:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 1: 47%|████▋ | 5802/12384 [12:18:25<13:55:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 1: 47%|████▋ | 5802/12384 [12:18:33<13:55:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 1: 47%|████▋ | 5803/12384 [12:18:33<13:54:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 1: 47%|████▋ | 5803/12384 [12:18:40<13:54:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 47%|████▋ | 5804/12384 [12:18:40<13:53:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 47%|████▋ | 5804/12384 [12:18:48<13:53:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 1: 47%|████▋ | 5805/12384 [12:18:48<13:53:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 1: 47%|████▋ | 5805/12384 [12:18:55<13:53:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 47%|████▋ | 5806/12384 [12:18:55<13:53:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 47%|████▋ | 5806/12384 [12:19:03<13:53:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 1: 47%|████▋ | 5807/12384 [12:19:03<13:53:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 1: 47%|████▋ | 5807/12384 [12:19:11<13:53:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 47%|████▋ | 5808/12384 [12:19:11<13:54:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 47%|████▋ | 5808/12384 [12:19:18<13:54:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 47%|████▋ | 5809/12384 [12:19:18<13:53:10, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 47%|████▋ | 5809/12384 [12:19:26<13:53:10, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=4.80s]
Epoch 1: 47%|████▋ | 5810/12384 [12:19:26<13:54:11, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.80s]
Epoch 1: 47%|████▋ | 5810/12384 [12:19:34<13:54:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.43s]
Epoch 1: 47%|████▋ | 5811/12384 [12:19:34<13:54:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.43s]
Epoch 1: 47%|████▋ | 5811/12384 [12:19:41<13:54:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 47%|████▋ | 5812/12384 [12:19:41<13:53:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 47%|████▋ | 5812/12384 [12:19:49<13:53:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 1: 47%|████▋ | 5813/12384 [12:19:49<13:53:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 1: 47%|████▋ | 5813/12384 [12:19:56<13:53:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 1: 47%|████▋ | 5814/12384 [12:19:56<13:52:14, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 1: 47%|████▋ | 5814/12384 [12:20:04<13:52:14, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 47%|████▋ | 5815/12384 [12:20:04<14:03:51, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 47%|████▋ | 5815/12384 [12:20:12<14:03:51, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.33s]
Epoch 1: 47%|████▋ | 5816/12384 [12:20:12<14:01:11, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.33s]
Epoch 1: 47%|████▋ | 5816/12384 [12:20:20<14:01:11, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 47%|████▋ | 5817/12384 [12:20:20<13:59:21, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 47%|████▋ | 5817/12384 [12:20:27<13:59:21, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 1: 47%|████▋ | 5818/12384 [12:20:27<14:00:05, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 1: 47%|████▋ | 5818/12384 [12:20:35<14:00:05, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 47%|████▋ | 5819/12384 [12:20:35<13:57:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 47%|████▋ | 5819/12384 [12:20:42<13:57:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 47%|████▋ | 5820/12384 [12:20:42<13:55:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 47%|████▋ | 5820/12384 [12:20:50<13:55:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 47%|████▋ | 5821/12384 [12:20:50<13:54:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 47%|████▋ | 5821/12384 [12:20:58<13:54:04, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 1: 47%|████▋ | 5822/12384 [12:20:58<13:56:33, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 1: 47%|████▋ | 5822/12384 [12:21:05<13:56:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 47%|████▋ | 5823/12384 [12:21:05<13:55:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 47%|████▋ | 5823/12384 [12:21:13<13:55:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 47%|████▋ | 5824/12384 [12:21:13<13:53:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 47%|████▋ | 5824/12384 [12:21:21<13:53:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 1: 47%|████▋ | 5825/12384 [12:21:21<13:53:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 1: 47%|████▋ | 5825/12384 [12:21:28<13:53:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 47%|████▋ | 5826/12384 [12:21:28<13:55:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 47%|████▋ | 5826/12384 [12:21:36<13:55:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 47%|████▋ | 5827/12384 [12:21:36<13:55:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 47%|████▋ | 5827/12384 [12:21:44<13:55:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 47%|████▋ | 5828/12384 [12:21:44<13:55:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 47%|████▋ | 5828/12384 [12:21:51<13:55:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 47%|████▋ | 5829/12384 [12:21:51<13:54:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 47%|████▋ | 5829/12384 [12:21:59<13:54:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 47%|████▋ | 5830/12384 [12:21:59<13:53:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 47%|████▋ | 5830/12384 [12:22:06<13:53:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 47%|████▋ | 5831/12384 [12:22:06<13:53:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 47%|████▋ | 5831/12384 [12:22:14<13:53:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 47%|████▋ | 5832/12384 [12:22:14<13:52:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 47%|████▋ | 5832/12384 [12:22:22<13:52:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 1: 47%|████▋ | 5833/12384 [12:22:22<13:52:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 1: 47%|████▋ | 5833/12384 [12:22:29<13:52:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 47%|████▋ | 5834/12384 [12:22:29<13:52:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 47%|████▋ | 5834/12384 [12:22:37<13:52:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 1: 47%|████▋ | 5835/12384 [12:22:37<13:51:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 1: 47%|████▋ | 5835/12384 [12:22:45<13:51:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.82s]
Epoch 1: 47%|████▋ | 5836/12384 [12:22:45<13:50:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.82s]
Epoch 1: 47%|████▋ | 5836/12384 [12:22:52<13:50:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 47%|████▋ | 5837/12384 [12:22:52<13:50:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 47%|████▋ | 5837/12384 [12:23:00<13:50:02, 7.61s/it, loss=0.0015, acc=0.9972, iter_time=5.56s]
Epoch 1: 47%|████▋ | 5838/12384 [12:23:00<13:50:06, 7.61s/it, loss=0.0015, acc=0.9972, iter_time=5.56s]
Epoch 1: 47%|████▋ | 5838/12384 [12:23:07<13:50:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 1: 47%|████▋ | 5839/12384 [12:23:07<13:49:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 1: 47%|████▋ | 5839/12384 [12:23:15<13:49:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 47%|████▋ | 5840/12384 [12:23:15<13:51:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 47%|████▋ | 5840/12384 [12:23:23<13:51:14, 7.62s/it, loss=0.0005, acc=0.9984, iter_time=7.76s]
Epoch 1: 47%|████▋ | 5841/12384 [12:23:23<14:01:09, 7.71s/it, loss=0.0005, acc=0.9984, iter_time=7.76s]
Epoch 1: 47%|████▋ | 5841/12384 [12:23:31<14:01:09, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 1: 47%|████▋ | 5842/12384 [12:23:31<13:58:05, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 1: 47%|████▋ | 5842/12384 [12:23:38<13:58:05, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 47%|████▋ | 5843/12384 [12:23:38<13:55:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 47%|████▋ | 5843/12384 [12:23:46<13:55:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 47%|████▋ | 5844/12384 [12:23:46<13:52:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 47%|████▋ | 5844/12384 [12:23:53<13:52:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 1: 47%|████▋ | 5845/12384 [12:23:53<13:50:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 1: 47%|████▋ | 5845/12384 [12:24:01<13:50:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.33s]
Epoch 1: 47%|████▋ | 5846/12384 [12:24:01<13:49:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.33s]
Epoch 1: 47%|████▋ | 5846/12384 [12:24:08<13:49:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 47%|████▋ | 5847/12384 [12:24:08<13:49:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 47%|████▋ | 5847/12384 [12:24:16<13:49:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 47%|████▋ | 5848/12384 [12:24:16<13:49:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 47%|████▋ | 5848/12384 [12:24:24<13:49:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.89s]
Epoch 1: 47%|████▋ | 5849/12384 [12:24:24<13:49:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.89s]
Epoch 1: 47%|████▋ | 5849/12384 [12:24:31<13:49:14, 7.61s/it, loss=0.0008, acc=0.9981, iter_time=9.95s]
Epoch 1: 47%|████▋ | 5850/12384 [12:24:31<13:49:55, 7.62s/it, loss=0.0008, acc=0.9981, iter_time=9.95s]
Epoch 1: 47%|████▋ | 5850/12384 [12:24:39<13:49:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 47%|████▋ | 5851/12384 [12:24:39<13:59:11, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 47%|████▋ | 5851/12384 [12:24:47<13:59:11, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 1: 47%|████▋ | 5852/12384 [12:24:47<13:58:11, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 1: 47%|████▋ | 5852/12384 [12:24:55<13:58:11, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 47%|████▋ | 5853/12384 [12:24:55<13:55:10, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 47%|████▋ | 5853/12384 [12:25:02<13:55:10, 7.67s/it, loss=0.0004, acc=0.9994, iter_time=5.80s]
Epoch 1: 47%|████▋ | 5854/12384 [12:25:02<13:52:18, 7.65s/it, loss=0.0004, acc=0.9994, iter_time=5.80s]
Epoch 1: 47%|████▋ | 5854/12384 [12:25:10<13:52:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 1: 47%|████▋ | 5855/12384 [12:25:10<13:51:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 1: 47%|████▋ | 5855/12384 [12:25:17<13:51:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 47%|████▋ | 5856/12384 [12:25:17<13:50:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 47%|████▋ | 5856/12384 [12:25:25<13:50:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 47%|████▋ | 5857/12384 [12:25:25<13:49:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 47%|████▋ | 5857/12384 [12:25:33<13:49:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 47%|████▋ | 5858/12384 [12:25:33<13:48:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 47%|████▋ | 5858/12384 [12:25:40<13:48:45, 7.62s/it, loss=0.0000, acc=0.9997, iter_time=7.60s]
Epoch 1: 47%|████▋ | 5859/12384 [12:25:40<13:48:26, 7.62s/it, loss=0.0000, acc=0.9997, iter_time=7.60s]
Epoch 1: 47%|████▋ | 5859/12384 [12:25:48<13:48:26, 7.62s/it, loss=0.0007, acc=0.9991, iter_time=7.67s]
Epoch 1: 47%|████▋ | 5860/12384 [12:25:48<13:49:51, 7.63s/it, loss=0.0007, acc=0.9991, iter_time=7.67s]
Epoch 1: 47%|████▋ | 5860/12384 [12:25:55<13:49:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 47%|████▋ | 5861/12384 [12:25:55<13:48:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 47%|████▋ | 5861/12384 [12:26:03<13:48:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.57s]
Epoch 1: 47%|████▋ | 5862/12384 [12:26:03<13:47:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.57s]
Epoch 1: 47%|████▋ | 5862/12384 [12:26:11<13:47:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 1: 47%|████▋ | 5863/12384 [12:26:11<13:48:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 1: 47%|████▋ | 5863/12384 [12:26:18<13:48:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 47%|████▋ | 5864/12384 [12:26:18<13:47:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 47%|████▋ | 5864/12384 [12:26:26<13:47:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 47%|████▋ | 5865/12384 [12:26:26<13:47:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 47%|████▋ | 5865/12384 [12:26:34<13:47:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 47%|████▋ | 5866/12384 [12:26:34<13:46:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 47%|████▋ | 5866/12384 [12:26:42<13:46:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 1: 47%|████▋ | 5867/12384 [12:26:42<13:59:38, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 1: 47%|████▋ | 5867/12384 [12:26:49<13:59:38, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 1: 47%|████▋ | 5868/12384 [12:26:49<13:55:46, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 1: 47%|████▋ | 5868/12384 [12:26:57<13:55:46, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 47%|████▋ | 5869/12384 [12:26:57<13:52:27, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 47%|████▋ | 5869/12384 [12:27:04<13:52:27, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.24s]
Epoch 1: 47%|████▋ | 5870/12384 [12:27:04<13:52:36, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.24s]
Epoch 1: 47%|████▋ | 5870/12384 [12:27:12<13:52:36, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=11.03s]
Epoch 1: 47%|████▋ | 5871/12384 [12:27:12<13:53:26, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=11.03s]
Epoch 1: 47%|████▋ | 5871/12384 [12:27:20<13:53:26, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 47%|████▋ | 5872/12384 [12:27:20<13:51:57, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 47%|████▋ | 5872/12384 [12:27:27<13:51:57, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 47%|████▋ | 5873/12384 [12:27:27<13:49:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 47%|████▋ | 5873/12384 [12:27:35<13:49:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 47%|████▋ | 5874/12384 [12:27:35<13:48:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 47%|████▋ | 5874/12384 [12:27:43<13:48:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 47%|████▋ | 5875/12384 [12:27:43<13:47:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 47%|████▋ | 5875/12384 [12:27:50<13:47:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 47%|████▋ | 5876/12384 [12:27:50<13:46:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 47%|████▋ | 5876/12384 [12:27:58<13:46:48, 7.62s/it, loss=0.0001, acc=0.9995, iter_time=7.89s]
Epoch 1: 47%|████▋ | 5877/12384 [12:27:58<13:55:20, 7.70s/it, loss=0.0001, acc=0.9995, iter_time=7.89s]
Epoch 1: 47%|████▋ | 5877/12384 [12:28:06<13:55:20, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 47%|████▋ | 5878/12384 [12:28:06<13:51:47, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 47%|████▋ | 5878/12384 [12:28:13<13:51:47, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 47%|████▋ | 5879/12384 [12:28:13<13:49:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 47%|████▋ | 5879/12384 [12:28:21<13:49:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 47%|████▋ | 5880/12384 [12:28:21<13:47:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 47%|████▋ | 5880/12384 [12:28:28<13:47:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.72s]
Epoch 1: 47%|████▋ | 5881/12384 [12:28:28<13:46:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.72s]
Epoch 1: 47%|████▋ | 5881/12384 [12:28:36<13:46:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 1: 47%|████▋ | 5882/12384 [12:28:36<13:46:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 1: 47%|████▋ | 5882/12384 [12:28:44<13:46:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 1: 48%|████▊ | 5883/12384 [12:28:44<13:45:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 1: 48%|████▊ | 5883/12384 [12:28:51<13:45:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 48%|████▊ | 5884/12384 [12:28:51<13:45:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 48%|████▊ | 5884/12384 [12:28:59<13:45:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 48%|████▊ | 5885/12384 [12:28:59<13:44:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 48%|████▊ | 5885/12384 [12:29:07<13:44:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 1: 48%|████▊ | 5886/12384 [12:29:07<13:42:58, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 1: 48%|████▊ | 5886/12384 [12:29:14<13:42:58, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.68s]
Epoch 1: 48%|████▊ | 5887/12384 [12:29:14<13:43:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.68s]
Epoch 1: 48%|████▊ | 5887/12384 [12:29:22<13:43:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.39s]
Epoch 1: 48%|████▊ | 5888/12384 [12:29:22<13:44:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.39s]
Epoch 1: 48%|████▊ | 5888/12384 [12:29:29<13:44:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 48%|████▊ | 5889/12384 [12:29:29<13:44:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 48%|████▊ | 5889/12384 [12:29:37<13:44:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 48%|████▊ | 5890/12384 [12:29:37<13:43:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 48%|████▊ | 5890/12384 [12:29:45<13:43:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 48%|████▊ | 5891/12384 [12:29:45<13:47:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 48%|████▊ | 5891/12384 [12:29:52<13:47:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 48%|████▊ | 5892/12384 [12:29:52<13:45:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 48%|████▊ | 5892/12384 [12:30:00<13:45:36, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.27s]
Epoch 1: 48%|████▊ | 5893/12384 [12:30:00<13:54:54, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=8.27s]
Epoch 1: 48%|████▊ | 5893/12384 [12:30:08<13:54:54, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 1: 48%|████▊ | 5894/12384 [12:30:08<13:51:30, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 1: 48%|████▊ | 5894/12384 [12:30:15<13:51:30, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=11.15s]
Epoch 1: 48%|████▊ | 5895/12384 [12:30:15<13:49:11, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=11.15s]
Epoch 1: 48%|████▊ | 5895/12384 [12:30:23<13:49:11, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 48%|████▊ | 5896/12384 [12:30:23<13:46:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 48%|████▊ | 5896/12384 [12:30:31<13:46:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.35s]
Epoch 1: 48%|████▊ | 5897/12384 [12:30:31<13:45:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.35s]
Epoch 1: 48%|████▊ | 5897/12384 [12:30:38<13:45:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.49s]
Epoch 1: 48%|████▊ | 5898/12384 [12:30:38<13:44:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.49s]
Epoch 1: 48%|████▊ | 5898/12384 [12:30:46<13:44:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 1: 48%|████▊ | 5899/12384 [12:30:46<13:44:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 1: 48%|████▊ | 5899/12384 [12:30:54<13:44:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 48%|████▊ | 5900/12384 [12:30:54<13:43:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 48%|████▊ | 5900/12384 [12:31:01<13:43:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 1: 48%|████▊ | 5901/12384 [12:31:01<13:43:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 1: 48%|████▊ | 5901/12384 [12:31:09<13:43:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 48%|████▊ | 5902/12384 [12:31:09<13:42:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 48%|████▊ | 5902/12384 [12:31:17<13:42:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 48%|████▊ | 5903/12384 [12:31:17<13:51:48, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 48%|████▊ | 5903/12384 [12:31:24<13:51:48, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 48%|████▊ | 5904/12384 [12:31:24<13:48:08, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 48%|████▊ | 5904/12384 [12:31:32<13:48:08, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 48%|████▊ | 5905/12384 [12:31:32<13:46:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 48%|████▊ | 5905/12384 [12:31:39<13:46:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 48%|████▊ | 5906/12384 [12:31:39<13:44:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 48%|████▊ | 5906/12384 [12:31:47<13:44:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 48%|████▊ | 5907/12384 [12:31:47<13:43:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 48%|████▊ | 5907/12384 [12:31:55<13:43:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 48%|████▊ | 5908/12384 [12:31:55<13:44:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 48%|████▊ | 5908/12384 [12:32:02<13:44:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 48%|████▊ | 5909/12384 [12:32:02<13:44:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 48%|████▊ | 5909/12384 [12:32:10<13:44:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 48%|████▊ | 5910/12384 [12:32:10<13:43:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 48%|████▊ | 5910/12384 [12:32:18<13:43:08, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.84s]
Epoch 1: 48%|████▊ | 5911/12384 [12:32:18<13:42:38, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.84s]
Epoch 1: 48%|████▊ | 5911/12384 [12:32:25<13:42:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.75s]
Epoch 1: 48%|████▊ | 5912/12384 [12:32:25<13:41:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.75s]
Epoch 1: 48%|████▊ | 5912/12384 [12:32:33<13:41:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.84s]
Epoch 1: 48%|████▊ | 5913/12384 [12:32:33<13:41:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.84s]
Epoch 1: 48%|████▊ | 5913/12384 [12:32:40<13:41:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.00s]
Epoch 1: 48%|████▊ | 5914/12384 [12:32:40<13:40:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.00s]
Epoch 1: 48%|████▊ | 5914/12384 [12:32:48<13:40:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 1: 48%|████▊ | 5915/12384 [12:32:48<13:39:39, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 1: 48%|████▊ | 5915/12384 [12:32:56<13:39:39, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.28s]
Epoch 1: 48%|████▊ | 5916/12384 [12:32:56<13:40:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.28s]
Epoch 1: 48%|████▊ | 5916/12384 [12:33:03<13:40:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 48%|████▊ | 5917/12384 [12:33:03<13:40:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 48%|████▊ | 5917/12384 [12:33:11<13:40:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 48%|████▊ | 5918/12384 [12:33:11<13:40:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 48%|████▊ | 5918/12384 [12:33:18<13:40:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 1: 48%|████▊ | 5919/12384 [12:33:18<13:38:52, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 1: 48%|████▊ | 5919/12384 [12:33:26<13:38:52, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 1: 48%|████▊ | 5920/12384 [12:33:26<13:49:29, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 1: 48%|████▊ | 5920/12384 [12:33:34<13:49:29, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 48%|████▊ | 5921/12384 [12:33:34<13:46:08, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 48%|████▊ | 5921/12384 [12:33:42<13:46:08, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 1: 48%|████▊ | 5922/12384 [12:33:42<13:43:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 1: 48%|████▊ | 5922/12384 [12:33:49<13:43:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 1: 48%|████▊ | 5923/12384 [12:33:49<13:41:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 1: 48%|████▊ | 5923/12384 [12:33:57<13:41:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 1: 48%|████▊ | 5924/12384 [12:33:57<13:41:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 1: 48%|████▊ | 5924/12384 [12:34:04<13:41:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.46s]
Epoch 1: 48%|████▊ | 5925/12384 [12:34:04<13:40:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.46s]
Epoch 1: 48%|████▊ | 5925/12384 [12:34:12<13:40:31, 7.62s/it, loss=0.0001, acc=0.9994, iter_time=6.09s]
Epoch 1: 48%|████▊ | 5926/12384 [12:34:12<13:40:19, 7.62s/it, loss=0.0001, acc=0.9994, iter_time=6.09s]
Epoch 1: 48%|████▊ | 5926/12384 [12:34:20<13:40:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 1: 48%|████▊ | 5927/12384 [12:34:20<13:39:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 1: 48%|████▊ | 5927/12384 [12:34:27<13:39:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 48%|████▊ | 5928/12384 [12:34:27<13:39:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 48%|████▊ | 5928/12384 [12:34:35<13:39:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 1: 48%|████▊ | 5929/12384 [12:34:35<13:48:00, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 1: 48%|████▊ | 5929/12384 [12:34:43<13:48:00, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 48%|████▊ | 5930/12384 [12:34:43<13:44:52, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 48%|████▊ | 5930/12384 [12:34:50<13:44:52, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 48%|████▊ | 5931/12384 [12:34:50<13:42:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 48%|████▊ | 5931/12384 [12:34:58<13:42:37, 7.65s/it, loss=0.0002, acc=0.9998, iter_time=7.59s]
Epoch 1: 48%|████▊ | 5932/12384 [12:34:58<13:41:31, 7.64s/it, loss=0.0002, acc=0.9998, iter_time=7.59s]
Epoch 1: 48%|████▊ | 5932/12384 [12:35:06<13:41:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 48%|████▊ | 5933/12384 [12:35:06<13:40:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 48%|████▊ | 5933/12384 [12:35:13<13:40:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 48%|████▊ | 5934/12384 [12:35:13<13:40:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 48%|████▊ | 5934/12384 [12:35:21<13:40:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 48%|████▊ | 5935/12384 [12:35:21<13:39:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 48%|████▊ | 5935/12384 [12:35:28<13:39:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 48%|████▊ | 5936/12384 [12:35:28<13:38:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 48%|████▊ | 5936/12384 [12:35:36<13:38:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 48%|████▊ | 5937/12384 [12:35:36<13:38:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 48%|████▊ | 5937/12384 [12:35:44<13:38:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 48%|████▊ | 5938/12384 [12:35:44<13:38:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 48%|████▊ | 5938/12384 [12:35:51<13:38:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 48%|████▊ | 5939/12384 [12:35:51<13:38:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 48%|████▊ | 5939/12384 [12:35:59<13:38:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 48%|████▊ | 5940/12384 [12:35:59<13:40:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 48%|████▊ | 5940/12384 [12:36:07<13:40:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 48%|████▊ | 5941/12384 [12:36:07<13:39:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 48%|████▊ | 5941/12384 [12:36:14<13:39:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 48%|████▊ | 5942/12384 [12:36:14<13:39:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 48%|████▊ | 5942/12384 [12:36:22<13:39:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 1: 48%|████▊ | 5943/12384 [12:36:22<13:38:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 1: 48%|████▊ | 5943/12384 [12:36:29<13:38:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.08s]
Epoch 1: 48%|████▊ | 5944/12384 [12:36:29<13:38:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.08s]
Epoch 1: 48%|████▊ | 5944/12384 [12:36:37<13:38:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 1: 48%|████▊ | 5945/12384 [12:36:37<13:37:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 1: 48%|████▊ | 5945/12384 [12:36:45<13:37:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.98s]
Epoch 1: 48%|████▊ | 5946/12384 [12:36:45<13:47:33, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.98s]
Epoch 1: 48%|████▊ | 5946/12384 [12:36:53<13:47:33, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.85s]
Epoch 1: 48%|████▊ | 5947/12384 [12:36:53<13:43:53, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.85s]
Epoch 1: 48%|████▊ | 5947/12384 [12:37:00<13:43:53, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 1: 48%|████▊ | 5948/12384 [12:37:00<13:41:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 1: 48%|████▊ | 5948/12384 [12:37:08<13:41:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 48%|████▊ | 5949/12384 [12:37:08<13:39:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 48%|████▊ | 5949/12384 [12:37:15<13:39:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 48%|████▊ | 5950/12384 [12:37:15<13:37:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 48%|████▊ | 5950/12384 [12:37:23<13:37:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 1: 48%|████▊ | 5951/12384 [12:37:23<13:37:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 1: 48%|████▊ | 5951/12384 [12:37:31<13:37:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.54s]
Epoch 1: 48%|████▊ | 5952/12384 [12:37:31<13:37:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.54s]
Epoch 1: 48%|████▊ | 5952/12384 [12:37:38<13:37:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 48%|████▊ | 5953/12384 [12:37:38<13:37:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 48%|████▊ | 5953/12384 [12:37:46<13:37:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 48%|████▊ | 5954/12384 [12:37:46<13:36:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 48%|████▊ | 5954/12384 [12:37:54<13:36:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 48%|████▊ | 5955/12384 [12:37:54<13:46:09, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 48%|████▊ | 5955/12384 [12:38:01<13:46:09, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 48%|████▊ | 5956/12384 [12:38:01<13:44:25, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 48%|████▊ | 5956/12384 [12:38:09<13:44:25, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 48%|████▊ | 5957/12384 [12:38:09<13:41:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 48%|████▊ | 5957/12384 [12:38:17<13:41:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 48%|████▊ | 5958/12384 [12:38:17<13:40:06, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 48%|████▊ | 5958/12384 [12:38:24<13:40:06, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 48%|████▊ | 5959/12384 [12:38:24<13:39:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 48%|████▊ | 5959/12384 [12:38:32<13:39:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 48%|████▊ | 5960/12384 [12:38:32<13:37:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 48%|████▊ | 5960/12384 [12:38:39<13:37:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 48%|████▊ | 5961/12384 [12:38:39<13:36:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 48%|████▊ | 5961/12384 [12:38:47<13:36:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 48%|████▊ | 5962/12384 [12:38:47<13:35:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 48%|████▊ | 5962/12384 [12:38:55<13:35:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 1: 48%|████▊ | 5963/12384 [12:38:55<13:35:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 1: 48%|████▊ | 5963/12384 [12:39:02<13:35:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.16s]
Epoch 1: 48%|████▊ | 5964/12384 [12:39:02<13:35:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.16s]
Epoch 1: 48%|████▊ | 5964/12384 [12:39:10<13:35:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 48%|████▊ | 5965/12384 [12:39:10<13:34:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 48%|████▊ | 5965/12384 [12:39:17<13:34:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 48%|████▊ | 5966/12384 [12:39:17<13:33:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 48%|████▊ | 5966/12384 [12:39:25<13:33:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 48%|████▊ | 5967/12384 [12:39:25<13:33:16, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 48%|████▊ | 5967/12384 [12:39:33<13:33:16, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 48%|████▊ | 5968/12384 [12:39:33<13:33:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 48%|████▊ | 5968/12384 [12:39:40<13:33:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 48%|████▊ | 5969/12384 [12:39:40<13:32:53, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 48%|████▊ | 5969/12384 [12:39:48<13:32:53, 7.60s/it, loss=0.0006, acc=0.9993, iter_time=7.61s]
Epoch 1: 48%|████▊ | 5970/12384 [12:39:48<13:33:05, 7.61s/it, loss=0.0006, acc=0.9993, iter_time=7.61s]
Epoch 1: 48%|████▊ | 5970/12384 [12:39:56<13:33:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 48%|████▊ | 5971/12384 [12:39:56<13:33:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 48%|████▊ | 5971/12384 [12:40:03<13:33:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 48%|████▊ | 5972/12384 [12:40:03<13:34:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 48%|████▊ | 5972/12384 [12:40:11<13:34:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 48%|████▊ | 5973/12384 [12:40:11<13:44:15, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 48%|████▊ | 5973/12384 [12:40:19<13:44:15, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 48%|████▊ | 5974/12384 [12:40:19<13:41:04, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 48%|████▊ | 5974/12384 [12:40:26<13:41:04, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 1: 48%|████▊ | 5975/12384 [12:40:26<13:37:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 1: 48%|████▊ | 5975/12384 [12:40:34<13:37:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 1: 48%|████▊ | 5976/12384 [12:40:34<13:35:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 1: 48%|████▊ | 5976/12384 [12:40:42<13:35:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 48%|████▊ | 5977/12384 [12:40:42<13:34:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 48%|████▊ | 5977/12384 [12:40:49<13:34:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 1: 48%|████▊ | 5978/12384 [12:40:49<13:34:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 1: 48%|████▊ | 5978/12384 [12:40:57<13:34:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 1: 48%|████▊ | 5979/12384 [12:40:57<13:34:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 1: 48%|████▊ | 5979/12384 [12:41:04<13:34:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 1: 48%|████▊ | 5980/12384 [12:41:04<13:34:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 1: 48%|████▊ | 5980/12384 [12:41:12<13:34:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 48%|████▊ | 5981/12384 [12:41:12<13:37:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 48%|████▊ | 5981/12384 [12:41:20<13:37:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 1: 48%|████▊ | 5982/12384 [12:41:20<13:35:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 1: 48%|████▊ | 5982/12384 [12:41:27<13:35:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 48%|████▊ | 5983/12384 [12:41:27<13:35:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 48%|████▊ | 5983/12384 [12:41:35<13:35:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 48%|████▊ | 5984/12384 [12:41:35<13:33:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 48%|████▊ | 5984/12384 [12:41:43<13:33:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.91s]
Epoch 1: 48%|████▊ | 5985/12384 [12:41:43<13:32:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.91s]
Epoch 1: 48%|████▊ | 5985/12384 [12:41:50<13:32:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 48%|████▊ | 5986/12384 [12:41:50<13:33:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 48%|████▊ | 5986/12384 [12:41:58<13:33:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 48%|████▊ | 5987/12384 [12:41:58<13:32:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 48%|████▊ | 5987/12384 [12:42:05<13:32:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 48%|████▊ | 5988/12384 [12:42:05<13:32:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 48%|████▊ | 5988/12384 [12:42:13<13:32:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 1: 48%|████▊ | 5989/12384 [12:42:13<13:31:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 1: 48%|████▊ | 5989/12384 [12:42:21<13:31:44, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=6.68s]
Epoch 1: 48%|████▊ | 5990/12384 [12:42:21<13:31:08, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=6.68s]
Epoch 1: 48%|████▊ | 5990/12384 [12:42:28<13:31:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 1: 48%|████▊ | 5991/12384 [12:42:28<13:30:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 1: 48%|████▊ | 5991/12384 [12:42:36<13:30:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 1: 48%|████▊ | 5992/12384 [12:42:36<13:31:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 1: 48%|████▊ | 5992/12384 [12:42:43<13:31:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 48%|████▊ | 5993/12384 [12:42:43<13:31:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 48%|████▊ | 5993/12384 [12:42:51<13:31:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.35s]
Epoch 1: 48%|████▊ | 5994/12384 [12:42:51<13:31:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.35s]
Epoch 1: 48%|████▊ | 5994/12384 [12:42:59<13:31:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 1: 48%|████▊ | 5995/12384 [12:42:59<13:30:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 1: 48%|████▊ | 5995/12384 [12:43:06<13:30:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 48%|████▊ | 5996/12384 [12:43:06<13:30:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 48%|████▊ | 5996/12384 [12:43:14<13:30:21, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 1: 48%|████▊ | 5997/12384 [12:43:14<13:29:41, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 1: 48%|████▊ | 5997/12384 [12:43:22<13:29:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 48%|████▊ | 5998/12384 [12:43:22<13:32:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 48%|████▊ | 5998/12384 [12:43:30<13:32:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.15s]
Epoch 1: 48%|████▊ | 5999/12384 [12:43:30<13:44:30, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=5.15s]
Epoch 1: 48%|████▊ | 5999/12384 [12:43:37<13:44:30, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=10.53s]
Epoch 1: 48%|████▊ | 6000/12384 [12:43:37<13:40:23, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.53s]
Epoch 1: 48%|████▊ | 6000/12384 [12:43:45<13:40:23, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 1: 48%|████▊ | 6001/12384 [12:43:45<13:36:56, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 1: 48%|████▊ | 6001/12384 [12:43:52<13:36:56, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 1: 48%|████▊ | 6002/12384 [12:43:52<13:34:23, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 1: 48%|████▊ | 6002/12384 [12:44:00<13:34:23, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 1: 48%|████▊ | 6003/12384 [12:44:00<13:32:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 1: 48%|████▊ | 6003/12384 [12:44:08<13:32:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 48%|████▊ | 6004/12384 [12:44:08<13:31:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 48%|████▊ | 6004/12384 [12:44:15<13:31:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.33s]
Epoch 1: 48%|████▊ | 6005/12384 [12:44:15<13:33:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.33s]
Epoch 1: 48%|████▊ | 6005/12384 [12:44:23<13:33:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.67s]
Epoch 1: 48%|████▊ | 6006/12384 [12:44:23<13:34:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.67s]
Epoch 1: 48%|████▊ | 6006/12384 [12:44:31<13:34:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.26s]
Epoch 1: 49%|████▊ | 6007/12384 [12:44:31<13:31:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.26s]
Epoch 1: 49%|████▊ | 6007/12384 [12:44:38<13:31:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.28s]
Epoch 1: 49%|████▊ | 6008/12384 [12:44:38<13:31:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.28s]
Epoch 1: 49%|████▊ | 6008/12384 [12:44:46<13:31:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 49%|████▊ | 6009/12384 [12:44:46<13:32:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 49%|████▊ | 6009/12384 [12:44:54<13:32:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.05s]
Epoch 1: 49%|████▊ | 6010/12384 [12:44:54<13:31:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.05s]
Epoch 1: 49%|████▊ | 6010/12384 [12:45:01<13:31:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 49%|████▊ | 6011/12384 [12:45:01<13:30:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 49%|████▊ | 6011/12384 [12:45:09<13:30:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 49%|████▊ | 6012/12384 [12:45:09<13:28:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 49%|████▊ | 6012/12384 [12:45:16<13:28:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 49%|████▊ | 6013/12384 [12:45:16<13:29:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 49%|████▊ | 6013/12384 [12:45:24<13:29:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 1: 49%|████▊ | 6014/12384 [12:45:24<13:28:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 1: 49%|████▊ | 6014/12384 [12:45:32<13:28:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 1: 49%|████▊ | 6015/12384 [12:45:32<13:29:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 1: 49%|████▊ | 6015/12384 [12:45:39<13:29:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.66s]
Epoch 1: 49%|████▊ | 6016/12384 [12:45:39<13:29:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.66s]
Epoch 1: 49%|████▊ | 6016/12384 [12:45:47<13:29:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.86s]
Epoch 1: 49%|████▊ | 6017/12384 [12:45:47<13:30:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.86s]
Epoch 1: 49%|████▊ | 6017/12384 [12:45:55<13:30:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 1: 49%|████▊ | 6018/12384 [12:45:55<13:29:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 1: 49%|████▊ | 6018/12384 [12:46:02<13:29:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 49%|████▊ | 6019/12384 [12:46:02<13:28:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 49%|████▊ | 6019/12384 [12:46:10<13:28:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 49%|████▊ | 6020/12384 [12:46:10<13:27:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 49%|████▊ | 6020/12384 [12:46:17<13:27:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 1: 49%|████▊ | 6021/12384 [12:46:17<13:27:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 1: 49%|████▊ | 6021/12384 [12:46:25<13:27:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 1: 49%|████▊ | 6022/12384 [12:46:25<13:27:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 1: 49%|████▊ | 6022/12384 [12:46:33<13:27:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 49%|████▊ | 6023/12384 [12:46:33<13:26:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 49%|████▊ | 6023/12384 [12:46:40<13:26:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 49%|████▊ | 6024/12384 [12:46:40<13:26:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 49%|████▊ | 6024/12384 [12:46:48<13:26:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 49%|████▊ | 6025/12384 [12:46:48<13:36:30, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 49%|████▊ | 6025/12384 [12:46:56<13:36:30, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 49%|████▊ | 6026/12384 [12:46:56<13:33:51, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 49%|████▊ | 6026/12384 [12:47:03<13:33:51, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 49%|████▊ | 6027/12384 [12:47:03<13:30:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 49%|████▊ | 6027/12384 [12:47:11<13:30:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 49%|████▊ | 6028/12384 [12:47:11<13:29:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 49%|████▊ | 6028/12384 [12:47:19<13:29:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 49%|████▊ | 6029/12384 [12:47:19<13:28:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 49%|████▊ | 6029/12384 [12:47:26<13:28:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 49%|████▊ | 6030/12384 [12:47:26<13:27:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 49%|████▊ | 6030/12384 [12:47:34<13:27:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 49%|████▊ | 6031/12384 [12:47:34<13:26:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 49%|████▊ | 6031/12384 [12:47:41<13:26:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 49%|████▊ | 6032/12384 [12:47:41<13:27:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 49%|████▊ | 6032/12384 [12:47:49<13:27:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 49%|████▊ | 6033/12384 [12:47:49<13:27:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 49%|████▊ | 6033/12384 [12:47:57<13:27:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 1: 49%|████▊ | 6034/12384 [12:47:57<13:29:58, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 1: 49%|████▊ | 6034/12384 [12:48:05<13:29:58, 7.65s/it, loss=0.0006, acc=0.9977, iter_time=8.97s]
Epoch 1: 49%|████▊ | 6035/12384 [12:48:05<13:40:42, 7.76s/it, loss=0.0006, acc=0.9977, iter_time=8.97s]
Epoch 1: 49%|████▊ | 6035/12384 [12:48:12<13:40:42, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=4.03s]
Epoch 1: 49%|████▊ | 6036/12384 [12:48:12<13:35:44, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.03s]
Epoch 1: 49%|████▊ | 6036/12384 [12:48:20<13:35:44, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=11.17s]
Epoch 1: 49%|████▊ | 6037/12384 [12:48:20<13:32:04, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=11.17s]
Epoch 1: 49%|████▊ | 6037/12384 [12:48:28<13:32:04, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 49%|████▉ | 6038/12384 [12:48:28<13:29:51, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 49%|████▉ | 6038/12384 [12:48:35<13:29:51, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 49%|████▉ | 6039/12384 [12:48:35<13:27:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 49%|████▉ | 6039/12384 [12:48:43<13:27:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.77s]
Epoch 1: 49%|████▉ | 6040/12384 [12:48:43<13:26:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.77s]
Epoch 1: 49%|████▉ | 6040/12384 [12:48:50<13:26:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.54s]
Epoch 1: 49%|████▉ | 6041/12384 [12:48:50<13:26:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.54s]
Epoch 1: 49%|████▉ | 6041/12384 [12:48:59<13:26:06, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.33s]
Epoch 1: 49%|████▉ | 6042/12384 [12:48:59<13:48:18, 7.84s/it, loss=0.0001, acc=1.0000, iter_time=7.33s]
Epoch 1: 49%|████▉ | 6042/12384 [12:49:06<13:48:18, 7.84s/it, loss=0.0001, acc=1.0000, iter_time=9.58s]
Epoch 1: 49%|████▉ | 6043/12384 [12:49:06<13:44:16, 7.80s/it, loss=0.0001, acc=1.0000, iter_time=9.58s]
Epoch 1: 49%|████▉ | 6043/12384 [12:49:14<13:44:16, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=4.05s]
Epoch 1: 49%|████▉ | 6044/12384 [12:49:14<13:38:42, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=4.05s]
Epoch 1: 49%|████▉ | 6044/12384 [12:49:22<13:38:42, 7.75s/it, loss=0.0011, acc=0.9988, iter_time=7.92s]
Epoch 1: 49%|████▉ | 6045/12384 [12:49:22<13:34:53, 7.71s/it, loss=0.0011, acc=0.9988, iter_time=7.92s]
Epoch 1: 49%|████▉ | 6045/12384 [12:49:29<13:34:53, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.95s]
Epoch 1: 49%|████▉ | 6046/12384 [12:49:29<13:31:42, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.95s]
Epoch 1: 49%|████▉ | 6046/12384 [12:49:37<13:31:42, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 1: 49%|████▉ | 6047/12384 [12:49:37<13:29:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 1: 49%|████▉ | 6047/12384 [12:49:45<13:29:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.80s]
Epoch 1: 49%|████▉ | 6048/12384 [12:49:45<13:27:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.80s]
Epoch 1: 49%|████▉ | 6048/12384 [12:49:52<13:27:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 49%|████▉ | 6049/12384 [12:49:52<13:27:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 49%|████▉ | 6049/12384 [12:50:00<13:27:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.27s]
Epoch 1: 49%|████▉ | 6050/12384 [12:50:00<13:28:44, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.27s]
Epoch 1: 49%|████▉ | 6050/12384 [12:50:08<13:28:44, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=11.11s]
Epoch 1: 49%|████▉ | 6051/12384 [12:50:08<13:37:59, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=11.11s]
Epoch 1: 49%|████▉ | 6051/12384 [12:50:15<13:37:59, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 49%|████▉ | 6052/12384 [12:50:15<13:33:04, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 49%|████▉ | 6052/12384 [12:50:23<13:33:04, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=5.83s]
Epoch 1: 49%|████▉ | 6053/12384 [12:50:23<13:29:40, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=5.83s]
Epoch 1: 49%|████▉ | 6053/12384 [12:50:31<13:29:40, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 1: 49%|████▉ | 6054/12384 [12:50:31<13:28:10, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 1: 49%|████▉ | 6054/12384 [12:50:38<13:28:10, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 49%|████▉ | 6055/12384 [12:50:38<13:25:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 49%|████▉ | 6055/12384 [12:50:46<13:25:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 49%|████▉ | 6056/12384 [12:50:46<13:24:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 49%|████▉ | 6056/12384 [12:50:53<13:24:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.44s]
Epoch 1: 49%|████▉ | 6057/12384 [12:50:53<13:24:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.44s]
Epoch 1: 49%|████▉ | 6057/12384 [12:51:01<13:24:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 1: 49%|████▉ | 6058/12384 [12:51:01<13:23:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 1: 49%|████▉ | 6058/12384 [12:51:09<13:23:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 49%|████▉ | 6059/12384 [12:51:09<13:22:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 49%|████▉ | 6059/12384 [12:51:16<13:22:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 49%|████▉ | 6060/12384 [12:51:16<13:22:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 49%|████▉ | 6060/12384 [12:51:24<13:22:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 49%|████▉ | 6061/12384 [12:51:24<13:30:25, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 49%|████▉ | 6061/12384 [12:51:32<13:30:25, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 1: 49%|████▉ | 6062/12384 [12:51:32<13:26:43, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 1: 49%|████▉ | 6062/12384 [12:51:39<13:26:43, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=8.53s]
Epoch 1: 49%|████▉ | 6063/12384 [12:51:39<13:25:26, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.53s]
Epoch 1: 49%|████▉ | 6063/12384 [12:51:47<13:25:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 49%|████▉ | 6064/12384 [12:51:47<13:24:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 49%|████▉ | 6064/12384 [12:51:55<13:24:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 49%|████▉ | 6065/12384 [12:51:55<13:24:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 49%|████▉ | 6065/12384 [12:52:02<13:24:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 1: 49%|████▉ | 6066/12384 [12:52:02<13:23:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 1: 49%|████▉ | 6066/12384 [12:52:10<13:23:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 49%|████▉ | 6067/12384 [12:52:10<13:24:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 49%|████▉ | 6067/12384 [12:52:17<13:24:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 49%|████▉ | 6068/12384 [12:52:17<13:22:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 49%|████▉ | 6068/12384 [12:52:25<13:22:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 49%|████▉ | 6069/12384 [12:52:25<13:22:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 49%|████▉ | 6069/12384 [12:52:33<13:22:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 49%|████▉ | 6070/12384 [12:52:33<13:22:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 49%|████▉ | 6070/12384 [12:52:40<13:22:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 1: 49%|████▉ | 6071/12384 [12:52:40<13:21:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 1: 49%|████▉ | 6071/12384 [12:52:48<13:21:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 1: 49%|████▉ | 6072/12384 [12:52:48<13:21:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 1: 49%|████▉ | 6072/12384 [12:52:56<13:21:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 49%|████▉ | 6073/12384 [12:52:56<13:21:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 49%|████▉ | 6073/12384 [12:53:03<13:21:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 1: 49%|████▉ | 6074/12384 [12:53:03<13:21:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 1: 49%|████▉ | 6074/12384 [12:53:11<13:21:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.55s]
Epoch 1: 49%|████▉ | 6075/12384 [12:53:11<13:19:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.55s]
Epoch 1: 49%|████▉ | 6075/12384 [12:53:18<13:19:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.49s]
Epoch 1: 49%|████▉ | 6076/12384 [12:53:18<13:19:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.49s]
Epoch 1: 49%|████▉ | 6076/12384 [12:53:26<13:19:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.61s]
Epoch 1: 49%|████▉ | 6077/12384 [12:53:26<13:29:47, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.61s]
Epoch 1: 49%|████▉ | 6077/12384 [12:53:34<13:29:47, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 49%|████▉ | 6078/12384 [12:53:34<13:26:38, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 49%|████▉ | 6078/12384 [12:53:41<13:26:38, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 49%|████▉ | 6079/12384 [12:53:41<13:24:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 49%|████▉ | 6079/12384 [12:53:49<13:24:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 49%|████▉ | 6080/12384 [12:53:49<13:23:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 49%|████▉ | 6080/12384 [12:53:57<13:23:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=3.50s]
Epoch 1: 49%|████▉ | 6081/12384 [12:53:57<13:23:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=3.50s]
Epoch 1: 49%|████▉ | 6081/12384 [12:54:04<13:23:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.36s]
Epoch 1: 49%|████▉ | 6082/12384 [12:54:04<13:24:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=11.36s]
Epoch 1: 49%|████▉ | 6082/12384 [12:54:12<13:24:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 1: 49%|████▉ | 6083/12384 [12:54:12<13:22:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 1: 49%|████▉ | 6083/12384 [12:54:20<13:22:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 49%|████▉ | 6084/12384 [12:54:20<13:21:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 49%|████▉ | 6084/12384 [12:54:27<13:21:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 49%|████▉ | 6085/12384 [12:54:27<13:20:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 49%|████▉ | 6085/12384 [12:54:35<13:20:55, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 49%|████▉ | 6086/12384 [12:54:35<13:20:26, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 49%|████▉ | 6086/12384 [12:54:43<13:20:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 49%|████▉ | 6087/12384 [12:54:43<13:19:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 49%|████▉ | 6087/12384 [12:54:50<13:19:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 1: 49%|████▉ | 6088/12384 [12:54:50<13:19:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 1: 49%|████▉ | 6088/12384 [12:54:58<13:19:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 49%|████▉ | 6089/12384 [12:54:58<13:18:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 49%|████▉ | 6089/12384 [12:55:05<13:18:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.85s]
Epoch 1: 49%|████▉ | 6090/12384 [12:55:05<13:21:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.85s]
Epoch 1: 49%|████▉ | 6090/12384 [12:55:13<13:21:19, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=10.46s]
Epoch 1: 49%|████▉ | 6091/12384 [12:55:13<13:20:16, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=10.46s]
Epoch 1: 49%|████▉ | 6091/12384 [12:55:21<13:20:16, 7.63s/it, loss=0.0016, acc=0.9963, iter_time=7.70s]
Epoch 1: 49%|████▉ | 6092/12384 [12:55:21<13:22:08, 7.65s/it, loss=0.0016, acc=0.9963, iter_time=7.70s]
Epoch 1: 49%|████▉ | 6092/12384 [12:55:28<13:22:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 49%|████▉ | 6093/12384 [12:55:28<13:20:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 49%|████▉ | 6093/12384 [12:55:36<13:20:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 1: 49%|████▉ | 6094/12384 [12:55:36<13:25:07, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 1: 49%|████▉ | 6094/12384 [12:55:44<13:25:07, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.80s]
Epoch 1: 49%|████▉ | 6095/12384 [12:55:44<13:22:31, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.80s]
Epoch 1: 49%|████▉ | 6095/12384 [12:55:51<13:22:31, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 49%|████▉ | 6096/12384 [12:55:51<13:20:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 49%|████▉ | 6096/12384 [12:55:59<13:20:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 1: 49%|████▉ | 6097/12384 [12:55:59<13:20:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 1: 49%|████▉ | 6097/12384 [12:56:07<13:20:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 1: 49%|████▉ | 6098/12384 [12:56:07<13:20:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 1: 49%|████▉ | 6098/12384 [12:56:14<13:20:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 1: 49%|████▉ | 6099/12384 [12:56:14<13:19:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 1: 49%|████▉ | 6099/12384 [12:56:22<13:19:42, 7.63s/it, loss=0.0003, acc=0.9983, iter_time=7.60s]
Epoch 1: 49%|████▉ | 6100/12384 [12:56:22<13:18:26, 7.62s/it, loss=0.0003, acc=0.9983, iter_time=7.60s]
Epoch 1: 49%|████▉ | 6100/12384 [12:56:29<13:18:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 49%|████▉ | 6101/12384 [12:56:29<13:19:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 49%|████▉ | 6101/12384 [12:56:37<13:19:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 49%|████▉ | 6102/12384 [12:56:37<13:21:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 49%|████▉ | 6102/12384 [12:56:45<13:21:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 1: 49%|████▉ | 6103/12384 [12:56:45<13:42:16, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 1: 49%|████▉ | 6103/12384 [12:56:54<13:42:16, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 1: 49%|████▉ | 6104/12384 [12:56:54<13:49:35, 7.93s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 1: 49%|████▉ | 6104/12384 [12:57:01<13:49:35, 7.93s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 49%|████▉ | 6105/12384 [12:57:01<13:42:31, 7.86s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 49%|████▉ | 6105/12384 [12:57:09<13:42:31, 7.86s/it, loss=0.0000, acc=1.0000, iter_time=3.83s]
Epoch 1: 49%|████▉ | 6106/12384 [12:57:09<13:34:33, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=3.83s]
Epoch 1: 49%|████▉ | 6106/12384 [12:57:17<13:34:33, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=11.46s]
Epoch 1: 49%|████▉ | 6107/12384 [12:57:17<13:30:48, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=11.46s]
Epoch 1: 49%|████▉ | 6107/12384 [12:57:24<13:30:48, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 1: 49%|████▉ | 6108/12384 [12:57:24<13:26:00, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 1: 49%|████▉ | 6108/12384 [12:57:32<13:26:00, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 1: 49%|████▉ | 6109/12384 [12:57:32<13:22:53, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 1: 49%|████▉ | 6109/12384 [12:57:39<13:22:53, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=7.61s]
Epoch 1: 49%|████▉ | 6110/12384 [12:57:39<13:20:33, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.61s]
Epoch 1: 49%|████▉ | 6110/12384 [12:57:47<13:20:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 49%|████▉ | 6111/12384 [12:57:47<13:19:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 49%|████▉ | 6111/12384 [12:57:55<13:19:15, 7.64s/it, loss=0.0003, acc=0.9991, iter_time=8.02s]
Epoch 1: 49%|████▉ | 6112/12384 [12:57:55<13:19:28, 7.65s/it, loss=0.0003, acc=0.9991, iter_time=8.02s]
Epoch 1: 49%|████▉ | 6112/12384 [12:58:02<13:19:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.22s]
Epoch 1: 49%|████▉ | 6113/12384 [12:58:02<13:18:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.22s]
Epoch 1: 49%|████▉ | 6113/12384 [12:58:10<13:18:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 49%|████▉ | 6114/12384 [12:58:10<13:27:55, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 49%|████▉ | 6114/12384 [12:58:18<13:27:55, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=9.61s]
Epoch 1: 49%|████▉ | 6115/12384 [12:58:18<13:24:58, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.61s]
Epoch 1: 49%|████▉ | 6115/12384 [12:58:26<13:24:58, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 1: 49%|████▉ | 6116/12384 [12:58:26<13:40:47, 7.86s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 1: 49%|████▉ | 6116/12384 [12:58:34<13:40:47, 7.86s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 1: 49%|████▉ | 6117/12384 [12:58:34<13:47:44, 7.92s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 1: 49%|████▉ | 6117/12384 [12:58:42<13:47:44, 7.92s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 49%|████▉ | 6118/12384 [12:58:42<13:39:46, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 49%|████▉ | 6118/12384 [12:58:49<13:39:46, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=7.11s]
Epoch 1: 49%|████▉ | 6119/12384 [12:58:49<13:32:21, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=7.11s]
Epoch 1: 49%|████▉ | 6119/12384 [12:58:57<13:32:21, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 49%|████▉ | 6120/12384 [12:58:57<13:28:38, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 49%|████▉ | 6120/12384 [12:59:05<13:28:38, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 49%|████▉ | 6121/12384 [12:59:05<13:25:02, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 49%|████▉ | 6121/12384 [12:59:12<13:25:02, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.12s]
Epoch 1: 49%|████▉ | 6122/12384 [12:59:12<13:22:02, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.12s]
Epoch 1: 49%|████▉ | 6122/12384 [12:59:20<13:22:02, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 1: 49%|████▉ | 6123/12384 [12:59:20<13:19:32, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 1: 49%|████▉ | 6123/12384 [12:59:28<13:19:32, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 1: 49%|████▉ | 6124/12384 [12:59:28<13:16:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 1: 49%|████▉ | 6124/12384 [12:59:35<13:16:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 49%|████▉ | 6125/12384 [12:59:35<13:15:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 49%|████▉ | 6125/12384 [12:59:43<13:15:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 49%|████▉ | 6126/12384 [12:59:43<13:14:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 49%|████▉ | 6126/12384 [12:59:50<13:14:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 49%|████▉ | 6127/12384 [12:59:50<13:14:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 49%|████▉ | 6127/12384 [12:59:58<13:14:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 49%|████▉ | 6128/12384 [12:59:58<13:14:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 49%|████▉ | 6128/12384 [13:00:06<13:14:06, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=7.23s]
Epoch 1: 49%|████▉ | 6129/12384 [13:00:06<13:13:49, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=7.23s]
Epoch 1: 49%|████▉ | 6129/12384 [13:00:14<13:13:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 49%|████▉ | 6130/12384 [13:00:14<13:24:13, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 49%|████▉ | 6130/12384 [13:00:21<13:24:13, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 50%|████▉ | 6131/12384 [13:00:21<13:21:10, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 50%|████▉ | 6131/12384 [13:00:29<13:21:10, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 1: 50%|████▉ | 6132/12384 [13:00:29<13:20:41, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 1: 50%|████▉ | 6132/12384 [13:00:36<13:20:41, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 1: 50%|████▉ | 6133/12384 [13:00:36<13:18:02, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 1: 50%|████▉ | 6133/12384 [13:00:44<13:18:02, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 50%|████▉ | 6134/12384 [13:00:44<13:16:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 50%|████▉ | 6134/12384 [13:00:52<13:16:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 50%|████▉ | 6135/12384 [13:00:52<13:14:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 50%|████▉ | 6135/12384 [13:00:59<13:14:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 50%|████▉ | 6136/12384 [13:00:59<13:14:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 50%|████▉ | 6136/12384 [13:01:07<13:14:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 50%|████▉ | 6137/12384 [13:01:07<13:14:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 50%|████▉ | 6137/12384 [13:01:15<13:14:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 50%|████▉ | 6138/12384 [13:01:15<13:13:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 50%|████▉ | 6138/12384 [13:01:22<13:13:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 50%|████▉ | 6139/12384 [13:01:22<13:13:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 50%|████▉ | 6139/12384 [13:01:30<13:13:40, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=5.66s]
Epoch 1: 50%|████▉ | 6140/12384 [13:01:30<13:13:02, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=5.66s]
Epoch 1: 50%|████▉ | 6140/12384 [13:01:37<13:13:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.85s]
Epoch 1: 50%|████▉ | 6141/12384 [13:01:37<13:15:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.85s]
Epoch 1: 50%|████▉ | 6141/12384 [13:01:45<13:15:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 50%|████▉ | 6142/12384 [13:01:45<13:15:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 50%|████▉ | 6142/12384 [13:01:53<13:15:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 50%|████▉ | 6143/12384 [13:01:53<13:13:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 50%|████▉ | 6143/12384 [13:02:00<13:13:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 50%|████▉ | 6144/12384 [13:02:00<13:12:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 50%|████▉ | 6144/12384 [13:02:08<13:12:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 50%|████▉ | 6145/12384 [13:02:08<13:12:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 50%|████▉ | 6145/12384 [13:02:16<13:12:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 1: 50%|████▉ | 6146/12384 [13:02:16<13:12:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 1: 50%|████▉ | 6146/12384 [13:02:23<13:12:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 50%|████▉ | 6147/12384 [13:02:23<13:12:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 50%|████▉ | 6147/12384 [13:02:31<13:12:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 1: 50%|████▉ | 6148/12384 [13:02:31<13:11:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 1: 50%|████▉ | 6148/12384 [13:02:38<13:11:39, 7.62s/it, loss=0.0016, acc=0.9970, iter_time=4.00s]
Epoch 1: 50%|████▉ | 6149/12384 [13:02:38<13:11:19, 7.61s/it, loss=0.0016, acc=0.9970, iter_time=4.00s]
Epoch 1: 50%|████▉ | 6149/12384 [13:02:46<13:11:19, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=11.22s]
Epoch 1: 50%|████▉ | 6150/12384 [13:02:46<13:11:19, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=11.22s]
Epoch 1: 50%|████▉ | 6150/12384 [13:02:54<13:11:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 1: 50%|████▉ | 6151/12384 [13:02:54<13:11:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 1: 50%|████▉ | 6151/12384 [13:03:01<13:11:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.94s]
Epoch 1: 50%|████▉ | 6152/12384 [13:03:01<13:10:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.94s]
Epoch 1: 50%|████▉ | 6152/12384 [13:03:09<13:10:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 50%|████▉ | 6153/12384 [13:03:09<13:10:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 50%|████▉ | 6153/12384 [13:03:16<13:10:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.64s]
Epoch 1: 50%|████▉ | 6154/12384 [13:03:16<13:10:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.64s]
Epoch 1: 50%|████▉ | 6154/12384 [13:03:24<13:10:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 1: 50%|████▉ | 6155/12384 [13:03:24<13:10:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 1: 50%|████▉ | 6155/12384 [13:03:32<13:10:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 50%|████▉ | 6156/12384 [13:03:32<13:10:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 50%|████▉ | 6156/12384 [13:03:40<13:10:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 1: 50%|████▉ | 6157/12384 [13:03:40<13:20:53, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 1: 50%|████▉ | 6157/12384 [13:03:47<13:20:53, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 50%|████▉ | 6158/12384 [13:03:47<13:20:05, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 50%|████▉ | 6158/12384 [13:03:55<13:20:05, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.71s]
Epoch 1: 50%|████▉ | 6159/12384 [13:03:55<13:17:17, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.71s]
Epoch 1: 50%|████▉ | 6159/12384 [13:04:03<13:17:17, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 50%|████▉ | 6160/12384 [13:04:03<13:15:29, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 50%|████▉ | 6160/12384 [13:04:10<13:15:29, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 50%|████▉ | 6161/12384 [13:04:10<13:14:15, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 50%|████▉ | 6161/12384 [13:04:18<13:14:15, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=3.21s]
Epoch 1: 50%|████▉ | 6162/12384 [13:04:18<13:12:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=3.21s]
Epoch 1: 50%|████▉ | 6162/12384 [13:04:25<13:12:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=12.03s]
Epoch 1: 50%|████▉ | 6163/12384 [13:04:25<13:11:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=12.03s]
Epoch 1: 50%|████▉ | 6163/12384 [13:04:33<13:11:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 1: 50%|████▉ | 6164/12384 [13:04:33<13:10:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 1: 50%|████▉ | 6164/12384 [13:04:41<13:10:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 1: 50%|████▉ | 6165/12384 [13:04:41<13:18:29, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 1: 50%|████▉ | 6165/12384 [13:04:49<13:18:29, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 50%|████▉ | 6166/12384 [13:04:49<13:15:42, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 50%|████▉ | 6166/12384 [13:04:56<13:15:42, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.02s]
Epoch 1: 50%|████▉ | 6167/12384 [13:04:56<13:13:49, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.02s]
Epoch 1: 50%|████▉ | 6167/12384 [13:05:04<13:13:49, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=9.19s]
Epoch 1: 50%|████▉ | 6168/12384 [13:05:04<13:12:32, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=9.19s]
Epoch 1: 50%|████▉ | 6168/12384 [13:05:11<13:12:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 50%|████▉ | 6169/12384 [13:05:11<13:11:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 50%|████▉ | 6169/12384 [13:05:19<13:11:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 50%|████▉ | 6170/12384 [13:05:19<13:10:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 50%|████▉ | 6170/12384 [13:05:27<13:10:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 50%|████▉ | 6171/12384 [13:05:27<13:10:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 50%|████▉ | 6171/12384 [13:05:34<13:10:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 1: 50%|████▉ | 6172/12384 [13:05:34<13:09:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 1: 50%|████▉ | 6172/12384 [13:05:42<13:09:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 1: 50%|████▉ | 6173/12384 [13:05:42<13:08:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 1: 50%|████▉ | 6173/12384 [13:05:50<13:08:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 1: 50%|████▉ | 6174/12384 [13:05:50<13:08:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 1: 50%|████▉ | 6174/12384 [13:05:57<13:08:36, 7.62s/it, loss=0.0007, acc=0.9990, iter_time=9.91s]
Epoch 1: 50%|████▉ | 6175/12384 [13:05:57<13:08:27, 7.62s/it, loss=0.0007, acc=0.9990, iter_time=9.91s]
Epoch 1: 50%|████▉ | 6175/12384 [13:06:05<13:08:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 50%|████▉ | 6176/12384 [13:06:05<13:09:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 50%|████▉ | 6176/12384 [13:06:12<13:09:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 50%|████▉ | 6177/12384 [13:06:12<13:08:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 50%|████▉ | 6177/12384 [13:06:20<13:08:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 50%|████▉ | 6178/12384 [13:06:20<13:07:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 50%|████▉ | 6178/12384 [13:06:28<13:07:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 50%|████▉ | 6179/12384 [13:06:28<13:10:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 50%|████▉ | 6179/12384 [13:06:35<13:10:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.64s]
Epoch 1: 50%|████▉ | 6180/12384 [13:06:35<13:09:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.64s]
Epoch 1: 50%|████▉ | 6180/12384 [13:06:43<13:09:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 50%|████▉ | 6181/12384 [13:06:43<13:10:58, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 50%|████▉ | 6181/12384 [13:06:51<13:10:58, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.64s]
Epoch 1: 50%|████▉ | 6182/12384 [13:06:51<13:09:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.64s]
Epoch 1: 50%|████▉ | 6182/12384 [13:06:59<13:09:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.89s]
Epoch 1: 50%|████▉ | 6183/12384 [13:06:59<13:19:36, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.89s]
Epoch 1: 50%|████▉ | 6183/12384 [13:07:06<13:19:36, 7.74s/it, loss=0.0001, acc=0.9988, iter_time=9.79s]
Epoch 1: 50%|████▉ | 6184/12384 [13:07:06<13:15:13, 7.70s/it, loss=0.0001, acc=0.9988, iter_time=9.79s]
Epoch 1: 50%|████▉ | 6184/12384 [13:07:14<13:15:13, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 1: 50%|████▉ | 6185/12384 [13:07:14<13:11:49, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 1: 50%|████▉ | 6185/12384 [13:07:21<13:11:49, 7.66s/it, loss=0.0002, acc=0.9983, iter_time=6.67s]
Epoch 1: 50%|████▉ | 6186/12384 [13:07:21<13:09:39, 7.64s/it, loss=0.0002, acc=0.9983, iter_time=6.67s]
Epoch 1: 50%|████▉ | 6186/12384 [13:07:29<13:09:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 50%|████▉ | 6187/12384 [13:07:29<13:08:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 50%|████▉ | 6187/12384 [13:07:37<13:08:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 50%|████▉ | 6188/12384 [13:07:37<13:07:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 50%|████▉ | 6188/12384 [13:07:44<13:07:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 50%|████▉ | 6189/12384 [13:07:44<13:07:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 50%|████▉ | 6189/12384 [13:07:52<13:07:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 1: 50%|████▉ | 6190/12384 [13:07:52<13:06:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 1: 50%|████▉ | 6190/12384 [13:08:00<13:06:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 1: 50%|████▉ | 6191/12384 [13:08:00<13:14:29, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 1: 50%|████▉ | 6191/12384 [13:08:07<13:14:29, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 50%|█████ | 6192/12384 [13:08:07<13:15:02, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 50%|█████ | 6192/12384 [13:08:15<13:15:02, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 50%|█████ | 6193/12384 [13:08:15<13:12:24, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 50%|█████ | 6193/12384 [13:08:23<13:12:24, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 50%|█████ | 6194/12384 [13:08:23<13:10:15, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 50%|█████ | 6194/12384 [13:08:30<13:10:15, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 50%|█████ | 6195/12384 [13:08:30<13:09:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 50%|█████ | 6195/12384 [13:08:38<13:09:03, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 1: 50%|█████ | 6196/12384 [13:08:38<13:07:20, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 1: 50%|█████ | 6196/12384 [13:08:45<13:07:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 50%|█████ | 6197/12384 [13:08:45<13:05:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 50%|█████ | 6197/12384 [13:08:53<13:05:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.52s]
Epoch 1: 50%|█████ | 6198/12384 [13:08:53<13:09:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.52s]
Epoch 1: 50%|█████ | 6198/12384 [13:09:01<13:09:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.88s]
Epoch 1: 50%|█████ | 6199/12384 [13:09:01<13:13:19, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.88s]
Epoch 1: 50%|█████ | 6199/12384 [13:09:09<13:13:19, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 1: 50%|█████ | 6200/12384 [13:09:09<13:13:03, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 1: 50%|█████ | 6200/12384 [13:09:16<13:13:03, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 50%|█████ | 6201/12384 [13:09:16<13:12:14, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 50%|█████ | 6201/12384 [13:09:24<13:12:14, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 1: 50%|█████ | 6202/12384 [13:09:24<13:09:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 1: 50%|█████ | 6202/12384 [13:09:32<13:09:29, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=4.74s]
Epoch 1: 50%|█████ | 6203/12384 [13:09:32<13:08:01, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=4.74s]
Epoch 1: 50%|█████ | 6203/12384 [13:09:39<13:08:01, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.25s]
Epoch 1: 50%|█████ | 6204/12384 [13:09:39<13:06:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.25s]
Epoch 1: 50%|█████ | 6204/12384 [13:09:47<13:06:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.97s]
Epoch 1: 50%|█████ | 6205/12384 [13:09:47<13:05:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.97s]
Epoch 1: 50%|█████ | 6205/12384 [13:09:54<13:05:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 50%|█████ | 6206/12384 [13:09:54<13:04:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 50%|█████ | 6206/12384 [13:10:02<13:04:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.48s]
Epoch 1: 50%|█████ | 6207/12384 [13:10:02<13:04:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.48s]
Epoch 1: 50%|█████ | 6207/12384 [13:10:10<13:04:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 50%|█████ | 6208/12384 [13:10:10<13:04:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 50%|█████ | 6208/12384 [13:10:18<13:04:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 50%|█████ | 6209/12384 [13:10:18<13:14:17, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 50%|█████ | 6209/12384 [13:10:25<13:14:17, 7.72s/it, loss=0.0001, acc=0.9994, iter_time=8.02s]
Epoch 1: 50%|█████ | 6210/12384 [13:10:25<13:14:27, 7.72s/it, loss=0.0001, acc=0.9994, iter_time=8.02s]
Epoch 1: 50%|█████ | 6210/12384 [13:10:33<13:14:27, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.81s]
Epoch 1: 50%|█████ | 6211/12384 [13:10:33<13:15:31, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.81s]
Epoch 1: 50%|█████ | 6211/12384 [13:10:41<13:15:31, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 1: 50%|█████ | 6212/12384 [13:10:41<13:12:10, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 1: 50%|█████ | 6212/12384 [13:10:48<13:12:10, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=4.57s]
Epoch 1: 50%|█████ | 6213/12384 [13:10:48<13:09:25, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=4.57s]
Epoch 1: 50%|█████ | 6213/12384 [13:10:56<13:09:25, 7.68s/it, loss=0.0028, acc=0.9983, iter_time=10.67s]
Epoch 1: 50%|█████ | 6214/12384 [13:10:56<13:07:56, 7.66s/it, loss=0.0028, acc=0.9983, iter_time=10.67s]
Epoch 1: 50%|█████ | 6214/12384 [13:11:04<13:07:56, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 1: 50%|█████ | 6215/12384 [13:11:04<13:06:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 1: 50%|█████ | 6215/12384 [13:11:11<13:06:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.87s]
Epoch 1: 50%|█████ | 6216/12384 [13:11:11<13:07:32, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.87s]
Epoch 1: 50%|█████ | 6216/12384 [13:11:19<13:07:32, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 50%|█████ | 6217/12384 [13:11:19<13:05:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 50%|█████ | 6217/12384 [13:11:27<13:05:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 50%|█████ | 6218/12384 [13:11:27<13:13:18, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 50%|█████ | 6218/12384 [13:11:34<13:13:18, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 50%|█████ | 6219/12384 [13:11:34<13:09:52, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 50%|█████ | 6219/12384 [13:11:42<13:09:52, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 1: 50%|█████ | 6220/12384 [13:11:42<13:06:47, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 1: 50%|█████ | 6220/12384 [13:11:50<13:06:47, 7.66s/it, loss=0.0013, acc=0.9940, iter_time=8.17s]
Epoch 1: 50%|█████ | 6221/12384 [13:11:50<13:05:11, 7.64s/it, loss=0.0013, acc=0.9940, iter_time=8.17s]
Epoch 1: 50%|█████ | 6221/12384 [13:11:57<13:05:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 1: 50%|█████ | 6222/12384 [13:11:57<13:04:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 1: 50%|█████ | 6222/12384 [13:12:05<13:04:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.50s]
Epoch 1: 50%|█████ | 6223/12384 [13:12:05<13:03:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.50s]
Epoch 1: 50%|█████ | 6223/12384 [13:12:12<13:03:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.72s]
Epoch 1: 50%|█████ | 6224/12384 [13:12:12<13:03:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.72s]
Epoch 1: 50%|█████ | 6224/12384 [13:12:20<13:03:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.36s]
Epoch 1: 50%|█████ | 6225/12384 [13:12:20<13:02:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.36s]
Epoch 1: 50%|█████ | 6225/12384 [13:12:28<13:02:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.64s]
Epoch 1: 50%|█████ | 6226/12384 [13:12:28<13:03:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.64s]
Epoch 1: 50%|█████ | 6226/12384 [13:12:35<13:03:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 1: 50%|█████ | 6227/12384 [13:12:35<13:02:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 1: 50%|█████ | 6227/12384 [13:12:43<13:02:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 1: 50%|█████ | 6228/12384 [13:12:43<13:01:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 1: 50%|█████ | 6228/12384 [13:12:51<13:01:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.91s]
Epoch 1: 50%|█████ | 6229/12384 [13:12:51<13:02:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.91s]
Epoch 1: 50%|█████ | 6229/12384 [13:12:59<13:02:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.20s]
Epoch 1: 50%|█████ | 6230/12384 [13:12:59<13:12:19, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.20s]
Epoch 1: 50%|█████ | 6230/12384 [13:13:06<13:12:19, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 1: 50%|█████ | 6231/12384 [13:13:06<13:08:49, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 1: 50%|█████ | 6231/12384 [13:13:14<13:08:49, 7.69s/it, loss=0.0002, acc=0.9990, iter_time=10.57s]
Epoch 1: 50%|█████ | 6232/12384 [13:13:14<13:07:12, 7.68s/it, loss=0.0002, acc=0.9990, iter_time=10.57s]
Epoch 1: 50%|█████ | 6232/12384 [13:13:21<13:07:12, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 50%|█████ | 6233/12384 [13:13:21<13:04:49, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 50%|█████ | 6233/12384 [13:13:29<13:04:49, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 50%|█████ | 6234/12384 [13:13:29<13:05:12, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 50%|█████ | 6234/12384 [13:13:37<13:05:12, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 1: 50%|█████ | 6235/12384 [13:13:37<13:13:39, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 1: 50%|█████ | 6235/12384 [13:13:45<13:13:39, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 1: 50%|█████ | 6236/12384 [13:13:45<13:08:34, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 1: 50%|█████ | 6236/12384 [13:13:52<13:08:34, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 50%|█████ | 6237/12384 [13:13:52<13:05:23, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 50%|█████ | 6237/12384 [13:14:00<13:05:23, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 1: 50%|█████ | 6238/12384 [13:14:00<13:03:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 1: 50%|█████ | 6238/12384 [13:14:07<13:03:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 1: 50%|█████ | 6239/12384 [13:14:07<13:02:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 1: 50%|█████ | 6239/12384 [13:14:15<13:02:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 50%|█████ | 6240/12384 [13:14:15<13:00:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 50%|█████ | 6240/12384 [13:14:23<13:00:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.57s]
Epoch 1: 50%|█████ | 6241/12384 [13:14:23<13:02:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.57s]
Epoch 1: 50%|█████ | 6241/12384 [13:14:32<13:02:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 50%|█████ | 6242/12384 [13:14:32<13:46:51, 8.08s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 50%|█████ | 6242/12384 [13:14:40<13:46:51, 8.08s/it, loss=0.0000, acc=1.0000, iter_time=10.06s]
Epoch 1: 50%|█████ | 6243/12384 [13:14:40<13:41:20, 8.02s/it, loss=0.0000, acc=1.0000, iter_time=10.06s]
Epoch 1: 50%|█████ | 6243/12384 [13:14:48<13:41:20, 8.02s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 50%|█████ | 6244/12384 [13:14:48<13:37:15, 7.99s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 50%|█████ | 6244/12384 [13:14:57<13:37:15, 7.99s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 50%|█████ | 6245/12384 [13:14:57<14:08:25, 8.29s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 50%|█████ | 6245/12384 [13:15:04<14:08:25, 8.29s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 50%|█████ | 6246/12384 [13:15:04<13:47:46, 8.09s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 50%|█████ | 6246/12384 [13:15:12<13:47:46, 8.09s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 1: 50%|█████ | 6247/12384 [13:15:12<13:32:43, 7.95s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 1: 50%|█████ | 6247/12384 [13:15:19<13:32:43, 7.95s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 50%|█████ | 6248/12384 [13:15:19<13:22:19, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 50%|█████ | 6248/12384 [13:15:27<13:22:19, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 50%|█████ | 6249/12384 [13:15:27<13:16:49, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 50%|█████ | 6249/12384 [13:15:35<13:16:49, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 1: 50%|█████ | 6250/12384 [13:15:35<13:11:45, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 1: 50%|█████ | 6250/12384 [13:15:42<13:11:45, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 50%|█████ | 6251/12384 [13:15:42<13:07:48, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 50%|█████ | 6251/12384 [13:15:50<13:07:48, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 50%|█████ | 6252/12384 [13:15:50<13:04:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 50%|█████ | 6252/12384 [13:15:58<13:04:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 50%|█████ | 6253/12384 [13:15:58<13:02:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 50%|█████ | 6253/12384 [13:16:05<13:02:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 1: 51%|█████ | 6254/12384 [13:16:05<13:01:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 1: 51%|█████ | 6254/12384 [13:16:13<13:01:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 1: 51%|█████ | 6255/12384 [13:16:13<12:59:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 1: 51%|█████ | 6255/12384 [13:16:20<12:59:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 1: 51%|█████ | 6256/12384 [13:16:20<12:58:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 1: 51%|█████ | 6256/12384 [13:16:28<12:58:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 51%|█████ | 6257/12384 [13:16:28<12:58:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 51%|█████ | 6257/12384 [13:16:36<12:58:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 51%|█████ | 6258/12384 [13:16:36<12:58:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 51%|█████ | 6258/12384 [13:16:43<12:58:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 51%|█████ | 6259/12384 [13:16:43<12:58:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 51%|█████ | 6259/12384 [13:16:51<12:58:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 51%|█████ | 6260/12384 [13:16:51<12:58:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 51%|█████ | 6260/12384 [13:16:59<12:58:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 51%|█████ | 6261/12384 [13:16:59<13:09:47, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 51%|█████ | 6261/12384 [13:17:06<13:09:47, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 1: 51%|█████ | 6262/12384 [13:17:06<13:05:03, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 1: 51%|█████ | 6262/12384 [13:17:14<13:05:03, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 1: 51%|█████ | 6263/12384 [13:17:14<13:03:20, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 1: 51%|█████ | 6263/12384 [13:17:22<13:03:20, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 51%|█████ | 6264/12384 [13:17:22<13:00:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 51%|█████ | 6264/12384 [13:17:29<13:00:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 51%|█████ | 6265/12384 [13:17:29<12:59:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 51%|█████ | 6265/12384 [13:17:37<12:59:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 51%|█████ | 6266/12384 [13:17:37<12:57:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 51%|█████ | 6266/12384 [13:17:44<12:57:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 51%|█████ | 6267/12384 [13:17:44<12:57:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 51%|█████ | 6267/12384 [13:17:52<12:57:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 1: 51%|█████ | 6268/12384 [13:17:52<12:56:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 1: 51%|█████ | 6268/12384 [13:18:00<12:56:12, 7.61s/it, loss=0.0007, acc=0.9981, iter_time=7.60s]
Epoch 1: 51%|█████ | 6269/12384 [13:18:00<12:56:26, 7.62s/it, loss=0.0007, acc=0.9981, iter_time=7.60s]
Epoch 1: 51%|█████ | 6269/12384 [13:18:07<12:56:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 1: 51%|█████ | 6270/12384 [13:18:07<12:56:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 1: 51%|█████ | 6270/12384 [13:18:15<12:56:09, 7.62s/it, loss=0.0005, acc=0.9979, iter_time=10.20s]
Epoch 1: 51%|█████ | 6271/12384 [13:18:15<12:55:21, 7.61s/it, loss=0.0005, acc=0.9979, iter_time=10.20s]
Epoch 1: 51%|█████ | 6271/12384 [13:18:23<12:55:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 51%|█████ | 6272/12384 [13:18:23<12:56:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 51%|█████ | 6272/12384 [13:18:30<12:56:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 51%|█████ | 6273/12384 [13:18:30<12:55:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 51%|█████ | 6273/12384 [13:18:38<12:55:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.19s]
Epoch 1: 51%|█████ | 6274/12384 [13:18:38<12:54:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.19s]
Epoch 1: 51%|█████ | 6274/12384 [13:18:45<12:54:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.02s]
Epoch 1: 51%|█████ | 6275/12384 [13:18:45<12:54:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.02s]
Epoch 1: 51%|█████ | 6275/12384 [13:18:53<12:54:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 51%|█████ | 6276/12384 [13:18:53<12:55:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 51%|█████ | 6276/12384 [13:19:01<12:55:01, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.28s]
Epoch 1: 51%|█████ | 6277/12384 [13:19:01<12:54:31, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.28s]
Epoch 1: 51%|█████ | 6277/12384 [13:19:08<12:54:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 1: 51%|█████ | 6278/12384 [13:19:08<12:55:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 1: 51%|█████ | 6278/12384 [13:19:16<12:55:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 51%|█████ | 6279/12384 [13:19:16<12:54:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 51%|█████ | 6279/12384 [13:19:23<12:54:44, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.00s]
Epoch 1: 51%|█████ | 6280/12384 [13:19:23<12:55:12, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.00s]
Epoch 1: 51%|█████ | 6280/12384 [13:19:31<12:55:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 51%|█████ | 6281/12384 [13:19:31<12:55:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 51%|█████ | 6281/12384 [13:19:39<12:55:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 51%|█████ | 6282/12384 [13:19:39<12:54:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 51%|█████ | 6282/12384 [13:19:46<12:54:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 51%|█████ | 6283/12384 [13:19:46<12:54:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 51%|█████ | 6283/12384 [13:19:54<12:54:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 51%|█████ | 6284/12384 [13:19:54<12:56:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 51%|█████ | 6284/12384 [13:20:02<12:56:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.84s]
Epoch 1: 51%|█████ | 6285/12384 [13:20:02<12:55:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.84s]
Epoch 1: 51%|█████ | 6285/12384 [13:20:09<12:55:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 1: 51%|█████ | 6286/12384 [13:20:09<12:55:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 1: 51%|█████ | 6286/12384 [13:20:17<12:55:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 1: 51%|█████ | 6287/12384 [13:20:17<12:55:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 1: 51%|█████ | 6287/12384 [13:20:25<12:55:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 1: 51%|█████ | 6288/12384 [13:20:25<13:03:53, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 1: 51%|█████ | 6288/12384 [13:20:32<13:03:53, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 51%|█████ | 6289/12384 [13:20:32<12:59:54, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 51%|█████ | 6289/12384 [13:20:40<12:59:54, 7.68s/it, loss=0.0012, acc=0.9982, iter_time=7.60s]
Epoch 1: 51%|█████ | 6290/12384 [13:20:40<12:57:25, 7.65s/it, loss=0.0012, acc=0.9982, iter_time=7.60s]
Epoch 1: 51%|█████ | 6290/12384 [13:20:48<12:57:25, 7.65s/it, loss=0.0009, acc=0.9970, iter_time=7.59s]
Epoch 1: 51%|█████ | 6291/12384 [13:20:48<12:56:02, 7.64s/it, loss=0.0009, acc=0.9970, iter_time=7.59s]
Epoch 1: 51%|█████ | 6291/12384 [13:20:55<12:56:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 1: 51%|█████ | 6292/12384 [13:20:55<12:55:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 1: 51%|█████ | 6292/12384 [13:21:03<12:55:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.32s]
Epoch 1: 51%|█████ | 6293/12384 [13:21:03<12:54:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.32s]
Epoch 1: 51%|█████ | 6293/12384 [13:21:10<12:54:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 1: 51%|█████ | 6294/12384 [13:21:10<12:53:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 1: 51%|█████ | 6294/12384 [13:21:18<12:53:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 1: 51%|█████ | 6295/12384 [13:21:18<12:52:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 1: 51%|█████ | 6295/12384 [13:21:26<12:52:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.08s]
Epoch 1: 51%|█████ | 6296/12384 [13:21:26<13:01:08, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.08s]
Epoch 1: 51%|█████ | 6296/12384 [13:21:34<13:01:08, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.26s]
Epoch 1: 51%|█████ | 6297/12384 [13:21:34<12:57:41, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.26s]
Epoch 1: 51%|█████ | 6297/12384 [13:21:41<12:57:41, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 1: 51%|█████ | 6298/12384 [13:21:41<12:58:21, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 1: 51%|█████ | 6298/12384 [13:21:49<12:58:21, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 1: 51%|█████ | 6299/12384 [13:21:49<12:56:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 1: 51%|█████ | 6299/12384 [13:21:56<12:56:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 51%|█████ | 6300/12384 [13:21:56<12:54:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 51%|█████ | 6300/12384 [13:22:04<12:54:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 1: 51%|█████ | 6301/12384 [13:22:04<12:56:38, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 1: 51%|█████ | 6301/12384 [13:22:12<12:56:38, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.61s]
Epoch 1: 51%|█████ | 6302/12384 [13:22:12<12:54:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.61s]
Epoch 1: 51%|█████ | 6302/12384 [13:22:19<12:54:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 51%|█████ | 6303/12384 [13:22:19<12:53:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 51%|█████ | 6303/12384 [13:22:27<12:53:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 51%|█████ | 6304/12384 [13:22:27<12:52:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 51%|█████ | 6304/12384 [13:22:35<12:52:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.71s]
Epoch 1: 51%|█████ | 6305/12384 [13:22:35<12:52:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.71s]
Epoch 1: 51%|█████ | 6305/12384 [13:22:42<12:52:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 1: 51%|█████ | 6306/12384 [13:22:42<12:51:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 1: 51%|█████ | 6306/12384 [13:22:50<12:51:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 51%|█████ | 6307/12384 [13:22:50<12:51:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 51%|█████ | 6307/12384 [13:22:57<12:51:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.52s]
Epoch 1: 51%|█████ | 6308/12384 [13:22:57<12:51:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.52s]
Epoch 1: 51%|█████ | 6308/12384 [13:23:05<12:51:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 1: 51%|█████ | 6309/12384 [13:23:05<12:50:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 1: 51%|█████ | 6309/12384 [13:23:13<12:50:56, 7.61s/it, loss=0.0002, acc=0.9990, iter_time=7.62s]
Epoch 1: 51%|█████ | 6310/12384 [13:23:13<12:50:57, 7.62s/it, loss=0.0002, acc=0.9990, iter_time=7.62s]
Epoch 1: 51%|█████ | 6310/12384 [13:23:20<12:50:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 1: 51%|█████ | 6311/12384 [13:23:20<12:49:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 1: 51%|█████ | 6311/12384 [13:23:28<12:49:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.10s]
Epoch 1: 51%|█████ | 6312/12384 [13:23:28<12:50:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.10s]
Epoch 1: 51%|█████ | 6312/12384 [13:23:35<12:50:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 51%|█████ | 6313/12384 [13:23:35<12:50:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 51%|█████ | 6313/12384 [13:23:43<12:50:09, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.63s]
Epoch 1: 51%|█████ | 6314/12384 [13:23:43<12:58:54, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=4.63s]
Epoch 1: 51%|█████ | 6314/12384 [13:23:51<12:58:54, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 1: 51%|█████ | 6315/12384 [13:23:51<12:56:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 1: 51%|█████ | 6315/12384 [13:23:59<12:56:15, 7.67s/it, loss=0.0001, acc=0.9986, iter_time=8.01s]
Epoch 1: 51%|█████ | 6316/12384 [13:23:59<12:53:47, 7.65s/it, loss=0.0001, acc=0.9986, iter_time=8.01s]
Epoch 1: 51%|█████ | 6316/12384 [13:24:06<12:53:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.71s]
Epoch 1: 51%|█████ | 6317/12384 [13:24:06<12:52:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.71s]
Epoch 1: 51%|█████ | 6317/12384 [13:24:14<12:52:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 1: 51%|█████ | 6318/12384 [13:24:14<12:50:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 1: 51%|█████ | 6318/12384 [13:24:21<12:50:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 51%|█████ | 6319/12384 [13:24:21<12:49:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 51%|█████ | 6319/12384 [13:24:29<12:49:52, 7.62s/it, loss=0.0009, acc=0.9981, iter_time=8.07s]
Epoch 1: 51%|█████ | 6320/12384 [13:24:29<12:51:40, 7.64s/it, loss=0.0009, acc=0.9981, iter_time=8.07s]
Epoch 1: 51%|█████ | 6320/12384 [13:24:37<12:51:40, 7.64s/it, loss=0.0001, acc=0.9993, iter_time=7.21s]
Epoch 1: 51%|█████ | 6321/12384 [13:24:37<12:50:37, 7.63s/it, loss=0.0001, acc=0.9993, iter_time=7.21s]
Epoch 1: 51%|█████ | 6321/12384 [13:24:45<12:50:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 51%|█████ | 6322/12384 [13:24:45<12:59:54, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 51%|█████ | 6322/12384 [13:24:52<12:59:54, 7.72s/it, loss=0.0003, acc=0.9977, iter_time=4.30s]
Epoch 1: 51%|█████ | 6323/12384 [13:24:52<12:57:16, 7.69s/it, loss=0.0003, acc=0.9977, iter_time=4.30s]
Epoch 1: 51%|█████ | 6323/12384 [13:25:00<12:57:16, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.91s]
Epoch 1: 51%|█████ | 6324/12384 [13:25:00<12:54:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.91s]
Epoch 1: 51%|█████ | 6324/12384 [13:25:07<12:54:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=11.61s]
Epoch 1: 51%|█████ | 6325/12384 [13:25:07<12:53:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=11.61s]
Epoch 1: 51%|█████ | 6325/12384 [13:25:15<12:53:05, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.65s]
Epoch 1: 51%|█████ | 6326/12384 [13:25:15<12:51:48, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.65s]
Epoch 1: 51%|█████ | 6326/12384 [13:25:23<12:51:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 51%|█████ | 6327/12384 [13:25:23<12:50:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 51%|█████ | 6327/12384 [13:25:30<12:50:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 51%|█████ | 6328/12384 [13:25:30<12:49:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 51%|█████ | 6328/12384 [13:25:38<12:49:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 51%|█████ | 6329/12384 [13:25:38<12:48:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 51%|█████ | 6329/12384 [13:25:46<12:48:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 1: 51%|█████ | 6330/12384 [13:25:46<12:48:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 1: 51%|█████ | 6330/12384 [13:25:53<12:48:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 1: 51%|█████ | 6331/12384 [13:25:53<12:48:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 1: 51%|█████ | 6331/12384 [13:26:01<12:48:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 51%|█████ | 6332/12384 [13:26:01<12:48:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 51%|█████ | 6332/12384 [13:26:08<12:48:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.18s]
Epoch 1: 51%|█████ | 6333/12384 [13:26:08<12:48:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.18s]
Epoch 1: 51%|█████ | 6333/12384 [13:26:16<12:48:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=12.03s]
Epoch 1: 51%|█████ | 6334/12384 [13:26:16<12:47:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=12.03s]
Epoch 1: 51%|█████ | 6334/12384 [13:26:24<12:47:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 51%|█████ | 6335/12384 [13:26:24<12:47:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 51%|█████ | 6335/12384 [13:26:31<12:47:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 51%|█████ | 6336/12384 [13:26:31<12:47:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 51%|█████ | 6336/12384 [13:26:39<12:47:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 51%|█████ | 6337/12384 [13:26:39<12:47:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 51%|█████ | 6337/12384 [13:26:46<12:47:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 1: 51%|█████ | 6338/12384 [13:26:46<12:46:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 1: 51%|█████ | 6338/12384 [13:26:54<12:46:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 1: 51%|█████ | 6339/12384 [13:26:54<12:46:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 1: 51%|█████ | 6339/12384 [13:27:02<12:46:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 51%|█████ | 6340/12384 [13:27:02<12:46:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 51%|█████ | 6340/12384 [13:27:10<12:46:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 1: 51%|█████ | 6341/12384 [13:27:10<12:59:06, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 1: 51%|█████ | 6341/12384 [13:27:17<12:59:06, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=9.84s]
Epoch 1: 51%|█████ | 6342/12384 [13:27:17<12:57:03, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.84s]
Epoch 1: 51%|█████ | 6342/12384 [13:27:25<12:57:03, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 51%|█████ | 6343/12384 [13:27:25<12:53:37, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 51%|█████ | 6343/12384 [13:27:33<12:53:37, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 51%|█████ | 6344/12384 [13:27:33<12:51:27, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 51%|█████ | 6344/12384 [13:27:40<12:51:27, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 51%|█████ | 6345/12384 [13:27:40<12:50:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 51%|█████ | 6345/12384 [13:27:48<12:50:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 1: 51%|█████ | 6346/12384 [13:27:48<12:48:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 1: 51%|█████ | 6346/12384 [13:27:55<12:48:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 51%|█████▏ | 6347/12384 [13:27:55<12:47:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 51%|█████▏ | 6347/12384 [13:28:03<12:47:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 51%|█████▏ | 6348/12384 [13:28:03<12:56:41, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 51%|█████▏ | 6348/12384 [13:28:11<12:56:41, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 51%|█████▏ | 6349/12384 [13:28:11<12:53:24, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 51%|█████▏ | 6349/12384 [13:28:19<12:53:24, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 51%|█████▏ | 6350/12384 [13:28:19<12:52:18, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 51%|█████▏ | 6350/12384 [13:28:26<12:52:18, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 1: 51%|█████▏ | 6351/12384 [13:28:26<12:51:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 1: 51%|█████▏ | 6351/12384 [13:28:34<12:51:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 51%|█████▏ | 6352/12384 [13:28:34<12:49:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 51%|█████▏ | 6352/12384 [13:28:42<12:49:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=3.69s]
Epoch 1: 51%|█████▏ | 6353/12384 [13:28:42<12:48:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.69s]
Epoch 1: 51%|█████▏ | 6353/12384 [13:28:49<12:48:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.61s]
Epoch 1: 51%|█████▏ | 6354/12384 [13:28:49<12:46:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.61s]
Epoch 1: 51%|█████▏ | 6354/12384 [13:28:57<12:46:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 51%|█████▏ | 6355/12384 [13:28:57<12:46:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 51%|█████▏ | 6355/12384 [13:29:04<12:46:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 51%|█████▏ | 6356/12384 [13:29:04<12:45:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 51%|█████▏ | 6356/12384 [13:29:12<12:45:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 51%|█████▏ | 6357/12384 [13:29:12<12:44:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 51%|█████▏ | 6357/12384 [13:29:20<12:44:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 51%|█████▏ | 6358/12384 [13:29:20<12:44:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 51%|█████▏ | 6358/12384 [13:29:27<12:44:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 51%|█████▏ | 6359/12384 [13:29:27<12:46:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 51%|█████▏ | 6359/12384 [13:29:35<12:46:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 51%|█████▏ | 6360/12384 [13:29:35<12:49:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 51%|█████▏ | 6360/12384 [13:29:43<12:49:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 51%|█████▏ | 6361/12384 [13:29:43<12:47:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 51%|█████▏ | 6361/12384 [13:29:50<12:47:01, 7.64s/it, loss=0.0003, acc=0.9977, iter_time=7.60s]
Epoch 1: 51%|█████▏ | 6362/12384 [13:29:50<12:46:11, 7.63s/it, loss=0.0003, acc=0.9977, iter_time=7.60s]
Epoch 1: 51%|█████▏ | 6362/12384 [13:29:58<12:46:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 51%|█████▏ | 6363/12384 [13:29:58<12:45:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 51%|█████▏ | 6363/12384 [13:30:05<12:45:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 51%|█████▏ | 6364/12384 [13:30:05<12:45:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 51%|█████▏ | 6364/12384 [13:30:13<12:45:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 51%|█████▏ | 6365/12384 [13:30:13<12:45:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 51%|█████▏ | 6365/12384 [13:30:21<12:45:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.61s]
Epoch 1: 51%|█████▏ | 6366/12384 [13:30:21<13:03:04, 7.81s/it, loss=0.0000, acc=1.0000, iter_time=8.61s]
Epoch 1: 51%|█████▏ | 6366/12384 [13:30:29<13:03:04, 7.81s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 1: 51%|█████▏ | 6367/12384 [13:30:29<13:11:25, 7.89s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 1: 51%|█████▏ | 6367/12384 [13:30:37<13:11:25, 7.89s/it, loss=0.0000, acc=1.0000, iter_time=8.38s]
Epoch 1: 51%|█████▏ | 6368/12384 [13:30:37<13:04:38, 7.83s/it, loss=0.0000, acc=1.0000, iter_time=8.38s]
Epoch 1: 51%|█████▏ | 6368/12384 [13:30:45<13:04:38, 7.83s/it, loss=0.0001, acc=1.0000, iter_time=7.22s]
Epoch 1: 51%|█████▏ | 6369/12384 [13:30:45<12:57:29, 7.76s/it, loss=0.0001, acc=1.0000, iter_time=7.22s]
Epoch 1: 51%|█████▏ | 6369/12384 [13:30:52<12:57:29, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 51%|█████▏ | 6370/12384 [13:30:52<12:52:36, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 51%|█████▏ | 6370/12384 [13:31:00<12:52:36, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 51%|█████▏ | 6371/12384 [13:31:00<12:49:25, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 51%|█████▏ | 6371/12384 [13:31:08<12:49:25, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 1: 51%|█████▏ | 6372/12384 [13:31:08<13:00:52, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 1: 51%|█████▏ | 6372/12384 [13:31:16<13:00:52, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 1: 51%|█████▏ | 6373/12384 [13:31:16<13:12:45, 7.91s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 1: 51%|█████▏ | 6373/12384 [13:31:24<13:12:45, 7.91s/it, loss=0.0000, acc=1.0000, iter_time=11.10s]
Epoch 1: 51%|█████▏ | 6374/12384 [13:31:24<13:25:00, 8.04s/it, loss=0.0000, acc=1.0000, iter_time=11.10s]
Epoch 1: 51%|█████▏ | 6374/12384 [13:31:32<13:25:00, 8.04s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 51%|█████▏ | 6375/12384 [13:31:32<13:12:03, 7.91s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 51%|█████▏ | 6375/12384 [13:31:40<13:12:03, 7.91s/it, loss=0.0001, acc=1.0000, iter_time=8.00s]
Epoch 1: 51%|█████▏ | 6376/12384 [13:31:40<13:02:53, 7.82s/it, loss=0.0001, acc=1.0000, iter_time=8.00s]
Epoch 1: 51%|█████▏ | 6376/12384 [13:31:47<13:02:53, 7.82s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 1: 51%|█████▏ | 6377/12384 [13:31:47<12:56:02, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 1: 51%|█████▏ | 6377/12384 [13:31:55<12:56:02, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=4.25s]
Epoch 1: 52%|█████▏ | 6378/12384 [13:31:55<12:51:48, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.25s]
Epoch 1: 52%|█████▏ | 6378/12384 [13:32:03<12:51:48, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=11.54s]
Epoch 1: 52%|█████▏ | 6379/12384 [13:32:03<12:58:15, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=11.54s]
Epoch 1: 52%|█████▏ | 6379/12384 [13:32:10<12:58:15, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 52%|█████▏ | 6380/12384 [13:32:10<12:52:40, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 52%|█████▏ | 6380/12384 [13:32:18<12:52:40, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 52%|█████▏ | 6381/12384 [13:32:18<12:48:33, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 52%|█████▏ | 6381/12384 [13:32:26<12:48:33, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 52%|█████▏ | 6382/12384 [13:32:26<12:47:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 52%|█████▏ | 6382/12384 [13:32:33<12:47:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 1: 52%|█████▏ | 6383/12384 [13:32:33<12:45:40, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 1: 52%|█████▏ | 6383/12384 [13:32:41<12:45:40, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.54s]
Epoch 1: 52%|█████▏ | 6384/12384 [13:32:41<12:44:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.54s]
Epoch 1: 52%|█████▏ | 6384/12384 [13:32:48<12:44:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 52%|█████▏ | 6385/12384 [13:32:48<12:43:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 52%|█████▏ | 6385/12384 [13:32:56<12:43:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 52%|█████▏ | 6386/12384 [13:32:56<12:42:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 52%|█████▏ | 6386/12384 [13:33:04<12:42:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 52%|█████▏ | 6387/12384 [13:33:04<12:41:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 52%|█████▏ | 6387/12384 [13:33:11<12:41:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 1: 52%|█████▏ | 6388/12384 [13:33:11<12:41:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 1: 52%|█████▏ | 6388/12384 [13:33:19<12:41:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 52%|█████▏ | 6389/12384 [13:33:19<12:41:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 52%|█████▏ | 6389/12384 [13:33:26<12:41:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 52%|█████▏ | 6390/12384 [13:33:26<12:40:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 52%|█████▏ | 6390/12384 [13:33:34<12:40:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 1: 52%|█████▏ | 6391/12384 [13:33:34<12:40:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 1: 52%|█████▏ | 6391/12384 [13:33:42<12:40:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.50s]
Epoch 1: 52%|█████▏ | 6392/12384 [13:33:42<12:39:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.50s]
Epoch 1: 52%|█████▏ | 6392/12384 [13:33:50<12:39:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 1: 52%|█████▏ | 6393/12384 [13:33:50<12:55:48, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 1: 52%|█████▏ | 6393/12384 [13:33:57<12:55:48, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 1: 52%|█████▏ | 6394/12384 [13:33:57<12:50:46, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 1: 52%|█████▏ | 6394/12384 [13:34:05<12:50:46, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=11.11s]
Epoch 1: 52%|█████▏ | 6395/12384 [13:34:05<12:46:10, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=11.11s]
Epoch 1: 52%|█████▏ | 6395/12384 [13:34:13<12:46:10, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 52%|█████▏ | 6396/12384 [13:34:13<12:44:25, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 52%|█████▏ | 6396/12384 [13:34:20<12:44:25, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 52%|█████▏ | 6397/12384 [13:34:20<12:42:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 52%|█████▏ | 6397/12384 [13:34:28<12:42:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 52%|█████▏ | 6398/12384 [13:34:28<12:42:57, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 52%|█████▏ | 6398/12384 [13:34:36<12:42:57, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 1: 52%|█████▏ | 6399/12384 [13:34:36<12:41:53, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 1: 52%|█████▏ | 6399/12384 [13:34:43<12:41:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 52%|█████▏ | 6400/12384 [13:34:43<12:40:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 52%|█████▏ | 6400/12384 [13:34:51<12:40:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 52%|█████▏ | 6401/12384 [13:34:51<12:48:03, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 52%|█████▏ | 6401/12384 [13:34:59<12:48:03, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 52%|█████▏ | 6402/12384 [13:34:59<12:46:01, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 52%|█████▏ | 6402/12384 [13:35:06<12:46:01, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.20s]
Epoch 1: 52%|█████▏ | 6403/12384 [13:35:06<12:44:46, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.20s]
Epoch 1: 52%|█████▏ | 6403/12384 [13:35:14<12:44:46, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 1: 52%|█████▏ | 6404/12384 [13:35:14<12:41:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 1: 52%|█████▏ | 6404/12384 [13:35:21<12:41:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 1: 52%|█████▏ | 6405/12384 [13:35:21<12:40:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 1: 52%|█████▏ | 6405/12384 [13:35:29<12:40:58, 7.64s/it, loss=0.0020, acc=0.9936, iter_time=7.58s]
Epoch 1: 52%|█████▏ | 6406/12384 [13:35:29<12:40:18, 7.63s/it, loss=0.0020, acc=0.9936, iter_time=7.58s]
Epoch 1: 52%|█████▏ | 6406/12384 [13:35:37<12:40:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.23s]
Epoch 1: 52%|█████▏ | 6407/12384 [13:35:37<12:39:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.23s]
Epoch 1: 52%|█████▏ | 6407/12384 [13:35:44<12:39:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 52%|█████▏ | 6408/12384 [13:35:44<12:38:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 52%|█████▏ | 6408/12384 [13:35:52<12:38:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.72s]
Epoch 1: 52%|█████▏ | 6409/12384 [13:35:52<12:38:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.72s]
Epoch 1: 52%|█████▏ | 6409/12384 [13:36:00<12:38:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.32s]
Epoch 1: 52%|█████▏ | 6410/12384 [13:36:00<12:38:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.32s]
Epoch 1: 52%|█████▏ | 6410/12384 [13:36:07<12:38:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.41s]
Epoch 1: 52%|█████▏ | 6411/12384 [13:36:07<12:37:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.41s]
Epoch 1: 52%|█████▏ | 6411/12384 [13:36:15<12:37:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 52%|█████▏ | 6412/12384 [13:36:15<12:37:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 52%|█████▏ | 6412/12384 [13:36:22<12:37:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 1: 52%|█████▏ | 6413/12384 [13:36:22<12:37:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 1: 52%|█████▏ | 6413/12384 [13:36:30<12:37:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 52%|█████▏ | 6414/12384 [13:36:30<12:37:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 52%|█████▏ | 6414/12384 [13:36:38<12:37:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 52%|█████▏ | 6415/12384 [13:36:38<12:37:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 52%|█████▏ | 6415/12384 [13:36:45<12:37:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 52%|█████▏ | 6416/12384 [13:36:45<12:36:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 52%|█████▏ | 6416/12384 [13:36:53<12:36:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.94s]
Epoch 1: 52%|█████▏ | 6417/12384 [13:36:53<12:36:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.94s]
Epoch 1: 52%|█████▏ | 6417/12384 [13:37:00<12:36:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 1: 52%|█████▏ | 6418/12384 [13:37:00<12:35:40, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 1: 52%|█████▏ | 6418/12384 [13:37:08<12:35:40, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 1: 52%|█████▏ | 6419/12384 [13:37:08<12:47:05, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 1: 52%|█████▏ | 6419/12384 [13:37:16<12:47:05, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 52%|█████▏ | 6420/12384 [13:37:16<12:44:38, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 52%|█████▏ | 6420/12384 [13:37:24<12:44:38, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 52%|█████▏ | 6421/12384 [13:37:24<12:41:39, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 52%|█████▏ | 6421/12384 [13:37:31<12:41:39, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.50s]
Epoch 1: 52%|█████▏ | 6422/12384 [13:37:31<12:39:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.50s]
Epoch 1: 52%|█████▏ | 6422/12384 [13:37:39<12:39:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.77s]
Epoch 1: 52%|█████▏ | 6423/12384 [13:37:39<12:40:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.77s]
Epoch 1: 52%|█████▏ | 6423/12384 [13:37:46<12:40:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 52%|█████▏ | 6424/12384 [13:37:46<12:39:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 52%|█████▏ | 6424/12384 [13:37:54<12:39:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 52%|█████▏ | 6425/12384 [13:37:54<12:37:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 52%|█████▏ | 6425/12384 [13:38:02<12:37:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 52%|█████▏ | 6426/12384 [13:38:02<12:36:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 52%|█████▏ | 6426/12384 [13:38:09<12:36:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 52%|█████▏ | 6427/12384 [13:38:09<12:36:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 52%|█████▏ | 6427/12384 [13:38:17<12:36:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.58s]
Epoch 1: 52%|█████▏ | 6428/12384 [13:38:17<12:36:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.58s]
Epoch 1: 52%|█████▏ | 6428/12384 [13:38:25<12:36:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 1: 52%|█████▏ | 6429/12384 [13:38:25<12:35:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 1: 52%|█████▏ | 6429/12384 [13:38:32<12:35:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 52%|█████▏ | 6430/12384 [13:38:32<12:35:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 52%|█████▏ | 6430/12384 [13:38:40<12:35:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 52%|█████▏ | 6431/12384 [13:38:40<12:34:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 52%|█████▏ | 6431/12384 [13:38:47<12:34:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 1: 52%|█████▏ | 6432/12384 [13:38:47<12:35:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 1: 52%|█████▏ | 6432/12384 [13:38:55<12:35:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 1: 52%|█████▏ | 6433/12384 [13:38:55<12:34:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 1: 52%|█████▏ | 6433/12384 [13:39:03<12:34:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 52%|█████▏ | 6434/12384 [13:39:03<12:34:04, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 52%|█████▏ | 6434/12384 [13:39:10<12:34:04, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 52%|█████▏ | 6435/12384 [13:39:10<12:33:58, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 52%|█████▏ | 6435/12384 [13:39:18<12:33:58, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 52%|█████▏ | 6436/12384 [13:39:18<12:35:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 52%|█████▏ | 6436/12384 [13:39:25<12:35:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 1: 52%|█████▏ | 6437/12384 [13:39:25<12:35:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 1: 52%|█████▏ | 6437/12384 [13:39:33<12:35:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 52%|█████▏ | 6438/12384 [13:39:33<12:35:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 52%|█████▏ | 6438/12384 [13:39:41<12:35:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 52%|█████▏ | 6439/12384 [13:39:41<12:34:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 52%|█████▏ | 6439/12384 [13:39:48<12:34:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 1: 52%|█████▏ | 6440/12384 [13:39:48<12:34:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 1: 52%|█████▏ | 6440/12384 [13:39:56<12:34:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 52%|█████▏ | 6441/12384 [13:39:56<12:36:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 52%|█████▏ | 6441/12384 [13:40:04<12:36:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 52%|█████▏ | 6442/12384 [13:40:04<12:36:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 52%|█████▏ | 6442/12384 [13:40:11<12:36:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 52%|█████▏ | 6443/12384 [13:40:11<12:35:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 52%|█████▏ | 6443/12384 [13:40:19<12:35:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 52%|█████▏ | 6444/12384 [13:40:19<12:34:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 52%|█████▏ | 6444/12384 [13:40:27<12:34:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 52%|█████▏ | 6445/12384 [13:40:27<12:44:09, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 52%|█████▏ | 6445/12384 [13:40:34<12:44:09, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 52%|█████▏ | 6446/12384 [13:40:34<12:40:55, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 52%|█████▏ | 6446/12384 [13:40:42<12:40:55, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 1: 52%|█████▏ | 6447/12384 [13:40:42<12:38:08, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 1: 52%|█████▏ | 6447/12384 [13:40:50<12:38:08, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.72s]
Epoch 1: 52%|█████▏ | 6448/12384 [13:40:50<12:38:06, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.72s]
Epoch 1: 52%|█████▏ | 6448/12384 [13:40:57<12:38:06, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 52%|█████▏ | 6449/12384 [13:40:57<12:36:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 52%|█████▏ | 6449/12384 [13:41:05<12:36:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 1: 52%|█████▏ | 6450/12384 [13:41:05<12:35:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 1: 52%|█████▏ | 6450/12384 [13:41:13<12:35:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.79s]
Epoch 1: 52%|█████▏ | 6451/12384 [13:41:13<12:34:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.79s]
Epoch 1: 52%|█████▏ | 6451/12384 [13:41:20<12:34:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 1: 52%|█████▏ | 6452/12384 [13:41:20<12:34:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 1: 52%|█████▏ | 6452/12384 [13:41:28<12:34:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 52%|█████▏ | 6453/12384 [13:41:28<12:41:16, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 52%|█████▏ | 6453/12384 [13:41:36<12:41:16, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 52%|█████▏ | 6454/12384 [13:41:36<12:38:35, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 52%|█████▏ | 6454/12384 [13:41:43<12:38:35, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 1: 52%|█████▏ | 6455/12384 [13:41:43<12:36:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 1: 52%|█████▏ | 6455/12384 [13:41:51<12:36:02, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=9.51s]
Epoch 1: 52%|█████▏ | 6456/12384 [13:41:51<12:35:01, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=9.51s]
Epoch 1: 52%|█████▏ | 6456/12384 [13:41:58<12:35:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 52%|█████▏ | 6457/12384 [13:41:58<12:34:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 52%|█████▏ | 6457/12384 [13:42:06<12:34:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 52%|█████▏ | 6458/12384 [13:42:06<12:34:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 52%|█████▏ | 6458/12384 [13:42:14<12:34:33, 7.64s/it, loss=0.0001, acc=0.9997, iter_time=7.61s]
Epoch 1: 52%|█████▏ | 6459/12384 [13:42:14<12:34:03, 7.64s/it, loss=0.0001, acc=0.9997, iter_time=7.61s]
Epoch 1: 52%|█████▏ | 6459/12384 [13:42:21<12:34:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 52%|█████▏ | 6460/12384 [13:42:21<12:32:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 52%|█████▏ | 6460/12384 [13:42:29<12:32:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.26s]
Epoch 1: 52%|█████▏ | 6461/12384 [13:42:29<12:32:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.26s]
Epoch 1: 52%|█████▏ | 6461/12384 [13:42:36<12:32:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 1: 52%|█████▏ | 6462/12384 [13:42:36<12:23:37, 7.53s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 1: 52%|█████▏ | 6462/12384 [13:42:44<12:23:37, 7.53s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 52%|█████▏ | 6463/12384 [13:42:44<12:26:11, 7.56s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 52%|█████▏ | 6463/12384 [13:42:52<12:26:11, 7.56s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 52%|█████▏ | 6464/12384 [13:42:52<12:27:41, 7.58s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 52%|█████▏ | 6464/12384 [13:42:59<12:27:41, 7.58s/it, loss=0.0000, acc=1.0000, iter_time=3.84s]
Epoch 1: 52%|█████▏ | 6465/12384 [13:42:59<12:27:59, 7.58s/it, loss=0.0000, acc=1.0000, iter_time=3.84s]
Epoch 1: 52%|█████▏ | 6465/12384 [13:43:07<12:27:59, 7.58s/it, loss=0.0000, acc=1.0000, iter_time=11.82s]
Epoch 1: 52%|█████▏ | 6466/12384 [13:43:07<12:28:45, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=11.82s]
Epoch 1: 52%|█████▏ | 6466/12384 [13:43:14<12:28:45, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 52%|█████▏ | 6467/12384 [13:43:14<12:29:02, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 52%|█████▏ | 6467/12384 [13:43:22<12:29:02, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 52%|█████▏ | 6468/12384 [13:43:22<12:29:10, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 52%|█████▏ | 6468/12384 [13:43:30<12:29:10, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 52%|█████▏ | 6469/12384 [13:43:30<12:29:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 52%|█████▏ | 6469/12384 [13:43:37<12:29:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 52%|█████▏ | 6470/12384 [13:43:37<12:30:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 52%|█████▏ | 6470/12384 [13:43:45<12:30:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 52%|█████▏ | 6471/12384 [13:43:45<12:30:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 52%|█████▏ | 6471/12384 [13:43:53<12:30:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 1: 52%|█████▏ | 6472/12384 [13:43:53<12:41:13, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 1: 52%|█████▏ | 6472/12384 [13:44:00<12:41:13, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.91s]
Epoch 1: 52%|█████▏ | 6473/12384 [13:44:00<12:38:00, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.91s]
Epoch 1: 52%|█████▏ | 6473/12384 [13:44:08<12:38:00, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 1: 52%|█████▏ | 6474/12384 [13:44:08<12:34:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 1: 52%|█████▏ | 6474/12384 [13:44:16<12:34:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 52%|█████▏ | 6475/12384 [13:44:16<12:33:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 52%|█████▏ | 6475/12384 [13:44:23<12:33:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 52%|█████▏ | 6476/12384 [13:44:23<12:32:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 52%|█████▏ | 6476/12384 [13:44:31<12:32:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 1: 52%|█████▏ | 6477/12384 [13:44:31<12:31:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 1: 52%|█████▏ | 6477/12384 [13:44:38<12:31:20, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=4.82s]
Epoch 1: 52%|█████▏ | 6478/12384 [13:44:38<12:30:02, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=4.82s]
Epoch 1: 52%|█████▏ | 6478/12384 [13:44:46<12:30:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.64s]
Epoch 1: 52%|█████▏ | 6479/12384 [13:44:46<12:38:10, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=11.64s]
Epoch 1: 52%|█████▏ | 6479/12384 [13:44:54<12:38:10, 7.70s/it, loss=0.0002, acc=0.9980, iter_time=7.97s]
Epoch 1: 52%|█████▏ | 6480/12384 [13:44:54<12:34:57, 7.67s/it, loss=0.0002, acc=0.9980, iter_time=7.97s]
Epoch 1: 52%|█████▏ | 6480/12384 [13:45:02<12:34:57, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 52%|█████▏ | 6481/12384 [13:45:02<12:32:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 52%|█████▏ | 6481/12384 [13:45:09<12:32:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 52%|█████▏ | 6482/12384 [13:45:09<12:30:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 52%|█████▏ | 6482/12384 [13:45:17<12:30:27, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=4.84s]
Epoch 1: 52%|█████▏ | 6483/12384 [13:45:17<12:29:32, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.84s]
Epoch 1: 52%|█████▏ | 6483/12384 [13:45:24<12:29:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.86s]
Epoch 1: 52%|█████▏ | 6484/12384 [13:45:24<12:30:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.86s]
Epoch 1: 52%|█████▏ | 6484/12384 [13:45:32<12:30:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.89s]
Epoch 1: 52%|█████▏ | 6485/12384 [13:45:32<12:32:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.89s]
Epoch 1: 52%|█████▏ | 6485/12384 [13:45:40<12:32:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.25s]
Epoch 1: 52%|█████▏ | 6486/12384 [13:45:40<12:30:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.25s]
Epoch 1: 52%|█████▏ | 6486/12384 [13:45:47<12:30:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 52%|█████▏ | 6487/12384 [13:45:47<12:29:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 52%|█████▏ | 6487/12384 [13:45:55<12:29:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 52%|█████▏ | 6488/12384 [13:45:55<12:29:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 52%|█████▏ | 6488/12384 [13:46:03<12:29:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 52%|█████▏ | 6489/12384 [13:46:03<12:29:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 52%|█████▏ | 6489/12384 [13:46:10<12:29:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 52%|█████▏ | 6490/12384 [13:46:10<12:28:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 52%|█████▏ | 6490/12384 [13:46:18<12:28:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 52%|█████▏ | 6491/12384 [13:46:18<12:29:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 52%|█████▏ | 6491/12384 [13:46:25<12:29:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 1: 52%|█████▏ | 6492/12384 [13:46:25<12:28:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 1: 52%|█████▏ | 6492/12384 [13:46:33<12:28:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 52%|█████▏ | 6493/12384 [13:46:33<12:29:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 52%|█████▏ | 6493/12384 [13:46:41<12:29:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 52%|█████▏ | 6494/12384 [13:46:41<12:29:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 52%|█████▏ | 6494/12384 [13:46:48<12:29:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 52%|█████▏ | 6495/12384 [13:46:48<12:29:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 52%|█████▏ | 6495/12384 [13:46:56<12:29:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 52%|█████▏ | 6496/12384 [13:46:56<12:28:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 52%|█████▏ | 6496/12384 [13:47:04<12:28:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 52%|█████▏ | 6497/12384 [13:47:04<12:27:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 52%|█████▏ | 6497/12384 [13:47:11<12:27:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.91s]
Epoch 1: 52%|█████▏ | 6498/12384 [13:47:11<12:36:48, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=3.91s]
Epoch 1: 52%|█████▏ | 6498/12384 [13:47:19<12:36:48, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 1: 52%|█████▏ | 6499/12384 [13:47:19<12:33:53, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 1: 52%|█████▏ | 6499/12384 [13:47:27<12:33:53, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 52%|█████▏ | 6500/12384 [13:47:27<12:31:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 52%|█████▏ | 6500/12384 [13:47:34<12:31:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.21s]
Epoch 1: 52%|█████▏ | 6501/12384 [13:47:34<12:29:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.21s]
Epoch 1: 52%|█████▏ | 6501/12384 [13:47:42<12:29:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 1: 53%|█████▎ | 6502/12384 [13:47:42<12:28:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 1: 53%|█████▎ | 6502/12384 [13:47:50<12:28:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 53%|█████▎ | 6503/12384 [13:47:50<12:26:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 53%|█████▎ | 6503/12384 [13:47:57<12:26:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 53%|█████▎ | 6504/12384 [13:47:57<12:27:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 53%|█████▎ | 6504/12384 [13:48:05<12:27:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 53%|█████▎ | 6505/12384 [13:48:05<12:26:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 53%|█████▎ | 6505/12384 [13:48:12<12:26:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 53%|█████▎ | 6506/12384 [13:48:12<12:26:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 53%|█████▎ | 6506/12384 [13:48:20<12:26:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 1: 53%|█████▎ | 6507/12384 [13:48:20<12:26:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 1: 53%|█████▎ | 6507/12384 [13:48:28<12:26:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.48s]
Epoch 1: 53%|█████▎ | 6508/12384 [13:48:28<12:25:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.48s]
Epoch 1: 53%|█████▎ | 6508/12384 [13:48:35<12:25:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 53%|█████▎ | 6509/12384 [13:48:35<12:25:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 53%|█████▎ | 6509/12384 [13:48:43<12:25:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 1: 53%|█████▎ | 6510/12384 [13:48:43<12:24:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 1: 53%|█████▎ | 6510/12384 [13:48:50<12:24:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.72s]
Epoch 1: 53%|█████▎ | 6511/12384 [13:48:50<12:25:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.72s]
Epoch 1: 53%|█████▎ | 6511/12384 [13:48:58<12:25:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 53%|█████▎ | 6512/12384 [13:48:58<12:24:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 53%|█████▎ | 6512/12384 [13:49:06<12:24:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 53%|█████▎ | 6513/12384 [13:49:06<12:24:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 53%|█████▎ | 6513/12384 [13:49:13<12:24:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 53%|█████▎ | 6514/12384 [13:49:13<12:24:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 53%|█████▎ | 6514/12384 [13:49:21<12:24:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 53%|█████▎ | 6515/12384 [13:49:21<12:24:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 53%|█████▎ | 6515/12384 [13:49:28<12:24:54, 7.62s/it, loss=0.0005, acc=1.0000, iter_time=8.03s]
Epoch 1: 53%|█████▎ | 6516/12384 [13:49:28<12:24:52, 7.62s/it, loss=0.0005, acc=1.0000, iter_time=8.03s]
Epoch 1: 53%|█████▎ | 6516/12384 [13:49:36<12:24:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 53%|█████▎ | 6517/12384 [13:49:36<12:24:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 53%|█████▎ | 6517/12384 [13:49:44<12:24:47, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.07s]
Epoch 1: 53%|█████▎ | 6518/12384 [13:49:44<12:24:42, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.07s]
Epoch 1: 53%|█████▎ | 6518/12384 [13:49:51<12:24:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 1: 53%|█████▎ | 6519/12384 [13:49:51<12:24:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 1: 53%|█████▎ | 6519/12384 [13:49:59<12:24:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 53%|█████▎ | 6520/12384 [13:49:59<12:24:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 53%|█████▎ | 6520/12384 [13:50:07<12:24:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 53%|█████▎ | 6521/12384 [13:50:07<12:24:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 53%|█████▎ | 6521/12384 [13:50:14<12:24:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.89s]
Epoch 1: 53%|█████▎ | 6522/12384 [13:50:14<12:25:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.89s]
Epoch 1: 53%|█████▎ | 6522/12384 [13:50:22<12:25:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.40s]
Epoch 1: 53%|█████▎ | 6523/12384 [13:50:22<12:25:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.40s]
Epoch 1: 53%|█████▎ | 6523/12384 [13:50:29<12:25:17, 7.63s/it, loss=0.0003, acc=0.9985, iter_time=7.64s]
Epoch 1: 53%|█████▎ | 6524/12384 [13:50:29<12:24:39, 7.62s/it, loss=0.0003, acc=0.9985, iter_time=7.64s]
Epoch 1: 53%|█████▎ | 6524/12384 [13:50:37<12:24:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 53%|█████▎ | 6525/12384 [13:50:37<12:34:28, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 53%|█████▎ | 6525/12384 [13:50:45<12:34:28, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 1: 53%|█████▎ | 6526/12384 [13:50:45<12:30:38, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 1: 53%|█████▎ | 6526/12384 [13:50:53<12:30:38, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 1: 53%|█████▎ | 6527/12384 [13:50:53<12:27:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 1: 53%|█████▎ | 6527/12384 [13:51:00<12:27:36, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=9.18s]
Epoch 1: 53%|█████▎ | 6528/12384 [13:51:00<12:25:45, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=9.18s]
Epoch 1: 53%|█████▎ | 6528/12384 [13:51:08<12:25:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 1: 53%|█████▎ | 6529/12384 [13:51:08<12:24:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 1: 53%|█████▎ | 6529/12384 [13:51:15<12:24:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.75s]
Epoch 1: 53%|█████▎ | 6530/12384 [13:51:15<12:23:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.75s]
Epoch 1: 53%|█████▎ | 6530/12384 [13:51:23<12:23:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 53%|█████▎ | 6531/12384 [13:51:23<12:23:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 53%|█████▎ | 6531/12384 [13:51:31<12:23:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 53%|█████▎ | 6532/12384 [13:51:31<12:24:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 53%|█████▎ | 6532/12384 [13:51:38<12:24:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 1: 53%|█████▎ | 6533/12384 [13:51:38<12:23:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 1: 53%|█████▎ | 6533/12384 [13:51:46<12:23:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 1: 53%|█████▎ | 6534/12384 [13:51:46<12:23:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 1: 53%|█████▎ | 6534/12384 [13:51:54<12:23:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 53%|█████▎ | 6535/12384 [13:51:54<12:23:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 53%|█████▎ | 6535/12384 [13:52:01<12:23:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 53%|█████▎ | 6536/12384 [13:52:01<12:23:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 53%|█████▎ | 6536/12384 [13:52:09<12:23:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 53%|█████▎ | 6537/12384 [13:52:09<12:22:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 53%|█████▎ | 6537/12384 [13:52:16<12:22:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 1: 53%|█████▎ | 6538/12384 [13:52:16<12:22:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 1: 53%|█████▎ | 6538/12384 [13:52:24<12:22:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 53%|█████▎ | 6539/12384 [13:52:24<12:22:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 53%|█████▎ | 6539/12384 [13:52:32<12:22:08, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.55s]
Epoch 1: 53%|█████▎ | 6540/12384 [13:52:32<12:21:49, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.55s]
Epoch 1: 53%|█████▎ | 6540/12384 [13:52:39<12:21:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 53%|█████▎ | 6541/12384 [13:52:39<12:21:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 53%|█████▎ | 6541/12384 [13:52:47<12:21:01, 7.61s/it, loss=0.0002, acc=0.9992, iter_time=4.79s]
Epoch 1: 53%|█████▎ | 6542/12384 [13:52:47<12:20:23, 7.60s/it, loss=0.0002, acc=0.9992, iter_time=4.79s]
Epoch 1: 53%|█████▎ | 6542/12384 [13:52:54<12:20:23, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.39s]
Epoch 1: 53%|█████▎ | 6543/12384 [13:52:54<12:20:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.39s]
Epoch 1: 53%|█████▎ | 6543/12384 [13:53:02<12:20:49, 7.61s/it, loss=0.0001, acc=0.9997, iter_time=8.04s]
Epoch 1: 53%|█████▎ | 6544/12384 [13:53:02<12:20:59, 7.61s/it, loss=0.0001, acc=0.9997, iter_time=8.04s]
Epoch 1: 53%|█████▎ | 6544/12384 [13:53:10<12:20:59, 7.61s/it, loss=0.0007, acc=0.9981, iter_time=7.21s]
Epoch 1: 53%|█████▎ | 6545/12384 [13:53:10<12:21:02, 7.61s/it, loss=0.0007, acc=0.9981, iter_time=7.21s]
Epoch 1: 53%|█████▎ | 6545/12384 [13:53:17<12:21:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 53%|█████▎ | 6546/12384 [13:53:17<12:20:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 53%|█████▎ | 6546/12384 [13:53:25<12:20:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 1: 53%|█████▎ | 6547/12384 [13:53:25<12:20:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 1: 53%|█████▎ | 6547/12384 [13:53:33<12:20:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 1: 53%|█████▎ | 6548/12384 [13:53:33<12:20:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 1: 53%|█████▎ | 6548/12384 [13:53:40<12:20:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 1: 53%|█████▎ | 6549/12384 [13:53:40<12:20:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 1: 53%|█████▎ | 6549/12384 [13:53:48<12:20:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 53%|█████▎ | 6550/12384 [13:53:48<12:19:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 53%|█████▎ | 6550/12384 [13:53:56<12:19:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 1: 53%|█████▎ | 6551/12384 [13:53:56<12:31:42, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 1: 53%|█████▎ | 6551/12384 [13:54:03<12:31:42, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 53%|█████▎ | 6552/12384 [13:54:03<12:28:07, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 53%|█████▎ | 6552/12384 [13:54:11<12:28:07, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 53%|█████▎ | 6553/12384 [13:54:11<12:25:58, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 53%|█████▎ | 6553/12384 [13:54:19<12:25:58, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 53%|█████▎ | 6554/12384 [13:54:19<12:24:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 53%|█████▎ | 6554/12384 [13:54:26<12:24:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 53%|█████▎ | 6555/12384 [13:54:26<12:23:51, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 53%|█████▎ | 6555/12384 [13:54:34<12:23:51, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 1: 53%|█████▎ | 6556/12384 [13:54:34<12:22:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 1: 53%|█████▎ | 6556/12384 [13:54:42<12:22:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 1: 53%|█████▎ | 6557/12384 [13:54:42<12:23:44, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 1: 53%|█████▎ | 6557/12384 [13:54:49<12:23:44, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 53%|█████▎ | 6558/12384 [13:54:49<12:30:29, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 53%|█████▎ | 6558/12384 [13:54:57<12:30:29, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 53%|█████▎ | 6559/12384 [13:54:57<12:26:53, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 53%|█████▎ | 6559/12384 [13:55:05<12:26:53, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.54s]
Epoch 1: 53%|█████▎ | 6560/12384 [13:55:05<12:26:26, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.54s]
Epoch 1: 53%|█████▎ | 6560/12384 [13:55:12<12:26:26, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 1: 53%|█████▎ | 6561/12384 [13:55:12<12:23:48, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 1: 53%|█████▎ | 6561/12384 [13:55:20<12:23:48, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 1: 53%|█████▎ | 6562/12384 [13:55:20<12:21:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 1: 53%|█████▎ | 6562/12384 [13:55:28<12:21:56, 7.65s/it, loss=0.0001, acc=0.9992, iter_time=7.62s]
Epoch 1: 53%|█████▎ | 6563/12384 [13:55:28<12:20:30, 7.63s/it, loss=0.0001, acc=0.9992, iter_time=7.62s]
Epoch 1: 53%|█████▎ | 6563/12384 [13:55:35<12:20:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 53%|█████▎ | 6564/12384 [13:55:35<12:20:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 53%|█████▎ | 6564/12384 [13:55:43<12:20:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 53%|█████▎ | 6565/12384 [13:55:43<12:19:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 53%|█████▎ | 6565/12384 [13:55:50<12:19:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 53%|█████▎ | 6566/12384 [13:55:50<12:19:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 53%|█████▎ | 6566/12384 [13:55:58<12:19:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 53%|█████▎ | 6567/12384 [13:55:58<12:20:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 53%|█████▎ | 6567/12384 [13:56:06<12:20:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 53%|█████▎ | 6568/12384 [13:56:06<12:19:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 53%|█████▎ | 6568/12384 [13:56:13<12:19:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 1: 53%|█████▎ | 6569/12384 [13:56:13<12:18:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 1: 53%|█████▎ | 6569/12384 [13:56:21<12:18:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 1: 53%|█████▎ | 6570/12384 [13:56:21<12:17:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 1: 53%|█████▎ | 6570/12384 [13:56:28<12:17:36, 7.61s/it, loss=0.0006, acc=0.9974, iter_time=7.62s]
Epoch 1: 53%|█████▎ | 6571/12384 [13:56:28<12:17:08, 7.61s/it, loss=0.0006, acc=0.9974, iter_time=7.62s]
Epoch 1: 53%|█████▎ | 6571/12384 [13:56:36<12:17:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 53%|█████▎ | 6572/12384 [13:56:36<12:17:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 53%|█████▎ | 6572/12384 [13:56:44<12:17:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 53%|█████▎ | 6573/12384 [13:56:44<12:16:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 53%|█████▎ | 6573/12384 [13:56:51<12:16:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 53%|█████▎ | 6574/12384 [13:56:51<12:17:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 53%|█████▎ | 6574/12384 [13:56:59<12:17:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 53%|█████▎ | 6575/12384 [13:56:59<12:16:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 53%|█████▎ | 6575/12384 [13:57:07<12:16:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 53%|█████▎ | 6576/12384 [13:57:07<12:16:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 53%|█████▎ | 6576/12384 [13:57:14<12:16:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 53%|█████▎ | 6577/12384 [13:57:14<12:26:34, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 53%|█████▎ | 6577/12384 [13:57:22<12:26:34, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.89s]
Epoch 1: 53%|█████▎ | 6578/12384 [13:57:22<12:23:12, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.89s]
Epoch 1: 53%|█████▎ | 6578/12384 [13:57:30<12:23:12, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 53%|█████▎ | 6579/12384 [13:57:30<12:21:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 53%|█████▎ | 6579/12384 [13:57:37<12:21:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 53%|█████▎ | 6580/12384 [13:57:37<12:20:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 53%|█████▎ | 6580/12384 [13:57:45<12:20:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 53%|█████▎ | 6581/12384 [13:57:45<12:19:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 53%|█████▎ | 6581/12384 [13:57:53<12:19:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 53%|█████▎ | 6582/12384 [13:57:53<12:17:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 53%|█████▎ | 6582/12384 [13:58:00<12:17:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.92s]
Epoch 1: 53%|█████▎ | 6583/12384 [13:58:00<12:15:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.92s]
Epoch 1: 53%|█████▎ | 6583/12384 [13:58:08<12:15:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.11s]
Epoch 1: 53%|█████▎ | 6584/12384 [13:58:08<12:15:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.11s]
Epoch 1: 53%|█████▎ | 6584/12384 [13:58:15<12:15:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 1: 53%|█████▎ | 6585/12384 [13:58:15<12:14:48, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 1: 53%|█████▎ | 6585/12384 [13:58:23<12:14:48, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 53%|█████▎ | 6586/12384 [13:58:23<12:14:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 53%|█████▎ | 6586/12384 [13:58:31<12:14:55, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 1: 53%|█████▎ | 6587/12384 [13:58:31<12:14:55, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 1: 53%|█████▎ | 6587/12384 [13:58:38<12:14:55, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 53%|█████▎ | 6588/12384 [13:58:38<12:14:51, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 53%|█████▎ | 6588/12384 [13:58:46<12:14:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 53%|█████▎ | 6589/12384 [13:58:46<12:15:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 53%|█████▎ | 6589/12384 [13:58:53<12:15:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 53%|█████▎ | 6590/12384 [13:58:53<12:15:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 53%|█████▎ | 6590/12384 [13:59:01<12:15:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 53%|█████▎ | 6591/12384 [13:59:01<12:15:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 53%|█████▎ | 6591/12384 [13:59:09<12:15:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 53%|█████▎ | 6592/12384 [13:59:09<12:14:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 53%|█████▎ | 6592/12384 [13:59:16<12:14:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 53%|█████▎ | 6593/12384 [13:59:16<12:14:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 53%|█████▎ | 6593/12384 [13:59:24<12:14:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 53%|█████▎ | 6594/12384 [13:59:24<12:14:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 53%|█████▎ | 6594/12384 [13:59:31<12:14:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 53%|█████▎ | 6595/12384 [13:59:31<12:13:31, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 53%|█████▎ | 6595/12384 [13:59:39<12:13:31, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 53%|█████▎ | 6596/12384 [13:59:39<12:14:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 53%|█████▎ | 6596/12384 [13:59:47<12:14:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 53%|█████▎ | 6597/12384 [13:59:47<12:14:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 53%|█████▎ | 6597/12384 [13:59:54<12:14:03, 7.61s/it, loss=0.0025, acc=0.9981, iter_time=7.59s]
Epoch 1: 53%|█████▎ | 6598/12384 [13:59:54<12:13:21, 7.60s/it, loss=0.0025, acc=0.9981, iter_time=7.59s]
Epoch 1: 53%|█████▎ | 6598/12384 [14:00:02<12:13:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 1: 53%|█████▎ | 6599/12384 [14:00:02<12:13:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 1: 53%|█████▎ | 6599/12384 [14:00:09<12:13:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.79s]
Epoch 1: 53%|█████▎ | 6600/12384 [14:00:09<12:13:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.79s]
Epoch 1: 53%|█████▎ | 6600/12384 [14:00:17<12:13:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 53%|█████▎ | 6601/12384 [14:00:17<12:15:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 53%|█████▎ | 6601/12384 [14:00:25<12:15:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.29s]
Epoch 1: 53%|█████▎ | 6602/12384 [14:00:25<12:15:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.29s]
Epoch 1: 53%|█████▎ | 6602/12384 [14:00:33<12:15:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.98s]
Epoch 1: 53%|█████▎ | 6603/12384 [14:00:33<12:24:36, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=10.98s]
Epoch 1: 53%|█████▎ | 6603/12384 [14:00:40<12:24:36, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 53%|█████▎ | 6604/12384 [14:00:40<12:21:16, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 53%|█████▎ | 6604/12384 [14:00:48<12:21:16, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 53%|█████▎ | 6605/12384 [14:00:48<12:18:17, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 53%|█████▎ | 6605/12384 [14:00:56<12:18:17, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.73s]
Epoch 1: 53%|█████▎ | 6606/12384 [14:00:56<12:15:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.73s]
Epoch 1: 53%|█████▎ | 6606/12384 [14:01:03<12:15:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.85s]
Epoch 1: 53%|█████▎ | 6607/12384 [14:01:03<12:14:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.85s]
Epoch 1: 53%|█████▎ | 6607/12384 [14:01:11<12:14:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 1: 53%|█████▎ | 6608/12384 [14:01:11<12:13:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 1: 53%|█████▎ | 6608/12384 [14:01:18<12:13:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 53%|█████▎ | 6609/12384 [14:01:18<12:13:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 53%|█████▎ | 6609/12384 [14:01:26<12:13:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 53%|█████▎ | 6610/12384 [14:01:26<12:15:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 53%|█████▎ | 6610/12384 [14:01:34<12:15:51, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=5.65s]
Epoch 1: 53%|█████▎ | 6611/12384 [14:01:34<12:14:32, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=5.65s]
Epoch 1: 53%|█████▎ | 6611/12384 [14:01:41<12:14:32, 7.63s/it, loss=0.0004, acc=0.9978, iter_time=6.36s]
Epoch 1: 53%|█████▎ | 6612/12384 [14:01:41<12:13:46, 7.63s/it, loss=0.0004, acc=0.9978, iter_time=6.36s]
Epoch 1: 53%|█████▎ | 6612/12384 [14:01:49<12:13:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.90s]
Epoch 1: 53%|█████▎ | 6613/12384 [14:01:49<12:12:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.90s]
Epoch 1: 53%|█████▎ | 6613/12384 [14:01:56<12:12:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 53%|█████▎ | 6614/12384 [14:01:56<12:12:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 53%|█████▎ | 6614/12384 [14:02:04<12:12:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 1: 53%|█████▎ | 6615/12384 [14:02:04<12:12:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 1: 53%|█████▎ | 6615/12384 [14:02:12<12:12:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.20s]
Epoch 1: 53%|█████▎ | 6616/12384 [14:02:12<12:18:30, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=11.20s]
Epoch 1: 53%|█████▎ | 6616/12384 [14:02:20<12:18:30, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 1: 53%|█████▎ | 6617/12384 [14:02:20<12:17:32, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 1: 53%|█████▎ | 6617/12384 [14:02:27<12:17:32, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 53%|█████▎ | 6618/12384 [14:02:27<12:15:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 53%|█████▎ | 6618/12384 [14:02:35<12:15:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 1: 53%|█████▎ | 6619/12384 [14:02:35<12:13:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 1: 53%|█████▎ | 6619/12384 [14:02:42<12:13:59, 7.64s/it, loss=0.0002, acc=0.9990, iter_time=8.45s]
Epoch 1: 53%|█████▎ | 6620/12384 [14:02:42<12:12:10, 7.62s/it, loss=0.0002, acc=0.9990, iter_time=8.45s]
Epoch 1: 53%|█████▎ | 6620/12384 [14:02:50<12:12:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 1: 53%|█████▎ | 6621/12384 [14:02:50<12:12:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 1: 53%|█████▎ | 6621/12384 [14:02:58<12:12:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.95s]
Epoch 1: 53%|█████▎ | 6622/12384 [14:02:58<12:11:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.95s]
Epoch 1: 53%|█████▎ | 6622/12384 [14:03:05<12:11:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 53%|█████▎ | 6623/12384 [14:03:05<12:11:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 53%|█████▎ | 6623/12384 [14:03:13<12:11:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 53%|█████▎ | 6624/12384 [14:03:13<12:11:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 53%|█████▎ | 6624/12384 [14:03:20<12:11:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 53%|█████▎ | 6625/12384 [14:03:20<12:11:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 53%|█████▎ | 6625/12384 [14:03:28<12:11:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 54%|█████▎ | 6626/12384 [14:03:28<12:10:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 54%|█████▎ | 6626/12384 [14:03:36<12:10:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 54%|█████▎ | 6627/12384 [14:03:36<12:10:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 54%|█████▎ | 6627/12384 [14:03:43<12:10:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 54%|█████▎ | 6628/12384 [14:03:43<12:10:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 54%|█████▎ | 6628/12384 [14:03:51<12:10:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 54%|█████▎ | 6629/12384 [14:03:51<12:20:21, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 54%|█████▎ | 6629/12384 [14:03:59<12:20:21, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.14s]
Epoch 1: 54%|█████▎ | 6630/12384 [14:03:59<12:16:35, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.14s]
Epoch 1: 54%|█████▎ | 6630/12384 [14:04:06<12:16:35, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.91s]
Epoch 1: 54%|█████▎ | 6631/12384 [14:04:06<12:15:09, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.91s]
Epoch 1: 54%|█████▎ | 6631/12384 [14:04:14<12:15:09, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=9.05s]
Epoch 1: 54%|█████▎ | 6632/12384 [14:04:14<12:13:29, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=9.05s]
Epoch 1: 54%|█████▎ | 6632/12384 [14:04:22<12:13:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 54%|█████▎ | 6633/12384 [14:04:22<12:11:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 54%|█████▎ | 6633/12384 [14:04:29<12:11:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 1: 54%|█████▎ | 6634/12384 [14:04:29<12:12:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 1: 54%|█████▎ | 6634/12384 [14:04:37<12:12:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 54%|█████▎ | 6635/12384 [14:04:37<12:11:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 54%|█████▎ | 6635/12384 [14:04:45<12:11:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 54%|█████▎ | 6636/12384 [14:04:45<12:10:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 54%|█████▎ | 6636/12384 [14:04:52<12:10:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 54%|█████▎ | 6637/12384 [14:04:52<12:09:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 54%|█████▎ | 6637/12384 [14:05:00<12:09:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 1: 54%|█████▎ | 6638/12384 [14:05:00<12:09:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 1: 54%|█████▎ | 6638/12384 [14:05:07<12:09:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 1: 54%|█████▎ | 6639/12384 [14:05:07<12:10:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 1: 54%|█████▎ | 6639/12384 [14:05:15<12:10:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 54%|█████▎ | 6640/12384 [14:05:15<12:09:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 54%|█████▎ | 6640/12384 [14:05:23<12:09:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 1: 54%|█████▎ | 6641/12384 [14:05:23<12:09:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 1: 54%|█████▎ | 6641/12384 [14:05:30<12:09:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 54%|█████▎ | 6642/12384 [14:05:30<12:09:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 54%|█████▎ | 6642/12384 [14:05:38<12:09:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 1: 54%|█████▎ | 6643/12384 [14:05:38<12:08:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 1: 54%|█████▎ | 6643/12384 [14:05:46<12:08:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 54%|█████▎ | 6644/12384 [14:05:46<12:08:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 54%|█████▎ | 6644/12384 [14:05:53<12:08:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 1: 54%|█████▎ | 6645/12384 [14:05:53<12:08:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 1: 54%|█████▎ | 6645/12384 [14:06:01<12:08:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 1: 54%|█████▎ | 6646/12384 [14:06:01<12:08:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 1: 54%|█████▎ | 6646/12384 [14:06:09<12:08:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 54%|█████▎ | 6647/12384 [14:06:09<12:27:57, 7.82s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 54%|█████▎ | 6647/12384 [14:06:17<12:27:57, 7.82s/it, loss=0.0000, acc=1.0000, iter_time=8.14s]
Epoch 1: 54%|█████▎ | 6648/12384 [14:06:17<12:24:59, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=8.14s]
Epoch 1: 54%|█████▎ | 6648/12384 [14:06:25<12:24:59, 7.79s/it, loss=0.0002, acc=0.9991, iter_time=7.55s]
Epoch 1: 54%|█████▎ | 6649/12384 [14:06:25<12:27:50, 7.82s/it, loss=0.0002, acc=0.9991, iter_time=7.55s]
Epoch 1: 54%|█████▎ | 6649/12384 [14:06:32<12:27:50, 7.82s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 54%|█████▎ | 6650/12384 [14:06:32<12:21:41, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 54%|█████▎ | 6650/12384 [14:06:40<12:21:41, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 54%|█████▎ | 6651/12384 [14:06:40<12:16:50, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 54%|█████▎ | 6651/12384 [14:06:48<12:16:50, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 54%|█████▎ | 6652/12384 [14:06:48<12:14:02, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 54%|█████▎ | 6652/12384 [14:06:55<12:14:02, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 54%|█████▎ | 6653/12384 [14:06:55<12:12:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 54%|█████▎ | 6653/12384 [14:07:03<12:12:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 54%|█████▎ | 6654/12384 [14:07:03<12:11:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 54%|█████▎ | 6654/12384 [14:07:10<12:11:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 54%|█████▎ | 6655/12384 [14:07:10<12:09:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 54%|█████▎ | 6655/12384 [14:07:18<12:09:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 1: 54%|█████▎ | 6656/12384 [14:07:18<12:18:11, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 1: 54%|█████▎ | 6656/12384 [14:07:26<12:18:11, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.48s]
Epoch 1: 54%|█████▍ | 6657/12384 [14:07:26<12:14:27, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.48s]
Epoch 1: 54%|█████▍ | 6657/12384 [14:07:34<12:14:27, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=5.84s]
Epoch 1: 54%|█████▍ | 6658/12384 [14:07:34<12:11:59, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=5.84s]
Epoch 1: 54%|█████▍ | 6658/12384 [14:07:41<12:11:59, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 1: 54%|█████▍ | 6659/12384 [14:07:41<12:10:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 1: 54%|█████▍ | 6659/12384 [14:07:49<12:10:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.98s]
Epoch 1: 54%|█████▍ | 6660/12384 [14:07:49<12:10:47, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.98s]
Epoch 1: 54%|█████▍ | 6660/12384 [14:07:56<12:10:47, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 1: 54%|█████▍ | 6661/12384 [14:07:56<12:08:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 1: 54%|█████▍ | 6661/12384 [14:08:04<12:08:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 1: 54%|█████▍ | 6662/12384 [14:08:04<12:08:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 1: 54%|█████▍ | 6662/12384 [14:08:12<12:08:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 1: 54%|█████▍ | 6663/12384 [14:08:12<12:07:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 1: 54%|█████▍ | 6663/12384 [14:08:19<12:07:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 54%|█████▍ | 6664/12384 [14:08:19<12:06:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 54%|█████▍ | 6664/12384 [14:08:27<12:06:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 54%|█████▍ | 6665/12384 [14:08:27<12:06:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 54%|█████▍ | 6665/12384 [14:08:34<12:06:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 54%|█████▍ | 6666/12384 [14:08:34<12:05:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 54%|█████▍ | 6666/12384 [14:08:42<12:05:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 54%|█████▍ | 6667/12384 [14:08:42<12:05:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 54%|█████▍ | 6667/12384 [14:08:50<12:05:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 54%|█████▍ | 6668/12384 [14:08:50<12:05:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 54%|█████▍ | 6668/12384 [14:08:57<12:05:29, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.45s]
Epoch 1: 54%|█████▍ | 6669/12384 [14:08:57<12:05:18, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.45s]
Epoch 1: 54%|█████▍ | 6669/12384 [14:09:05<12:05:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 1: 54%|█████▍ | 6670/12384 [14:09:05<12:06:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 1: 54%|█████▍ | 6670/12384 [14:09:13<12:06:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.64s]
Epoch 1: 54%|█████▍ | 6671/12384 [14:09:13<12:05:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.64s]
Epoch 1: 54%|█████▍ | 6671/12384 [14:09:20<12:05:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.98s]
Epoch 1: 54%|█████▍ | 6672/12384 [14:09:20<12:04:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.98s]
Epoch 1: 54%|█████▍ | 6672/12384 [14:09:28<12:04:34, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.68s]
Epoch 1: 54%|█████▍ | 6673/12384 [14:09:28<12:04:20, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.68s]
Epoch 1: 54%|█████▍ | 6673/12384 [14:09:35<12:04:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.16s]
Epoch 1: 54%|█████▍ | 6674/12384 [14:09:35<12:05:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.16s]
Epoch 1: 54%|█████▍ | 6674/12384 [14:09:43<12:05:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 54%|█████▍ | 6675/12384 [14:09:43<12:05:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 54%|█████▍ | 6675/12384 [14:09:51<12:05:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 54%|█████▍ | 6676/12384 [14:09:51<12:05:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 54%|█████▍ | 6676/12384 [14:09:58<12:05:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 54%|█████▍ | 6677/12384 [14:09:58<12:05:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 54%|█████▍ | 6677/12384 [14:10:06<12:05:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.44s]
Epoch 1: 54%|█████▍ | 6678/12384 [14:10:06<12:05:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.44s]
Epoch 1: 54%|█████▍ | 6678/12384 [14:10:14<12:05:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 1: 54%|█████▍ | 6679/12384 [14:10:14<12:04:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 1: 54%|█████▍ | 6679/12384 [14:10:21<12:04:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.79s]
Epoch 1: 54%|█████▍ | 6680/12384 [14:10:21<12:04:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.79s]
Epoch 1: 54%|█████▍ | 6680/12384 [14:10:29<12:04:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 54%|█████▍ | 6681/12384 [14:10:29<12:04:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 54%|█████▍ | 6681/12384 [14:10:37<12:04:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 1: 54%|█████▍ | 6682/12384 [14:10:37<12:13:57, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 1: 54%|█████▍ | 6682/12384 [14:10:44<12:13:57, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 1: 54%|█████▍ | 6683/12384 [14:10:44<12:10:49, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 1: 54%|█████▍ | 6683/12384 [14:10:52<12:10:49, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 1: 54%|█████▍ | 6684/12384 [14:10:52<12:08:44, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 1: 54%|█████▍ | 6684/12384 [14:11:00<12:08:44, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 1: 54%|█████▍ | 6685/12384 [14:11:00<12:06:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 1: 54%|█████▍ | 6685/12384 [14:11:07<12:06:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.26s]
Epoch 1: 54%|█████▍ | 6686/12384 [14:11:07<12:06:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.26s]
Epoch 1: 54%|█████▍ | 6686/12384 [14:11:15<12:06:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.01s]
Epoch 1: 54%|█████▍ | 6687/12384 [14:11:15<12:04:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.01s]
Epoch 1: 54%|█████▍ | 6687/12384 [14:11:23<12:04:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 54%|█████▍ | 6688/12384 [14:11:23<12:05:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 54%|█████▍ | 6688/12384 [14:11:30<12:05:12, 7.64s/it, loss=0.0004, acc=0.9997, iter_time=7.22s]
Epoch 1: 54%|█████▍ | 6689/12384 [14:11:30<12:04:21, 7.63s/it, loss=0.0004, acc=0.9997, iter_time=7.22s]
Epoch 1: 54%|█████▍ | 6689/12384 [14:11:38<12:04:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 54%|█████▍ | 6690/12384 [14:11:38<12:03:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 54%|█████▍ | 6690/12384 [14:11:45<12:03:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 54%|█████▍ | 6691/12384 [14:11:45<12:02:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 54%|█████▍ | 6691/12384 [14:11:53<12:02:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.48s]
Epoch 1: 54%|█████▍ | 6692/12384 [14:11:53<12:01:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.48s]
Epoch 1: 54%|█████▍ | 6692/12384 [14:12:01<12:01:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 54%|█████▍ | 6693/12384 [14:12:01<12:02:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 54%|█████▍ | 6693/12384 [14:12:08<12:02:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 1: 54%|█████▍ | 6694/12384 [14:12:08<12:02:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 1: 54%|█████▍ | 6694/12384 [14:12:16<12:02:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 1: 54%|█████▍ | 6695/12384 [14:12:16<12:02:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 1: 54%|█████▍ | 6695/12384 [14:12:23<12:02:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 1: 54%|█████▍ | 6696/12384 [14:12:23<12:02:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 1: 54%|█████▍ | 6696/12384 [14:12:31<12:02:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 1: 54%|█████▍ | 6697/12384 [14:12:31<12:01:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 1: 54%|█████▍ | 6697/12384 [14:12:39<12:01:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 54%|█████▍ | 6698/12384 [14:12:39<12:00:24, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 54%|█████▍ | 6698/12384 [14:12:46<12:00:24, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 54%|█████▍ | 6699/12384 [14:12:46<12:03:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 54%|█████▍ | 6699/12384 [14:12:54<12:03:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.33s]
Epoch 1: 54%|█████▍ | 6700/12384 [14:12:54<12:02:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.33s]
Epoch 1: 54%|█████▍ | 6700/12384 [14:13:02<12:02:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.43s]
Epoch 1: 54%|█████▍ | 6701/12384 [14:13:02<12:03:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.43s]
Epoch 1: 54%|█████▍ | 6701/12384 [14:13:09<12:03:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 54%|█████▍ | 6702/12384 [14:13:09<12:02:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 54%|█████▍ | 6702/12384 [14:13:17<12:02:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 54%|█████▍ | 6703/12384 [14:13:17<12:01:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 54%|█████▍ | 6703/12384 [14:13:24<12:01:05, 7.62s/it, loss=0.0007, acc=0.9969, iter_time=7.99s]
Epoch 1: 54%|█████▍ | 6704/12384 [14:13:24<12:00:58, 7.62s/it, loss=0.0007, acc=0.9969, iter_time=7.99s]
Epoch 1: 54%|█████▍ | 6704/12384 [14:13:32<12:00:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 54%|█████▍ | 6705/12384 [14:13:32<12:00:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 54%|█████▍ | 6705/12384 [14:13:40<12:00:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 54%|█████▍ | 6706/12384 [14:13:40<12:00:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 54%|█████▍ | 6706/12384 [14:13:47<12:00:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 54%|█████▍ | 6707/12384 [14:13:47<12:00:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 54%|█████▍ | 6707/12384 [14:13:55<12:00:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.02s]
Epoch 1: 54%|█████▍ | 6708/12384 [14:13:55<12:01:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.02s]
Epoch 1: 54%|█████▍ | 6708/12384 [14:14:03<12:01:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.26s]
Epoch 1: 54%|█████▍ | 6709/12384 [14:14:03<12:09:27, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=11.26s]
Epoch 1: 54%|█████▍ | 6709/12384 [14:14:10<12:09:27, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 54%|█████▍ | 6710/12384 [14:14:10<12:06:38, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 54%|█████▍ | 6710/12384 [14:14:18<12:06:38, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 54%|█████▍ | 6711/12384 [14:14:18<12:04:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 54%|█████▍ | 6711/12384 [14:14:26<12:04:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 54%|█████▍ | 6712/12384 [14:14:26<12:02:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 54%|█████▍ | 6712/12384 [14:14:33<12:02:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 54%|█████▍ | 6713/12384 [14:14:33<12:01:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 54%|█████▍ | 6713/12384 [14:14:41<12:01:58, 7.64s/it, loss=0.0004, acc=1.0000, iter_time=5.05s]
Epoch 1: 54%|█████▍ | 6714/12384 [14:14:41<12:01:17, 7.63s/it, loss=0.0004, acc=1.0000, iter_time=5.05s]
Epoch 1: 54%|█████▍ | 6714/12384 [14:14:48<12:01:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.68s]
Epoch 1: 54%|█████▍ | 6715/12384 [14:14:48<12:00:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.68s]
Epoch 1: 54%|█████▍ | 6715/12384 [14:14:56<12:00:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.50s]
Epoch 1: 54%|█████▍ | 6716/12384 [14:14:56<11:59:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.50s]
Epoch 1: 54%|█████▍ | 6716/12384 [14:15:04<11:59:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 54%|█████▍ | 6717/12384 [14:15:04<11:59:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 54%|█████▍ | 6717/12384 [14:15:11<11:59:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 54%|█████▍ | 6718/12384 [14:15:11<12:00:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 54%|█████▍ | 6718/12384 [14:15:19<12:00:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.89s]
Epoch 1: 54%|█████▍ | 6719/12384 [14:15:19<11:59:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.89s]
Epoch 1: 54%|█████▍ | 6719/12384 [14:15:27<11:59:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.75s]
Epoch 1: 54%|█████▍ | 6720/12384 [14:15:27<11:59:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.75s]
Epoch 1: 54%|█████▍ | 6720/12384 [14:15:34<11:59:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.97s]
Epoch 1: 54%|█████▍ | 6721/12384 [14:15:34<11:58:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.97s]
Epoch 1: 54%|█████▍ | 6721/12384 [14:15:42<11:58:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.85s]
Epoch 1: 54%|█████▍ | 6722/12384 [14:15:42<11:57:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.85s]
Epoch 1: 54%|█████▍ | 6722/12384 [14:15:49<11:57:48, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.04s]
Epoch 1: 54%|█████▍ | 6723/12384 [14:15:49<11:57:22, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.04s]
Epoch 1: 54%|█████▍ | 6723/12384 [14:15:57<11:57:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 1: 54%|█████▍ | 6724/12384 [14:15:57<11:57:23, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 1: 54%|█████▍ | 6724/12384 [14:16:05<11:57:23, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 1: 54%|█████▍ | 6725/12384 [14:16:05<11:57:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 1: 54%|█████▍ | 6725/12384 [14:16:12<11:57:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 54%|█████▍ | 6726/12384 [14:16:12<11:57:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 54%|█████▍ | 6726/12384 [14:16:20<11:57:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 54%|█████▍ | 6727/12384 [14:16:20<11:56:43, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 54%|█████▍ | 6727/12384 [14:16:27<11:56:43, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 54%|█████▍ | 6728/12384 [14:16:27<11:56:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 54%|█████▍ | 6728/12384 [14:16:35<11:56:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.52s]
Epoch 1: 54%|█████▍ | 6729/12384 [14:16:35<11:56:44, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.52s]
Epoch 1: 54%|█████▍ | 6729/12384 [14:16:43<11:56:44, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 1: 54%|█████▍ | 6730/12384 [14:16:43<11:56:37, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 1: 54%|█████▍ | 6730/12384 [14:16:50<11:56:37, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 1: 54%|█████▍ | 6731/12384 [14:16:50<11:56:24, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 1: 54%|█████▍ | 6731/12384 [14:16:58<11:56:24, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 1: 54%|█████▍ | 6732/12384 [14:16:58<11:57:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 1: 54%|█████▍ | 6732/12384 [14:17:05<11:57:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 54%|█████▍ | 6733/12384 [14:17:05<11:57:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 54%|█████▍ | 6733/12384 [14:17:13<11:57:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 54%|█████▍ | 6734/12384 [14:17:13<11:57:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 54%|█████▍ | 6734/12384 [14:17:21<11:57:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 54%|█████▍ | 6735/12384 [14:17:21<12:06:54, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 54%|█████▍ | 6735/12384 [14:17:29<12:06:54, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 1: 54%|█████▍ | 6736/12384 [14:17:29<12:03:34, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 1: 54%|█████▍ | 6736/12384 [14:17:36<12:03:34, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.02s]
Epoch 1: 54%|█████▍ | 6737/12384 [14:17:36<12:02:41, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.02s]
Epoch 1: 54%|█████▍ | 6737/12384 [14:17:44<12:02:41, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 1: 54%|█████▍ | 6738/12384 [14:17:44<12:00:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 1: 54%|█████▍ | 6738/12384 [14:17:52<12:00:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 54%|█████▍ | 6739/12384 [14:17:52<11:59:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 54%|█████▍ | 6739/12384 [14:17:59<11:59:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 1: 54%|█████▍ | 6740/12384 [14:17:59<11:58:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 1: 54%|█████▍ | 6740/12384 [14:18:07<11:58:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 1: 54%|█████▍ | 6741/12384 [14:18:07<11:57:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 1: 54%|█████▍ | 6741/12384 [14:18:14<11:57:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 1: 54%|█████▍ | 6742/12384 [14:18:14<11:57:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 1: 54%|█████▍ | 6742/12384 [14:18:22<11:57:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.36s]
Epoch 1: 54%|█████▍ | 6743/12384 [14:18:22<11:56:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.36s]
Epoch 1: 54%|█████▍ | 6743/12384 [14:18:30<11:56:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.35s]
Epoch 1: 54%|█████▍ | 6744/12384 [14:18:30<11:56:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.35s]
Epoch 1: 54%|█████▍ | 6744/12384 [14:18:37<11:56:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 54%|█████▍ | 6745/12384 [14:18:37<11:58:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 54%|█████▍ | 6745/12384 [14:18:45<11:58:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 54%|█████▍ | 6746/12384 [14:18:45<11:57:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 54%|█████▍ | 6746/12384 [14:18:53<11:57:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 1: 54%|█████▍ | 6747/12384 [14:18:53<11:57:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 1: 54%|█████▍ | 6747/12384 [14:19:00<11:57:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 1: 54%|█████▍ | 6748/12384 [14:19:00<11:56:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 1: 54%|█████▍ | 6748/12384 [14:19:08<11:56:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 1: 54%|█████▍ | 6749/12384 [14:19:08<11:56:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 1: 54%|█████▍ | 6749/12384 [14:19:15<11:56:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 55%|█████▍ | 6750/12384 [14:19:15<11:55:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 55%|█████▍ | 6750/12384 [14:19:23<11:55:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 1: 55%|█████▍ | 6751/12384 [14:19:23<11:54:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 1: 55%|█████▍ | 6751/12384 [14:19:31<11:54:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 55%|█████▍ | 6752/12384 [14:19:31<11:54:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 55%|█████▍ | 6752/12384 [14:19:38<11:54:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 55%|█████▍ | 6753/12384 [14:19:38<11:54:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 55%|█████▍ | 6753/12384 [14:19:46<11:54:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 55%|█████▍ | 6754/12384 [14:19:46<11:54:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 55%|█████▍ | 6754/12384 [14:19:53<11:54:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 55%|█████▍ | 6755/12384 [14:19:53<11:54:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 55%|█████▍ | 6755/12384 [14:20:01<11:54:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 55%|█████▍ | 6756/12384 [14:20:01<11:54:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 55%|█████▍ | 6756/12384 [14:20:09<11:54:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 55%|█████▍ | 6757/12384 [14:20:09<11:53:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 55%|█████▍ | 6757/12384 [14:20:16<11:53:59, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 1: 55%|█████▍ | 6758/12384 [14:20:16<11:54:02, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 1: 55%|█████▍ | 6758/12384 [14:20:24<11:54:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 55%|█████▍ | 6759/12384 [14:20:24<11:54:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 55%|█████▍ | 6759/12384 [14:20:32<11:54:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 55%|█████▍ | 6760/12384 [14:20:32<11:54:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 55%|█████▍ | 6760/12384 [14:20:39<11:54:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 55%|█████▍ | 6761/12384 [14:20:39<12:01:59, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 55%|█████▍ | 6761/12384 [14:20:47<12:01:59, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.51s]
Epoch 1: 55%|█████▍ | 6762/12384 [14:20:47<11:59:02, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.51s]
Epoch 1: 55%|█████▍ | 6762/12384 [14:20:55<11:59:02, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 1: 55%|█████▍ | 6763/12384 [14:20:55<11:56:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 1: 55%|█████▍ | 6763/12384 [14:21:02<11:56:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 55%|█████▍ | 6764/12384 [14:21:02<11:55:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 55%|█████▍ | 6764/12384 [14:21:10<11:55:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.45s]
Epoch 1: 55%|█████▍ | 6765/12384 [14:21:10<11:54:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.45s]
Epoch 1: 55%|█████▍ | 6765/12384 [14:21:17<11:54:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.19s]
Epoch 1: 55%|█████▍ | 6766/12384 [14:21:17<11:54:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.19s]
Epoch 1: 55%|█████▍ | 6766/12384 [14:21:25<11:54:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.42s]
Epoch 1: 55%|█████▍ | 6767/12384 [14:21:25<11:55:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.42s]
Epoch 1: 55%|█████▍ | 6767/12384 [14:21:33<11:55:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.82s]
Epoch 1: 55%|█████▍ | 6768/12384 [14:21:33<11:54:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.82s]
Epoch 1: 55%|█████▍ | 6768/12384 [14:21:40<11:54:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 55%|█████▍ | 6769/12384 [14:21:40<11:53:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 55%|█████▍ | 6769/12384 [14:21:48<11:53:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 55%|█████▍ | 6770/12384 [14:21:48<11:52:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 55%|█████▍ | 6770/12384 [14:21:56<11:52:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 1: 55%|█████▍ | 6771/12384 [14:21:56<11:52:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 1: 55%|█████▍ | 6771/12384 [14:22:03<11:52:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 55%|█████▍ | 6772/12384 [14:22:03<11:52:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 55%|█████▍ | 6772/12384 [14:22:11<11:52:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 55%|█████▍ | 6773/12384 [14:22:11<11:52:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 55%|█████▍ | 6773/12384 [14:22:18<11:52:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 55%|█████▍ | 6774/12384 [14:22:18<11:52:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 55%|█████▍ | 6774/12384 [14:22:26<11:52:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 55%|█████▍ | 6775/12384 [14:22:26<11:51:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 55%|█████▍ | 6775/12384 [14:22:34<11:51:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 1: 55%|█████▍ | 6776/12384 [14:22:34<11:51:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 1: 55%|█████▍ | 6776/12384 [14:22:41<11:51:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 1: 55%|█████▍ | 6777/12384 [14:22:41<11:51:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 1: 55%|█████▍ | 6777/12384 [14:22:49<11:51:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 1: 55%|█████▍ | 6778/12384 [14:22:49<12:02:06, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 1: 55%|█████▍ | 6778/12384 [14:22:57<12:02:06, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 55%|█████▍ | 6779/12384 [14:22:57<11:58:52, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 55%|█████▍ | 6779/12384 [14:23:04<11:58:52, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 1: 55%|█████▍ | 6780/12384 [14:23:04<11:56:41, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 1: 55%|█████▍ | 6780/12384 [14:23:12<11:56:41, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 55%|█████▍ | 6781/12384 [14:23:12<11:54:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 55%|█████▍ | 6781/12384 [14:23:20<11:54:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 55%|█████▍ | 6782/12384 [14:23:20<11:53:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 55%|█████▍ | 6782/12384 [14:23:28<11:53:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.80s]
Epoch 1: 55%|█████▍ | 6783/12384 [14:23:28<11:58:40, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.80s]
Epoch 1: 55%|█████▍ | 6783/12384 [14:23:35<11:58:40, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 55%|█████▍ | 6784/12384 [14:23:35<11:55:46, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 55%|█████▍ | 6784/12384 [14:23:43<11:55:46, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 1: 55%|█████▍ | 6785/12384 [14:23:43<12:05:07, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 1: 55%|█████▍ | 6785/12384 [14:23:51<12:05:07, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=10.59s]
Epoch 1: 55%|█████▍ | 6786/12384 [14:23:51<12:02:48, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=10.59s]
Epoch 1: 55%|█████▍ | 6786/12384 [14:23:59<12:02:48, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.77s]
Epoch 1: 55%|█████▍ | 6787/12384 [14:23:59<12:10:21, 7.83s/it, loss=0.0000, acc=1.0000, iter_time=7.77s]
Epoch 1: 55%|█████▍ | 6787/12384 [14:24:06<12:10:21, 7.83s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 1: 55%|█████▍ | 6788/12384 [14:24:06<12:04:24, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 1: 55%|█████▍ | 6788/12384 [14:24:14<12:04:24, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 1: 55%|█████▍ | 6789/12384 [14:24:14<12:04:29, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 1: 55%|█████▍ | 6789/12384 [14:24:22<12:04:29, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 55%|█████▍ | 6790/12384 [14:24:22<12:01:55, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 55%|█████▍ | 6790/12384 [14:24:30<12:01:55, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 1: 55%|█████▍ | 6791/12384 [14:24:30<11:57:29, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 1: 55%|█████▍ | 6791/12384 [14:24:37<11:57:29, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.46s]
Epoch 1: 55%|█████▍ | 6792/12384 [14:24:37<11:54:50, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.46s]
Epoch 1: 55%|█████▍ | 6792/12384 [14:24:45<11:54:50, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 1: 55%|█████▍ | 6793/12384 [14:24:45<11:52:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 1: 55%|█████▍ | 6793/12384 [14:24:52<11:52:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 1: 55%|█████▍ | 6794/12384 [14:24:52<11:51:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 1: 55%|█████▍ | 6794/12384 [14:25:00<11:51:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 55%|█████▍ | 6795/12384 [14:25:00<11:49:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 55%|█████▍ | 6795/12384 [14:25:08<11:49:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 1: 55%|█████▍ | 6796/12384 [14:25:08<11:49:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 1: 55%|█████▍ | 6796/12384 [14:25:15<11:49:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 1: 55%|█████▍ | 6797/12384 [14:25:15<11:49:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 1: 55%|█████▍ | 6797/12384 [14:25:23<11:49:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 55%|█████▍ | 6798/12384 [14:25:23<11:49:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 55%|█████▍ | 6798/12384 [14:25:30<11:49:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 1: 55%|█████▍ | 6799/12384 [14:25:30<11:48:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 1: 55%|█████▍ | 6799/12384 [14:25:38<11:48:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.70s]
Epoch 1: 55%|█████▍ | 6800/12384 [14:25:38<11:48:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.70s]
Epoch 1: 55%|█████▍ | 6800/12384 [14:25:46<11:48:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 55%|█████▍ | 6801/12384 [14:25:46<11:48:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 55%|█████▍ | 6801/12384 [14:25:53<11:48:01, 7.61s/it, loss=0.0002, acc=0.9985, iter_time=8.23s]
Epoch 1: 55%|█████▍ | 6802/12384 [14:25:53<11:48:09, 7.61s/it, loss=0.0002, acc=0.9985, iter_time=8.23s]
Epoch 1: 55%|█████▍ | 6802/12384 [14:26:01<11:48:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 55%|█████▍ | 6803/12384 [14:26:01<11:47:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 55%|█████▍ | 6803/12384 [14:26:09<11:47:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 1: 55%|█████▍ | 6804/12384 [14:26:09<11:55:38, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 1: 55%|█████▍ | 6804/12384 [14:26:16<11:55:38, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 55%|█████▍ | 6805/12384 [14:26:16<11:53:34, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 55%|█████▍ | 6805/12384 [14:26:24<11:53:34, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 1: 55%|█████▍ | 6806/12384 [14:26:24<11:53:41, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 1: 55%|█████▍ | 6806/12384 [14:26:32<11:53:41, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.49s]
Epoch 1: 55%|█████▍ | 6807/12384 [14:26:32<11:54:51, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.49s]
Epoch 1: 55%|█████▍ | 6807/12384 [14:26:39<11:54:51, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=8.17s]
Epoch 1: 55%|█████▍ | 6808/12384 [14:26:39<11:55:04, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=8.17s]
Epoch 1: 55%|█████▍ | 6808/12384 [14:26:47<11:55:04, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 55%|█████▍ | 6809/12384 [14:26:47<11:54:50, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 55%|█████▍ | 6809/12384 [14:26:55<11:54:50, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.42s]
Epoch 1: 55%|█████▍ | 6810/12384 [14:26:55<11:54:54, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.42s]
Epoch 1: 55%|█████▍ | 6810/12384 [14:27:03<11:54:54, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=11.00s]
Epoch 1: 55%|█████▍ | 6811/12384 [14:27:03<11:54:54, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=11.00s]
Epoch 1: 55%|█████▍ | 6811/12384 [14:27:10<11:54:54, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.40s]
Epoch 1: 55%|█████▌ | 6812/12384 [14:27:10<11:54:51, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.40s]
Epoch 1: 55%|█████▌ | 6812/12384 [14:27:19<11:54:51, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=11.16s]
Epoch 1: 55%|█████▌ | 6813/12384 [14:27:19<12:11:35, 7.88s/it, loss=0.0000, acc=1.0000, iter_time=11.16s]
Epoch 1: 55%|█████▌ | 6813/12384 [14:27:27<12:11:35, 7.88s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 1: 55%|█████▌ | 6814/12384 [14:27:27<12:26:13, 8.04s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 1: 55%|█████▌ | 6814/12384 [14:27:35<12:26:13, 8.04s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 55%|█████▌ | 6815/12384 [14:27:35<12:16:47, 7.94s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 55%|█████▌ | 6815/12384 [14:27:42<12:16:47, 7.94s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 1: 55%|█████▌ | 6816/12384 [14:27:42<12:12:24, 7.89s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 1: 55%|█████▌ | 6816/12384 [14:27:50<12:12:24, 7.89s/it, loss=0.0000, acc=1.0000, iter_time=6.63s]
Epoch 1: 55%|█████▌ | 6817/12384 [14:27:50<12:06:56, 7.83s/it, loss=0.0000, acc=1.0000, iter_time=6.63s]
Epoch 1: 55%|█████▌ | 6817/12384 [14:27:58<12:06:56, 7.83s/it, loss=0.0000, acc=1.0000, iter_time=6.33s]
Epoch 1: 55%|█████▌ | 6818/12384 [14:27:58<12:06:20, 7.83s/it, loss=0.0000, acc=1.0000, iter_time=6.33s]
Epoch 1: 55%|█████▌ | 6818/12384 [14:28:06<12:06:20, 7.83s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 1: 55%|█████▌ | 6819/12384 [14:28:06<12:10:55, 7.88s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 1: 55%|█████▌ | 6819/12384 [14:28:14<12:10:55, 7.88s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 55%|█████▌ | 6820/12384 [14:28:14<12:05:36, 7.82s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 55%|█████▌ | 6820/12384 [14:28:21<12:05:36, 7.82s/it, loss=0.0000, acc=1.0000, iter_time=5.40s]
Epoch 1: 55%|█████▌ | 6821/12384 [14:28:21<12:01:46, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=5.40s]
Epoch 1: 55%|█████▌ | 6821/12384 [14:28:29<12:01:46, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=11.00s]
Epoch 1: 55%|█████▌ | 6822/12384 [14:28:29<11:58:33, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=11.00s]
Epoch 1: 55%|█████▌ | 6822/12384 [14:28:37<11:58:33, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=4.40s]
Epoch 1: 55%|█████▌ | 6823/12384 [14:28:37<11:57:15, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=4.40s]
Epoch 1: 55%|█████▌ | 6823/12384 [14:28:44<11:57:15, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=11.36s]
Epoch 1: 55%|█████▌ | 6824/12384 [14:28:44<11:56:21, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=11.36s]
Epoch 1: 55%|█████▌ | 6824/12384 [14:28:52<11:56:21, 7.73s/it, loss=0.0004, acc=0.9979, iter_time=3.69s]
Epoch 1: 55%|█████▌ | 6825/12384 [14:28:52<11:53:44, 7.70s/it, loss=0.0004, acc=0.9979, iter_time=3.69s]
Epoch 1: 55%|█████▌ | 6825/12384 [14:29:00<11:53:44, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 1: 55%|█████▌ | 6826/12384 [14:29:00<11:55:26, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 1: 55%|█████▌ | 6826/12384 [14:29:08<11:55:26, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.85s]
Epoch 1: 55%|█████▌ | 6827/12384 [14:29:08<11:54:30, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.85s]
Epoch 1: 55%|█████▌ | 6827/12384 [14:29:15<11:54:30, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 55%|█████▌ | 6828/12384 [14:29:15<11:51:51, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 55%|█████▌ | 6828/12384 [14:29:23<11:51:51, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 1: 55%|█████▌ | 6829/12384 [14:29:23<11:51:45, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 1: 55%|█████▌ | 6829/12384 [14:29:30<11:51:45, 7.69s/it, loss=0.0004, acc=1.0000, iter_time=7.95s]
Epoch 1: 55%|█████▌ | 6830/12384 [14:29:30<11:49:52, 7.67s/it, loss=0.0004, acc=1.0000, iter_time=7.95s]
Epoch 1: 55%|█████▌ | 6830/12384 [14:29:38<11:49:52, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.41s]
Epoch 1: 55%|█████▌ | 6831/12384 [14:29:38<11:55:23, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.41s]
Epoch 1: 55%|█████▌ | 6831/12384 [14:29:46<11:55:23, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 1: 55%|█████▌ | 6832/12384 [14:29:46<11:58:40, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 1: 55%|█████▌ | 6832/12384 [14:29:54<11:58:40, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 1: 55%|█████▌ | 6833/12384 [14:29:54<12:00:51, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 1: 55%|█████▌ | 6833/12384 [14:30:02<12:00:51, 7.79s/it, loss=0.0001, acc=1.0000, iter_time=5.85s]
Epoch 1: 55%|█████▌ | 6834/12384 [14:30:02<12:01:46, 7.80s/it, loss=0.0001, acc=1.0000, iter_time=5.85s]
Epoch 1: 55%|█████▌ | 6834/12384 [14:30:10<12:01:46, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 1: 55%|█████▌ | 6835/12384 [14:30:10<12:02:36, 7.81s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 1: 55%|█████▌ | 6835/12384 [14:30:18<12:02:36, 7.81s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 1: 55%|█████▌ | 6836/12384 [14:30:18<12:14:38, 7.94s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 1: 55%|█████▌ | 6836/12384 [14:30:26<12:14:38, 7.94s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 1: 55%|█████▌ | 6837/12384 [14:30:26<12:11:19, 7.91s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 1: 55%|█████▌ | 6837/12384 [14:30:34<12:11:19, 7.91s/it, loss=0.0000, acc=1.0000, iter_time=5.20s]
Epoch 1: 55%|█████▌ | 6838/12384 [14:30:34<12:08:00, 7.88s/it, loss=0.0000, acc=1.0000, iter_time=5.20s]
Epoch 1: 55%|█████▌ | 6838/12384 [14:30:41<12:08:00, 7.88s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 1: 55%|█████▌ | 6839/12384 [14:30:41<12:07:19, 7.87s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 1: 55%|█████▌ | 6839/12384 [14:30:50<12:07:19, 7.87s/it, loss=0.0000, acc=1.0000, iter_time=8.39s]
Epoch 1: 55%|█████▌ | 6840/12384 [14:30:50<12:21:24, 8.02s/it, loss=0.0000, acc=1.0000, iter_time=8.39s]
Epoch 1: 55%|█████▌ | 6840/12384 [14:30:58<12:21:24, 8.02s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 1: 55%|█████▌ | 6841/12384 [14:30:58<12:18:12, 7.99s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 1: 55%|█████▌ | 6841/12384 [14:31:06<12:18:12, 7.99s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 1: 55%|█████▌ | 6842/12384 [14:31:06<12:23:41, 8.05s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 1: 55%|█████▌ | 6842/12384 [14:31:14<12:23:41, 8.05s/it, loss=0.0000, acc=1.0000, iter_time=5.58s]
Epoch 1: 55%|█████▌ | 6843/12384 [14:31:14<12:19:37, 8.01s/it, loss=0.0000, acc=1.0000, iter_time=5.58s]
Epoch 1: 55%|█████▌ | 6843/12384 [14:31:22<12:19:37, 8.01s/it, loss=0.0000, acc=1.0000, iter_time=10.12s]
Epoch 1: 55%|█████▌ | 6844/12384 [14:31:22<12:13:15, 7.94s/it, loss=0.0000, acc=1.0000, iter_time=10.12s]
Epoch 1: 55%|█████▌ | 6844/12384 [14:31:30<12:13:15, 7.94s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 55%|█████▌ | 6845/12384 [14:31:30<12:14:44, 7.96s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 55%|█████▌ | 6845/12384 [14:31:37<12:14:44, 7.96s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 55%|█████▌ | 6846/12384 [14:31:37<12:06:45, 7.87s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 55%|█████▌ | 6846/12384 [14:31:45<12:06:45, 7.87s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 55%|█████▌ | 6847/12384 [14:31:45<12:00:45, 7.81s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 55%|█████▌ | 6847/12384 [14:31:53<12:00:45, 7.81s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 55%|█████▌ | 6848/12384 [14:31:53<11:57:25, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 55%|█████▌ | 6848/12384 [14:32:00<11:57:25, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 1: 55%|█████▌ | 6849/12384 [14:32:00<11:54:19, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 1: 55%|█████▌ | 6849/12384 [14:32:08<11:54:19, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=9.30s]
Epoch 1: 55%|█████▌ | 6850/12384 [14:32:08<12:04:22, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=9.30s]
Epoch 1: 55%|█████▌ | 6850/12384 [14:32:16<12:04:22, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=4.80s]
Epoch 1: 55%|█████▌ | 6851/12384 [14:32:16<11:59:50, 7.81s/it, loss=0.0000, acc=1.0000, iter_time=4.80s]
Epoch 1: 55%|█████▌ | 6851/12384 [14:32:24<11:59:50, 7.81s/it, loss=0.0000, acc=1.0000, iter_time=10.55s]
Epoch 1: 55%|█████▌ | 6852/12384 [14:32:24<11:54:56, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=10.55s]
Epoch 1: 55%|█████▌ | 6852/12384 [14:32:32<11:54:56, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 55%|█████▌ | 6853/12384 [14:32:32<11:53:46, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 55%|█████▌ | 6853/12384 [14:32:39<11:53:46, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 55%|█████▌ | 6854/12384 [14:32:39<11:55:30, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 55%|█████▌ | 6854/12384 [14:32:47<11:55:30, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 55%|█████▌ | 6855/12384 [14:32:47<11:52:29, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 55%|█████▌ | 6855/12384 [14:32:55<11:52:29, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 1: 55%|█████▌ | 6856/12384 [14:32:55<11:50:46, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 1: 55%|█████▌ | 6856/12384 [14:33:02<11:50:46, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 55%|█████▌ | 6857/12384 [14:33:02<11:48:58, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 55%|█████▌ | 6857/12384 [14:33:10<11:48:58, 7.70s/it, loss=0.0004, acc=0.9988, iter_time=7.74s]
Epoch 1: 55%|█████▌ | 6858/12384 [14:33:10<11:49:53, 7.71s/it, loss=0.0004, acc=0.9988, iter_time=7.74s]
Epoch 1: 55%|█████▌ | 6858/12384 [14:33:18<11:49:53, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 55%|█████▌ | 6859/12384 [14:33:18<11:50:03, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 55%|█████▌ | 6859/12384 [14:33:25<11:50:03, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 55%|█████▌ | 6860/12384 [14:33:25<11:49:28, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 55%|█████▌ | 6860/12384 [14:33:33<11:49:28, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.05s]
Epoch 1: 55%|█████▌ | 6861/12384 [14:33:33<11:55:53, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=6.05s]
Epoch 1: 55%|█████▌ | 6861/12384 [14:33:41<11:55:53, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=6.55s]
Epoch 1: 55%|█████▌ | 6862/12384 [14:33:41<11:53:00, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=6.55s]
Epoch 1: 55%|█████▌ | 6862/12384 [14:33:49<11:53:00, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 1: 55%|█████▌ | 6863/12384 [14:33:49<11:55:47, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 1: 55%|█████▌ | 6863/12384 [14:33:57<11:55:47, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 55%|█████▌ | 6864/12384 [14:33:57<11:54:10, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 55%|█████▌ | 6864/12384 [14:34:04<11:54:10, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=5.68s]
Epoch 1: 55%|█████▌ | 6865/12384 [14:34:04<11:52:58, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=5.68s]
Epoch 1: 55%|█████▌ | 6865/12384 [14:34:12<11:52:58, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=10.59s]
Epoch 1: 55%|█████▌ | 6866/12384 [14:34:12<12:02:17, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=10.59s]
Epoch 1: 55%|█████▌ | 6866/12384 [14:34:20<12:02:17, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 1: 55%|█████▌ | 6867/12384 [14:34:20<11:59:28, 7.82s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 1: 55%|█████▌ | 6867/12384 [14:34:28<11:59:28, 7.82s/it, loss=0.0004, acc=0.9982, iter_time=8.04s]
Epoch 1: 55%|█████▌ | 6868/12384 [14:34:28<11:57:00, 7.80s/it, loss=0.0004, acc=0.9982, iter_time=8.04s]
Epoch 1: 55%|█████▌ | 6868/12384 [14:34:36<11:57:00, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 55%|█████▌ | 6869/12384 [14:34:36<11:52:16, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 55%|█████▌ | 6869/12384 [14:34:43<11:52:16, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=6.24s]
Epoch 1: 55%|█████▌ | 6870/12384 [14:34:43<11:55:55, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=6.24s]
Epoch 1: 55%|█████▌ | 6870/12384 [14:34:51<11:55:55, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=9.63s]
Epoch 1: 55%|█████▌ | 6871/12384 [14:34:51<12:01:03, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=9.63s]
Epoch 1: 55%|█████▌ | 6871/12384 [14:34:59<12:01:03, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 1: 55%|█████▌ | 6872/12384 [14:34:59<12:03:52, 7.88s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 1: 55%|█████▌ | 6872/12384 [14:35:07<12:03:52, 7.88s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 1: 55%|█████▌ | 6873/12384 [14:35:07<11:57:13, 7.81s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 1: 55%|█████▌ | 6873/12384 [14:35:15<11:57:13, 7.81s/it, loss=0.0000, acc=1.0000, iter_time=9.62s]
Epoch 1: 56%|█████▌ | 6874/12384 [14:35:15<11:54:19, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=9.62s]
Epoch 1: 56%|█████▌ | 6874/12384 [14:35:22<11:54:19, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=7.13s]
Epoch 1: 56%|█████▌ | 6875/12384 [14:35:22<11:51:56, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.13s]
Epoch 1: 56%|█████▌ | 6875/12384 [14:35:30<11:51:56, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 1: 56%|█████▌ | 6876/12384 [14:35:30<11:48:09, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 1: 56%|█████▌ | 6876/12384 [14:35:38<11:48:09, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 56%|█████▌ | 6877/12384 [14:35:38<11:46:46, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 56%|█████▌ | 6877/12384 [14:35:45<11:46:46, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 56%|█████▌ | 6878/12384 [14:35:45<11:44:56, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 56%|█████▌ | 6878/12384 [14:35:53<11:44:56, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.29s]
Epoch 1: 56%|█████▌ | 6879/12384 [14:35:53<11:45:42, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.29s]
Epoch 1: 56%|█████▌ | 6879/12384 [14:36:01<11:45:42, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 1: 56%|█████▌ | 6880/12384 [14:36:01<11:46:50, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 1: 56%|█████▌ | 6880/12384 [14:36:08<11:46:50, 7.71s/it, loss=0.0001, acc=0.9999, iter_time=7.67s]
Epoch 1: 56%|█████▌ | 6881/12384 [14:36:08<11:44:06, 7.68s/it, loss=0.0001, acc=0.9999, iter_time=7.67s]
Epoch 1: 56%|█████▌ | 6881/12384 [14:36:16<11:44:06, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 56%|█████▌ | 6882/12384 [14:36:16<11:42:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 56%|█████▌ | 6882/12384 [14:36:24<11:42:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 56%|█████▌ | 6883/12384 [14:36:24<11:40:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 56%|█████▌ | 6883/12384 [14:36:31<11:40:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 1: 56%|█████▌ | 6884/12384 [14:36:31<11:39:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 1: 56%|█████▌ | 6884/12384 [14:36:39<11:39:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 1: 56%|█████▌ | 6885/12384 [14:36:39<11:39:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 1: 56%|█████▌ | 6885/12384 [14:36:47<11:39:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.68s]
Epoch 1: 56%|█████▌ | 6886/12384 [14:36:47<11:38:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.68s]
Epoch 1: 56%|█████▌ | 6886/12384 [14:36:54<11:38:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 1: 56%|█████▌ | 6887/12384 [14:36:54<11:37:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 1: 56%|█████▌ | 6887/12384 [14:37:02<11:37:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 56%|█████▌ | 6888/12384 [14:37:02<11:39:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 56%|█████▌ | 6888/12384 [14:37:09<11:39:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 56%|█████▌ | 6889/12384 [14:37:09<11:38:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 56%|█████▌ | 6889/12384 [14:37:17<11:38:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 56%|█████▌ | 6890/12384 [14:37:17<11:39:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 56%|█████▌ | 6890/12384 [14:37:25<11:39:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 56%|█████▌ | 6891/12384 [14:37:25<11:38:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 56%|█████▌ | 6891/12384 [14:37:32<11:38:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 56%|█████▌ | 6892/12384 [14:37:32<11:38:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 56%|█████▌ | 6892/12384 [14:37:40<11:38:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 1: 56%|█████▌ | 6893/12384 [14:37:40<11:48:29, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 1: 56%|█████▌ | 6893/12384 [14:37:48<11:48:29, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 1: 56%|█████▌ | 6894/12384 [14:37:48<11:44:41, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 1: 56%|█████▌ | 6894/12384 [14:37:55<11:44:41, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 1: 56%|█████▌ | 6895/12384 [14:37:55<11:41:32, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 1: 56%|█████▌ | 6895/12384 [14:38:03<11:41:32, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.58s]
Epoch 1: 56%|█████▌ | 6896/12384 [14:38:03<11:39:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.58s]
Epoch 1: 56%|█████▌ | 6896/12384 [14:38:11<11:39:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.97s]
Epoch 1: 56%|█████▌ | 6897/12384 [14:38:11<11:38:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.97s]
Epoch 1: 56%|█████▌ | 6897/12384 [14:38:18<11:38:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 1: 56%|█████▌ | 6898/12384 [14:38:18<11:37:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 1: 56%|█████▌ | 6898/12384 [14:38:26<11:37:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 1: 56%|█████▌ | 6899/12384 [14:38:26<11:36:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 1: 56%|█████▌ | 6899/12384 [14:38:33<11:36:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 1: 56%|█████▌ | 6900/12384 [14:38:34<11:35:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 1: 56%|█████▌ | 6900/12384 [14:38:41<11:35:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 56%|█████▌ | 6901/12384 [14:38:41<11:35:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 56%|█████▌ | 6901/12384 [14:38:49<11:35:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 56%|█████▌ | 6902/12384 [14:38:49<11:35:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 56%|█████▌ | 6902/12384 [14:38:56<11:35:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 56%|█████▌ | 6903/12384 [14:38:56<11:34:40, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 56%|█████▌ | 6903/12384 [14:39:04<11:34:40, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 56%|█████▌ | 6904/12384 [14:39:04<11:35:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 56%|█████▌ | 6904/12384 [14:39:12<11:35:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.62s]
Epoch 1: 56%|█████▌ | 6905/12384 [14:39:12<11:35:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.62s]
Epoch 1: 56%|█████▌ | 6905/12384 [14:39:19<11:35:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.87s]
Epoch 1: 56%|█████▌ | 6906/12384 [14:39:19<11:34:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.87s]
Epoch 1: 56%|█████▌ | 6906/12384 [14:39:27<11:34:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 1: 56%|█████▌ | 6907/12384 [14:39:27<11:33:53, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 1: 56%|█████▌ | 6907/12384 [14:39:34<11:33:53, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 56%|█████▌ | 6908/12384 [14:39:34<11:33:35, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 56%|█████▌ | 6908/12384 [14:39:42<11:33:35, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 56%|█████▌ | 6909/12384 [14:39:42<11:33:34, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 56%|█████▌ | 6909/12384 [14:39:50<11:33:34, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 56%|█████▌ | 6910/12384 [14:39:50<11:33:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 56%|█████▌ | 6910/12384 [14:39:57<11:33:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 1: 56%|█████▌ | 6911/12384 [14:39:57<11:35:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 1: 56%|█████▌ | 6911/12384 [14:40:05<11:35:39, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=10.51s]
Epoch 1: 56%|█████▌ | 6912/12384 [14:40:05<11:35:40, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=10.51s]
Epoch 1: 56%|█████▌ | 6912/12384 [14:40:12<11:35:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.38s]
Epoch 1: 56%|█████▌ | 6913/12384 [14:40:12<11:34:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.38s]
Epoch 1: 56%|█████▌ | 6913/12384 [14:40:20<11:34:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.85s]
Epoch 1: 56%|█████▌ | 6914/12384 [14:40:20<11:33:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.85s]
Epoch 1: 56%|█████▌ | 6914/12384 [14:40:28<11:33:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 1: 56%|█████▌ | 6915/12384 [14:40:28<11:34:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 1: 56%|█████▌ | 6915/12384 [14:40:35<11:34:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 1: 56%|█████▌ | 6916/12384 [14:40:35<11:33:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 1: 56%|█████▌ | 6916/12384 [14:40:43<11:33:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 56%|█████▌ | 6917/12384 [14:40:43<11:35:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 56%|█████▌ | 6917/12384 [14:40:51<11:35:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 1: 56%|█████▌ | 6918/12384 [14:40:51<11:34:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 1: 56%|█████▌ | 6918/12384 [14:40:59<11:34:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 56%|█████▌ | 6919/12384 [14:40:59<11:45:10, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 56%|█████▌ | 6919/12384 [14:41:06<11:45:10, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 1: 56%|█████▌ | 6920/12384 [14:41:06<11:41:24, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 1: 56%|█████▌ | 6920/12384 [14:41:14<11:41:24, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 56%|█████▌ | 6921/12384 [14:41:14<11:38:28, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 56%|█████▌ | 6921/12384 [14:41:21<11:38:28, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 1: 56%|█████▌ | 6922/12384 [14:41:21<11:36:56, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 1: 56%|█████▌ | 6922/12384 [14:41:29<11:36:56, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.57s]
Epoch 1: 56%|█████▌ | 6923/12384 [14:41:29<11:35:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.57s]
Epoch 1: 56%|█████▌ | 6923/12384 [14:41:37<11:35:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 1: 56%|█████▌ | 6924/12384 [14:41:37<11:35:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 1: 56%|█████▌ | 6924/12384 [14:41:44<11:35:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.19s]
Epoch 1: 56%|█████▌ | 6925/12384 [14:41:44<11:33:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.19s]
Epoch 1: 56%|█████▌ | 6925/12384 [14:41:52<11:33:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.04s]
Epoch 1: 56%|█████▌ | 6926/12384 [14:41:52<11:32:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.04s]
Epoch 1: 56%|█████▌ | 6926/12384 [14:42:00<11:32:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 56%|█████▌ | 6927/12384 [14:42:00<11:35:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 56%|█████▌ | 6927/12384 [14:42:07<11:35:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 1: 56%|█████▌ | 6928/12384 [14:42:07<11:34:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 1: 56%|█████▌ | 6928/12384 [14:42:15<11:34:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 56%|█████▌ | 6929/12384 [14:42:15<11:35:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 56%|█████▌ | 6929/12384 [14:42:22<11:35:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=3.95s]
Epoch 1: 56%|█████▌ | 6930/12384 [14:42:22<11:34:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.95s]
Epoch 1: 56%|█████▌ | 6930/12384 [14:42:30<11:34:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.26s]
Epoch 1: 56%|█████▌ | 6931/12384 [14:42:30<11:33:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.26s]
Epoch 1: 56%|█████▌ | 6931/12384 [14:42:38<11:33:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 1: 56%|█████▌ | 6932/12384 [14:42:38<11:32:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 1: 56%|█████▌ | 6932/12384 [14:42:45<11:32:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 56%|█████▌ | 6933/12384 [14:42:45<11:32:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 56%|█████▌ | 6933/12384 [14:42:53<11:32:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 56%|█████▌ | 6934/12384 [14:42:53<11:31:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 56%|█████▌ | 6934/12384 [14:43:01<11:31:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 56%|█████▌ | 6935/12384 [14:43:01<11:31:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 56%|█████▌ | 6935/12384 [14:43:08<11:31:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 56%|█████▌ | 6936/12384 [14:43:08<11:30:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 56%|█████▌ | 6936/12384 [14:43:16<11:30:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.89s]
Epoch 1: 56%|█████▌ | 6937/12384 [14:43:16<11:30:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.89s]
Epoch 1: 56%|█████▌ | 6937/12384 [14:43:23<11:30:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 56%|█████▌ | 6938/12384 [14:43:23<11:30:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 56%|█████▌ | 6938/12384 [14:43:31<11:30:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 1: 56%|█████▌ | 6939/12384 [14:43:31<11:28:52, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 1: 56%|█████▌ | 6939/12384 [14:43:38<11:28:52, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=8.98s]
Epoch 1: 56%|█████▌ | 6940/12384 [14:43:38<11:28:47, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=8.98s]
Epoch 1: 56%|█████▌ | 6940/12384 [14:43:46<11:28:47, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 56%|█████▌ | 6941/12384 [14:43:46<11:28:29, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 56%|█████▌ | 6941/12384 [14:43:54<11:28:29, 7.59s/it, loss=0.0002, acc=1.0000, iter_time=7.93s]
Epoch 1: 56%|█████▌ | 6942/12384 [14:43:54<11:29:12, 7.60s/it, loss=0.0002, acc=1.0000, iter_time=7.93s]
Epoch 1: 56%|█████▌ | 6942/12384 [14:44:01<11:29:12, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 56%|█████▌ | 6943/12384 [14:44:01<11:29:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 56%|█████▌ | 6943/12384 [14:44:09<11:29:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.64s]
Epoch 1: 56%|█████▌ | 6944/12384 [14:44:09<11:30:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.64s]
Epoch 1: 56%|█████▌ | 6944/12384 [14:44:17<11:30:07, 7.61s/it, loss=0.0011, acc=0.9948, iter_time=7.59s]
Epoch 1: 56%|█████▌ | 6945/12384 [14:44:17<11:38:48, 7.71s/it, loss=0.0011, acc=0.9948, iter_time=7.59s]
Epoch 1: 56%|█████▌ | 6945/12384 [14:44:25<11:38:48, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 56%|█████▌ | 6946/12384 [14:44:25<11:37:40, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 56%|█████▌ | 6946/12384 [14:44:32<11:37:40, 7.70s/it, loss=0.0002, acc=0.9988, iter_time=7.65s]
Epoch 1: 56%|█████▌ | 6947/12384 [14:44:32<11:34:46, 7.67s/it, loss=0.0002, acc=0.9988, iter_time=7.65s]
Epoch 1: 56%|█████▌ | 6947/12384 [14:44:40<11:34:46, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 56%|█████▌ | 6948/12384 [14:44:40<11:32:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 56%|█████▌ | 6948/12384 [14:44:47<11:32:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 56%|█████▌ | 6949/12384 [14:44:47<11:31:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 56%|█████▌ | 6949/12384 [14:44:55<11:31:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.60s]
Epoch 1: 56%|█████▌ | 6950/12384 [14:44:55<11:31:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.60s]
Epoch 1: 56%|█████▌ | 6950/12384 [14:45:03<11:31:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.19s]
Epoch 1: 56%|█████▌ | 6951/12384 [14:45:03<11:30:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.19s]
Epoch 1: 56%|█████▌ | 6951/12384 [14:45:10<11:30:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 1: 56%|█████▌ | 6952/12384 [14:45:10<11:30:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 1: 56%|█████▌ | 6952/12384 [14:45:18<11:30:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.30s]
Epoch 1: 56%|█████▌ | 6953/12384 [14:45:18<11:30:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.30s]
Epoch 1: 56%|█████▌ | 6953/12384 [14:45:25<11:30:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 56%|█████▌ | 6954/12384 [14:45:25<11:29:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 56%|█████▌ | 6954/12384 [14:45:33<11:29:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 1: 56%|█████▌ | 6955/12384 [14:45:33<11:28:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 1: 56%|█████▌ | 6955/12384 [14:45:41<11:28:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 56%|█████▌ | 6956/12384 [14:45:41<11:28:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 56%|█████▌ | 6956/12384 [14:45:48<11:28:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 56%|█████▌ | 6957/12384 [14:45:48<11:28:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 56%|█████▌ | 6957/12384 [14:45:56<11:28:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 56%|█████▌ | 6958/12384 [14:45:56<11:28:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 56%|█████▌ | 6958/12384 [14:46:03<11:28:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 1: 56%|█████▌ | 6959/12384 [14:46:03<11:27:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 1: 56%|█████▌ | 6959/12384 [14:46:11<11:27:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.81s]
Epoch 1: 56%|█████▌ | 6960/12384 [14:46:11<11:27:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.81s]
Epoch 1: 56%|█████▌ | 6960/12384 [14:46:19<11:27:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 56%|█████▌ | 6961/12384 [14:46:19<11:27:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 56%|█████▌ | 6961/12384 [14:46:26<11:27:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 56%|█████▌ | 6962/12384 [14:46:26<11:28:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 56%|█████▌ | 6962/12384 [14:46:34<11:28:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 56%|█████▌ | 6963/12384 [14:46:34<11:28:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 56%|█████▌ | 6963/12384 [14:46:42<11:28:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 56%|█████▌ | 6964/12384 [14:46:42<11:28:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 56%|█████▌ | 6964/12384 [14:46:49<11:28:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 56%|█████▌ | 6965/12384 [14:46:49<11:27:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 56%|█████▌ | 6965/12384 [14:46:57<11:27:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 1: 56%|█████▋ | 6966/12384 [14:46:57<11:30:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 1: 56%|█████▋ | 6966/12384 [14:47:05<11:30:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.64s]
Epoch 1: 56%|█████▋ | 6967/12384 [14:47:05<11:29:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.64s]
Epoch 1: 56%|█████▋ | 6967/12384 [14:47:12<11:29:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 1: 56%|█████▋ | 6968/12384 [14:47:12<11:30:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 1: 56%|█████▋ | 6968/12384 [14:47:20<11:30:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=3.93s]
Epoch 1: 56%|█████▋ | 6969/12384 [14:47:20<11:29:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.93s]
Epoch 1: 56%|█████▋ | 6969/12384 [14:47:27<11:29:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.55s]
Epoch 1: 56%|█████▋ | 6970/12384 [14:47:27<11:28:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.55s]
Epoch 1: 56%|█████▋ | 6970/12384 [14:47:35<11:28:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.85s]
Epoch 1: 56%|█████▋ | 6971/12384 [14:47:35<11:37:15, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.85s]
Epoch 1: 56%|█████▋ | 6971/12384 [14:47:43<11:37:15, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=10.50s]
Epoch 1: 56%|█████▋ | 6972/12384 [14:47:43<11:33:22, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.50s]
Epoch 1: 56%|█████▋ | 6972/12384 [14:47:51<11:33:22, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 56%|█████▋ | 6973/12384 [14:47:51<11:30:47, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 56%|█████▋ | 6973/12384 [14:47:58<11:30:47, 7.66s/it, loss=0.0002, acc=0.9993, iter_time=5.04s]
Epoch 1: 56%|█████▋ | 6974/12384 [14:47:58<11:28:39, 7.64s/it, loss=0.0002, acc=0.9993, iter_time=5.04s]
Epoch 1: 56%|█████▋ | 6974/12384 [14:48:06<11:28:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.94s]
Epoch 1: 56%|█████▋ | 6975/12384 [14:48:06<11:27:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.94s]
Epoch 1: 56%|█████▋ | 6975/12384 [14:48:13<11:27:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 1: 56%|█████▋ | 6976/12384 [14:48:13<11:27:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 1: 56%|█████▋ | 6976/12384 [14:48:21<11:27:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.88s]
Epoch 1: 56%|█████▋ | 6977/12384 [14:48:21<11:26:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.88s]
Epoch 1: 56%|█████▋ | 6977/12384 [14:48:29<11:26:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 1: 56%|█████▋ | 6978/12384 [14:48:29<11:25:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 1: 56%|█████▋ | 6978/12384 [14:48:36<11:25:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 56%|█████▋ | 6979/12384 [14:48:36<11:25:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 56%|█████▋ | 6979/12384 [14:48:44<11:25:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 1: 56%|█████▋ | 6980/12384 [14:48:44<11:25:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 1: 56%|█████▋ | 6980/12384 [14:48:51<11:25:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 56%|█████▋ | 6981/12384 [14:48:51<11:26:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 56%|█████▋ | 6981/12384 [14:48:59<11:26:01, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.34s]
Epoch 1: 56%|█████▋ | 6982/12384 [14:48:59<11:25:34, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.34s]
Epoch 1: 56%|█████▋ | 6982/12384 [14:49:07<11:25:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 1: 56%|█████▋ | 6983/12384 [14:49:07<11:25:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 1: 56%|█████▋ | 6983/12384 [14:49:14<11:25:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 56%|█████▋ | 6984/12384 [14:49:14<11:25:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 56%|█████▋ | 6984/12384 [14:49:22<11:25:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 56%|█████▋ | 6985/12384 [14:49:22<11:25:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 56%|█████▋ | 6985/12384 [14:49:29<11:25:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 56%|█████▋ | 6986/12384 [14:49:29<11:24:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 56%|█████▋ | 6986/12384 [14:49:37<11:24:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 56%|█████▋ | 6987/12384 [14:49:37<11:24:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 56%|█████▋ | 6987/12384 [14:49:45<11:24:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 56%|█████▋ | 6988/12384 [14:49:45<11:23:52, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 56%|█████▋ | 6988/12384 [14:49:52<11:23:52, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 56%|█████▋ | 6989/12384 [14:49:52<11:23:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 56%|█████▋ | 6989/12384 [14:50:00<11:23:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 56%|█████▋ | 6990/12384 [14:50:00<11:24:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 56%|█████▋ | 6990/12384 [14:50:08<11:24:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.28s]
Epoch 1: 56%|█████▋ | 6991/12384 [14:50:08<11:24:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.28s]
Epoch 1: 56%|█████▋ | 6991/12384 [14:50:15<11:24:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.37s]
Epoch 1: 56%|█████▋ | 6992/12384 [14:50:15<11:26:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.37s]
Epoch 1: 56%|█████▋ | 6992/12384 [14:50:23<11:26:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.76s]
Epoch 1: 56%|█████▋ | 6993/12384 [14:50:23<11:26:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.76s]
Epoch 1: 56%|█████▋ | 6993/12384 [14:50:31<11:26:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.15s]
Epoch 1: 56%|█████▋ | 6994/12384 [14:50:31<11:25:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.15s]
Epoch 1: 56%|█████▋ | 6994/12384 [14:50:38<11:25:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.33s]
Epoch 1: 56%|█████▋ | 6995/12384 [14:50:38<11:26:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.33s]
Epoch 1: 56%|█████▋ | 6995/12384 [14:50:46<11:26:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.96s]
Epoch 1: 56%|█████▋ | 6996/12384 [14:50:46<11:25:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.96s]
Epoch 1: 56%|█████▋ | 6996/12384 [14:50:54<11:25:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 57%|█████▋ | 6997/12384 [14:50:54<11:33:36, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 57%|█████▋ | 6997/12384 [14:51:01<11:33:36, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 1: 57%|█████▋ | 6998/12384 [14:51:01<11:33:55, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 1: 57%|█████▋ | 6998/12384 [14:51:09<11:33:55, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=10.55s]
Epoch 1: 57%|█████▋ | 6999/12384 [14:51:09<11:30:58, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.55s]
Epoch 1: 57%|█████▋ | 6999/12384 [14:51:17<11:30:58, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 57%|█████▋ | 7000/12384 [14:51:17<11:27:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 57%|█████▋ | 7000/12384 [14:51:24<11:27:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 1: 57%|█████▋ | 7001/12384 [14:51:24<11:26:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 1: 57%|█████▋ | 7001/12384 [14:51:32<11:26:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 57%|█████▋ | 7002/12384 [14:51:32<11:25:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 57%|█████▋ | 7002/12384 [14:51:40<11:25:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 57%|█████▋ | 7003/12384 [14:51:40<11:24:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 57%|█████▋ | 7003/12384 [14:51:47<11:24:30, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.65s]
Epoch 1: 57%|█████▋ | 7004/12384 [14:51:47<11:23:53, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.65s]
Epoch 1: 57%|█████▋ | 7004/12384 [14:51:55<11:23:53, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=10.14s]
Epoch 1: 57%|█████▋ | 7005/12384 [14:51:55<11:23:33, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.14s]
Epoch 1: 57%|█████▋ | 7005/12384 [14:52:02<11:23:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 57%|█████▋ | 7006/12384 [14:52:02<11:23:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 57%|█████▋ | 7006/12384 [14:52:10<11:23:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 1: 57%|█████▋ | 7007/12384 [14:52:10<11:22:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 1: 57%|█████▋ | 7007/12384 [14:52:18<11:22:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 1: 57%|█████▋ | 7008/12384 [14:52:18<11:22:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 1: 57%|█████▋ | 7008/12384 [14:52:25<11:22:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 1: 57%|█████▋ | 7009/12384 [14:52:25<11:21:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 1: 57%|█████▋ | 7009/12384 [14:52:33<11:21:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 57%|█████▋ | 7010/12384 [14:52:33<11:21:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 57%|█████▋ | 7010/12384 [14:52:40<11:21:50, 7.61s/it, loss=0.0006, acc=0.9987, iter_time=6.82s]
Epoch 1: 57%|█████▋ | 7011/12384 [14:52:40<11:21:49, 7.61s/it, loss=0.0006, acc=0.9987, iter_time=6.82s]
Epoch 1: 57%|█████▋ | 7011/12384 [14:52:48<11:21:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 1: 57%|█████▋ | 7012/12384 [14:52:48<11:21:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 1: 57%|█████▋ | 7012/12384 [14:52:56<11:21:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 57%|█████▋ | 7013/12384 [14:52:56<11:21:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 57%|█████▋ | 7013/12384 [14:53:03<11:21:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 1: 57%|█████▋ | 7014/12384 [14:53:03<11:21:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 1: 57%|█████▋ | 7014/12384 [14:53:11<11:21:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 1: 57%|█████▋ | 7015/12384 [14:53:11<11:21:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 1: 57%|█████▋ | 7015/12384 [14:53:18<11:21:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.62s]
Epoch 1: 57%|█████▋ | 7016/12384 [14:53:19<11:21:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.62s]
Epoch 1: 57%|█████▋ | 7016/12384 [14:53:26<11:21:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 57%|█████▋ | 7017/12384 [14:53:26<11:21:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 57%|█████▋ | 7017/12384 [14:53:34<11:21:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 57%|█████▋ | 7018/12384 [14:53:34<11:20:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 57%|█████▋ | 7018/12384 [14:53:41<11:20:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 1: 57%|█████▋ | 7019/12384 [14:53:41<11:22:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 1: 57%|█████▋ | 7019/12384 [14:53:49<11:22:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 1: 57%|█████▋ | 7020/12384 [14:53:49<11:22:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 1: 57%|█████▋ | 7020/12384 [14:53:57<11:22:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 57%|█████▋ | 7021/12384 [14:53:57<11:21:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 57%|█████▋ | 7021/12384 [14:54:04<11:21:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.89s]
Epoch 1: 57%|█████▋ | 7022/12384 [14:54:04<11:21:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.89s]
Epoch 1: 57%|█████▋ | 7022/12384 [14:54:12<11:21:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 1: 57%|█████▋ | 7023/12384 [14:54:12<11:20:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 1: 57%|█████▋ | 7023/12384 [14:54:20<11:20:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.39s]
Epoch 1: 57%|█████▋ | 7024/12384 [14:54:20<11:28:53, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=11.39s]
Epoch 1: 57%|█████▋ | 7024/12384 [14:54:27<11:28:53, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 1: 57%|█████▋ | 7025/12384 [14:54:27<11:26:44, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 1: 57%|█████▋ | 7025/12384 [14:54:35<11:26:44, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 1: 57%|█████▋ | 7026/12384 [14:54:35<11:25:03, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 1: 57%|█████▋ | 7026/12384 [14:54:43<11:25:03, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 57%|█████▋ | 7027/12384 [14:54:43<11:25:53, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 57%|█████▋ | 7027/12384 [14:54:50<11:25:53, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 1: 57%|█████▋ | 7028/12384 [14:54:50<11:24:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 1: 57%|█████▋ | 7028/12384 [14:54:58<11:24:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 1: 57%|█████▋ | 7029/12384 [14:54:58<11:22:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 1: 57%|█████▋ | 7029/12384 [14:55:06<11:22:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.16s]
Epoch 1: 57%|█████▋ | 7030/12384 [14:55:06<11:22:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.16s]
Epoch 1: 57%|█████▋ | 7030/12384 [14:55:13<11:22:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 57%|█████▋ | 7031/12384 [14:55:13<11:21:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 57%|█████▋ | 7031/12384 [14:55:21<11:21:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 1: 57%|█████▋ | 7032/12384 [14:55:21<11:21:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 1: 57%|█████▋ | 7032/12384 [14:55:29<11:21:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 57%|█████▋ | 7033/12384 [14:55:29<11:20:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 57%|█████▋ | 7033/12384 [14:55:36<11:20:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 1: 57%|█████▋ | 7034/12384 [14:55:36<11:19:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 1: 57%|█████▋ | 7034/12384 [14:55:44<11:19:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 57%|█████▋ | 7035/12384 [14:55:44<11:19:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 57%|█████▋ | 7035/12384 [14:55:51<11:19:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 1: 57%|█████▋ | 7036/12384 [14:55:51<11:19:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 1: 57%|█████▋ | 7036/12384 [14:55:59<11:19:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.46s]
Epoch 1: 57%|█████▋ | 7037/12384 [14:55:59<11:19:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.46s]
Epoch 1: 57%|█████▋ | 7037/12384 [14:56:07<11:19:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 57%|█████▋ | 7038/12384 [14:56:07<11:18:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 57%|█████▋ | 7038/12384 [14:56:14<11:18:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 1: 57%|█████▋ | 7039/12384 [14:56:14<11:17:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 1: 57%|█████▋ | 7039/12384 [14:56:22<11:17:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 1: 57%|█████▋ | 7040/12384 [14:56:22<11:18:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 1: 57%|█████▋ | 7040/12384 [14:56:29<11:18:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 1: 57%|█████▋ | 7041/12384 [14:56:29<11:17:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 1: 57%|█████▋ | 7041/12384 [14:56:37<11:17:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 1: 57%|█████▋ | 7042/12384 [14:56:37<11:17:04, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 1: 57%|█████▋ | 7042/12384 [14:56:45<11:17:04, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 57%|█████▋ | 7043/12384 [14:56:45<11:17:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 57%|█████▋ | 7043/12384 [14:56:52<11:17:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 1: 57%|█████▋ | 7044/12384 [14:56:52<11:18:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 1: 57%|█████▋ | 7044/12384 [14:57:00<11:18:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 1: 57%|█████▋ | 7045/12384 [14:57:00<11:17:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 1: 57%|█████▋ | 7045/12384 [14:57:08<11:17:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 1: 57%|█████▋ | 7046/12384 [14:57:08<11:19:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 1: 57%|█████▋ | 7046/12384 [14:57:15<11:19:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.57s]
Epoch 1: 57%|█████▋ | 7047/12384 [14:57:15<11:18:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.57s]
Epoch 1: 57%|█████▋ | 7047/12384 [14:57:23<11:18:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 57%|█████▋ | 7048/12384 [14:57:23<11:18:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 57%|█████▋ | 7048/12384 [14:57:30<11:18:51, 7.63s/it, loss=0.0002, acc=0.9998, iter_time=7.65s]
Epoch 1: 57%|█████▋ | 7049/12384 [14:57:30<11:17:55, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=7.65s]
Epoch 1: 57%|█████▋ | 7049/12384 [14:57:38<11:17:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 57%|█████▋ | 7050/12384 [14:57:38<11:26:00, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 57%|█████▋ | 7050/12384 [14:57:46<11:26:00, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 57%|█████▋ | 7051/12384 [14:57:46<11:24:15, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 57%|█████▋ | 7051/12384 [14:57:54<11:24:15, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 57%|█████▋ | 7052/12384 [14:57:54<11:22:10, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 57%|█████▋ | 7052/12384 [14:58:01<11:22:10, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 57%|█████▋ | 7053/12384 [14:58:01<11:21:39, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 57%|█████▋ | 7053/12384 [14:58:09<11:21:39, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 57%|█████▋ | 7054/12384 [14:58:09<11:20:04, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 57%|█████▋ | 7054/12384 [14:58:17<11:20:04, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 57%|█████▋ | 7055/12384 [14:58:17<11:26:38, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 57%|█████▋ | 7055/12384 [14:58:24<11:26:38, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 57%|█████▋ | 7056/12384 [14:58:24<11:22:53, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 57%|█████▋ | 7056/12384 [14:58:32<11:22:53, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 1: 57%|█████▋ | 7057/12384 [14:58:32<11:20:10, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 1: 57%|█████▋ | 7057/12384 [14:58:40<11:20:10, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.67s]
Epoch 1: 57%|█████▋ | 7058/12384 [14:58:40<11:20:40, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.67s]
Epoch 1: 57%|█████▋ | 7058/12384 [14:58:47<11:20:40, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.71s]
Epoch 1: 57%|█████▋ | 7059/12384 [14:58:47<11:18:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.71s]
Epoch 1: 57%|█████▋ | 7059/12384 [14:58:55<11:18:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.45s]
Epoch 1: 57%|█████▋ | 7060/12384 [14:58:55<11:18:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.45s]
Epoch 1: 57%|█████▋ | 7060/12384 [14:59:03<11:18:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.77s]
Epoch 1: 57%|█████▋ | 7061/12384 [14:59:03<11:16:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.77s]
Epoch 1: 57%|█████▋ | 7061/12384 [14:59:10<11:16:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 1: 57%|█████▋ | 7062/12384 [14:59:10<11:15:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 1: 57%|█████▋ | 7062/12384 [14:59:18<11:15:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 1: 57%|█████▋ | 7063/12384 [14:59:18<11:16:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 1: 57%|█████▋ | 7063/12384 [14:59:25<11:16:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 57%|█████▋ | 7064/12384 [14:59:25<11:15:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 57%|█████▋ | 7064/12384 [14:59:33<11:15:24, 7.62s/it, loss=0.0004, acc=0.9992, iter_time=7.21s]
Epoch 1: 57%|█████▋ | 7065/12384 [14:59:33<11:14:47, 7.61s/it, loss=0.0004, acc=0.9992, iter_time=7.21s]
Epoch 1: 57%|█████▋ | 7065/12384 [14:59:41<11:14:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 57%|█████▋ | 7066/12384 [14:59:41<11:14:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 57%|█████▋ | 7066/12384 [14:59:48<11:14:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 57%|█████▋ | 7067/12384 [14:59:48<11:14:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 57%|█████▋ | 7067/12384 [14:59:56<11:14:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 1: 57%|█████▋ | 7068/12384 [14:59:56<11:14:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 1: 57%|█████▋ | 7068/12384 [15:00:03<11:14:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.93s]
Epoch 1: 57%|█████▋ | 7069/12384 [15:00:03<11:14:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.93s]
Epoch 1: 57%|█████▋ | 7069/12384 [15:00:11<11:14:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 1: 57%|█████▋ | 7070/12384 [15:00:11<11:13:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 1: 57%|█████▋ | 7070/12384 [15:00:19<11:13:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 57%|█████▋ | 7071/12384 [15:00:19<11:13:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 57%|█████▋ | 7071/12384 [15:00:26<11:13:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 57%|█████▋ | 7072/12384 [15:00:26<11:15:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 57%|█████▋ | 7072/12384 [15:00:34<11:15:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 57%|█████▋ | 7073/12384 [15:00:34<11:14:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 57%|█████▋ | 7073/12384 [15:00:41<11:14:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 57%|█████▋ | 7074/12384 [15:00:41<11:13:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 57%|█████▋ | 7074/12384 [15:00:49<11:13:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.00s]
Epoch 1: 57%|█████▋ | 7075/12384 [15:00:49<11:13:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.00s]
Epoch 1: 57%|█████▋ | 7075/12384 [15:00:57<11:13:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 1: 57%|█████▋ | 7076/12384 [15:00:57<11:13:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 1: 57%|█████▋ | 7076/12384 [15:01:05<11:13:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 1: 57%|█████▋ | 7077/12384 [15:01:05<11:21:05, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 1: 57%|█████▋ | 7077/12384 [15:01:12<11:21:05, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 1: 57%|█████▋ | 7078/12384 [15:01:12<11:18:07, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 1: 57%|█████▋ | 7078/12384 [15:01:20<11:18:07, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.62s]
Epoch 1: 57%|█████▋ | 7079/12384 [15:01:20<11:18:50, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.62s]
Epoch 1: 57%|█████▋ | 7079/12384 [15:01:28<11:18:50, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 57%|█████▋ | 7080/12384 [15:01:28<11:17:52, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 57%|█████▋ | 7080/12384 [15:01:35<11:17:52, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 57%|█████▋ | 7081/12384 [15:01:35<11:23:21, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 57%|█████▋ | 7081/12384 [15:01:43<11:23:21, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 57%|█████▋ | 7082/12384 [15:01:43<11:21:52, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 57%|█████▋ | 7082/12384 [15:01:51<11:21:52, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 57%|█████▋ | 7083/12384 [15:01:51<11:19:20, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 57%|█████▋ | 7083/12384 [15:01:58<11:19:20, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 57%|█████▋ | 7084/12384 [15:01:58<11:17:42, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 57%|█████▋ | 7084/12384 [15:02:06<11:17:42, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 1: 57%|█████▋ | 7085/12384 [15:02:06<11:16:07, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 1: 57%|█████▋ | 7085/12384 [15:02:14<11:16:07, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.55s]
Epoch 1: 57%|█████▋ | 7086/12384 [15:02:14<11:15:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.55s]
Epoch 1: 57%|█████▋ | 7086/12384 [15:02:21<11:15:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.23s]
Epoch 1: 57%|█████▋ | 7087/12384 [15:02:21<11:14:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.23s]
Epoch 1: 57%|█████▋ | 7087/12384 [15:02:29<11:14:16, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=11.62s]
Epoch 1: 57%|█████▋ | 7088/12384 [15:02:29<11:13:28, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=11.62s]
Epoch 1: 57%|█████▋ | 7088/12384 [15:02:36<11:13:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 57%|█████▋ | 7089/12384 [15:02:36<11:13:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 57%|█████▋ | 7089/12384 [15:02:44<11:13:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 57%|█████▋ | 7090/12384 [15:02:44<11:14:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 57%|█████▋ | 7090/12384 [15:02:52<11:14:40, 7.65s/it, loss=0.0001, acc=0.9992, iter_time=7.98s]
Epoch 1: 57%|█████▋ | 7091/12384 [15:02:52<11:13:56, 7.64s/it, loss=0.0001, acc=0.9992, iter_time=7.98s]
Epoch 1: 57%|█████▋ | 7091/12384 [15:02:59<11:13:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 57%|█████▋ | 7092/12384 [15:02:59<11:12:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 57%|█████▋ | 7092/12384 [15:03:07<11:12:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 57%|█████▋ | 7093/12384 [15:03:07<11:12:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 57%|█████▋ | 7093/12384 [15:03:15<11:12:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 57%|█████▋ | 7094/12384 [15:03:15<11:12:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 57%|█████▋ | 7094/12384 [15:03:22<11:12:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 1: 57%|█████▋ | 7095/12384 [15:03:22<11:11:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 1: 57%|█████▋ | 7095/12384 [15:03:30<11:11:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.12s]
Epoch 1: 57%|█████▋ | 7096/12384 [15:03:30<11:11:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.12s]
Epoch 1: 57%|█████▋ | 7096/12384 [15:03:37<11:11:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 57%|█████▋ | 7097/12384 [15:03:37<11:11:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 57%|█████▋ | 7097/12384 [15:03:45<11:11:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 57%|█████▋ | 7098/12384 [15:03:45<11:11:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 57%|█████▋ | 7098/12384 [15:03:53<11:11:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 57%|█████▋ | 7099/12384 [15:03:53<11:10:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 57%|█████▋ | 7099/12384 [15:04:00<11:10:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 57%|█████▋ | 7100/12384 [15:04:00<11:11:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 57%|█████▋ | 7100/12384 [15:04:08<11:11:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 57%|█████▋ | 7101/12384 [15:04:08<11:10:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 57%|█████▋ | 7101/12384 [15:04:16<11:10:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 57%|█████▋ | 7102/12384 [15:04:16<11:11:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 57%|█████▋ | 7102/12384 [15:04:23<11:11:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 57%|█████▋ | 7103/12384 [15:04:23<11:18:28, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 57%|█████▋ | 7103/12384 [15:04:31<11:18:28, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 1: 57%|█████▋ | 7104/12384 [15:04:31<11:17:17, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 1: 57%|█████▋ | 7104/12384 [15:04:39<11:17:17, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.13s]
Epoch 1: 57%|█████▋ | 7105/12384 [15:04:39<11:14:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.13s]
Epoch 1: 57%|█████▋ | 7105/12384 [15:04:46<11:14:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.72s]
Epoch 1: 57%|█████▋ | 7106/12384 [15:04:46<11:13:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.72s]
Epoch 1: 57%|█████▋ | 7106/12384 [15:04:54<11:13:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 1: 57%|█████▋ | 7107/12384 [15:04:54<11:11:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 1: 57%|█████▋ | 7107/12384 [15:05:02<11:11:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 57%|█████▋ | 7108/12384 [15:05:02<11:10:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 57%|█████▋ | 7108/12384 [15:05:09<11:10:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 1: 57%|█████▋ | 7109/12384 [15:05:09<11:10:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 1: 57%|█████▋ | 7109/12384 [15:05:17<11:10:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 57%|█████▋ | 7110/12384 [15:05:17<11:10:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 57%|█████▋ | 7110/12384 [15:05:24<11:10:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 1: 57%|█████▋ | 7111/12384 [15:05:24<11:10:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 1: 57%|█████▋ | 7111/12384 [15:05:32<11:10:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 57%|█████▋ | 7112/12384 [15:05:32<11:10:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 57%|█████▋ | 7112/12384 [15:05:40<11:10:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 57%|█████▋ | 7113/12384 [15:05:40<11:09:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 57%|█████▋ | 7113/12384 [15:05:47<11:09:49, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=5.01s]
Epoch 1: 57%|█████▋ | 7114/12384 [15:05:47<11:09:37, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=5.01s]
Epoch 1: 57%|█████▋ | 7114/12384 [15:05:55<11:09:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.25s]
Epoch 1: 57%|█████▋ | 7115/12384 [15:05:55<11:08:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.25s]
Epoch 1: 57%|█████▋ | 7115/12384 [15:06:03<11:08:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 57%|█████▋ | 7116/12384 [15:06:03<11:13:47, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 57%|█████▋ | 7116/12384 [15:06:10<11:13:47, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 1: 57%|█████▋ | 7117/12384 [15:06:10<11:11:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 1: 57%|█████▋ | 7117/12384 [15:06:18<11:11:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.03s]
Epoch 1: 57%|█████▋ | 7118/12384 [15:06:18<11:11:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.03s]
Epoch 1: 57%|█████▋ | 7118/12384 [15:06:26<11:11:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.69s]
Epoch 1: 57%|█████▋ | 7119/12384 [15:06:26<11:10:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.69s]
Epoch 1: 57%|█████▋ | 7119/12384 [15:06:33<11:10:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.12s]
Epoch 1: 57%|█████▋ | 7120/12384 [15:06:33<11:10:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.12s]
Epoch 1: 57%|█████▋ | 7120/12384 [15:06:41<11:10:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 58%|█████▊ | 7121/12384 [15:06:41<11:09:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 58%|█████▊ | 7121/12384 [15:06:48<11:09:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 58%|█████▊ | 7122/12384 [15:06:48<11:08:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 58%|█████▊ | 7122/12384 [15:06:56<11:08:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 58%|█████▊ | 7123/12384 [15:06:56<11:08:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 58%|█████▊ | 7123/12384 [15:07:04<11:08:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.64s]
Epoch 1: 58%|█████▊ | 7124/12384 [15:07:04<11:07:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.64s]
Epoch 1: 58%|█████▊ | 7124/12384 [15:07:11<11:07:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 1: 58%|█████▊ | 7125/12384 [15:07:11<11:08:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 1: 58%|█████▊ | 7125/12384 [15:07:19<11:08:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.94s]
Epoch 1: 58%|█████▊ | 7126/12384 [15:07:19<11:07:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.94s]
Epoch 1: 58%|█████▊ | 7126/12384 [15:07:27<11:07:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 1: 58%|█████▊ | 7127/12384 [15:07:27<11:10:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 1: 58%|█████▊ | 7127/12384 [15:07:34<11:10:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 1: 58%|█████▊ | 7128/12384 [15:07:34<11:10:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 1: 58%|█████▊ | 7128/12384 [15:07:42<11:10:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 1: 58%|█████▊ | 7129/12384 [15:07:42<11:16:56, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 1: 58%|█████▊ | 7129/12384 [15:07:50<11:16:56, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 58%|█████▊ | 7130/12384 [15:07:50<11:13:29, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 58%|█████▊ | 7130/12384 [15:07:57<11:13:29, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 58%|█████▊ | 7131/12384 [15:07:57<11:11:23, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 58%|█████▊ | 7131/12384 [15:08:05<11:11:23, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 58%|█████▊ | 7132/12384 [15:08:05<11:11:12, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 58%|█████▊ | 7132/12384 [15:08:13<11:11:12, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 58%|█████▊ | 7133/12384 [15:08:13<11:09:58, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 58%|█████▊ | 7133/12384 [15:08:21<11:09:58, 7.66s/it, loss=0.0001, acc=0.9994, iter_time=7.92s]
Epoch 1: 58%|█████▊ | 7134/12384 [15:08:21<11:16:16, 7.73s/it, loss=0.0001, acc=0.9994, iter_time=7.92s]
Epoch 1: 58%|█████▊ | 7134/12384 [15:08:28<11:16:16, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 58%|█████▊ | 7135/12384 [15:08:28<11:13:27, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 58%|█████▊ | 7135/12384 [15:08:36<11:13:27, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 58%|█████▊ | 7136/12384 [15:08:36<11:11:09, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 58%|█████▊ | 7136/12384 [15:08:43<11:11:09, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 58%|█████▊ | 7137/12384 [15:08:43<11:09:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 58%|█████▊ | 7137/12384 [15:08:51<11:09:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 1: 58%|█████▊ | 7138/12384 [15:08:51<11:07:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 1: 58%|█████▊ | 7138/12384 [15:08:59<11:07:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 1: 58%|█████▊ | 7139/12384 [15:08:59<11:07:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 1: 58%|█████▊ | 7139/12384 [15:09:06<11:07:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 1: 58%|█████▊ | 7140/12384 [15:09:06<11:05:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 1: 58%|█████▊ | 7140/12384 [15:09:14<11:05:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 1: 58%|█████▊ | 7141/12384 [15:09:14<11:05:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 1: 58%|█████▊ | 7141/12384 [15:09:21<11:05:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 1: 58%|█████▊ | 7142/12384 [15:09:21<11:04:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 1: 58%|█████▊ | 7142/12384 [15:09:29<11:04:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 58%|█████▊ | 7143/12384 [15:09:29<11:04:17, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 58%|█████▊ | 7143/12384 [15:09:37<11:04:17, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.70s]
Epoch 1: 58%|█████▊ | 7144/12384 [15:09:37<11:04:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.70s]
Epoch 1: 58%|█████▊ | 7144/12384 [15:09:44<11:04:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 1: 58%|█████▊ | 7145/12384 [15:09:44<11:03:50, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 1: 58%|█████▊ | 7145/12384 [15:09:52<11:03:50, 7.60s/it, loss=0.0007, acc=0.9983, iter_time=9.08s]
Epoch 1: 58%|█████▊ | 7146/12384 [15:09:52<11:04:06, 7.61s/it, loss=0.0007, acc=0.9983, iter_time=9.08s]
Epoch 1: 58%|█████▊ | 7146/12384 [15:09:59<11:04:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 58%|█████▊ | 7147/12384 [15:09:59<11:03:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 58%|█████▊ | 7147/12384 [15:10:07<11:03:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 1: 58%|█████▊ | 7148/12384 [15:10:07<11:03:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 1: 58%|█████▊ | 7148/12384 [15:10:15<11:03:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 1: 58%|█████▊ | 7149/12384 [15:10:15<11:02:54, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 1: 58%|█████▊ | 7149/12384 [15:10:22<11:02:54, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 58%|█████▊ | 7150/12384 [15:10:22<11:03:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 58%|█████▊ | 7150/12384 [15:10:30<11:03:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 1: 58%|█████▊ | 7151/12384 [15:10:30<11:03:10, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 1: 58%|█████▊ | 7151/12384 [15:10:37<11:03:10, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 58%|█████▊ | 7152/12384 [15:10:37<11:03:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 58%|█████▊ | 7152/12384 [15:10:45<11:03:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 58%|█████▊ | 7153/12384 [15:10:45<11:02:45, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 58%|█████▊ | 7153/12384 [15:10:53<11:02:45, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 1: 58%|█████▊ | 7154/12384 [15:10:53<11:02:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 1: 58%|█████▊ | 7154/12384 [15:11:01<11:02:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 1: 58%|█████▊ | 7155/12384 [15:11:01<11:10:50, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 1: 58%|█████▊ | 7155/12384 [15:11:08<11:10:50, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 58%|█████▊ | 7156/12384 [15:11:08<11:08:28, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 58%|█████▊ | 7156/12384 [15:11:16<11:08:28, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 58%|█████▊ | 7157/12384 [15:11:16<11:07:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 58%|█████▊ | 7157/12384 [15:11:23<11:07:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.59s]
Epoch 1: 58%|█████▊ | 7158/12384 [15:11:23<11:06:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.59s]
Epoch 1: 58%|█████▊ | 7158/12384 [15:11:31<11:06:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 1: 58%|█████▊ | 7159/12384 [15:11:31<11:05:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 1: 58%|█████▊ | 7159/12384 [15:11:39<11:05:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.84s]
Epoch 1: 58%|█████▊ | 7160/12384 [15:11:39<11:03:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.84s]
Epoch 1: 58%|█████▊ | 7160/12384 [15:11:47<11:03:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.49s]
Epoch 1: 58%|█████▊ | 7161/12384 [15:11:47<11:10:06, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.49s]
Epoch 1: 58%|█████▊ | 7161/12384 [15:11:54<11:10:06, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 1: 58%|█████▊ | 7162/12384 [15:11:54<11:07:46, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 1: 58%|█████▊ | 7162/12384 [15:12:02<11:07:46, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.16s]
Epoch 1: 58%|█████▊ | 7163/12384 [15:12:02<11:06:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.16s]
Epoch 1: 58%|█████▊ | 7163/12384 [15:12:09<11:06:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 58%|█████▊ | 7164/12384 [15:12:09<11:05:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 58%|█████▊ | 7164/12384 [15:12:17<11:05:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 1: 58%|█████▊ | 7165/12384 [15:12:17<11:06:40, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 1: 58%|█████▊ | 7165/12384 [15:12:25<11:06:40, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 58%|█████▊ | 7166/12384 [15:12:25<11:05:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 58%|█████▊ | 7166/12384 [15:12:32<11:05:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 58%|█████▊ | 7167/12384 [15:12:32<11:04:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 58%|█████▊ | 7167/12384 [15:12:40<11:04:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 58%|█████▊ | 7168/12384 [15:12:40<11:03:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 58%|█████▊ | 7168/12384 [15:12:48<11:03:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 58%|█████▊ | 7169/12384 [15:12:48<11:02:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 58%|█████▊ | 7169/12384 [15:12:55<11:02:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 58%|█████▊ | 7170/12384 [15:12:55<11:02:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 58%|█████▊ | 7170/12384 [15:13:03<11:02:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 58%|█████▊ | 7171/12384 [15:13:03<11:01:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 58%|█████▊ | 7171/12384 [15:13:10<11:01:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 58%|█████▊ | 7172/12384 [15:13:10<11:00:34, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 58%|█████▊ | 7172/12384 [15:13:18<11:00:34, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=3.58s]
Epoch 1: 58%|█████▊ | 7173/12384 [15:13:18<11:00:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=3.58s]
Epoch 1: 58%|█████▊ | 7173/12384 [15:13:26<11:00:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.61s]
Epoch 1: 58%|█████▊ | 7174/12384 [15:13:26<11:01:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.61s]
Epoch 1: 58%|█████▊ | 7174/12384 [15:13:33<11:01:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 58%|█████▊ | 7175/12384 [15:13:33<11:01:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 58%|█████▊ | 7175/12384 [15:13:41<11:01:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 58%|█████▊ | 7176/12384 [15:13:41<11:01:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 58%|█████▊ | 7176/12384 [15:13:48<11:01:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 58%|█████▊ | 7177/12384 [15:13:48<11:01:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 58%|█████▊ | 7177/12384 [15:13:56<11:01:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 58%|█████▊ | 7178/12384 [15:13:56<11:00:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 58%|█████▊ | 7178/12384 [15:14:04<11:00:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 1: 58%|█████▊ | 7179/12384 [15:14:04<11:01:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 1: 58%|█████▊ | 7179/12384 [15:14:11<11:01:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 1: 58%|█████▊ | 7180/12384 [15:14:11<11:00:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 1: 58%|█████▊ | 7180/12384 [15:14:19<11:00:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 1: 58%|█████▊ | 7181/12384 [15:14:19<11:09:49, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 1: 58%|█████▊ | 7181/12384 [15:14:27<11:09:49, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 1: 58%|█████▊ | 7182/12384 [15:14:27<11:06:54, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 1: 58%|█████▊ | 7182/12384 [15:14:35<11:06:54, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 58%|█████▊ | 7183/12384 [15:14:35<11:04:56, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 58%|█████▊ | 7183/12384 [15:14:42<11:04:56, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 58%|█████▊ | 7184/12384 [15:14:42<11:04:54, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 58%|█████▊ | 7184/12384 [15:14:50<11:04:54, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 1: 58%|█████▊ | 7185/12384 [15:14:50<11:05:44, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 1: 58%|█████▊ | 7185/12384 [15:14:57<11:05:44, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.07s]
Epoch 1: 58%|█████▊ | 7186/12384 [15:14:57<11:02:59, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.07s]
Epoch 1: 58%|█████▊ | 7186/12384 [15:15:05<11:02:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 1: 58%|█████▊ | 7187/12384 [15:15:05<11:03:43, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 1: 58%|█████▊ | 7187/12384 [15:15:13<11:03:43, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 58%|█████▊ | 7188/12384 [15:15:13<11:09:16, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 58%|█████▊ | 7188/12384 [15:15:21<11:09:16, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 58%|█████▊ | 7189/12384 [15:15:21<11:05:44, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 58%|█████▊ | 7189/12384 [15:15:28<11:05:44, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 1: 58%|█████▊ | 7190/12384 [15:15:28<11:04:00, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 1: 58%|█████▊ | 7190/12384 [15:15:36<11:04:00, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 58%|█████▊ | 7191/12384 [15:15:36<11:01:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 58%|█████▊ | 7191/12384 [15:15:43<11:01:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 58%|█████▊ | 7192/12384 [15:15:43<11:00:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 58%|█████▊ | 7192/12384 [15:15:51<11:00:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 58%|█████▊ | 7193/12384 [15:15:51<10:59:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 58%|█████▊ | 7193/12384 [15:15:59<10:59:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 58%|█████▊ | 7194/12384 [15:15:59<10:59:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 58%|█████▊ | 7194/12384 [15:16:06<10:59:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 58%|█████▊ | 7195/12384 [15:16:06<10:59:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 58%|█████▊ | 7195/12384 [15:16:14<10:59:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.98s]
Epoch 1: 58%|█████▊ | 7196/12384 [15:16:14<10:59:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.98s]
Epoch 1: 58%|█████▊ | 7196/12384 [15:16:22<10:59:49, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=9.95s]
Epoch 1: 58%|█████▊ | 7197/12384 [15:16:22<10:59:08, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=9.95s]
Epoch 1: 58%|█████▊ | 7197/12384 [15:16:29<10:59:08, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 1: 58%|█████▊ | 7198/12384 [15:16:29<10:58:27, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 1: 58%|█████▊ | 7198/12384 [15:16:37<10:58:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 58%|█████▊ | 7199/12384 [15:16:37<10:58:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 58%|█████▊ | 7199/12384 [15:16:44<10:58:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 58%|█████▊ | 7200/12384 [15:16:44<10:58:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 58%|█████▊ | 7200/12384 [15:16:52<10:58:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.41s]
Epoch 1: 58%|█████▊ | 7201/12384 [15:16:52<10:58:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.41s]
Epoch 1: 58%|█████▊ | 7201/12384 [15:17:00<10:58:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 58%|█████▊ | 7202/12384 [15:17:00<10:57:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 58%|█████▊ | 7202/12384 [15:17:07<10:57:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.80s]
Epoch 1: 58%|█████▊ | 7203/12384 [15:17:07<10:57:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.80s]
Epoch 1: 58%|█████▊ | 7203/12384 [15:17:15<10:57:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.41s]
Epoch 1: 58%|█████▊ | 7204/12384 [15:17:15<10:56:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.41s]
Epoch 1: 58%|█████▊ | 7204/12384 [15:17:22<10:56:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 58%|█████▊ | 7205/12384 [15:17:22<10:56:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 58%|█████▊ | 7205/12384 [15:17:30<10:56:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 1: 58%|█████▊ | 7206/12384 [15:17:30<10:56:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 1: 58%|█████▊ | 7206/12384 [15:17:38<10:56:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.78s]
Epoch 1: 58%|█████▊ | 7207/12384 [15:17:38<10:57:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.78s]
Epoch 1: 58%|█████▊ | 7207/12384 [15:17:46<10:57:19, 7.62s/it, loss=0.0004, acc=0.9978, iter_time=8.06s]
Epoch 1: 58%|█████▊ | 7208/12384 [15:17:46<11:05:25, 7.71s/it, loss=0.0004, acc=0.9978, iter_time=8.06s]
Epoch 1: 58%|█████▊ | 7208/12384 [15:17:53<11:05:25, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.48s]
Epoch 1: 58%|█████▊ | 7209/12384 [15:17:53<11:02:58, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.48s]
Epoch 1: 58%|█████▊ | 7209/12384 [15:18:01<11:02:58, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 58%|█████▊ | 7210/12384 [15:18:01<11:01:02, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 58%|█████▊ | 7210/12384 [15:18:08<11:01:02, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 1: 58%|█████▊ | 7211/12384 [15:18:08<10:58:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 1: 58%|█████▊ | 7211/12384 [15:18:16<10:58:50, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=9.53s]
Epoch 1: 58%|█████▊ | 7212/12384 [15:18:16<10:57:26, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=9.53s]
Epoch 1: 58%|█████▊ | 7212/12384 [15:18:24<10:57:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 1: 58%|█████▊ | 7213/12384 [15:18:24<10:57:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 1: 58%|█████▊ | 7213/12384 [15:18:32<10:57:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.23s]
Epoch 1: 58%|█████▊ | 7214/12384 [15:18:32<11:03:26, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.23s]
Epoch 1: 58%|█████▊ | 7214/12384 [15:18:39<11:03:26, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.57s]
Epoch 1: 58%|█████▊ | 7215/12384 [15:18:39<11:01:25, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.57s]
Epoch 1: 58%|█████▊ | 7215/12384 [15:18:47<11:01:25, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=11.08s]
Epoch 1: 58%|█████▊ | 7216/12384 [15:18:47<11:00:10, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=11.08s]
Epoch 1: 58%|█████▊ | 7216/12384 [15:18:54<11:00:10, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 58%|█████▊ | 7217/12384 [15:18:54<10:58:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 58%|█████▊ | 7217/12384 [15:19:02<10:58:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 58%|█████▊ | 7218/12384 [15:19:02<10:57:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 58%|█████▊ | 7218/12384 [15:19:10<10:57:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 58%|█████▊ | 7219/12384 [15:19:10<10:56:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 58%|█████▊ | 7219/12384 [15:19:17<10:56:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 58%|█████▊ | 7220/12384 [15:19:17<10:56:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 58%|█████▊ | 7220/12384 [15:19:25<10:56:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 1: 58%|█████▊ | 7221/12384 [15:19:25<10:56:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 1: 58%|█████▊ | 7221/12384 [15:19:33<10:56:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 1: 58%|█████▊ | 7222/12384 [15:19:33<10:55:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 1: 58%|█████▊ | 7222/12384 [15:19:40<10:55:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 58%|█████▊ | 7223/12384 [15:19:40<10:56:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 58%|█████▊ | 7223/12384 [15:19:48<10:56:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 58%|█████▊ | 7224/12384 [15:19:48<10:55:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 58%|█████▊ | 7224/12384 [15:19:55<10:55:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=2.78s]
Epoch 1: 58%|█████▊ | 7225/12384 [15:19:55<10:54:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=2.78s]
Epoch 1: 58%|█████▊ | 7225/12384 [15:20:03<10:54:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=12.02s]
Epoch 1: 58%|█████▊ | 7226/12384 [15:20:03<10:53:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=12.02s]
Epoch 1: 58%|█████▊ | 7226/12384 [15:20:11<10:53:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 1: 58%|█████▊ | 7227/12384 [15:20:11<10:54:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 1: 58%|█████▊ | 7227/12384 [15:20:18<10:54:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 1: 58%|█████▊ | 7228/12384 [15:20:18<10:53:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 1: 58%|█████▊ | 7228/12384 [15:20:26<10:53:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 1: 58%|█████▊ | 7229/12384 [15:20:26<10:53:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 1: 58%|█████▊ | 7229/12384 [15:20:33<10:53:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.23s]
Epoch 1: 58%|█████▊ | 7230/12384 [15:20:33<10:53:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.23s]
Epoch 1: 58%|█████▊ | 7230/12384 [15:20:41<10:53:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 58%|█████▊ | 7231/12384 [15:20:41<10:53:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 58%|█████▊ | 7231/12384 [15:20:49<10:53:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.11s]
Epoch 1: 58%|█████▊ | 7232/12384 [15:20:49<10:53:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.11s]
Epoch 1: 58%|█████▊ | 7232/12384 [15:20:56<10:53:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 58%|█████▊ | 7233/12384 [15:20:56<10:53:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 58%|█████▊ | 7233/12384 [15:21:04<10:53:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 1: 58%|█████▊ | 7234/12384 [15:21:04<11:01:23, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 1: 58%|█████▊ | 7234/12384 [15:21:12<11:01:23, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 1: 58%|█████▊ | 7235/12384 [15:21:12<10:59:42, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 1: 58%|█████▊ | 7235/12384 [15:21:19<10:59:42, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 1: 58%|█████▊ | 7236/12384 [15:21:19<10:57:52, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 1: 58%|█████▊ | 7236/12384 [15:21:27<10:57:52, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 1: 58%|█████▊ | 7237/12384 [15:21:27<10:55:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 1: 58%|█████▊ | 7237/12384 [15:21:35<10:55:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 58%|█████▊ | 7238/12384 [15:21:35<10:55:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 58%|█████▊ | 7238/12384 [15:21:42<10:55:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 58%|█████▊ | 7239/12384 [15:21:42<10:54:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 58%|█████▊ | 7239/12384 [15:21:50<10:54:37, 7.63s/it, loss=0.0006, acc=0.9985, iter_time=7.58s]
Epoch 1: 58%|█████▊ | 7240/12384 [15:21:50<10:53:47, 7.63s/it, loss=0.0006, acc=0.9985, iter_time=7.58s]
Epoch 1: 58%|█████▊ | 7240/12384 [15:21:57<10:53:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 58%|█████▊ | 7241/12384 [15:21:57<10:53:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 58%|█████▊ | 7241/12384 [15:22:05<10:53:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 1: 58%|█████▊ | 7242/12384 [15:22:05<10:52:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 1: 58%|█████▊ | 7242/12384 [15:22:13<10:52:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 58%|█████▊ | 7243/12384 [15:22:13<10:52:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 58%|█████▊ | 7243/12384 [15:22:20<10:52:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 1: 58%|█████▊ | 7244/12384 [15:22:20<10:52:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 1: 58%|█████▊ | 7244/12384 [15:22:28<10:52:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 59%|█████▊ | 7245/12384 [15:22:28<10:51:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 59%|█████▊ | 7245/12384 [15:22:36<10:51:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 59%|█████▊ | 7246/12384 [15:22:36<10:51:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 59%|█████▊ | 7246/12384 [15:22:43<10:51:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 59%|█████▊ | 7247/12384 [15:22:43<10:51:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 59%|█████▊ | 7247/12384 [15:22:51<10:51:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 59%|█████▊ | 7248/12384 [15:22:51<10:51:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 59%|█████▊ | 7248/12384 [15:22:58<10:51:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 59%|█████▊ | 7249/12384 [15:22:58<10:51:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 59%|█████▊ | 7249/12384 [15:23:06<10:51:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 59%|█████▊ | 7250/12384 [15:23:06<10:51:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 59%|█████▊ | 7250/12384 [15:23:14<10:51:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 59%|█████▊ | 7251/12384 [15:23:14<10:51:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 59%|█████▊ | 7251/12384 [15:23:21<10:51:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.49s]
Epoch 1: 59%|█████▊ | 7252/12384 [15:23:21<10:51:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.49s]
Epoch 1: 59%|█████▊ | 7252/12384 [15:23:29<10:51:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.78s]
Epoch 1: 59%|█████▊ | 7253/12384 [15:23:29<10:51:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.78s]
Epoch 1: 59%|█████▊ | 7253/12384 [15:23:36<10:51:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 59%|█████▊ | 7254/12384 [15:23:37<11:16:23, 7.91s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 59%|█████▊ | 7254/12384 [15:23:45<11:16:23, 7.91s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 1: 59%|█████▊ | 7255/12384 [15:23:45<11:08:16, 7.82s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 1: 59%|█████▊ | 7255/12384 [15:23:53<11:08:16, 7.82s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 59%|█████▊ | 7256/12384 [15:23:53<11:03:08, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 59%|█████▊ | 7256/12384 [15:24:00<11:03:08, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 59%|█████▊ | 7257/12384 [15:24:00<10:58:39, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 59%|█████▊ | 7257/12384 [15:24:08<10:58:39, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 59%|█████▊ | 7258/12384 [15:24:08<10:56:47, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 59%|█████▊ | 7258/12384 [15:24:16<10:56:47, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 59%|█████▊ | 7259/12384 [15:24:16<10:54:56, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 59%|█████▊ | 7259/12384 [15:24:23<10:54:56, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 59%|█████▊ | 7260/12384 [15:24:23<10:53:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 59%|█████▊ | 7260/12384 [15:24:31<10:53:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 59%|█████▊ | 7261/12384 [15:24:31<11:00:53, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 59%|█████▊ | 7261/12384 [15:24:39<11:00:53, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 1: 59%|█████▊ | 7262/12384 [15:24:39<10:56:57, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 1: 59%|█████▊ | 7262/12384 [15:24:46<10:56:57, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 1: 59%|█████▊ | 7263/12384 [15:24:46<10:54:23, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 1: 59%|█████▊ | 7263/12384 [15:24:54<10:54:23, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 59%|█████▊ | 7264/12384 [15:24:54<10:52:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 59%|█████▊ | 7264/12384 [15:25:01<10:52:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 1: 59%|█████▊ | 7265/12384 [15:25:01<10:52:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 1: 59%|█████▊ | 7265/12384 [15:25:09<10:52:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 1: 59%|█████▊ | 7266/12384 [15:25:09<10:53:57, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 1: 59%|█████▊ | 7266/12384 [15:25:17<10:53:57, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 59%|█████▊ | 7267/12384 [15:25:17<10:52:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 59%|█████▊ | 7267/12384 [15:25:24<10:52:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 59%|█████▊ | 7268/12384 [15:25:24<10:51:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 59%|█████▊ | 7268/12384 [15:25:32<10:51:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 59%|█████▊ | 7269/12384 [15:25:32<10:50:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 59%|█████▊ | 7269/12384 [15:25:40<10:50:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 59%|█████▊ | 7270/12384 [15:25:40<10:49:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 59%|█████▊ | 7270/12384 [15:25:47<10:49:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 59%|█████▊ | 7271/12384 [15:25:47<10:51:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 59%|█████▊ | 7271/12384 [15:25:55<10:51:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 59%|█████▊ | 7272/12384 [15:25:55<10:51:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 59%|█████▊ | 7272/12384 [15:26:03<10:51:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 59%|█████▊ | 7273/12384 [15:26:03<10:51:57, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 59%|█████▊ | 7273/12384 [15:26:10<10:51:57, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 59%|█████▊ | 7274/12384 [15:26:10<10:50:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 59%|█████▊ | 7274/12384 [15:26:18<10:50:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 59%|█████▊ | 7275/12384 [15:26:18<10:49:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 59%|█████▊ | 7275/12384 [15:26:25<10:49:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 1: 59%|█████▉ | 7276/12384 [15:26:25<10:49:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 1: 59%|█████▉ | 7276/12384 [15:26:33<10:49:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 1: 59%|█████▉ | 7277/12384 [15:26:33<10:48:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 1: 59%|█████▉ | 7277/12384 [15:26:41<10:48:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 1: 59%|█████▉ | 7278/12384 [15:26:41<10:49:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 1: 59%|█████▉ | 7278/12384 [15:26:48<10:49:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 59%|█████▉ | 7279/12384 [15:26:48<10:48:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 59%|█████▉ | 7279/12384 [15:26:56<10:48:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 59%|█████▉ | 7280/12384 [15:26:56<10:48:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 59%|█████▉ | 7280/12384 [15:27:04<10:48:42, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.09s]
Epoch 1: 59%|█████▉ | 7281/12384 [15:27:04<10:48:23, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.09s]
Epoch 1: 59%|█████▉ | 7281/12384 [15:27:11<10:48:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 59%|█████▉ | 7282/12384 [15:27:11<10:47:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 59%|█████▉ | 7282/12384 [15:27:19<10:47:30, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=8.53s]
Epoch 1: 59%|█████▉ | 7283/12384 [15:27:19<10:46:47, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=8.53s]
Epoch 1: 59%|█████▉ | 7283/12384 [15:27:26<10:46:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 59%|█████▉ | 7284/12384 [15:27:26<10:46:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 59%|█████▉ | 7284/12384 [15:27:34<10:46:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.33s]
Epoch 1: 59%|█████▉ | 7285/12384 [15:27:34<10:46:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.33s]
Epoch 1: 59%|█████▉ | 7285/12384 [15:27:42<10:46:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 1: 59%|█████▉ | 7286/12384 [15:27:42<10:45:51, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 1: 59%|█████▉ | 7286/12384 [15:27:50<10:45:51, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 59%|█████▉ | 7287/12384 [15:27:50<10:55:56, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 59%|█████▉ | 7287/12384 [15:27:57<10:55:56, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 1: 59%|█████▉ | 7288/12384 [15:27:57<10:53:07, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 1: 59%|█████▉ | 7288/12384 [15:28:05<10:53:07, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 1: 59%|█████▉ | 7289/12384 [15:28:05<10:51:28, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 1: 59%|█████▉ | 7289/12384 [15:28:12<10:51:28, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 59%|█████▉ | 7290/12384 [15:28:12<10:49:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 59%|█████▉ | 7290/12384 [15:28:20<10:49:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 1: 59%|█████▉ | 7291/12384 [15:28:20<10:47:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 1: 59%|█████▉ | 7291/12384 [15:28:28<10:47:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 1: 59%|█████▉ | 7292/12384 [15:28:28<10:47:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 1: 59%|█████▉ | 7292/12384 [15:28:35<10:47:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 59%|█████▉ | 7293/12384 [15:28:35<10:46:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 59%|█████▉ | 7293/12384 [15:28:43<10:46:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 59%|█████▉ | 7294/12384 [15:28:43<10:45:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 59%|█████▉ | 7294/12384 [15:28:51<10:45:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 1: 59%|█████▉ | 7295/12384 [15:28:51<10:47:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 1: 59%|█████▉ | 7295/12384 [15:28:58<10:47:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 1: 59%|█████▉ | 7296/12384 [15:28:58<10:46:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 1: 59%|█████▉ | 7296/12384 [15:29:06<10:46:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 59%|█████▉ | 7297/12384 [15:29:06<10:46:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 59%|█████▉ | 7297/12384 [15:29:13<10:46:04, 7.62s/it, loss=0.0016, acc=0.9976, iter_time=4.74s]
Epoch 1: 59%|█████▉ | 7298/12384 [15:29:13<10:45:31, 7.62s/it, loss=0.0016, acc=0.9976, iter_time=4.74s]
Epoch 1: 59%|█████▉ | 7298/12384 [15:29:21<10:45:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 1: 59%|█████▉ | 7299/12384 [15:29:21<10:44:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 1: 59%|█████▉ | 7299/12384 [15:29:29<10:44:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 1: 59%|█████▉ | 7300/12384 [15:29:29<10:44:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 1: 59%|█████▉ | 7300/12384 [15:29:36<10:44:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 59%|█████▉ | 7301/12384 [15:29:36<10:47:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 59%|█████▉ | 7301/12384 [15:29:44<10:47:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 1: 59%|█████▉ | 7302/12384 [15:29:44<10:46:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 1: 59%|█████▉ | 7302/12384 [15:29:52<10:46:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 1: 59%|█████▉ | 7303/12384 [15:29:52<10:46:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 1: 59%|█████▉ | 7303/12384 [15:29:59<10:46:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 1: 59%|█████▉ | 7304/12384 [15:29:59<10:45:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 1: 59%|█████▉ | 7304/12384 [15:30:07<10:45:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 59%|█████▉ | 7305/12384 [15:30:07<10:46:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 59%|█████▉ | 7305/12384 [15:30:14<10:46:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 59%|█████▉ | 7306/12384 [15:30:14<10:44:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 59%|█████▉ | 7306/12384 [15:30:22<10:44:47, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=7.58s]
Epoch 1: 59%|█████▉ | 7307/12384 [15:30:22<10:44:35, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=7.58s]
Epoch 1: 59%|█████▉ | 7307/12384 [15:30:30<10:44:35, 7.62s/it, loss=0.0003, acc=0.9979, iter_time=4.24s]
Epoch 1: 59%|█████▉ | 7308/12384 [15:30:30<10:44:33, 7.62s/it, loss=0.0003, acc=0.9979, iter_time=4.24s]
Epoch 1: 59%|█████▉ | 7308/12384 [15:30:37<10:44:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 1: 59%|█████▉ | 7309/12384 [15:30:37<10:43:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 1: 59%|█████▉ | 7309/12384 [15:30:45<10:43:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 59%|█████▉ | 7310/12384 [15:30:45<10:43:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 59%|█████▉ | 7310/12384 [15:30:52<10:43:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 1: 59%|█████▉ | 7311/12384 [15:30:52<10:42:51, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 1: 59%|█████▉ | 7311/12384 [15:31:00<10:42:51, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 1: 59%|█████▉ | 7312/12384 [15:31:00<10:42:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 1: 59%|█████▉ | 7312/12384 [15:31:08<10:42:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 1: 59%|█████▉ | 7313/12384 [15:31:08<10:52:09, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 1: 59%|█████▉ | 7313/12384 [15:31:16<10:52:09, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 1: 59%|█████▉ | 7314/12384 [15:31:16<10:50:36, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 1: 59%|█████▉ | 7314/12384 [15:31:23<10:50:36, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 59%|█████▉ | 7315/12384 [15:31:23<10:47:41, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 59%|█████▉ | 7315/12384 [15:31:31<10:47:41, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 59%|█████▉ | 7316/12384 [15:31:31<10:45:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 59%|█████▉ | 7316/12384 [15:31:38<10:45:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 59%|█████▉ | 7317/12384 [15:31:38<10:44:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 59%|█████▉ | 7317/12384 [15:31:46<10:44:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 59%|█████▉ | 7318/12384 [15:31:46<10:45:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 59%|█████▉ | 7318/12384 [15:31:54<10:45:48, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=5.16s]
Epoch 1: 59%|█████▉ | 7319/12384 [15:31:54<10:44:58, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=5.16s]
Epoch 1: 59%|█████▉ | 7319/12384 [15:32:01<10:44:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.53s]
Epoch 1: 59%|█████▉ | 7320/12384 [15:32:01<10:43:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.53s]
Epoch 1: 59%|█████▉ | 7320/12384 [15:32:10<10:43:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 1: 59%|█████▉ | 7321/12384 [15:32:10<10:59:41, 7.82s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 1: 59%|█████▉ | 7321/12384 [15:32:18<10:59:41, 7.82s/it, loss=0.0000, acc=1.0000, iter_time=8.40s]
Epoch 1: 59%|█████▉ | 7322/12384 [15:32:18<11:13:47, 7.99s/it, loss=0.0000, acc=1.0000, iter_time=8.40s]
Epoch 1: 59%|█████▉ | 7322/12384 [15:32:26<11:13:47, 7.99s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 59%|█████▉ | 7323/12384 [15:32:26<11:05:38, 7.89s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 59%|█████▉ | 7323/12384 [15:32:33<11:05:38, 7.89s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 59%|█████▉ | 7324/12384 [15:32:33<10:59:49, 7.82s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 59%|█████▉ | 7324/12384 [15:32:41<10:59:49, 7.82s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 59%|█████▉ | 7325/12384 [15:32:41<11:02:10, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 59%|█████▉ | 7325/12384 [15:32:49<11:02:10, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 1: 59%|█████▉ | 7326/12384 [15:32:49<10:59:19, 7.82s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 1: 59%|█████▉ | 7326/12384 [15:32:57<10:59:19, 7.82s/it, loss=0.0000, acc=1.0000, iter_time=10.32s]
Epoch 1: 59%|█████▉ | 7327/12384 [15:32:57<10:54:58, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=10.32s]
Epoch 1: 59%|█████▉ | 7327/12384 [15:33:04<10:54:58, 7.77s/it, loss=0.0001, acc=1.0000, iter_time=8.03s]
Epoch 1: 59%|█████▉ | 7328/12384 [15:33:04<10:53:40, 7.76s/it, loss=0.0001, acc=1.0000, iter_time=8.03s]
Epoch 1: 59%|█████▉ | 7328/12384 [15:33:12<10:53:40, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 1: 59%|█████▉ | 7329/12384 [15:33:12<10:51:42, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 1: 59%|█████▉ | 7329/12384 [15:33:20<10:51:42, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 59%|█████▉ | 7330/12384 [15:33:20<10:49:19, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 59%|█████▉ | 7330/12384 [15:33:27<10:49:19, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 1: 59%|█████▉ | 7331/12384 [15:33:27<10:50:06, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 1: 59%|█████▉ | 7331/12384 [15:33:35<10:50:06, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 59%|█████▉ | 7332/12384 [15:33:35<10:48:14, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 59%|█████▉ | 7332/12384 [15:33:43<10:48:14, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 59%|█████▉ | 7333/12384 [15:33:43<10:46:54, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 59%|█████▉ | 7333/12384 [15:33:50<10:46:54, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 59%|█████▉ | 7334/12384 [15:33:50<10:45:46, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 59%|█████▉ | 7334/12384 [15:33:58<10:45:46, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 59%|█████▉ | 7335/12384 [15:33:58<10:48:17, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 59%|█████▉ | 7335/12384 [15:34:06<10:48:17, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=8.64s]
Epoch 1: 59%|█████▉ | 7336/12384 [15:34:06<10:48:40, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=8.64s]
Epoch 1: 59%|█████▉ | 7336/12384 [15:34:14<10:48:40, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 59%|█████▉ | 7337/12384 [15:34:14<10:47:04, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 59%|█████▉ | 7337/12384 [15:34:21<10:47:04, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.05s]
Epoch 1: 59%|█████▉ | 7338/12384 [15:34:21<10:46:00, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.05s]
Epoch 1: 59%|█████▉ | 7338/12384 [15:34:29<10:46:00, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.74s]
Epoch 1: 59%|█████▉ | 7339/12384 [15:34:29<10:56:50, 7.81s/it, loss=0.0000, acc=1.0000, iter_time=9.74s]
Epoch 1: 59%|█████▉ | 7339/12384 [15:34:37<10:56:50, 7.81s/it, loss=0.0000, acc=1.0000, iter_time=8.67s]
Epoch 1: 59%|█████▉ | 7340/12384 [15:34:37<10:53:11, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=8.67s]
Epoch 1: 59%|█████▉ | 7340/12384 [15:34:45<10:53:11, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 59%|█████▉ | 7341/12384 [15:34:45<10:51:00, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 59%|█████▉ | 7341/12384 [15:34:52<10:51:00, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 1: 59%|█████▉ | 7342/12384 [15:34:52<10:49:43, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 1: 59%|█████▉ | 7342/12384 [15:35:00<10:49:43, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=9.49s]
Epoch 1: 59%|█████▉ | 7343/12384 [15:35:00<10:48:11, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.49s]
Epoch 1: 59%|█████▉ | 7343/12384 [15:35:08<10:48:11, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=8.02s]
Epoch 1: 59%|█████▉ | 7344/12384 [15:35:08<10:47:29, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=8.02s]
Epoch 1: 59%|█████▉ | 7344/12384 [15:35:15<10:47:29, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 59%|█████▉ | 7345/12384 [15:35:15<10:46:31, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 59%|█████▉ | 7345/12384 [15:35:23<10:46:31, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 1: 59%|█████▉ | 7346/12384 [15:35:23<10:45:48, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 1: 59%|█████▉ | 7346/12384 [15:35:31<10:45:48, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.75s]
Epoch 1: 59%|█████▉ | 7347/12384 [15:35:31<10:44:55, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.75s]
Epoch 1: 59%|█████▉ | 7347/12384 [15:35:38<10:44:55, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 59%|█████▉ | 7348/12384 [15:35:38<10:45:15, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 59%|█████▉ | 7348/12384 [15:35:46<10:45:15, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 59%|█████▉ | 7349/12384 [15:35:46<10:45:08, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 59%|█████▉ | 7349/12384 [15:35:54<10:45:08, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 59%|█████▉ | 7350/12384 [15:35:54<10:44:49, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 59%|█████▉ | 7350/12384 [15:36:02<10:44:49, 7.69s/it, loss=0.0002, acc=1.0000, iter_time=6.31s]
Epoch 1: 59%|█████▉ | 7351/12384 [15:36:02<10:45:00, 7.69s/it, loss=0.0002, acc=1.0000, iter_time=6.31s]
Epoch 1: 59%|█████▉ | 7351/12384 [15:36:09<10:45:00, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 1: 59%|█████▉ | 7352/12384 [15:36:09<10:45:03, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 1: 59%|█████▉ | 7352/12384 [15:36:17<10:45:03, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 1: 59%|█████▉ | 7353/12384 [15:36:17<10:51:18, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 1: 59%|█████▉ | 7353/12384 [15:36:25<10:51:18, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=9.20s]
Epoch 1: 59%|█████▉ | 7354/12384 [15:36:25<10:48:19, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=9.20s]
Epoch 1: 59%|█████▉ | 7354/12384 [15:36:33<10:48:19, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.66s]
Epoch 1: 59%|█████▉ | 7355/12384 [15:36:33<10:46:52, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.66s]
Epoch 1: 59%|█████▉ | 7355/12384 [15:36:40<10:46:52, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 1: 59%|█████▉ | 7356/12384 [15:36:40<10:45:15, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 1: 59%|█████▉ | 7356/12384 [15:36:48<10:45:15, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.99s]
Epoch 1: 59%|█████▉ | 7357/12384 [15:36:48<10:42:51, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.99s]
Epoch 1: 59%|█████▉ | 7357/12384 [15:36:55<10:42:51, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 59%|█████▉ | 7358/12384 [15:36:55<10:42:23, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 59%|█████▉ | 7358/12384 [15:37:03<10:42:23, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 59%|█████▉ | 7359/12384 [15:37:03<10:41:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 59%|█████▉ | 7359/12384 [15:37:11<10:41:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 59%|█████▉ | 7360/12384 [15:37:11<10:39:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 59%|█████▉ | 7360/12384 [15:37:18<10:39:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.87s]
Epoch 1: 59%|█████▉ | 7361/12384 [15:37:18<10:38:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.87s]
Epoch 1: 59%|█████▉ | 7361/12384 [15:37:26<10:38:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 59%|█████▉ | 7362/12384 [15:37:26<10:38:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 59%|█████▉ | 7362/12384 [15:37:33<10:38:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 1: 59%|█████▉ | 7363/12384 [15:37:33<10:37:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 1: 59%|█████▉ | 7363/12384 [15:37:41<10:37:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.24s]
Epoch 1: 59%|█████▉ | 7364/12384 [15:37:41<10:37:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.24s]
Epoch 1: 59%|█████▉ | 7364/12384 [15:37:49<10:37:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 1: 59%|█████▉ | 7365/12384 [15:37:49<10:45:48, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 1: 59%|█████▉ | 7365/12384 [15:37:57<10:45:48, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.35s]
Epoch 1: 59%|█████▉ | 7366/12384 [15:37:57<10:43:17, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.35s]
Epoch 1: 59%|█████▉ | 7366/12384 [15:38:04<10:43:17, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 59%|█████▉ | 7367/12384 [15:38:04<10:42:31, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 59%|█████▉ | 7367/12384 [15:38:12<10:42:31, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 59%|█████▉ | 7368/12384 [15:38:12<10:40:38, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 59%|█████▉ | 7368/12384 [15:38:20<10:40:38, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=3.96s]
Epoch 1: 60%|█████▉ | 7369/12384 [15:38:20<10:38:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.96s]
Epoch 1: 60%|█████▉ | 7369/12384 [15:38:27<10:38:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.59s]
Epoch 1: 60%|█████▉ | 7370/12384 [15:38:27<10:37:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.59s]
Epoch 1: 60%|█████▉ | 7370/12384 [15:38:35<10:37:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.51s]
Epoch 1: 60%|█████▉ | 7371/12384 [15:38:35<10:36:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.51s]
Epoch 1: 60%|█████▉ | 7371/12384 [15:38:42<10:36:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.94s]
Epoch 1: 60%|█████▉ | 7372/12384 [15:38:42<10:35:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.94s]
Epoch 1: 60%|█████▉ | 7372/12384 [15:38:50<10:35:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 60%|█████▉ | 7373/12384 [15:38:50<10:35:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 60%|█████▉ | 7373/12384 [15:38:58<10:35:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 60%|█████▉ | 7374/12384 [15:38:58<10:34:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 60%|█████▉ | 7374/12384 [15:39:05<10:34:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 60%|█████▉ | 7375/12384 [15:39:05<10:34:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 60%|█████▉ | 7375/12384 [15:39:13<10:34:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 60%|█████▉ | 7376/12384 [15:39:13<10:34:42, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 60%|█████▉ | 7376/12384 [15:39:20<10:34:42, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.19s]
Epoch 1: 60%|█████▉ | 7377/12384 [15:39:20<10:34:07, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.19s]
Epoch 1: 60%|█████▉ | 7377/12384 [15:39:28<10:34:07, 7.60s/it, loss=0.0002, acc=1.0000, iter_time=4.74s]
Epoch 1: 60%|█████▉ | 7378/12384 [15:39:28<10:34:30, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=4.74s]
Epoch 1: 60%|█████▉ | 7378/12384 [15:39:36<10:34:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.48s]
Epoch 1: 60%|█████▉ | 7379/12384 [15:39:36<10:34:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.48s]
Epoch 1: 60%|█████▉ | 7379/12384 [15:39:43<10:34:38, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.83s]
Epoch 1: 60%|█████▉ | 7380/12384 [15:39:43<10:34:08, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=5.83s]
Epoch 1: 60%|█████▉ | 7380/12384 [15:39:51<10:34:08, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.83s]
Epoch 1: 60%|█████▉ | 7381/12384 [15:39:51<10:34:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.83s]
Epoch 1: 60%|█████▉ | 7381/12384 [15:39:58<10:34:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 1: 60%|█████▉ | 7382/12384 [15:39:58<10:34:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 1: 60%|█████▉ | 7382/12384 [15:40:06<10:34:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 1: 60%|█████▉ | 7383/12384 [15:40:06<10:34:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 1: 60%|█████▉ | 7383/12384 [15:40:14<10:34:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.04s]
Epoch 1: 60%|█████▉ | 7384/12384 [15:40:14<10:34:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.04s]
Epoch 1: 60%|█████▉ | 7384/12384 [15:40:21<10:34:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 1: 60%|█████▉ | 7385/12384 [15:40:21<10:36:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 1: 60%|█████▉ | 7385/12384 [15:40:29<10:36:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 1: 60%|█████▉ | 7386/12384 [15:40:29<10:35:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 1: 60%|█████▉ | 7386/12384 [15:40:37<10:35:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 1: 60%|█████▉ | 7387/12384 [15:40:37<10:35:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 1: 60%|█████▉ | 7387/12384 [15:40:44<10:35:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 60%|█████▉ | 7388/12384 [15:40:44<10:34:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 60%|█████▉ | 7388/12384 [15:40:52<10:34:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 60%|█████▉ | 7389/12384 [15:40:52<10:33:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 60%|█████▉ | 7389/12384 [15:40:59<10:33:35, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.24s]
Epoch 1: 60%|█████▉ | 7390/12384 [15:40:59<10:33:36, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.24s]
Epoch 1: 60%|█████▉ | 7390/12384 [15:41:07<10:33:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.95s]
Epoch 1: 60%|█████▉ | 7391/12384 [15:41:07<10:33:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.95s]
Epoch 1: 60%|█████▉ | 7391/12384 [15:41:15<10:33:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 60%|█████▉ | 7392/12384 [15:41:15<10:41:35, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 60%|█████▉ | 7392/12384 [15:41:23<10:41:35, 7.71s/it, loss=0.0003, acc=0.9981, iter_time=4.30s]
Epoch 1: 60%|█████▉ | 7393/12384 [15:41:23<10:39:43, 7.69s/it, loss=0.0003, acc=0.9981, iter_time=4.30s]
Epoch 1: 60%|█████▉ | 7393/12384 [15:41:30<10:39:43, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=11.00s]
Epoch 1: 60%|█████▉ | 7394/12384 [15:41:30<10:37:27, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=11.00s]
Epoch 1: 60%|█████▉ | 7394/12384 [15:41:38<10:37:27, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 60%|█████▉ | 7395/12384 [15:41:38<10:43:02, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 60%|█████▉ | 7395/12384 [15:41:46<10:43:02, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 1: 60%|█████▉ | 7396/12384 [15:41:46<10:39:29, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 1: 60%|█████▉ | 7396/12384 [15:41:53<10:39:29, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.17s]
Epoch 1: 60%|█████▉ | 7397/12384 [15:41:53<10:37:18, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.17s]
Epoch 1: 60%|█████▉ | 7397/12384 [15:42:01<10:37:18, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 1: 60%|█████▉ | 7398/12384 [15:42:01<10:38:07, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 1: 60%|█████▉ | 7398/12384 [15:42:09<10:38:07, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.89s]
Epoch 1: 60%|█████▉ | 7399/12384 [15:42:09<10:36:17, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.89s]
Epoch 1: 60%|█████▉ | 7399/12384 [15:42:16<10:36:17, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.68s]
Epoch 1: 60%|█████▉ | 7400/12384 [15:42:16<10:34:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.68s]
Epoch 1: 60%|█████▉ | 7400/12384 [15:42:24<10:34:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 60%|█████▉ | 7401/12384 [15:42:24<10:33:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 60%|█████▉ | 7401/12384 [15:42:31<10:33:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 60%|█████▉ | 7402/12384 [15:42:31<10:32:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 60%|█████▉ | 7402/12384 [15:42:39<10:32:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 1: 60%|█████▉ | 7403/12384 [15:42:39<10:31:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 1: 60%|█████▉ | 7403/12384 [15:42:47<10:31:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 1: 60%|█████▉ | 7404/12384 [15:42:47<10:31:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 1: 60%|█████▉ | 7404/12384 [15:42:54<10:31:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 1: 60%|█████▉ | 7405/12384 [15:42:54<10:31:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 1: 60%|█████▉ | 7405/12384 [15:43:02<10:31:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 60%|█████▉ | 7406/12384 [15:43:02<10:31:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 60%|█████▉ | 7406/12384 [15:43:09<10:31:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 1: 60%|█████▉ | 7407/12384 [15:43:09<10:31:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 1: 60%|█████▉ | 7407/12384 [15:43:17<10:31:48, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.41s]
Epoch 1: 60%|█████▉ | 7408/12384 [15:43:17<10:31:16, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.41s]
Epoch 1: 60%|█████▉ | 7408/12384 [15:43:25<10:31:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.63s]
Epoch 1: 60%|█████▉ | 7409/12384 [15:43:25<10:31:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.63s]
Epoch 1: 60%|█████▉ | 7409/12384 [15:43:32<10:31:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.32s]
Epoch 1: 60%|█████▉ | 7410/12384 [15:43:32<10:30:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.32s]
Epoch 1: 60%|█████▉ | 7410/12384 [15:43:40<10:30:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 60%|█████▉ | 7411/12384 [15:43:40<10:31:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 60%|█████▉ | 7411/12384 [15:43:47<10:31:01, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=7.61s]
Epoch 1: 60%|█████▉ | 7412/12384 [15:43:47<10:31:03, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=7.61s]
Epoch 1: 60%|█████▉ | 7412/12384 [15:43:55<10:31:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 60%|█████▉ | 7413/12384 [15:43:55<10:31:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 60%|█████▉ | 7413/12384 [15:44:03<10:31:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 1: 60%|█████▉ | 7414/12384 [15:44:03<10:31:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 1: 60%|█████▉ | 7414/12384 [15:44:10<10:31:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 1: 60%|█████▉ | 7415/12384 [15:44:10<10:32:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 1: 60%|█████▉ | 7415/12384 [15:44:18<10:32:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.94s]
Epoch 1: 60%|█████▉ | 7416/12384 [15:44:18<10:31:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.94s]
Epoch 1: 60%|█████▉ | 7416/12384 [15:44:26<10:31:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 60%|█████▉ | 7417/12384 [15:44:26<10:30:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 60%|█████▉ | 7417/12384 [15:44:34<10:30:42, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.20s]
Epoch 1: 60%|█████▉ | 7418/12384 [15:44:34<10:38:01, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=6.20s]
Epoch 1: 60%|█████▉ | 7418/12384 [15:44:41<10:38:01, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 1: 60%|█████▉ | 7419/12384 [15:44:41<10:35:03, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 1: 60%|█████▉ | 7419/12384 [15:44:49<10:35:03, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 1: 60%|█████▉ | 7420/12384 [15:44:49<10:33:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 1: 60%|█████▉ | 7420/12384 [15:44:57<10:33:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 1: 60%|█████▉ | 7421/12384 [15:44:57<10:38:29, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 1: 60%|█████▉ | 7421/12384 [15:45:04<10:38:29, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 1: 60%|█████▉ | 7422/12384 [15:45:04<10:35:51, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 1: 60%|█████▉ | 7422/12384 [15:45:12<10:35:51, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.77s]
Epoch 1: 60%|█████▉ | 7423/12384 [15:45:12<10:34:02, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.77s]
Epoch 1: 60%|█████▉ | 7423/12384 [15:45:19<10:34:02, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=11.62s]
Epoch 1: 60%|█████▉ | 7424/12384 [15:45:19<10:32:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.62s]
Epoch 1: 60%|█████▉ | 7424/12384 [15:45:27<10:32:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 60%|█████▉ | 7425/12384 [15:45:27<10:30:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 60%|█████▉ | 7425/12384 [15:45:35<10:30:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 60%|█████▉ | 7426/12384 [15:45:35<10:30:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 60%|█████▉ | 7426/12384 [15:45:42<10:30:07, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 60%|█████▉ | 7427/12384 [15:45:42<10:29:11, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 60%|█████▉ | 7427/12384 [15:45:50<10:29:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 60%|█████▉ | 7428/12384 [15:45:50<10:28:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 60%|█████▉ | 7428/12384 [15:45:57<10:28:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 60%|█████▉ | 7429/12384 [15:45:57<10:28:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 60%|█████▉ | 7429/12384 [15:46:05<10:28:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 60%|█████▉ | 7430/12384 [15:46:05<10:28:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 60%|█████▉ | 7430/12384 [15:46:13<10:28:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.78s]
Epoch 1: 60%|██████ | 7431/12384 [15:46:13<10:28:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.78s]
Epoch 1: 60%|██████ | 7431/12384 [15:46:20<10:28:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.80s]
Epoch 1: 60%|██████ | 7432/12384 [15:46:20<10:27:31, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.80s]
Epoch 1: 60%|██████ | 7432/12384 [15:46:28<10:27:31, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 60%|██████ | 7433/12384 [15:46:28<10:27:08, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 60%|██████ | 7433/12384 [15:46:35<10:27:08, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 60%|██████ | 7434/12384 [15:46:35<10:27:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 60%|██████ | 7434/12384 [15:46:43<10:27:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 60%|██████ | 7435/12384 [15:46:43<10:27:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 60%|██████ | 7435/12384 [15:46:51<10:27:30, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 1: 60%|██████ | 7436/12384 [15:46:51<10:27:46, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 1: 60%|██████ | 7436/12384 [15:46:58<10:27:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 60%|██████ | 7437/12384 [15:46:58<10:27:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 60%|██████ | 7437/12384 [15:47:06<10:27:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 60%|██████ | 7438/12384 [15:47:06<10:27:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 60%|██████ | 7438/12384 [15:47:14<10:27:23, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.58s]
Epoch 1: 60%|██████ | 7439/12384 [15:47:14<10:26:48, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.58s]
Epoch 1: 60%|██████ | 7439/12384 [15:47:21<10:26:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 60%|██████ | 7440/12384 [15:47:21<10:27:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 60%|██████ | 7440/12384 [15:47:29<10:27:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 60%|██████ | 7441/12384 [15:47:29<10:27:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 60%|██████ | 7441/12384 [15:47:36<10:27:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 60%|██████ | 7442/12384 [15:47:36<10:26:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 60%|██████ | 7442/12384 [15:47:44<10:26:54, 7.61s/it, loss=0.0003, acc=0.9986, iter_time=7.61s]
Epoch 1: 60%|██████ | 7443/12384 [15:47:44<10:27:13, 7.62s/it, loss=0.0003, acc=0.9986, iter_time=7.61s]
Epoch 1: 60%|██████ | 7443/12384 [15:47:52<10:27:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 1: 60%|██████ | 7444/12384 [15:47:52<10:26:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 1: 60%|██████ | 7444/12384 [15:48:00<10:26:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.77s]
Epoch 1: 60%|██████ | 7445/12384 [15:48:00<10:34:19, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.77s]
Epoch 1: 60%|██████ | 7445/12384 [15:48:07<10:34:19, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 60%|██████ | 7446/12384 [15:48:07<10:31:36, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 60%|██████ | 7446/12384 [15:48:15<10:31:36, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 60%|██████ | 7447/12384 [15:48:15<10:29:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 60%|██████ | 7447/12384 [15:48:22<10:29:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 1: 60%|██████ | 7448/12384 [15:48:22<10:28:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 1: 60%|██████ | 7448/12384 [15:48:30<10:28:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 60%|██████ | 7449/12384 [15:48:30<10:27:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 60%|██████ | 7449/12384 [15:48:38<10:27:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 60%|██████ | 7450/12384 [15:48:38<10:27:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 60%|██████ | 7450/12384 [15:48:45<10:27:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 60%|██████ | 7451/12384 [15:48:45<10:28:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 60%|██████ | 7451/12384 [15:48:53<10:28:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 1: 60%|██████ | 7452/12384 [15:48:53<10:27:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 1: 60%|██████ | 7452/12384 [15:49:00<10:27:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 1: 60%|██████ | 7453/12384 [15:49:00<10:26:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 1: 60%|██████ | 7453/12384 [15:49:08<10:26:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 1: 60%|██████ | 7454/12384 [15:49:08<10:25:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 1: 60%|██████ | 7454/12384 [15:49:16<10:25:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 1: 60%|██████ | 7455/12384 [15:49:16<10:25:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 1: 60%|██████ | 7455/12384 [15:49:23<10:25:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 60%|██████ | 7456/12384 [15:49:23<10:25:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 60%|██████ | 7456/12384 [15:49:31<10:25:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.06s]
Epoch 1: 60%|██████ | 7457/12384 [15:49:31<10:25:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.06s]
Epoch 1: 60%|██████ | 7457/12384 [15:49:39<10:25:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.21s]
Epoch 1: 60%|██████ | 7458/12384 [15:49:39<10:25:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.21s]
Epoch 1: 60%|██████ | 7458/12384 [15:49:46<10:25:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 1: 60%|██████ | 7459/12384 [15:49:46<10:24:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 1: 60%|██████ | 7459/12384 [15:49:54<10:24:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 1: 60%|██████ | 7460/12384 [15:49:54<10:24:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 1: 60%|██████ | 7460/12384 [15:50:01<10:24:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 60%|██████ | 7461/12384 [15:50:01<10:25:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 60%|██████ | 7461/12384 [15:50:09<10:25:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 60%|██████ | 7462/12384 [15:50:09<10:25:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 60%|██████ | 7462/12384 [15:50:17<10:25:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 60%|██████ | 7463/12384 [15:50:17<10:24:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 60%|██████ | 7463/12384 [15:50:24<10:24:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 60%|██████ | 7464/12384 [15:50:24<10:24:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 60%|██████ | 7464/12384 [15:50:32<10:24:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.38s]
Epoch 1: 60%|██████ | 7465/12384 [15:50:32<10:24:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.38s]
Epoch 1: 60%|██████ | 7465/12384 [15:50:39<10:24:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.35s]
Epoch 1: 60%|██████ | 7466/12384 [15:50:39<10:25:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.35s]
Epoch 1: 60%|██████ | 7466/12384 [15:50:47<10:25:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.61s]
Epoch 1: 60%|██████ | 7467/12384 [15:50:47<10:24:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.61s]
Epoch 1: 60%|██████ | 7467/12384 [15:50:55<10:24:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 1: 60%|██████ | 7468/12384 [15:50:55<10:24:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 1: 60%|██████ | 7468/12384 [15:51:02<10:24:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 60%|██████ | 7469/12384 [15:51:02<10:23:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 60%|██████ | 7469/12384 [15:51:10<10:23:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 1: 60%|██████ | 7470/12384 [15:51:10<10:22:42, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 1: 60%|██████ | 7470/12384 [15:51:18<10:22:42, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 60%|██████ | 7471/12384 [15:51:18<10:31:25, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 60%|██████ | 7471/12384 [15:51:25<10:31:25, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 60%|██████ | 7472/12384 [15:51:25<10:28:53, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 60%|██████ | 7472/12384 [15:51:33<10:28:53, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 60%|██████ | 7473/12384 [15:51:33<10:33:31, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 60%|██████ | 7473/12384 [15:51:41<10:33:31, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 60%|██████ | 7474/12384 [15:51:41<10:29:49, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 60%|██████ | 7474/12384 [15:51:49<10:29:49, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 1: 60%|██████ | 7475/12384 [15:51:49<10:30:00, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 1: 60%|██████ | 7475/12384 [15:51:56<10:30:00, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 60%|██████ | 7476/12384 [15:51:56<10:27:34, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 60%|██████ | 7476/12384 [15:52:04<10:27:34, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 1: 60%|██████ | 7477/12384 [15:52:04<10:25:42, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 1: 60%|██████ | 7477/12384 [15:52:11<10:25:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 60%|██████ | 7478/12384 [15:52:11<10:24:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 60%|██████ | 7478/12384 [15:52:19<10:24:23, 7.64s/it, loss=0.0002, acc=0.9993, iter_time=7.60s]
Epoch 1: 60%|██████ | 7479/12384 [15:52:19<10:23:39, 7.63s/it, loss=0.0002, acc=0.9993, iter_time=7.60s]
Epoch 1: 60%|██████ | 7479/12384 [15:52:27<10:23:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 60%|██████ | 7480/12384 [15:52:27<10:23:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 60%|██████ | 7480/12384 [15:52:34<10:23:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 60%|██████ | 7481/12384 [15:52:34<10:22:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 60%|██████ | 7481/12384 [15:52:42<10:22:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 60%|██████ | 7482/12384 [15:52:42<10:22:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 60%|██████ | 7482/12384 [15:52:50<10:22:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 60%|██████ | 7483/12384 [15:52:50<10:22:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 60%|██████ | 7483/12384 [15:52:57<10:22:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 60%|██████ | 7484/12384 [15:52:57<10:22:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 60%|██████ | 7484/12384 [15:53:05<10:22:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.06s]
Epoch 1: 60%|██████ | 7485/12384 [15:53:05<10:21:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.06s]
Epoch 1: 60%|██████ | 7485/12384 [15:53:12<10:21:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 1: 60%|██████ | 7486/12384 [15:53:12<10:21:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 1: 60%|██████ | 7486/12384 [15:53:20<10:21:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 60%|██████ | 7487/12384 [15:53:20<10:23:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 60%|██████ | 7487/12384 [15:53:28<10:23:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 1: 60%|██████ | 7488/12384 [15:53:28<10:22:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 1: 60%|██████ | 7488/12384 [15:53:35<10:22:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 1: 60%|██████ | 7489/12384 [15:53:35<10:21:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 1: 60%|██████ | 7489/12384 [15:53:43<10:21:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 1: 60%|██████ | 7490/12384 [15:53:43<10:21:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 1: 60%|██████ | 7490/12384 [15:53:51<10:21:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 60%|██████ | 7491/12384 [15:53:51<10:22:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 60%|██████ | 7491/12384 [15:53:58<10:22:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 1: 60%|██████ | 7492/12384 [15:53:58<10:22:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 1: 60%|██████ | 7492/12384 [15:54:06<10:22:22, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.58s]
Epoch 1: 61%|██████ | 7493/12384 [15:54:06<10:20:48, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.58s]
Epoch 1: 61%|██████ | 7493/12384 [15:54:13<10:20:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 61%|██████ | 7494/12384 [15:54:13<10:20:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 61%|██████ | 7494/12384 [15:54:21<10:20:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 61%|██████ | 7495/12384 [15:54:21<10:20:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 61%|██████ | 7495/12384 [15:54:29<10:20:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 1: 61%|██████ | 7496/12384 [15:54:29<10:19:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 1: 61%|██████ | 7496/12384 [15:54:37<10:19:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.38s]
Epoch 1: 61%|██████ | 7497/12384 [15:54:37<10:27:33, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.38s]
Epoch 1: 61%|██████ | 7497/12384 [15:54:44<10:27:33, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 1: 61%|██████ | 7498/12384 [15:54:44<10:25:07, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 1: 61%|██████ | 7498/12384 [15:54:52<10:25:07, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 61%|██████ | 7499/12384 [15:54:52<10:30:13, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 61%|██████ | 7499/12384 [15:55:00<10:30:13, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 61%|██████ | 7500/12384 [15:55:00<10:26:47, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 61%|██████ | 7500/12384 [15:55:07<10:26:47, 7.70s/it, loss=0.0004, acc=0.9983, iter_time=7.64s]
Epoch 1: 61%|██████ | 7501/12384 [15:55:07<10:25:35, 7.69s/it, loss=0.0004, acc=0.9983, iter_time=7.64s]
Epoch 1: 61%|██████ | 7501/12384 [15:55:15<10:25:35, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 61%|██████ | 7502/12384 [15:55:15<10:23:34, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 61%|██████ | 7502/12384 [15:55:23<10:23:34, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 1: 61%|██████ | 7503/12384 [15:55:23<10:22:22, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 1: 61%|██████ | 7503/12384 [15:55:30<10:22:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 1: 61%|██████ | 7504/12384 [15:55:30<10:21:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 1: 61%|██████ | 7504/12384 [15:55:38<10:21:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 61%|██████ | 7505/12384 [15:55:38<10:20:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 61%|██████ | 7505/12384 [15:55:45<10:20:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 61%|██████ | 7506/12384 [15:55:45<10:19:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 61%|██████ | 7506/12384 [15:55:53<10:19:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 61%|██████ | 7507/12384 [15:55:53<10:18:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 61%|██████ | 7507/12384 [15:56:01<10:18:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 61%|██████ | 7508/12384 [15:56:01<10:20:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 61%|██████ | 7508/12384 [15:56:08<10:20:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.25s]
Epoch 1: 61%|██████ | 7509/12384 [15:56:08<10:20:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.25s]
Epoch 1: 61%|██████ | 7509/12384 [15:56:16<10:20:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 1: 61%|██████ | 7510/12384 [15:56:16<10:19:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 1: 61%|██████ | 7510/12384 [15:56:24<10:19:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 61%|██████ | 7511/12384 [15:56:24<10:19:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 61%|██████ | 7511/12384 [15:56:31<10:19:33, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.75s]
Epoch 1: 61%|██████ | 7512/12384 [15:56:31<10:21:00, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=9.75s]
Epoch 1: 61%|██████ | 7512/12384 [15:56:39<10:21:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 1: 61%|██████ | 7513/12384 [15:56:39<10:20:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 1: 61%|██████ | 7513/12384 [15:56:47<10:20:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.24s]
Epoch 1: 61%|██████ | 7514/12384 [15:56:47<10:21:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.24s]
Epoch 1: 61%|██████ | 7514/12384 [15:56:54<10:21:33, 7.66s/it, loss=0.0001, acc=0.9997, iter_time=7.70s]
Epoch 1: 61%|██████ | 7515/12384 [15:56:54<10:23:08, 7.68s/it, loss=0.0001, acc=0.9997, iter_time=7.70s]
Epoch 1: 61%|██████ | 7515/12384 [15:57:02<10:23:08, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 1: 61%|██████ | 7516/12384 [15:57:02<10:21:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 1: 61%|██████ | 7516/12384 [15:57:10<10:21:09, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=3.40s]
Epoch 1: 61%|██████ | 7517/12384 [15:57:10<10:21:11, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=3.40s]
Epoch 1: 61%|██████ | 7517/12384 [15:57:17<10:21:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=11.47s]
Epoch 1: 61%|██████ | 7518/12384 [15:57:17<10:21:41, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=11.47s]
Epoch 1: 61%|██████ | 7518/12384 [15:57:25<10:21:41, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 61%|██████ | 7519/12384 [15:57:25<10:20:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 61%|██████ | 7519/12384 [15:57:32<10:20:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 61%|██████ | 7520/12384 [15:57:32<10:18:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 61%|██████ | 7520/12384 [15:57:40<10:18:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 61%|██████ | 7521/12384 [15:57:40<10:18:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 61%|██████ | 7521/12384 [15:57:48<10:18:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 61%|██████ | 7522/12384 [15:57:48<10:17:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 61%|██████ | 7522/12384 [15:57:56<10:17:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 61%|██████ | 7523/12384 [15:57:56<10:27:00, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 61%|██████ | 7523/12384 [15:58:03<10:27:00, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 61%|██████ | 7524/12384 [15:58:03<10:26:10, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 61%|██████ | 7524/12384 [15:58:11<10:26:10, 7.73s/it, loss=0.0001, acc=1.0000, iter_time=7.71s]
Epoch 1: 61%|██████ | 7525/12384 [15:58:11<10:23:06, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.71s]
Epoch 1: 61%|██████ | 7525/12384 [15:58:19<10:23:06, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 61%|██████ | 7526/12384 [15:58:19<10:21:41, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 61%|██████ | 7526/12384 [15:58:26<10:21:41, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 61%|██████ | 7527/12384 [15:58:26<10:19:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 61%|██████ | 7527/12384 [15:58:34<10:19:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 61%|██████ | 7528/12384 [15:58:34<10:18:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 61%|██████ | 7528/12384 [15:58:41<10:18:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 1: 61%|██████ | 7529/12384 [15:58:41<10:18:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 1: 61%|██████ | 7529/12384 [15:58:49<10:18:19, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.62s]
Epoch 1: 61%|██████ | 7530/12384 [15:58:49<10:18:25, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.62s]
Epoch 1: 61%|██████ | 7530/12384 [15:58:57<10:18:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 61%|██████ | 7531/12384 [15:58:57<10:17:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 61%|██████ | 7531/12384 [15:59:04<10:17:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 61%|██████ | 7532/12384 [15:59:04<10:17:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 61%|██████ | 7532/12384 [15:59:12<10:17:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 1: 61%|██████ | 7533/12384 [15:59:12<10:15:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 1: 61%|██████ | 7533/12384 [15:59:20<10:15:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.79s]
Epoch 1: 61%|██████ | 7534/12384 [15:59:20<10:15:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.79s]
Epoch 1: 61%|██████ | 7534/12384 [15:59:27<10:15:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.12s]
Epoch 1: 61%|██████ | 7535/12384 [15:59:27<10:14:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.12s]
Epoch 1: 61%|██████ | 7535/12384 [15:59:35<10:14:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 61%|██████ | 7536/12384 [15:59:35<10:15:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 61%|██████ | 7536/12384 [15:59:42<10:15:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 61%|██████ | 7537/12384 [15:59:42<10:14:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 61%|██████ | 7537/12384 [15:59:50<10:14:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 61%|██████ | 7538/12384 [15:59:50<10:14:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 61%|██████ | 7538/12384 [15:59:58<10:14:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 1: 61%|██████ | 7539/12384 [15:59:58<10:13:59, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 1: 61%|██████ | 7539/12384 [16:00:05<10:13:59, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 61%|██████ | 7540/12384 [16:00:05<10:13:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 61%|██████ | 7540/12384 [16:00:13<10:13:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 1: 61%|██████ | 7541/12384 [16:00:13<10:13:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 1: 61%|██████ | 7541/12384 [16:00:20<10:13:26, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 1: 61%|██████ | 7542/12384 [16:00:20<10:13:22, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 1: 61%|██████ | 7542/12384 [16:00:28<10:13:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 1: 61%|██████ | 7543/12384 [16:00:28<10:12:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 1: 61%|██████ | 7543/12384 [16:00:36<10:12:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 1: 61%|██████ | 7544/12384 [16:00:36<10:13:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 1: 61%|██████ | 7544/12384 [16:00:43<10:13:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 61%|██████ | 7545/12384 [16:00:43<10:12:37, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 61%|██████ | 7545/12384 [16:00:51<10:12:37, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 1: 61%|██████ | 7546/12384 [16:00:51<10:13:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 1: 61%|██████ | 7546/12384 [16:00:58<10:13:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 61%|██████ | 7547/12384 [16:00:58<10:13:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 61%|██████ | 7547/12384 [16:01:06<10:13:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 1: 61%|██████ | 7548/12384 [16:01:06<10:13:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 1: 61%|██████ | 7548/12384 [16:01:14<10:13:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 1: 61%|██████ | 7549/12384 [16:01:14<10:21:20, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 1: 61%|██████ | 7549/12384 [16:01:22<10:21:20, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 61%|██████ | 7550/12384 [16:01:22<10:19:01, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 61%|██████ | 7550/12384 [16:01:29<10:19:01, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 1: 61%|██████ | 7551/12384 [16:01:29<10:18:11, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 1: 61%|██████ | 7551/12384 [16:01:37<10:18:11, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.87s]
Epoch 1: 61%|██████ | 7552/12384 [16:01:37<10:18:34, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.87s]
Epoch 1: 61%|██████ | 7552/12384 [16:01:45<10:18:34, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 61%|██████ | 7553/12384 [16:01:45<10:23:56, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 61%|██████ | 7553/12384 [16:01:52<10:23:56, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 61%|██████ | 7554/12384 [16:01:52<10:20:24, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 61%|██████ | 7554/12384 [16:02:00<10:20:24, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 61%|██████ | 7555/12384 [16:02:00<10:17:53, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 61%|██████ | 7555/12384 [16:02:08<10:17:53, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 1: 61%|██████ | 7556/12384 [16:02:08<10:16:10, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 1: 61%|██████ | 7556/12384 [16:02:15<10:16:10, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 61%|██████ | 7557/12384 [16:02:15<10:14:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 61%|██████ | 7557/12384 [16:02:23<10:14:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 61%|██████ | 7558/12384 [16:02:23<10:14:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 61%|██████ | 7558/12384 [16:02:31<10:14:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 1: 61%|██████ | 7559/12384 [16:02:31<10:13:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 1: 61%|██████ | 7559/12384 [16:02:38<10:13:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 61%|██████ | 7560/12384 [16:02:38<10:13:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 61%|██████ | 7560/12384 [16:02:46<10:13:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 1: 61%|██████ | 7561/12384 [16:02:46<10:12:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 1: 61%|██████ | 7561/12384 [16:02:53<10:12:32, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=7.80s]
Epoch 1: 61%|██████ | 7562/12384 [16:02:53<10:12:22, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=7.80s]
Epoch 1: 61%|██████ | 7562/12384 [16:03:01<10:12:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 61%|██████ | 7563/12384 [16:03:01<10:11:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 61%|██████ | 7563/12384 [16:03:09<10:11:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 1: 61%|██████ | 7564/12384 [16:03:09<10:11:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 1: 61%|██████ | 7564/12384 [16:03:16<10:11:06, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 1: 61%|██████ | 7565/12384 [16:03:16<10:10:13, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 1: 61%|██████ | 7565/12384 [16:03:24<10:10:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 61%|██████ | 7566/12384 [16:03:24<10:10:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 61%|██████ | 7566/12384 [16:03:31<10:10:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 61%|██████ | 7567/12384 [16:03:31<10:10:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 61%|██████ | 7567/12384 [16:03:39<10:10:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 61%|██████ | 7568/12384 [16:03:39<10:10:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 61%|██████ | 7568/12384 [16:03:47<10:10:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 1: 61%|██████ | 7569/12384 [16:03:47<10:10:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 1: 61%|██████ | 7569/12384 [16:03:54<10:10:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 1: 61%|██████ | 7570/12384 [16:03:54<10:10:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 1: 61%|██████ | 7570/12384 [16:04:02<10:10:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 61%|██████ | 7571/12384 [16:04:02<10:10:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 61%|██████ | 7571/12384 [16:04:09<10:10:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 61%|██████ | 7572/12384 [16:04:09<10:09:52, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 61%|██████ | 7572/12384 [16:04:17<10:09:52, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 61%|██████ | 7573/12384 [16:04:17<10:09:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 61%|██████ | 7573/12384 [16:04:25<10:09:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 61%|██████ | 7574/12384 [16:04:25<10:09:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 61%|██████ | 7574/12384 [16:04:32<10:09:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 61%|██████ | 7575/12384 [16:04:32<10:09:17, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 61%|██████ | 7575/12384 [16:04:40<10:09:17, 7.60s/it, loss=0.0003, acc=1.0000, iter_time=8.05s]
Epoch 1: 61%|██████ | 7576/12384 [16:04:40<10:16:40, 7.70s/it, loss=0.0003, acc=1.0000, iter_time=8.05s]
Epoch 1: 61%|██████ | 7576/12384 [16:04:48<10:16:40, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.45s]
Epoch 1: 61%|██████ | 7577/12384 [16:04:48<10:14:30, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.45s]
Epoch 1: 61%|██████ | 7577/12384 [16:04:55<10:14:30, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=3.60s]
Epoch 1: 61%|██████ | 7578/12384 [16:04:55<10:13:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=3.60s]
Epoch 1: 61%|██████ | 7578/12384 [16:05:03<10:13:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.94s]
Epoch 1: 61%|██████ | 7579/12384 [16:05:03<10:18:51, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=11.94s]
Epoch 1: 61%|██████ | 7579/12384 [16:05:11<10:18:51, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 61%|██████ | 7580/12384 [16:05:11<10:15:43, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 61%|██████ | 7580/12384 [16:05:18<10:15:43, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.80s]
Epoch 1: 61%|██████ | 7581/12384 [16:05:18<10:14:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.80s]
Epoch 1: 61%|██████ | 7581/12384 [16:05:26<10:14:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.43s]
Epoch 1: 61%|██████ | 7582/12384 [16:05:26<10:12:39, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.43s]
Epoch 1: 61%|██████ | 7582/12384 [16:05:34<10:12:39, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 61%|██████ | 7583/12384 [16:05:34<10:11:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 61%|██████ | 7583/12384 [16:05:41<10:11:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 61%|██████ | 7584/12384 [16:05:41<10:11:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 61%|██████ | 7584/12384 [16:05:49<10:11:03, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 1: 61%|██████ | 7585/12384 [16:05:49<10:10:16, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 1: 61%|██████ | 7585/12384 [16:05:57<10:10:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 1: 61%|██████▏ | 7586/12384 [16:05:57<10:09:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 1: 61%|██████▏ | 7586/12384 [16:06:04<10:09:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 1: 61%|██████▏ | 7587/12384 [16:06:04<10:09:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 1: 61%|██████▏ | 7587/12384 [16:06:12<10:09:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 1: 61%|██████▏ | 7588/12384 [16:06:12<10:08:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 1: 61%|██████▏ | 7588/12384 [16:06:19<10:08:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 1: 61%|██████▏ | 7589/12384 [16:06:19<10:09:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 1: 61%|██████▏ | 7589/12384 [16:06:27<10:09:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 61%|██████▏ | 7590/12384 [16:06:27<10:09:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 61%|██████▏ | 7590/12384 [16:06:35<10:09:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 1: 61%|██████▏ | 7591/12384 [16:06:35<10:09:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 1: 61%|██████▏ | 7591/12384 [16:06:42<10:09:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.28s]
Epoch 1: 61%|██████▏ | 7592/12384 [16:06:42<10:08:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.28s]
Epoch 1: 61%|██████▏ | 7592/12384 [16:06:50<10:08:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 61%|██████▏ | 7593/12384 [16:06:50<10:08:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 61%|██████▏ | 7593/12384 [16:06:57<10:08:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 61%|██████▏ | 7594/12384 [16:06:57<10:07:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 61%|██████▏ | 7594/12384 [16:07:05<10:07:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 1: 61%|██████▏ | 7595/12384 [16:07:05<10:07:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 1: 61%|██████▏ | 7595/12384 [16:07:13<10:07:30, 7.61s/it, loss=0.0004, acc=0.9988, iter_time=7.60s]
Epoch 1: 61%|██████▏ | 7596/12384 [16:07:13<10:06:54, 7.61s/it, loss=0.0004, acc=0.9988, iter_time=7.60s]
Epoch 1: 61%|██████▏ | 7596/12384 [16:07:20<10:06:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 1: 61%|██████▏ | 7597/12384 [16:07:20<10:06:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 1: 61%|██████▏ | 7597/12384 [16:07:28<10:06:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 61%|██████▏ | 7598/12384 [16:07:28<10:06:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 61%|██████▏ | 7598/12384 [16:07:35<10:06:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 61%|██████▏ | 7599/12384 [16:07:35<10:06:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 61%|██████▏ | 7599/12384 [16:07:43<10:06:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 61%|██████▏ | 7600/12384 [16:07:43<10:06:08, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 61%|██████▏ | 7600/12384 [16:07:51<10:06:08, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 1: 61%|██████▏ | 7601/12384 [16:07:51<10:06:01, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 1: 61%|██████▏ | 7601/12384 [16:07:59<10:06:01, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 1: 61%|██████▏ | 7602/12384 [16:07:59<10:13:45, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 1: 61%|██████▏ | 7602/12384 [16:08:06<10:13:45, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 61%|██████▏ | 7603/12384 [16:08:06<10:11:17, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 61%|██████▏ | 7603/12384 [16:08:14<10:11:17, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 1: 61%|██████▏ | 7604/12384 [16:08:14<10:09:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 1: 61%|██████▏ | 7604/12384 [16:08:22<10:09:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 61%|██████▏ | 7605/12384 [16:08:22<10:14:31, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 61%|██████▏ | 7605/12384 [16:08:29<10:14:31, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 1: 61%|██████▏ | 7606/12384 [16:08:29<10:12:19, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 1: 61%|██████▏ | 7606/12384 [16:08:37<10:12:19, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.46s]
Epoch 1: 61%|██████▏ | 7607/12384 [16:08:37<10:09:52, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.46s]
Epoch 1: 61%|██████▏ | 7607/12384 [16:08:45<10:09:52, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.08s]
Epoch 1: 61%|██████▏ | 7608/12384 [16:08:45<10:08:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.08s]
Epoch 1: 61%|██████▏ | 7608/12384 [16:08:52<10:08:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 61%|██████▏ | 7609/12384 [16:08:52<10:07:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 61%|██████▏ | 7609/12384 [16:09:00<10:07:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 61%|██████▏ | 7610/12384 [16:09:00<10:07:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 61%|██████▏ | 7610/12384 [16:09:07<10:07:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 61%|██████▏ | 7611/12384 [16:09:07<10:06:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 61%|██████▏ | 7611/12384 [16:09:15<10:06:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 61%|██████▏ | 7612/12384 [16:09:15<10:07:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 61%|██████▏ | 7612/12384 [16:09:23<10:07:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 61%|██████▏ | 7613/12384 [16:09:23<10:06:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 61%|██████▏ | 7613/12384 [16:09:30<10:06:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 61%|██████▏ | 7614/12384 [16:09:30<10:05:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 61%|██████▏ | 7614/12384 [16:09:38<10:05:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 61%|██████▏ | 7615/12384 [16:09:38<10:05:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 61%|██████▏ | 7615/12384 [16:09:45<10:05:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.35s]
Epoch 1: 61%|██████▏ | 7616/12384 [16:09:46<10:10:23, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.35s]
Epoch 1: 61%|██████▏ | 7616/12384 [16:09:53<10:10:23, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.27s]
Epoch 1: 62%|██████▏ | 7617/12384 [16:09:53<10:08:47, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.27s]
Epoch 1: 62%|██████▏ | 7617/12384 [16:10:01<10:08:47, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.75s]
Epoch 1: 62%|██████▏ | 7618/12384 [16:10:01<10:07:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.75s]
Epoch 1: 62%|██████▏ | 7618/12384 [16:10:09<10:07:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 1: 62%|██████▏ | 7619/12384 [16:10:09<10:07:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 1: 62%|██████▏ | 7619/12384 [16:10:16<10:07:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 1: 62%|██████▏ | 7620/12384 [16:10:16<10:06:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 1: 62%|██████▏ | 7620/12384 [16:10:24<10:06:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 62%|██████▏ | 7621/12384 [16:10:24<10:05:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 62%|██████▏ | 7621/12384 [16:10:31<10:05:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 62%|██████▏ | 7622/12384 [16:10:31<10:04:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 62%|██████▏ | 7622/12384 [16:10:39<10:04:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 62%|██████▏ | 7623/12384 [16:10:39<10:04:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 62%|██████▏ | 7623/12384 [16:10:47<10:04:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 62%|██████▏ | 7624/12384 [16:10:47<10:04:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 62%|██████▏ | 7624/12384 [16:10:54<10:04:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 62%|██████▏ | 7625/12384 [16:10:54<10:04:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 62%|██████▏ | 7625/12384 [16:11:02<10:04:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 62%|██████▏ | 7626/12384 [16:11:02<10:03:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 62%|██████▏ | 7626/12384 [16:11:09<10:03:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 62%|██████▏ | 7627/12384 [16:11:09<10:03:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 62%|██████▏ | 7627/12384 [16:11:17<10:03:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 62%|██████▏ | 7628/12384 [16:11:17<10:02:44, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 62%|██████▏ | 7628/12384 [16:11:25<10:02:44, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 1: 62%|██████▏ | 7629/12384 [16:11:25<10:10:42, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 1: 62%|██████▏ | 7629/12384 [16:11:33<10:10:42, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 1: 62%|██████▏ | 7630/12384 [16:11:33<10:07:49, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 1: 62%|██████▏ | 7630/12384 [16:11:40<10:07:49, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 1: 62%|██████▏ | 7631/12384 [16:11:40<10:06:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 1: 62%|██████▏ | 7631/12384 [16:11:48<10:06:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 62%|██████▏ | 7632/12384 [16:11:48<10:05:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 62%|██████▏ | 7632/12384 [16:11:55<10:05:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 62%|██████▏ | 7633/12384 [16:11:55<10:04:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 62%|██████▏ | 7633/12384 [16:12:03<10:04:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 62%|██████▏ | 7634/12384 [16:12:03<10:04:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 62%|██████▏ | 7634/12384 [16:12:11<10:04:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 1: 62%|██████▏ | 7635/12384 [16:12:11<10:03:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 1: 62%|██████▏ | 7635/12384 [16:12:18<10:03:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 62%|██████▏ | 7636/12384 [16:12:18<10:03:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 62%|██████▏ | 7636/12384 [16:12:26<10:03:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 62%|██████▏ | 7637/12384 [16:12:26<10:02:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 62%|██████▏ | 7637/12384 [16:12:34<10:02:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 62%|██████▏ | 7638/12384 [16:12:34<10:03:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 62%|██████▏ | 7638/12384 [16:12:41<10:03:53, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 1: 62%|██████▏ | 7639/12384 [16:12:41<10:02:42, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 1: 62%|██████▏ | 7639/12384 [16:12:49<10:02:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 62%|██████▏ | 7640/12384 [16:12:49<10:02:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 62%|██████▏ | 7640/12384 [16:12:56<10:02:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 62%|██████▏ | 7641/12384 [16:12:56<10:01:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 62%|██████▏ | 7641/12384 [16:13:04<10:01:35, 7.61s/it, loss=0.0002, acc=0.9999, iter_time=7.60s]
Epoch 1: 62%|██████▏ | 7642/12384 [16:13:04<10:01:20, 7.61s/it, loss=0.0002, acc=0.9999, iter_time=7.60s]
Epoch 1: 62%|██████▏ | 7642/12384 [16:13:12<10:01:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 1: 62%|██████▏ | 7643/12384 [16:13:12<10:01:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 1: 62%|██████▏ | 7643/12384 [16:13:19<10:01:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 1: 62%|██████▏ | 7644/12384 [16:13:19<10:01:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 1: 62%|██████▏ | 7644/12384 [16:13:27<10:01:14, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.90s]
Epoch 1: 62%|██████▏ | 7645/12384 [16:13:27<10:01:20, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.90s]
Epoch 1: 62%|██████▏ | 7645/12384 [16:13:34<10:01:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 1: 62%|██████▏ | 7646/12384 [16:13:34<10:00:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 1: 62%|██████▏ | 7646/12384 [16:13:42<10:00:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 1: 62%|██████▏ | 7647/12384 [16:13:42<10:00:10, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 1: 62%|██████▏ | 7647/12384 [16:13:50<10:00:10, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.91s]
Epoch 1: 62%|██████▏ | 7648/12384 [16:13:50<10:00:05, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.91s]
Epoch 1: 62%|██████▏ | 7648/12384 [16:13:57<10:00:05, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.62s]
Epoch 1: 62%|██████▏ | 7649/12384 [16:13:57<10:00:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.62s]
Epoch 1: 62%|██████▏ | 7649/12384 [16:14:05<10:00:13, 7.61s/it, loss=0.0007, acc=0.9965, iter_time=7.02s]
Epoch 1: 62%|██████▏ | 7650/12384 [16:14:05<10:00:27, 7.61s/it, loss=0.0007, acc=0.9965, iter_time=7.02s]
Epoch 1: 62%|██████▏ | 7650/12384 [16:14:12<10:00:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 62%|██████▏ | 7651/12384 [16:14:12<10:00:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 62%|██████▏ | 7651/12384 [16:14:20<10:00:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.72s]
Epoch 1: 62%|██████▏ | 7652/12384 [16:14:20<10:00:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.72s]
Epoch 1: 62%|██████▏ | 7652/12384 [16:14:28<10:00:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 1: 62%|██████▏ | 7653/12384 [16:14:28<10:00:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 1: 62%|██████▏ | 7653/12384 [16:14:35<10:00:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.93s]
Epoch 1: 62%|██████▏ | 7654/12384 [16:14:35<10:00:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.93s]
Epoch 1: 62%|██████▏ | 7654/12384 [16:14:43<10:00:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.37s]
Epoch 1: 62%|██████▏ | 7655/12384 [16:14:43<10:07:28, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.37s]
Epoch 1: 62%|██████▏ | 7655/12384 [16:14:51<10:07:28, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=11.88s]
Epoch 1: 62%|██████▏ | 7656/12384 [16:14:51<10:12:04, 7.77s/it, loss=0.0001, acc=1.0000, iter_time=11.88s]
Epoch 1: 62%|██████▏ | 7656/12384 [16:14:59<10:12:04, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 1: 62%|██████▏ | 7657/12384 [16:14:59<10:08:19, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 1: 62%|██████▏ | 7657/12384 [16:15:06<10:08:19, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 1: 62%|██████▏ | 7658/12384 [16:15:06<10:05:47, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 1: 62%|██████▏ | 7658/12384 [16:15:14<10:05:47, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 62%|██████▏ | 7659/12384 [16:15:14<10:03:13, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 62%|██████▏ | 7659/12384 [16:15:22<10:03:13, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 62%|██████▏ | 7660/12384 [16:15:22<10:01:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 62%|██████▏ | 7660/12384 [16:15:29<10:01:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 62%|██████▏ | 7661/12384 [16:15:29<10:00:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 62%|██████▏ | 7661/12384 [16:15:37<10:00:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 1: 62%|██████▏ | 7662/12384 [16:15:37<10:00:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 1: 62%|██████▏ | 7662/12384 [16:15:44<10:00:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 1: 62%|██████▏ | 7663/12384 [16:15:44<9:59:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 1: 62%|██████▏ | 7663/12384 [16:15:52<9:59:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 62%|██████▏ | 7664/12384 [16:15:52<10:00:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 62%|██████▏ | 7664/12384 [16:16:00<10:00:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 62%|██████▏ | 7665/12384 [16:16:00<10:00:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 62%|██████▏ | 7665/12384 [16:16:07<10:00:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 62%|██████▏ | 7666/12384 [16:16:07<9:59:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 62%|██████▏ | 7666/12384 [16:16:15<9:59:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.58s]
Epoch 1: 62%|██████▏ | 7667/12384 [16:16:15<9:59:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.58s]
Epoch 1: 62%|██████▏ | 7667/12384 [16:16:23<9:59:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 62%|██████▏ | 7668/12384 [16:16:23<9:59:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 62%|██████▏ | 7668/12384 [16:16:30<9:59:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 1: 62%|██████▏ | 7669/12384 [16:16:30<9:59:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 1: 62%|██████▏ | 7669/12384 [16:16:38<9:59:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 62%|██████▏ | 7670/12384 [16:16:38<9:58:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 62%|██████▏ | 7670/12384 [16:16:45<9:58:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 62%|██████▏ | 7671/12384 [16:16:45<9:58:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 62%|██████▏ | 7671/12384 [16:16:53<9:58:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 62%|██████▏ | 7672/12384 [16:16:53<9:58:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 62%|██████▏ | 7672/12384 [16:17:01<9:58:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 1: 62%|██████▏ | 7673/12384 [16:17:01<9:57:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 1: 62%|██████▏ | 7673/12384 [16:17:08<9:57:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 1: 62%|██████▏ | 7674/12384 [16:17:08<9:57:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 1: 62%|██████▏ | 7674/12384 [16:17:16<9:57:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 62%|██████▏ | 7675/12384 [16:17:16<9:57:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 62%|██████▏ | 7675/12384 [16:17:23<9:57:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 62%|██████▏ | 7676/12384 [16:17:23<9:57:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 62%|██████▏ | 7676/12384 [16:17:31<9:57:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 1: 62%|██████▏ | 7677/12384 [16:17:31<9:57:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 1: 62%|██████▏ | 7677/12384 [16:17:39<9:57:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 1: 62%|██████▏ | 7678/12384 [16:17:39<9:57:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 1: 62%|██████▏ | 7678/12384 [16:17:46<9:57:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 62%|██████▏ | 7679/12384 [16:17:46<9:56:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 62%|██████▏ | 7679/12384 [16:17:54<9:56:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 62%|██████▏ | 7680/12384 [16:17:54<9:56:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 62%|██████▏ | 7680/12384 [16:18:02<9:56:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.14s]
Epoch 1: 62%|██████▏ | 7681/12384 [16:18:02<10:03:54, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.14s]
Epoch 1: 62%|██████▏ | 7681/12384 [16:18:10<10:03:54, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 1: 62%|██████▏ | 7682/12384 [16:18:10<10:07:59, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 1: 62%|██████▏ | 7682/12384 [16:18:17<10:07:59, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 62%|██████▏ | 7683/12384 [16:18:17<10:04:32, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 62%|██████▏ | 7683/12384 [16:18:25<10:04:32, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 62%|██████▏ | 7684/12384 [16:18:25<10:02:14, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 62%|██████▏ | 7684/12384 [16:18:33<10:02:14, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 62%|██████▏ | 7685/12384 [16:18:33<10:00:06, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 62%|██████▏ | 7685/12384 [16:18:40<10:00:06, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=6.68s]
Epoch 1: 62%|██████▏ | 7686/12384 [16:18:40<9:59:02, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=6.68s]
Epoch 1: 62%|██████▏ | 7686/12384 [16:18:48<9:59:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 1: 62%|██████▏ | 7687/12384 [16:18:48<9:57:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 1: 62%|██████▏ | 7687/12384 [16:18:55<9:57:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 62%|██████▏ | 7688/12384 [16:18:55<9:56:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 62%|██████▏ | 7688/12384 [16:19:03<9:56:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 62%|██████▏ | 7689/12384 [16:19:03<9:58:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 62%|██████▏ | 7689/12384 [16:19:11<9:58:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 1: 62%|██████▏ | 7690/12384 [16:19:11<9:57:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 1: 62%|██████▏ | 7690/12384 [16:19:18<9:57:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 1: 62%|██████▏ | 7691/12384 [16:19:18<9:56:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 1: 62%|██████▏ | 7691/12384 [16:19:26<9:56:21, 7.62s/it, loss=0.0007, acc=0.9989, iter_time=8.15s]
Epoch 1: 62%|██████▏ | 7692/12384 [16:19:26<9:55:57, 7.62s/it, loss=0.0007, acc=0.9989, iter_time=8.15s]
Epoch 1: 62%|██████▏ | 7692/12384 [16:19:34<9:55:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 62%|██████▏ | 7693/12384 [16:19:34<9:57:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 62%|██████▏ | 7693/12384 [16:19:41<9:57:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 62%|██████▏ | 7694/12384 [16:19:41<9:56:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 62%|██████▏ | 7694/12384 [16:19:49<9:56:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 62%|██████▏ | 7695/12384 [16:19:49<9:55:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 62%|██████▏ | 7695/12384 [16:19:56<9:55:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 62%|██████▏ | 7696/12384 [16:19:56<9:55:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 62%|██████▏ | 7696/12384 [16:20:04<9:55:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 62%|██████▏ | 7697/12384 [16:20:04<9:54:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 62%|██████▏ | 7697/12384 [16:20:12<9:54:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 62%|██████▏ | 7698/12384 [16:20:12<9:55:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 62%|██████▏ | 7698/12384 [16:20:19<9:55:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 1: 62%|██████▏ | 7699/12384 [16:20:19<9:55:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 1: 62%|██████▏ | 7699/12384 [16:20:27<9:55:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 1: 62%|██████▏ | 7700/12384 [16:20:27<9:55:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 1: 62%|██████▏ | 7700/12384 [16:20:34<9:55:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 1: 62%|██████▏ | 7701/12384 [16:20:34<9:54:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 1: 62%|██████▏ | 7701/12384 [16:20:42<9:54:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 1: 62%|██████▏ | 7702/12384 [16:20:42<9:53:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 1: 62%|██████▏ | 7702/12384 [16:20:50<9:53:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 1: 62%|██████▏ | 7703/12384 [16:20:50<9:53:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 1: 62%|██████▏ | 7703/12384 [16:20:57<9:53:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 62%|██████▏ | 7704/12384 [16:20:57<9:53:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 62%|██████▏ | 7704/12384 [16:21:05<9:53:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.04s]
Epoch 1: 62%|██████▏ | 7705/12384 [16:21:05<9:53:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.04s]
Epoch 1: 62%|██████▏ | 7705/12384 [16:21:12<9:53:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.22s]
Epoch 1: 62%|██████▏ | 7706/12384 [16:21:12<9:53:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.22s]
Epoch 1: 62%|██████▏ | 7706/12384 [16:21:20<9:53:09, 7.61s/it, loss=0.0006, acc=0.9983, iter_time=5.35s]
Epoch 1: 62%|██████▏ | 7707/12384 [16:21:20<10:00:27, 7.70s/it, loss=0.0006, acc=0.9983, iter_time=5.35s]
Epoch 1: 62%|██████▏ | 7707/12384 [16:21:28<10:00:27, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.51s]
Epoch 1: 62%|██████▏ | 7708/12384 [16:21:28<10:05:24, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=10.51s]
Epoch 1: 62%|██████▏ | 7708/12384 [16:21:36<10:05:24, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 1: 62%|██████▏ | 7709/12384 [16:21:36<10:01:00, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 1: 62%|██████▏ | 7709/12384 [16:21:44<10:01:00, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.44s]
Epoch 1: 62%|██████▏ | 7710/12384 [16:21:44<9:58:06, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.44s]
Epoch 1: 62%|██████▏ | 7710/12384 [16:21:51<9:58:06, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 1: 62%|██████▏ | 7711/12384 [16:21:51<9:56:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 1: 62%|██████▏ | 7711/12384 [16:21:59<9:56:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 62%|██████▏ | 7712/12384 [16:21:59<9:55:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 62%|██████▏ | 7712/12384 [16:22:06<9:55:29, 7.65s/it, loss=0.0005, acc=0.9984, iter_time=7.20s]
Epoch 1: 62%|██████▏ | 7713/12384 [16:22:06<9:56:16, 7.66s/it, loss=0.0005, acc=0.9984, iter_time=7.20s]
Epoch 1: 62%|██████▏ | 7713/12384 [16:22:14<9:56:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 62%|██████▏ | 7714/12384 [16:22:14<9:55:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 62%|██████▏ | 7714/12384 [16:22:22<9:55:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 62%|██████▏ | 7715/12384 [16:22:22<9:54:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 62%|██████▏ | 7715/12384 [16:22:29<9:54:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 62%|██████▏ | 7716/12384 [16:22:29<9:53:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 62%|██████▏ | 7716/12384 [16:22:37<9:53:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 62%|██████▏ | 7717/12384 [16:22:37<9:52:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 62%|██████▏ | 7717/12384 [16:22:44<9:52:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 62%|██████▏ | 7718/12384 [16:22:44<9:52:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 62%|██████▏ | 7718/12384 [16:22:52<9:52:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 62%|██████▏ | 7719/12384 [16:22:52<9:52:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 62%|██████▏ | 7719/12384 [16:23:00<9:52:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 62%|██████▏ | 7720/12384 [16:23:00<9:51:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 62%|██████▏ | 7720/12384 [16:23:07<9:51:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.26s]
Epoch 1: 62%|██████▏ | 7721/12384 [16:23:07<9:51:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.26s]
Epoch 1: 62%|██████▏ | 7721/12384 [16:23:15<9:51:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.47s]
Epoch 1: 62%|██████▏ | 7722/12384 [16:23:15<9:50:35, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.47s]
Epoch 1: 62%|██████▏ | 7722/12384 [16:23:22<9:50:35, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 1: 62%|██████▏ | 7723/12384 [16:23:22<9:50:23, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 1: 62%|██████▏ | 7723/12384 [16:23:30<9:50:23, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 1: 62%|██████▏ | 7724/12384 [16:23:30<9:49:49, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 1: 62%|██████▏ | 7724/12384 [16:23:38<9:49:49, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=5.16s]
Epoch 1: 62%|██████▏ | 7725/12384 [16:23:38<9:50:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.16s]
Epoch 1: 62%|██████▏ | 7725/12384 [16:23:45<9:50:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.68s]
Epoch 1: 62%|██████▏ | 7726/12384 [16:23:45<9:50:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.68s]
Epoch 1: 62%|██████▏ | 7726/12384 [16:23:53<9:50:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 1: 62%|██████▏ | 7727/12384 [16:23:53<9:50:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 1: 62%|██████▏ | 7727/12384 [16:24:01<9:50:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 62%|██████▏ | 7728/12384 [16:24:01<9:50:04, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 62%|██████▏ | 7728/12384 [16:24:08<9:50:04, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 62%|██████▏ | 7729/12384 [16:24:08<9:50:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 62%|██████▏ | 7729/12384 [16:24:16<9:50:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 62%|██████▏ | 7730/12384 [16:24:16<9:49:53, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 62%|██████▏ | 7730/12384 [16:24:23<9:49:53, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 62%|██████▏ | 7731/12384 [16:24:23<9:49:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 62%|██████▏ | 7731/12384 [16:24:31<9:49:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 62%|██████▏ | 7732/12384 [16:24:31<9:50:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 62%|██████▏ | 7732/12384 [16:24:39<9:50:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 62%|██████▏ | 7733/12384 [16:24:39<9:58:27, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 62%|██████▏ | 7733/12384 [16:24:47<9:58:27, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 1: 62%|██████▏ | 7734/12384 [16:24:47<10:02:02, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 1: 62%|██████▏ | 7734/12384 [16:24:54<10:02:02, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 62%|██████▏ | 7735/12384 [16:24:54<9:58:01, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 62%|██████▏ | 7735/12384 [16:25:02<9:58:01, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 62%|██████▏ | 7736/12384 [16:25:02<9:55:16, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 62%|██████▏ | 7736/12384 [16:25:10<9:55:16, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 1: 62%|██████▏ | 7737/12384 [16:25:10<9:53:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 1: 62%|██████▏ | 7737/12384 [16:25:17<9:53:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 1: 62%|██████▏ | 7738/12384 [16:25:17<9:52:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 1: 62%|██████▏ | 7738/12384 [16:25:25<9:52:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 62%|██████▏ | 7739/12384 [16:25:25<9:52:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 62%|██████▏ | 7739/12384 [16:25:32<9:52:05, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=6.42s]
Epoch 1: 62%|██████▎ | 7740/12384 [16:25:32<9:51:02, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.42s]
Epoch 1: 62%|██████▎ | 7740/12384 [16:25:40<9:51:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 63%|██████▎ | 7741/12384 [16:25:40<9:50:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 63%|██████▎ | 7741/12384 [16:25:48<9:50:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 63%|██████▎ | 7742/12384 [16:25:48<9:49:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 63%|██████▎ | 7742/12384 [16:25:55<9:49:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 63%|██████▎ | 7743/12384 [16:25:55<9:49:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 63%|██████▎ | 7743/12384 [16:26:03<9:49:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 63%|██████▎ | 7744/12384 [16:26:03<9:48:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 63%|██████▎ | 7744/12384 [16:26:11<9:48:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.15s]
Epoch 1: 63%|██████▎ | 7745/12384 [16:26:11<9:48:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.15s]
Epoch 1: 63%|██████▎ | 7745/12384 [16:26:18<9:48:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 1: 63%|██████▎ | 7746/12384 [16:26:18<9:48:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 1: 63%|██████▎ | 7746/12384 [16:26:26<9:48:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 1: 63%|██████▎ | 7747/12384 [16:26:26<9:50:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 1: 63%|██████▎ | 7747/12384 [16:26:33<9:50:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 1: 63%|██████▎ | 7748/12384 [16:26:33<9:49:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 1: 63%|██████▎ | 7748/12384 [16:26:41<9:49:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.08s]
Epoch 1: 63%|██████▎ | 7749/12384 [16:26:41<9:49:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.08s]
Epoch 1: 63%|██████▎ | 7749/12384 [16:26:49<9:49:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 63%|██████▎ | 7750/12384 [16:26:49<9:48:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 63%|██████▎ | 7750/12384 [16:26:56<9:48:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 1: 63%|██████▎ | 7751/12384 [16:26:56<9:48:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 1: 63%|██████▎ | 7751/12384 [16:27:04<9:48:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 63%|██████▎ | 7752/12384 [16:27:04<9:48:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 63%|██████▎ | 7752/12384 [16:27:12<9:48:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 63%|██████▎ | 7753/12384 [16:27:12<9:47:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 63%|██████▎ | 7753/12384 [16:27:19<9:47:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 63%|██████▎ | 7754/12384 [16:27:19<9:48:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 63%|██████▎ | 7754/12384 [16:27:27<9:48:22, 7.62s/it, loss=0.0002, acc=0.9975, iter_time=7.61s]
Epoch 1: 63%|██████▎ | 7755/12384 [16:27:27<9:48:05, 7.62s/it, loss=0.0002, acc=0.9975, iter_time=7.61s]
Epoch 1: 63%|██████▎ | 7755/12384 [16:27:34<9:48:05, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.33s]
Epoch 1: 63%|██████▎ | 7756/12384 [16:27:34<9:47:59, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.33s]
Epoch 1: 63%|██████▎ | 7756/12384 [16:27:42<9:47:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 63%|██████▎ | 7757/12384 [16:27:42<9:49:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 63%|██████▎ | 7757/12384 [16:27:50<9:49:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 63%|██████▎ | 7758/12384 [16:27:50<9:50:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 63%|██████▎ | 7758/12384 [16:27:57<9:50:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 63%|██████▎ | 7759/12384 [16:27:57<9:48:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 63%|██████▎ | 7759/12384 [16:28:05<9:48:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 1: 63%|██████▎ | 7760/12384 [16:28:05<9:55:37, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 1: 63%|██████▎ | 7760/12384 [16:28:13<9:55:37, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 1: 63%|██████▎ | 7761/12384 [16:28:13<9:52:53, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 1: 63%|██████▎ | 7761/12384 [16:28:21<9:52:53, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.59s]
Epoch 1: 63%|██████▎ | 7762/12384 [16:28:21<9:52:28, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.59s]
Epoch 1: 63%|██████▎ | 7762/12384 [16:28:28<9:52:28, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.15s]
Epoch 1: 63%|██████▎ | 7763/12384 [16:28:28<9:50:08, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.15s]
Epoch 1: 63%|██████▎ | 7763/12384 [16:28:36<9:50:08, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.12s]
Epoch 1: 63%|██████▎ | 7764/12384 [16:28:36<9:49:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.12s]
Epoch 1: 63%|██████▎ | 7764/12384 [16:28:43<9:49:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 63%|██████▎ | 7765/12384 [16:28:43<9:47:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 63%|██████▎ | 7765/12384 [16:28:51<9:47:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 63%|██████▎ | 7766/12384 [16:28:51<9:47:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 63%|██████▎ | 7766/12384 [16:28:59<9:47:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 63%|██████▎ | 7767/12384 [16:28:59<9:46:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 63%|██████▎ | 7767/12384 [16:29:06<9:46:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 63%|██████▎ | 7768/12384 [16:29:06<9:46:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 63%|██████▎ | 7768/12384 [16:29:14<9:46:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 63%|██████▎ | 7769/12384 [16:29:14<9:45:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 63%|██████▎ | 7769/12384 [16:29:22<9:45:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 1: 63%|██████▎ | 7770/12384 [16:29:22<9:45:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 1: 63%|██████▎ | 7770/12384 [16:29:29<9:45:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.58s]
Epoch 1: 63%|██████▎ | 7771/12384 [16:29:29<9:44:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.58s]
Epoch 1: 63%|██████▎ | 7771/12384 [16:29:37<9:44:58, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.14s]
Epoch 1: 63%|██████▎ | 7772/12384 [16:29:37<9:44:46, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.14s]
Epoch 1: 63%|██████▎ | 7772/12384 [16:29:44<9:44:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 63%|██████▎ | 7773/12384 [16:29:44<9:44:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 63%|██████▎ | 7773/12384 [16:29:52<9:44:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.50s]
Epoch 1: 63%|██████▎ | 7774/12384 [16:29:52<9:44:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.50s]
Epoch 1: 63%|██████▎ | 7774/12384 [16:30:00<9:44:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 1: 63%|██████▎ | 7775/12384 [16:30:00<9:44:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 1: 63%|██████▎ | 7775/12384 [16:30:07<9:44:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 63%|██████▎ | 7776/12384 [16:30:07<9:44:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 63%|██████▎ | 7776/12384 [16:30:15<9:44:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 63%|██████▎ | 7777/12384 [16:30:15<9:44:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 63%|██████▎ | 7777/12384 [16:30:22<9:44:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 1: 63%|██████▎ | 7778/12384 [16:30:22<9:44:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 1: 63%|██████▎ | 7778/12384 [16:30:30<9:44:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 63%|██████▎ | 7779/12384 [16:30:30<9:43:34, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 63%|██████▎ | 7779/12384 [16:30:38<9:43:34, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 63%|██████▎ | 7780/12384 [16:30:38<9:43:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 63%|██████▎ | 7780/12384 [16:30:45<9:43:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 1: 63%|██████▎ | 7781/12384 [16:30:45<9:43:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 1: 63%|██████▎ | 7781/12384 [16:30:53<9:43:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 63%|██████▎ | 7782/12384 [16:30:53<9:43:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 63%|██████▎ | 7782/12384 [16:31:00<9:43:19, 7.61s/it, loss=0.0004, acc=0.9983, iter_time=7.62s]
Epoch 1: 63%|██████▎ | 7783/12384 [16:31:00<9:43:31, 7.61s/it, loss=0.0004, acc=0.9983, iter_time=7.62s]
Epoch 1: 63%|██████▎ | 7783/12384 [16:31:08<9:43:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 63%|██████▎ | 7784/12384 [16:31:08<9:43:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 63%|██████▎ | 7784/12384 [16:31:16<9:43:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 63%|██████▎ | 7785/12384 [16:31:16<9:43:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 63%|██████▎ | 7785/12384 [16:31:24<9:43:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 63%|██████▎ | 7786/12384 [16:31:24<9:51:31, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 63%|██████▎ | 7786/12384 [16:31:31<9:51:31, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 63%|██████▎ | 7787/12384 [16:31:31<9:49:07, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 63%|██████▎ | 7787/12384 [16:31:39<9:49:07, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 63%|██████▎ | 7788/12384 [16:31:39<9:47:48, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 63%|██████▎ | 7788/12384 [16:31:46<9:47:48, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 63%|██████▎ | 7789/12384 [16:31:46<9:46:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 63%|██████▎ | 7789/12384 [16:31:54<9:46:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 63%|██████▎ | 7790/12384 [16:31:54<9:45:25, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 63%|██████▎ | 7790/12384 [16:32:02<9:45:25, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 1: 63%|██████▎ | 7791/12384 [16:32:02<9:44:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 1: 63%|██████▎ | 7791/12384 [16:32:09<9:44:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.31s]
Epoch 1: 63%|██████▎ | 7792/12384 [16:32:09<9:44:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.31s]
Epoch 1: 63%|██████▎ | 7792/12384 [16:32:17<9:44:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 63%|██████▎ | 7793/12384 [16:32:17<9:43:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 63%|██████▎ | 7793/12384 [16:32:25<9:43:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 1: 63%|██████▎ | 7794/12384 [16:32:25<9:43:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 1: 63%|██████▎ | 7794/12384 [16:32:32<9:43:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.50s]
Epoch 1: 63%|██████▎ | 7795/12384 [16:32:32<9:42:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.50s]
Epoch 1: 63%|██████▎ | 7795/12384 [16:32:40<9:42:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 63%|██████▎ | 7796/12384 [16:32:40<9:41:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 63%|██████▎ | 7796/12384 [16:32:47<9:41:44, 7.61s/it, loss=0.0001, acc=0.9997, iter_time=5.80s]
Epoch 1: 63%|██████▎ | 7797/12384 [16:32:47<9:41:15, 7.60s/it, loss=0.0001, acc=0.9997, iter_time=5.80s]
Epoch 1: 63%|██████▎ | 7797/12384 [16:32:55<9:41:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 63%|██████▎ | 7798/12384 [16:32:55<9:41:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 63%|██████▎ | 7798/12384 [16:33:03<9:41:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 1: 63%|██████▎ | 7799/12384 [16:33:03<9:41:07, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 1: 63%|██████▎ | 7799/12384 [16:33:10<9:41:07, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 63%|██████▎ | 7800/12384 [16:33:10<9:41:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 63%|██████▎ | 7800/12384 [16:33:18<9:41:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 63%|██████▎ | 7801/12384 [16:33:18<9:42:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 63%|██████▎ | 7801/12384 [16:33:26<9:42:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 1: 63%|██████▎ | 7802/12384 [16:33:26<9:44:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 1: 63%|██████▎ | 7802/12384 [16:33:33<9:44:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 1: 63%|██████▎ | 7803/12384 [16:33:33<9:42:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 1: 63%|██████▎ | 7803/12384 [16:33:41<9:42:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 1: 63%|██████▎ | 7804/12384 [16:33:41<9:41:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 1: 63%|██████▎ | 7804/12384 [16:33:48<9:41:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 1: 63%|██████▎ | 7805/12384 [16:33:48<9:41:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 1: 63%|██████▎ | 7805/12384 [16:33:56<9:41:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 1: 63%|██████▎ | 7806/12384 [16:33:56<9:42:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 1: 63%|██████▎ | 7806/12384 [16:34:04<9:42:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 1: 63%|██████▎ | 7807/12384 [16:34:04<9:41:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 1: 63%|██████▎ | 7807/12384 [16:34:11<9:41:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 1: 63%|██████▎ | 7808/12384 [16:34:11<9:40:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 1: 63%|██████▎ | 7808/12384 [16:34:19<9:40:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 1: 63%|██████▎ | 7809/12384 [16:34:19<9:40:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 1: 63%|██████▎ | 7809/12384 [16:34:26<9:40:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.72s]
Epoch 1: 63%|██████▎ | 7810/12384 [16:34:26<9:39:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.72s]
Epoch 1: 63%|██████▎ | 7810/12384 [16:34:34<9:39:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.86s]
Epoch 1: 63%|██████▎ | 7811/12384 [16:34:34<9:40:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.86s]
Epoch 1: 63%|██████▎ | 7811/12384 [16:34:42<9:40:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.35s]
Epoch 1: 63%|██████▎ | 7812/12384 [16:34:42<9:42:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.35s]
Epoch 1: 63%|██████▎ | 7812/12384 [16:34:50<9:42:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 1: 63%|██████▎ | 7813/12384 [16:34:50<9:49:35, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 1: 63%|██████▎ | 7813/12384 [16:34:57<9:49:35, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 63%|██████▎ | 7814/12384 [16:34:57<9:46:48, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 63%|██████▎ | 7814/12384 [16:35:05<9:46:48, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 63%|██████▎ | 7815/12384 [16:35:05<9:43:51, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 63%|██████▎ | 7815/12384 [16:35:13<9:43:51, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 1: 63%|██████▎ | 7816/12384 [16:35:13<9:42:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 1: 63%|██████▎ | 7816/12384 [16:35:20<9:42:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 1: 63%|██████▎ | 7817/12384 [16:35:20<9:41:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 1: 63%|██████▎ | 7817/12384 [16:35:28<9:41:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 1: 63%|██████▎ | 7818/12384 [16:35:28<9:40:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 1: 63%|██████▎ | 7818/12384 [16:35:35<9:40:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 1: 63%|██████▎ | 7819/12384 [16:35:35<9:40:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 1: 63%|██████▎ | 7819/12384 [16:35:43<9:40:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 1: 63%|██████▎ | 7820/12384 [16:35:43<9:39:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 1: 63%|██████▎ | 7820/12384 [16:35:51<9:39:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 63%|██████▎ | 7821/12384 [16:35:51<9:39:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 63%|██████▎ | 7821/12384 [16:35:58<9:39:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 63%|██████▎ | 7822/12384 [16:35:58<9:38:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 63%|██████▎ | 7822/12384 [16:36:06<9:38:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 63%|██████▎ | 7823/12384 [16:36:06<9:38:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 63%|██████▎ | 7823/12384 [16:36:13<9:38:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 63%|██████▎ | 7824/12384 [16:36:13<9:38:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 63%|██████▎ | 7824/12384 [16:36:21<9:38:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.61s]
Epoch 1: 63%|██████▎ | 7825/12384 [16:36:21<9:38:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.61s]
Epoch 1: 63%|██████▎ | 7825/12384 [16:36:29<9:38:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.23s]
Epoch 1: 63%|██████▎ | 7826/12384 [16:36:29<9:37:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.23s]
Epoch 1: 63%|██████▎ | 7826/12384 [16:36:36<9:37:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 1: 63%|██████▎ | 7827/12384 [16:36:36<9:37:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 1: 63%|██████▎ | 7827/12384 [16:36:44<9:37:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 1: 63%|██████▎ | 7828/12384 [16:36:44<9:39:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 1: 63%|██████▎ | 7828/12384 [16:36:52<9:39:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.42s]
Epoch 1: 63%|██████▎ | 7829/12384 [16:36:52<9:38:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.42s]
Epoch 1: 63%|██████▎ | 7829/12384 [16:36:59<9:38:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.86s]
Epoch 1: 63%|██████▎ | 7830/12384 [16:36:59<9:38:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.86s]
Epoch 1: 63%|██████▎ | 7830/12384 [16:37:07<9:38:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 63%|██████▎ | 7831/12384 [16:37:07<9:38:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 63%|██████▎ | 7831/12384 [16:37:14<9:38:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 63%|██████▎ | 7832/12384 [16:37:14<9:38:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 63%|██████▎ | 7832/12384 [16:37:22<9:38:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 63%|██████▎ | 7833/12384 [16:37:22<9:38:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 63%|██████▎ | 7833/12384 [16:37:30<9:38:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 63%|██████▎ | 7834/12384 [16:37:30<9:37:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 63%|██████▎ | 7834/12384 [16:37:37<9:37:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 1: 63%|██████▎ | 7835/12384 [16:37:37<9:37:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 1: 63%|██████▎ | 7835/12384 [16:37:45<9:37:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.72s]
Epoch 1: 63%|██████▎ | 7836/12384 [16:37:45<9:36:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.72s]
Epoch 1: 63%|██████▎ | 7836/12384 [16:37:53<9:36:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 63%|██████▎ | 7837/12384 [16:37:53<9:38:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 63%|██████▎ | 7837/12384 [16:38:00<9:38:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 63%|██████▎ | 7838/12384 [16:38:00<9:38:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 63%|██████▎ | 7838/12384 [16:38:08<9:38:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 63%|██████▎ | 7839/12384 [16:38:08<9:44:55, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 63%|██████▎ | 7839/12384 [16:38:16<9:44:55, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 63%|██████▎ | 7840/12384 [16:38:16<9:42:32, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 63%|██████▎ | 7840/12384 [16:38:23<9:42:32, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 63%|██████▎ | 7841/12384 [16:38:23<9:40:56, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 63%|██████▎ | 7841/12384 [16:38:31<9:40:56, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.24s]
Epoch 1: 63%|██████▎ | 7842/12384 [16:38:31<9:39:43, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.24s]
Epoch 1: 63%|██████▎ | 7842/12384 [16:38:39<9:39:43, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 1: 63%|██████▎ | 7843/12384 [16:38:39<9:37:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 1: 63%|██████▎ | 7843/12384 [16:38:46<9:37:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 63%|██████▎ | 7844/12384 [16:38:46<9:36:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 63%|██████▎ | 7844/12384 [16:38:54<9:36:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 1: 63%|██████▎ | 7845/12384 [16:38:54<9:38:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 1: 63%|██████▎ | 7845/12384 [16:39:01<9:38:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 63%|██████▎ | 7846/12384 [16:39:01<9:37:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 63%|██████▎ | 7846/12384 [16:39:09<9:37:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 63%|██████▎ | 7847/12384 [16:39:09<9:36:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 63%|██████▎ | 7847/12384 [16:39:17<9:36:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.51s]
Epoch 1: 63%|██████▎ | 7848/12384 [16:39:17<9:35:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.51s]
Epoch 1: 63%|██████▎ | 7848/12384 [16:39:24<9:35:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 63%|██████▎ | 7849/12384 [16:39:24<9:35:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 63%|██████▎ | 7849/12384 [16:39:32<9:35:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 63%|██████▎ | 7850/12384 [16:39:32<9:34:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 63%|██████▎ | 7850/12384 [16:39:39<9:34:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 63%|██████▎ | 7851/12384 [16:39:39<9:35:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 63%|██████▎ | 7851/12384 [16:39:47<9:35:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 1: 63%|██████▎ | 7852/12384 [16:39:47<9:34:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 1: 63%|██████▎ | 7852/12384 [16:39:55<9:34:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 1: 63%|██████▎ | 7853/12384 [16:39:55<9:34:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 1: 63%|██████▎ | 7853/12384 [16:40:02<9:34:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 63%|██████▎ | 7854/12384 [16:40:02<9:34:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 63%|██████▎ | 7854/12384 [16:40:10<9:34:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 63%|██████▎ | 7855/12384 [16:40:10<9:34:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 63%|██████▎ | 7855/12384 [16:40:18<9:34:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 63%|██████▎ | 7856/12384 [16:40:18<9:34:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 63%|██████▎ | 7856/12384 [16:40:25<9:34:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 63%|██████▎ | 7857/12384 [16:40:25<9:33:46, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 63%|██████▎ | 7857/12384 [16:40:33<9:33:46, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 63%|██████▎ | 7858/12384 [16:40:33<9:33:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 63%|██████▎ | 7858/12384 [16:40:40<9:33:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 63%|██████▎ | 7859/12384 [16:40:40<9:33:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 63%|██████▎ | 7859/12384 [16:40:48<9:33:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 63%|██████▎ | 7860/12384 [16:40:48<9:33:24, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 63%|██████▎ | 7860/12384 [16:40:56<9:33:24, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 1: 63%|██████▎ | 7861/12384 [16:40:56<9:33:20, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 1: 63%|██████▎ | 7861/12384 [16:41:03<9:33:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 63%|██████▎ | 7862/12384 [16:41:03<9:33:02, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 63%|██████▎ | 7862/12384 [16:41:11<9:33:02, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 1: 63%|██████▎ | 7863/12384 [16:41:11<9:34:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 1: 63%|██████▎ | 7863/12384 [16:41:18<9:34:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 1: 64%|██████▎ | 7864/12384 [16:41:18<9:33:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 1: 64%|██████▎ | 7864/12384 [16:41:26<9:33:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 64%|██████▎ | 7865/12384 [16:41:26<9:40:39, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 64%|██████▎ | 7865/12384 [16:41:34<9:40:39, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 64%|██████▎ | 7866/12384 [16:41:34<9:38:41, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 64%|██████▎ | 7866/12384 [16:41:42<9:38:41, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 64%|██████▎ | 7867/12384 [16:41:42<9:37:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 64%|██████▎ | 7867/12384 [16:41:49<9:37:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 64%|██████▎ | 7868/12384 [16:41:49<9:36:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 64%|██████▎ | 7868/12384 [16:41:57<9:36:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 64%|██████▎ | 7869/12384 [16:41:57<9:34:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 64%|██████▎ | 7869/12384 [16:42:04<9:34:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 64%|██████▎ | 7870/12384 [16:42:04<9:33:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 64%|██████▎ | 7870/12384 [16:42:12<9:33:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 64%|██████▎ | 7871/12384 [16:42:12<9:33:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 64%|██████▎ | 7871/12384 [16:42:20<9:33:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 64%|██████▎ | 7872/12384 [16:42:20<9:33:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 64%|██████▎ | 7872/12384 [16:42:27<9:33:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 64%|██████▎ | 7873/12384 [16:42:27<9:32:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 64%|██████▎ | 7873/12384 [16:42:35<9:32:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 64%|██████▎ | 7874/12384 [16:42:35<9:32:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 64%|██████▎ | 7874/12384 [16:42:42<9:32:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 1: 64%|██████▎ | 7875/12384 [16:42:42<9:32:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 1: 64%|██████▎ | 7875/12384 [16:42:50<9:32:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.87s]
Epoch 1: 64%|██████▎ | 7876/12384 [16:42:50<9:31:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.87s]
Epoch 1: 64%|██████▎ | 7876/12384 [16:42:58<9:31:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 64%|██████▎ | 7877/12384 [16:42:58<9:32:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 64%|██████▎ | 7877/12384 [16:43:05<9:32:25, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.67s]
Epoch 1: 64%|██████▎ | 7878/12384 [16:43:05<9:32:20, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.67s]
Epoch 1: 64%|██████▎ | 7878/12384 [16:43:13<9:32:20, 7.62s/it, loss=0.0007, acc=0.9982, iter_time=7.61s]
Epoch 1: 64%|██████▎ | 7879/12384 [16:43:13<9:31:44, 7.61s/it, loss=0.0007, acc=0.9982, iter_time=7.61s]
Epoch 1: 64%|██████▎ | 7879/12384 [16:43:21<9:31:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 64%|██████▎ | 7880/12384 [16:43:21<9:31:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 64%|██████▎ | 7880/12384 [16:43:28<9:31:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 64%|██████▎ | 7881/12384 [16:43:28<9:31:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 64%|██████▎ | 7881/12384 [16:43:36<9:31:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 64%|██████▎ | 7882/12384 [16:43:36<9:31:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 64%|██████▎ | 7882/12384 [16:43:43<9:31:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 64%|██████▎ | 7883/12384 [16:43:43<9:30:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 64%|██████▎ | 7883/12384 [16:43:51<9:30:57, 7.61s/it, loss=0.0034, acc=0.9981, iter_time=7.61s]
Epoch 1: 64%|██████▎ | 7884/12384 [16:43:51<9:31:04, 7.61s/it, loss=0.0034, acc=0.9981, iter_time=7.61s]
Epoch 1: 64%|██████▎ | 7884/12384 [16:43:59<9:31:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 64%|██████▎ | 7885/12384 [16:43:59<9:30:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 64%|██████▎ | 7885/12384 [16:44:06<9:30:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 1: 64%|██████▎ | 7886/12384 [16:44:06<9:30:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 1: 64%|██████▎ | 7886/12384 [16:44:14<9:30:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 1: 64%|██████▎ | 7887/12384 [16:44:14<9:29:51, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 1: 64%|██████▎ | 7887/12384 [16:44:21<9:29:51, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 64%|██████▎ | 7888/12384 [16:44:21<9:30:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 64%|██████▎ | 7888/12384 [16:44:29<9:30:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.46s]
Epoch 1: 64%|██████▎ | 7889/12384 [16:44:29<9:29:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.46s]
Epoch 1: 64%|██████▎ | 7889/12384 [16:44:37<9:29:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 1: 64%|██████▎ | 7890/12384 [16:44:37<9:29:12, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 1: 64%|██████▎ | 7890/12384 [16:44:45<9:29:12, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 64%|██████▎ | 7891/12384 [16:44:45<9:37:12, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 64%|██████▎ | 7891/12384 [16:44:52<9:37:12, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 64%|██████▎ | 7892/12384 [16:44:52<9:34:39, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 64%|██████▎ | 7892/12384 [16:45:00<9:34:39, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 64%|██████▎ | 7893/12384 [16:45:00<9:32:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 64%|██████▎ | 7893/12384 [16:45:07<9:32:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 64%|██████▎ | 7894/12384 [16:45:07<9:31:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 64%|██████▎ | 7894/12384 [16:45:15<9:31:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 1: 64%|██████▍ | 7895/12384 [16:45:15<9:30:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 1: 64%|██████▍ | 7895/12384 [16:45:23<9:30:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 64%|██████▍ | 7896/12384 [16:45:23<9:30:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 64%|██████▍ | 7896/12384 [16:45:30<9:30:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 64%|██████▍ | 7897/12384 [16:45:30<9:30:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 64%|██████▍ | 7897/12384 [16:45:38<9:30:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 64%|██████▍ | 7898/12384 [16:45:38<9:29:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 64%|██████▍ | 7898/12384 [16:45:45<9:29:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 64%|██████▍ | 7899/12384 [16:45:45<9:29:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 64%|██████▍ | 7899/12384 [16:45:53<9:29:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 64%|██████▍ | 7900/12384 [16:45:53<9:29:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 64%|██████▍ | 7900/12384 [16:46:01<9:29:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 1: 64%|██████▍ | 7901/12384 [16:46:01<9:29:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 1: 64%|██████▍ | 7901/12384 [16:46:08<9:29:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.29s]
Epoch 1: 64%|██████▍ | 7902/12384 [16:46:08<9:30:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.29s]
Epoch 1: 64%|██████▍ | 7902/12384 [16:46:16<9:30:00, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=10.72s]
Epoch 1: 64%|██████▍ | 7903/12384 [16:46:16<9:29:23, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.72s]
Epoch 1: 64%|██████▍ | 7903/12384 [16:46:24<9:29:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 64%|██████▍ | 7904/12384 [16:46:24<9:28:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 64%|██████▍ | 7904/12384 [16:46:31<9:28:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.35s]
Epoch 1: 64%|██████▍ | 7905/12384 [16:46:31<9:28:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.35s]
Epoch 1: 64%|██████▍ | 7905/12384 [16:46:39<9:28:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.48s]
Epoch 1: 64%|██████▍ | 7906/12384 [16:46:39<9:28:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.48s]
Epoch 1: 64%|██████▍ | 7906/12384 [16:46:46<9:28:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 64%|██████▍ | 7907/12384 [16:46:46<9:28:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 64%|██████▍ | 7907/12384 [16:46:54<9:28:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 64%|██████▍ | 7908/12384 [16:46:54<9:28:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 64%|██████▍ | 7908/12384 [16:47:02<9:28:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 1: 64%|██████▍ | 7909/12384 [16:47:02<9:27:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 1: 64%|██████▍ | 7909/12384 [16:47:09<9:27:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 1: 64%|██████▍ | 7910/12384 [16:47:09<9:27:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 1: 64%|██████▍ | 7910/12384 [16:47:17<9:27:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 64%|██████▍ | 7911/12384 [16:47:17<9:27:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 64%|██████▍ | 7911/12384 [16:47:25<9:27:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 1: 64%|██████▍ | 7912/12384 [16:47:25<9:29:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 1: 64%|██████▍ | 7912/12384 [16:47:32<9:29:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 64%|██████▍ | 7913/12384 [16:47:32<9:29:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 64%|██████▍ | 7913/12384 [16:47:40<9:29:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 64%|██████▍ | 7914/12384 [16:47:40<9:29:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 64%|██████▍ | 7914/12384 [16:47:47<9:29:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 1: 64%|██████▍ | 7915/12384 [16:47:47<9:28:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 1: 64%|██████▍ | 7915/12384 [16:47:55<9:28:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 1: 64%|██████▍ | 7916/12384 [16:47:55<9:27:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 1: 64%|██████▍ | 7916/12384 [16:48:03<9:27:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 64%|██████▍ | 7917/12384 [16:48:03<9:35:02, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 64%|██████▍ | 7917/12384 [16:48:11<9:35:02, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=4.23s]
Epoch 1: 64%|██████▍ | 7918/12384 [16:48:11<9:34:21, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=4.23s]
Epoch 1: 64%|██████▍ | 7918/12384 [16:48:18<9:34:21, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=11.36s]
Epoch 1: 64%|██████▍ | 7919/12384 [16:48:18<9:33:12, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=11.36s]
Epoch 1: 64%|██████▍ | 7919/12384 [16:48:26<9:33:12, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 1: 64%|██████▍ | 7920/12384 [16:48:26<9:31:07, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 1: 64%|██████▍ | 7920/12384 [16:48:34<9:31:07, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 64%|██████▍ | 7921/12384 [16:48:34<9:29:25, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 64%|██████▍ | 7921/12384 [16:48:41<9:29:25, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 64%|██████▍ | 7922/12384 [16:48:41<9:29:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 64%|██████▍ | 7922/12384 [16:48:49<9:29:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 64%|██████▍ | 7923/12384 [16:48:49<9:27:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 64%|██████▍ | 7923/12384 [16:48:56<9:27:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 64%|██████▍ | 7924/12384 [16:48:56<9:26:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 64%|██████▍ | 7924/12384 [16:49:04<9:26:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 64%|██████▍ | 7925/12384 [16:49:04<9:26:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 64%|██████▍ | 7925/12384 [16:49:12<9:26:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 64%|██████▍ | 7926/12384 [16:49:12<9:26:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 64%|██████▍ | 7926/12384 [16:49:19<9:26:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 64%|██████▍ | 7927/12384 [16:49:19<9:26:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 64%|██████▍ | 7927/12384 [16:49:27<9:26:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 64%|██████▍ | 7928/12384 [16:49:27<9:26:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 64%|██████▍ | 7928/12384 [16:49:35<9:26:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 64%|██████▍ | 7929/12384 [16:49:35<9:26:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 64%|██████▍ | 7929/12384 [16:49:42<9:26:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 64%|██████▍ | 7930/12384 [16:49:42<9:25:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 64%|██████▍ | 7930/12384 [16:49:50<9:25:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 64%|██████▍ | 7931/12384 [16:49:50<9:25:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 64%|██████▍ | 7931/12384 [16:49:57<9:25:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 64%|██████▍ | 7932/12384 [16:49:57<9:25:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 64%|██████▍ | 7932/12384 [16:50:05<9:25:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 64%|██████▍ | 7933/12384 [16:50:05<9:25:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 64%|██████▍ | 7933/12384 [16:50:13<9:25:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 1: 64%|██████▍ | 7934/12384 [16:50:13<9:25:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 1: 64%|██████▍ | 7934/12384 [16:50:20<9:25:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 1: 64%|██████▍ | 7935/12384 [16:50:20<9:24:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 1: 64%|██████▍ | 7935/12384 [16:50:28<9:24:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 64%|██████▍ | 7936/12384 [16:50:28<9:24:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 64%|██████▍ | 7936/12384 [16:50:35<9:24:17, 7.61s/it, loss=0.0005, acc=0.9993, iter_time=7.35s]
Epoch 1: 64%|██████▍ | 7937/12384 [16:50:35<9:24:00, 7.61s/it, loss=0.0005, acc=0.9993, iter_time=7.35s]
Epoch 1: 64%|██████▍ | 7937/12384 [16:50:43<9:24:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 64%|██████▍ | 7938/12384 [16:50:43<9:24:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 64%|██████▍ | 7938/12384 [16:50:51<9:24:06, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.44s]
Epoch 1: 64%|██████▍ | 7939/12384 [16:50:51<9:24:12, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.44s]
Epoch 1: 64%|██████▍ | 7939/12384 [16:50:58<9:24:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 64%|██████▍ | 7940/12384 [16:50:58<9:23:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 64%|██████▍ | 7940/12384 [16:51:06<9:23:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 1: 64%|██████▍ | 7941/12384 [16:51:06<9:22:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 1: 64%|██████▍ | 7941/12384 [16:51:13<9:22:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 1: 64%|██████▍ | 7942/12384 [16:51:13<9:22:39, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 1: 64%|██████▍ | 7942/12384 [16:51:21<9:22:39, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 64%|██████▍ | 7943/12384 [16:51:21<9:24:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 64%|██████▍ | 7943/12384 [16:51:29<9:24:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 1: 64%|██████▍ | 7944/12384 [16:51:29<9:31:19, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 1: 64%|██████▍ | 7944/12384 [16:51:37<9:31:19, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 1: 64%|██████▍ | 7945/12384 [16:51:37<9:34:59, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 1: 64%|██████▍ | 7945/12384 [16:51:45<9:34:59, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 64%|██████▍ | 7946/12384 [16:51:45<9:31:23, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 64%|██████▍ | 7946/12384 [16:51:52<9:31:23, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 64%|██████▍ | 7947/12384 [16:51:52<9:28:18, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 64%|██████▍ | 7947/12384 [16:52:00<9:28:18, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 64%|██████▍ | 7948/12384 [16:52:00<9:26:06, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 64%|██████▍ | 7948/12384 [16:52:07<9:26:06, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 64%|██████▍ | 7949/12384 [16:52:07<9:25:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 64%|██████▍ | 7949/12384 [16:52:15<9:25:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 1: 64%|██████▍ | 7950/12384 [16:52:15<9:24:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 1: 64%|██████▍ | 7950/12384 [16:52:23<9:24:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 1: 64%|██████▍ | 7951/12384 [16:52:23<9:24:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 1: 64%|██████▍ | 7951/12384 [16:52:30<9:24:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 64%|██████▍ | 7952/12384 [16:52:30<9:23:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 64%|██████▍ | 7952/12384 [16:52:38<9:23:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 64%|██████▍ | 7953/12384 [16:52:38<9:23:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 64%|██████▍ | 7953/12384 [16:52:46<9:23:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 64%|██████▍ | 7954/12384 [16:52:46<9:22:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 64%|██████▍ | 7954/12384 [16:52:53<9:22:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 64%|██████▍ | 7955/12384 [16:52:53<9:22:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 64%|██████▍ | 7955/12384 [16:53:01<9:22:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 64%|██████▍ | 7956/12384 [16:53:01<9:22:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 64%|██████▍ | 7956/12384 [16:53:08<9:22:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 1: 64%|██████▍ | 7957/12384 [16:53:08<9:22:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 1: 64%|██████▍ | 7957/12384 [16:53:16<9:22:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 1: 64%|██████▍ | 7958/12384 [16:53:16<9:21:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 1: 64%|██████▍ | 7958/12384 [16:53:24<9:21:46, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 1: 64%|██████▍ | 7959/12384 [16:53:24<9:21:54, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 1: 64%|██████▍ | 7959/12384 [16:53:31<9:21:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 64%|██████▍ | 7960/12384 [16:53:31<9:21:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 64%|██████▍ | 7960/12384 [16:53:39<9:21:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.22s]
Epoch 1: 64%|██████▍ | 7961/12384 [16:53:39<9:22:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.22s]
Epoch 1: 64%|██████▍ | 7961/12384 [16:53:47<9:22:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 1: 64%|██████▍ | 7962/12384 [16:53:47<9:22:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 1: 64%|██████▍ | 7962/12384 [16:53:54<9:22:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 64%|██████▍ | 7963/12384 [16:53:54<9:21:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 64%|██████▍ | 7963/12384 [16:54:02<9:21:48, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.27s]
Epoch 1: 64%|██████▍ | 7964/12384 [16:54:02<9:21:30, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.27s]
Epoch 1: 64%|██████▍ | 7964/12384 [16:54:09<9:21:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 64%|██████▍ | 7965/12384 [16:54:09<9:21:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 64%|██████▍ | 7965/12384 [16:54:17<9:21:28, 7.62s/it, loss=0.0004, acc=0.9983, iter_time=9.82s]
Epoch 1: 64%|██████▍ | 7966/12384 [16:54:17<9:20:50, 7.62s/it, loss=0.0004, acc=0.9983, iter_time=9.82s]
Epoch 1: 64%|██████▍ | 7966/12384 [16:54:25<9:20:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 64%|██████▍ | 7967/12384 [16:54:25<9:20:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 64%|██████▍ | 7967/12384 [16:54:32<9:20:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 64%|██████▍ | 7968/12384 [16:54:32<9:20:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 64%|██████▍ | 7968/12384 [16:54:40<9:20:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.99s]
Epoch 1: 64%|██████▍ | 7969/12384 [16:54:40<9:19:05, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.99s]
Epoch 1: 64%|██████▍ | 7969/12384 [16:54:48<9:19:05, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 1: 64%|██████▍ | 7970/12384 [16:54:48<9:26:33, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 1: 64%|██████▍ | 7970/12384 [16:54:55<9:26:33, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 64%|██████▍ | 7971/12384 [16:54:55<9:26:41, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 64%|██████▍ | 7971/12384 [16:55:03<9:26:41, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 1: 64%|██████▍ | 7972/12384 [16:55:03<9:24:35, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 1: 64%|██████▍ | 7972/12384 [16:55:11<9:24:35, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 64%|██████▍ | 7973/12384 [16:55:11<9:23:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 64%|██████▍ | 7973/12384 [16:55:18<9:23:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 64%|██████▍ | 7974/12384 [16:55:18<9:21:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 64%|██████▍ | 7974/12384 [16:55:26<9:21:43, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.38s]
Epoch 1: 64%|██████▍ | 7975/12384 [16:55:26<9:20:58, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.38s]
Epoch 1: 64%|██████▍ | 7975/12384 [16:55:33<9:20:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.21s]
Epoch 1: 64%|██████▍ | 7976/12384 [16:55:33<9:20:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.21s]
Epoch 1: 64%|██████▍ | 7976/12384 [16:55:41<9:20:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 64%|██████▍ | 7977/12384 [16:55:41<9:19:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 64%|██████▍ | 7977/12384 [16:55:49<9:19:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 1: 64%|██████▍ | 7978/12384 [16:55:49<9:19:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 1: 64%|██████▍ | 7978/12384 [16:55:56<9:19:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.29s]
Epoch 1: 64%|██████▍ | 7979/12384 [16:55:56<9:21:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.29s]
Epoch 1: 64%|██████▍ | 7979/12384 [16:56:04<9:21:03, 7.64s/it, loss=0.0001, acc=0.9994, iter_time=7.62s]
Epoch 1: 64%|██████▍ | 7980/12384 [16:56:04<9:20:34, 7.64s/it, loss=0.0001, acc=0.9994, iter_time=7.62s]
Epoch 1: 64%|██████▍ | 7980/12384 [16:56:12<9:20:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 64%|██████▍ | 7981/12384 [16:56:12<9:20:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 64%|██████▍ | 7981/12384 [16:56:19<9:20:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 64%|██████▍ | 7982/12384 [16:56:19<9:19:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 64%|██████▍ | 7982/12384 [16:56:27<9:19:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 64%|██████▍ | 7983/12384 [16:56:27<9:19:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 64%|██████▍ | 7983/12384 [16:56:34<9:19:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 64%|██████▍ | 7984/12384 [16:56:34<9:18:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 64%|██████▍ | 7984/12384 [16:56:42<9:18:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 64%|██████▍ | 7985/12384 [16:56:42<9:19:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 64%|██████▍ | 7985/12384 [16:56:50<9:19:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 1: 64%|██████▍ | 7986/12384 [16:56:50<9:18:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 1: 64%|██████▍ | 7986/12384 [16:56:57<9:18:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 64%|██████▍ | 7987/12384 [16:56:57<9:17:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 64%|██████▍ | 7987/12384 [16:57:05<9:17:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 1: 65%|██████▍ | 7988/12384 [16:57:05<9:17:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 1: 65%|██████▍ | 7988/12384 [16:57:13<9:17:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.86s]
Epoch 1: 65%|██████▍ | 7989/12384 [16:57:13<9:19:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.86s]
Epoch 1: 65%|██████▍ | 7989/12384 [16:57:20<9:19:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 1: 65%|██████▍ | 7990/12384 [16:57:20<9:20:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 1: 65%|██████▍ | 7990/12384 [16:57:28<9:20:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 65%|██████▍ | 7991/12384 [16:57:28<9:19:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 65%|██████▍ | 7991/12384 [16:57:36<9:19:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 65%|██████▍ | 7992/12384 [16:57:36<9:18:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 65%|██████▍ | 7992/12384 [16:57:43<9:18:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 65%|██████▍ | 7993/12384 [16:57:43<9:19:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 65%|██████▍ | 7993/12384 [16:57:51<9:19:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 65%|██████▍ | 7994/12384 [16:57:51<9:20:31, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 65%|██████▍ | 7994/12384 [16:57:59<9:20:31, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 65%|██████▍ | 7995/12384 [16:57:59<9:19:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 65%|██████▍ | 7995/12384 [16:58:06<9:19:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 1: 65%|██████▍ | 7996/12384 [16:58:06<9:18:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 1: 65%|██████▍ | 7996/12384 [16:58:14<9:18:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.16s]
Epoch 1: 65%|██████▍ | 7997/12384 [16:58:14<9:25:00, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=11.16s]
Epoch 1: 65%|██████▍ | 7997/12384 [16:58:22<9:25:00, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 65%|██████▍ | 7998/12384 [16:58:22<9:22:06, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 65%|██████▍ | 7998/12384 [16:58:29<9:22:06, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 1: 65%|██████▍ | 7999/12384 [16:58:29<9:20:04, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 1: 65%|██████▍ | 7999/12384 [16:58:37<9:20:04, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.22s]
Epoch 1: 65%|██████▍ | 8000/12384 [16:58:37<9:18:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.22s]
Epoch 1: 65%|██████▍ | 8000/12384 [16:58:44<9:18:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 65%|██████▍ | 8001/12384 [16:58:44<9:17:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 65%|██████▍ | 8001/12384 [16:58:52<9:17:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 65%|██████▍ | 8002/12384 [16:58:52<9:18:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 65%|██████▍ | 8002/12384 [16:59:00<9:18:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 1: 65%|██████▍ | 8003/12384 [16:59:00<9:17:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 1: 65%|██████▍ | 8003/12384 [16:59:07<9:17:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 1: 65%|██████▍ | 8004/12384 [16:59:07<9:16:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 1: 65%|██████▍ | 8004/12384 [16:59:15<9:16:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.00s]
Epoch 1: 65%|██████▍ | 8005/12384 [16:59:15<9:16:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.00s]
Epoch 1: 65%|██████▍ | 8005/12384 [16:59:23<9:16:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.08s]
Epoch 1: 65%|██████▍ | 8006/12384 [16:59:23<9:16:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.08s]
Epoch 1: 65%|██████▍ | 8006/12384 [16:59:30<9:16:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 65%|██████▍ | 8007/12384 [16:59:30<9:16:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 65%|██████▍ | 8007/12384 [16:59:38<9:16:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 65%|██████▍ | 8008/12384 [16:59:38<9:15:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 65%|██████▍ | 8008/12384 [16:59:45<9:15:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 65%|██████▍ | 8009/12384 [16:59:45<9:15:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 65%|██████▍ | 8009/12384 [16:59:53<9:15:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 1: 65%|██████▍ | 8010/12384 [16:59:53<9:14:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 1: 65%|██████▍ | 8010/12384 [17:00:01<9:14:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 1: 65%|██████▍ | 8011/12384 [17:00:01<9:14:05, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 1: 65%|██████▍ | 8011/12384 [17:00:08<9:14:05, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 1: 65%|██████▍ | 8012/12384 [17:00:08<9:14:05, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 1: 65%|██████▍ | 8012/12384 [17:00:16<9:14:05, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 1: 65%|██████▍ | 8013/12384 [17:00:16<9:13:29, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 1: 65%|██████▍ | 8013/12384 [17:00:23<9:13:29, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.95s]
Epoch 1: 65%|██████▍ | 8014/12384 [17:00:23<9:13:35, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.95s]
Epoch 1: 65%|██████▍ | 8014/12384 [17:00:31<9:13:35, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.57s]
Epoch 1: 65%|██████▍ | 8015/12384 [17:00:31<9:13:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.57s]
Epoch 1: 65%|██████▍ | 8015/12384 [17:00:39<9:13:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.11s]
Epoch 1: 65%|██████▍ | 8016/12384 [17:00:39<9:15:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.11s]
Epoch 1: 65%|██████▍ | 8016/12384 [17:00:46<9:15:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 65%|██████▍ | 8017/12384 [17:00:46<9:14:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 65%|██████▍ | 8017/12384 [17:00:54<9:14:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 1: 65%|██████▍ | 8018/12384 [17:00:54<9:14:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 1: 65%|██████▍ | 8018/12384 [17:01:02<9:14:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 1: 65%|██████▍ | 8019/12384 [17:01:02<9:13:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 1: 65%|██████▍ | 8019/12384 [17:01:09<9:13:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 1: 65%|██████▍ | 8020/12384 [17:01:09<9:13:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 1: 65%|██████▍ | 8020/12384 [17:01:17<9:13:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 1: 65%|██████▍ | 8021/12384 [17:01:17<9:13:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 1: 65%|██████▍ | 8021/12384 [17:01:24<9:13:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 65%|██████▍ | 8022/12384 [17:01:24<9:15:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 65%|██████▍ | 8022/12384 [17:01:32<9:15:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 65%|██████▍ | 8023/12384 [17:01:32<9:20:21, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 65%|██████▍ | 8023/12384 [17:01:40<9:20:21, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 65%|██████▍ | 8024/12384 [17:01:40<9:18:26, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 65%|██████▍ | 8024/12384 [17:01:48<9:18:26, 7.69s/it, loss=0.0002, acc=0.9985, iter_time=7.21s]
Epoch 1: 65%|██████▍ | 8025/12384 [17:01:48<9:16:49, 7.66s/it, loss=0.0002, acc=0.9985, iter_time=7.21s]
Epoch 1: 65%|██████▍ | 8025/12384 [17:01:55<9:16:49, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 65%|██████▍ | 8026/12384 [17:01:55<9:15:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 65%|██████▍ | 8026/12384 [17:02:03<9:15:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 65%|██████▍ | 8027/12384 [17:02:03<9:14:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 65%|██████▍ | 8027/12384 [17:02:10<9:14:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.25s]
Epoch 1: 65%|██████▍ | 8028/12384 [17:02:10<9:14:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.25s]
Epoch 1: 65%|██████▍ | 8028/12384 [17:02:18<9:14:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.97s]
Epoch 1: 65%|██████▍ | 8029/12384 [17:02:18<9:13:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.97s]
Epoch 1: 65%|██████▍ | 8029/12384 [17:02:26<9:13:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 65%|██████▍ | 8030/12384 [17:02:26<9:12:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 65%|██████▍ | 8030/12384 [17:02:33<9:12:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 1: 65%|██████▍ | 8031/12384 [17:02:33<9:13:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 1: 65%|██████▍ | 8031/12384 [17:02:41<9:13:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 1: 65%|██████▍ | 8032/12384 [17:02:41<9:13:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 1: 65%|██████▍ | 8032/12384 [17:02:49<9:13:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 65%|██████▍ | 8033/12384 [17:02:49<9:13:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 65%|██████▍ | 8033/12384 [17:02:56<9:13:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 1: 65%|██████▍ | 8034/12384 [17:02:56<9:12:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 1: 65%|██████▍ | 8034/12384 [17:03:04<9:12:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.11s]
Epoch 1: 65%|██████▍ | 8035/12384 [17:03:04<9:12:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.11s]
Epoch 1: 65%|██████▍ | 8035/12384 [17:03:11<9:12:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.63s]
Epoch 1: 65%|██████▍ | 8036/12384 [17:03:11<9:11:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.63s]
Epoch 1: 65%|██████▍ | 8036/12384 [17:03:19<9:11:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 1: 65%|██████▍ | 8037/12384 [17:03:19<9:12:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 1: 65%|██████▍ | 8037/12384 [17:03:27<9:12:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 1: 65%|██████▍ | 8038/12384 [17:03:27<9:11:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 1: 65%|██████▍ | 8038/12384 [17:03:34<9:11:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 65%|██████▍ | 8039/12384 [17:03:34<9:11:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 65%|██████▍ | 8039/12384 [17:03:42<9:11:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.29s]
Epoch 1: 65%|██████▍ | 8040/12384 [17:03:42<9:11:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.29s]
Epoch 1: 65%|██████▍ | 8040/12384 [17:03:49<9:11:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 65%|██████▍ | 8041/12384 [17:03:49<9:10:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 65%|██████▍ | 8041/12384 [17:03:57<9:10:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 65%|██████▍ | 8042/12384 [17:03:57<9:10:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 65%|██████▍ | 8042/12384 [17:04:05<9:10:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 65%|██████▍ | 8043/12384 [17:04:05<9:10:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 65%|██████▍ | 8043/12384 [17:04:12<9:10:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 1: 65%|██████▍ | 8044/12384 [17:04:12<9:10:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 1: 65%|██████▍ | 8044/12384 [17:04:20<9:10:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 1: 65%|██████▍ | 8045/12384 [17:04:20<9:09:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 1: 65%|██████▍ | 8045/12384 [17:04:27<9:09:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 1: 65%|██████▍ | 8046/12384 [17:04:27<9:10:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 1: 65%|██████▍ | 8046/12384 [17:04:35<9:10:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 65%|██████▍ | 8047/12384 [17:04:35<9:12:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 65%|██████▍ | 8047/12384 [17:04:43<9:12:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.12s]
Epoch 1: 65%|██████▍ | 8048/12384 [17:04:43<9:12:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.12s]
Epoch 1: 65%|██████▍ | 8048/12384 [17:04:51<9:12:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 65%|██████▍ | 8049/12384 [17:04:51<9:18:38, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 65%|██████▍ | 8049/12384 [17:04:58<9:18:38, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 65%|██████▌ | 8050/12384 [17:04:58<9:15:52, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 65%|██████▌ | 8050/12384 [17:05:06<9:15:52, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 65%|██████▌ | 8051/12384 [17:05:06<9:13:47, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 65%|██████▌ | 8051/12384 [17:05:14<9:13:47, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 65%|██████▌ | 8052/12384 [17:05:14<9:12:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 65%|██████▌ | 8052/12384 [17:05:21<9:12:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.01s]
Epoch 1: 65%|██████▌ | 8053/12384 [17:05:21<9:11:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.01s]
Epoch 1: 65%|██████▌ | 8053/12384 [17:05:29<9:11:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.20s]
Epoch 1: 65%|██████▌ | 8054/12384 [17:05:29<9:11:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.20s]
Epoch 1: 65%|██████▌ | 8054/12384 [17:05:36<9:11:09, 7.64s/it, loss=0.0005, acc=1.0000, iter_time=7.64s]
Epoch 1: 65%|██████▌ | 8055/12384 [17:05:36<9:10:13, 7.63s/it, loss=0.0005, acc=1.0000, iter_time=7.64s]
Epoch 1: 65%|██████▌ | 8055/12384 [17:05:44<9:10:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 65%|██████▌ | 8056/12384 [17:05:44<9:10:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 65%|██████▌ | 8056/12384 [17:05:52<9:10:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 65%|██████▌ | 8057/12384 [17:05:52<9:09:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 65%|██████▌ | 8057/12384 [17:05:59<9:09:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 65%|██████▌ | 8058/12384 [17:05:59<9:09:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 65%|██████▌ | 8058/12384 [17:06:07<9:09:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 65%|██████▌ | 8059/12384 [17:06:07<9:08:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 65%|██████▌ | 8059/12384 [17:06:14<9:08:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 65%|██████▌ | 8060/12384 [17:06:14<9:08:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 65%|██████▌ | 8060/12384 [17:06:22<9:08:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 1: 65%|██████▌ | 8061/12384 [17:06:22<9:08:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 1: 65%|██████▌ | 8061/12384 [17:06:30<9:08:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 1: 65%|██████▌ | 8062/12384 [17:06:30<9:08:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 1: 65%|██████▌ | 8062/12384 [17:06:37<9:08:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 65%|██████▌ | 8063/12384 [17:06:37<9:08:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 65%|██████▌ | 8063/12384 [17:06:45<9:08:23, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.00s]
Epoch 1: 65%|██████▌ | 8064/12384 [17:06:45<9:08:11, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.00s]
Epoch 1: 65%|██████▌ | 8064/12384 [17:06:53<9:08:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.36s]
Epoch 1: 65%|██████▌ | 8065/12384 [17:06:53<9:08:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.36s]
Epoch 1: 65%|██████▌ | 8065/12384 [17:07:00<9:08:13, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.90s]
Epoch 1: 65%|██████▌ | 8066/12384 [17:07:00<9:08:10, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.90s]
Epoch 1: 65%|██████▌ | 8066/12384 [17:07:08<9:08:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.34s]
Epoch 1: 65%|██████▌ | 8067/12384 [17:07:08<9:08:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.34s]
Epoch 1: 65%|██████▌ | 8067/12384 [17:07:15<9:08:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 1: 65%|██████▌ | 8068/12384 [17:07:15<9:06:59, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 1: 65%|██████▌ | 8068/12384 [17:07:23<9:06:59, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.02s]
Epoch 1: 65%|██████▌ | 8069/12384 [17:07:23<9:07:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.02s]
Epoch 1: 65%|██████▌ | 8069/12384 [17:07:31<9:07:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 65%|██████▌ | 8070/12384 [17:07:31<9:07:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 65%|██████▌ | 8070/12384 [17:07:38<9:07:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 1: 65%|██████▌ | 8071/12384 [17:07:38<9:07:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 1: 65%|██████▌ | 8071/12384 [17:07:46<9:07:04, 7.61s/it, loss=0.0002, acc=0.9979, iter_time=9.16s]
Epoch 1: 65%|██████▌ | 8072/12384 [17:07:46<9:06:53, 7.61s/it, loss=0.0002, acc=0.9979, iter_time=9.16s]
Epoch 1: 65%|██████▌ | 8072/12384 [17:07:53<9:06:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 1: 65%|██████▌ | 8073/12384 [17:07:53<9:06:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 1: 65%|██████▌ | 8073/12384 [17:08:01<9:06:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 1: 65%|██████▌ | 8074/12384 [17:08:01<9:06:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 1: 65%|██████▌ | 8074/12384 [17:08:09<9:06:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 65%|██████▌ | 8075/12384 [17:08:09<9:13:03, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 65%|██████▌ | 8075/12384 [17:08:17<9:13:03, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.50s]
Epoch 1: 65%|██████▌ | 8076/12384 [17:08:17<9:11:13, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.50s]
Epoch 1: 65%|██████▌ | 8076/12384 [17:08:24<9:11:13, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.85s]
Epoch 1: 65%|██████▌ | 8077/12384 [17:08:24<9:10:33, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.85s]
Epoch 1: 65%|██████▌ | 8077/12384 [17:08:32<9:10:33, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.52s]
Epoch 1: 65%|██████▌ | 8078/12384 [17:08:32<9:09:25, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.52s]
Epoch 1: 65%|██████▌ | 8078/12384 [17:08:40<9:09:25, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.27s]
Epoch 1: 65%|██████▌ | 8079/12384 [17:08:40<9:08:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.27s]
Epoch 1: 65%|██████▌ | 8079/12384 [17:08:47<9:08:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.95s]
Epoch 1: 65%|██████▌ | 8080/12384 [17:08:47<9:07:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.95s]
Epoch 1: 65%|██████▌ | 8080/12384 [17:08:55<9:07:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 65%|██████▌ | 8081/12384 [17:08:55<9:08:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 65%|██████▌ | 8081/12384 [17:09:02<9:08:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 65%|██████▌ | 8082/12384 [17:09:02<9:07:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 65%|██████▌ | 8082/12384 [17:09:10<9:07:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 65%|██████▌ | 8083/12384 [17:09:10<9:06:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 65%|██████▌ | 8083/12384 [17:09:18<9:06:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 1: 65%|██████▌ | 8084/12384 [17:09:18<9:05:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 1: 65%|██████▌ | 8084/12384 [17:09:25<9:05:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 1: 65%|██████▌ | 8085/12384 [17:09:25<9:06:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 1: 65%|██████▌ | 8085/12384 [17:09:33<9:06:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 1: 65%|██████▌ | 8086/12384 [17:09:33<9:07:57, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 1: 65%|██████▌ | 8086/12384 [17:09:41<9:07:57, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 1: 65%|██████▌ | 8087/12384 [17:09:41<9:07:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 1: 65%|██████▌ | 8087/12384 [17:09:48<9:07:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 65%|██████▌ | 8088/12384 [17:09:48<9:06:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 65%|██████▌ | 8088/12384 [17:09:56<9:06:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 65%|██████▌ | 8089/12384 [17:09:56<9:08:04, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 65%|██████▌ | 8089/12384 [17:10:04<9:08:04, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.39s]
Epoch 1: 65%|██████▌ | 8090/12384 [17:10:04<9:07:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.39s]
Epoch 1: 65%|██████▌ | 8090/12384 [17:10:11<9:07:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 1: 65%|██████▌ | 8091/12384 [17:10:11<9:08:41, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 1: 65%|██████▌ | 8091/12384 [17:10:19<9:08:41, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 65%|██████▌ | 8092/12384 [17:10:19<9:06:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 65%|██████▌ | 8092/12384 [17:10:26<9:06:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 65%|██████▌ | 8093/12384 [17:10:26<9:05:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 65%|██████▌ | 8093/12384 [17:10:34<9:05:56, 7.63s/it, loss=0.0003, acc=0.9981, iter_time=7.60s]
Epoch 1: 65%|██████▌ | 8094/12384 [17:10:34<9:05:09, 7.62s/it, loss=0.0003, acc=0.9981, iter_time=7.60s]
Epoch 1: 65%|██████▌ | 8094/12384 [17:10:42<9:05:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 65%|██████▌ | 8095/12384 [17:10:42<9:05:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 65%|██████▌ | 8095/12384 [17:10:49<9:05:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 1: 65%|██████▌ | 8096/12384 [17:10:49<9:06:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 1: 65%|██████▌ | 8096/12384 [17:10:57<9:06:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.20s]
Epoch 1: 65%|██████▌ | 8097/12384 [17:10:57<9:06:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.20s]
Epoch 1: 65%|██████▌ | 8097/12384 [17:11:05<9:06:07, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.69s]
Epoch 1: 65%|██████▌ | 8098/12384 [17:11:05<9:05:39, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.69s]
Epoch 1: 65%|██████▌ | 8098/12384 [17:11:12<9:05:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 1: 65%|██████▌ | 8099/12384 [17:11:12<9:05:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 1: 65%|██████▌ | 8099/12384 [17:11:20<9:05:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 1: 65%|██████▌ | 8100/12384 [17:11:20<9:04:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 1: 65%|██████▌ | 8100/12384 [17:11:28<9:04:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 65%|██████▌ | 8101/12384 [17:11:28<9:11:18, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 65%|██████▌ | 8101/12384 [17:11:35<9:11:18, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 1: 65%|██████▌ | 8102/12384 [17:11:35<9:08:52, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 1: 65%|██████▌ | 8102/12384 [17:11:43<9:08:52, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.35s]
Epoch 1: 65%|██████▌ | 8103/12384 [17:11:43<9:07:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.35s]
Epoch 1: 65%|██████▌ | 8103/12384 [17:11:51<9:07:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 65%|██████▌ | 8104/12384 [17:11:51<9:06:10, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 65%|██████▌ | 8104/12384 [17:11:58<9:06:10, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 65%|██████▌ | 8105/12384 [17:11:58<9:05:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 65%|██████▌ | 8105/12384 [17:12:06<9:05:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 65%|██████▌ | 8106/12384 [17:12:06<9:04:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 65%|██████▌ | 8106/12384 [17:12:14<9:04:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 65%|██████▌ | 8107/12384 [17:12:14<9:03:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 65%|██████▌ | 8107/12384 [17:12:21<9:03:27, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=7.58s]
Epoch 1: 65%|██████▌ | 8108/12384 [17:12:21<9:02:36, 7.61s/it, loss=0.0002, acc=0.9998, iter_time=7.58s]
Epoch 1: 65%|██████▌ | 8108/12384 [17:12:29<9:02:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 1: 65%|██████▌ | 8109/12384 [17:12:29<9:02:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 1: 65%|██████▌ | 8109/12384 [17:12:36<9:02:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 1: 65%|██████▌ | 8110/12384 [17:12:36<9:01:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 1: 65%|██████▌ | 8110/12384 [17:12:44<9:01:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 65%|██████▌ | 8111/12384 [17:12:44<9:01:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 65%|██████▌ | 8111/12384 [17:12:51<9:01:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 66%|██████▌ | 8112/12384 [17:12:51<9:01:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 66%|██████▌ | 8112/12384 [17:12:59<9:01:09, 7.60s/it, loss=0.0004, acc=0.9995, iter_time=7.21s]
Epoch 1: 66%|██████▌ | 8113/12384 [17:12:59<9:01:22, 7.61s/it, loss=0.0004, acc=0.9995, iter_time=7.21s]
Epoch 1: 66%|██████▌ | 8113/12384 [17:13:07<9:01:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 66%|██████▌ | 8114/12384 [17:13:07<9:01:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 66%|██████▌ | 8114/12384 [17:13:14<9:01:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 66%|██████▌ | 8115/12384 [17:13:14<9:01:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 66%|██████▌ | 8115/12384 [17:13:22<9:01:40, 7.61s/it, loss=0.0001, acc=0.9991, iter_time=8.03s]
Epoch 1: 66%|██████▌ | 8116/12384 [17:13:22<9:05:57, 7.68s/it, loss=0.0001, acc=0.9991, iter_time=8.03s]
Epoch 1: 66%|██████▌ | 8116/12384 [17:13:30<9:05:57, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.29s]
Epoch 1: 66%|██████▌ | 8117/12384 [17:13:30<9:04:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.29s]
Epoch 1: 66%|██████▌ | 8117/12384 [17:13:37<9:04:12, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.71s]
Epoch 1: 66%|██████▌ | 8118/12384 [17:13:37<9:03:13, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.71s]
Epoch 1: 66%|██████▌ | 8118/12384 [17:13:45<9:03:13, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=5.33s]
Epoch 1: 66%|██████▌ | 8119/12384 [17:13:45<9:02:53, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=5.33s]
Epoch 1: 66%|██████▌ | 8119/12384 [17:13:53<9:02:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.29s]
Epoch 1: 66%|██████▌ | 8120/12384 [17:13:53<9:01:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.29s]
Epoch 1: 66%|██████▌ | 8120/12384 [17:14:00<9:01:59, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.23s]
Epoch 1: 66%|██████▌ | 8121/12384 [17:14:00<9:01:24, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.23s]
Epoch 1: 66%|██████▌ | 8121/12384 [17:14:08<9:01:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 1: 66%|██████▌ | 8122/12384 [17:14:08<9:01:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 1: 66%|██████▌ | 8122/12384 [17:14:15<9:01:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.16s]
Epoch 1: 66%|██████▌ | 8123/12384 [17:14:15<9:01:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.16s]
Epoch 1: 66%|██████▌ | 8123/12384 [17:14:23<9:01:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 1: 66%|██████▌ | 8124/12384 [17:14:23<9:00:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 1: 66%|██████▌ | 8124/12384 [17:14:31<9:00:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 1: 66%|██████▌ | 8125/12384 [17:14:31<9:00:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 1: 66%|██████▌ | 8125/12384 [17:14:38<9:00:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 1: 66%|██████▌ | 8126/12384 [17:14:38<9:00:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 1: 66%|██████▌ | 8126/12384 [17:14:46<9:00:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 1: 66%|██████▌ | 8127/12384 [17:14:46<9:05:35, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 1: 66%|██████▌ | 8127/12384 [17:14:54<9:05:35, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 1: 66%|██████▌ | 8128/12384 [17:14:54<9:12:07, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 1: 66%|██████▌ | 8128/12384 [17:15:02<9:12:07, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 66%|██████▌ | 8129/12384 [17:15:02<9:08:57, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 66%|██████▌ | 8129/12384 [17:15:09<9:08:57, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 66%|██████▌ | 8130/12384 [17:15:09<9:06:24, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 66%|██████▌ | 8130/12384 [17:15:17<9:06:24, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 66%|██████▌ | 8131/12384 [17:15:17<9:04:26, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 66%|██████▌ | 8131/12384 [17:15:25<9:04:26, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 1: 66%|██████▌ | 8132/12384 [17:15:25<9:02:48, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 1: 66%|██████▌ | 8132/12384 [17:15:32<9:02:48, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 1: 66%|██████▌ | 8133/12384 [17:15:32<9:01:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 1: 66%|██████▌ | 8133/12384 [17:15:40<9:01:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 66%|██████▌ | 8134/12384 [17:15:40<9:02:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 66%|██████▌ | 8134/12384 [17:15:48<9:02:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 66%|██████▌ | 8135/12384 [17:15:48<9:01:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 66%|██████▌ | 8135/12384 [17:15:55<9:01:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 66%|██████▌ | 8136/12384 [17:15:55<9:02:50, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 66%|██████▌ | 8136/12384 [17:16:03<9:02:50, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 66%|██████▌ | 8137/12384 [17:16:03<9:01:53, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 66%|██████▌ | 8137/12384 [17:16:10<9:01:53, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 1: 66%|██████▌ | 8138/12384 [17:16:11<9:00:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 1: 66%|██████▌ | 8138/12384 [17:16:18<9:00:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 1: 66%|██████▌ | 8139/12384 [17:16:18<8:59:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 1: 66%|██████▌ | 8139/12384 [17:16:26<8:59:42, 7.63s/it, loss=0.0001, acc=0.9994, iter_time=7.60s]
Epoch 1: 66%|██████▌ | 8140/12384 [17:16:26<8:58:55, 7.62s/it, loss=0.0001, acc=0.9994, iter_time=7.60s]
Epoch 1: 66%|██████▌ | 8140/12384 [17:16:33<8:58:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 66%|██████▌ | 8141/12384 [17:16:33<8:58:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 66%|██████▌ | 8141/12384 [17:16:41<8:58:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 1: 66%|██████▌ | 8142/12384 [17:16:41<8:58:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 1: 66%|██████▌ | 8142/12384 [17:16:49<8:58:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 1: 66%|██████▌ | 8143/12384 [17:16:49<8:58:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 1: 66%|██████▌ | 8143/12384 [17:16:56<8:58:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.67s]
Epoch 1: 66%|██████▌ | 8144/12384 [17:16:56<8:57:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.67s]
Epoch 1: 66%|██████▌ | 8144/12384 [17:17:04<8:57:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 66%|██████▌ | 8145/12384 [17:17:04<8:58:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 66%|██████▌ | 8145/12384 [17:17:11<8:58:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 1: 66%|██████▌ | 8146/12384 [17:17:11<8:58:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 1: 66%|██████▌ | 8146/12384 [17:17:19<8:58:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 1: 66%|██████▌ | 8147/12384 [17:17:19<8:57:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 1: 66%|██████▌ | 8147/12384 [17:17:27<8:57:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 1: 66%|██████▌ | 8148/12384 [17:17:27<8:57:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 1: 66%|██████▌ | 8148/12384 [17:17:34<8:57:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 1: 66%|██████▌ | 8149/12384 [17:17:34<8:57:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 1: 66%|██████▌ | 8149/12384 [17:17:42<8:57:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 1: 66%|██████▌ | 8150/12384 [17:17:42<8:56:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 1: 66%|██████▌ | 8150/12384 [17:17:49<8:56:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 1: 66%|██████▌ | 8151/12384 [17:17:49<8:56:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 1: 66%|██████▌ | 8151/12384 [17:17:57<8:56:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 66%|██████▌ | 8152/12384 [17:17:57<8:56:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 66%|██████▌ | 8152/12384 [17:18:05<8:56:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.34s]
Epoch 1: 66%|██████▌ | 8153/12384 [17:18:05<8:56:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.34s]
Epoch 1: 66%|██████▌ | 8153/12384 [17:18:13<8:56:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 1: 66%|██████▌ | 8154/12384 [17:18:13<9:02:23, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 1: 66%|██████▌ | 8154/12384 [17:18:20<9:02:23, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 66%|██████▌ | 8155/12384 [17:18:20<9:00:21, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 66%|██████▌ | 8155/12384 [17:18:28<9:00:21, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 66%|██████▌ | 8156/12384 [17:18:28<8:59:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 66%|██████▌ | 8156/12384 [17:18:35<8:59:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 66%|██████▌ | 8157/12384 [17:18:35<8:58:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 66%|██████▌ | 8157/12384 [17:18:43<8:58:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 66%|██████▌ | 8158/12384 [17:18:43<8:56:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 66%|██████▌ | 8158/12384 [17:18:51<8:56:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 1: 66%|██████▌ | 8159/12384 [17:18:51<8:56:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 1: 66%|██████▌ | 8159/12384 [17:18:58<8:56:24, 7.62s/it, loss=0.0002, acc=0.9992, iter_time=10.55s]
Epoch 1: 66%|██████▌ | 8160/12384 [17:18:58<8:56:20, 7.62s/it, loss=0.0002, acc=0.9992, iter_time=10.55s]
Epoch 1: 66%|██████▌ | 8160/12384 [17:19:06<8:56:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.78s]
Epoch 1: 66%|██████▌ | 8161/12384 [17:19:06<8:55:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.78s]
Epoch 1: 66%|██████▌ | 8161/12384 [17:19:13<8:55:44, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.06s]
Epoch 1: 66%|██████▌ | 8162/12384 [17:19:13<8:55:28, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.06s]
Epoch 1: 66%|██████▌ | 8162/12384 [17:19:21<8:55:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.29s]
Epoch 1: 66%|██████▌ | 8163/12384 [17:19:21<8:55:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.29s]
Epoch 1: 66%|██████▌ | 8163/12384 [17:19:29<8:55:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.91s]
Epoch 1: 66%|██████▌ | 8164/12384 [17:19:29<8:54:52, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.91s]
Epoch 1: 66%|██████▌ | 8164/12384 [17:19:36<8:54:52, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 66%|██████▌ | 8165/12384 [17:19:36<8:54:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 66%|██████▌ | 8165/12384 [17:19:44<8:54:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 66%|██████▌ | 8166/12384 [17:19:44<8:54:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 66%|██████▌ | 8166/12384 [17:19:51<8:54:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 66%|██████▌ | 8167/12384 [17:19:51<8:54:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 66%|██████▌ | 8167/12384 [17:19:59<8:54:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 66%|██████▌ | 8168/12384 [17:19:59<8:54:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 66%|██████▌ | 8168/12384 [17:20:07<8:54:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 66%|██████▌ | 8169/12384 [17:20:07<8:55:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 66%|██████▌ | 8169/12384 [17:20:14<8:55:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 1: 66%|██████▌ | 8170/12384 [17:20:14<8:55:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 1: 66%|██████▌ | 8170/12384 [17:20:22<8:55:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 66%|██████▌ | 8171/12384 [17:20:22<8:54:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 66%|██████▌ | 8171/12384 [17:20:29<8:54:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.46s]
Epoch 1: 66%|██████▌ | 8172/12384 [17:20:29<8:53:44, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.46s]
Epoch 1: 66%|██████▌ | 8172/12384 [17:20:37<8:53:44, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.76s]
Epoch 1: 66%|██████▌ | 8173/12384 [17:20:37<8:53:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.76s]
Epoch 1: 66%|██████▌ | 8173/12384 [17:20:45<8:53:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.01s]
Epoch 1: 66%|██████▌ | 8174/12384 [17:20:45<8:55:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.01s]
Epoch 1: 66%|██████▌ | 8174/12384 [17:20:52<8:55:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 1: 66%|██████▌ | 8175/12384 [17:20:52<8:54:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 1: 66%|██████▌ | 8175/12384 [17:21:00<8:54:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.77s]
Epoch 1: 66%|██████▌ | 8176/12384 [17:21:00<8:54:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.77s]
Epoch 1: 66%|██████▌ | 8176/12384 [17:21:08<8:54:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 66%|██████▌ | 8177/12384 [17:21:08<8:54:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 66%|██████▌ | 8177/12384 [17:21:15<8:54:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.24s]
Epoch 1: 66%|██████▌ | 8178/12384 [17:21:15<8:54:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.24s]
Epoch 1: 66%|██████▌ | 8178/12384 [17:21:23<8:54:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.42s]
Epoch 1: 66%|██████▌ | 8179/12384 [17:21:23<8:53:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.42s]
Epoch 1: 66%|██████▌ | 8179/12384 [17:21:30<8:53:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.62s]
Epoch 1: 66%|██████▌ | 8180/12384 [17:21:30<8:53:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.62s]
Epoch 1: 66%|██████▌ | 8180/12384 [17:21:38<8:53:27, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 66%|██████▌ | 8181/12384 [17:21:38<8:59:26, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 66%|██████▌ | 8181/12384 [17:21:46<8:59:26, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 1: 66%|██████▌ | 8182/12384 [17:21:46<8:58:40, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 1: 66%|██████▌ | 8182/12384 [17:21:54<8:58:40, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 1: 66%|██████▌ | 8183/12384 [17:21:54<8:56:44, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 1: 66%|██████▌ | 8183/12384 [17:22:01<8:56:44, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 66%|██████▌ | 8184/12384 [17:22:01<8:55:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 66%|██████▌ | 8184/12384 [17:22:09<8:55:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.28s]
Epoch 1: 66%|██████▌ | 8185/12384 [17:22:09<8:54:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.28s]
Epoch 1: 66%|██████▌ | 8185/12384 [17:22:16<8:54:06, 7.63s/it, loss=0.0002, acc=0.9990, iter_time=8.55s]
Epoch 1: 66%|██████▌ | 8186/12384 [17:22:16<8:53:30, 7.63s/it, loss=0.0002, acc=0.9990, iter_time=8.55s]
Epoch 1: 66%|██████▌ | 8186/12384 [17:22:24<8:53:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 1: 66%|██████▌ | 8187/12384 [17:22:24<8:53:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 1: 66%|██████▌ | 8187/12384 [17:22:32<8:53:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 66%|██████▌ | 8188/12384 [17:22:32<8:54:57, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 66%|██████▌ | 8188/12384 [17:22:39<8:54:57, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 66%|██████▌ | 8189/12384 [17:22:39<8:53:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 66%|██████▌ | 8189/12384 [17:22:47<8:53:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 66%|██████▌ | 8190/12384 [17:22:47<8:52:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 66%|██████▌ | 8190/12384 [17:22:55<8:52:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 66%|██████▌ | 8191/12384 [17:22:55<8:52:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 66%|██████▌ | 8191/12384 [17:23:02<8:52:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.77s]
Epoch 1: 66%|██████▌ | 8192/12384 [17:23:02<8:53:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.77s]
Epoch 1: 66%|██████▌ | 8192/12384 [17:23:10<8:53:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 66%|██████▌ | 8193/12384 [17:23:10<8:54:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 66%|██████▌ | 8193/12384 [17:23:18<8:54:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 66%|██████▌ | 8194/12384 [17:23:18<8:55:45, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 66%|██████▌ | 8194/12384 [17:23:25<8:55:45, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.12s]
Epoch 1: 66%|██████▌ | 8195/12384 [17:23:25<8:54:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.12s]
Epoch 1: 66%|██████▌ | 8195/12384 [17:23:33<8:54:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.17s]
Epoch 1: 66%|██████▌ | 8196/12384 [17:23:33<8:52:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.17s]
Epoch 1: 66%|██████▌ | 8196/12384 [17:23:40<8:52:44, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 66%|██████▌ | 8197/12384 [17:23:40<8:52:09, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 66%|██████▌ | 8197/12384 [17:23:48<8:52:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 1: 66%|██████▌ | 8198/12384 [17:23:48<8:51:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 1: 66%|██████▌ | 8198/12384 [17:23:56<8:51:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 1: 66%|██████▌ | 8199/12384 [17:23:56<8:53:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 1: 66%|██████▌ | 8199/12384 [17:24:03<8:53:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.47s]
Epoch 1: 66%|██████▌ | 8200/12384 [17:24:03<8:51:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.47s]
Epoch 1: 66%|██████▌ | 8200/12384 [17:24:11<8:51:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.56s]
Epoch 1: 66%|██████▌ | 8201/12384 [17:24:11<8:51:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.56s]
Epoch 1: 66%|██████▌ | 8201/12384 [17:24:19<8:51:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 1: 66%|██████▌ | 8202/12384 [17:24:19<8:50:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 1: 66%|██████▌ | 8202/12384 [17:24:26<8:50:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.72s]
Epoch 1: 66%|██████▌ | 8203/12384 [17:24:26<8:50:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.72s]
Epoch 1: 66%|██████▌ | 8203/12384 [17:24:34<8:50:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 1: 66%|██████▌ | 8204/12384 [17:24:34<8:50:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 1: 66%|██████▌ | 8204/12384 [17:24:41<8:50:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 66%|██████▋ | 8205/12384 [17:24:41<8:50:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 66%|██████▋ | 8205/12384 [17:24:49<8:50:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 1: 66%|██████▋ | 8206/12384 [17:24:49<8:55:20, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 1: 66%|██████▋ | 8206/12384 [17:24:57<8:55:20, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 66%|██████▋ | 8207/12384 [17:24:57<9:00:25, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 66%|██████▋ | 8207/12384 [17:25:05<9:00:25, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 1: 66%|██████▋ | 8208/12384 [17:25:05<8:57:07, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 1: 66%|██████▋ | 8208/12384 [17:25:12<8:57:07, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 66%|██████▋ | 8209/12384 [17:25:12<8:54:33, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 66%|██████▋ | 8209/12384 [17:25:20<8:54:33, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 1: 66%|██████▋ | 8210/12384 [17:25:20<8:52:39, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 1: 66%|██████▋ | 8210/12384 [17:25:28<8:52:39, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 1: 66%|██████▋ | 8211/12384 [17:25:28<8:51:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 1: 66%|██████▋ | 8211/12384 [17:25:35<8:51:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 66%|██████▋ | 8212/12384 [17:25:35<8:50:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 66%|██████▋ | 8212/12384 [17:25:43<8:50:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 66%|██████▋ | 8213/12384 [17:25:43<8:50:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 66%|██████▋ | 8213/12384 [17:25:50<8:50:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 1: 66%|██████▋ | 8214/12384 [17:25:50<8:50:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 1: 66%|██████▋ | 8214/12384 [17:25:58<8:50:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 66%|██████▋ | 8215/12384 [17:25:58<8:49:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 66%|██████▋ | 8215/12384 [17:26:06<8:49:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.21s]
Epoch 1: 66%|██████▋ | 8216/12384 [17:26:06<8:48:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.21s]
Epoch 1: 66%|██████▋ | 8216/12384 [17:26:13<8:48:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 66%|██████▋ | 8217/12384 [17:26:13<8:48:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 66%|██████▋ | 8217/12384 [17:26:21<8:48:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 66%|██████▋ | 8218/12384 [17:26:21<8:49:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 66%|██████▋ | 8218/12384 [17:26:29<8:49:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 66%|██████▋ | 8219/12384 [17:26:29<8:49:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 66%|██████▋ | 8219/12384 [17:26:36<8:49:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 66%|██████▋ | 8220/12384 [17:26:36<8:48:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 66%|██████▋ | 8220/12384 [17:26:44<8:48:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 66%|██████▋ | 8221/12384 [17:26:44<8:48:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 66%|██████▋ | 8221/12384 [17:26:51<8:48:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 66%|██████▋ | 8222/12384 [17:26:51<8:48:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 66%|██████▋ | 8222/12384 [17:26:59<8:48:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 66%|██████▋ | 8223/12384 [17:26:59<8:47:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 66%|██████▋ | 8223/12384 [17:27:07<8:47:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 66%|██████▋ | 8224/12384 [17:27:07<8:47:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 66%|██████▋ | 8224/12384 [17:27:14<8:47:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 66%|██████▋ | 8225/12384 [17:27:14<8:47:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 66%|██████▋ | 8225/12384 [17:27:22<8:47:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 66%|██████▋ | 8226/12384 [17:27:22<8:47:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 66%|██████▋ | 8226/12384 [17:27:29<8:47:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 66%|██████▋ | 8227/12384 [17:27:29<8:47:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 66%|██████▋ | 8227/12384 [17:27:37<8:47:14, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=6.74s]
Epoch 1: 66%|██████▋ | 8228/12384 [17:27:37<8:47:02, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=6.74s]
Epoch 1: 66%|██████▋ | 8228/12384 [17:27:45<8:47:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 1: 66%|██████▋ | 8229/12384 [17:27:45<8:47:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 1: 66%|██████▋ | 8229/12384 [17:27:52<8:47:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 1: 66%|██████▋ | 8230/12384 [17:27:52<8:47:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 1: 66%|██████▋ | 8230/12384 [17:28:00<8:47:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.95s]
Epoch 1: 66%|██████▋ | 8231/12384 [17:28:00<8:48:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.95s]
Epoch 1: 66%|██████▋ | 8231/12384 [17:28:08<8:48:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.85s]
Epoch 1: 66%|██████▋ | 8232/12384 [17:28:08<8:53:47, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.85s]
Epoch 1: 66%|██████▋ | 8232/12384 [17:28:16<8:53:47, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 66%|██████▋ | 8233/12384 [17:28:16<8:58:58, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 66%|██████▋ | 8233/12384 [17:28:23<8:58:58, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 66%|██████▋ | 8234/12384 [17:28:23<8:55:12, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 66%|██████▋ | 8234/12384 [17:28:31<8:55:12, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 66%|██████▋ | 8235/12384 [17:28:31<8:55:07, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 66%|██████▋ | 8235/12384 [17:28:39<8:55:07, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 1: 67%|██████▋ | 8236/12384 [17:28:39<8:52:09, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 1: 67%|██████▋ | 8236/12384 [17:28:46<8:52:09, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 67%|██████▋ | 8237/12384 [17:28:46<8:50:51, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 67%|██████▋ | 8237/12384 [17:28:54<8:50:51, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 67%|██████▋ | 8238/12384 [17:28:54<8:49:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 67%|██████▋ | 8238/12384 [17:29:02<8:49:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 67%|██████▋ | 8239/12384 [17:29:02<8:48:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 67%|██████▋ | 8239/12384 [17:29:09<8:48:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 67%|██████▋ | 8240/12384 [17:29:09<8:47:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 67%|██████▋ | 8240/12384 [17:29:17<8:47:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 67%|██████▋ | 8241/12384 [17:29:17<8:47:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 67%|██████▋ | 8241/12384 [17:29:25<8:47:45, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=7.70s]
Epoch 1: 67%|██████▋ | 8242/12384 [17:29:25<8:47:17, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=7.70s]
Epoch 1: 67%|██████▋ | 8242/12384 [17:29:32<8:47:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 67%|██████▋ | 8243/12384 [17:29:32<8:46:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 67%|██████▋ | 8243/12384 [17:29:40<8:46:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 67%|██████▋ | 8244/12384 [17:29:40<8:45:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 67%|██████▋ | 8244/12384 [17:29:47<8:45:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 1: 67%|██████▋ | 8245/12384 [17:29:47<8:45:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 1: 67%|██████▋ | 8245/12384 [17:29:55<8:45:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 67%|██████▋ | 8246/12384 [17:29:55<8:46:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 67%|██████▋ | 8246/12384 [17:30:03<8:46:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 67%|██████▋ | 8247/12384 [17:30:03<8:45:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 67%|██████▋ | 8247/12384 [17:30:10<8:45:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 67%|██████▋ | 8248/12384 [17:30:10<8:45:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 67%|██████▋ | 8248/12384 [17:30:18<8:45:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 67%|██████▋ | 8249/12384 [17:30:18<8:45:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 67%|██████▋ | 8249/12384 [17:30:25<8:45:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 67%|██████▋ | 8250/12384 [17:30:25<8:44:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 67%|██████▋ | 8250/12384 [17:30:33<8:44:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 1: 67%|██████▋ | 8251/12384 [17:30:33<8:44:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 1: 67%|██████▋ | 8251/12384 [17:30:41<8:44:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.13s]
Epoch 1: 67%|██████▋ | 8252/12384 [17:30:41<8:44:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.13s]
Epoch 1: 67%|██████▋ | 8252/12384 [17:30:48<8:44:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.72s]
Epoch 1: 67%|██████▋ | 8253/12384 [17:30:48<8:45:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.72s]
Epoch 1: 67%|██████▋ | 8253/12384 [17:30:56<8:45:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 67%|██████▋ | 8254/12384 [17:30:56<8:44:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 67%|██████▋ | 8254/12384 [17:31:04<8:44:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 67%|██████▋ | 8255/12384 [17:31:04<8:44:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 67%|██████▋ | 8255/12384 [17:31:11<8:44:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 67%|██████▋ | 8256/12384 [17:31:11<8:44:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 67%|██████▋ | 8256/12384 [17:31:19<8:44:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 1: 67%|██████▋ | 8257/12384 [17:31:19<8:43:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 1: 67%|██████▋ | 8257/12384 [17:31:27<8:43:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 1: 67%|██████▋ | 8258/12384 [17:31:27<8:49:53, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 1: 67%|██████▋ | 8258/12384 [17:31:35<8:49:53, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 67%|██████▋ | 8259/12384 [17:31:35<8:55:06, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 67%|██████▋ | 8259/12384 [17:31:42<8:55:06, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 67%|██████▋ | 8260/12384 [17:31:42<8:51:20, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 67%|██████▋ | 8260/12384 [17:31:50<8:51:20, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=4.86s]
Epoch 1: 67%|██████▋ | 8261/12384 [17:31:50<8:48:28, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.86s]
Epoch 1: 67%|██████▋ | 8261/12384 [17:31:58<8:48:28, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=10.98s]
Epoch 1: 67%|██████▋ | 8262/12384 [17:31:58<8:46:47, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=10.98s]
Epoch 1: 67%|██████▋ | 8262/12384 [17:32:05<8:46:47, 7.67s/it, loss=0.0001, acc=0.9994, iter_time=7.64s]
Epoch 1: 67%|██████▋ | 8263/12384 [17:32:05<8:45:41, 7.65s/it, loss=0.0001, acc=0.9994, iter_time=7.64s]
Epoch 1: 67%|██████▋ | 8263/12384 [17:32:13<8:45:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 67%|██████▋ | 8264/12384 [17:32:13<8:45:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 67%|██████▋ | 8264/12384 [17:32:20<8:45:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.43s]
Epoch 1: 67%|██████▋ | 8265/12384 [17:32:20<8:43:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.43s]
Epoch 1: 67%|██████▋ | 8265/12384 [17:32:28<8:43:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.79s]
Epoch 1: 67%|██████▋ | 8266/12384 [17:32:28<8:43:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.79s]
Epoch 1: 67%|██████▋ | 8266/12384 [17:32:36<8:43:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 67%|██████▋ | 8267/12384 [17:32:36<8:42:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 67%|██████▋ | 8267/12384 [17:32:43<8:42:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 67%|██████▋ | 8268/12384 [17:32:43<8:42:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 67%|██████▋ | 8268/12384 [17:32:51<8:42:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 1: 67%|██████▋ | 8269/12384 [17:32:51<8:41:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 1: 67%|██████▋ | 8269/12384 [17:32:58<8:41:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.36s]
Epoch 1: 67%|██████▋ | 8270/12384 [17:32:58<8:41:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.36s]
Epoch 1: 67%|██████▋ | 8270/12384 [17:33:06<8:41:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 1: 67%|██████▋ | 8271/12384 [17:33:06<8:41:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 1: 67%|██████▋ | 8271/12384 [17:33:14<8:41:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 67%|██████▋ | 8272/12384 [17:33:14<8:41:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 67%|██████▋ | 8272/12384 [17:33:21<8:41:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 67%|██████▋ | 8273/12384 [17:33:21<8:40:29, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 67%|██████▋ | 8273/12384 [17:33:29<8:40:29, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 67%|██████▋ | 8274/12384 [17:33:29<8:40:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 67%|██████▋ | 8274/12384 [17:33:36<8:40:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 67%|██████▋ | 8275/12384 [17:33:36<8:40:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 67%|██████▋ | 8275/12384 [17:33:44<8:40:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 67%|██████▋ | 8276/12384 [17:33:44<8:40:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 67%|██████▋ | 8276/12384 [17:33:52<8:40:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 67%|██████▋ | 8277/12384 [17:33:52<8:40:29, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 67%|██████▋ | 8277/12384 [17:33:59<8:40:29, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 67%|██████▋ | 8278/12384 [17:33:59<8:40:16, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 67%|██████▋ | 8278/12384 [17:34:07<8:40:16, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 67%|██████▋ | 8279/12384 [17:34:07<8:40:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 67%|██████▋ | 8279/12384 [17:34:14<8:40:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.96s]
Epoch 1: 67%|██████▋ | 8280/12384 [17:34:14<8:40:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.96s]
Epoch 1: 67%|██████▋ | 8280/12384 [17:34:22<8:40:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 67%|██████▋ | 8281/12384 [17:34:22<8:40:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 67%|██████▋ | 8281/12384 [17:34:30<8:40:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 67%|██████▋ | 8282/12384 [17:34:30<8:39:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 67%|██████▋ | 8282/12384 [17:34:37<8:39:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 1: 67%|██████▋ | 8283/12384 [17:34:37<8:40:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 1: 67%|██████▋ | 8283/12384 [17:34:45<8:40:02, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.97s]
Epoch 1: 67%|██████▋ | 8284/12384 [17:34:45<8:46:20, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=10.97s]
Epoch 1: 67%|██████▋ | 8284/12384 [17:34:53<8:46:20, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 1: 67%|██████▋ | 8285/12384 [17:34:53<8:51:23, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 1: 67%|██████▋ | 8285/12384 [17:35:01<8:51:23, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=8.72s]
Epoch 1: 67%|██████▋ | 8286/12384 [17:35:01<8:48:22, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.72s]
Epoch 1: 67%|██████▋ | 8286/12384 [17:35:08<8:48:22, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 1: 67%|██████▋ | 8287/12384 [17:35:08<8:45:48, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 1: 67%|██████▋ | 8287/12384 [17:35:16<8:45:48, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 67%|██████▋ | 8288/12384 [17:35:16<8:43:44, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 67%|██████▋ | 8288/12384 [17:35:24<8:43:44, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=6.70s]
Epoch 1: 67%|██████▋ | 8289/12384 [17:35:24<8:41:58, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=6.70s]
Epoch 1: 67%|██████▋ | 8289/12384 [17:35:31<8:41:58, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 1: 67%|██████▋ | 8290/12384 [17:35:31<8:40:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 1: 67%|██████▋ | 8290/12384 [17:35:39<8:40:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 1: 67%|██████▋ | 8291/12384 [17:35:39<8:40:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 1: 67%|██████▋ | 8291/12384 [17:35:46<8:40:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.15s]
Epoch 1: 67%|██████▋ | 8292/12384 [17:35:46<8:39:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.15s]
Epoch 1: 67%|██████▋ | 8292/12384 [17:35:54<8:39:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 1: 67%|██████▋ | 8293/12384 [17:35:54<8:39:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 1: 67%|██████▋ | 8293/12384 [17:36:02<8:39:20, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.84s]
Epoch 1: 67%|██████▋ | 8294/12384 [17:36:02<8:39:56, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.84s]
Epoch 1: 67%|██████▋ | 8294/12384 [17:36:09<8:39:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.56s]
Epoch 1: 67%|██████▋ | 8295/12384 [17:36:09<8:39:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.56s]
Epoch 1: 67%|██████▋ | 8295/12384 [17:36:17<8:39:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 1: 67%|██████▋ | 8296/12384 [17:36:17<8:38:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 1: 67%|██████▋ | 8296/12384 [17:36:24<8:38:45, 7.61s/it, loss=0.0003, acc=0.9994, iter_time=7.20s]
Epoch 1: 67%|██████▋ | 8297/12384 [17:36:24<8:38:48, 7.62s/it, loss=0.0003, acc=0.9994, iter_time=7.20s]
Epoch 1: 67%|██████▋ | 8297/12384 [17:36:32<8:38:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.33s]
Epoch 1: 67%|██████▋ | 8298/12384 [17:36:32<8:38:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.33s]
Epoch 1: 67%|██████▋ | 8298/12384 [17:36:40<8:38:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.92s]
Epoch 1: 67%|██████▋ | 8299/12384 [17:36:40<8:37:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.92s]
Epoch 1: 67%|██████▋ | 8299/12384 [17:36:47<8:37:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 67%|██████▋ | 8300/12384 [17:36:47<8:37:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 67%|██████▋ | 8300/12384 [17:36:55<8:37:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 1: 67%|██████▋ | 8301/12384 [17:36:55<8:39:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 1: 67%|██████▋ | 8301/12384 [17:37:03<8:39:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 1: 67%|██████▋ | 8302/12384 [17:37:03<8:39:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 1: 67%|██████▋ | 8302/12384 [17:37:10<8:39:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 67%|██████▋ | 8303/12384 [17:37:10<8:38:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 67%|██████▋ | 8303/12384 [17:37:18<8:38:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.94s]
Epoch 1: 67%|██████▋ | 8304/12384 [17:37:18<8:38:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.94s]
Epoch 1: 67%|██████▋ | 8304/12384 [17:37:25<8:38:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.63s]
Epoch 1: 67%|██████▋ | 8305/12384 [17:37:25<8:38:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.63s]
Epoch 1: 67%|██████▋ | 8305/12384 [17:37:33<8:38:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 1: 67%|██████▋ | 8306/12384 [17:37:33<8:37:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 1: 67%|██████▋ | 8306/12384 [17:37:41<8:37:55, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=6.69s]
Epoch 1: 67%|██████▋ | 8307/12384 [17:37:41<8:38:25, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=6.69s]
Epoch 1: 67%|██████▋ | 8307/12384 [17:37:48<8:38:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.00s]
Epoch 1: 67%|██████▋ | 8308/12384 [17:37:48<8:38:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.00s]
Epoch 1: 67%|██████▋ | 8308/12384 [17:37:56<8:38:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.26s]
Epoch 1: 67%|██████▋ | 8309/12384 [17:37:56<8:38:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.26s]
Epoch 1: 67%|██████▋ | 8309/12384 [17:38:04<8:38:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 67%|██████▋ | 8310/12384 [17:38:04<8:43:52, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 67%|██████▋ | 8310/12384 [17:38:12<8:43:52, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 67%|██████▋ | 8311/12384 [17:38:12<8:41:37, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 67%|██████▋ | 8311/12384 [17:38:19<8:41:37, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 1: 67%|██████▋ | 8312/12384 [17:38:19<8:46:05, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 1: 67%|██████▋ | 8312/12384 [17:38:27<8:46:05, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 1: 67%|██████▋ | 8313/12384 [17:38:27<8:42:39, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 1: 67%|██████▋ | 8313/12384 [17:38:35<8:42:39, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 1: 67%|██████▋ | 8314/12384 [17:38:35<8:40:47, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 1: 67%|██████▋ | 8314/12384 [17:38:42<8:40:47, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 67%|██████▋ | 8315/12384 [17:38:42<8:39:28, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 67%|██████▋ | 8315/12384 [17:38:50<8:39:28, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 67%|██████▋ | 8316/12384 [17:38:50<8:38:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 67%|██████▋ | 8316/12384 [17:38:57<8:38:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.67s]
Epoch 1: 67%|██████▋ | 8317/12384 [17:38:57<8:37:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.67s]
Epoch 1: 67%|██████▋ | 8317/12384 [17:39:05<8:37:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.01s]
Epoch 1: 67%|██████▋ | 8318/12384 [17:39:05<8:36:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.01s]
Epoch 1: 67%|██████▋ | 8318/12384 [17:39:13<8:36:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 67%|██████▋ | 8319/12384 [17:39:13<8:36:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 67%|██████▋ | 8319/12384 [17:39:20<8:36:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 1: 67%|██████▋ | 8320/12384 [17:39:20<8:36:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 1: 67%|██████▋ | 8320/12384 [17:39:28<8:36:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 67%|██████▋ | 8321/12384 [17:39:28<8:36:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 67%|██████▋ | 8321/12384 [17:39:36<8:36:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 1: 67%|██████▋ | 8322/12384 [17:39:36<8:35:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 1: 67%|██████▋ | 8322/12384 [17:39:43<8:35:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.01s]
Epoch 1: 67%|██████▋ | 8323/12384 [17:39:43<8:35:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.01s]
Epoch 1: 67%|██████▋ | 8323/12384 [17:39:51<8:35:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 1: 67%|██████▋ | 8324/12384 [17:39:51<8:35:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 1: 67%|██████▋ | 8324/12384 [17:39:58<8:35:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 67%|██████▋ | 8325/12384 [17:39:58<8:35:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 67%|██████▋ | 8325/12384 [17:40:06<8:35:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 67%|██████▋ | 8326/12384 [17:40:06<8:35:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 67%|██████▋ | 8326/12384 [17:40:14<8:35:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 1: 67%|██████▋ | 8327/12384 [17:40:14<8:34:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 1: 67%|██████▋ | 8327/12384 [17:40:21<8:34:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.52s]
Epoch 1: 67%|██████▋ | 8328/12384 [17:40:21<8:34:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.52s]
Epoch 1: 67%|██████▋ | 8328/12384 [17:40:29<8:34:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 67%|██████▋ | 8329/12384 [17:40:29<8:35:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 67%|██████▋ | 8329/12384 [17:40:36<8:35:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 67%|██████▋ | 8330/12384 [17:40:36<8:35:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 67%|██████▋ | 8330/12384 [17:40:44<8:35:18, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=7.62s]
Epoch 1: 67%|██████▋ | 8331/12384 [17:40:44<8:34:47, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=7.62s]
Epoch 1: 67%|██████▋ | 8331/12384 [17:40:52<8:34:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 67%|██████▋ | 8332/12384 [17:40:52<8:34:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 67%|██████▋ | 8332/12384 [17:40:59<8:34:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 67%|██████▋ | 8333/12384 [17:40:59<8:33:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 67%|██████▋ | 8333/12384 [17:41:07<8:33:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 67%|██████▋ | 8334/12384 [17:41:07<8:34:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 67%|██████▋ | 8334/12384 [17:41:15<8:34:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.60s]
Epoch 1: 67%|██████▋ | 8335/12384 [17:41:15<8:33:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.60s]
Epoch 1: 67%|██████▋ | 8335/12384 [17:41:22<8:33:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.59s]
Epoch 1: 67%|██████▋ | 8336/12384 [17:41:22<8:33:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.59s]
Epoch 1: 67%|██████▋ | 8336/12384 [17:41:30<8:33:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.05s]
Epoch 1: 67%|██████▋ | 8337/12384 [17:41:30<8:33:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.05s]
Epoch 1: 67%|██████▋ | 8337/12384 [17:41:38<8:33:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.28s]
Epoch 1: 67%|██████▋ | 8338/12384 [17:41:38<8:40:22, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.28s]
Epoch 1: 67%|██████▋ | 8338/12384 [17:41:45<8:40:22, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=4.31s]
Epoch 1: 67%|██████▋ | 8339/12384 [17:41:45<8:38:29, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.31s]
Epoch 1: 67%|██████▋ | 8339/12384 [17:41:53<8:38:29, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=11.20s]
Epoch 1: 67%|██████▋ | 8340/12384 [17:41:53<8:36:13, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=11.20s]
Epoch 1: 67%|██████▋ | 8340/12384 [17:42:01<8:36:13, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 67%|██████▋ | 8341/12384 [17:42:01<8:35:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 67%|██████▋ | 8341/12384 [17:42:08<8:35:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.77s]
Epoch 1: 67%|██████▋ | 8342/12384 [17:42:08<8:34:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.77s]
Epoch 1: 67%|██████▋ | 8342/12384 [17:42:16<8:34:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 1: 67%|██████▋ | 8343/12384 [17:42:16<8:34:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 1: 67%|██████▋ | 8343/12384 [17:42:24<8:34:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 1: 67%|██████▋ | 8344/12384 [17:42:24<8:35:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 1: 67%|██████▋ | 8344/12384 [17:42:31<8:35:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 1: 67%|██████▋ | 8345/12384 [17:42:31<8:34:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 1: 67%|██████▋ | 8345/12384 [17:42:39<8:34:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 1: 67%|██████▋ | 8346/12384 [17:42:39<8:33:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 1: 67%|██████▋ | 8346/12384 [17:42:46<8:33:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 67%|██████▋ | 8347/12384 [17:42:46<8:32:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 67%|██████▋ | 8347/12384 [17:42:54<8:32:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 1: 67%|██████▋ | 8348/12384 [17:42:54<8:32:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 1: 67%|██████▋ | 8348/12384 [17:43:02<8:32:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.15s]
Epoch 1: 67%|██████▋ | 8349/12384 [17:43:02<8:32:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.15s]
Epoch 1: 67%|██████▋ | 8349/12384 [17:43:09<8:32:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.03s]
Epoch 1: 67%|██████▋ | 8350/12384 [17:43:09<8:32:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.03s]
Epoch 1: 67%|██████▋ | 8350/12384 [17:43:17<8:32:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.22s]
Epoch 1: 67%|██████▋ | 8351/12384 [17:43:17<8:32:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.22s]
Epoch 1: 67%|██████▋ | 8351/12384 [17:43:24<8:32:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 67%|██████▋ | 8352/12384 [17:43:24<8:31:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 67%|██████▋ | 8352/12384 [17:43:32<8:31:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 67%|██████▋ | 8353/12384 [17:43:32<8:31:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 67%|██████▋ | 8353/12384 [17:43:40<8:31:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 67%|██████▋ | 8354/12384 [17:43:40<8:31:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 67%|██████▋ | 8354/12384 [17:43:47<8:31:44, 7.62s/it, loss=0.0001, acc=0.9997, iter_time=7.94s]
Epoch 1: 67%|██████▋ | 8355/12384 [17:43:47<8:31:05, 7.61s/it, loss=0.0001, acc=0.9997, iter_time=7.94s]
Epoch 1: 67%|██████▋ | 8355/12384 [17:43:55<8:31:05, 7.61s/it, loss=0.0001, acc=0.9992, iter_time=7.60s]
Epoch 1: 67%|██████▋ | 8356/12384 [17:43:55<8:30:43, 7.61s/it, loss=0.0001, acc=0.9992, iter_time=7.60s]
Epoch 1: 67%|██████▋ | 8356/12384 [17:44:02<8:30:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.72s]
Epoch 1: 67%|██████▋ | 8357/12384 [17:44:02<8:30:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.72s]
Epoch 1: 67%|██████▋ | 8357/12384 [17:44:10<8:30:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 1: 67%|██████▋ | 8358/12384 [17:44:10<8:30:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 1: 67%|██████▋ | 8358/12384 [17:44:18<8:30:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 67%|██████▋ | 8359/12384 [17:44:18<8:30:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 67%|██████▋ | 8359/12384 [17:44:25<8:30:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 68%|██████▊ | 8360/12384 [17:44:25<8:30:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 68%|██████▊ | 8360/12384 [17:44:33<8:30:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 68%|██████▊ | 8361/12384 [17:44:33<8:31:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 68%|██████▊ | 8361/12384 [17:44:41<8:31:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 68%|██████▊ | 8362/12384 [17:44:41<8:32:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 68%|██████▊ | 8362/12384 [17:44:49<8:32:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 68%|██████▊ | 8363/12384 [17:44:49<8:37:14, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 68%|██████▊ | 8363/12384 [17:44:56<8:37:14, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 68%|██████▊ | 8364/12384 [17:44:56<8:34:50, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 68%|██████▊ | 8364/12384 [17:45:04<8:34:50, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 1: 68%|██████▊ | 8365/12384 [17:45:04<8:40:14, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 1: 68%|██████▊ | 8365/12384 [17:45:12<8:40:14, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=11.66s]
Epoch 1: 68%|██████▊ | 8366/12384 [17:45:12<8:36:25, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=11.66s]
Epoch 1: 68%|██████▊ | 8366/12384 [17:45:19<8:36:25, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 68%|██████▊ | 8367/12384 [17:45:19<8:33:53, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 68%|██████▊ | 8367/12384 [17:45:27<8:33:53, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 68%|██████▊ | 8368/12384 [17:45:27<8:32:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 68%|██████▊ | 8368/12384 [17:45:35<8:32:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.60s]
Epoch 1: 68%|██████▊ | 8369/12384 [17:45:35<8:31:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.60s]
Epoch 1: 68%|██████▊ | 8369/12384 [17:45:42<8:31:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 1: 68%|██████▊ | 8370/12384 [17:45:42<8:32:31, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 1: 68%|██████▊ | 8370/12384 [17:45:50<8:32:31, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.67s]
Epoch 1: 68%|██████▊ | 8371/12384 [17:45:50<8:31:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.67s]
Epoch 1: 68%|██████▊ | 8371/12384 [17:45:57<8:31:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 1: 68%|██████▊ | 8372/12384 [17:45:57<8:30:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 1: 68%|██████▊ | 8372/12384 [17:46:05<8:30:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 1: 68%|██████▊ | 8373/12384 [17:46:05<8:29:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 1: 68%|██████▊ | 8373/12384 [17:46:13<8:29:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 1: 68%|██████▊ | 8374/12384 [17:46:13<8:30:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 1: 68%|██████▊ | 8374/12384 [17:46:20<8:30:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 68%|██████▊ | 8375/12384 [17:46:20<8:29:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 68%|██████▊ | 8375/12384 [17:46:28<8:29:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 68%|██████▊ | 8376/12384 [17:46:28<8:28:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 68%|██████▊ | 8376/12384 [17:46:36<8:28:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.21s]
Epoch 1: 68%|██████▊ | 8377/12384 [17:46:36<8:28:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.21s]
Epoch 1: 68%|██████▊ | 8377/12384 [17:46:43<8:28:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.04s]
Epoch 1: 68%|██████▊ | 8378/12384 [17:46:43<8:28:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.04s]
Epoch 1: 68%|██████▊ | 8378/12384 [17:46:51<8:28:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.20s]
Epoch 1: 68%|██████▊ | 8379/12384 [17:46:51<8:28:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.20s]
Epoch 1: 68%|██████▊ | 8379/12384 [17:46:58<8:28:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 68%|██████▊ | 8380/12384 [17:46:58<8:27:27, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 68%|██████▊ | 8380/12384 [17:47:06<8:27:27, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 1: 68%|██████▊ | 8381/12384 [17:47:06<8:27:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 1: 68%|██████▊ | 8381/12384 [17:47:14<8:27:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 1: 68%|██████▊ | 8382/12384 [17:47:14<8:27:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 1: 68%|██████▊ | 8382/12384 [17:47:21<8:27:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 68%|██████▊ | 8383/12384 [17:47:21<8:27:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 68%|██████▊ | 8383/12384 [17:47:29<8:27:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 68%|██████▊ | 8384/12384 [17:47:29<8:27:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 68%|██████▊ | 8384/12384 [17:47:36<8:27:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 68%|██████▊ | 8385/12384 [17:47:36<8:29:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 68%|██████▊ | 8385/12384 [17:47:44<8:29:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 1: 68%|██████▊ | 8386/12384 [17:47:44<8:28:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 1: 68%|██████▊ | 8386/12384 [17:47:52<8:28:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 68%|██████▊ | 8387/12384 [17:47:52<8:28:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 68%|██████▊ | 8387/12384 [17:47:59<8:28:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 68%|██████▊ | 8388/12384 [17:47:59<8:28:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 68%|██████▊ | 8388/12384 [17:48:07<8:28:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 68%|██████▊ | 8389/12384 [17:48:07<8:33:15, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 68%|██████▊ | 8389/12384 [17:48:15<8:33:15, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 68%|██████▊ | 8390/12384 [17:48:15<8:31:08, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 68%|██████▊ | 8390/12384 [17:48:23<8:31:08, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 68%|██████▊ | 8391/12384 [17:48:23<8:35:08, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 68%|██████▊ | 8391/12384 [17:48:30<8:35:08, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 68%|██████▊ | 8392/12384 [17:48:30<8:32:11, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 68%|██████▊ | 8392/12384 [17:48:38<8:32:11, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 68%|██████▊ | 8393/12384 [17:48:38<8:30:06, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 68%|██████▊ | 8393/12384 [17:48:46<8:30:06, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 68%|██████▊ | 8394/12384 [17:48:46<8:28:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 68%|██████▊ | 8394/12384 [17:48:53<8:28:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 68%|██████▊ | 8395/12384 [17:48:53<8:28:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 68%|██████▊ | 8395/12384 [17:49:01<8:28:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 68%|██████▊ | 8396/12384 [17:49:01<8:28:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 68%|██████▊ | 8396/12384 [17:49:08<8:28:21, 7.65s/it, loss=0.0002, acc=0.9984, iter_time=4.48s]
Epoch 1: 68%|██████▊ | 8397/12384 [17:49:08<8:27:22, 7.64s/it, loss=0.0002, acc=0.9984, iter_time=4.48s]
Epoch 1: 68%|██████▊ | 8397/12384 [17:49:16<8:27:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.71s]
Epoch 1: 68%|██████▊ | 8398/12384 [17:49:16<8:26:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.71s]
Epoch 1: 68%|██████▊ | 8398/12384 [17:49:24<8:26:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 68%|██████▊ | 8399/12384 [17:49:24<8:26:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 68%|██████▊ | 8399/12384 [17:49:31<8:26:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 68%|██████▊ | 8400/12384 [17:49:31<8:25:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 68%|██████▊ | 8400/12384 [17:49:39<8:25:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 68%|██████▊ | 8401/12384 [17:49:39<8:25:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 68%|██████▊ | 8401/12384 [17:49:46<8:25:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 1: 68%|██████▊ | 8402/12384 [17:49:46<8:25:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 1: 68%|██████▊ | 8402/12384 [17:49:54<8:25:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 1: 68%|██████▊ | 8403/12384 [17:49:54<8:24:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 1: 68%|██████▊ | 8403/12384 [17:50:02<8:24:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.99s]
Epoch 1: 68%|██████▊ | 8404/12384 [17:50:02<8:25:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.99s]
Epoch 1: 68%|██████▊ | 8404/12384 [17:50:09<8:25:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 1: 68%|██████▊ | 8405/12384 [17:50:09<8:25:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 1: 68%|██████▊ | 8405/12384 [17:50:17<8:25:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 68%|██████▊ | 8406/12384 [17:50:17<8:25:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 68%|██████▊ | 8406/12384 [17:50:25<8:25:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 68%|██████▊ | 8407/12384 [17:50:25<8:25:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 68%|██████▊ | 8407/12384 [17:50:32<8:25:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 68%|██████▊ | 8408/12384 [17:50:32<8:25:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 68%|██████▊ | 8408/12384 [17:50:40<8:25:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 68%|██████▊ | 8409/12384 [17:50:40<8:24:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 68%|██████▊ | 8409/12384 [17:50:47<8:24:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 68%|██████▊ | 8410/12384 [17:50:47<8:24:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 68%|██████▊ | 8410/12384 [17:50:55<8:24:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 68%|██████▊ | 8411/12384 [17:50:55<8:23:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 68%|██████▊ | 8411/12384 [17:51:03<8:23:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 68%|██████▊ | 8412/12384 [17:51:03<8:23:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 68%|██████▊ | 8412/12384 [17:51:10<8:23:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 68%|██████▊ | 8413/12384 [17:51:10<8:23:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 68%|██████▊ | 8413/12384 [17:51:18<8:23:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 1: 68%|██████▊ | 8414/12384 [17:51:18<8:23:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 1: 68%|██████▊ | 8414/12384 [17:51:25<8:23:23, 7.61s/it, loss=0.0002, acc=0.9983, iter_time=6.51s]
Epoch 1: 68%|██████▊ | 8415/12384 [17:51:25<8:23:27, 7.61s/it, loss=0.0002, acc=0.9983, iter_time=6.51s]
Epoch 1: 68%|██████▊ | 8415/12384 [17:51:33<8:23:27, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.56s]
Epoch 1: 68%|██████▊ | 8416/12384 [17:51:33<8:22:56, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=10.56s]
Epoch 1: 68%|██████▊ | 8416/12384 [17:51:41<8:22:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 68%|██████▊ | 8417/12384 [17:51:41<8:28:27, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 68%|██████▊ | 8417/12384 [17:51:49<8:28:27, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 1: 68%|██████▊ | 8418/12384 [17:51:49<8:26:53, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 1: 68%|██████▊ | 8418/12384 [17:51:56<8:26:53, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.66s]
Epoch 1: 68%|██████▊ | 8419/12384 [17:51:56<8:25:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.66s]
Epoch 1: 68%|██████▊ | 8419/12384 [17:52:04<8:25:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 68%|██████▊ | 8420/12384 [17:52:04<8:24:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 68%|██████▊ | 8420/12384 [17:52:11<8:24:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 1: 68%|██████▊ | 8421/12384 [17:52:11<8:24:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 1: 68%|██████▊ | 8421/12384 [17:52:19<8:24:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.24s]
Epoch 1: 68%|██████▊ | 8422/12384 [17:52:19<8:24:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.24s]
Epoch 1: 68%|██████▊ | 8422/12384 [17:52:27<8:24:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 68%|██████▊ | 8423/12384 [17:52:27<8:25:47, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 68%|██████▊ | 8423/12384 [17:52:34<8:25:47, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 1: 68%|██████▊ | 8424/12384 [17:52:34<8:24:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 1: 68%|██████▊ | 8424/12384 [17:52:42<8:24:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 68%|██████▊ | 8425/12384 [17:52:42<8:23:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 68%|██████▊ | 8425/12384 [17:52:50<8:23:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 68%|██████▊ | 8426/12384 [17:52:50<8:23:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 68%|██████▊ | 8426/12384 [17:52:57<8:23:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 68%|██████▊ | 8427/12384 [17:52:57<8:22:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 68%|██████▊ | 8427/12384 [17:53:05<8:22:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.99s]
Epoch 1: 68%|██████▊ | 8428/12384 [17:53:05<8:21:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.99s]
Epoch 1: 68%|██████▊ | 8428/12384 [17:53:12<8:21:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.35s]
Epoch 1: 68%|██████▊ | 8429/12384 [17:53:12<8:21:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.35s]
Epoch 1: 68%|██████▊ | 8429/12384 [17:53:20<8:21:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 1: 68%|██████▊ | 8430/12384 [17:53:20<8:21:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 1: 68%|██████▊ | 8430/12384 [17:53:28<8:21:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 1: 68%|██████▊ | 8431/12384 [17:53:28<8:21:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 1: 68%|██████▊ | 8431/12384 [17:53:35<8:21:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.88s]
Epoch 1: 68%|██████▊ | 8432/12384 [17:53:35<8:21:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.88s]
Epoch 1: 68%|██████▊ | 8432/12384 [17:53:43<8:21:28, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.90s]
Epoch 1: 68%|██████▊ | 8433/12384 [17:53:43<8:21:23, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.90s]
Epoch 1: 68%|██████▊ | 8433/12384 [17:53:50<8:21:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 1: 68%|██████▊ | 8434/12384 [17:53:50<8:20:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 1: 68%|██████▊ | 8434/12384 [17:53:58<8:20:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 1: 68%|██████▊ | 8435/12384 [17:53:58<8:21:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 1: 68%|██████▊ | 8435/12384 [17:54:06<8:21:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 68%|██████▊ | 8436/12384 [17:54:06<8:20:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 68%|██████▊ | 8436/12384 [17:54:13<8:20:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 1: 68%|██████▊ | 8437/12384 [17:54:13<8:20:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 1: 68%|██████▊ | 8437/12384 [17:54:21<8:20:21, 7.61s/it, loss=0.0005, acc=0.9988, iter_time=8.44s]
Epoch 1: 68%|██████▊ | 8438/12384 [17:54:21<8:20:19, 7.61s/it, loss=0.0005, acc=0.9988, iter_time=8.44s]
Epoch 1: 68%|██████▊ | 8438/12384 [17:54:28<8:20:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 1: 68%|██████▊ | 8439/12384 [17:54:28<8:19:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 1: 68%|██████▊ | 8439/12384 [17:54:36<8:19:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 68%|██████▊ | 8440/12384 [17:54:36<8:20:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 68%|██████▊ | 8440/12384 [17:54:44<8:20:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 1: 68%|██████▊ | 8441/12384 [17:54:44<8:25:13, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 1: 68%|██████▊ | 8441/12384 [17:54:52<8:25:13, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 68%|██████▊ | 8442/12384 [17:54:52<8:23:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 68%|██████▊ | 8442/12384 [17:55:00<8:23:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 68%|██████▊ | 8443/12384 [17:55:00<8:29:35, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 68%|██████▊ | 8443/12384 [17:55:07<8:29:35, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 1: 68%|██████▊ | 8444/12384 [17:55:07<8:28:39, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 1: 68%|██████▊ | 8444/12384 [17:55:15<8:28:39, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 68%|██████▊ | 8445/12384 [17:55:15<8:25:51, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 68%|██████▊ | 8445/12384 [17:55:23<8:25:51, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=6.10s]
Epoch 1: 68%|██████▊ | 8446/12384 [17:55:23<8:24:13, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=6.10s]
Epoch 1: 68%|██████▊ | 8446/12384 [17:55:30<8:24:13, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 68%|██████▊ | 8447/12384 [17:55:30<8:22:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 68%|██████▊ | 8447/12384 [17:55:38<8:22:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.49s]
Epoch 1: 68%|██████▊ | 8448/12384 [17:55:38<8:21:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.49s]
Epoch 1: 68%|██████▊ | 8448/12384 [17:55:45<8:21:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.11s]
Epoch 1: 68%|██████▊ | 8449/12384 [17:55:45<8:21:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.11s]
Epoch 1: 68%|██████▊ | 8449/12384 [17:55:53<8:21:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 1: 68%|██████▊ | 8450/12384 [17:55:53<8:20:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 1: 68%|██████▊ | 8450/12384 [17:56:01<8:20:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 68%|██████▊ | 8451/12384 [17:56:01<8:19:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 68%|██████▊ | 8451/12384 [17:56:08<8:19:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 68%|██████▊ | 8452/12384 [17:56:08<8:19:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 68%|██████▊ | 8452/12384 [17:56:16<8:19:36, 7.62s/it, loss=0.0044, acc=0.9933, iter_time=7.61s]
Epoch 1: 68%|██████▊ | 8453/12384 [17:56:16<8:20:24, 7.64s/it, loss=0.0044, acc=0.9933, iter_time=7.61s]
Epoch 1: 68%|██████▊ | 8453/12384 [17:56:24<8:20:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 68%|██████▊ | 8454/12384 [17:56:24<8:19:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 68%|██████▊ | 8454/12384 [17:56:31<8:19:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 1: 68%|██████▊ | 8455/12384 [17:56:31<8:19:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 1: 68%|██████▊ | 8455/12384 [17:56:39<8:19:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.30s]
Epoch 1: 68%|██████▊ | 8456/12384 [17:56:39<8:19:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.30s]
Epoch 1: 68%|██████▊ | 8456/12384 [17:56:46<8:19:03, 7.62s/it, loss=0.0002, acc=0.9996, iter_time=7.23s]
Epoch 1: 68%|██████▊ | 8457/12384 [17:56:46<8:18:29, 7.62s/it, loss=0.0002, acc=0.9996, iter_time=7.23s]
Epoch 1: 68%|██████▊ | 8457/12384 [17:56:54<8:18:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.49s]
Epoch 1: 68%|██████▊ | 8458/12384 [17:56:54<8:18:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.49s]
Epoch 1: 68%|██████▊ | 8458/12384 [17:57:02<8:18:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 1: 68%|██████▊ | 8459/12384 [17:57:02<8:17:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 1: 68%|██████▊ | 8459/12384 [17:57:09<8:17:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 1: 68%|██████▊ | 8460/12384 [17:57:09<8:17:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 1: 68%|██████▊ | 8460/12384 [17:57:17<8:17:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 1: 68%|██████▊ | 8461/12384 [17:57:17<8:18:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 1: 68%|██████▊ | 8461/12384 [17:57:24<8:18:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 68%|██████▊ | 8462/12384 [17:57:24<8:18:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 68%|██████▊ | 8462/12384 [17:57:32<8:18:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 1: 68%|██████▊ | 8463/12384 [17:57:32<8:17:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 1: 68%|██████▊ | 8463/12384 [17:57:40<8:17:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 1: 68%|██████▊ | 8464/12384 [17:57:40<8:17:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 1: 68%|██████▊ | 8464/12384 [17:57:47<8:17:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 68%|██████▊ | 8465/12384 [17:57:47<8:17:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 68%|██████▊ | 8465/12384 [17:57:55<8:17:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 68%|██████▊ | 8466/12384 [17:57:55<8:17:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 68%|██████▊ | 8466/12384 [17:58:02<8:17:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.11s]
Epoch 1: 68%|██████▊ | 8467/12384 [17:58:02<8:16:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.11s]
Epoch 1: 68%|██████▊ | 8467/12384 [17:58:10<8:16:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 1: 68%|██████▊ | 8468/12384 [17:58:10<8:16:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 1: 68%|██████▊ | 8468/12384 [17:58:18<8:16:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.01s]
Epoch 1: 68%|██████▊ | 8469/12384 [17:58:18<8:23:19, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=11.01s]
Epoch 1: 68%|██████▊ | 8469/12384 [17:58:26<8:23:19, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 68%|██████▊ | 8470/12384 [17:58:26<8:23:34, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 68%|██████▊ | 8470/12384 [17:58:33<8:23:34, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.43s]
Epoch 1: 68%|██████▊ | 8471/12384 [17:58:33<8:21:02, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.43s]
Epoch 1: 68%|██████▊ | 8471/12384 [17:58:41<8:21:02, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 1: 68%|██████▊ | 8472/12384 [17:58:41<8:19:34, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 1: 68%|██████▊ | 8472/12384 [17:58:49<8:19:34, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 68%|██████▊ | 8473/12384 [17:58:49<8:18:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 68%|██████▊ | 8473/12384 [17:58:56<8:18:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 68%|██████▊ | 8474/12384 [17:58:56<8:18:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 68%|██████▊ | 8474/12384 [17:59:04<8:18:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.37s]
Epoch 1: 68%|██████▊ | 8475/12384 [17:59:04<8:19:04, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.37s]
Epoch 1: 68%|██████▊ | 8475/12384 [17:59:12<8:19:04, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.75s]
Epoch 1: 68%|██████▊ | 8476/12384 [17:59:12<8:18:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.75s]
Epoch 1: 68%|██████▊ | 8476/12384 [17:59:19<8:18:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 1: 68%|██████▊ | 8477/12384 [17:59:19<8:17:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 1: 68%|██████▊ | 8477/12384 [17:59:27<8:17:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 68%|██████▊ | 8478/12384 [17:59:27<8:17:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 68%|██████▊ | 8478/12384 [17:59:34<8:17:03, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.33s]
Epoch 1: 68%|██████▊ | 8479/12384 [17:59:34<8:16:15, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.33s]
Epoch 1: 68%|██████▊ | 8479/12384 [17:59:42<8:16:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 1: 68%|██████▊ | 8480/12384 [17:59:42<8:15:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 1: 68%|██████▊ | 8480/12384 [17:59:50<8:15:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 68%|██████▊ | 8481/12384 [17:59:50<8:15:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 68%|██████▊ | 8481/12384 [17:59:57<8:15:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 68%|██████▊ | 8482/12384 [17:59:57<8:15:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 68%|██████▊ | 8482/12384 [18:00:05<8:15:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 1: 68%|██████▊ | 8483/12384 [18:00:05<8:15:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 1: 68%|██████▊ | 8483/12384 [18:00:12<8:15:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.63s]
Epoch 1: 69%|██████▊ | 8484/12384 [18:00:12<8:14:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.63s]
Epoch 1: 69%|██████▊ | 8484/12384 [18:00:20<8:14:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.38s]
Epoch 1: 69%|██████▊ | 8485/12384 [18:00:20<8:14:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.38s]
Epoch 1: 69%|██████▊ | 8485/12384 [18:00:28<8:14:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 69%|██████▊ | 8486/12384 [18:00:28<8:14:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 69%|██████▊ | 8486/12384 [18:00:35<8:14:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.57s]
Epoch 1: 69%|██████▊ | 8487/12384 [18:00:35<8:13:44, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.57s]
Epoch 1: 69%|██████▊ | 8487/12384 [18:00:43<8:13:44, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 1: 69%|██████▊ | 8488/12384 [18:00:43<8:14:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 1: 69%|██████▊ | 8488/12384 [18:00:50<8:14:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 69%|██████▊ | 8489/12384 [18:00:50<8:13:39, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 69%|██████▊ | 8489/12384 [18:00:58<8:13:39, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 69%|██████▊ | 8490/12384 [18:00:58<8:13:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 69%|██████▊ | 8490/12384 [18:01:06<8:13:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 69%|██████▊ | 8491/12384 [18:01:06<8:13:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 69%|██████▊ | 8491/12384 [18:01:13<8:13:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 1: 69%|██████▊ | 8492/12384 [18:01:13<8:13:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 1: 69%|██████▊ | 8492/12384 [18:01:21<8:13:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.32s]
Epoch 1: 69%|██████▊ | 8493/12384 [18:01:21<8:12:32, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.32s]
Epoch 1: 69%|██████▊ | 8493/12384 [18:01:28<8:12:32, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 1: 69%|██████▊ | 8494/12384 [18:01:28<8:13:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 1: 69%|██████▊ | 8494/12384 [18:01:36<8:13:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 1: 69%|██████▊ | 8495/12384 [18:01:36<8:13:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 1: 69%|██████▊ | 8495/12384 [18:01:44<8:13:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 1: 69%|██████▊ | 8496/12384 [18:01:44<8:20:06, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 1: 69%|██████▊ | 8496/12384 [18:01:52<8:20:06, 7.72s/it, loss=0.0005, acc=0.9992, iter_time=7.49s]
Epoch 1: 69%|██████▊ | 8497/12384 [18:01:52<8:17:50, 7.68s/it, loss=0.0005, acc=0.9992, iter_time=7.49s]
Epoch 1: 69%|██████▊ | 8497/12384 [18:01:59<8:17:50, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 69%|██████▊ | 8498/12384 [18:01:59<8:16:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 69%|██████▊ | 8498/12384 [18:02:07<8:16:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 69%|██████▊ | 8499/12384 [18:02:07<8:14:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 69%|██████▊ | 8499/12384 [18:02:14<8:14:54, 7.64s/it, loss=0.0010, acc=0.9975, iter_time=7.61s]
Epoch 1: 69%|██████▊ | 8500/12384 [18:02:14<8:13:50, 7.63s/it, loss=0.0010, acc=0.9975, iter_time=7.61s]
Epoch 1: 69%|██████▊ | 8500/12384 [18:02:22<8:13:50, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 1: 69%|██████▊ | 8501/12384 [18:02:22<8:13:38, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 1: 69%|██████▊ | 8501/12384 [18:02:30<8:13:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.31s]
Epoch 1: 69%|██████▊ | 8502/12384 [18:02:30<8:12:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.31s]
Epoch 1: 69%|██████▊ | 8502/12384 [18:02:37<8:12:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 1: 69%|██████▊ | 8503/12384 [18:02:37<8:12:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 1: 69%|██████▊ | 8503/12384 [18:02:45<8:12:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 69%|██████▊ | 8504/12384 [18:02:45<8:12:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 69%|██████▊ | 8504/12384 [18:02:53<8:12:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.24s]
Epoch 1: 69%|██████▊ | 8505/12384 [18:02:53<8:12:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.24s]
Epoch 1: 69%|██████▊ | 8505/12384 [18:03:00<8:12:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.52s]
Epoch 1: 69%|██████▊ | 8506/12384 [18:03:00<8:11:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.52s]
Epoch 1: 69%|██████▊ | 8506/12384 [18:03:08<8:11:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 1: 69%|██████▊ | 8507/12384 [18:03:08<8:11:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 1: 69%|██████▊ | 8507/12384 [18:03:15<8:11:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 1: 69%|██████▊ | 8508/12384 [18:03:15<8:12:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 1: 69%|██████▊ | 8508/12384 [18:03:23<8:12:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 1: 69%|██████▊ | 8509/12384 [18:03:23<8:11:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 1: 69%|██████▊ | 8509/12384 [18:03:31<8:11:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 1: 69%|██████▊ | 8510/12384 [18:03:31<8:11:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 1: 69%|██████▊ | 8510/12384 [18:03:38<8:11:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 1: 69%|██████▊ | 8511/12384 [18:03:38<8:11:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 1: 69%|██████▊ | 8511/12384 [18:03:46<8:11:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 1: 69%|██████▊ | 8512/12384 [18:03:46<8:10:41, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 1: 69%|██████▊ | 8512/12384 [18:03:53<8:10:41, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 69%|██████▊ | 8513/12384 [18:03:53<8:10:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 69%|██████▊ | 8513/12384 [18:04:01<8:10:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 69%|██████▉ | 8514/12384 [18:04:01<8:10:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 69%|██████▉ | 8514/12384 [18:04:09<8:10:58, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 1: 69%|██████▉ | 8515/12384 [18:04:09<8:10:34, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 1: 69%|██████▉ | 8515/12384 [18:04:16<8:10:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 69%|██████▉ | 8516/12384 [18:04:16<8:10:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 69%|██████▉ | 8516/12384 [18:04:24<8:10:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.98s]
Epoch 1: 69%|██████▉ | 8517/12384 [18:04:24<8:09:40, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.98s]
Epoch 1: 69%|██████▉ | 8517/12384 [18:04:31<8:09:40, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 1: 69%|██████▉ | 8518/12384 [18:04:31<8:09:31, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 1: 69%|██████▉ | 8518/12384 [18:04:39<8:09:31, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 69%|██████▉ | 8519/12384 [18:04:39<8:09:44, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 69%|██████▉ | 8519/12384 [18:04:47<8:09:44, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 69%|██████▉ | 8520/12384 [18:04:47<8:11:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 69%|██████▉ | 8520/12384 [18:04:55<8:11:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 69%|██████▉ | 8521/12384 [18:04:55<8:16:15, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 69%|██████▉ | 8521/12384 [18:05:03<8:16:15, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 69%|██████▉ | 8522/12384 [18:05:03<8:19:46, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 69%|██████▉ | 8522/12384 [18:05:10<8:19:46, 7.76s/it, loss=0.0002, acc=0.9989, iter_time=5.50s]
Epoch 1: 69%|██████▉ | 8523/12384 [18:05:10<8:16:29, 7.72s/it, loss=0.0002, acc=0.9989, iter_time=5.50s]
Epoch 1: 69%|██████▉ | 8523/12384 [18:05:18<8:16:29, 7.72s/it, loss=0.0005, acc=0.9989, iter_time=9.94s]
Epoch 1: 69%|██████▉ | 8524/12384 [18:05:18<8:14:00, 7.68s/it, loss=0.0005, acc=0.9989, iter_time=9.94s]
Epoch 1: 69%|██████▉ | 8524/12384 [18:05:25<8:14:00, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 69%|██████▉ | 8525/12384 [18:05:25<8:12:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 69%|██████▉ | 8525/12384 [18:05:33<8:12:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 69%|██████▉ | 8526/12384 [18:05:33<8:11:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 69%|██████▉ | 8526/12384 [18:05:41<8:11:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.28s]
Epoch 1: 69%|██████▉ | 8527/12384 [18:05:41<8:10:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.28s]
Epoch 1: 69%|██████▉ | 8527/12384 [18:05:48<8:10:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.91s]
Epoch 1: 69%|██████▉ | 8528/12384 [18:05:48<8:10:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.91s]
Epoch 1: 69%|██████▉ | 8528/12384 [18:05:56<8:10:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 69%|██████▉ | 8529/12384 [18:05:56<8:09:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 69%|██████▉ | 8529/12384 [18:06:03<8:09:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 69%|██████▉ | 8530/12384 [18:06:03<8:09:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 69%|██████▉ | 8530/12384 [18:06:11<8:09:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 69%|██████▉ | 8531/12384 [18:06:11<8:08:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 69%|██████▉ | 8531/12384 [18:06:19<8:08:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 69%|██████▉ | 8532/12384 [18:06:19<8:08:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 69%|██████▉ | 8532/12384 [18:06:26<8:08:29, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 1: 69%|██████▉ | 8533/12384 [18:06:26<8:08:34, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 1: 69%|██████▉ | 8533/12384 [18:06:34<8:08:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 69%|██████▉ | 8534/12384 [18:06:34<8:08:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 69%|██████▉ | 8534/12384 [18:06:41<8:08:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 1: 69%|██████▉ | 8535/12384 [18:06:41<8:08:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 1: 69%|██████▉ | 8535/12384 [18:06:49<8:08:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 69%|██████▉ | 8536/12384 [18:06:49<8:08:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 69%|██████▉ | 8536/12384 [18:06:57<8:08:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 69%|██████▉ | 8537/12384 [18:06:57<8:08:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 69%|██████▉ | 8537/12384 [18:07:04<8:08:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.50s]
Epoch 1: 69%|██████▉ | 8538/12384 [18:07:04<8:07:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.50s]
Epoch 1: 69%|██████▉ | 8538/12384 [18:07:12<8:07:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 1: 69%|██████▉ | 8539/12384 [18:07:12<8:09:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 1: 69%|██████▉ | 8539/12384 [18:07:20<8:09:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 69%|██████▉ | 8540/12384 [18:07:20<8:07:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 69%|██████▉ | 8540/12384 [18:07:27<8:07:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 69%|██████▉ | 8541/12384 [18:07:27<8:07:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 69%|██████▉ | 8541/12384 [18:07:35<8:07:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 1: 69%|██████▉ | 8542/12384 [18:07:35<8:06:54, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 1: 69%|██████▉ | 8542/12384 [18:07:42<8:06:54, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 1: 69%|██████▉ | 8543/12384 [18:07:42<8:06:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 1: 69%|██████▉ | 8543/12384 [18:07:50<8:06:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 69%|██████▉ | 8544/12384 [18:07:50<8:06:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 69%|██████▉ | 8544/12384 [18:07:58<8:06:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 69%|██████▉ | 8545/12384 [18:07:58<8:06:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 69%|██████▉ | 8545/12384 [18:08:05<8:06:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 69%|██████▉ | 8546/12384 [18:08:05<8:06:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 69%|██████▉ | 8546/12384 [18:08:13<8:06:44, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.92s]
Epoch 1: 69%|██████▉ | 8547/12384 [18:08:13<8:12:17, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.92s]
Epoch 1: 69%|██████▉ | 8547/12384 [18:08:21<8:12:17, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.20s]
Epoch 1: 69%|██████▉ | 8548/12384 [18:08:21<8:10:36, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.20s]
Epoch 1: 69%|██████▉ | 8548/12384 [18:08:29<8:10:36, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=11.06s]
Epoch 1: 69%|██████▉ | 8549/12384 [18:08:29<8:15:42, 7.76s/it, loss=0.0001, acc=1.0000, iter_time=11.06s]
Epoch 1: 69%|██████▉ | 8549/12384 [18:08:36<8:15:42, 7.76s/it, loss=0.0001, acc=1.0000, iter_time=5.85s]
Epoch 1: 69%|██████▉ | 8550/12384 [18:08:36<8:12:46, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=5.85s]
Epoch 1: 69%|██████▉ | 8550/12384 [18:08:44<8:12:46, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 1: 69%|██████▉ | 8551/12384 [18:08:44<8:10:49, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 1: 69%|██████▉ | 8551/12384 [18:08:51<8:10:49, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 69%|██████▉ | 8552/12384 [18:08:51<8:09:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 69%|██████▉ | 8552/12384 [18:08:59<8:09:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 69%|██████▉ | 8553/12384 [18:08:59<8:08:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 69%|██████▉ | 8553/12384 [18:09:07<8:08:16, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=6.44s]
Epoch 1: 69%|██████▉ | 8554/12384 [18:09:07<8:08:03, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=6.44s]
Epoch 1: 69%|██████▉ | 8554/12384 [18:09:14<8:08:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.95s]
Epoch 1: 69%|██████▉ | 8555/12384 [18:09:14<8:07:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.95s]
Epoch 1: 69%|██████▉ | 8555/12384 [18:09:22<8:07:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 1: 69%|██████▉ | 8556/12384 [18:09:22<8:08:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 1: 69%|██████▉ | 8556/12384 [18:09:30<8:08:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 69%|██████▉ | 8557/12384 [18:09:30<8:07:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 69%|██████▉ | 8557/12384 [18:09:37<8:07:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 1: 69%|██████▉ | 8558/12384 [18:09:37<8:06:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 1: 69%|██████▉ | 8558/12384 [18:09:45<8:06:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 1: 69%|██████▉ | 8559/12384 [18:09:45<8:06:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 1: 69%|██████▉ | 8559/12384 [18:09:52<8:06:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.29s]
Epoch 1: 69%|██████▉ | 8560/12384 [18:09:52<8:06:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.29s]
Epoch 1: 69%|██████▉ | 8560/12384 [18:10:00<8:06:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 69%|██████▉ | 8561/12384 [18:10:00<8:06:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 69%|██████▉ | 8561/12384 [18:10:08<8:06:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 69%|██████▉ | 8562/12384 [18:10:08<8:05:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 69%|██████▉ | 8562/12384 [18:10:15<8:05:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 69%|██████▉ | 8563/12384 [18:10:15<8:05:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 69%|██████▉ | 8563/12384 [18:10:23<8:05:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 69%|██████▉ | 8564/12384 [18:10:23<8:04:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 69%|██████▉ | 8564/12384 [18:10:31<8:04:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 69%|██████▉ | 8565/12384 [18:10:31<8:04:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 69%|██████▉ | 8565/12384 [18:10:38<8:04:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 69%|██████▉ | 8566/12384 [18:10:38<8:04:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 69%|██████▉ | 8566/12384 [18:10:46<8:04:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.02s]
Epoch 1: 69%|██████▉ | 8567/12384 [18:10:46<8:03:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.02s]
Epoch 1: 69%|██████▉ | 8567/12384 [18:10:53<8:03:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 1: 69%|██████▉ | 8568/12384 [18:10:53<8:03:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 1: 69%|██████▉ | 8568/12384 [18:11:01<8:03:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 1: 69%|██████▉ | 8569/12384 [18:11:01<8:03:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 1: 69%|██████▉ | 8569/12384 [18:11:09<8:03:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.05s]
Epoch 1: 69%|██████▉ | 8570/12384 [18:11:09<8:03:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.05s]
Epoch 1: 69%|██████▉ | 8570/12384 [18:11:16<8:03:54, 7.61s/it, loss=0.0004, acc=0.9991, iter_time=10.15s]
Epoch 1: 69%|██████▉ | 8571/12384 [18:11:16<8:03:41, 7.61s/it, loss=0.0004, acc=0.9991, iter_time=10.15s]
Epoch 1: 69%|██████▉ | 8571/12384 [18:11:24<8:03:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 69%|██████▉ | 8572/12384 [18:11:24<8:05:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 69%|██████▉ | 8572/12384 [18:11:32<8:05:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.60s]
Epoch 1: 69%|██████▉ | 8573/12384 [18:11:32<8:04:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.60s]
Epoch 1: 69%|██████▉ | 8573/12384 [18:11:39<8:04:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.72s]
Epoch 1: 69%|██████▉ | 8574/12384 [18:11:39<8:04:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.72s]
Epoch 1: 69%|██████▉ | 8574/12384 [18:11:47<8:04:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 1: 69%|██████▉ | 8575/12384 [18:11:47<8:10:21, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 1: 69%|██████▉ | 8575/12384 [18:11:55<8:10:21, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 1: 69%|██████▉ | 8576/12384 [18:11:55<8:08:07, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 1: 69%|██████▉ | 8576/12384 [18:12:02<8:08:07, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 69%|██████▉ | 8577/12384 [18:12:02<8:06:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 69%|██████▉ | 8577/12384 [18:12:10<8:06:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 69%|██████▉ | 8578/12384 [18:12:10<8:04:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 69%|██████▉ | 8578/12384 [18:12:18<8:04:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 69%|██████▉ | 8579/12384 [18:12:18<8:05:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 69%|██████▉ | 8579/12384 [18:12:25<8:05:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.91s]
Epoch 1: 69%|██████▉ | 8580/12384 [18:12:25<8:04:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.91s]
Epoch 1: 69%|██████▉ | 8580/12384 [18:12:33<8:04:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.39s]
Epoch 1: 69%|██████▉ | 8581/12384 [18:12:33<8:03:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.39s]
Epoch 1: 69%|██████▉ | 8581/12384 [18:12:40<8:03:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 69%|██████▉ | 8582/12384 [18:12:40<8:04:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 69%|██████▉ | 8582/12384 [18:12:48<8:04:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 69%|██████▉ | 8583/12384 [18:12:48<8:04:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 69%|██████▉ | 8583/12384 [18:12:56<8:04:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 69%|██████▉ | 8584/12384 [18:12:56<8:03:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 69%|██████▉ | 8584/12384 [18:13:03<8:03:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.65s]
Epoch 1: 69%|██████▉ | 8585/12384 [18:13:03<8:02:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.65s]
Epoch 1: 69%|██████▉ | 8585/12384 [18:13:11<8:02:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 1: 69%|██████▉ | 8586/12384 [18:13:11<8:02:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 1: 69%|██████▉ | 8586/12384 [18:13:19<8:02:11, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.53s]
Epoch 1: 69%|██████▉ | 8587/12384 [18:13:19<8:01:55, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.53s]
Epoch 1: 69%|██████▉ | 8587/12384 [18:13:26<8:01:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 1: 69%|██████▉ | 8588/12384 [18:13:26<8:01:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 1: 69%|██████▉ | 8588/12384 [18:13:34<8:01:53, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=7.63s]
Epoch 1: 69%|██████▉ | 8589/12384 [18:13:34<8:01:28, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=7.63s]
Epoch 1: 69%|██████▉ | 8589/12384 [18:13:41<8:01:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 69%|██████▉ | 8590/12384 [18:13:41<8:01:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 69%|██████▉ | 8590/12384 [18:13:49<8:01:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 69%|██████▉ | 8591/12384 [18:13:49<8:02:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 69%|██████▉ | 8591/12384 [18:13:57<8:02:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 1: 69%|██████▉ | 8592/12384 [18:13:57<8:01:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 1: 69%|██████▉ | 8592/12384 [18:14:04<8:01:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.28s]
Epoch 1: 69%|██████▉ | 8593/12384 [18:14:04<8:01:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.28s]
Epoch 1: 69%|██████▉ | 8593/12384 [18:14:12<8:01:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.53s]
Epoch 1: 69%|██████▉ | 8594/12384 [18:14:12<8:01:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.53s]
Epoch 1: 69%|██████▉ | 8594/12384 [18:14:19<8:01:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 1: 69%|██████▉ | 8595/12384 [18:14:19<8:00:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 1: 69%|██████▉ | 8595/12384 [18:14:27<8:00:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 69%|██████▉ | 8596/12384 [18:14:27<8:00:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 69%|██████▉ | 8596/12384 [18:14:35<8:00:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 69%|██████▉ | 8597/12384 [18:14:35<8:00:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 69%|██████▉ | 8597/12384 [18:14:42<8:00:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 69%|██████▉ | 8598/12384 [18:14:42<8:01:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 69%|██████▉ | 8598/12384 [18:14:50<8:01:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 1: 69%|██████▉ | 8599/12384 [18:14:50<8:00:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 1: 69%|██████▉ | 8599/12384 [18:14:58<8:00:57, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.37s]
Epoch 1: 69%|██████▉ | 8600/12384 [18:14:58<8:00:43, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.37s]
Epoch 1: 69%|██████▉ | 8600/12384 [18:15:06<8:00:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 1: 69%|██████▉ | 8601/12384 [18:15:06<8:07:26, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 1: 69%|██████▉ | 8601/12384 [18:15:13<8:07:26, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.02s]
Epoch 1: 69%|██████▉ | 8602/12384 [18:15:13<8:05:03, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.02s]
Epoch 1: 69%|██████▉ | 8602/12384 [18:15:21<8:05:03, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 1: 69%|██████▉ | 8603/12384 [18:15:21<8:03:16, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 1: 69%|██████▉ | 8603/12384 [18:15:28<8:03:16, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 1: 69%|██████▉ | 8604/12384 [18:15:28<8:02:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 1: 69%|██████▉ | 8604/12384 [18:15:36<8:02:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 1: 69%|██████▉ | 8605/12384 [18:15:36<8:02:12, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 1: 69%|██████▉ | 8605/12384 [18:15:44<8:02:12, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 69%|██████▉ | 8606/12384 [18:15:44<8:02:42, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 69%|██████▉ | 8606/12384 [18:15:51<8:02:42, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 70%|██████▉ | 8607/12384 [18:15:51<8:01:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 70%|██████▉ | 8607/12384 [18:15:59<8:01:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 70%|██████▉ | 8608/12384 [18:15:59<8:01:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 70%|██████▉ | 8608/12384 [18:16:07<8:01:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 70%|██████▉ | 8609/12384 [18:16:07<8:00:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 70%|██████▉ | 8609/12384 [18:16:14<8:00:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 1: 70%|██████▉ | 8610/12384 [18:16:14<7:59:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 1: 70%|██████▉ | 8610/12384 [18:16:22<7:59:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 1: 70%|██████▉ | 8611/12384 [18:16:22<7:58:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 1: 70%|██████▉ | 8611/12384 [18:16:29<7:58:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 70%|██████▉ | 8612/12384 [18:16:29<7:58:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 70%|██████▉ | 8612/12384 [18:16:37<7:58:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 70%|██████▉ | 8613/12384 [18:16:37<7:58:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 70%|██████▉ | 8613/12384 [18:16:45<7:58:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 70%|██████▉ | 8614/12384 [18:16:45<8:00:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 70%|██████▉ | 8614/12384 [18:16:52<8:00:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 70%|██████▉ | 8615/12384 [18:16:52<7:59:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 70%|██████▉ | 8615/12384 [18:17:00<7:59:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.94s]
Epoch 1: 70%|██████▉ | 8616/12384 [18:17:00<8:02:31, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.94s]
Epoch 1: 70%|██████▉ | 8616/12384 [18:17:08<8:02:31, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 1: 70%|██████▉ | 8617/12384 [18:17:08<8:00:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 1: 70%|██████▉ | 8617/12384 [18:17:15<8:00:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 70%|██████▉ | 8618/12384 [18:17:15<7:59:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 70%|██████▉ | 8618/12384 [18:17:23<7:59:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 1: 70%|██████▉ | 8619/12384 [18:17:23<7:58:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 1: 70%|██████▉ | 8619/12384 [18:17:31<7:58:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.87s]
Epoch 1: 70%|██████▉ | 8620/12384 [18:17:31<7:57:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.87s]
Epoch 1: 70%|██████▉ | 8620/12384 [18:17:38<7:57:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 70%|██████▉ | 8621/12384 [18:17:38<7:57:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 70%|██████▉ | 8621/12384 [18:17:46<7:57:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 70%|██████▉ | 8622/12384 [18:17:46<7:57:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 70%|██████▉ | 8622/12384 [18:17:53<7:57:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 70%|██████▉ | 8623/12384 [18:17:53<7:57:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 70%|██████▉ | 8623/12384 [18:18:01<7:57:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 70%|██████▉ | 8624/12384 [18:18:01<7:56:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 70%|██████▉ | 8624/12384 [18:18:09<7:56:56, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=7.22s]
Epoch 1: 70%|██████▉ | 8625/12384 [18:18:09<7:56:44, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=7.22s]
Epoch 1: 70%|██████▉ | 8625/12384 [18:18:17<7:56:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 70%|██████▉ | 8626/12384 [18:18:17<8:01:56, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 70%|██████▉ | 8626/12384 [18:18:24<8:01:56, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.51s]
Epoch 1: 70%|██████▉ | 8627/12384 [18:18:24<8:05:39, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=4.51s]
Epoch 1: 70%|██████▉ | 8627/12384 [18:18:32<8:05:39, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 1: 70%|██████▉ | 8628/12384 [18:18:32<8:02:57, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 1: 70%|██████▉ | 8628/12384 [18:18:40<8:02:57, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 70%|██████▉ | 8629/12384 [18:18:40<8:02:24, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 70%|██████▉ | 8629/12384 [18:18:47<8:02:24, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 1: 70%|██████▉ | 8630/12384 [18:18:47<8:00:46, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 1: 70%|██████▉ | 8630/12384 [18:18:55<8:00:46, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 1: 70%|██████▉ | 8631/12384 [18:18:55<8:00:40, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 1: 70%|██████▉ | 8631/12384 [18:19:03<8:00:40, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 70%|██████▉ | 8632/12384 [18:19:03<7:59:58, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 70%|██████▉ | 8632/12384 [18:19:10<7:59:58, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 70%|██████▉ | 8633/12384 [18:19:10<7:58:46, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 70%|██████▉ | 8633/12384 [18:19:18<7:58:46, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 70%|██████▉ | 8634/12384 [18:19:18<7:57:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 70%|██████▉ | 8634/12384 [18:19:25<7:57:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 70%|██████▉ | 8635/12384 [18:19:25<7:56:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 70%|██████▉ | 8635/12384 [18:19:33<7:56:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 1: 70%|██████▉ | 8636/12384 [18:19:33<7:55:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 1: 70%|██████▉ | 8636/12384 [18:19:41<7:55:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 1: 70%|██████▉ | 8637/12384 [18:19:41<7:54:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 1: 70%|██████▉ | 8637/12384 [18:19:48<7:54:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 70%|██████▉ | 8638/12384 [18:19:48<7:54:37, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 70%|██████▉ | 8638/12384 [18:19:56<7:54:37, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 1: 70%|██████▉ | 8639/12384 [18:19:56<7:56:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 1: 70%|██████▉ | 8639/12384 [18:20:04<7:56:05, 7.63s/it, loss=0.0003, acc=0.9992, iter_time=9.03s]
Epoch 1: 70%|██████▉ | 8640/12384 [18:20:04<7:55:57, 7.63s/it, loss=0.0003, acc=0.9992, iter_time=9.03s]
Epoch 1: 70%|██████▉ | 8640/12384 [18:20:11<7:55:57, 7.63s/it, loss=0.0002, acc=0.9998, iter_time=5.44s]
Epoch 1: 70%|██████▉ | 8641/12384 [18:20:11<7:54:59, 7.61s/it, loss=0.0002, acc=0.9998, iter_time=5.44s]
Epoch 1: 70%|██████▉ | 8641/12384 [18:20:19<7:54:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 70%|██████▉ | 8642/12384 [18:20:19<7:56:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 70%|██████▉ | 8642/12384 [18:20:26<7:56:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 1: 70%|██████▉ | 8643/12384 [18:20:26<7:55:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 1: 70%|██████▉ | 8643/12384 [18:20:34<7:55:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 1: 70%|██████▉ | 8644/12384 [18:20:34<7:54:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 1: 70%|██████▉ | 8644/12384 [18:20:42<7:54:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 70%|██████▉ | 8645/12384 [18:20:42<7:54:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 70%|██████▉ | 8645/12384 [18:20:49<7:54:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 70%|██████▉ | 8646/12384 [18:20:49<7:54:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 70%|██████▉ | 8646/12384 [18:20:57<7:54:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 70%|██████▉ | 8647/12384 [18:20:57<7:54:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 70%|██████▉ | 8647/12384 [18:21:04<7:54:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 70%|██████▉ | 8648/12384 [18:21:04<7:54:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 70%|██████▉ | 8648/12384 [18:21:12<7:54:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.61s]
Epoch 1: 70%|██████▉ | 8649/12384 [18:21:12<7:54:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.61s]
Epoch 1: 70%|██████▉ | 8649/12384 [18:21:20<7:54:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.28s]
Epoch 1: 70%|██████▉ | 8650/12384 [18:21:20<7:54:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.28s]
Epoch 1: 70%|██████▉ | 8650/12384 [18:21:27<7:54:26, 7.62s/it, loss=0.0007, acc=0.9975, iter_time=7.60s]
Epoch 1: 70%|██████▉ | 8651/12384 [18:21:27<7:53:42, 7.61s/it, loss=0.0007, acc=0.9975, iter_time=7.60s]
Epoch 1: 70%|██████▉ | 8651/12384 [18:21:35<7:53:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 70%|██████▉ | 8652/12384 [18:21:35<7:53:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 70%|██████▉ | 8652/12384 [18:21:43<7:53:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 70%|██████▉ | 8653/12384 [18:21:43<7:59:27, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 70%|██████▉ | 8653/12384 [18:21:50<7:59:27, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.78s]
Epoch 1: 70%|██████▉ | 8654/12384 [18:21:50<7:56:54, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.78s]
Epoch 1: 70%|██████▉ | 8654/12384 [18:21:58<7:56:54, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 1: 70%|██████▉ | 8655/12384 [18:21:58<7:55:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 1: 70%|██████▉ | 8655/12384 [18:22:06<7:55:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.59s]
Epoch 1: 70%|██████▉ | 8656/12384 [18:22:06<7:55:43, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.59s]
Epoch 1: 70%|██████▉ | 8656/12384 [18:22:13<7:55:43, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.65s]
Epoch 1: 70%|██████▉ | 8657/12384 [18:22:13<7:54:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.65s]
Epoch 1: 70%|██████▉ | 8657/12384 [18:22:21<7:54:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 1: 70%|██████▉ | 8658/12384 [18:22:21<7:55:27, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 1: 70%|██████▉ | 8658/12384 [18:22:29<7:55:27, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 1: 70%|██████▉ | 8659/12384 [18:22:29<7:54:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 1: 70%|██████▉ | 8659/12384 [18:22:36<7:54:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 1: 70%|██████▉ | 8660/12384 [18:22:36<7:53:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 1: 70%|██████▉ | 8660/12384 [18:22:44<7:53:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 1: 70%|██████▉ | 8661/12384 [18:22:44<7:53:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 1: 70%|██████▉ | 8661/12384 [18:22:51<7:53:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.04s]
Epoch 1: 70%|██████▉ | 8662/12384 [18:22:51<7:52:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.04s]
Epoch 1: 70%|██████▉ | 8662/12384 [18:22:59<7:52:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 1: 70%|██████▉ | 8663/12384 [18:22:59<7:51:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 1: 70%|██████▉ | 8663/12384 [18:23:07<7:51:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.04s]
Epoch 1: 70%|██████▉ | 8664/12384 [18:23:07<7:51:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.04s]
Epoch 1: 70%|██████▉ | 8664/12384 [18:23:14<7:51:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 70%|██████▉ | 8665/12384 [18:23:14<7:51:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 70%|██████▉ | 8665/12384 [18:23:22<7:51:47, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.06s]
Epoch 1: 70%|██████▉ | 8666/12384 [18:23:22<7:51:53, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.06s]
Epoch 1: 70%|██████▉ | 8666/12384 [18:23:30<7:51:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.47s]
Epoch 1: 70%|██████▉ | 8667/12384 [18:23:30<7:51:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.47s]
Epoch 1: 70%|██████▉ | 8667/12384 [18:23:37<7:51:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.10s]
Epoch 1: 70%|██████▉ | 8668/12384 [18:23:37<7:51:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.10s]
Epoch 1: 70%|██████▉ | 8668/12384 [18:23:45<7:51:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 70%|███████ | 8669/12384 [18:23:45<7:50:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 70%|███████ | 8669/12384 [18:23:52<7:50:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 1: 70%|███████ | 8670/12384 [18:23:52<7:50:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 1: 70%|███████ | 8670/12384 [18:24:00<7:50:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 1: 70%|███████ | 8671/12384 [18:24:00<7:51:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 1: 70%|███████ | 8671/12384 [18:24:08<7:51:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 1: 70%|███████ | 8672/12384 [18:24:08<7:51:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 1: 70%|███████ | 8672/12384 [18:24:15<7:51:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.21s]
Epoch 1: 70%|███████ | 8673/12384 [18:24:15<7:51:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.21s]
Epoch 1: 70%|███████ | 8673/12384 [18:24:23<7:51:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 1: 70%|███████ | 8674/12384 [18:24:23<7:51:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 1: 70%|███████ | 8674/12384 [18:24:30<7:51:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 70%|███████ | 8675/12384 [18:24:30<7:50:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 70%|███████ | 8675/12384 [18:24:38<7:50:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.54s]
Epoch 1: 70%|███████ | 8676/12384 [18:24:38<7:50:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.54s]
Epoch 1: 70%|███████ | 8676/12384 [18:24:46<7:50:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.67s]
Epoch 1: 70%|███████ | 8677/12384 [18:24:46<7:50:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.67s]
Epoch 1: 70%|███████ | 8677/12384 [18:24:53<7:50:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 70%|███████ | 8678/12384 [18:24:53<7:50:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 70%|███████ | 8678/12384 [18:25:01<7:50:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 70%|███████ | 8679/12384 [18:25:01<7:49:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 70%|███████ | 8679/12384 [18:25:09<7:49:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 1: 70%|███████ | 8680/12384 [18:25:09<7:56:11, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 1: 70%|███████ | 8680/12384 [18:25:16<7:56:11, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 70%|███████ | 8681/12384 [18:25:16<7:54:14, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 70%|███████ | 8681/12384 [18:25:24<7:54:14, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 1: 70%|███████ | 8682/12384 [18:25:24<7:54:22, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 1: 70%|███████ | 8682/12384 [18:25:32<7:54:22, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.21s]
Epoch 1: 70%|███████ | 8683/12384 [18:25:32<7:52:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.21s]
Epoch 1: 70%|███████ | 8683/12384 [18:25:39<7:52:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.72s]
Epoch 1: 70%|███████ | 8684/12384 [18:25:39<7:51:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.72s]
Epoch 1: 70%|███████ | 8684/12384 [18:25:47<7:51:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 70%|███████ | 8685/12384 [18:25:47<7:50:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 70%|███████ | 8685/12384 [18:25:55<7:50:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 1: 70%|███████ | 8686/12384 [18:25:55<7:49:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 1: 70%|███████ | 8686/12384 [18:26:02<7:49:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 1: 70%|███████ | 8687/12384 [18:26:02<7:49:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 1: 70%|███████ | 8687/12384 [18:26:10<7:49:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.95s]
Epoch 1: 70%|███████ | 8688/12384 [18:26:10<7:49:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.95s]
Epoch 1: 70%|███████ | 8688/12384 [18:26:17<7:49:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 1: 70%|███████ | 8689/12384 [18:26:17<7:48:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 1: 70%|███████ | 8689/12384 [18:26:25<7:48:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.32s]
Epoch 1: 70%|███████ | 8690/12384 [18:26:25<7:48:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.32s]
Epoch 1: 70%|███████ | 8690/12384 [18:26:33<7:48:17, 7.61s/it, loss=0.0011, acc=0.9982, iter_time=6.42s]
Epoch 1: 70%|███████ | 8691/12384 [18:26:33<7:48:21, 7.61s/it, loss=0.0011, acc=0.9982, iter_time=6.42s]
Epoch 1: 70%|███████ | 8691/12384 [18:26:40<7:48:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 70%|███████ | 8692/12384 [18:26:40<7:48:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 70%|███████ | 8692/12384 [18:26:48<7:48:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 1: 70%|███████ | 8693/12384 [18:26:48<7:48:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 1: 70%|███████ | 8693/12384 [18:26:55<7:48:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 70%|███████ | 8694/12384 [18:26:55<7:48:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 70%|███████ | 8694/12384 [18:27:03<7:48:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 70%|███████ | 8695/12384 [18:27:03<7:48:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 70%|███████ | 8695/12384 [18:27:11<7:48:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 70%|███████ | 8696/12384 [18:27:11<7:48:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 70%|███████ | 8696/12384 [18:27:18<7:48:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.06s]
Epoch 1: 70%|███████ | 8697/12384 [18:27:18<7:48:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.06s]
Epoch 1: 70%|███████ | 8697/12384 [18:27:26<7:48:24, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=8.82s]
Epoch 1: 70%|███████ | 8698/12384 [18:27:26<7:48:07, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=8.82s]
Epoch 1: 70%|███████ | 8698/12384 [18:27:33<7:48:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 70%|███████ | 8699/12384 [18:27:34<7:47:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 70%|███████ | 8699/12384 [18:27:41<7:47:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 1: 70%|███████ | 8700/12384 [18:27:41<7:47:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 1: 70%|███████ | 8700/12384 [18:27:49<7:47:35, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.62s]
Epoch 1: 70%|███████ | 8701/12384 [18:27:49<7:48:16, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.62s]
Epoch 1: 70%|███████ | 8701/12384 [18:27:56<7:48:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.42s]
Epoch 1: 70%|███████ | 8702/12384 [18:27:56<7:47:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.42s]
Epoch 1: 70%|███████ | 8702/12384 [18:28:04<7:47:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 1: 70%|███████ | 8703/12384 [18:28:04<7:47:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 1: 70%|███████ | 8703/12384 [18:28:12<7:47:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 70%|███████ | 8704/12384 [18:28:12<7:46:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 70%|███████ | 8704/12384 [18:28:19<7:46:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.91s]
Epoch 1: 70%|███████ | 8705/12384 [18:28:19<7:46:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.91s]
Epoch 1: 70%|███████ | 8705/12384 [18:28:27<7:46:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 70%|███████ | 8706/12384 [18:28:27<7:52:22, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 70%|███████ | 8706/12384 [18:28:35<7:52:22, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 1: 70%|███████ | 8707/12384 [18:28:35<7:50:35, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 1: 70%|███████ | 8707/12384 [18:28:42<7:50:35, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 1: 70%|███████ | 8708/12384 [18:28:42<7:49:00, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 1: 70%|███████ | 8708/12384 [18:28:50<7:49:00, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 70%|███████ | 8709/12384 [18:28:50<7:49:20, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 70%|███████ | 8709/12384 [18:28:58<7:49:20, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 70%|███████ | 8710/12384 [18:28:58<7:47:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 70%|███████ | 8710/12384 [18:29:05<7:47:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 70%|███████ | 8711/12384 [18:29:05<7:47:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 70%|███████ | 8711/12384 [18:29:13<7:47:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 70%|███████ | 8712/12384 [18:29:13<7:46:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 70%|███████ | 8712/12384 [18:29:20<7:46:45, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.20s]
Epoch 1: 70%|███████ | 8713/12384 [18:29:20<7:46:03, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.20s]
Epoch 1: 70%|███████ | 8713/12384 [18:29:28<7:46:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 70%|███████ | 8714/12384 [18:29:28<7:45:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 70%|███████ | 8714/12384 [18:29:36<7:45:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 1: 70%|███████ | 8715/12384 [18:29:36<7:45:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 1: 70%|███████ | 8715/12384 [18:29:43<7:45:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.54s]
Epoch 1: 70%|███████ | 8716/12384 [18:29:43<7:45:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.54s]
Epoch 1: 70%|███████ | 8716/12384 [18:29:51<7:45:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.28s]
Epoch 1: 70%|███████ | 8717/12384 [18:29:51<7:45:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.28s]
Epoch 1: 70%|███████ | 8717/12384 [18:29:59<7:45:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 70%|███████ | 8718/12384 [18:29:59<7:45:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 70%|███████ | 8718/12384 [18:30:06<7:45:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 70%|███████ | 8719/12384 [18:30:06<7:45:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 70%|███████ | 8719/12384 [18:30:14<7:45:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 70%|███████ | 8720/12384 [18:30:14<7:45:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 70%|███████ | 8720/12384 [18:30:21<7:45:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.46s]
Epoch 1: 70%|███████ | 8721/12384 [18:30:21<7:44:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.46s]
Epoch 1: 70%|███████ | 8721/12384 [18:30:29<7:44:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 1: 70%|███████ | 8722/12384 [18:30:29<7:44:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 1: 70%|███████ | 8722/12384 [18:30:37<7:44:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 1: 70%|███████ | 8723/12384 [18:30:37<7:44:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 1: 70%|███████ | 8723/12384 [18:30:44<7:44:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.85s]
Epoch 1: 70%|███████ | 8724/12384 [18:30:44<7:43:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.85s]
Epoch 1: 70%|███████ | 8724/12384 [18:30:52<7:43:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 70%|███████ | 8725/12384 [18:30:52<7:43:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 70%|███████ | 8725/12384 [18:30:59<7:43:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 70%|███████ | 8726/12384 [18:30:59<7:43:07, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 70%|███████ | 8726/12384 [18:31:07<7:43:07, 7.60s/it, loss=0.0002, acc=0.9994, iter_time=7.60s]
Epoch 1: 70%|███████ | 8727/12384 [18:31:07<7:44:28, 7.62s/it, loss=0.0002, acc=0.9994, iter_time=7.60s]
Epoch 1: 70%|███████ | 8727/12384 [18:31:15<7:44:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 1: 70%|███████ | 8728/12384 [18:31:15<7:43:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 1: 70%|███████ | 8728/12384 [18:31:22<7:43:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 70%|███████ | 8729/12384 [18:31:22<7:43:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 70%|███████ | 8729/12384 [18:31:30<7:43:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 70%|███████ | 8730/12384 [18:31:30<7:43:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 70%|███████ | 8730/12384 [18:31:37<7:43:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 71%|███████ | 8731/12384 [18:31:37<7:43:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 71%|███████ | 8731/12384 [18:31:45<7:43:12, 7.61s/it, loss=0.0002, acc=0.9992, iter_time=7.61s]
Epoch 1: 71%|███████ | 8732/12384 [18:31:45<7:44:02, 7.62s/it, loss=0.0002, acc=0.9992, iter_time=7.61s]
Epoch 1: 71%|███████ | 8732/12384 [18:31:53<7:44:02, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.42s]
Epoch 1: 71%|███████ | 8733/12384 [18:31:53<7:49:59, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=5.42s]
Epoch 1: 71%|███████ | 8733/12384 [18:32:01<7:49:59, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 1: 71%|███████ | 8734/12384 [18:32:01<7:47:15, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 1: 71%|███████ | 8734/12384 [18:32:08<7:47:15, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 1: 71%|███████ | 8735/12384 [18:32:08<7:46:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 1: 71%|███████ | 8735/12384 [18:32:16<7:46:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 71%|███████ | 8736/12384 [18:32:16<7:44:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 71%|███████ | 8736/12384 [18:32:23<7:44:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 71%|███████ | 8737/12384 [18:32:23<7:44:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 71%|███████ | 8737/12384 [18:32:31<7:44:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 71%|███████ | 8738/12384 [18:32:31<7:43:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 71%|███████ | 8738/12384 [18:32:39<7:43:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 71%|███████ | 8739/12384 [18:32:39<7:43:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 71%|███████ | 8739/12384 [18:32:46<7:43:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 71%|███████ | 8740/12384 [18:32:46<7:42:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 71%|███████ | 8740/12384 [18:32:54<7:42:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 71%|███████ | 8741/12384 [18:32:54<7:42:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 71%|███████ | 8741/12384 [18:33:02<7:42:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 71%|███████ | 8742/12384 [18:33:02<7:41:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 71%|███████ | 8742/12384 [18:33:09<7:41:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.29s]
Epoch 1: 71%|███████ | 8743/12384 [18:33:09<7:41:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.29s]
Epoch 1: 71%|███████ | 8743/12384 [18:33:17<7:41:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.31s]
Epoch 1: 71%|███████ | 8744/12384 [18:33:17<7:41:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.31s]
Epoch 1: 71%|███████ | 8744/12384 [18:33:24<7:41:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 71%|███████ | 8745/12384 [18:33:24<7:41:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 71%|███████ | 8745/12384 [18:33:32<7:41:56, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 71%|███████ | 8746/12384 [18:33:32<7:41:50, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 71%|███████ | 8746/12384 [18:33:40<7:41:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 71%|███████ | 8747/12384 [18:33:40<7:42:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 71%|███████ | 8747/12384 [18:33:47<7:42:28, 7.63s/it, loss=0.0000, acc=0.9998, iter_time=7.61s]
Epoch 1: 71%|███████ | 8748/12384 [18:33:47<7:41:54, 7.62s/it, loss=0.0000, acc=0.9998, iter_time=7.61s]
Epoch 1: 71%|███████ | 8748/12384 [18:33:55<7:41:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 71%|███████ | 8749/12384 [18:33:55<7:41:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 71%|███████ | 8749/12384 [18:34:02<7:41:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 71%|███████ | 8750/12384 [18:34:02<7:40:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 71%|███████ | 8750/12384 [18:34:10<7:40:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 71%|███████ | 8751/12384 [18:34:10<7:40:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 71%|███████ | 8751/12384 [18:34:18<7:40:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 71%|███████ | 8752/12384 [18:34:18<7:40:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 71%|███████ | 8752/12384 [18:34:25<7:40:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 71%|███████ | 8753/12384 [18:34:25<7:39:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 71%|███████ | 8753/12384 [18:34:33<7:39:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 1: 71%|███████ | 8754/12384 [18:34:33<7:39:37, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 1: 71%|███████ | 8754/12384 [18:34:40<7:39:37, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 71%|███████ | 8755/12384 [18:34:40<7:39:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 71%|███████ | 8755/12384 [18:34:48<7:39:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 71%|███████ | 8756/12384 [18:34:48<7:41:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 71%|███████ | 8756/12384 [18:34:56<7:41:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.48s]
Epoch 1: 71%|███████ | 8757/12384 [18:34:56<7:41:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.48s]
Epoch 1: 71%|███████ | 8757/12384 [18:35:03<7:41:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 1: 71%|███████ | 8758/12384 [18:35:03<7:40:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 1: 71%|███████ | 8758/12384 [18:35:11<7:40:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.82s]
Epoch 1: 71%|███████ | 8759/12384 [18:35:11<7:46:22, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.82s]
Epoch 1: 71%|███████ | 8759/12384 [18:35:19<7:46:22, 7.72s/it, loss=0.0001, acc=0.9989, iter_time=7.59s]
Epoch 1: 71%|███████ | 8760/12384 [18:35:19<7:45:12, 7.70s/it, loss=0.0001, acc=0.9989, iter_time=7.59s]
Epoch 1: 71%|███████ | 8760/12384 [18:35:27<7:45:12, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 71%|███████ | 8761/12384 [18:35:27<7:43:34, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 71%|███████ | 8761/12384 [18:35:34<7:43:34, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 71%|███████ | 8762/12384 [18:35:34<7:42:08, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 71%|███████ | 8762/12384 [18:35:42<7:42:08, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 1: 71%|███████ | 8763/12384 [18:35:42<7:41:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 1: 71%|███████ | 8763/12384 [18:35:49<7:41:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 1: 71%|███████ | 8764/12384 [18:35:49<7:41:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 1: 71%|███████ | 8764/12384 [18:35:57<7:41:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 1: 71%|███████ | 8765/12384 [18:35:57<7:40:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 1: 71%|███████ | 8765/12384 [18:36:05<7:40:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.50s]
Epoch 1: 71%|███████ | 8766/12384 [18:36:05<7:39:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.50s]
Epoch 1: 71%|███████ | 8766/12384 [18:36:12<7:39:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 1: 71%|███████ | 8767/12384 [18:36:12<7:39:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 1: 71%|███████ | 8767/12384 [18:36:20<7:39:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.65s]
Epoch 1: 71%|███████ | 8768/12384 [18:36:20<7:40:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.65s]
Epoch 1: 71%|███████ | 8768/12384 [18:36:28<7:40:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 71%|███████ | 8769/12384 [18:36:28<7:39:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 71%|███████ | 8769/12384 [18:36:35<7:39:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 71%|███████ | 8770/12384 [18:36:35<7:38:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 71%|███████ | 8770/12384 [18:36:43<7:38:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 1: 71%|███████ | 8771/12384 [18:36:43<7:39:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 1: 71%|███████ | 8771/12384 [18:36:50<7:39:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 1: 71%|███████ | 8772/12384 [18:36:50<7:38:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 1: 71%|███████ | 8772/12384 [18:36:58<7:38:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 1: 71%|███████ | 8773/12384 [18:36:58<7:38:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 1: 71%|███████ | 8773/12384 [18:37:06<7:38:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 1: 71%|███████ | 8774/12384 [18:37:06<7:37:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 1: 71%|███████ | 8774/12384 [18:37:13<7:37:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 71%|███████ | 8775/12384 [18:37:13<7:37:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 71%|███████ | 8775/12384 [18:37:21<7:37:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.41s]
Epoch 1: 71%|███████ | 8776/12384 [18:37:21<7:35:51, 7.58s/it, loss=0.0000, acc=1.0000, iter_time=8.41s]
Epoch 1: 71%|███████ | 8776/12384 [18:37:28<7:35:51, 7.58s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 71%|███████ | 8777/12384 [18:37:28<7:36:21, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 71%|███████ | 8777/12384 [18:37:36<7:36:21, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 71%|███████ | 8778/12384 [18:37:36<7:36:06, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 71%|███████ | 8778/12384 [18:37:44<7:36:06, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 71%|███████ | 8779/12384 [18:37:44<7:36:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 71%|███████ | 8779/12384 [18:37:51<7:36:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 71%|███████ | 8780/12384 [18:37:51<7:36:08, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 71%|███████ | 8780/12384 [18:37:59<7:36:08, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=4.77s]
Epoch 1: 71%|███████ | 8781/12384 [18:37:59<7:36:05, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.77s]
Epoch 1: 71%|███████ | 8781/12384 [18:38:06<7:36:05, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.71s]
Epoch 1: 71%|███████ | 8782/12384 [18:38:06<7:36:10, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.71s]
Epoch 1: 71%|███████ | 8782/12384 [18:38:14<7:36:10, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=5.56s]
Epoch 1: 71%|███████ | 8783/12384 [18:38:14<7:36:55, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.56s]
Epoch 1: 71%|███████ | 8783/12384 [18:38:22<7:36:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 1: 71%|███████ | 8784/12384 [18:38:22<7:36:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 1: 71%|███████ | 8784/12384 [18:38:29<7:36:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.85s]
Epoch 1: 71%|███████ | 8785/12384 [18:38:29<7:42:05, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.85s]
Epoch 1: 71%|███████ | 8785/12384 [18:38:37<7:42:05, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.72s]
Epoch 1: 71%|███████ | 8786/12384 [18:38:37<7:40:42, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.72s]
Epoch 1: 71%|███████ | 8786/12384 [18:38:45<7:40:42, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.80s]
Epoch 1: 71%|███████ | 8787/12384 [18:38:45<7:38:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.80s]
Epoch 1: 71%|███████ | 8787/12384 [18:38:52<7:38:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 71%|███████ | 8788/12384 [18:38:52<7:37:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 71%|███████ | 8788/12384 [18:39:00<7:37:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.51s]
Epoch 1: 71%|███████ | 8789/12384 [18:39:00<7:36:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.51s]
Epoch 1: 71%|███████ | 8789/12384 [18:39:07<7:36:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 71%|███████ | 8790/12384 [18:39:07<7:35:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 71%|███████ | 8790/12384 [18:39:15<7:35:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.36s]
Epoch 1: 71%|███████ | 8791/12384 [18:39:15<7:35:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.36s]
Epoch 1: 71%|███████ | 8791/12384 [18:39:23<7:35:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 1: 71%|███████ | 8792/12384 [18:39:23<7:35:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 1: 71%|███████ | 8792/12384 [18:39:30<7:35:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 71%|███████ | 8793/12384 [18:39:30<7:35:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 71%|███████ | 8793/12384 [18:39:38<7:35:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 1: 71%|███████ | 8794/12384 [18:39:38<7:34:36, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 1: 71%|███████ | 8794/12384 [18:39:46<7:34:36, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 1: 71%|███████ | 8795/12384 [18:39:46<7:35:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 1: 71%|███████ | 8795/12384 [18:39:53<7:35:31, 7.62s/it, loss=0.0002, acc=0.9986, iter_time=7.67s]
Epoch 1: 71%|███████ | 8796/12384 [18:39:53<7:35:34, 7.62s/it, loss=0.0002, acc=0.9986, iter_time=7.67s]
Epoch 1: 71%|███████ | 8796/12384 [18:40:01<7:35:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 1: 71%|███████ | 8797/12384 [18:40:01<7:35:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 1: 71%|███████ | 8797/12384 [18:40:08<7:35:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.60s]
Epoch 1: 71%|███████ | 8798/12384 [18:40:08<7:34:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.60s]
Epoch 1: 71%|███████ | 8798/12384 [18:40:16<7:34:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 71%|███████ | 8799/12384 [18:40:16<7:34:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 71%|███████ | 8799/12384 [18:40:24<7:34:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 71%|███████ | 8800/12384 [18:40:24<7:34:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 71%|███████ | 8800/12384 [18:40:31<7:34:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.05s]
Epoch 1: 71%|███████ | 8801/12384 [18:40:31<7:34:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.05s]
Epoch 1: 71%|███████ | 8801/12384 [18:40:39<7:34:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 71%|███████ | 8802/12384 [18:40:39<7:34:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 71%|███████ | 8802/12384 [18:40:46<7:34:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 1: 71%|███████ | 8803/12384 [18:40:46<7:34:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 1: 71%|███████ | 8803/12384 [18:40:54<7:34:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 1: 71%|███████ | 8804/12384 [18:40:54<7:34:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 1: 71%|███████ | 8804/12384 [18:41:02<7:34:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 71%|███████ | 8805/12384 [18:41:02<7:34:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 71%|███████ | 8805/12384 [18:41:09<7:34:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 1: 71%|███████ | 8806/12384 [18:41:09<7:34:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 1: 71%|███████ | 8806/12384 [18:41:17<7:34:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 71%|███████ | 8807/12384 [18:41:17<7:34:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 71%|███████ | 8807/12384 [18:41:25<7:34:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 1: 71%|███████ | 8808/12384 [18:41:25<7:33:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 1: 71%|███████ | 8808/12384 [18:41:32<7:33:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 1: 71%|███████ | 8809/12384 [18:41:32<7:33:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 1: 71%|███████ | 8809/12384 [18:41:40<7:33:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 1: 71%|███████ | 8810/12384 [18:41:40<7:33:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 1: 71%|███████ | 8810/12384 [18:41:48<7:33:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 1: 71%|███████ | 8811/12384 [18:41:48<7:39:55, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 1: 71%|███████ | 8811/12384 [18:41:55<7:39:55, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 1: 71%|███████ | 8812/12384 [18:41:55<7:37:50, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 1: 71%|███████ | 8812/12384 [18:42:03<7:37:50, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 71%|███████ | 8813/12384 [18:42:03<7:36:44, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 71%|███████ | 8813/12384 [18:42:11<7:36:44, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 71%|███████ | 8814/12384 [18:42:11<7:35:44, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 71%|███████ | 8814/12384 [18:42:18<7:35:44, 7.66s/it, loss=0.0002, acc=0.9985, iter_time=7.62s]
Epoch 1: 71%|███████ | 8815/12384 [18:42:18<7:34:29, 7.64s/it, loss=0.0002, acc=0.9985, iter_time=7.62s]
Epoch 1: 71%|███████ | 8815/12384 [18:42:26<7:34:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 71%|███████ | 8816/12384 [18:42:26<7:33:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 71%|███████ | 8816/12384 [18:42:33<7:33:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.00s]
Epoch 1: 71%|███████ | 8817/12384 [18:42:33<7:33:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.00s]
Epoch 1: 71%|███████ | 8817/12384 [18:42:41<7:33:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 71%|███████ | 8818/12384 [18:42:41<7:33:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 71%|███████ | 8818/12384 [18:42:49<7:33:12, 7.63s/it, loss=0.0004, acc=0.9997, iter_time=4.47s]
Epoch 1: 71%|███████ | 8819/12384 [18:42:49<7:32:26, 7.61s/it, loss=0.0004, acc=0.9997, iter_time=4.47s]
Epoch 1: 71%|███████ | 8819/12384 [18:42:56<7:32:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.72s]
Epoch 1: 71%|███████ | 8820/12384 [18:42:56<7:32:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.72s]
Epoch 1: 71%|███████ | 8820/12384 [18:43:04<7:32:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 71%|███████ | 8821/12384 [18:43:04<7:32:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 71%|███████ | 8821/12384 [18:43:11<7:32:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 71%|███████ | 8822/12384 [18:43:11<7:31:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 71%|███████ | 8822/12384 [18:43:19<7:31:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 71%|███████ | 8823/12384 [18:43:19<7:31:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 71%|███████ | 8823/12384 [18:43:27<7:31:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 71%|███████▏ | 8824/12384 [18:43:27<7:31:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 71%|███████▏ | 8824/12384 [18:43:34<7:31:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 71%|███████▏ | 8825/12384 [18:43:34<7:30:57, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 71%|███████▏ | 8825/12384 [18:43:42<7:30:57, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 1: 71%|███████▏ | 8826/12384 [18:43:42<7:31:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 1: 71%|███████▏ | 8826/12384 [18:43:49<7:31:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 1: 71%|███████▏ | 8827/12384 [18:43:49<7:30:39, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 1: 71%|███████▏ | 8827/12384 [18:43:57<7:30:39, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 71%|███████▏ | 8828/12384 [18:43:57<7:30:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 71%|███████▏ | 8828/12384 [18:44:05<7:30:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.23s]
Epoch 1: 71%|███████▏ | 8829/12384 [18:44:05<7:30:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.23s]
Epoch 1: 71%|███████▏ | 8829/12384 [18:44:12<7:30:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.00s]
Epoch 1: 71%|███████▏ | 8830/12384 [18:44:12<7:31:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.00s]
Epoch 1: 71%|███████▏ | 8830/12384 [18:44:20<7:31:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 71%|███████▏ | 8831/12384 [18:44:20<7:30:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 71%|███████▏ | 8831/12384 [18:44:28<7:30:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 71%|███████▏ | 8832/12384 [18:44:28<7:30:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 71%|███████▏ | 8832/12384 [18:44:35<7:30:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.42s]
Epoch 1: 71%|███████▏ | 8833/12384 [18:44:35<7:30:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.42s]
Epoch 1: 71%|███████▏ | 8833/12384 [18:44:43<7:30:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 1: 71%|███████▏ | 8834/12384 [18:44:43<7:30:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 1: 71%|███████▏ | 8834/12384 [18:44:50<7:30:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 1: 71%|███████▏ | 8835/12384 [18:44:50<7:17:52, 7.40s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 1: 71%|███████▏ | 8835/12384 [18:44:57<7:17:52, 7.40s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 71%|███████▏ | 8836/12384 [18:44:57<7:21:37, 7.47s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 71%|███████▏ | 8836/12384 [18:45:05<7:21:37, 7.47s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 71%|███████▏ | 8837/12384 [18:45:05<7:29:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 71%|███████▏ | 8837/12384 [18:45:13<7:29:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.48s]
Epoch 1: 71%|███████▏ | 8838/12384 [18:45:13<7:29:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.48s]
Epoch 1: 71%|███████▏ | 8838/12384 [18:45:20<7:29:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 1: 71%|███████▏ | 8839/12384 [18:45:20<7:29:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 1: 71%|███████▏ | 8839/12384 [18:45:28<7:29:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 71%|███████▏ | 8840/12384 [18:45:28<7:29:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 71%|███████▏ | 8840/12384 [18:45:36<7:29:38, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.06s]
Epoch 1: 71%|███████▏ | 8841/12384 [18:45:36<7:28:58, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=5.06s]
Epoch 1: 71%|███████▏ | 8841/12384 [18:45:43<7:28:58, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 1: 71%|███████▏ | 8842/12384 [18:45:43<7:29:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 1: 71%|███████▏ | 8842/12384 [18:45:51<7:29:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.41s]
Epoch 1: 71%|███████▏ | 8843/12384 [18:45:51<7:29:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.41s]
Epoch 1: 71%|███████▏ | 8843/12384 [18:45:58<7:29:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 71%|███████▏ | 8844/12384 [18:45:58<7:28:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 71%|███████▏ | 8844/12384 [18:46:06<7:28:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 71%|███████▏ | 8845/12384 [18:46:06<7:28:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 71%|███████▏ | 8845/12384 [18:46:14<7:28:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 71%|███████▏ | 8846/12384 [18:46:14<7:28:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 71%|███████▏ | 8846/12384 [18:46:21<7:28:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.82s]
Epoch 1: 71%|███████▏ | 8847/12384 [18:46:21<7:27:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.82s]
Epoch 1: 71%|███████▏ | 8847/12384 [18:46:29<7:27:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 71%|███████▏ | 8848/12384 [18:46:29<7:27:48, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 71%|███████▏ | 8848/12384 [18:46:36<7:27:48, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 71%|███████▏ | 8849/12384 [18:46:36<7:28:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 71%|███████▏ | 8849/12384 [18:46:44<7:28:00, 7.60s/it, loss=0.0003, acc=0.9980, iter_time=4.35s]
Epoch 1: 71%|███████▏ | 8850/12384 [18:46:44<7:27:52, 7.60s/it, loss=0.0003, acc=0.9980, iter_time=4.35s]
Epoch 1: 71%|███████▏ | 8850/12384 [18:46:52<7:27:52, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 1: 71%|███████▏ | 8851/12384 [18:46:52<7:28:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 1: 71%|███████▏ | 8851/12384 [18:46:59<7:28:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 1: 71%|███████▏ | 8852/12384 [18:46:59<7:28:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 1: 71%|███████▏ | 8852/12384 [18:47:07<7:28:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.44s]
Epoch 1: 71%|███████▏ | 8853/12384 [18:47:07<7:28:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.44s]
Epoch 1: 71%|███████▏ | 8853/12384 [18:47:15<7:28:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 71%|███████▏ | 8854/12384 [18:47:15<7:27:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 71%|███████▏ | 8854/12384 [18:47:22<7:27:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 72%|███████▏ | 8855/12384 [18:47:22<7:27:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 72%|███████▏ | 8855/12384 [18:47:30<7:27:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 1: 72%|███████▏ | 8856/12384 [18:47:30<7:26:51, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 1: 72%|███████▏ | 8856/12384 [18:47:37<7:26:51, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.70s]
Epoch 1: 72%|███████▏ | 8857/12384 [18:47:37<7:26:29, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.70s]
Epoch 1: 72%|███████▏ | 8857/12384 [18:47:45<7:26:29, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 1: 72%|███████▏ | 8858/12384 [18:47:45<7:26:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 1: 72%|███████▏ | 8858/12384 [18:47:53<7:26:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 72%|███████▏ | 8859/12384 [18:47:53<7:26:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 72%|███████▏ | 8859/12384 [18:48:00<7:26:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 72%|███████▏ | 8860/12384 [18:48:00<7:26:27, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 72%|███████▏ | 8860/12384 [18:48:08<7:26:27, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.29s]
Epoch 1: 72%|███████▏ | 8861/12384 [18:48:08<7:25:30, 7.59s/it, loss=0.0001, acc=1.0000, iter_time=7.29s]
Epoch 1: 72%|███████▏ | 8861/12384 [18:48:15<7:25:30, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 72%|███████▏ | 8862/12384 [18:48:15<7:25:51, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 72%|███████▏ | 8862/12384 [18:48:23<7:25:51, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 1: 72%|███████▏ | 8863/12384 [18:48:23<7:25:58, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 1: 72%|███████▏ | 8863/12384 [18:48:31<7:25:58, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 1: 72%|███████▏ | 8864/12384 [18:48:31<7:33:56, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 1: 72%|███████▏ | 8864/12384 [18:48:39<7:33:56, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=3.15s]
Epoch 1: 72%|███████▏ | 8865/12384 [18:48:39<7:31:36, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=3.15s]
Epoch 1: 72%|███████▏ | 8865/12384 [18:48:46<7:31:36, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=12.20s]
Epoch 1: 72%|███████▏ | 8866/12384 [18:48:46<7:29:43, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=12.20s]
Epoch 1: 72%|███████▏ | 8866/12384 [18:48:54<7:29:43, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.15s]
Epoch 1: 72%|███████▏ | 8867/12384 [18:48:54<7:28:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.15s]
Epoch 1: 72%|███████▏ | 8867/12384 [18:49:01<7:28:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.63s]
Epoch 1: 72%|███████▏ | 8868/12384 [18:49:01<7:27:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.63s]
Epoch 1: 72%|███████▏ | 8868/12384 [18:49:09<7:27:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 1: 72%|███████▏ | 8869/12384 [18:49:09<7:26:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 1: 72%|███████▏ | 8869/12384 [18:49:17<7:26:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 1: 72%|███████▏ | 8870/12384 [18:49:17<7:25:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 1: 72%|███████▏ | 8870/12384 [18:49:24<7:25:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 72%|███████▏ | 8871/12384 [18:49:24<7:25:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 72%|███████▏ | 8871/12384 [18:49:32<7:25:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 72%|███████▏ | 8872/12384 [18:49:32<7:25:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 72%|███████▏ | 8872/12384 [18:49:39<7:25:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 72%|███████▏ | 8873/12384 [18:49:39<7:25:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 72%|███████▏ | 8873/12384 [18:49:47<7:25:17, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.84s]
Epoch 1: 72%|███████▏ | 8874/12384 [18:49:47<7:25:11, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.84s]
Epoch 1: 72%|███████▏ | 8874/12384 [18:49:55<7:25:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 1: 72%|███████▏ | 8875/12384 [18:49:55<7:25:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 1: 72%|███████▏ | 8875/12384 [18:50:02<7:25:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 72%|███████▏ | 8876/12384 [18:50:02<7:24:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 72%|███████▏ | 8876/12384 [18:50:10<7:24:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 1: 72%|███████▏ | 8877/12384 [18:50:10<7:25:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 1: 72%|███████▏ | 8877/12384 [18:50:18<7:25:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.19s]
Epoch 1: 72%|███████▏ | 8878/12384 [18:50:18<7:25:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.19s]
Epoch 1: 72%|███████▏ | 8878/12384 [18:50:25<7:25:37, 7.63s/it, loss=0.0002, acc=0.9995, iter_time=7.64s]
Epoch 1: 72%|███████▏ | 8879/12384 [18:50:25<7:25:21, 7.62s/it, loss=0.0002, acc=0.9995, iter_time=7.64s]
Epoch 1: 72%|███████▏ | 8879/12384 [18:50:33<7:25:21, 7.62s/it, loss=0.0003, acc=0.9983, iter_time=8.00s]
Epoch 1: 72%|███████▏ | 8880/12384 [18:50:33<7:24:53, 7.62s/it, loss=0.0003, acc=0.9983, iter_time=8.00s]
Epoch 1: 72%|███████▏ | 8880/12384 [18:50:40<7:24:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 72%|███████▏ | 8881/12384 [18:50:40<7:24:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 72%|███████▏ | 8881/12384 [18:50:48<7:24:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 72%|███████▏ | 8882/12384 [18:50:48<7:24:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 72%|███████▏ | 8882/12384 [18:50:56<7:24:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 1: 72%|███████▏ | 8883/12384 [18:50:56<7:24:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 1: 72%|███████▏ | 8883/12384 [18:51:03<7:24:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.48s]
Epoch 1: 72%|███████▏ | 8884/12384 [18:51:03<7:23:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.48s]
Epoch 1: 72%|███████▏ | 8884/12384 [18:51:11<7:23:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 1: 72%|███████▏ | 8885/12384 [18:51:11<7:23:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 1: 72%|███████▏ | 8885/12384 [18:51:18<7:23:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.50s]
Epoch 1: 72%|███████▏ | 8886/12384 [18:51:18<7:23:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.50s]
Epoch 1: 72%|███████▏ | 8886/12384 [18:51:26<7:23:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 1: 72%|███████▏ | 8887/12384 [18:51:26<7:23:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 1: 72%|███████▏ | 8887/12384 [18:51:34<7:23:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 72%|███████▏ | 8888/12384 [18:51:34<7:23:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 72%|███████▏ | 8888/12384 [18:51:41<7:23:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.91s]
Epoch 1: 72%|███████▏ | 8889/12384 [18:51:41<7:23:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.91s]
Epoch 1: 72%|███████▏ | 8889/12384 [18:51:49<7:23:13, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.68s]
Epoch 1: 72%|███████▏ | 8890/12384 [18:51:49<7:29:02, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=8.68s]
Epoch 1: 72%|███████▏ | 8890/12384 [18:51:57<7:29:02, 7.71s/it, loss=0.0005, acc=0.9990, iter_time=10.18s]
Epoch 1: 72%|███████▏ | 8891/12384 [18:51:57<7:27:27, 7.69s/it, loss=0.0005, acc=0.9990, iter_time=10.18s]
Epoch 1: 72%|███████▏ | 8891/12384 [18:52:04<7:27:27, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 1: 72%|███████▏ | 8892/12384 [18:52:04<7:26:02, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 1: 72%|███████▏ | 8892/12384 [18:52:12<7:26:02, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.34s]
Epoch 1: 72%|███████▏ | 8893/12384 [18:52:12<7:25:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.34s]
Epoch 1: 72%|███████▏ | 8893/12384 [18:52:20<7:25:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 72%|███████▏ | 8894/12384 [18:52:20<7:23:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 72%|███████▏ | 8894/12384 [18:52:27<7:23:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.77s]
Epoch 1: 72%|███████▏ | 8895/12384 [18:52:27<7:23:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.77s]
Epoch 1: 72%|███████▏ | 8895/12384 [18:52:35<7:23:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.31s]
Epoch 1: 72%|███████▏ | 8896/12384 [18:52:35<7:23:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.31s]
Epoch 1: 72%|███████▏ | 8896/12384 [18:52:42<7:23:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 72%|███████▏ | 8897/12384 [18:52:42<7:22:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 72%|███████▏ | 8897/12384 [18:52:50<7:22:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 72%|███████▏ | 8898/12384 [18:52:50<7:22:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 72%|███████▏ | 8898/12384 [18:52:58<7:22:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 72%|███████▏ | 8899/12384 [18:52:58<7:22:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 72%|███████▏ | 8899/12384 [18:53:05<7:22:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 72%|███████▏ | 8900/12384 [18:53:05<7:22:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 72%|███████▏ | 8900/12384 [18:53:13<7:22:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 72%|███████▏ | 8901/12384 [18:53:13<7:22:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 72%|███████▏ | 8901/12384 [18:53:21<7:22:16, 7.62s/it, loss=0.0001, acc=0.9996, iter_time=7.60s]
Epoch 1: 72%|███████▏ | 8902/12384 [18:53:21<7:21:48, 7.61s/it, loss=0.0001, acc=0.9996, iter_time=7.60s]
Epoch 1: 72%|███████▏ | 8902/12384 [18:53:28<7:21:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 1: 72%|███████▏ | 8903/12384 [18:53:28<7:21:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 1: 72%|███████▏ | 8903/12384 [18:53:36<7:21:37, 7.61s/it, loss=0.0001, acc=0.9988, iter_time=10.75s]
Epoch 1: 72%|███████▏ | 8904/12384 [18:53:36<7:21:20, 7.61s/it, loss=0.0001, acc=0.9988, iter_time=10.75s]
Epoch 1: 72%|███████▏ | 8904/12384 [18:53:43<7:21:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.00s]
Epoch 1: 72%|███████▏ | 8905/12384 [18:53:43<7:21:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.00s]
Epoch 1: 72%|███████▏ | 8905/12384 [18:53:51<7:21:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 1: 72%|███████▏ | 8906/12384 [18:53:51<7:20:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 1: 72%|███████▏ | 8906/12384 [18:53:59<7:20:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 1: 72%|███████▏ | 8907/12384 [18:53:59<7:20:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 1: 72%|███████▏ | 8907/12384 [18:54:06<7:20:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 72%|███████▏ | 8908/12384 [18:54:06<7:20:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 72%|███████▏ | 8908/12384 [18:54:14<7:20:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.05s]
Epoch 1: 72%|███████▏ | 8909/12384 [18:54:14<7:22:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.05s]
Epoch 1: 72%|███████▏ | 8909/12384 [18:54:21<7:22:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.26s]
Epoch 1: 72%|███████▏ | 8910/12384 [18:54:21<7:21:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.26s]
Epoch 1: 72%|███████▏ | 8910/12384 [18:54:29<7:21:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 72%|███████▏ | 8911/12384 [18:54:29<7:21:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 72%|███████▏ | 8911/12384 [18:54:37<7:21:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 72%|███████▏ | 8912/12384 [18:54:37<7:21:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 72%|███████▏ | 8912/12384 [18:54:44<7:21:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.16s]
Epoch 1: 72%|███████▏ | 8913/12384 [18:54:44<7:20:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.16s]
Epoch 1: 72%|███████▏ | 8913/12384 [18:54:52<7:20:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 1: 72%|███████▏ | 8914/12384 [18:54:52<7:21:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 1: 72%|███████▏ | 8914/12384 [18:55:00<7:21:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 72%|███████▏ | 8915/12384 [18:55:00<7:20:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 72%|███████▏ | 8915/12384 [18:55:07<7:20:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 72%|███████▏ | 8916/12384 [18:55:07<7:20:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 72%|███████▏ | 8916/12384 [18:55:15<7:20:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.42s]
Epoch 1: 72%|███████▏ | 8917/12384 [18:55:15<7:26:03, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.42s]
Epoch 1: 72%|███████▏ | 8917/12384 [18:55:23<7:26:03, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 1: 72%|███████▏ | 8918/12384 [18:55:23<7:24:02, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 1: 72%|███████▏ | 8918/12384 [18:55:30<7:24:02, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 1: 72%|███████▏ | 8919/12384 [18:55:30<7:22:40, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 1: 72%|███████▏ | 8919/12384 [18:55:38<7:22:40, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.78s]
Epoch 1: 72%|███████▏ | 8920/12384 [18:55:38<7:21:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.78s]
Epoch 1: 72%|███████▏ | 8920/12384 [18:55:46<7:21:33, 7.65s/it, loss=0.0003, acc=0.9983, iter_time=4.42s]
Epoch 1: 72%|███████▏ | 8921/12384 [18:55:46<7:20:42, 7.64s/it, loss=0.0003, acc=0.9983, iter_time=4.42s]
Epoch 1: 72%|███████▏ | 8921/12384 [18:55:53<7:20:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 1: 72%|███████▏ | 8922/12384 [18:55:53<7:19:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 1: 72%|███████▏ | 8922/12384 [18:56:01<7:19:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 72%|███████▏ | 8923/12384 [18:56:01<7:18:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 72%|███████▏ | 8923/12384 [18:56:08<7:18:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 1: 72%|███████▏ | 8924/12384 [18:56:08<7:18:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 1: 72%|███████▏ | 8924/12384 [18:56:16<7:18:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 1: 72%|███████▏ | 8925/12384 [18:56:16<7:18:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 1: 72%|███████▏ | 8925/12384 [18:56:24<7:18:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 72%|███████▏ | 8926/12384 [18:56:24<7:18:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 72%|███████▏ | 8926/12384 [18:56:31<7:18:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 1: 72%|███████▏ | 8927/12384 [18:56:31<7:18:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 1: 72%|███████▏ | 8927/12384 [18:56:39<7:18:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 72%|███████▏ | 8928/12384 [18:56:39<7:18:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 72%|███████▏ | 8928/12384 [18:56:46<7:18:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 1: 72%|███████▏ | 8929/12384 [18:56:46<7:18:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 1: 72%|███████▏ | 8929/12384 [18:56:54<7:18:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 1: 72%|███████▏ | 8930/12384 [18:56:54<7:17:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 1: 72%|███████▏ | 8930/12384 [18:57:02<7:17:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 72%|███████▏ | 8931/12384 [18:57:02<7:17:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 72%|███████▏ | 8931/12384 [18:57:09<7:17:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 1: 72%|███████▏ | 8932/12384 [18:57:09<7:17:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 1: 72%|███████▏ | 8932/12384 [18:57:17<7:17:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 72%|███████▏ | 8933/12384 [18:57:17<7:17:17, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 72%|███████▏ | 8933/12384 [18:57:24<7:17:17, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 72%|███████▏ | 8934/12384 [18:57:24<7:17:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 72%|███████▏ | 8934/12384 [18:57:32<7:17:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 1: 72%|███████▏ | 8935/12384 [18:57:32<7:17:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 1: 72%|███████▏ | 8935/12384 [18:57:40<7:17:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 1: 72%|███████▏ | 8936/12384 [18:57:40<7:18:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 1: 72%|███████▏ | 8936/12384 [18:57:47<7:18:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 72%|███████▏ | 8937/12384 [18:57:47<7:17:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 72%|███████▏ | 8937/12384 [18:57:55<7:17:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 72%|███████▏ | 8938/12384 [18:57:55<7:18:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 72%|███████▏ | 8938/12384 [18:58:03<7:18:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.28s]
Epoch 1: 72%|███████▏ | 8939/12384 [18:58:03<7:18:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.28s]
Epoch 1: 72%|███████▏ | 8939/12384 [18:58:10<7:18:21, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=11.01s]
Epoch 1: 72%|███████▏ | 8940/12384 [18:58:10<7:17:32, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=11.01s]
Epoch 1: 72%|███████▏ | 8940/12384 [18:58:18<7:17:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 72%|███████▏ | 8941/12384 [18:58:18<7:17:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 72%|███████▏ | 8941/12384 [18:58:25<7:17:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 72%|███████▏ | 8942/12384 [18:58:25<7:16:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 72%|███████▏ | 8942/12384 [18:58:33<7:16:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 1: 72%|███████▏ | 8943/12384 [18:58:33<7:22:19, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 1: 72%|███████▏ | 8943/12384 [18:58:41<7:22:19, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.48s]
Epoch 1: 72%|███████▏ | 8944/12384 [18:58:41<7:20:08, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.48s]
Epoch 1: 72%|███████▏ | 8944/12384 [18:58:49<7:20:08, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 72%|███████▏ | 8945/12384 [18:58:49<7:18:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 72%|███████▏ | 8945/12384 [18:58:56<7:18:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 72%|███████▏ | 8946/12384 [18:58:56<7:17:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 72%|███████▏ | 8946/12384 [18:59:04<7:17:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 72%|███████▏ | 8947/12384 [18:59:04<7:16:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 72%|███████▏ | 8947/12384 [18:59:11<7:16:49, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=4.24s]
Epoch 1: 72%|███████▏ | 8948/12384 [18:59:11<7:16:18, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.24s]
Epoch 1: 72%|███████▏ | 8948/12384 [18:59:19<7:16:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.32s]
Epoch 1: 72%|███████▏ | 8949/12384 [18:59:19<7:15:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.32s]
Epoch 1: 72%|███████▏ | 8949/12384 [18:59:27<7:15:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 72%|███████▏ | 8950/12384 [18:59:27<7:15:01, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 72%|███████▏ | 8950/12384 [18:59:34<7:15:01, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 72%|███████▏ | 8951/12384 [18:59:34<7:15:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 72%|███████▏ | 8951/12384 [18:59:42<7:15:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.89s]
Epoch 1: 72%|███████▏ | 8952/12384 [18:59:42<7:15:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.89s]
Epoch 1: 72%|███████▏ | 8952/12384 [18:59:49<7:15:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 72%|███████▏ | 8953/12384 [18:59:49<7:15:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 72%|███████▏ | 8953/12384 [18:59:57<7:15:20, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.02s]
Epoch 1: 72%|███████▏ | 8954/12384 [18:59:57<7:15:12, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.02s]
Epoch 1: 72%|███████▏ | 8954/12384 [19:00:05<7:15:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.16s]
Epoch 1: 72%|███████▏ | 8955/12384 [19:00:05<7:15:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.16s]
Epoch 1: 72%|███████▏ | 8955/12384 [19:00:12<7:15:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 1: 72%|███████▏ | 8956/12384 [19:00:12<7:14:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 1: 72%|███████▏ | 8956/12384 [19:00:20<7:14:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 1: 72%|███████▏ | 8957/12384 [19:00:20<7:14:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 1: 72%|███████▏ | 8957/12384 [19:00:27<7:14:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 72%|███████▏ | 8958/12384 [19:00:27<7:14:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 72%|███████▏ | 8958/12384 [19:00:35<7:14:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 72%|███████▏ | 8959/12384 [19:00:35<7:13:51, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 72%|███████▏ | 8959/12384 [19:00:43<7:13:51, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 72%|███████▏ | 8960/12384 [19:00:43<7:13:44, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 72%|███████▏ | 8960/12384 [19:00:50<7:13:44, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 1: 72%|███████▏ | 8961/12384 [19:00:50<7:13:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 1: 72%|███████▏ | 8961/12384 [19:00:58<7:13:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 1: 72%|███████▏ | 8962/12384 [19:00:58<7:13:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 1: 72%|███████▏ | 8962/12384 [19:01:05<7:13:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 72%|███████▏ | 8963/12384 [19:01:05<7:13:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 72%|███████▏ | 8963/12384 [19:01:13<7:13:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 72%|███████▏ | 8964/12384 [19:01:13<7:13:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 72%|███████▏ | 8964/12384 [19:01:21<7:13:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 72%|███████▏ | 8965/12384 [19:01:21<7:13:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 72%|███████▏ | 8965/12384 [19:01:28<7:13:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 72%|███████▏ | 8966/12384 [19:01:28<7:13:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 72%|███████▏ | 8966/12384 [19:01:36<7:13:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 1: 72%|███████▏ | 8967/12384 [19:01:36<7:13:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 1: 72%|███████▏ | 8967/12384 [19:01:44<7:13:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 1: 72%|███████▏ | 8968/12384 [19:01:44<7:13:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 1: 72%|███████▏ | 8968/12384 [19:01:51<7:13:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 72%|███████▏ | 8969/12384 [19:01:51<7:19:11, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 72%|███████▏ | 8969/12384 [19:01:59<7:19:11, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 72%|███████▏ | 8970/12384 [19:01:59<7:18:01, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 72%|███████▏ | 8970/12384 [19:02:07<7:18:01, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 72%|███████▏ | 8971/12384 [19:02:07<7:16:08, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 72%|███████▏ | 8971/12384 [19:02:14<7:16:08, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 72%|███████▏ | 8972/12384 [19:02:14<7:14:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 72%|███████▏ | 8972/12384 [19:02:22<7:14:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 72%|███████▏ | 8973/12384 [19:02:22<7:13:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 72%|███████▏ | 8973/12384 [19:02:30<7:13:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 72%|███████▏ | 8974/12384 [19:02:30<7:13:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 72%|███████▏ | 8974/12384 [19:02:37<7:13:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 72%|███████▏ | 8975/12384 [19:02:37<7:13:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 72%|███████▏ | 8975/12384 [19:02:45<7:13:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 72%|███████▏ | 8976/12384 [19:02:45<7:12:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 72%|███████▏ | 8976/12384 [19:02:52<7:12:54, 7.62s/it, loss=0.0001, acc=0.9993, iter_time=7.21s]
Epoch 1: 72%|███████▏ | 8977/12384 [19:02:52<7:12:11, 7.61s/it, loss=0.0001, acc=0.9993, iter_time=7.21s]
Epoch 1: 72%|███████▏ | 8977/12384 [19:03:00<7:12:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 1: 72%|███████▏ | 8978/12384 [19:03:00<7:12:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 1: 72%|███████▏ | 8978/12384 [19:03:08<7:12:03, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=8.46s]
Epoch 1: 73%|███████▎ | 8979/12384 [19:03:08<7:11:55, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=8.46s]
Epoch 1: 73%|███████▎ | 8979/12384 [19:03:15<7:11:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 73%|███████▎ | 8980/12384 [19:03:15<7:11:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 73%|███████▎ | 8980/12384 [19:03:23<7:11:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 73%|███████▎ | 8981/12384 [19:03:23<7:11:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 73%|███████▎ | 8981/12384 [19:03:30<7:11:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 73%|███████▎ | 8982/12384 [19:03:30<7:11:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 73%|███████▎ | 8982/12384 [19:03:38<7:11:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 1: 73%|███████▎ | 8983/12384 [19:03:38<7:10:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 1: 73%|███████▎ | 8983/12384 [19:03:46<7:10:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 1: 73%|███████▎ | 8984/12384 [19:03:46<7:10:48, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 1: 73%|███████▎ | 8984/12384 [19:03:53<7:10:48, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 1: 73%|███████▎ | 8985/12384 [19:03:53<7:10:31, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 1: 73%|███████▎ | 8985/12384 [19:04:01<7:10:31, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 1: 73%|███████▎ | 8986/12384 [19:04:01<7:10:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 1: 73%|███████▎ | 8986/12384 [19:04:08<7:10:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 73%|███████▎ | 8987/12384 [19:04:08<7:10:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 73%|███████▎ | 8987/12384 [19:04:16<7:10:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 73%|███████▎ | 8988/12384 [19:04:16<7:10:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 73%|███████▎ | 8988/12384 [19:04:24<7:10:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 1: 73%|███████▎ | 8989/12384 [19:04:24<7:10:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 1: 73%|███████▎ | 8989/12384 [19:04:31<7:10:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 73%|███████▎ | 8990/12384 [19:04:31<7:10:02, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 73%|███████▎ | 8990/12384 [19:04:39<7:10:02, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 73%|███████▎ | 8991/12384 [19:04:39<7:09:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 73%|███████▎ | 8991/12384 [19:04:46<7:09:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 73%|███████▎ | 8992/12384 [19:04:46<7:09:39, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 73%|███████▎ | 8992/12384 [19:04:54<7:09:39, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.67s]
Epoch 1: 73%|███████▎ | 8993/12384 [19:04:54<7:09:17, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.67s]
Epoch 1: 73%|███████▎ | 8993/12384 [19:05:02<7:09:17, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.81s]
Epoch 1: 73%|███████▎ | 8994/12384 [19:05:02<7:09:14, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.81s]
Epoch 1: 73%|███████▎ | 8994/12384 [19:05:10<7:09:14, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 1: 73%|███████▎ | 8995/12384 [19:05:10<7:15:38, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 1: 73%|███████▎ | 8995/12384 [19:05:17<7:15:38, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 73%|███████▎ | 8996/12384 [19:05:17<7:13:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 73%|███████▎ | 8996/12384 [19:05:25<7:13:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.57s]
Epoch 1: 73%|███████▎ | 8997/12384 [19:05:25<7:11:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.57s]
Epoch 1: 73%|███████▎ | 8997/12384 [19:05:32<7:11:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.60s]
Epoch 1: 73%|███████▎ | 8998/12384 [19:05:32<7:10:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.60s]
Epoch 1: 73%|███████▎ | 8998/12384 [19:05:40<7:10:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 1: 73%|███████▎ | 8999/12384 [19:05:40<7:10:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 1: 73%|███████▎ | 8999/12384 [19:05:48<7:10:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 1: 73%|███████▎ | 9000/12384 [19:05:48<7:09:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 1: 73%|███████▎ | 9000/12384 [19:05:55<7:09:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 73%|███████▎ | 9001/12384 [19:05:55<7:09:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 73%|███████▎ | 9001/12384 [19:06:03<7:09:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 1: 73%|███████▎ | 9002/12384 [19:06:03<7:09:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 1: 73%|███████▎ | 9002/12384 [19:06:10<7:09:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.23s]
Epoch 1: 73%|███████▎ | 9003/12384 [19:06:10<7:09:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.23s]
Epoch 1: 73%|███████▎ | 9003/12384 [19:06:18<7:09:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 73%|███████▎ | 9004/12384 [19:06:18<7:08:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 73%|███████▎ | 9004/12384 [19:06:26<7:08:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 73%|███████▎ | 9005/12384 [19:06:26<7:08:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 73%|███████▎ | 9005/12384 [19:06:33<7:08:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 1: 73%|███████▎ | 9006/12384 [19:06:33<7:10:25, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 1: 73%|███████▎ | 9006/12384 [19:06:41<7:10:25, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 1: 73%|███████▎ | 9007/12384 [19:06:41<7:09:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 1: 73%|███████▎ | 9007/12384 [19:06:49<7:09:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 73%|███████▎ | 9008/12384 [19:06:49<7:09:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 73%|███████▎ | 9008/12384 [19:06:56<7:09:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 73%|███████▎ | 9009/12384 [19:06:56<7:10:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 73%|███████▎ | 9009/12384 [19:07:04<7:10:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 1: 73%|███████▎ | 9010/12384 [19:07:04<7:10:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 1: 73%|███████▎ | 9010/12384 [19:07:12<7:10:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 1: 73%|███████▎ | 9011/12384 [19:07:12<7:09:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 1: 73%|███████▎ | 9011/12384 [19:07:19<7:09:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 1: 73%|███████▎ | 9012/12384 [19:07:19<7:08:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 1: 73%|███████▎ | 9012/12384 [19:07:27<7:08:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 1: 73%|███████▎ | 9013/12384 [19:07:27<7:07:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 1: 73%|███████▎ | 9013/12384 [19:07:34<7:07:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.30s]
Epoch 1: 73%|███████▎ | 9014/12384 [19:07:34<7:07:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.30s]
Epoch 1: 73%|███████▎ | 9014/12384 [19:07:42<7:07:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 1: 73%|███████▎ | 9015/12384 [19:07:42<7:06:54, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 1: 73%|███████▎ | 9015/12384 [19:07:50<7:06:54, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 1: 73%|███████▎ | 9016/12384 [19:07:50<7:06:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 1: 73%|███████▎ | 9016/12384 [19:07:57<7:06:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.46s]
Epoch 1: 73%|███████▎ | 9017/12384 [19:07:57<7:07:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.46s]
Epoch 1: 73%|███████▎ | 9017/12384 [19:08:05<7:07:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.12s]
Epoch 1: 73%|███████▎ | 9018/12384 [19:08:05<7:06:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.12s]
Epoch 1: 73%|███████▎ | 9018/12384 [19:08:12<7:06:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.87s]
Epoch 1: 73%|███████▎ | 9019/12384 [19:08:12<7:07:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.87s]
Epoch 1: 73%|███████▎ | 9019/12384 [19:08:20<7:07:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 73%|███████▎ | 9020/12384 [19:08:20<7:07:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 73%|███████▎ | 9020/12384 [19:08:28<7:07:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 73%|███████▎ | 9021/12384 [19:08:28<7:13:08, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 73%|███████▎ | 9021/12384 [19:08:36<7:13:08, 7.73s/it, loss=0.0001, acc=0.9996, iter_time=7.62s]
Epoch 1: 73%|███████▎ | 9022/12384 [19:08:36<7:11:03, 7.69s/it, loss=0.0001, acc=0.9996, iter_time=7.62s]
Epoch 1: 73%|███████▎ | 9022/12384 [19:08:43<7:11:03, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 73%|███████▎ | 9023/12384 [19:08:43<7:09:32, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 73%|███████▎ | 9023/12384 [19:08:51<7:09:32, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 73%|███████▎ | 9024/12384 [19:08:51<7:08:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 73%|███████▎ | 9024/12384 [19:08:58<7:08:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 73%|███████▎ | 9025/12384 [19:08:58<7:07:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 73%|███████▎ | 9025/12384 [19:09:06<7:07:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 73%|███████▎ | 9026/12384 [19:09:06<7:07:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 73%|███████▎ | 9026/12384 [19:09:14<7:07:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 73%|███████▎ | 9027/12384 [19:09:14<7:06:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 73%|███████▎ | 9027/12384 [19:09:21<7:06:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 73%|███████▎ | 9028/12384 [19:09:21<7:06:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 73%|███████▎ | 9028/12384 [19:09:29<7:06:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 73%|███████▎ | 9029/12384 [19:09:29<7:07:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 73%|███████▎ | 9029/12384 [19:09:37<7:07:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=3.44s]
Epoch 1: 73%|███████▎ | 9030/12384 [19:09:37<7:07:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.44s]
Epoch 1: 73%|███████▎ | 9030/12384 [19:09:44<7:07:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.89s]
Epoch 1: 73%|███████▎ | 9031/12384 [19:09:44<7:06:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.89s]
Epoch 1: 73%|███████▎ | 9031/12384 [19:09:52<7:06:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 73%|███████▎ | 9032/12384 [19:09:52<7:07:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 73%|███████▎ | 9032/12384 [19:09:59<7:07:21, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 1: 73%|███████▎ | 9033/12384 [19:09:59<7:06:28, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 1: 73%|███████▎ | 9033/12384 [19:10:07<7:06:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 73%|███████▎ | 9034/12384 [19:10:07<7:05:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 73%|███████▎ | 9034/12384 [19:10:15<7:05:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 73%|███████▎ | 9035/12384 [19:10:15<7:05:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 73%|███████▎ | 9035/12384 [19:10:22<7:05:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 73%|███████▎ | 9036/12384 [19:10:22<7:05:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 73%|███████▎ | 9036/12384 [19:10:30<7:05:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.40s]
Epoch 1: 73%|███████▎ | 9037/12384 [19:10:30<7:04:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.40s]
Epoch 1: 73%|███████▎ | 9037/12384 [19:10:38<7:04:54, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.57s]
Epoch 1: 73%|███████▎ | 9038/12384 [19:10:38<7:04:21, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.57s]
Epoch 1: 73%|███████▎ | 9038/12384 [19:10:45<7:04:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.85s]
Epoch 1: 73%|███████▎ | 9039/12384 [19:10:45<7:06:51, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.85s]
Epoch 1: 73%|███████▎ | 9039/12384 [19:10:53<7:06:51, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 73%|███████▎ | 9040/12384 [19:10:53<7:06:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 73%|███████▎ | 9040/12384 [19:11:01<7:06:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.79s]
Epoch 1: 73%|███████▎ | 9041/12384 [19:11:01<7:05:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.79s]
Epoch 1: 73%|███████▎ | 9041/12384 [19:11:08<7:05:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.88s]
Epoch 1: 73%|███████▎ | 9042/12384 [19:11:08<7:04:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.88s]
Epoch 1: 73%|███████▎ | 9042/12384 [19:11:16<7:04:34, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=11.18s]
Epoch 1: 73%|███████▎ | 9043/12384 [19:11:16<7:04:48, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=11.18s]
Epoch 1: 73%|███████▎ | 9043/12384 [19:11:23<7:04:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 73%|███████▎ | 9044/12384 [19:11:23<7:04:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 73%|███████▎ | 9044/12384 [19:11:31<7:04:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.76s]
Epoch 1: 73%|███████▎ | 9045/12384 [19:11:31<7:03:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.76s]
Epoch 1: 73%|███████▎ | 9045/12384 [19:11:39<7:03:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.48s]
Epoch 1: 73%|███████▎ | 9046/12384 [19:11:39<7:03:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.48s]
Epoch 1: 73%|███████▎ | 9046/12384 [19:11:46<7:03:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.24s]
Epoch 1: 73%|███████▎ | 9047/12384 [19:11:46<7:03:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.24s]
Epoch 1: 73%|███████▎ | 9047/12384 [19:11:54<7:03:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 1: 73%|███████▎ | 9048/12384 [19:11:54<7:09:13, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 1: 73%|███████▎ | 9048/12384 [19:12:02<7:09:13, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 73%|███████▎ | 9049/12384 [19:12:02<7:06:41, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 73%|███████▎ | 9049/12384 [19:12:09<7:06:41, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 1: 73%|███████▎ | 9050/12384 [19:12:09<7:05:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 1: 73%|███████▎ | 9050/12384 [19:12:17<7:05:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 1: 73%|███████▎ | 9051/12384 [19:12:17<7:04:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 1: 73%|███████▎ | 9051/12384 [19:12:25<7:04:10, 7.64s/it, loss=0.0001, acc=0.9996, iter_time=9.86s]
Epoch 1: 73%|███████▎ | 9052/12384 [19:12:25<7:03:22, 7.62s/it, loss=0.0001, acc=0.9996, iter_time=9.86s]
Epoch 1: 73%|███████▎ | 9052/12384 [19:12:32<7:03:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 73%|███████▎ | 9053/12384 [19:12:32<7:03:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 73%|███████▎ | 9053/12384 [19:12:40<7:03:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 73%|███████▎ | 9054/12384 [19:12:40<7:03:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 73%|███████▎ | 9054/12384 [19:12:47<7:03:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 1: 73%|███████▎ | 9055/12384 [19:12:47<7:02:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 1: 73%|███████▎ | 9055/12384 [19:12:55<7:02:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 1: 73%|███████▎ | 9056/12384 [19:12:55<7:02:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 1: 73%|███████▎ | 9056/12384 [19:13:03<7:02:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 73%|███████▎ | 9057/12384 [19:13:03<7:02:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 73%|███████▎ | 9057/12384 [19:13:10<7:02:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 73%|███████▎ | 9058/12384 [19:13:10<7:02:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 73%|███████▎ | 9058/12384 [19:13:18<7:02:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 1: 73%|███████▎ | 9059/12384 [19:13:18<7:01:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 1: 73%|███████▎ | 9059/12384 [19:13:25<7:01:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 1: 73%|███████▎ | 9060/12384 [19:13:25<7:01:08, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 1: 73%|███████▎ | 9060/12384 [19:13:33<7:01:08, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.22s]
Epoch 1: 73%|███████▎ | 9061/12384 [19:13:33<7:02:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.22s]
Epoch 1: 73%|███████▎ | 9061/12384 [19:13:41<7:02:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 73%|███████▎ | 9062/12384 [19:13:41<7:02:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 73%|███████▎ | 9062/12384 [19:13:48<7:02:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.21s]
Epoch 1: 73%|███████▎ | 9063/12384 [19:13:48<7:01:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.21s]
Epoch 1: 73%|███████▎ | 9063/12384 [19:13:56<7:01:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.65s]
Epoch 1: 73%|███████▎ | 9064/12384 [19:13:56<7:01:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.65s]
Epoch 1: 73%|███████▎ | 9064/12384 [19:14:04<7:01:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 73%|███████▎ | 9065/12384 [19:14:04<7:01:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 73%|███████▎ | 9065/12384 [19:14:11<7:01:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 73%|███████▎ | 9066/12384 [19:14:11<7:01:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 73%|███████▎ | 9066/12384 [19:14:19<7:01:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 73%|███████▎ | 9067/12384 [19:14:19<7:01:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 73%|███████▎ | 9067/12384 [19:14:26<7:01:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 1: 73%|███████▎ | 9068/12384 [19:14:26<7:01:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 1: 73%|███████▎ | 9068/12384 [19:14:34<7:01:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 1: 73%|███████▎ | 9069/12384 [19:14:34<7:01:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 1: 73%|███████▎ | 9069/12384 [19:14:42<7:01:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.46s]
Epoch 1: 73%|███████▎ | 9070/12384 [19:14:42<7:00:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.46s]
Epoch 1: 73%|███████▎ | 9070/12384 [19:14:49<7:00:51, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.03s]
Epoch 1: 73%|███████▎ | 9071/12384 [19:14:49<7:00:39, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.03s]
Epoch 1: 73%|███████▎ | 9071/12384 [19:14:57<7:00:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.77s]
Epoch 1: 73%|███████▎ | 9072/12384 [19:14:57<7:00:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.77s]
Epoch 1: 73%|███████▎ | 9072/12384 [19:15:04<7:00:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 73%|███████▎ | 9073/12384 [19:15:04<6:59:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 73%|███████▎ | 9073/12384 [19:15:12<6:59:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 73%|███████▎ | 9074/12384 [19:15:12<7:05:09, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 73%|███████▎ | 9074/12384 [19:15:20<7:05:09, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 73%|███████▎ | 9075/12384 [19:15:20<7:03:04, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 73%|███████▎ | 9075/12384 [19:15:28<7:03:04, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 1: 73%|███████▎ | 9076/12384 [19:15:28<7:01:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 1: 73%|███████▎ | 9076/12384 [19:15:35<7:01:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 1: 73%|███████▎ | 9077/12384 [19:15:35<7:00:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 1: 73%|███████▎ | 9077/12384 [19:15:43<7:00:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 73%|███████▎ | 9078/12384 [19:15:43<7:00:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 73%|███████▎ | 9078/12384 [19:15:50<7:00:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 73%|███████▎ | 9079/12384 [19:15:50<6:59:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 73%|███████▎ | 9079/12384 [19:15:58<6:59:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 73%|███████▎ | 9080/12384 [19:15:58<6:59:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 73%|███████▎ | 9080/12384 [19:16:06<6:59:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 73%|███████▎ | 9081/12384 [19:16:06<6:58:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 73%|███████▎ | 9081/12384 [19:16:13<6:58:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 73%|███████▎ | 9082/12384 [19:16:13<6:59:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 73%|███████▎ | 9082/12384 [19:16:21<6:59:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 73%|███████▎ | 9083/12384 [19:16:21<6:59:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 73%|███████▎ | 9083/12384 [19:16:28<6:59:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 73%|███████▎ | 9084/12384 [19:16:28<6:58:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 73%|███████▎ | 9084/12384 [19:16:36<6:58:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 73%|███████▎ | 9085/12384 [19:16:36<6:58:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 73%|███████▎ | 9085/12384 [19:16:44<6:58:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 1: 73%|███████▎ | 9086/12384 [19:16:44<6:57:53, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 1: 73%|███████▎ | 9086/12384 [19:16:51<6:57:53, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 73%|███████▎ | 9087/12384 [19:16:51<6:58:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 73%|███████▎ | 9087/12384 [19:16:59<6:58:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 73%|███████▎ | 9088/12384 [19:16:59<6:58:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 73%|███████▎ | 9088/12384 [19:17:07<6:58:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 73%|███████▎ | 9089/12384 [19:17:07<6:58:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 73%|███████▎ | 9089/12384 [19:17:14<6:58:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 73%|███████▎ | 9090/12384 [19:17:14<6:57:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 73%|███████▎ | 9090/12384 [19:17:22<6:57:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 73%|███████▎ | 9091/12384 [19:17:22<6:57:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 73%|███████▎ | 9091/12384 [19:17:29<6:57:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 1: 73%|███████▎ | 9092/12384 [19:17:29<6:57:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 1: 73%|███████▎ | 9092/12384 [19:17:37<6:57:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 73%|███████▎ | 9093/12384 [19:17:37<6:57:07, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 73%|███████▎ | 9093/12384 [19:17:45<6:57:07, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 1: 73%|███████▎ | 9094/12384 [19:17:45<6:56:57, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 1: 73%|███████▎ | 9094/12384 [19:17:52<6:56:57, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 1: 73%|███████▎ | 9095/12384 [19:17:52<6:56:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 1: 73%|███████▎ | 9095/12384 [19:18:00<6:56:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.85s]
Epoch 1: 73%|███████▎ | 9096/12384 [19:18:00<6:57:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.85s]
Epoch 1: 73%|███████▎ | 9096/12384 [19:18:07<6:57:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.38s]
Epoch 1: 73%|███████▎ | 9097/12384 [19:18:07<6:56:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.38s]
Epoch 1: 73%|███████▎ | 9097/12384 [19:18:15<6:56:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.85s]
Epoch 1: 73%|███████▎ | 9098/12384 [19:18:15<6:56:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.85s]
Epoch 1: 73%|███████▎ | 9098/12384 [19:18:23<6:56:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.62s]
Epoch 1: 73%|███████▎ | 9099/12384 [19:18:23<6:56:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.62s]
Epoch 1: 73%|███████▎ | 9099/12384 [19:18:30<6:56:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 73%|███████▎ | 9100/12384 [19:18:30<6:56:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 73%|███████▎ | 9100/12384 [19:18:38<6:56:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 73%|███████▎ | 9101/12384 [19:18:38<7:01:40, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 73%|███████▎ | 9101/12384 [19:18:46<7:01:40, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 73%|███████▎ | 9102/12384 [19:18:46<6:59:41, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 73%|███████▎ | 9102/12384 [19:18:53<6:59:41, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 74%|███████▎ | 9103/12384 [19:18:53<6:58:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 74%|███████▎ | 9103/12384 [19:19:01<6:58:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 74%|███████▎ | 9104/12384 [19:19:01<6:57:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 74%|███████▎ | 9104/12384 [19:19:09<6:57:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 74%|███████▎ | 9105/12384 [19:19:09<6:56:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 74%|███████▎ | 9105/12384 [19:19:16<6:56:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 1: 74%|███████▎ | 9106/12384 [19:19:16<6:56:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 1: 74%|███████▎ | 9106/12384 [19:19:24<6:56:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 1: 74%|███████▎ | 9107/12384 [19:19:24<6:56:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 1: 74%|███████▎ | 9107/12384 [19:19:31<6:56:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 74%|███████▎ | 9108/12384 [19:19:31<6:55:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 74%|███████▎ | 9108/12384 [19:19:39<6:55:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 1: 74%|███████▎ | 9109/12384 [19:19:39<6:55:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 1: 74%|███████▎ | 9109/12384 [19:19:47<6:55:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 74%|███████▎ | 9110/12384 [19:19:47<6:55:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 74%|███████▎ | 9110/12384 [19:19:54<6:55:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 1: 74%|███████▎ | 9111/12384 [19:19:54<6:55:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 1: 74%|███████▎ | 9111/12384 [19:20:02<6:55:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.46s]
Epoch 1: 74%|███████▎ | 9112/12384 [19:20:02<6:55:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.46s]
Epoch 1: 74%|███████▎ | 9112/12384 [19:20:09<6:55:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 74%|███████▎ | 9113/12384 [19:20:09<6:55:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 74%|███████▎ | 9113/12384 [19:20:17<6:55:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 74%|███████▎ | 9114/12384 [19:20:17<6:54:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 74%|███████▎ | 9114/12384 [19:20:25<6:54:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 1: 74%|███████▎ | 9115/12384 [19:20:25<6:54:14, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 1: 74%|███████▎ | 9115/12384 [19:20:32<6:54:14, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 1: 74%|███████▎ | 9116/12384 [19:20:32<6:57:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 1: 74%|███████▎ | 9116/12384 [19:20:40<6:57:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.61s]
Epoch 1: 74%|███████▎ | 9117/12384 [19:20:40<6:55:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.61s]
Epoch 1: 74%|███████▎ | 9117/12384 [19:20:48<6:55:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.36s]
Epoch 1: 74%|███████▎ | 9118/12384 [19:20:48<6:57:20, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.36s]
Epoch 1: 74%|███████▎ | 9118/12384 [19:20:55<6:57:20, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 1: 74%|███████▎ | 9119/12384 [19:20:55<6:55:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 1: 74%|███████▎ | 9119/12384 [19:21:03<6:55:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 74%|███████▎ | 9120/12384 [19:21:03<6:55:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 74%|███████▎ | 9120/12384 [19:21:11<6:55:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 74%|███████▎ | 9121/12384 [19:21:11<6:54:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 74%|███████▎ | 9121/12384 [19:21:18<6:54:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 74%|███████▎ | 9122/12384 [19:21:18<6:54:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 74%|███████▎ | 9122/12384 [19:21:26<6:54:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 1: 74%|███████▎ | 9123/12384 [19:21:26<6:53:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 1: 74%|███████▎ | 9123/12384 [19:21:33<6:53:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.88s]
Epoch 1: 74%|███████▎ | 9124/12384 [19:21:33<6:53:07, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.88s]
Epoch 1: 74%|███████▎ | 9124/12384 [19:21:41<6:53:07, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 74%|███████▎ | 9125/12384 [19:21:41<6:53:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 74%|███████▎ | 9125/12384 [19:21:49<6:53:11, 7.61s/it, loss=0.0005, acc=0.9983, iter_time=7.61s]
Epoch 1: 74%|███████▎ | 9126/12384 [19:21:49<6:54:21, 7.63s/it, loss=0.0005, acc=0.9983, iter_time=7.61s]
Epoch 1: 74%|███████▎ | 9126/12384 [19:21:57<6:54:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 74%|███████▎ | 9127/12384 [19:21:57<6:58:54, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 74%|███████▎ | 9127/12384 [19:22:04<6:58:54, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 74%|███████▎ | 9128/12384 [19:22:04<6:57:12, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 74%|███████▎ | 9128/12384 [19:22:12<6:57:12, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 1: 74%|███████▎ | 9129/12384 [19:22:12<6:55:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 1: 74%|███████▎ | 9129/12384 [19:22:19<6:55:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 1: 74%|███████▎ | 9130/12384 [19:22:19<6:54:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 1: 74%|███████▎ | 9130/12384 [19:22:27<6:54:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 1: 74%|███████▎ | 9131/12384 [19:22:27<6:53:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 1: 74%|███████▎ | 9131/12384 [19:22:35<6:53:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 1: 74%|███████▎ | 9132/12384 [19:22:35<6:53:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 1: 74%|███████▎ | 9132/12384 [19:22:42<6:53:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 74%|███████▎ | 9133/12384 [19:22:42<6:53:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 74%|███████▎ | 9133/12384 [19:22:50<6:53:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 1: 74%|███████▍ | 9134/12384 [19:22:50<6:53:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 1: 74%|███████▍ | 9134/12384 [19:22:57<6:53:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 1: 74%|███████▍ | 9135/12384 [19:22:57<6:52:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 1: 74%|███████▍ | 9135/12384 [19:23:05<6:52:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.20s]
Epoch 1: 74%|███████▍ | 9136/12384 [19:23:05<6:52:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.20s]
Epoch 1: 74%|███████▍ | 9136/12384 [19:23:13<6:52:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 74%|███████▍ | 9137/12384 [19:23:13<6:51:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 74%|███████▍ | 9137/12384 [19:23:20<6:51:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 74%|███████▍ | 9138/12384 [19:23:20<6:51:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 74%|███████▍ | 9138/12384 [19:23:28<6:51:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 1: 74%|███████▍ | 9139/12384 [19:23:28<6:51:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 1: 74%|███████▍ | 9139/12384 [19:23:35<6:51:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.91s]
Epoch 1: 74%|███████▍ | 9140/12384 [19:23:35<6:50:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.91s]
Epoch 1: 74%|███████▍ | 9140/12384 [19:23:43<6:50:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 1: 74%|███████▍ | 9141/12384 [19:23:43<6:50:52, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 1: 74%|███████▍ | 9141/12384 [19:23:51<6:50:52, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 74%|███████▍ | 9142/12384 [19:23:51<6:51:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 74%|███████▍ | 9142/12384 [19:23:58<6:51:10, 7.61s/it, loss=0.0014, acc=0.9979, iter_time=5.85s]
Epoch 1: 74%|███████▍ | 9143/12384 [19:23:58<6:51:14, 7.61s/it, loss=0.0014, acc=0.9979, iter_time=5.85s]
Epoch 1: 74%|███████▍ | 9143/12384 [19:24:06<6:51:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.77s]
Epoch 1: 74%|███████▍ | 9144/12384 [19:24:06<6:51:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.77s]
Epoch 1: 74%|███████▍ | 9144/12384 [19:24:14<6:51:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.30s]
Epoch 1: 74%|███████▍ | 9145/12384 [19:24:14<6:51:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.30s]
Epoch 1: 74%|███████▍ | 9145/12384 [19:24:21<6:51:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 1: 74%|███████▍ | 9146/12384 [19:24:21<6:50:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 1: 74%|███████▍ | 9146/12384 [19:24:29<6:50:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 74%|███████▍ | 9147/12384 [19:24:29<6:50:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 74%|███████▍ | 9147/12384 [19:24:36<6:50:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 74%|███████▍ | 9148/12384 [19:24:36<6:52:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 74%|███████▍ | 9148/12384 [19:24:44<6:52:05, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=3.52s]
Epoch 1: 74%|███████▍ | 9149/12384 [19:24:44<6:51:21, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=3.52s]
Epoch 1: 74%|███████▍ | 9149/12384 [19:24:52<6:51:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.77s]
Epoch 1: 74%|███████▍ | 9150/12384 [19:24:52<6:51:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.77s]
Epoch 1: 74%|███████▍ | 9150/12384 [19:24:59<6:51:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 1: 74%|███████▍ | 9151/12384 [19:24:59<6:50:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 1: 74%|███████▍ | 9151/12384 [19:25:07<6:50:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.92s]
Epoch 1: 74%|███████▍ | 9152/12384 [19:25:07<6:50:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.92s]
Epoch 1: 74%|███████▍ | 9152/12384 [19:25:15<6:50:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 74%|███████▍ | 9153/12384 [19:25:15<6:55:26, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 74%|███████▍ | 9153/12384 [19:25:23<6:55:26, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.55s]
Epoch 1: 74%|███████▍ | 9154/12384 [19:25:23<6:54:51, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.55s]
Epoch 1: 74%|███████▍ | 9154/12384 [19:25:30<6:54:51, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=11.06s]
Epoch 1: 74%|███████▍ | 9155/12384 [19:25:30<6:53:12, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=11.06s]
Epoch 1: 74%|███████▍ | 9155/12384 [19:25:38<6:53:12, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 74%|███████▍ | 9156/12384 [19:25:38<6:51:59, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 74%|███████▍ | 9156/12384 [19:25:45<6:51:59, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 74%|███████▍ | 9157/12384 [19:25:45<6:50:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 74%|███████▍ | 9157/12384 [19:25:53<6:50:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 74%|███████▍ | 9158/12384 [19:25:53<6:50:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 74%|███████▍ | 9158/12384 [19:26:01<6:50:37, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 1: 74%|███████▍ | 9159/12384 [19:26:01<6:49:58, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 1: 74%|███████▍ | 9159/12384 [19:26:08<6:49:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 74%|███████▍ | 9160/12384 [19:26:08<6:49:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 74%|███████▍ | 9160/12384 [19:26:16<6:49:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 74%|███████▍ | 9161/12384 [19:26:16<6:49:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 74%|███████▍ | 9161/12384 [19:26:24<6:49:27, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.49s]
Epoch 1: 74%|███████▍ | 9162/12384 [19:26:24<6:50:44, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=6.49s]
Epoch 1: 74%|███████▍ | 9162/12384 [19:26:31<6:50:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 1: 74%|███████▍ | 9163/12384 [19:26:31<6:50:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 1: 74%|███████▍ | 9163/12384 [19:26:39<6:50:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 74%|███████▍ | 9164/12384 [19:26:39<6:49:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 74%|███████▍ | 9164/12384 [19:26:46<6:49:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.05s]
Epoch 1: 74%|███████▍ | 9165/12384 [19:26:46<6:48:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.05s]
Epoch 1: 74%|███████▍ | 9165/12384 [19:26:54<6:48:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.56s]
Epoch 1: 74%|███████▍ | 9166/12384 [19:26:54<6:48:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.56s]
Epoch 1: 74%|███████▍ | 9166/12384 [19:27:02<6:48:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 74%|███████▍ | 9167/12384 [19:27:02<6:48:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 74%|███████▍ | 9167/12384 [19:27:09<6:48:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 74%|███████▍ | 9168/12384 [19:27:09<6:48:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 74%|███████▍ | 9168/12384 [19:27:17<6:48:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 74%|███████▍ | 9169/12384 [19:27:17<6:48:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 74%|███████▍ | 9169/12384 [19:27:24<6:48:00, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 1: 74%|███████▍ | 9170/12384 [19:27:24<6:47:41, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 1: 74%|███████▍ | 9170/12384 [19:27:32<6:47:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 74%|███████▍ | 9171/12384 [19:27:32<6:47:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 74%|███████▍ | 9171/12384 [19:27:40<6:47:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 74%|███████▍ | 9172/12384 [19:27:40<6:47:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 74%|███████▍ | 9172/12384 [19:27:47<6:47:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 74%|███████▍ | 9173/12384 [19:27:47<6:47:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 74%|███████▍ | 9173/12384 [19:27:55<6:47:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 74%|███████▍ | 9174/12384 [19:27:55<6:46:46, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 74%|███████▍ | 9174/12384 [19:28:02<6:46:46, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 74%|███████▍ | 9175/12384 [19:28:02<6:46:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 74%|███████▍ | 9175/12384 [19:28:10<6:46:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 74%|███████▍ | 9176/12384 [19:28:10<6:46:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 74%|███████▍ | 9176/12384 [19:28:18<6:46:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 74%|███████▍ | 9177/12384 [19:28:18<6:51:22, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 74%|███████▍ | 9177/12384 [19:28:26<6:51:22, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=6.39s]
Epoch 1: 74%|███████▍ | 9178/12384 [19:28:26<6:49:37, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=6.39s]
Epoch 1: 74%|███████▍ | 9178/12384 [19:28:34<6:49:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 1: 74%|███████▍ | 9179/12384 [19:28:34<6:54:12, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 1: 74%|███████▍ | 9179/12384 [19:28:41<6:54:12, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=4.33s]
Epoch 1: 74%|███████▍ | 9180/12384 [19:28:41<6:51:58, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=4.33s]
Epoch 1: 74%|███████▍ | 9180/12384 [19:28:49<6:51:58, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=11.20s]
Epoch 1: 74%|███████▍ | 9181/12384 [19:28:49<6:50:08, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=11.20s]
Epoch 1: 74%|███████▍ | 9181/12384 [19:28:56<6:50:08, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 1: 74%|███████▍ | 9182/12384 [19:28:56<6:48:59, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 1: 74%|███████▍ | 9182/12384 [19:29:04<6:48:59, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 74%|███████▍ | 9183/12384 [19:29:04<6:48:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 74%|███████▍ | 9183/12384 [19:29:12<6:48:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 74%|███████▍ | 9184/12384 [19:29:12<6:47:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 74%|███████▍ | 9184/12384 [19:29:19<6:47:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.78s]
Epoch 1: 74%|███████▍ | 9185/12384 [19:29:19<6:47:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.78s]
Epoch 1: 74%|███████▍ | 9185/12384 [19:29:27<6:47:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 1: 74%|███████▍ | 9186/12384 [19:29:27<6:46:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 1: 74%|███████▍ | 9186/12384 [19:29:34<6:46:18, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.65s]
Epoch 1: 74%|███████▍ | 9187/12384 [19:29:34<6:46:01, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.65s]
Epoch 1: 74%|███████▍ | 9187/12384 [19:29:42<6:46:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.01s]
Epoch 1: 74%|███████▍ | 9188/12384 [19:29:42<6:45:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.01s]
Epoch 1: 74%|███████▍ | 9188/12384 [19:29:50<6:45:47, 7.62s/it, loss=0.0009, acc=0.9947, iter_time=10.15s]
Epoch 1: 74%|███████▍ | 9189/12384 [19:29:50<6:45:07, 7.61s/it, loss=0.0009, acc=0.9947, iter_time=10.15s]
Epoch 1: 74%|███████▍ | 9189/12384 [19:29:57<6:45:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 74%|███████▍ | 9190/12384 [19:29:57<6:44:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 74%|███████▍ | 9190/12384 [19:30:05<6:44:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 1: 74%|███████▍ | 9191/12384 [19:30:05<6:44:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 1: 74%|███████▍ | 9191/12384 [19:30:13<6:44:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 1: 74%|███████▍ | 9192/12384 [19:30:13<6:46:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 1: 74%|███████▍ | 9192/12384 [19:30:20<6:46:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 74%|███████▍ | 9193/12384 [19:30:20<6:45:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 74%|███████▍ | 9193/12384 [19:30:28<6:45:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 74%|███████▍ | 9194/12384 [19:30:28<6:44:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 74%|███████▍ | 9194/12384 [19:30:35<6:44:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 74%|███████▍ | 9195/12384 [19:30:35<6:44:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 74%|███████▍ | 9195/12384 [19:30:43<6:44:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 74%|███████▍ | 9196/12384 [19:30:43<6:44:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 74%|███████▍ | 9196/12384 [19:30:51<6:44:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 74%|███████▍ | 9197/12384 [19:30:51<6:43:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 74%|███████▍ | 9197/12384 [19:30:58<6:43:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 74%|███████▍ | 9198/12384 [19:30:58<6:43:42, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 74%|███████▍ | 9198/12384 [19:31:06<6:43:42, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 74%|███████▍ | 9199/12384 [19:31:06<6:44:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 74%|███████▍ | 9199/12384 [19:31:13<6:44:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 74%|███████▍ | 9200/12384 [19:31:13<6:44:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 74%|███████▍ | 9200/12384 [19:31:21<6:44:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 74%|███████▍ | 9201/12384 [19:31:21<6:43:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 74%|███████▍ | 9201/12384 [19:31:29<6:43:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 1: 74%|███████▍ | 9202/12384 [19:31:29<6:43:12, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 1: 74%|███████▍ | 9202/12384 [19:31:36<6:43:12, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.38s]
Epoch 1: 74%|███████▍ | 9203/12384 [19:31:36<6:43:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.38s]
Epoch 1: 74%|███████▍ | 9203/12384 [19:31:44<6:43:16, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.59s]
Epoch 1: 74%|███████▍ | 9204/12384 [19:31:44<6:42:57, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=5.59s]
Epoch 1: 74%|███████▍ | 9204/12384 [19:31:52<6:42:57, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.46s]
Epoch 1: 74%|███████▍ | 9205/12384 [19:31:52<6:47:43, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.46s]
Epoch 1: 74%|███████▍ | 9205/12384 [19:31:59<6:47:43, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.12s]
Epoch 1: 74%|███████▍ | 9206/12384 [19:31:59<6:46:18, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.12s]
Epoch 1: 74%|███████▍ | 9206/12384 [19:32:07<6:46:18, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 1: 74%|███████▍ | 9207/12384 [19:32:07<6:45:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 1: 74%|███████▍ | 9207/12384 [19:32:15<6:45:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 1: 74%|███████▍ | 9208/12384 [19:32:15<6:44:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 1: 74%|███████▍ | 9208/12384 [19:32:22<6:44:20, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 1: 74%|███████▍ | 9209/12384 [19:32:22<6:43:55, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 1: 74%|███████▍ | 9209/12384 [19:32:30<6:43:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.01s]
Epoch 1: 74%|███████▍ | 9210/12384 [19:32:30<6:43:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.01s]
Epoch 1: 74%|███████▍ | 9210/12384 [19:32:37<6:43:27, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=11.20s]
Epoch 1: 74%|███████▍ | 9211/12384 [19:32:37<6:42:43, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=11.20s]
Epoch 1: 74%|███████▍ | 9211/12384 [19:32:45<6:42:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 1: 74%|███████▍ | 9212/12384 [19:32:45<6:36:41, 7.50s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 1: 74%|███████▍ | 9212/12384 [19:32:52<6:36:41, 7.50s/it, loss=0.0000, acc=1.0000, iter_time=9.04s]
Epoch 1: 74%|███████▍ | 9213/12384 [19:32:52<6:38:12, 7.53s/it, loss=0.0000, acc=1.0000, iter_time=9.04s]
Epoch 1: 74%|███████▍ | 9213/12384 [19:33:00<6:38:12, 7.53s/it, loss=0.0001, acc=1.0000, iter_time=7.03s]
Epoch 1: 74%|███████▍ | 9214/12384 [19:33:00<6:39:06, 7.55s/it, loss=0.0001, acc=1.0000, iter_time=7.03s]
Epoch 1: 74%|███████▍ | 9214/12384 [19:33:07<6:39:06, 7.55s/it, loss=0.0000, acc=1.0000, iter_time=4.89s]
Epoch 1: 74%|███████▍ | 9215/12384 [19:33:07<6:39:42, 7.57s/it, loss=0.0000, acc=1.0000, iter_time=4.89s]
Epoch 1: 74%|███████▍ | 9215/12384 [19:33:15<6:39:42, 7.57s/it, loss=0.0000, acc=1.0000, iter_time=11.31s]
Epoch 1: 74%|███████▍ | 9216/12384 [19:33:15<6:40:09, 7.58s/it, loss=0.0000, acc=1.0000, iter_time=11.31s]
Epoch 1: 74%|███████▍ | 9216/12384 [19:33:23<6:40:09, 7.58s/it, loss=0.0000, acc=1.0000, iter_time=7.18s]
Epoch 1: 74%|███████▍ | 9217/12384 [19:33:23<6:40:06, 7.58s/it, loss=0.0000, acc=1.0000, iter_time=7.18s]
Epoch 1: 74%|███████▍ | 9217/12384 [19:33:30<6:40:06, 7.58s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 74%|███████▍ | 9218/12384 [19:33:30<6:40:29, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 74%|███████▍ | 9218/12384 [19:33:38<6:40:29, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 74%|███████▍ | 9219/12384 [19:33:38<6:40:12, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 74%|███████▍ | 9219/12384 [19:33:45<6:40:12, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 1: 74%|███████▍ | 9220/12384 [19:33:45<6:40:28, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 1: 74%|███████▍ | 9220/12384 [19:33:53<6:40:28, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 1: 74%|███████▍ | 9221/12384 [19:33:53<6:41:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 1: 74%|███████▍ | 9221/12384 [19:34:01<6:41:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 74%|███████▍ | 9222/12384 [19:34:01<6:40:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 74%|███████▍ | 9222/12384 [19:34:08<6:40:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 74%|███████▍ | 9223/12384 [19:34:08<6:40:29, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 74%|███████▍ | 9223/12384 [19:34:16<6:40:29, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 74%|███████▍ | 9224/12384 [19:34:16<6:42:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 74%|███████▍ | 9224/12384 [19:34:24<6:42:17, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=6.47s]
Epoch 1: 74%|███████▍ | 9225/12384 [19:34:24<6:41:25, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=6.47s]
Epoch 1: 74%|███████▍ | 9225/12384 [19:34:31<6:41:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 1: 74%|███████▍ | 9226/12384 [19:34:31<6:41:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 1: 74%|███████▍ | 9226/12384 [19:34:39<6:41:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 75%|███████▍ | 9227/12384 [19:34:39<6:41:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 75%|███████▍ | 9227/12384 [19:34:46<6:41:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 75%|███████▍ | 9228/12384 [19:34:46<6:41:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 75%|███████▍ | 9228/12384 [19:34:54<6:41:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 75%|███████▍ | 9229/12384 [19:34:54<6:45:18, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 75%|███████▍ | 9229/12384 [19:35:02<6:45:18, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 75%|███████▍ | 9230/12384 [19:35:02<6:45:04, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 75%|███████▍ | 9230/12384 [19:35:10<6:45:04, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 1: 75%|███████▍ | 9231/12384 [19:35:10<6:43:33, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 1: 75%|███████▍ | 9231/12384 [19:35:18<6:43:33, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 75%|███████▍ | 9232/12384 [19:35:18<6:47:21, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 75%|███████▍ | 9232/12384 [19:35:25<6:47:21, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 1: 75%|███████▍ | 9233/12384 [19:35:25<6:44:51, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 1: 75%|███████▍ | 9233/12384 [19:35:33<6:44:51, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.66s]
Epoch 1: 75%|███████▍ | 9234/12384 [19:35:33<6:43:05, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.66s]
Epoch 1: 75%|███████▍ | 9234/12384 [19:35:40<6:43:05, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=8.21s]
Epoch 1: 75%|███████▍ | 9235/12384 [19:35:40<6:41:31, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.21s]
Epoch 1: 75%|███████▍ | 9235/12384 [19:35:48<6:41:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 1: 75%|███████▍ | 9236/12384 [19:35:48<6:40:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 1: 75%|███████▍ | 9236/12384 [19:35:56<6:40:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 75%|███████▍ | 9237/12384 [19:35:56<6:40:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 75%|███████▍ | 9237/12384 [19:36:03<6:40:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 75%|███████▍ | 9238/12384 [19:36:03<6:39:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 75%|███████▍ | 9238/12384 [19:36:11<6:39:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 75%|███████▍ | 9239/12384 [19:36:11<6:40:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 75%|███████▍ | 9239/12384 [19:36:19<6:40:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 75%|███████▍ | 9240/12384 [19:36:19<6:39:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 75%|███████▍ | 9240/12384 [19:36:26<6:39:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.23s]
Epoch 1: 75%|███████▍ | 9241/12384 [19:36:26<6:39:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.23s]
Epoch 1: 75%|███████▍ | 9241/12384 [19:36:34<6:39:07, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=11.66s]
Epoch 1: 75%|███████▍ | 9242/12384 [19:36:34<6:39:47, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=11.66s]
Epoch 1: 75%|███████▍ | 9242/12384 [19:36:41<6:39:47, 7.63s/it, loss=0.0003, acc=0.9973, iter_time=7.60s]
Epoch 1: 75%|███████▍ | 9243/12384 [19:36:41<6:39:07, 7.62s/it, loss=0.0003, acc=0.9973, iter_time=7.60s]
Epoch 1: 75%|███████▍ | 9243/12384 [19:36:49<6:39:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 75%|███████▍ | 9244/12384 [19:36:49<6:38:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 75%|███████▍ | 9244/12384 [19:36:57<6:38:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 75%|███████▍ | 9245/12384 [19:36:57<6:39:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 75%|███████▍ | 9245/12384 [19:37:04<6:39:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 75%|███████▍ | 9246/12384 [19:37:04<6:39:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 75%|███████▍ | 9246/12384 [19:37:12<6:39:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 75%|███████▍ | 9247/12384 [19:37:12<6:39:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 75%|███████▍ | 9247/12384 [19:37:20<6:39:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 1: 75%|███████▍ | 9248/12384 [19:37:20<6:38:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 1: 75%|███████▍ | 9248/12384 [19:37:27<6:38:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 1: 75%|███████▍ | 9249/12384 [19:37:27<6:38:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 1: 75%|███████▍ | 9249/12384 [19:37:35<6:38:13, 7.62s/it, loss=0.0030, acc=0.9984, iter_time=8.13s]
Epoch 1: 75%|███████▍ | 9250/12384 [19:37:35<6:37:50, 7.62s/it, loss=0.0030, acc=0.9984, iter_time=8.13s]
Epoch 1: 75%|███████▍ | 9250/12384 [19:37:42<6:37:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 1: 75%|███████▍ | 9251/12384 [19:37:42<6:37:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 1: 75%|███████▍ | 9251/12384 [19:37:50<6:37:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 75%|███████▍ | 9252/12384 [19:37:50<6:37:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 75%|███████▍ | 9252/12384 [19:37:58<6:37:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 75%|███████▍ | 9253/12384 [19:37:58<6:37:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 75%|███████▍ | 9253/12384 [19:38:05<6:37:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 75%|███████▍ | 9254/12384 [19:38:05<6:37:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 75%|███████▍ | 9254/12384 [19:38:13<6:37:21, 7.62s/it, loss=0.0001, acc=0.9992, iter_time=4.08s]
Epoch 1: 75%|███████▍ | 9255/12384 [19:38:13<6:37:12, 7.62s/it, loss=0.0001, acc=0.9992, iter_time=4.08s]
Epoch 1: 75%|███████▍ | 9255/12384 [19:38:21<6:37:12, 7.62s/it, loss=0.0002, acc=0.9981, iter_time=11.83s]
Epoch 1: 75%|███████▍ | 9256/12384 [19:38:21<6:41:28, 7.70s/it, loss=0.0002, acc=0.9981, iter_time=11.83s]
Epoch 1: 75%|███████▍ | 9256/12384 [19:38:28<6:41:28, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.87s]
Epoch 1: 75%|███████▍ | 9257/12384 [19:38:28<6:40:03, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.87s]
Epoch 1: 75%|███████▍ | 9257/12384 [19:38:36<6:40:03, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.99s]
Epoch 1: 75%|███████▍ | 9258/12384 [19:38:36<6:43:52, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=9.99s]
Epoch 1: 75%|███████▍ | 9258/12384 [19:38:44<6:43:52, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 75%|███████▍ | 9259/12384 [19:38:44<6:41:25, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 75%|███████▍ | 9259/12384 [19:38:52<6:41:25, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 75%|███████▍ | 9260/12384 [19:38:52<6:39:39, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 75%|███████▍ | 9260/12384 [19:38:59<6:39:39, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 1: 75%|███████▍ | 9261/12384 [19:38:59<6:38:44, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 1: 75%|███████▍ | 9261/12384 [19:39:07<6:38:44, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 75%|███████▍ | 9262/12384 [19:39:07<6:37:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 75%|███████▍ | 9262/12384 [19:39:14<6:37:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 75%|███████▍ | 9263/12384 [19:39:14<6:37:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 75%|███████▍ | 9263/12384 [19:39:22<6:37:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 75%|███████▍ | 9264/12384 [19:39:22<6:36:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 75%|███████▍ | 9264/12384 [19:39:30<6:36:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 1: 75%|███████▍ | 9265/12384 [19:39:30<6:36:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 1: 75%|███████▍ | 9265/12384 [19:39:37<6:36:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 1: 75%|███████▍ | 9266/12384 [19:39:37<6:35:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 1: 75%|███████▍ | 9266/12384 [19:39:45<6:35:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 75%|███████▍ | 9267/12384 [19:39:45<6:35:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 75%|███████▍ | 9267/12384 [19:39:52<6:35:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 1: 75%|███████▍ | 9268/12384 [19:39:52<6:35:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 1: 75%|███████▍ | 9268/12384 [19:40:00<6:35:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 1: 75%|███████▍ | 9269/12384 [19:40:00<6:34:42, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 1: 75%|███████▍ | 9269/12384 [19:40:08<6:34:42, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 75%|███████▍ | 9270/12384 [19:40:08<6:35:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 75%|███████▍ | 9270/12384 [19:40:15<6:35:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 1: 75%|███████▍ | 9271/12384 [19:40:15<6:35:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 1: 75%|███████▍ | 9271/12384 [19:40:23<6:35:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 75%|███████▍ | 9272/12384 [19:40:23<6:35:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 75%|███████▍ | 9272/12384 [19:40:30<6:35:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 75%|███████▍ | 9273/12384 [19:40:30<6:34:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 75%|███████▍ | 9273/12384 [19:40:38<6:34:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 75%|███████▍ | 9274/12384 [19:40:38<6:35:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 75%|███████▍ | 9274/12384 [19:40:46<6:35:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.15s]
Epoch 1: 75%|███████▍ | 9275/12384 [19:40:46<6:34:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.15s]
Epoch 1: 75%|███████▍ | 9275/12384 [19:40:53<6:34:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 1: 75%|███████▍ | 9276/12384 [19:40:53<6:34:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 1: 75%|███████▍ | 9276/12384 [19:41:01<6:34:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 75%|███████▍ | 9277/12384 [19:41:01<6:33:39, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 75%|███████▍ | 9277/12384 [19:41:08<6:33:39, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 75%|███████▍ | 9278/12384 [19:41:08<6:33:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 75%|███████▍ | 9278/12384 [19:41:16<6:33:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 1: 75%|███████▍ | 9279/12384 [19:41:16<6:33:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 1: 75%|███████▍ | 9279/12384 [19:41:24<6:33:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.37s]
Epoch 1: 75%|███████▍ | 9280/12384 [19:41:24<6:34:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.37s]
Epoch 1: 75%|███████▍ | 9280/12384 [19:41:31<6:34:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 75%|███████▍ | 9281/12384 [19:41:31<6:33:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 75%|███████▍ | 9281/12384 [19:41:39<6:33:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 75%|███████▍ | 9282/12384 [19:41:39<6:38:21, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 75%|███████▍ | 9282/12384 [19:41:47<6:38:21, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 75%|███████▍ | 9283/12384 [19:41:47<6:36:21, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 75%|███████▍ | 9283/12384 [19:41:54<6:36:21, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 75%|███████▍ | 9284/12384 [19:41:54<6:35:25, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 75%|███████▍ | 9284/12384 [19:42:02<6:35:25, 7.65s/it, loss=0.0000, acc=0.9996, iter_time=7.66s]
Epoch 1: 75%|███████▍ | 9285/12384 [19:42:02<6:40:03, 7.75s/it, loss=0.0000, acc=0.9996, iter_time=7.66s]
Epoch 1: 75%|███████▍ | 9285/12384 [19:42:10<6:40:03, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 75%|███████▍ | 9286/12384 [19:42:10<6:37:39, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 75%|███████▍ | 9286/12384 [19:42:18<6:37:39, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 75%|███████▍ | 9287/12384 [19:42:18<6:36:05, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 75%|███████▍ | 9287/12384 [19:42:25<6:36:05, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 75%|███████▌ | 9288/12384 [19:42:25<6:35:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 75%|███████▌ | 9288/12384 [19:42:33<6:35:05, 7.66s/it, loss=0.0014, acc=0.9952, iter_time=7.65s]
Epoch 1: 75%|███████▌ | 9289/12384 [19:42:33<6:34:13, 7.64s/it, loss=0.0014, acc=0.9952, iter_time=7.65s]
Epoch 1: 75%|███████▌ | 9289/12384 [19:42:40<6:34:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 75%|███████▌ | 9290/12384 [19:42:40<6:33:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 75%|███████▌ | 9290/12384 [19:42:48<6:33:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 1: 75%|███████▌ | 9291/12384 [19:42:48<6:33:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 1: 75%|███████▌ | 9291/12384 [19:42:56<6:33:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 1: 75%|███████▌ | 9292/12384 [19:42:56<6:32:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 1: 75%|███████▌ | 9292/12384 [19:43:03<6:32:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 75%|███████▌ | 9293/12384 [19:43:03<6:32:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 75%|███████▌ | 9293/12384 [19:43:11<6:32:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 1: 75%|███████▌ | 9294/12384 [19:43:11<6:33:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 1: 75%|███████▌ | 9294/12384 [19:43:19<6:33:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 1: 75%|███████▌ | 9295/12384 [19:43:19<6:32:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 1: 75%|███████▌ | 9295/12384 [19:43:26<6:32:49, 7.63s/it, loss=0.0002, acc=0.9983, iter_time=9.22s]
Epoch 1: 75%|███████▌ | 9296/12384 [19:43:26<6:32:29, 7.63s/it, loss=0.0002, acc=0.9983, iter_time=9.22s]
Epoch 1: 75%|███████▌ | 9296/12384 [19:43:34<6:32:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 75%|███████▌ | 9297/12384 [19:43:34<6:31:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 75%|███████▌ | 9297/12384 [19:43:41<6:31:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 75%|███████▌ | 9298/12384 [19:43:41<6:31:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 75%|███████▌ | 9298/12384 [19:43:49<6:31:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 75%|███████▌ | 9299/12384 [19:43:49<6:31:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 75%|███████▌ | 9299/12384 [19:43:57<6:31:52, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 1: 75%|███████▌ | 9300/12384 [19:43:57<6:31:31, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 1: 75%|███████▌ | 9300/12384 [19:44:04<6:31:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 1: 75%|███████▌ | 9301/12384 [19:44:04<6:30:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 1: 75%|███████▌ | 9301/12384 [19:44:12<6:30:46, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.67s]
Epoch 1: 75%|███████▌ | 9302/12384 [19:44:12<6:30:48, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.67s]
Epoch 1: 75%|███████▌ | 9302/12384 [19:44:20<6:30:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 75%|███████▌ | 9303/12384 [19:44:20<6:30:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 75%|███████▌ | 9303/12384 [19:44:27<6:30:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 75%|███████▌ | 9304/12384 [19:44:27<6:31:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 75%|███████▌ | 9304/12384 [19:44:35<6:31:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 75%|███████▌ | 9305/12384 [19:44:35<6:30:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 75%|███████▌ | 9305/12384 [19:44:42<6:30:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 1: 75%|███████▌ | 9306/12384 [19:44:42<6:30:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 1: 75%|███████▌ | 9306/12384 [19:44:50<6:30:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.11s]
Epoch 1: 75%|███████▌ | 9307/12384 [19:44:50<6:30:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.11s]
Epoch 1: 75%|███████▌ | 9307/12384 [19:44:58<6:30:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 1: 75%|███████▌ | 9308/12384 [19:44:58<6:30:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 1: 75%|███████▌ | 9308/12384 [19:45:05<6:30:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 1: 75%|███████▌ | 9309/12384 [19:45:05<6:34:14, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 1: 75%|███████▌ | 9309/12384 [19:45:13<6:34:14, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 75%|███████▌ | 9310/12384 [19:45:13<6:34:02, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 75%|███████▌ | 9310/12384 [19:45:21<6:34:02, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.76s]
Epoch 1: 75%|███████▌ | 9311/12384 [19:45:21<6:37:40, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.76s]
Epoch 1: 75%|███████▌ | 9311/12384 [19:45:29<6:37:40, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.82s]
Epoch 1: 75%|███████▌ | 9312/12384 [19:45:29<6:34:59, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.82s]
Epoch 1: 75%|███████▌ | 9312/12384 [19:45:36<6:34:59, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 75%|███████▌ | 9313/12384 [19:45:36<6:33:09, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 75%|███████▌ | 9313/12384 [19:45:44<6:33:09, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 75%|███████▌ | 9314/12384 [19:45:44<6:32:06, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 75%|███████▌ | 9314/12384 [19:45:52<6:32:06, 7.66s/it, loss=0.0010, acc=0.9980, iter_time=7.61s]
Epoch 1: 75%|███████▌ | 9315/12384 [19:45:52<6:31:20, 7.65s/it, loss=0.0010, acc=0.9980, iter_time=7.61s]
Epoch 1: 75%|███████▌ | 9315/12384 [19:45:59<6:31:20, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.03s]
Epoch 1: 75%|███████▌ | 9316/12384 [19:45:59<6:30:33, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.03s]
Epoch 1: 75%|███████▌ | 9316/12384 [19:46:07<6:30:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 75%|███████▌ | 9317/12384 [19:46:07<6:30:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 75%|███████▌ | 9317/12384 [19:46:14<6:30:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 75%|███████▌ | 9318/12384 [19:46:14<6:29:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 75%|███████▌ | 9318/12384 [19:46:22<6:29:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 75%|███████▌ | 9319/12384 [19:46:22<6:29:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 75%|███████▌ | 9319/12384 [19:46:30<6:29:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 75%|███████▌ | 9320/12384 [19:46:30<6:29:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 75%|███████▌ | 9320/12384 [19:46:37<6:29:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 75%|███████▌ | 9321/12384 [19:46:37<6:28:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 75%|███████▌ | 9321/12384 [19:46:45<6:28:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 1: 75%|███████▌ | 9322/12384 [19:46:45<6:28:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 1: 75%|███████▌ | 9322/12384 [19:46:52<6:28:35, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=8.73s]
Epoch 1: 75%|███████▌ | 9323/12384 [19:46:52<6:29:16, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=8.73s]
Epoch 1: 75%|███████▌ | 9323/12384 [19:47:00<6:29:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 75%|███████▌ | 9324/12384 [19:47:00<6:28:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 75%|███████▌ | 9324/12384 [19:47:08<6:28:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 75%|███████▌ | 9325/12384 [19:47:08<6:28:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 75%|███████▌ | 9325/12384 [19:47:15<6:28:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 75%|███████▌ | 9326/12384 [19:47:15<6:27:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 75%|███████▌ | 9326/12384 [19:47:23<6:27:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 75%|███████▌ | 9327/12384 [19:47:23<6:27:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 75%|███████▌ | 9327/12384 [19:47:31<6:27:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 75%|███████▌ | 9328/12384 [19:47:31<6:27:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 75%|███████▌ | 9328/12384 [19:47:38<6:27:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 75%|███████▌ | 9329/12384 [19:47:38<6:27:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 75%|███████▌ | 9329/12384 [19:47:46<6:27:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 1: 75%|███████▌ | 9330/12384 [19:47:46<6:27:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 1: 75%|███████▌ | 9330/12384 [19:47:53<6:27:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 75%|███████▌ | 9331/12384 [19:47:53<6:28:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 75%|███████▌ | 9331/12384 [19:48:01<6:28:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.59s]
Epoch 1: 75%|███████▌ | 9332/12384 [19:48:01<6:27:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.59s]
Epoch 1: 75%|███████▌ | 9332/12384 [19:48:09<6:27:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 75%|███████▌ | 9333/12384 [19:48:09<6:27:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 75%|███████▌ | 9333/12384 [19:48:16<6:27:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 1: 75%|███████▌ | 9334/12384 [19:48:16<6:27:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 1: 75%|███████▌ | 9334/12384 [19:48:24<6:27:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 75%|███████▌ | 9335/12384 [19:48:24<6:31:03, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 75%|███████▌ | 9335/12384 [19:48:32<6:31:03, 7.70s/it, loss=0.0000, acc=0.9999, iter_time=7.99s]
Epoch 1: 75%|███████▌ | 9336/12384 [19:48:32<6:29:46, 7.67s/it, loss=0.0000, acc=0.9999, iter_time=7.99s]
Epoch 1: 75%|███████▌ | 9336/12384 [19:48:40<6:29:46, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 1: 75%|███████▌ | 9337/12384 [19:48:40<6:33:59, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 1: 75%|███████▌ | 9337/12384 [19:48:47<6:33:59, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 1: 75%|███████▌ | 9338/12384 [19:48:47<6:33:00, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 1: 75%|███████▌ | 9338/12384 [19:48:55<6:33:00, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 1: 75%|███████▌ | 9339/12384 [19:48:55<6:30:58, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 1: 75%|███████▌ | 9339/12384 [19:49:03<6:30:58, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 75%|███████▌ | 9340/12384 [19:49:03<6:28:51, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 75%|███████▌ | 9340/12384 [19:49:10<6:28:51, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 75%|███████▌ | 9341/12384 [19:49:10<6:27:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 75%|███████▌ | 9341/12384 [19:49:18<6:27:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.59s]
Epoch 1: 75%|███████▌ | 9342/12384 [19:49:18<6:27:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.59s]
Epoch 1: 75%|███████▌ | 9342/12384 [19:49:25<6:27:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.83s]
Epoch 1: 75%|███████▌ | 9343/12384 [19:49:25<6:26:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.83s]
Epoch 1: 75%|███████▌ | 9343/12384 [19:49:33<6:26:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.81s]
Epoch 1: 75%|███████▌ | 9344/12384 [19:49:33<6:26:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.81s]
Epoch 1: 75%|███████▌ | 9344/12384 [19:49:41<6:26:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 75%|███████▌ | 9345/12384 [19:49:41<6:26:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 75%|███████▌ | 9345/12384 [19:49:48<6:26:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 1: 75%|███████▌ | 9346/12384 [19:49:48<6:26:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 1: 75%|███████▌ | 9346/12384 [19:49:56<6:26:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 75%|███████▌ | 9347/12384 [19:49:56<6:25:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 75%|███████▌ | 9347/12384 [19:50:04<6:25:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 1: 75%|███████▌ | 9348/12384 [19:50:04<6:26:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 1: 75%|███████▌ | 9348/12384 [19:50:11<6:26:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 75%|███████▌ | 9349/12384 [19:50:11<6:26:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 75%|███████▌ | 9349/12384 [19:50:19<6:26:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.51s]
Epoch 1: 76%|███████▌ | 9350/12384 [19:50:19<6:25:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.51s]
Epoch 1: 76%|███████▌ | 9350/12384 [19:50:26<6:25:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.70s]
Epoch 1: 76%|███████▌ | 9351/12384 [19:50:26<6:25:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.70s]
Epoch 1: 76%|███████▌ | 9351/12384 [19:50:34<6:25:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 76%|███████▌ | 9352/12384 [19:50:34<6:24:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 76%|███████▌ | 9352/12384 [19:50:42<6:24:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 76%|███████▌ | 9353/12384 [19:50:42<6:24:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 76%|███████▌ | 9353/12384 [19:50:49<6:24:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 76%|███████▌ | 9354/12384 [19:50:49<6:24:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 76%|███████▌ | 9354/12384 [19:50:57<6:24:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 76%|███████▌ | 9355/12384 [19:50:57<6:24:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 76%|███████▌ | 9355/12384 [19:51:05<6:24:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 1: 76%|███████▌ | 9356/12384 [19:51:05<6:24:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 1: 76%|███████▌ | 9356/12384 [19:51:12<6:24:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 1: 76%|███████▌ | 9357/12384 [19:51:12<6:23:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 1: 76%|███████▌ | 9357/12384 [19:51:20<6:23:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 76%|███████▌ | 9358/12384 [19:51:20<6:25:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 76%|███████▌ | 9358/12384 [19:51:27<6:25:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.80s]
Epoch 1: 76%|███████▌ | 9359/12384 [19:51:27<6:24:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.80s]
Epoch 1: 76%|███████▌ | 9359/12384 [19:51:35<6:24:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.83s]
Epoch 1: 76%|███████▌ | 9360/12384 [19:51:35<6:24:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.83s]
Epoch 1: 76%|███████▌ | 9360/12384 [19:51:43<6:24:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 76%|███████▌ | 9361/12384 [19:51:43<6:28:32, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 76%|███████▌ | 9361/12384 [19:51:51<6:28:32, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 76%|███████▌ | 9362/12384 [19:51:51<6:27:38, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 76%|███████▌ | 9362/12384 [19:51:59<6:27:38, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.76s]
Epoch 1: 76%|███████▌ | 9363/12384 [19:51:59<6:31:03, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=7.76s]
Epoch 1: 76%|███████▌ | 9363/12384 [19:52:06<6:31:03, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=5.99s]
Epoch 1: 76%|███████▌ | 9364/12384 [19:52:06<6:28:35, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.99s]
Epoch 1: 76%|███████▌ | 9364/12384 [19:52:14<6:28:35, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.58s]
Epoch 1: 76%|███████▌ | 9365/12384 [19:52:14<6:26:48, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.58s]
Epoch 1: 76%|███████▌ | 9365/12384 [19:52:21<6:26:48, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=11.84s]
Epoch 1: 76%|███████▌ | 9366/12384 [19:52:21<6:25:42, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=11.84s]
Epoch 1: 76%|███████▌ | 9366/12384 [19:52:29<6:25:42, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=3.91s]
Epoch 1: 76%|███████▌ | 9367/12384 [19:52:29<6:25:45, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=3.91s]
Epoch 1: 76%|███████▌ | 9367/12384 [19:52:37<6:25:45, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=11.34s]
Epoch 1: 76%|███████▌ | 9368/12384 [19:52:37<6:25:57, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=11.34s]
Epoch 1: 76%|███████▌ | 9368/12384 [19:52:44<6:25:57, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.20s]
Epoch 1: 76%|███████▌ | 9369/12384 [19:52:44<6:24:59, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.20s]
Epoch 1: 76%|███████▌ | 9369/12384 [19:52:52<6:24:59, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=10.74s]
Epoch 1: 76%|███████▌ | 9370/12384 [19:52:52<6:23:44, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=10.74s]
Epoch 1: 76%|███████▌ | 9370/12384 [19:53:00<6:23:44, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 1: 76%|███████▌ | 9371/12384 [19:53:00<6:23:15, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 1: 76%|███████▌ | 9371/12384 [19:53:07<6:23:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 76%|███████▌ | 9372/12384 [19:53:07<6:22:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 76%|███████▌ | 9372/12384 [19:53:15<6:22:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 76%|███████▌ | 9373/12384 [19:53:15<6:22:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 76%|███████▌ | 9373/12384 [19:53:22<6:22:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 76%|███████▌ | 9374/12384 [19:53:22<6:21:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 76%|███████▌ | 9374/12384 [19:53:30<6:21:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 1: 76%|███████▌ | 9375/12384 [19:53:30<6:21:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 1: 76%|███████▌ | 9375/12384 [19:53:38<6:21:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.82s]
Epoch 1: 76%|███████▌ | 9376/12384 [19:53:38<6:21:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.82s]
Epoch 1: 76%|███████▌ | 9376/12384 [19:53:45<6:21:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.99s]
Epoch 1: 76%|███████▌ | 9377/12384 [19:53:45<6:21:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.99s]
Epoch 1: 76%|███████▌ | 9377/12384 [19:53:53<6:21:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.84s]
Epoch 1: 76%|███████▌ | 9378/12384 [19:53:53<6:21:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.84s]
Epoch 1: 76%|███████▌ | 9378/12384 [19:54:00<6:21:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 76%|███████▌ | 9379/12384 [19:54:00<6:21:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 76%|███████▌ | 9379/12384 [19:54:08<6:21:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 1: 76%|███████▌ | 9380/12384 [19:54:08<6:21:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 1: 76%|███████▌ | 9380/12384 [19:54:16<6:21:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.95s]
Epoch 1: 76%|███████▌ | 9381/12384 [19:54:16<6:21:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.95s]
Epoch 1: 76%|███████▌ | 9381/12384 [19:54:23<6:21:16, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.87s]
Epoch 1: 76%|███████▌ | 9382/12384 [19:54:23<6:20:51, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.87s]
Epoch 1: 76%|███████▌ | 9382/12384 [19:54:31<6:20:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 76%|███████▌ | 9383/12384 [19:54:31<6:22:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 76%|███████▌ | 9383/12384 [19:54:39<6:22:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 1: 76%|███████▌ | 9384/12384 [19:54:39<6:22:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 1: 76%|███████▌ | 9384/12384 [19:54:46<6:22:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 76%|███████▌ | 9385/12384 [19:54:46<6:21:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 76%|███████▌ | 9385/12384 [19:54:54<6:21:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 76%|███████▌ | 9386/12384 [19:54:54<6:20:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 76%|███████▌ | 9386/12384 [19:55:02<6:20:55, 7.62s/it, loss=0.0001, acc=0.9992, iter_time=8.84s]
Epoch 1: 76%|███████▌ | 9387/12384 [19:55:02<6:24:54, 7.71s/it, loss=0.0001, acc=0.9992, iter_time=8.84s]
Epoch 1: 76%|███████▌ | 9387/12384 [19:55:09<6:24:54, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 76%|███████▌ | 9388/12384 [19:55:09<6:23:34, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 76%|███████▌ | 9388/12384 [19:55:17<6:23:34, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 76%|███████▌ | 9389/12384 [19:55:17<6:26:35, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 76%|███████▌ | 9389/12384 [19:55:25<6:26:35, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 76%|███████▌ | 9390/12384 [19:55:25<6:24:24, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 76%|███████▌ | 9390/12384 [19:55:32<6:24:24, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 1: 76%|███████▌ | 9391/12384 [19:55:32<6:23:01, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 1: 76%|███████▌ | 9391/12384 [19:55:40<6:23:01, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.19s]
Epoch 1: 76%|███████▌ | 9392/12384 [19:55:40<6:21:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.19s]
Epoch 1: 76%|███████▌ | 9392/12384 [19:55:48<6:21:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 76%|███████▌ | 9393/12384 [19:55:48<6:21:40, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 76%|███████▌ | 9393/12384 [19:55:55<6:21:40, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 76%|███████▌ | 9394/12384 [19:55:55<6:20:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 76%|███████▌ | 9394/12384 [19:56:03<6:20:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 76%|███████▌ | 9395/12384 [19:56:03<6:20:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 76%|███████▌ | 9395/12384 [19:56:11<6:20:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.55s]
Epoch 1: 76%|███████▌ | 9396/12384 [19:56:11<6:19:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.55s]
Epoch 1: 76%|███████▌ | 9396/12384 [19:56:18<6:19:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 1: 76%|███████▌ | 9397/12384 [19:56:18<6:19:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 1: 76%|███████▌ | 9397/12384 [19:56:26<6:19:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 1: 76%|███████▌ | 9398/12384 [19:56:26<6:20:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 1: 76%|███████▌ | 9398/12384 [19:56:33<6:20:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.84s]
Epoch 1: 76%|███████▌ | 9399/12384 [19:56:33<6:19:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.84s]
Epoch 1: 76%|███████▌ | 9399/12384 [19:56:41<6:19:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.11s]
Epoch 1: 76%|███████▌ | 9400/12384 [19:56:41<6:18:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.11s]
Epoch 1: 76%|███████▌ | 9400/12384 [19:56:49<6:18:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.26s]
Epoch 1: 76%|███████▌ | 9401/12384 [19:56:49<6:18:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.26s]
Epoch 1: 76%|███████▌ | 9401/12384 [19:56:56<6:18:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 1: 76%|███████▌ | 9402/12384 [19:56:56<6:18:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 1: 76%|███████▌ | 9402/12384 [19:57:04<6:18:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 76%|███████▌ | 9403/12384 [19:57:04<6:18:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 76%|███████▌ | 9403/12384 [19:57:11<6:18:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 76%|███████▌ | 9404/12384 [19:57:11<6:17:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 76%|███████▌ | 9404/12384 [19:57:19<6:17:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 76%|███████▌ | 9405/12384 [19:57:19<6:18:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 76%|███████▌ | 9405/12384 [19:57:27<6:18:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 76%|███████▌ | 9406/12384 [19:57:27<6:17:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 76%|███████▌ | 9406/12384 [19:57:34<6:17:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 76%|███████▌ | 9407/12384 [19:57:34<6:18:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 76%|███████▌ | 9407/12384 [19:57:42<6:18:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 76%|███████▌ | 9408/12384 [19:57:42<6:17:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 76%|███████▌ | 9408/12384 [19:57:50<6:17:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.65s]
Epoch 1: 76%|███████▌ | 9409/12384 [19:57:50<6:17:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.65s]
Epoch 1: 76%|███████▌ | 9409/12384 [19:57:57<6:17:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 1: 76%|███████▌ | 9410/12384 [19:57:57<6:17:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 1: 76%|███████▌ | 9410/12384 [19:58:05<6:17:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 76%|███████▌ | 9411/12384 [19:58:05<6:17:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 76%|███████▌ | 9411/12384 [19:58:12<6:17:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 1: 76%|███████▌ | 9412/12384 [19:58:12<6:17:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 1: 76%|███████▌ | 9412/12384 [19:58:20<6:17:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 76%|███████▌ | 9413/12384 [19:58:20<6:17:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 76%|███████▌ | 9413/12384 [19:58:28<6:17:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 76%|███████▌ | 9414/12384 [19:58:28<6:16:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 76%|███████▌ | 9414/12384 [19:58:35<6:16:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 1: 76%|███████▌ | 9415/12384 [19:58:35<6:16:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 1: 76%|███████▌ | 9415/12384 [19:58:43<6:16:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.56s]
Epoch 1: 76%|███████▌ | 9416/12384 [19:58:43<6:20:55, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.56s]
Epoch 1: 76%|███████▌ | 9416/12384 [19:58:51<6:20:55, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.59s]
Epoch 1: 76%|███████▌ | 9417/12384 [19:58:51<6:19:00, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.59s]
Epoch 1: 76%|███████▌ | 9417/12384 [19:58:58<6:19:00, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 76%|███████▌ | 9418/12384 [19:58:58<6:17:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 76%|███████▌ | 9418/12384 [19:59:06<6:17:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 76%|███████▌ | 9419/12384 [19:59:06<6:17:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 76%|███████▌ | 9419/12384 [19:59:14<6:17:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.92s]
Epoch 1: 76%|███████▌ | 9420/12384 [19:59:14<6:17:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.92s]
Epoch 1: 76%|███████▌ | 9420/12384 [19:59:21<6:17:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.25s]
Epoch 1: 76%|███████▌ | 9421/12384 [19:59:21<6:17:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.25s]
Epoch 1: 76%|███████▌ | 9421/12384 [19:59:29<6:17:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 1: 76%|███████▌ | 9422/12384 [19:59:29<6:16:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 1: 76%|███████▌ | 9422/12384 [19:59:37<6:16:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.75s]
Epoch 1: 76%|███████▌ | 9423/12384 [19:59:37<6:16:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.75s]
Epoch 1: 76%|███████▌ | 9423/12384 [19:59:44<6:16:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 76%|███████▌ | 9424/12384 [19:59:44<6:16:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 76%|███████▌ | 9424/12384 [19:59:52<6:16:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 1: 76%|███████▌ | 9425/12384 [19:59:52<6:15:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 1: 76%|███████▌ | 9425/12384 [19:59:59<6:15:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.22s]
Epoch 1: 76%|███████▌ | 9426/12384 [19:59:59<6:15:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.22s]
Epoch 1: 76%|███████▌ | 9426/12384 [20:00:07<6:15:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 1: 76%|███████▌ | 9427/12384 [20:00:07<6:14:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 1: 76%|███████▌ | 9427/12384 [20:00:15<6:14:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 76%|███████▌ | 9428/12384 [20:00:15<6:14:37, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 76%|███████▌ | 9428/12384 [20:00:22<6:14:37, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.21s]
Epoch 1: 76%|███████▌ | 9429/12384 [20:00:22<6:14:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.21s]
Epoch 1: 76%|███████▌ | 9429/12384 [20:00:30<6:14:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.97s]
Epoch 1: 76%|███████▌ | 9430/12384 [20:00:30<6:14:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.97s]
Epoch 1: 76%|███████▌ | 9430/12384 [20:00:37<6:14:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 76%|███████▌ | 9431/12384 [20:00:37<6:14:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 76%|███████▌ | 9431/12384 [20:00:45<6:14:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 76%|███████▌ | 9432/12384 [20:00:45<6:14:04, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 76%|███████▌ | 9432/12384 [20:00:53<6:14:04, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 1: 76%|███████▌ | 9433/12384 [20:00:53<6:14:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 1: 76%|███████▌ | 9433/12384 [20:01:00<6:14:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 1: 76%|███████▌ | 9434/12384 [20:01:00<6:14:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 1: 76%|███████▌ | 9434/12384 [20:01:08<6:14:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 76%|███████▌ | 9435/12384 [20:01:08<6:14:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 76%|███████▌ | 9435/12384 [20:01:15<6:14:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.42s]
Epoch 1: 76%|███████▌ | 9436/12384 [20:01:15<6:14:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.42s]
Epoch 1: 76%|███████▌ | 9436/12384 [20:01:23<6:14:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 1: 76%|███████▌ | 9437/12384 [20:01:23<6:14:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 1: 76%|███████▌ | 9437/12384 [20:01:31<6:14:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 1: 76%|███████▌ | 9438/12384 [20:01:31<6:15:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 1: 76%|███████▌ | 9438/12384 [20:01:38<6:15:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 1: 76%|███████▌ | 9439/12384 [20:01:38<6:14:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 1: 76%|███████▌ | 9439/12384 [20:01:46<6:14:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 76%|███████▌ | 9440/12384 [20:01:46<6:14:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 76%|███████▌ | 9440/12384 [20:01:54<6:14:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 76%|███████▌ | 9441/12384 [20:01:54<6:13:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 76%|███████▌ | 9441/12384 [20:02:02<6:13:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 1: 76%|███████▌ | 9442/12384 [20:02:02<6:18:32, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 1: 76%|███████▌ | 9442/12384 [20:02:09<6:18:32, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 1: 76%|███████▋ | 9443/12384 [20:02:09<6:16:54, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 1: 76%|███████▋ | 9443/12384 [20:02:17<6:16:54, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.61s]
Epoch 1: 76%|███████▋ | 9444/12384 [20:02:17<6:15:27, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.61s]
Epoch 1: 76%|███████▋ | 9444/12384 [20:02:24<6:15:27, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 76%|███████▋ | 9445/12384 [20:02:24<6:14:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 76%|███████▋ | 9445/12384 [20:02:32<6:14:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 76%|███████▋ | 9446/12384 [20:02:32<6:13:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 76%|███████▋ | 9446/12384 [20:02:40<6:13:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 76%|███████▋ | 9447/12384 [20:02:40<6:13:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 76%|███████▋ | 9447/12384 [20:02:47<6:13:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 76%|███████▋ | 9448/12384 [20:02:47<6:14:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 76%|███████▋ | 9448/12384 [20:02:55<6:14:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 76%|███████▋ | 9449/12384 [20:02:55<6:13:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 76%|███████▋ | 9449/12384 [20:03:03<6:13:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 76%|███████▋ | 9450/12384 [20:03:03<6:13:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 76%|███████▋ | 9450/12384 [20:03:10<6:13:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 76%|███████▋ | 9451/12384 [20:03:10<6:12:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 76%|███████▋ | 9451/12384 [20:03:18<6:12:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 76%|███████▋ | 9452/12384 [20:03:18<6:13:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 76%|███████▋ | 9452/12384 [20:03:25<6:13:33, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.69s]
Epoch 1: 76%|███████▋ | 9453/12384 [20:03:25<6:13:07, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.69s]
Epoch 1: 76%|███████▋ | 9453/12384 [20:03:33<6:13:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 1: 76%|███████▋ | 9454/12384 [20:03:33<6:12:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 1: 76%|███████▋ | 9454/12384 [20:03:41<6:12:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 76%|███████▋ | 9455/12384 [20:03:41<6:12:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 76%|███████▋ | 9455/12384 [20:03:48<6:12:10, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=8.01s]
Epoch 1: 76%|███████▋ | 9456/12384 [20:03:48<6:12:03, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=8.01s]
Epoch 1: 76%|███████▋ | 9456/12384 [20:03:56<6:12:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 76%|███████▋ | 9457/12384 [20:03:56<6:11:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 76%|███████▋ | 9457/12384 [20:04:04<6:11:48, 7.62s/it, loss=0.0001, acc=0.9994, iter_time=7.63s]
Epoch 1: 76%|███████▋ | 9458/12384 [20:04:04<6:11:34, 7.62s/it, loss=0.0001, acc=0.9994, iter_time=7.63s]
Epoch 1: 76%|███████▋ | 9458/12384 [20:04:11<6:11:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.45s]
Epoch 1: 76%|███████▋ | 9459/12384 [20:04:11<6:11:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.45s]
Epoch 1: 76%|███████▋ | 9459/12384 [20:04:19<6:11:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.77s]
Epoch 1: 76%|███████▋ | 9460/12384 [20:04:19<6:11:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.77s]
Epoch 1: 76%|███████▋ | 9460/12384 [20:04:26<6:11:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 1: 76%|███████▋ | 9461/12384 [20:04:26<6:10:24, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 1: 76%|███████▋ | 9461/12384 [20:04:34<6:10:24, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.39s]
Epoch 1: 76%|███████▋ | 9462/12384 [20:04:34<6:10:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.39s]
Epoch 1: 76%|███████▋ | 9462/12384 [20:04:42<6:10:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 1: 76%|███████▋ | 9463/12384 [20:04:42<6:10:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 1: 76%|███████▋ | 9463/12384 [20:04:49<6:10:42, 7.61s/it, loss=0.0002, acc=0.9991, iter_time=11.31s]
Epoch 1: 76%|███████▋ | 9464/12384 [20:04:49<6:10:16, 7.61s/it, loss=0.0002, acc=0.9991, iter_time=11.31s]
Epoch 1: 76%|███████▋ | 9464/12384 [20:04:57<6:10:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.02s]
Epoch 1: 76%|███████▋ | 9465/12384 [20:04:57<6:10:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.02s]
Epoch 1: 76%|███████▋ | 9465/12384 [20:05:05<6:10:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.51s]
Epoch 1: 76%|███████▋ | 9466/12384 [20:05:05<6:14:30, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.51s]
Epoch 1: 76%|███████▋ | 9466/12384 [20:05:12<6:14:30, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.40s]
Epoch 1: 76%|███████▋ | 9467/12384 [20:05:12<6:12:54, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.40s]
Epoch 1: 76%|███████▋ | 9467/12384 [20:05:20<6:12:54, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.87s]
Epoch 1: 76%|███████▋ | 9468/12384 [20:05:20<6:11:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.87s]
Epoch 1: 76%|███████▋ | 9468/12384 [20:05:28<6:11:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 1: 76%|███████▋ | 9469/12384 [20:05:28<6:15:57, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 1: 76%|███████▋ | 9469/12384 [20:05:35<6:15:57, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 76%|███████▋ | 9470/12384 [20:05:35<6:14:14, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 76%|███████▋ | 9470/12384 [20:05:43<6:14:14, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 1: 76%|███████▋ | 9471/12384 [20:05:43<6:12:53, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 1: 76%|███████▋ | 9471/12384 [20:05:51<6:12:53, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 76%|███████▋ | 9472/12384 [20:05:51<6:11:40, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 76%|███████▋ | 9472/12384 [20:05:58<6:11:40, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.17s]
Epoch 1: 76%|███████▋ | 9473/12384 [20:05:58<6:11:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.17s]
Epoch 1: 76%|███████▋ | 9473/12384 [20:06:06<6:11:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.78s]
Epoch 1: 77%|███████▋ | 9474/12384 [20:06:06<6:11:41, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.78s]
Epoch 1: 77%|███████▋ | 9474/12384 [20:06:14<6:11:41, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 77%|███████▋ | 9475/12384 [20:06:14<6:10:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 77%|███████▋ | 9475/12384 [20:06:21<6:10:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 77%|███████▋ | 9476/12384 [20:06:21<6:10:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 77%|███████▋ | 9476/12384 [20:06:29<6:10:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 77%|███████▋ | 9477/12384 [20:06:29<6:09:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 77%|███████▋ | 9477/12384 [20:06:36<6:09:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 77%|███████▋ | 9478/12384 [20:06:36<6:09:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 77%|███████▋ | 9478/12384 [20:06:44<6:09:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 1: 77%|███████▋ | 9479/12384 [20:06:44<6:08:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 1: 77%|███████▋ | 9479/12384 [20:06:52<6:08:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.32s]
Epoch 1: 77%|███████▋ | 9480/12384 [20:06:52<6:08:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.32s]
Epoch 1: 77%|███████▋ | 9480/12384 [20:06:59<6:08:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 77%|███████▋ | 9481/12384 [20:06:59<6:07:50, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 77%|███████▋ | 9481/12384 [20:07:07<6:07:50, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=3.99s]
Epoch 1: 77%|███████▋ | 9482/12384 [20:07:07<6:08:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.99s]
Epoch 1: 77%|███████▋ | 9482/12384 [20:07:14<6:08:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.23s]
Epoch 1: 77%|███████▋ | 9483/12384 [20:07:14<6:07:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.23s]
Epoch 1: 77%|███████▋ | 9483/12384 [20:07:22<6:07:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 77%|███████▋ | 9484/12384 [20:07:22<6:08:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 77%|███████▋ | 9484/12384 [20:07:30<6:08:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 77%|███████▋ | 9485/12384 [20:07:30<6:07:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 77%|███████▋ | 9485/12384 [20:07:37<6:07:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 77%|███████▋ | 9486/12384 [20:07:37<6:07:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 77%|███████▋ | 9486/12384 [20:07:45<6:07:55, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=7.64s]
Epoch 1: 77%|███████▋ | 9487/12384 [20:07:45<6:07:55, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=7.64s]
Epoch 1: 77%|███████▋ | 9487/12384 [20:07:53<6:07:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 77%|███████▋ | 9488/12384 [20:07:53<6:07:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 77%|███████▋ | 9488/12384 [20:08:00<6:07:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 77%|███████▋ | 9489/12384 [20:08:00<6:07:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 77%|███████▋ | 9489/12384 [20:08:08<6:07:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 77%|███████▋ | 9490/12384 [20:08:08<6:06:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 77%|███████▋ | 9490/12384 [20:08:15<6:06:57, 7.61s/it, loss=0.0005, acc=0.9989, iter_time=7.61s]
Epoch 1: 77%|███████▋ | 9491/12384 [20:08:15<6:06:49, 7.61s/it, loss=0.0005, acc=0.9989, iter_time=7.61s]
Epoch 1: 77%|███████▋ | 9491/12384 [20:08:23<6:06:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 77%|███████▋ | 9492/12384 [20:08:23<6:06:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 77%|███████▋ | 9492/12384 [20:08:31<6:06:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 1: 77%|███████▋ | 9493/12384 [20:08:31<6:06:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 1: 77%|███████▋ | 9493/12384 [20:08:38<6:06:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 1: 77%|███████▋ | 9494/12384 [20:08:38<6:06:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 1: 77%|███████▋ | 9494/12384 [20:08:46<6:06:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 77%|███████▋ | 9495/12384 [20:08:46<6:10:07, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 77%|███████▋ | 9495/12384 [20:08:54<6:10:07, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.80s]
Epoch 1: 77%|███████▋ | 9496/12384 [20:08:54<6:09:03, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.80s]
Epoch 1: 77%|███████▋ | 9496/12384 [20:09:01<6:09:03, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 1: 77%|███████▋ | 9497/12384 [20:09:01<6:07:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 1: 77%|███████▋ | 9497/12384 [20:09:09<6:07:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 77%|███████▋ | 9498/12384 [20:09:09<6:06:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 77%|███████▋ | 9498/12384 [20:09:16<6:06:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 1: 77%|███████▋ | 9499/12384 [20:09:16<6:06:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 1: 77%|███████▋ | 9499/12384 [20:09:24<6:06:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 1: 77%|███████▋ | 9500/12384 [20:09:24<6:06:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 1: 77%|███████▋ | 9500/12384 [20:09:32<6:06:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 77%|███████▋ | 9501/12384 [20:09:32<6:05:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 77%|███████▋ | 9501/12384 [20:09:39<6:05:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 77%|███████▋ | 9502/12384 [20:09:39<6:05:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 77%|███████▋ | 9502/12384 [20:09:47<6:05:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 77%|███████▋ | 9503/12384 [20:09:47<6:05:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 77%|███████▋ | 9503/12384 [20:09:55<6:05:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 77%|███████▋ | 9504/12384 [20:09:55<6:05:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 77%|███████▋ | 9504/12384 [20:10:02<6:05:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 77%|███████▋ | 9505/12384 [20:10:02<6:05:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 77%|███████▋ | 9505/12384 [20:10:10<6:05:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 77%|███████▋ | 9506/12384 [20:10:10<6:05:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 77%|███████▋ | 9506/12384 [20:10:17<6:05:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 77%|███████▋ | 9507/12384 [20:10:17<6:04:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 77%|███████▋ | 9507/12384 [20:10:25<6:04:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.78s]
Epoch 1: 77%|███████▋ | 9508/12384 [20:10:25<6:04:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.78s]
Epoch 1: 77%|███████▋ | 9508/12384 [20:10:33<6:04:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.41s]
Epoch 1: 77%|███████▋ | 9509/12384 [20:10:33<6:04:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.41s]
Epoch 1: 77%|███████▋ | 9509/12384 [20:10:40<6:04:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.66s]
Epoch 1: 77%|███████▋ | 9510/12384 [20:10:40<6:04:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.66s]
Epoch 1: 77%|███████▋ | 9510/12384 [20:10:48<6:04:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 77%|███████▋ | 9511/12384 [20:10:48<6:03:50, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 77%|███████▋ | 9511/12384 [20:10:55<6:03:50, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 77%|███████▋ | 9512/12384 [20:10:55<6:03:58, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 77%|███████▋ | 9512/12384 [20:11:03<6:03:58, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 77%|███████▋ | 9513/12384 [20:11:03<6:03:50, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 77%|███████▋ | 9513/12384 [20:11:11<6:03:50, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 1: 77%|███████▋ | 9514/12384 [20:11:11<6:04:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 1: 77%|███████▋ | 9514/12384 [20:11:18<6:04:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 1: 77%|███████▋ | 9515/12384 [20:11:18<6:03:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 1: 77%|███████▋ | 9515/12384 [20:11:26<6:03:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 1: 77%|███████▋ | 9516/12384 [20:11:26<6:04:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 1: 77%|███████▋ | 9516/12384 [20:11:34<6:04:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 77%|███████▋ | 9517/12384 [20:11:34<6:04:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 77%|███████▋ | 9517/12384 [20:11:41<6:04:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 1: 77%|███████▋ | 9518/12384 [20:11:41<6:04:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 1: 77%|███████▋ | 9518/12384 [20:11:49<6:04:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.02s]
Epoch 1: 77%|███████▋ | 9519/12384 [20:11:49<6:04:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.02s]
Epoch 1: 77%|███████▋ | 9519/12384 [20:11:56<6:04:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 1: 77%|███████▋ | 9520/12384 [20:11:56<6:04:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 1: 77%|███████▋ | 9520/12384 [20:12:04<6:04:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 77%|███████▋ | 9521/12384 [20:12:04<6:08:33, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 77%|███████▋ | 9521/12384 [20:12:12<6:08:33, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 77%|███████▋ | 9522/12384 [20:12:12<6:06:27, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 77%|███████▋ | 9522/12384 [20:12:20<6:06:27, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 1: 77%|███████▋ | 9523/12384 [20:12:20<6:05:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 1: 77%|███████▋ | 9523/12384 [20:12:27<6:05:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 77%|███████▋ | 9524/12384 [20:12:27<6:03:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 77%|███████▋ | 9524/12384 [20:12:35<6:03:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 77%|███████▋ | 9525/12384 [20:12:35<6:03:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 77%|███████▋ | 9525/12384 [20:12:42<6:03:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 77%|███████▋ | 9526/12384 [20:12:42<6:02:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 77%|███████▋ | 9526/12384 [20:12:50<6:02:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 1: 77%|███████▋ | 9527/12384 [20:12:50<6:02:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 1: 77%|███████▋ | 9527/12384 [20:12:58<6:02:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.11s]
Epoch 1: 77%|███████▋ | 9528/12384 [20:12:58<6:02:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.11s]
Epoch 1: 77%|███████▋ | 9528/12384 [20:13:05<6:02:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 1: 77%|███████▋ | 9529/12384 [20:13:05<6:02:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 1: 77%|███████▋ | 9529/12384 [20:13:13<6:02:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 77%|███████▋ | 9530/12384 [20:13:13<6:02:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 77%|███████▋ | 9530/12384 [20:13:20<6:02:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 77%|███████▋ | 9531/12384 [20:13:20<6:01:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 77%|███████▋ | 9531/12384 [20:13:28<6:01:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.26s]
Epoch 1: 77%|███████▋ | 9532/12384 [20:13:28<6:01:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.26s]
Epoch 1: 77%|███████▋ | 9532/12384 [20:13:36<6:01:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.72s]
Epoch 1: 77%|███████▋ | 9533/12384 [20:13:36<6:01:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.72s]
Epoch 1: 77%|███████▋ | 9533/12384 [20:13:43<6:01:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 1: 77%|███████▋ | 9534/12384 [20:13:43<6:01:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 1: 77%|███████▋ | 9534/12384 [20:13:51<6:01:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 77%|███████▋ | 9535/12384 [20:13:51<6:01:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 77%|███████▋ | 9535/12384 [20:13:58<6:01:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 77%|███████▋ | 9536/12384 [20:13:58<6:01:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 77%|███████▋ | 9536/12384 [20:14:06<6:01:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 77%|███████▋ | 9537/12384 [20:14:06<6:01:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 77%|███████▋ | 9537/12384 [20:14:14<6:01:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 1: 77%|███████▋ | 9538/12384 [20:14:14<6:00:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 1: 77%|███████▋ | 9538/12384 [20:14:21<6:00:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 77%|███████▋ | 9539/12384 [20:14:21<6:00:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 77%|███████▋ | 9539/12384 [20:14:29<6:00:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 1: 77%|███████▋ | 9540/12384 [20:14:29<6:00:27, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 1: 77%|███████▋ | 9540/12384 [20:14:36<6:00:27, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 1: 77%|███████▋ | 9541/12384 [20:14:36<6:00:16, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 1: 77%|███████▋ | 9541/12384 [20:14:44<6:00:16, 7.60s/it, loss=0.0006, acc=0.9979, iter_time=7.60s]
Epoch 1: 77%|███████▋ | 9542/12384 [20:14:44<6:00:13, 7.60s/it, loss=0.0006, acc=0.9979, iter_time=7.60s]
Epoch 1: 77%|███████▋ | 9542/12384 [20:14:52<6:00:13, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=5.81s]
Epoch 1: 77%|███████▋ | 9543/12384 [20:14:52<6:00:12, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.81s]
Epoch 1: 77%|███████▋ | 9543/12384 [20:14:59<6:00:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 1: 77%|███████▋ | 9544/12384 [20:14:59<6:00:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 1: 77%|███████▋ | 9544/12384 [20:15:07<6:00:16, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.93s]
Epoch 1: 77%|███████▋ | 9545/12384 [20:15:07<6:03:53, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.93s]
Epoch 1: 77%|███████▋ | 9545/12384 [20:15:15<6:03:53, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 1: 77%|███████▋ | 9546/12384 [20:15:15<6:02:55, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 1: 77%|███████▋ | 9546/12384 [20:15:23<6:02:55, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.88s]
Epoch 1: 77%|███████▋ | 9547/12384 [20:15:23<6:06:31, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=8.88s]
Epoch 1: 77%|███████▋ | 9547/12384 [20:15:30<6:06:31, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 1: 77%|███████▋ | 9548/12384 [20:15:30<6:04:18, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 1: 77%|███████▋ | 9548/12384 [20:15:38<6:04:18, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.55s]
Epoch 1: 77%|███████▋ | 9549/12384 [20:15:38<6:02:48, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.55s]
Epoch 1: 77%|███████▋ | 9549/12384 [20:15:46<6:02:48, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 1: 77%|███████▋ | 9550/12384 [20:15:46<6:01:43, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 1: 77%|███████▋ | 9550/12384 [20:15:53<6:01:43, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 77%|███████▋ | 9551/12384 [20:15:53<6:00:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 77%|███████▋ | 9551/12384 [20:16:01<6:00:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 1: 77%|███████▋ | 9552/12384 [20:16:01<6:00:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 1: 77%|███████▋ | 9552/12384 [20:16:08<6:00:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 77%|███████▋ | 9553/12384 [20:16:08<5:59:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 77%|███████▋ | 9553/12384 [20:16:16<5:59:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 77%|███████▋ | 9554/12384 [20:16:16<5:59:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 77%|███████▋ | 9554/12384 [20:16:24<5:59:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 77%|███████▋ | 9555/12384 [20:16:24<5:58:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 77%|███████▋ | 9555/12384 [20:16:31<5:58:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 1: 77%|███████▋ | 9556/12384 [20:16:31<5:58:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 1: 77%|███████▋ | 9556/12384 [20:16:39<5:58:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 77%|███████▋ | 9557/12384 [20:16:39<5:58:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 77%|███████▋ | 9557/12384 [20:16:46<5:58:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 1: 77%|███████▋ | 9558/12384 [20:16:46<5:58:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 1: 77%|███████▋ | 9558/12384 [20:16:54<5:58:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 1: 77%|███████▋ | 9559/12384 [20:16:54<5:58:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 1: 77%|███████▋ | 9559/12384 [20:17:02<5:58:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 1: 77%|███████▋ | 9560/12384 [20:17:02<5:57:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 1: 77%|███████▋ | 9560/12384 [20:17:09<5:57:59, 7.61s/it, loss=0.0002, acc=0.9998, iter_time=5.38s]
Epoch 1: 77%|███████▋ | 9561/12384 [20:17:09<5:58:22, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=5.38s]
Epoch 1: 77%|███████▋ | 9561/12384 [20:17:17<5:58:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 1: 77%|███████▋ | 9562/12384 [20:17:17<5:58:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 1: 77%|███████▋ | 9562/12384 [20:17:24<5:58:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 77%|███████▋ | 9563/12384 [20:17:24<5:58:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 77%|███████▋ | 9563/12384 [20:17:32<5:58:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 1: 77%|███████▋ | 9564/12384 [20:17:32<5:57:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 1: 77%|███████▋ | 9564/12384 [20:17:40<5:57:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 77%|███████▋ | 9565/12384 [20:17:40<5:58:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 77%|███████▋ | 9565/12384 [20:17:47<5:58:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 1: 77%|███████▋ | 9566/12384 [20:17:47<5:57:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 1: 77%|███████▋ | 9566/12384 [20:17:55<5:57:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.28s]
Epoch 1: 77%|███████▋ | 9567/12384 [20:17:55<5:57:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.28s]
Epoch 1: 77%|███████▋ | 9567/12384 [20:18:03<5:57:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.91s]
Epoch 1: 77%|███████▋ | 9568/12384 [20:18:03<5:57:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.91s]
Epoch 1: 77%|███████▋ | 9568/12384 [20:18:10<5:57:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.37s]
Epoch 1: 77%|███████▋ | 9569/12384 [20:18:10<5:57:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.37s]
Epoch 1: 77%|███████▋ | 9569/12384 [20:18:18<5:57:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.50s]
Epoch 1: 77%|███████▋ | 9570/12384 [20:18:18<5:57:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.50s]
Epoch 1: 77%|███████▋ | 9570/12384 [20:18:25<5:57:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.06s]
Epoch 1: 77%|███████▋ | 9571/12384 [20:18:25<5:57:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.06s]
Epoch 1: 77%|███████▋ | 9571/12384 [20:18:33<5:57:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 1: 77%|███████▋ | 9572/12384 [20:18:33<5:56:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 1: 77%|███████▋ | 9572/12384 [20:18:41<5:56:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 1: 77%|███████▋ | 9573/12384 [20:18:41<6:00:46, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 1: 77%|███████▋ | 9573/12384 [20:18:49<6:00:46, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 77%|███████▋ | 9574/12384 [20:18:49<5:59:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 77%|███████▋ | 9574/12384 [20:18:56<5:59:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.73s]
Epoch 1: 77%|███████▋ | 9575/12384 [20:18:56<5:58:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.73s]
Epoch 1: 77%|███████▋ | 9575/12384 [20:19:04<5:58:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.86s]
Epoch 1: 77%|███████▋ | 9576/12384 [20:19:04<5:57:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.86s]
Epoch 1: 77%|███████▋ | 9576/12384 [20:19:11<5:57:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.12s]
Epoch 1: 77%|███████▋ | 9577/12384 [20:19:11<5:57:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.12s]
Epoch 1: 77%|███████▋ | 9577/12384 [20:19:19<5:57:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 1: 77%|███████▋ | 9578/12384 [20:19:19<5:56:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 1: 77%|███████▋ | 9578/12384 [20:19:27<5:56:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 1: 77%|███████▋ | 9579/12384 [20:19:27<5:56:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 1: 77%|███████▋ | 9579/12384 [20:19:34<5:56:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 1: 77%|███████▋ | 9580/12384 [20:19:34<5:56:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 1: 77%|███████▋ | 9580/12384 [20:19:42<5:56:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.89s]
Epoch 1: 77%|███████▋ | 9581/12384 [20:19:42<5:56:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.89s]
Epoch 1: 77%|███████▋ | 9581/12384 [20:19:49<5:56:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 77%|███████▋ | 9582/12384 [20:19:49<5:56:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 77%|███████▋ | 9582/12384 [20:19:57<5:56:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 77%|███████▋ | 9583/12384 [20:19:57<5:55:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 77%|███████▋ | 9583/12384 [20:20:05<5:55:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.72s]
Epoch 1: 77%|███████▋ | 9584/12384 [20:20:05<5:55:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.72s]
Epoch 1: 77%|███████▋ | 9584/12384 [20:20:12<5:55:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 77%|███████▋ | 9585/12384 [20:20:12<5:55:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 77%|███████▋ | 9585/12384 [20:20:20<5:55:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 77%|███████▋ | 9586/12384 [20:20:20<5:54:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 77%|███████▋ | 9586/12384 [20:20:28<5:54:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 77%|███████▋ | 9587/12384 [20:20:28<5:54:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 77%|███████▋ | 9587/12384 [20:20:35<5:54:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 1: 77%|███████▋ | 9588/12384 [20:20:35<5:54:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 1: 77%|███████▋ | 9588/12384 [20:20:43<5:54:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.22s]
Epoch 1: 77%|███████▋ | 9589/12384 [20:20:43<5:54:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.22s]
Epoch 1: 77%|███████▋ | 9589/12384 [20:20:50<5:54:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 1: 77%|███████▋ | 9590/12384 [20:20:50<5:54:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 1: 77%|███████▋ | 9590/12384 [20:20:58<5:54:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 1: 77%|███████▋ | 9591/12384 [20:20:58<5:54:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 1: 77%|███████▋ | 9591/12384 [20:21:06<5:54:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.02s]
Epoch 1: 77%|███████▋ | 9592/12384 [20:21:06<5:54:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.02s]
Epoch 1: 77%|███████▋ | 9592/12384 [20:21:13<5:54:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.48s]
Epoch 1: 77%|███████▋ | 9593/12384 [20:21:13<5:53:43, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.48s]
Epoch 1: 77%|███████▋ | 9593/12384 [20:21:21<5:53:43, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 77%|███████▋ | 9594/12384 [20:21:21<5:55:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 77%|███████▋ | 9594/12384 [20:21:28<5:55:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 77%|███████▋ | 9595/12384 [20:21:28<5:54:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 77%|███████▋ | 9595/12384 [20:21:36<5:54:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 77%|███████▋ | 9596/12384 [20:21:36<5:54:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 77%|███████▋ | 9596/12384 [20:21:44<5:54:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 77%|███████▋ | 9597/12384 [20:21:44<5:55:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 77%|███████▋ | 9597/12384 [20:21:51<5:55:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.60s]
Epoch 1: 78%|███████▊ | 9598/12384 [20:21:51<5:54:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.60s]
Epoch 1: 78%|███████▊ | 9598/12384 [20:21:59<5:54:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.66s]
Epoch 1: 78%|███████▊ | 9599/12384 [20:21:59<5:53:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.66s]
Epoch 1: 78%|███████▊ | 9599/12384 [20:22:07<5:53:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 1: 78%|███████▊ | 9600/12384 [20:22:07<5:57:36, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 1: 78%|███████▊ | 9600/12384 [20:22:15<5:57:36, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.45s]
Epoch 1: 78%|███████▊ | 9601/12384 [20:22:15<5:56:07, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.45s]
Epoch 1: 78%|███████▊ | 9601/12384 [20:22:22<5:56:07, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 78%|███████▊ | 9602/12384 [20:22:22<5:55:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 78%|███████▊ | 9602/12384 [20:22:30<5:55:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=3.66s]
Epoch 1: 78%|███████▊ | 9603/12384 [20:22:30<5:54:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.66s]
Epoch 1: 78%|███████▊ | 9603/12384 [20:22:37<5:54:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.54s]
Epoch 1: 78%|███████▊ | 9604/12384 [20:22:37<5:53:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.54s]
Epoch 1: 78%|███████▊ | 9604/12384 [20:22:45<5:53:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 1: 78%|███████▊ | 9605/12384 [20:22:45<5:53:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 1: 78%|███████▊ | 9605/12384 [20:22:53<5:53:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 1: 78%|███████▊ | 9606/12384 [20:22:53<5:52:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 1: 78%|███████▊ | 9606/12384 [20:23:00<5:52:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 78%|███████▊ | 9607/12384 [20:23:00<5:52:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 78%|███████▊ | 9607/12384 [20:23:08<5:52:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.92s]
Epoch 1: 78%|███████▊ | 9608/12384 [20:23:08<5:52:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.92s]
Epoch 1: 78%|███████▊ | 9608/12384 [20:23:15<5:52:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 78%|███████▊ | 9609/12384 [20:23:15<5:51:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 78%|███████▊ | 9609/12384 [20:23:23<5:51:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 78%|███████▊ | 9610/12384 [20:23:23<5:51:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 78%|███████▊ | 9610/12384 [20:23:31<5:51:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 1: 78%|███████▊ | 9611/12384 [20:23:31<5:51:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 1: 78%|███████▊ | 9611/12384 [20:23:38<5:51:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 78%|███████▊ | 9612/12384 [20:23:38<5:51:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 78%|███████▊ | 9612/12384 [20:23:46<5:51:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 1: 78%|███████▊ | 9613/12384 [20:23:46<5:51:10, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 1: 78%|███████▊ | 9613/12384 [20:23:53<5:51:10, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.44s]
Epoch 1: 78%|███████▊ | 9614/12384 [20:23:53<5:51:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.44s]
Epoch 1: 78%|███████▊ | 9614/12384 [20:24:01<5:51:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 78%|███████▊ | 9615/12384 [20:24:01<5:50:52, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 78%|███████▊ | 9615/12384 [20:24:09<5:50:52, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 78%|███████▊ | 9616/12384 [20:24:09<5:53:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 78%|███████▊ | 9616/12384 [20:24:16<5:53:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.53s]
Epoch 1: 78%|███████▊ | 9617/12384 [20:24:16<5:52:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.53s]
Epoch 1: 78%|███████▊ | 9617/12384 [20:24:24<5:52:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.49s]
Epoch 1: 78%|███████▊ | 9618/12384 [20:24:24<5:51:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.49s]
Epoch 1: 78%|███████▊ | 9618/12384 [20:24:32<5:51:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 78%|███████▊ | 9619/12384 [20:24:32<5:51:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 78%|███████▊ | 9619/12384 [20:24:39<5:51:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 78%|███████▊ | 9620/12384 [20:24:39<5:51:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 78%|███████▊ | 9620/12384 [20:24:47<5:51:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 78%|███████▊ | 9621/12384 [20:24:47<5:52:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 78%|███████▊ | 9621/12384 [20:24:55<5:52:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.22s]
Epoch 1: 78%|███████▊ | 9622/12384 [20:24:55<5:51:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.22s]
Epoch 1: 78%|███████▊ | 9622/12384 [20:25:02<5:51:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 78%|███████▊ | 9623/12384 [20:25:02<5:51:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 78%|███████▊ | 9623/12384 [20:25:10<5:51:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 1: 78%|███████▊ | 9624/12384 [20:25:10<5:50:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 1: 78%|███████▊ | 9624/12384 [20:25:17<5:50:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 78%|███████▊ | 9625/12384 [20:25:17<5:50:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 78%|███████▊ | 9625/12384 [20:25:25<5:50:20, 7.62s/it, loss=0.0004, acc=0.9976, iter_time=7.41s]
Epoch 1: 78%|███████▊ | 9626/12384 [20:25:25<5:54:52, 7.72s/it, loss=0.0004, acc=0.9976, iter_time=7.41s]
Epoch 1: 78%|███████▊ | 9626/12384 [20:25:33<5:54:52, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 1: 78%|███████▊ | 9627/12384 [20:25:33<5:52:57, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 1: 78%|███████▊ | 9627/12384 [20:25:41<5:52:57, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 1: 78%|███████▊ | 9628/12384 [20:25:41<5:51:48, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 1: 78%|███████▊ | 9628/12384 [20:25:48<5:51:48, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 78%|███████▊ | 9629/12384 [20:25:48<5:50:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 78%|███████▊ | 9629/12384 [20:25:56<5:50:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 78%|███████▊ | 9630/12384 [20:25:56<5:50:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 78%|███████▊ | 9630/12384 [20:26:03<5:50:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.45s]
Epoch 1: 78%|███████▊ | 9631/12384 [20:26:03<5:50:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.45s]
Epoch 1: 78%|███████▊ | 9631/12384 [20:26:11<5:50:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=12.18s]
Epoch 1: 78%|███████▊ | 9632/12384 [20:26:11<5:49:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=12.18s]
Epoch 1: 78%|███████▊ | 9632/12384 [20:26:19<5:49:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 78%|███████▊ | 9633/12384 [20:26:19<5:49:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 78%|███████▊ | 9633/12384 [20:26:26<5:49:20, 7.62s/it, loss=0.0002, acc=0.9988, iter_time=6.96s]
Epoch 1: 78%|███████▊ | 9634/12384 [20:26:26<5:48:57, 7.61s/it, loss=0.0002, acc=0.9988, iter_time=6.96s]
Epoch 1: 78%|███████▊ | 9634/12384 [20:26:34<5:48:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.92s]
Epoch 1: 78%|███████▊ | 9635/12384 [20:26:34<5:49:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.92s]
Epoch 1: 78%|███████▊ | 9635/12384 [20:26:42<5:49:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 78%|███████▊ | 9636/12384 [20:26:42<5:49:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 78%|███████▊ | 9636/12384 [20:26:49<5:49:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.41s]
Epoch 1: 78%|███████▊ | 9637/12384 [20:26:49<5:49:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.41s]
Epoch 1: 78%|███████▊ | 9637/12384 [20:26:57<5:49:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 1: 78%|███████▊ | 9638/12384 [20:26:57<5:48:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 1: 78%|███████▊ | 9638/12384 [20:27:04<5:48:45, 7.62s/it, loss=0.0001, acc=0.9990, iter_time=7.60s]
Epoch 1: 78%|███████▊ | 9639/12384 [20:27:04<5:48:42, 7.62s/it, loss=0.0001, acc=0.9990, iter_time=7.60s]
Epoch 1: 78%|███████▊ | 9639/12384 [20:27:12<5:48:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 78%|███████▊ | 9640/12384 [20:27:12<5:48:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 78%|███████▊ | 9640/12384 [20:27:20<5:48:33, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.50s]
Epoch 1: 78%|███████▊ | 9641/12384 [20:27:20<5:48:09, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.50s]
Epoch 1: 78%|███████▊ | 9641/12384 [20:27:27<5:48:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.32s]
Epoch 1: 78%|███████▊ | 9642/12384 [20:27:27<5:47:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.32s]
Epoch 1: 78%|███████▊ | 9642/12384 [20:27:35<5:47:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 1: 78%|███████▊ | 9643/12384 [20:27:35<5:47:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 1: 78%|███████▊ | 9643/12384 [20:27:42<5:47:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 1: 78%|███████▊ | 9644/12384 [20:27:42<5:47:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 1: 78%|███████▊ | 9644/12384 [20:27:50<5:47:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 78%|███████▊ | 9645/12384 [20:27:50<5:47:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 78%|███████▊ | 9645/12384 [20:27:58<5:47:30, 7.61s/it, loss=0.0001, acc=0.9993, iter_time=7.60s]
Epoch 1: 78%|███████▊ | 9646/12384 [20:27:58<5:47:10, 7.61s/it, loss=0.0001, acc=0.9993, iter_time=7.60s]
Epoch 1: 78%|███████▊ | 9646/12384 [20:28:05<5:47:10, 7.61s/it, loss=0.0005, acc=0.9977, iter_time=7.59s]
Epoch 1: 78%|███████▊ | 9647/12384 [20:28:05<5:47:16, 7.61s/it, loss=0.0005, acc=0.9977, iter_time=7.59s]
Epoch 1: 78%|███████▊ | 9647/12384 [20:28:13<5:47:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 78%|███████▊ | 9648/12384 [20:28:13<5:47:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 78%|███████▊ | 9648/12384 [20:28:20<5:47:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.59s]
Epoch 1: 78%|███████▊ | 9649/12384 [20:28:20<5:46:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.59s]
Epoch 1: 78%|███████▊ | 9649/12384 [20:28:28<5:46:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 1: 78%|███████▊ | 9650/12384 [20:28:28<5:46:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 1: 78%|███████▊ | 9650/12384 [20:28:36<5:46:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 78%|███████▊ | 9651/12384 [20:28:36<5:46:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 78%|███████▊ | 9651/12384 [20:28:43<5:46:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 78%|███████▊ | 9652/12384 [20:28:43<5:47:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 78%|███████▊ | 9652/12384 [20:28:51<5:47:49, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.78s]
Epoch 1: 78%|███████▊ | 9653/12384 [20:28:51<5:51:45, 7.73s/it, loss=0.0002, acc=1.0000, iter_time=7.78s]
Epoch 1: 78%|███████▊ | 9653/12384 [20:28:59<5:51:45, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 1: 78%|███████▊ | 9654/12384 [20:28:59<5:49:52, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 1: 78%|███████▊ | 9654/12384 [20:29:07<5:49:52, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 1: 78%|███████▊ | 9655/12384 [20:29:07<5:48:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 1: 78%|███████▊ | 9655/12384 [20:29:14<5:48:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 1: 78%|███████▊ | 9656/12384 [20:29:14<5:47:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 1: 78%|███████▊ | 9656/12384 [20:29:22<5:47:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 78%|███████▊ | 9657/12384 [20:29:22<5:47:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 78%|███████▊ | 9657/12384 [20:29:29<5:47:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 78%|███████▊ | 9658/12384 [20:29:29<5:46:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 78%|███████▊ | 9658/12384 [20:29:37<5:46:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 78%|███████▊ | 9659/12384 [20:29:37<5:46:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 78%|███████▊ | 9659/12384 [20:29:45<5:46:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 1: 78%|███████▊ | 9660/12384 [20:29:45<5:46:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 1: 78%|███████▊ | 9660/12384 [20:29:52<5:46:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 1: 78%|███████▊ | 9661/12384 [20:29:52<5:45:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 1: 78%|███████▊ | 9661/12384 [20:30:00<5:45:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 78%|███████▊ | 9662/12384 [20:30:00<5:45:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 78%|███████▊ | 9662/12384 [20:30:07<5:45:25, 7.61s/it, loss=0.0005, acc=0.9987, iter_time=7.63s]
Epoch 1: 78%|███████▊ | 9663/12384 [20:30:07<5:45:09, 7.61s/it, loss=0.0005, acc=0.9987, iter_time=7.63s]
Epoch 1: 78%|███████▊ | 9663/12384 [20:30:15<5:45:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 1: 78%|███████▊ | 9664/12384 [20:30:15<5:46:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 1: 78%|███████▊ | 9664/12384 [20:30:23<5:46:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 78%|███████▊ | 9665/12384 [20:30:23<5:46:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 78%|███████▊ | 9665/12384 [20:30:30<5:46:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 78%|███████▊ | 9666/12384 [20:30:30<5:45:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 78%|███████▊ | 9666/12384 [20:30:38<5:45:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.36s]
Epoch 1: 78%|███████▊ | 9667/12384 [20:30:38<5:45:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.36s]
Epoch 1: 78%|███████▊ | 9667/12384 [20:30:46<5:45:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 1: 78%|███████▊ | 9668/12384 [20:30:46<5:44:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 1: 78%|███████▊ | 9668/12384 [20:30:53<5:44:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 78%|███████▊ | 9669/12384 [20:30:53<5:44:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 78%|███████▊ | 9669/12384 [20:31:01<5:44:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 78%|███████▊ | 9670/12384 [20:31:01<5:44:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 78%|███████▊ | 9670/12384 [20:31:09<5:44:12, 7.61s/it, loss=0.0004, acc=0.9965, iter_time=5.36s]
Epoch 1: 78%|███████▊ | 9671/12384 [20:31:09<5:45:42, 7.65s/it, loss=0.0004, acc=0.9965, iter_time=5.36s]
Epoch 1: 78%|███████▊ | 9671/12384 [20:31:16<5:45:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.87s]
Epoch 1: 78%|███████▊ | 9672/12384 [20:31:16<5:45:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.87s]
Epoch 1: 78%|███████▊ | 9672/12384 [20:31:24<5:45:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 78%|███████▊ | 9673/12384 [20:31:24<5:44:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 78%|███████▊ | 9673/12384 [20:31:31<5:44:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 1: 78%|███████▊ | 9674/12384 [20:31:31<5:44:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 1: 78%|███████▊ | 9674/12384 [20:31:39<5:44:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 1: 78%|███████▊ | 9675/12384 [20:31:39<5:45:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 1: 78%|███████▊ | 9675/12384 [20:31:47<5:45:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.83s]
Epoch 1: 78%|███████▊ | 9676/12384 [20:31:47<5:47:59, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.83s]
Epoch 1: 78%|███████▊ | 9676/12384 [20:31:55<5:47:59, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 78%|███████▊ | 9677/12384 [20:31:55<5:46:22, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 78%|███████▊ | 9677/12384 [20:32:02<5:46:22, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 1: 78%|███████▊ | 9678/12384 [20:32:02<5:45:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 1: 78%|███████▊ | 9678/12384 [20:32:10<5:45:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 1: 78%|███████▊ | 9679/12384 [20:32:10<5:48:45, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 1: 78%|███████▊ | 9679/12384 [20:32:18<5:48:45, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 1: 78%|███████▊ | 9680/12384 [20:32:18<5:47:07, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 1: 78%|███████▊ | 9680/12384 [20:32:25<5:47:07, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 78%|███████▊ | 9681/12384 [20:32:25<5:46:04, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 78%|███████▊ | 9681/12384 [20:32:33<5:46:04, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 78%|███████▊ | 9682/12384 [20:32:33<5:44:53, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 78%|███████▊ | 9682/12384 [20:32:41<5:44:53, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 78%|███████▊ | 9683/12384 [20:32:41<5:44:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 78%|███████▊ | 9683/12384 [20:32:48<5:44:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 78%|███████▊ | 9684/12384 [20:32:48<5:43:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 78%|███████▊ | 9684/12384 [20:32:56<5:43:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 78%|███████▊ | 9685/12384 [20:32:56<5:43:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 78%|███████▊ | 9685/12384 [20:33:03<5:43:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 1: 78%|███████▊ | 9686/12384 [20:33:03<5:42:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 1: 78%|███████▊ | 9686/12384 [20:33:11<5:42:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.43s]
Epoch 1: 78%|███████▊ | 9687/12384 [20:33:11<5:42:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.43s]
Epoch 1: 78%|███████▊ | 9687/12384 [20:33:19<5:42:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 78%|███████▊ | 9688/12384 [20:33:19<5:42:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 78%|███████▊ | 9688/12384 [20:33:26<5:42:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 78%|███████▊ | 9689/12384 [20:33:26<5:41:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 78%|███████▊ | 9689/12384 [20:33:34<5:41:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 78%|███████▊ | 9690/12384 [20:33:34<5:41:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 78%|███████▊ | 9690/12384 [20:33:41<5:41:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 1: 78%|███████▊ | 9691/12384 [20:33:41<5:41:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 1: 78%|███████▊ | 9691/12384 [20:33:49<5:41:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 1: 78%|███████▊ | 9692/12384 [20:33:49<5:41:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 1: 78%|███████▊ | 9692/12384 [20:33:57<5:41:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 78%|███████▊ | 9693/12384 [20:33:57<5:41:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 78%|███████▊ | 9693/12384 [20:34:04<5:41:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 78%|███████▊ | 9694/12384 [20:34:04<5:41:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 78%|███████▊ | 9694/12384 [20:34:12<5:41:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 78%|███████▊ | 9695/12384 [20:34:12<5:41:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 78%|███████▊ | 9695/12384 [20:34:20<5:41:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 78%|███████▊ | 9696/12384 [20:34:20<5:41:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 78%|███████▊ | 9696/12384 [20:34:27<5:41:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 78%|███████▊ | 9697/12384 [20:34:27<5:41:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 78%|███████▊ | 9697/12384 [20:34:35<5:41:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 78%|███████▊ | 9698/12384 [20:34:35<5:41:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 78%|███████▊ | 9698/12384 [20:34:42<5:41:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 78%|███████▊ | 9699/12384 [20:34:42<5:41:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 78%|███████▊ | 9699/12384 [20:34:50<5:41:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 78%|███████▊ | 9700/12384 [20:34:50<5:41:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 78%|███████▊ | 9700/12384 [20:34:58<5:41:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 1: 78%|███████▊ | 9701/12384 [20:34:58<5:40:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 1: 78%|███████▊ | 9701/12384 [20:35:05<5:40:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 78%|███████▊ | 9702/12384 [20:35:05<5:40:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 78%|███████▊ | 9702/12384 [20:35:13<5:40:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 78%|███████▊ | 9703/12384 [20:35:13<5:43:44, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 78%|███████▊ | 9703/12384 [20:35:21<5:43:44, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 78%|███████▊ | 9704/12384 [20:35:21<5:42:15, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 78%|███████▊ | 9704/12384 [20:35:29<5:42:15, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.00s]
Epoch 1: 78%|███████▊ | 9705/12384 [20:35:29<5:45:59, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=5.00s]
Epoch 1: 78%|███████▊ | 9705/12384 [20:35:36<5:45:59, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 1: 78%|███████▊ | 9706/12384 [20:35:36<5:44:18, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 1: 78%|███████▊ | 9706/12384 [20:35:44<5:44:18, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 1: 78%|███████▊ | 9707/12384 [20:35:44<5:42:54, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 1: 78%|███████▊ | 9707/12384 [20:35:52<5:42:54, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 1: 78%|███████▊ | 9708/12384 [20:35:52<5:42:03, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 1: 78%|███████▊ | 9708/12384 [20:35:59<5:42:03, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.97s]
Epoch 1: 78%|███████▊ | 9709/12384 [20:35:59<5:41:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.97s]
Epoch 1: 78%|███████▊ | 9709/12384 [20:36:07<5:41:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 1: 78%|███████▊ | 9710/12384 [20:36:07<5:40:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 1: 78%|███████▊ | 9710/12384 [20:36:14<5:40:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 1: 78%|███████▊ | 9711/12384 [20:36:14<5:39:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 1: 78%|███████▊ | 9711/12384 [20:36:22<5:39:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 78%|███████▊ | 9712/12384 [20:36:22<5:39:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 78%|███████▊ | 9712/12384 [20:36:30<5:39:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 78%|███████▊ | 9713/12384 [20:36:30<5:39:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 78%|███████▊ | 9713/12384 [20:36:37<5:39:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 78%|███████▊ | 9714/12384 [20:36:37<5:39:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 78%|███████▊ | 9714/12384 [20:36:45<5:39:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 78%|███████▊ | 9715/12384 [20:36:45<5:39:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 78%|███████▊ | 9715/12384 [20:36:53<5:39:10, 7.62s/it, loss=0.0033, acc=0.9959, iter_time=8.10s]
Epoch 1: 78%|███████▊ | 9716/12384 [20:36:53<5:39:35, 7.64s/it, loss=0.0033, acc=0.9959, iter_time=8.10s]
Epoch 1: 78%|███████▊ | 9716/12384 [20:37:00<5:39:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 78%|███████▊ | 9717/12384 [20:37:00<5:38:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 78%|███████▊ | 9717/12384 [20:37:08<5:38:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 78%|███████▊ | 9718/12384 [20:37:08<5:38:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 78%|███████▊ | 9718/12384 [20:37:15<5:38:18, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.23s]
Epoch 1: 78%|███████▊ | 9719/12384 [20:37:15<5:38:10, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.23s]
Epoch 1: 78%|███████▊ | 9719/12384 [20:37:23<5:38:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.33s]
Epoch 1: 78%|███████▊ | 9720/12384 [20:37:23<5:38:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.33s]
Epoch 1: 78%|███████▊ | 9720/12384 [20:37:31<5:38:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.15s]
Epoch 1: 78%|███████▊ | 9721/12384 [20:37:31<5:38:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.15s]
Epoch 1: 78%|███████▊ | 9721/12384 [20:37:38<5:38:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.43s]
Epoch 1: 79%|███████▊ | 9722/12384 [20:37:38<5:38:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.43s]
Epoch 1: 79%|███████▊ | 9722/12384 [20:37:46<5:38:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 1: 79%|███████▊ | 9723/12384 [20:37:46<5:37:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 1: 79%|███████▊ | 9723/12384 [20:37:53<5:37:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 79%|███████▊ | 9724/12384 [20:37:53<5:37:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 79%|███████▊ | 9724/12384 [20:38:01<5:37:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 1: 79%|███████▊ | 9725/12384 [20:38:01<5:37:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 1: 79%|███████▊ | 9725/12384 [20:38:09<5:37:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 1: 79%|███████▊ | 9726/12384 [20:38:09<5:37:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 1: 79%|███████▊ | 9726/12384 [20:38:16<5:37:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 1: 79%|███████▊ | 9727/12384 [20:38:16<5:36:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 1: 79%|███████▊ | 9727/12384 [20:38:24<5:36:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 1: 79%|███████▊ | 9728/12384 [20:38:24<5:36:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 1: 79%|███████▊ | 9728/12384 [20:38:31<5:36:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 1: 79%|███████▊ | 9729/12384 [20:38:31<5:36:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 1: 79%|███████▊ | 9729/12384 [20:38:39<5:36:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 79%|███████▊ | 9730/12384 [20:38:39<5:37:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 79%|███████▊ | 9730/12384 [20:38:47<5:37:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 1: 79%|███████▊ | 9731/12384 [20:38:47<5:41:27, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 1: 79%|███████▊ | 9731/12384 [20:38:55<5:41:27, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.36s]
Epoch 1: 79%|███████▊ | 9732/12384 [20:38:55<5:39:46, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.36s]
Epoch 1: 79%|███████▊ | 9732/12384 [20:39:02<5:39:46, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 1: 79%|███████▊ | 9733/12384 [20:39:02<5:38:41, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 1: 79%|███████▊ | 9733/12384 [20:39:10<5:38:41, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 1: 79%|███████▊ | 9734/12384 [20:39:10<5:37:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 1: 79%|███████▊ | 9734/12384 [20:39:18<5:37:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 1: 79%|███████▊ | 9735/12384 [20:39:18<5:37:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 1: 79%|███████▊ | 9735/12384 [20:39:25<5:37:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 1: 79%|███████▊ | 9736/12384 [20:39:25<5:36:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 1: 79%|███████▊ | 9736/12384 [20:39:33<5:36:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 79%|███████▊ | 9737/12384 [20:39:33<5:36:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 79%|███████▊ | 9737/12384 [20:39:40<5:36:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 1: 79%|███████▊ | 9738/12384 [20:39:40<5:35:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 1: 79%|███████▊ | 9738/12384 [20:39:48<5:35:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 1: 79%|███████▊ | 9739/12384 [20:39:48<5:35:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 1: 79%|███████▊ | 9739/12384 [20:39:56<5:35:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.00s]
Epoch 1: 79%|███████▊ | 9740/12384 [20:39:56<5:35:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.00s]
Epoch 1: 79%|███████▊ | 9740/12384 [20:40:03<5:35:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.97s]
Epoch 1: 79%|███████▊ | 9741/12384 [20:40:03<5:35:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.97s]
Epoch 1: 79%|███████▊ | 9741/12384 [20:40:11<5:35:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.77s]
Epoch 1: 79%|███████▊ | 9742/12384 [20:40:11<5:35:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.77s]
Epoch 1: 79%|███████▊ | 9742/12384 [20:40:18<5:35:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 1: 79%|███████▊ | 9743/12384 [20:40:18<5:34:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 1: 79%|███████▊ | 9743/12384 [20:40:26<5:34:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 79%|███████▊ | 9744/12384 [20:40:26<5:35:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 79%|███████▊ | 9744/12384 [20:40:34<5:35:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 79%|███████▊ | 9745/12384 [20:40:34<5:34:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 79%|███████▊ | 9745/12384 [20:40:41<5:34:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 79%|███████▊ | 9746/12384 [20:40:41<5:34:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 79%|███████▊ | 9746/12384 [20:40:49<5:34:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 1: 79%|███████▊ | 9747/12384 [20:40:49<5:34:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 1: 79%|███████▊ | 9747/12384 [20:40:56<5:34:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 79%|███████▊ | 9748/12384 [20:40:56<5:33:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 79%|███████▊ | 9748/12384 [20:41:04<5:33:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.57s]
Epoch 1: 79%|███████▊ | 9749/12384 [20:41:04<5:33:44, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.57s]
Epoch 1: 79%|███████▊ | 9749/12384 [20:41:12<5:33:44, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.61s]
Epoch 1: 79%|███████▊ | 9750/12384 [20:41:12<5:33:35, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.61s]
Epoch 1: 79%|███████▊ | 9750/12384 [20:41:19<5:33:35, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 1: 79%|███████▊ | 9751/12384 [20:41:19<5:33:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 1: 79%|███████▊ | 9751/12384 [20:41:27<5:33:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.85s]
Epoch 1: 79%|███████▊ | 9752/12384 [20:41:27<5:33:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.85s]
Epoch 1: 79%|███████▊ | 9752/12384 [20:41:34<5:33:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 79%|███████▉ | 9753/12384 [20:41:34<5:33:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 79%|███████▉ | 9753/12384 [20:41:42<5:33:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.93s]
Epoch 1: 79%|███████▉ | 9754/12384 [20:41:42<5:33:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.93s]
Epoch 1: 79%|███████▉ | 9754/12384 [20:41:50<5:33:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 1: 79%|███████▉ | 9755/12384 [20:41:50<5:33:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 1: 79%|███████▉ | 9755/12384 [20:41:57<5:33:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 79%|███████▉ | 9756/12384 [20:41:57<5:33:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 79%|███████▉ | 9756/12384 [20:42:05<5:33:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 79%|███████▉ | 9757/12384 [20:42:05<5:37:56, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 79%|███████▉ | 9757/12384 [20:42:13<5:37:56, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 1: 79%|███████▉ | 9758/12384 [20:42:13<5:36:25, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 1: 79%|███████▉ | 9758/12384 [20:42:20<5:36:25, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 1: 79%|███████▉ | 9759/12384 [20:42:20<5:35:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 1: 79%|███████▉ | 9759/12384 [20:42:28<5:35:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=11.09s]
Epoch 1: 79%|███████▉ | 9760/12384 [20:42:28<5:34:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.09s]
Epoch 1: 79%|███████▉ | 9760/12384 [20:42:36<5:34:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 79%|███████▉ | 9761/12384 [20:42:36<5:34:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 79%|███████▉ | 9761/12384 [20:42:43<5:34:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 79%|███████▉ | 9762/12384 [20:42:43<5:33:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 79%|███████▉ | 9762/12384 [20:42:51<5:33:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 1: 79%|███████▉ | 9763/12384 [20:42:51<5:33:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 1: 79%|███████▉ | 9763/12384 [20:42:59<5:33:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 1: 79%|███████▉ | 9764/12384 [20:42:59<5:32:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 1: 79%|███████▉ | 9764/12384 [20:43:06<5:32:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 79%|███████▉ | 9765/12384 [20:43:06<5:32:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 79%|███████▉ | 9765/12384 [20:43:14<5:32:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 79%|███████▉ | 9766/12384 [20:43:14<5:32:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 79%|███████▉ | 9766/12384 [20:43:21<5:32:21, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.68s]
Epoch 1: 79%|███████▉ | 9767/12384 [20:43:21<5:32:43, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.68s]
Epoch 1: 79%|███████▉ | 9767/12384 [20:43:29<5:32:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.56s]
Epoch 1: 79%|███████▉ | 9768/12384 [20:43:29<5:32:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.56s]
Epoch 1: 79%|███████▉ | 9768/12384 [20:43:37<5:32:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 79%|███████▉ | 9769/12384 [20:43:37<5:31:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 79%|███████▉ | 9769/12384 [20:43:44<5:31:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 79%|███████▉ | 9770/12384 [20:43:44<5:31:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 79%|███████▉ | 9770/12384 [20:43:52<5:31:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 79%|███████▉ | 9771/12384 [20:43:52<5:31:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 79%|███████▉ | 9771/12384 [20:44:00<5:31:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 1: 79%|███████▉ | 9772/12384 [20:44:00<5:31:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 1: 79%|███████▉ | 9772/12384 [20:44:07<5:31:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 79%|███████▉ | 9773/12384 [20:44:07<5:31:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 79%|███████▉ | 9773/12384 [20:44:15<5:31:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 1: 79%|███████▉ | 9774/12384 [20:44:15<5:31:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 1: 79%|███████▉ | 9774/12384 [20:44:22<5:31:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 79%|███████▉ | 9775/12384 [20:44:22<5:31:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 79%|███████▉ | 9775/12384 [20:44:30<5:31:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 1: 79%|███████▉ | 9776/12384 [20:44:30<5:31:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 1: 79%|███████▉ | 9776/12384 [20:44:38<5:31:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 79%|███████▉ | 9777/12384 [20:44:38<5:32:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 79%|███████▉ | 9777/12384 [20:44:45<5:32:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 79%|███████▉ | 9778/12384 [20:44:45<5:31:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 79%|███████▉ | 9778/12384 [20:44:53<5:31:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 79%|███████▉ | 9779/12384 [20:44:53<5:32:50, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 79%|███████▉ | 9779/12384 [20:45:01<5:32:50, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.86s]
Epoch 1: 79%|███████▉ | 9780/12384 [20:45:01<5:32:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.86s]
Epoch 1: 79%|███████▉ | 9780/12384 [20:45:09<5:32:00, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=8.73s]
Epoch 1: 79%|███████▉ | 9781/12384 [20:45:09<5:34:34, 7.71s/it, loss=0.0002, acc=1.0000, iter_time=8.73s]
Epoch 1: 79%|███████▉ | 9781/12384 [20:45:16<5:34:34, 7.71s/it, loss=0.0002, acc=0.9994, iter_time=7.60s]
Epoch 1: 79%|███████▉ | 9782/12384 [20:45:16<5:33:07, 7.68s/it, loss=0.0002, acc=0.9994, iter_time=7.60s]
Epoch 1: 79%|███████▉ | 9782/12384 [20:45:24<5:33:07, 7.68s/it, loss=0.0011, acc=0.9982, iter_time=7.62s]
Epoch 1: 79%|███████▉ | 9783/12384 [20:45:24<5:32:01, 7.66s/it, loss=0.0011, acc=0.9982, iter_time=7.62s]
Epoch 1: 79%|███████▉ | 9783/12384 [20:45:32<5:32:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 1: 79%|███████▉ | 9784/12384 [20:45:32<5:35:25, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 1: 79%|███████▉ | 9784/12384 [20:45:39<5:35:25, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.46s]
Epoch 1: 79%|███████▉ | 9785/12384 [20:45:39<5:33:38, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.46s]
Epoch 1: 79%|███████▉ | 9785/12384 [20:45:47<5:33:38, 7.70s/it, loss=0.0050, acc=0.9911, iter_time=7.62s]
Epoch 1: 79%|███████▉ | 9786/12384 [20:45:47<5:32:22, 7.68s/it, loss=0.0050, acc=0.9911, iter_time=7.62s]
Epoch 1: 79%|███████▉ | 9786/12384 [20:45:55<5:32:22, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 79%|███████▉ | 9787/12384 [20:45:55<5:31:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 79%|███████▉ | 9787/12384 [20:46:02<5:31:17, 7.65s/it, loss=0.0007, acc=0.9979, iter_time=5.55s]
Epoch 1: 79%|███████▉ | 9788/12384 [20:46:02<5:30:23, 7.64s/it, loss=0.0007, acc=0.9979, iter_time=5.55s]
Epoch 1: 79%|███████▉ | 9788/12384 [20:46:10<5:30:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 1: 79%|███████▉ | 9789/12384 [20:46:10<5:29:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 1: 79%|███████▉ | 9789/12384 [20:46:17<5:29:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 79%|███████▉ | 9790/12384 [20:46:17<5:29:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 79%|███████▉ | 9790/12384 [20:46:25<5:29:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 1: 79%|███████▉ | 9791/12384 [20:46:25<5:29:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 1: 79%|███████▉ | 9791/12384 [20:46:33<5:29:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 1: 79%|███████▉ | 9792/12384 [20:46:33<5:29:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 1: 79%|███████▉ | 9792/12384 [20:46:40<5:29:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 79%|███████▉ | 9793/12384 [20:46:40<5:28:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 79%|███████▉ | 9793/12384 [20:46:48<5:28:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 79%|███████▉ | 9794/12384 [20:46:48<5:28:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 79%|███████▉ | 9794/12384 [20:46:55<5:28:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 79%|███████▉ | 9795/12384 [20:46:55<5:28:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 79%|███████▉ | 9795/12384 [20:47:03<5:28:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 79%|███████▉ | 9796/12384 [20:47:03<5:28:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 79%|███████▉ | 9796/12384 [20:47:11<5:28:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.11s]
Epoch 1: 79%|███████▉ | 9797/12384 [20:47:11<5:29:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.11s]
Epoch 1: 79%|███████▉ | 9797/12384 [20:47:18<5:29:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.21s]
Epoch 1: 79%|███████▉ | 9798/12384 [20:47:18<5:28:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.21s]
Epoch 1: 79%|███████▉ | 9798/12384 [20:47:26<5:28:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 79%|███████▉ | 9799/12384 [20:47:26<5:28:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 79%|███████▉ | 9799/12384 [20:47:34<5:28:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 79%|███████▉ | 9800/12384 [20:47:34<5:28:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 79%|███████▉ | 9800/12384 [20:47:41<5:28:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 1: 79%|███████▉ | 9801/12384 [20:47:41<5:28:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 1: 79%|███████▉ | 9801/12384 [20:47:49<5:28:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.38s]
Epoch 1: 79%|███████▉ | 9802/12384 [20:47:49<5:28:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.38s]
Epoch 1: 79%|███████▉ | 9802/12384 [20:47:57<5:28:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 79%|███████▉ | 9803/12384 [20:47:57<5:29:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 79%|███████▉ | 9803/12384 [20:48:04<5:29:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.19s]
Epoch 1: 79%|███████▉ | 9804/12384 [20:48:04<5:28:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.19s]
Epoch 1: 79%|███████▉ | 9804/12384 [20:48:12<5:28:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 1: 79%|███████▉ | 9805/12384 [20:48:12<5:27:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 1: 79%|███████▉ | 9805/12384 [20:48:20<5:27:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.95s]
Epoch 1: 79%|███████▉ | 9806/12384 [20:48:20<5:30:54, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.95s]
Epoch 1: 79%|███████▉ | 9806/12384 [20:48:27<5:30:54, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 79%|███████▉ | 9807/12384 [20:48:27<5:29:28, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 79%|███████▉ | 9807/12384 [20:48:35<5:29:28, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 79%|███████▉ | 9808/12384 [20:48:35<5:28:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 79%|███████▉ | 9808/12384 [20:48:42<5:28:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 79%|███████▉ | 9809/12384 [20:48:42<5:27:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 79%|███████▉ | 9809/12384 [20:48:50<5:27:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 79%|███████▉ | 9810/12384 [20:48:50<5:31:25, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 79%|███████▉ | 9810/12384 [20:48:58<5:31:25, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 1: 79%|███████▉ | 9811/12384 [20:48:58<5:29:56, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 1: 79%|███████▉ | 9811/12384 [20:49:06<5:29:56, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=11.41s]
Epoch 1: 79%|███████▉ | 9812/12384 [20:49:06<5:29:40, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=11.41s]
Epoch 1: 79%|███████▉ | 9812/12384 [20:49:13<5:29:40, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 79%|███████▉ | 9813/12384 [20:49:13<5:28:30, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 79%|███████▉ | 9813/12384 [20:49:21<5:28:30, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 79%|███████▉ | 9814/12384 [20:49:21<5:27:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 79%|███████▉ | 9814/12384 [20:49:28<5:27:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 79%|███████▉ | 9815/12384 [20:49:28<5:27:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 79%|███████▉ | 9815/12384 [20:49:36<5:27:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 79%|███████▉ | 9816/12384 [20:49:36<5:26:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 79%|███████▉ | 9816/12384 [20:49:44<5:26:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 79%|███████▉ | 9817/12384 [20:49:44<5:26:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 79%|███████▉ | 9817/12384 [20:49:51<5:26:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 79%|███████▉ | 9818/12384 [20:49:51<5:26:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 79%|███████▉ | 9818/12384 [20:49:59<5:26:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 1: 79%|███████▉ | 9819/12384 [20:49:59<5:25:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 1: 79%|███████▉ | 9819/12384 [20:50:07<5:25:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.77s]
Epoch 1: 79%|███████▉ | 9820/12384 [20:50:07<5:25:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.77s]
Epoch 1: 79%|███████▉ | 9820/12384 [20:50:14<5:25:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.79s]
Epoch 1: 79%|███████▉ | 9821/12384 [20:50:14<5:25:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.79s]
Epoch 1: 79%|███████▉ | 9821/12384 [20:50:22<5:25:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 79%|███████▉ | 9822/12384 [20:50:22<5:25:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 79%|███████▉ | 9822/12384 [20:50:29<5:25:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 79%|███████▉ | 9823/12384 [20:50:29<5:24:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 79%|███████▉ | 9823/12384 [20:50:37<5:24:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 79%|███████▉ | 9824/12384 [20:50:37<5:24:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 79%|███████▉ | 9824/12384 [20:50:45<5:24:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 79%|███████▉ | 9825/12384 [20:50:45<5:24:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 79%|███████▉ | 9825/12384 [20:50:52<5:24:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 79%|███████▉ | 9826/12384 [20:50:52<5:24:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 79%|███████▉ | 9826/12384 [20:51:00<5:24:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 79%|███████▉ | 9827/12384 [20:51:00<5:24:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 79%|███████▉ | 9827/12384 [20:51:08<5:24:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 79%|███████▉ | 9828/12384 [20:51:08<5:24:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 79%|███████▉ | 9828/12384 [20:51:15<5:24:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 79%|███████▉ | 9829/12384 [20:51:15<5:24:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 79%|███████▉ | 9829/12384 [20:51:23<5:24:06, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=8.79s]
Epoch 1: 79%|███████▉ | 9830/12384 [20:51:23<5:23:52, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=8.79s]
Epoch 1: 79%|███████▉ | 9830/12384 [20:51:30<5:23:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 79%|███████▉ | 9831/12384 [20:51:30<5:24:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 79%|███████▉ | 9831/12384 [20:51:38<5:24:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 79%|███████▉ | 9832/12384 [20:51:38<5:24:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 79%|███████▉ | 9832/12384 [20:51:46<5:24:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 79%|███████▉ | 9833/12384 [20:51:46<5:27:57, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 79%|███████▉ | 9833/12384 [20:51:54<5:27:57, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 1: 79%|███████▉ | 9834/12384 [20:51:54<5:26:16, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 1: 79%|███████▉ | 9834/12384 [20:52:01<5:26:16, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 1: 79%|███████▉ | 9835/12384 [20:52:01<5:25:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 1: 79%|███████▉ | 9835/12384 [20:52:09<5:25:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.25s]
Epoch 1: 79%|███████▉ | 9836/12384 [20:52:09<5:24:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.25s]
Epoch 1: 79%|███████▉ | 9836/12384 [20:52:17<5:24:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.98s]
Epoch 1: 79%|███████▉ | 9837/12384 [20:52:17<5:27:27, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.98s]
Epoch 1: 79%|███████▉ | 9837/12384 [20:52:24<5:27:27, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 1: 79%|███████▉ | 9838/12384 [20:52:24<5:25:55, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 1: 79%|███████▉ | 9838/12384 [20:52:32<5:25:55, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 79%|███████▉ | 9839/12384 [20:52:32<5:24:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 79%|███████▉ | 9839/12384 [20:52:39<5:24:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 79%|███████▉ | 9840/12384 [20:52:39<5:24:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 79%|███████▉ | 9840/12384 [20:52:47<5:24:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 79%|███████▉ | 9841/12384 [20:52:47<5:23:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 79%|███████▉ | 9841/12384 [20:52:55<5:23:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 79%|███████▉ | 9842/12384 [20:52:55<5:22:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 79%|███████▉ | 9842/12384 [20:53:02<5:22:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.54s]
Epoch 1: 79%|███████▉ | 9843/12384 [20:53:02<5:23:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.54s]
Epoch 1: 79%|███████▉ | 9843/12384 [20:53:10<5:23:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 1: 79%|███████▉ | 9844/12384 [20:53:10<5:22:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 1: 79%|███████▉ | 9844/12384 [20:53:18<5:22:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.19s]
Epoch 1: 79%|███████▉ | 9845/12384 [20:53:18<5:22:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.19s]
Epoch 1: 79%|███████▉ | 9845/12384 [20:53:25<5:22:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.48s]
Epoch 1: 80%|███████▉ | 9846/12384 [20:53:25<5:22:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.48s]
Epoch 1: 80%|███████▉ | 9846/12384 [20:53:33<5:22:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 1: 80%|███████▉ | 9847/12384 [20:53:33<5:22:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 1: 80%|███████▉ | 9847/12384 [20:53:40<5:22:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 1: 80%|███████▉ | 9848/12384 [20:53:40<5:22:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 1: 80%|███████▉ | 9848/12384 [20:53:48<5:22:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 80%|███████▉ | 9849/12384 [20:53:48<5:22:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 80%|███████▉ | 9849/12384 [20:53:56<5:22:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 80%|███████▉ | 9850/12384 [20:53:56<5:21:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 80%|███████▉ | 9850/12384 [20:54:03<5:21:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 80%|███████▉ | 9851/12384 [20:54:03<5:21:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 80%|███████▉ | 9851/12384 [20:54:11<5:21:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 80%|███████▉ | 9852/12384 [20:54:11<5:21:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 80%|███████▉ | 9852/12384 [20:54:19<5:21:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 1: 80%|███████▉ | 9853/12384 [20:54:19<5:21:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 1: 80%|███████▉ | 9853/12384 [20:54:26<5:21:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 1: 80%|███████▉ | 9854/12384 [20:54:26<5:21:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 1: 80%|███████▉ | 9854/12384 [20:54:34<5:21:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 1: 80%|███████▉ | 9855/12384 [20:54:34<5:21:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 1: 80%|███████▉ | 9855/12384 [20:54:41<5:21:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.57s]
Epoch 1: 80%|███████▉ | 9856/12384 [20:54:41<5:21:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.57s]
Epoch 1: 80%|███████▉ | 9856/12384 [20:54:49<5:21:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.74s]
Epoch 1: 80%|███████▉ | 9857/12384 [20:54:49<5:21:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.74s]
Epoch 1: 80%|███████▉ | 9857/12384 [20:54:57<5:21:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 1: 80%|███████▉ | 9858/12384 [20:54:57<5:20:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 1: 80%|███████▉ | 9858/12384 [20:55:04<5:20:30, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.89s]
Epoch 1: 80%|███████▉ | 9859/12384 [20:55:04<5:19:54, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.89s]
Epoch 1: 80%|███████▉ | 9859/12384 [20:55:12<5:19:54, 7.60s/it, loss=0.0002, acc=0.9984, iter_time=6.95s]
Epoch 1: 80%|███████▉ | 9860/12384 [20:55:12<5:19:42, 7.60s/it, loss=0.0002, acc=0.9984, iter_time=6.95s]
Epoch 1: 80%|███████▉ | 9860/12384 [20:55:19<5:19:42, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 80%|███████▉ | 9861/12384 [20:55:19<5:19:40, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 80%|███████▉ | 9861/12384 [20:55:27<5:19:40, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 80%|███████▉ | 9862/12384 [20:55:27<5:19:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 80%|███████▉ | 9862/12384 [20:55:35<5:19:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.58s]
Epoch 1: 80%|███████▉ | 9863/12384 [20:55:35<5:24:13, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.58s]
Epoch 1: 80%|███████▉ | 9863/12384 [20:55:43<5:24:13, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.38s]
Epoch 1: 80%|███████▉ | 9864/12384 [20:55:43<5:22:55, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.38s]
Epoch 1: 80%|███████▉ | 9864/12384 [20:55:50<5:22:55, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 80%|███████▉ | 9865/12384 [20:55:50<5:21:46, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 80%|███████▉ | 9865/12384 [20:55:58<5:21:46, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 80%|███████▉ | 9866/12384 [20:55:58<5:20:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 80%|███████▉ | 9866/12384 [20:56:05<5:20:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 80%|███████▉ | 9867/12384 [20:56:05<5:20:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 80%|███████▉ | 9867/12384 [20:56:13<5:20:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 80%|███████▉ | 9868/12384 [20:56:13<5:19:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 80%|███████▉ | 9868/12384 [20:56:21<5:19:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.78s]
Epoch 1: 80%|███████▉ | 9869/12384 [20:56:21<5:19:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.78s]
Epoch 1: 80%|███████▉ | 9869/12384 [20:56:28<5:19:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.43s]
Epoch 1: 80%|███████▉ | 9870/12384 [20:56:28<5:19:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.43s]
Epoch 1: 80%|███████▉ | 9870/12384 [20:56:36<5:19:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 80%|███████▉ | 9871/12384 [20:56:36<5:19:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 80%|███████▉ | 9871/12384 [20:56:44<5:19:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 80%|███████▉ | 9872/12384 [20:56:44<5:20:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 80%|███████▉ | 9872/12384 [20:56:51<5:20:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 80%|███████▉ | 9873/12384 [20:56:51<5:19:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 80%|███████▉ | 9873/12384 [20:56:59<5:19:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 80%|███████▉ | 9874/12384 [20:56:59<5:18:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 80%|███████▉ | 9874/12384 [20:57:06<5:18:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 80%|███████▉ | 9875/12384 [20:57:06<5:19:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 80%|███████▉ | 9875/12384 [20:57:14<5:19:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.14s]
Epoch 1: 80%|███████▉ | 9876/12384 [20:57:14<5:18:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.14s]
Epoch 1: 80%|███████▉ | 9876/12384 [20:57:22<5:18:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 80%|███████▉ | 9877/12384 [20:57:22<5:18:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 80%|███████▉ | 9877/12384 [20:57:29<5:18:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 1: 80%|███████▉ | 9878/12384 [20:57:29<5:18:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 1: 80%|███████▉ | 9878/12384 [20:57:37<5:18:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 80%|███████▉ | 9879/12384 [20:57:37<5:17:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 80%|███████▉ | 9879/12384 [20:57:44<5:17:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 80%|███████▉ | 9880/12384 [20:57:44<5:17:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 80%|███████▉ | 9880/12384 [20:57:52<5:17:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 1: 80%|███████▉ | 9881/12384 [20:57:52<5:18:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 1: 80%|███████▉ | 9881/12384 [20:58:00<5:18:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.80s]
Epoch 1: 80%|███████▉ | 9882/12384 [20:58:00<5:17:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.80s]
Epoch 1: 80%|███████▉ | 9882/12384 [20:58:07<5:17:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 80%|███████▉ | 9883/12384 [20:58:07<5:17:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 80%|███████▉ | 9883/12384 [20:58:15<5:17:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 1: 80%|███████▉ | 9884/12384 [20:58:15<5:16:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 1: 80%|███████▉ | 9884/12384 [20:58:23<5:16:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.72s]
Epoch 1: 80%|███████▉ | 9885/12384 [20:58:23<5:17:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.72s]
Epoch 1: 80%|███████▉ | 9885/12384 [20:58:30<5:17:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.83s]
Epoch 1: 80%|███████▉ | 9886/12384 [20:58:30<5:17:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.83s]
Epoch 1: 80%|███████▉ | 9886/12384 [20:58:38<5:17:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 1: 80%|███████▉ | 9887/12384 [20:58:38<5:20:09, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 1: 80%|███████▉ | 9887/12384 [20:58:46<5:20:09, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 80%|███████▉ | 9888/12384 [20:58:46<5:19:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 80%|███████▉ | 9888/12384 [20:58:54<5:19:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.64s]
Epoch 1: 80%|███████▉ | 9889/12384 [20:58:54<5:22:24, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=5.64s]
Epoch 1: 80%|███████▉ | 9889/12384 [20:59:01<5:22:24, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 1: 80%|███████▉ | 9890/12384 [20:59:01<5:20:18, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 1: 80%|███████▉ | 9890/12384 [20:59:09<5:20:18, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 1: 80%|███████▉ | 9891/12384 [20:59:09<5:19:07, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 1: 80%|███████▉ | 9891/12384 [20:59:16<5:19:07, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 1: 80%|███████▉ | 9892/12384 [20:59:16<5:17:59, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 1: 80%|███████▉ | 9892/12384 [20:59:24<5:17:59, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 80%|███████▉ | 9893/12384 [20:59:24<5:17:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 80%|███████▉ | 9893/12384 [20:59:32<5:17:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 80%|███████▉ | 9894/12384 [20:59:32<5:16:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 80%|███████▉ | 9894/12384 [20:59:39<5:16:49, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 1: 80%|███████▉ | 9895/12384 [20:59:39<5:16:16, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 1: 80%|███████▉ | 9895/12384 [20:59:47<5:16:16, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=7.70s]
Epoch 1: 80%|███████▉ | 9896/12384 [20:59:47<5:15:59, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=7.70s]
Epoch 1: 80%|███████▉ | 9896/12384 [20:59:54<5:15:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 80%|███████▉ | 9897/12384 [20:59:54<5:15:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 80%|███████▉ | 9897/12384 [21:00:02<5:15:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 80%|███████▉ | 9898/12384 [21:00:02<5:15:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 80%|███████▉ | 9898/12384 [21:00:10<5:15:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.99s]
Epoch 1: 80%|███████▉ | 9899/12384 [21:00:10<5:15:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.99s]
Epoch 1: 80%|███████▉ | 9899/12384 [21:00:17<5:15:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.23s]
Epoch 1: 80%|███████▉ | 9900/12384 [21:00:17<5:15:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.23s]
Epoch 1: 80%|███████▉ | 9900/12384 [21:00:25<5:15:22, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=4.01s]
Epoch 1: 80%|███████▉ | 9901/12384 [21:00:25<5:15:20, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=4.01s]
Epoch 1: 80%|███████▉ | 9901/12384 [21:00:33<5:15:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.46s]
Epoch 1: 80%|███████▉ | 9902/12384 [21:00:33<5:14:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.46s]
Epoch 1: 80%|███████▉ | 9902/12384 [21:00:40<5:14:50, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.36s]
Epoch 1: 80%|███████▉ | 9903/12384 [21:00:40<5:14:36, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.36s]
Epoch 1: 80%|███████▉ | 9903/12384 [21:00:48<5:14:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 80%|███████▉ | 9904/12384 [21:00:48<5:14:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 80%|███████▉ | 9904/12384 [21:00:55<5:14:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 80%|███████▉ | 9905/12384 [21:00:55<5:14:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 80%|███████▉ | 9905/12384 [21:01:03<5:14:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 80%|███████▉ | 9906/12384 [21:01:03<5:14:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 80%|███████▉ | 9906/12384 [21:01:11<5:14:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 80%|███████▉ | 9907/12384 [21:01:11<5:14:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 80%|███████▉ | 9907/12384 [21:01:18<5:14:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 1: 80%|████████ | 9908/12384 [21:01:18<5:14:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 1: 80%|████████ | 9908/12384 [21:01:26<5:14:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.43s]
Epoch 1: 80%|████████ | 9909/12384 [21:01:26<5:14:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.43s]
Epoch 1: 80%|████████ | 9909/12384 [21:01:33<5:14:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 80%|████████ | 9910/12384 [21:01:33<5:13:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 80%|████████ | 9910/12384 [21:01:41<5:13:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 80%|████████ | 9911/12384 [21:01:41<5:13:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 80%|████████ | 9911/12384 [21:01:49<5:13:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 1: 80%|████████ | 9912/12384 [21:01:49<5:17:19, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 1: 80%|████████ | 9912/12384 [21:01:57<5:17:19, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.02s]
Epoch 1: 80%|████████ | 9913/12384 [21:01:57<5:15:59, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.02s]
Epoch 1: 80%|████████ | 9913/12384 [21:02:04<5:15:59, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 1: 80%|████████ | 9914/12384 [21:02:04<5:14:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 1: 80%|████████ | 9914/12384 [21:02:12<5:14:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 1: 80%|████████ | 9915/12384 [21:02:12<5:19:14, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 1: 80%|████████ | 9915/12384 [21:02:20<5:19:14, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 1: 80%|████████ | 9916/12384 [21:02:20<5:17:28, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 1: 80%|████████ | 9916/12384 [21:02:27<5:17:28, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 80%|████████ | 9917/12384 [21:02:27<5:15:51, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 80%|████████ | 9917/12384 [21:02:35<5:15:51, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 80%|████████ | 9918/12384 [21:02:35<5:15:02, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 80%|████████ | 9918/12384 [21:02:43<5:15:02, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 80%|████████ | 9919/12384 [21:02:43<5:14:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 80%|████████ | 9919/12384 [21:02:50<5:14:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 80%|████████ | 9920/12384 [21:02:50<5:13:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 80%|████████ | 9920/12384 [21:02:58<5:13:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 80%|████████ | 9921/12384 [21:02:58<5:13:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 80%|████████ | 9921/12384 [21:03:06<5:13:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 1: 80%|████████ | 9922/12384 [21:03:06<5:12:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 1: 80%|████████ | 9922/12384 [21:03:13<5:12:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 1: 80%|████████ | 9923/12384 [21:03:13<5:13:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 1: 80%|████████ | 9923/12384 [21:03:21<5:13:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.53s]
Epoch 1: 80%|████████ | 9924/12384 [21:03:21<5:12:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.53s]
Epoch 1: 80%|████████ | 9924/12384 [21:03:28<5:12:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 1: 80%|████████ | 9925/12384 [21:03:28<5:12:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 1: 80%|████████ | 9925/12384 [21:03:36<5:12:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 80%|████████ | 9926/12384 [21:03:36<5:12:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 80%|████████ | 9926/12384 [21:03:44<5:12:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 1: 80%|████████ | 9927/12384 [21:03:44<5:11:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 1: 80%|████████ | 9927/12384 [21:03:51<5:11:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 1: 80%|████████ | 9928/12384 [21:03:51<5:12:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 1: 80%|████████ | 9928/12384 [21:03:59<5:12:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 80%|████████ | 9929/12384 [21:03:59<5:12:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 80%|████████ | 9929/12384 [21:04:07<5:12:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 80%|████████ | 9930/12384 [21:04:07<5:11:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 80%|████████ | 9930/12384 [21:04:14<5:11:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 1: 80%|████████ | 9931/12384 [21:04:14<5:11:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 1: 80%|████████ | 9931/12384 [21:04:22<5:11:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 1: 80%|████████ | 9932/12384 [21:04:22<5:11:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 1: 80%|████████ | 9932/12384 [21:04:29<5:11:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.08s]
Epoch 1: 80%|████████ | 9933/12384 [21:04:29<5:11:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.08s]
Epoch 1: 80%|████████ | 9933/12384 [21:04:37<5:11:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 80%|████████ | 9934/12384 [21:04:37<5:10:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 80%|████████ | 9934/12384 [21:04:45<5:10:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 1: 80%|████████ | 9935/12384 [21:04:45<5:10:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 1: 80%|████████ | 9935/12384 [21:04:52<5:10:29, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.57s]
Epoch 1: 80%|████████ | 9936/12384 [21:04:52<5:10:30, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.57s]
Epoch 1: 80%|████████ | 9936/12384 [21:05:00<5:10:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 1: 80%|████████ | 9937/12384 [21:05:00<5:10:05, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 1: 80%|████████ | 9937/12384 [21:05:08<5:10:05, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 1: 80%|████████ | 9938/12384 [21:05:08<5:12:53, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 1: 80%|████████ | 9938/12384 [21:05:15<5:12:53, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 80%|████████ | 9939/12384 [21:05:15<5:12:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 80%|████████ | 9939/12384 [21:05:23<5:12:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 1: 80%|████████ | 9940/12384 [21:05:23<5:11:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 1: 80%|████████ | 9940/12384 [21:05:31<5:11:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 1: 80%|████████ | 9941/12384 [21:05:31<5:14:49, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 1: 80%|████████ | 9941/12384 [21:05:38<5:14:49, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 1: 80%|████████ | 9942/12384 [21:05:38<5:13:06, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 1: 80%|████████ | 9942/12384 [21:05:46<5:13:06, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 80%|████████ | 9943/12384 [21:05:46<5:11:51, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 80%|████████ | 9943/12384 [21:05:54<5:11:51, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.92s]
Epoch 1: 80%|████████ | 9944/12384 [21:05:54<5:11:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.92s]
Epoch 1: 80%|████████ | 9944/12384 [21:06:01<5:11:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 80%|████████ | 9945/12384 [21:06:01<5:11:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 80%|████████ | 9945/12384 [21:06:09<5:11:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 1: 80%|████████ | 9946/12384 [21:06:09<5:11:08, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 1: 80%|████████ | 9946/12384 [21:06:17<5:11:08, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 1: 80%|████████ | 9947/12384 [21:06:17<5:10:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 1: 80%|████████ | 9947/12384 [21:06:24<5:10:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 80%|████████ | 9948/12384 [21:06:24<5:10:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 80%|████████ | 9948/12384 [21:06:32<5:10:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 80%|████████ | 9949/12384 [21:06:32<5:09:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 80%|████████ | 9949/12384 [21:06:39<5:09:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 80%|████████ | 9950/12384 [21:06:39<5:09:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 80%|████████ | 9950/12384 [21:06:47<5:09:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 80%|████████ | 9951/12384 [21:06:47<5:09:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 80%|████████ | 9951/12384 [21:06:55<5:09:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.12s]
Epoch 1: 80%|████████ | 9952/12384 [21:06:55<5:10:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.12s]
Epoch 1: 80%|████████ | 9952/12384 [21:07:02<5:10:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 80%|████████ | 9953/12384 [21:07:02<5:09:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 80%|████████ | 9953/12384 [21:07:10<5:09:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 80%|████████ | 9954/12384 [21:07:10<5:08:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 80%|████████ | 9954/12384 [21:07:18<5:08:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 80%|████████ | 9955/12384 [21:07:18<5:08:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 80%|████████ | 9955/12384 [21:07:25<5:08:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 1: 80%|████████ | 9956/12384 [21:07:25<5:08:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 1: 80%|████████ | 9956/12384 [21:07:33<5:08:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.67s]
Epoch 1: 80%|████████ | 9957/12384 [21:07:33<5:07:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.67s]
Epoch 1: 80%|████████ | 9957/12384 [21:07:40<5:07:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 1: 80%|████████ | 9958/12384 [21:07:40<5:07:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 1: 80%|████████ | 9958/12384 [21:07:48<5:07:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 80%|████████ | 9959/12384 [21:07:48<5:07:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 80%|████████ | 9959/12384 [21:07:56<5:07:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 80%|████████ | 9960/12384 [21:07:56<5:07:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 80%|████████ | 9960/12384 [21:08:03<5:07:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 1: 80%|████████ | 9961/12384 [21:08:03<5:07:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 1: 80%|████████ | 9961/12384 [21:08:11<5:07:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 1: 80%|████████ | 9962/12384 [21:08:11<5:07:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 1: 80%|████████ | 9962/12384 [21:08:18<5:07:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 80%|████████ | 9963/12384 [21:08:18<5:07:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 80%|████████ | 9963/12384 [21:08:26<5:07:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 1: 80%|████████ | 9964/12384 [21:08:26<5:06:37, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 1: 80%|████████ | 9964/12384 [21:08:34<5:06:37, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 1: 80%|████████ | 9965/12384 [21:08:34<5:09:33, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 1: 80%|████████ | 9965/12384 [21:08:41<5:09:33, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 80%|████████ | 9966/12384 [21:08:41<5:08:41, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 80%|████████ | 9966/12384 [21:08:49<5:08:41, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 1: 80%|████████ | 9967/12384 [21:08:49<5:08:03, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 1: 80%|████████ | 9967/12384 [21:08:57<5:08:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 1: 80%|████████ | 9968/12384 [21:08:57<5:11:20, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 1: 80%|████████ | 9968/12384 [21:09:05<5:11:20, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=4.63s]
Epoch 1: 80%|████████ | 9969/12384 [21:09:05<5:09:34, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.63s]
Epoch 1: 80%|████████ | 9969/12384 [21:09:12<5:09:34, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 1: 81%|████████ | 9970/12384 [21:09:12<5:09:37, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 1: 81%|████████ | 9970/12384 [21:09:20<5:09:37, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 1: 81%|████████ | 9971/12384 [21:09:20<5:08:24, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 1: 81%|████████ | 9971/12384 [21:09:28<5:08:24, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 1: 81%|████████ | 9972/12384 [21:09:28<5:07:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 1: 81%|████████ | 9972/12384 [21:09:35<5:07:37, 7.65s/it, loss=0.0008, acc=1.0000, iter_time=7.03s]
Epoch 1: 81%|████████ | 9973/12384 [21:09:35<5:07:12, 7.65s/it, loss=0.0008, acc=1.0000, iter_time=7.03s]
Epoch 1: 81%|████████ | 9973/12384 [21:09:43<5:07:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 1: 81%|████████ | 9974/12384 [21:09:43<5:06:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 1: 81%|████████ | 9974/12384 [21:09:50<5:06:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.84s]
Epoch 1: 81%|████████ | 9975/12384 [21:09:50<5:05:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.84s]
Epoch 1: 81%|████████ | 9975/12384 [21:09:58<5:05:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.11s]
Epoch 1: 81%|████████ | 9976/12384 [21:09:58<5:05:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.11s]
Epoch 1: 81%|████████ | 9976/12384 [21:10:06<5:05:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 1: 81%|████████ | 9977/12384 [21:10:06<5:06:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 1: 81%|████████ | 9977/12384 [21:10:13<5:06:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 1: 81%|████████ | 9978/12384 [21:10:13<5:05:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 1: 81%|████████ | 9978/12384 [21:10:21<5:05:54, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.33s]
Epoch 1: 81%|████████ | 9979/12384 [21:10:21<5:05:22, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.33s]
Epoch 1: 81%|████████ | 9979/12384 [21:10:28<5:05:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 1: 81%|████████ | 9980/12384 [21:10:28<5:04:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 1: 81%|████████ | 9980/12384 [21:10:36<5:04:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 81%|████████ | 9981/12384 [21:10:36<5:04:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 81%|████████ | 9981/12384 [21:10:44<5:04:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 81%|████████ | 9982/12384 [21:10:44<5:04:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 81%|████████ | 9982/12384 [21:10:51<5:04:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 81%|████████ | 9983/12384 [21:10:51<5:04:17, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 81%|████████ | 9983/12384 [21:10:59<5:04:17, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 81%|████████ | 9984/12384 [21:10:59<5:04:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 81%|████████ | 9984/12384 [21:11:06<5:04:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.61s]
Epoch 1: 81%|████████ | 9985/12384 [21:11:06<5:04:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.61s]
Epoch 1: 81%|████████ | 9985/12384 [21:11:14<5:04:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 1: 81%|████████ | 9986/12384 [21:11:14<5:03:50, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 1: 81%|████████ | 9986/12384 [21:11:22<5:03:50, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 81%|████████ | 9987/12384 [21:11:22<5:04:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 81%|████████ | 9987/12384 [21:11:29<5:04:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 81%|████████ | 9988/12384 [21:11:29<5:03:41, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 81%|████████ | 9988/12384 [21:11:37<5:03:41, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 1: 81%|████████ | 9989/12384 [21:11:37<5:04:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 1: 81%|████████ | 9989/12384 [21:11:45<5:04:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 1: 81%|████████ | 9990/12384 [21:11:45<5:07:01, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 1: 81%|████████ | 9990/12384 [21:11:52<5:07:01, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.99s]
Epoch 1: 81%|████████ | 9991/12384 [21:11:52<5:05:57, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.99s]
Epoch 1: 81%|████████ | 9991/12384 [21:12:00<5:05:57, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.60s]
Epoch 1: 81%|████████ | 9992/12384 [21:12:00<5:05:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.60s]
Epoch 1: 81%|████████ | 9992/12384 [21:12:08<5:05:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 81%|████████ | 9993/12384 [21:12:08<5:04:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 81%|████████ | 9993/12384 [21:12:16<5:04:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.65s]
Epoch 1: 81%|████████ | 9994/12384 [21:12:16<5:08:21, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=4.65s]
Epoch 1: 81%|████████ | 9994/12384 [21:12:23<5:08:21, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=10.93s]
Epoch 1: 81%|████████ | 9995/12384 [21:12:23<5:06:28, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.93s]
Epoch 1: 81%|████████ | 9995/12384 [21:12:31<5:06:28, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 81%|████████ | 9996/12384 [21:12:31<5:05:18, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 81%|████████ | 9996/12384 [21:12:38<5:05:18, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 81%|████████ | 9997/12384 [21:12:38<5:04:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 81%|████████ | 9997/12384 [21:12:46<5:04:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 81%|████████ | 9998/12384 [21:12:46<5:03:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 81%|████████ | 9998/12384 [21:12:54<5:03:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 81%|████████ | 9999/12384 [21:12:54<5:03:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 81%|████████ | 9999/12384 [21:13:01<5:03:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 81%|████████ | 10000/12384 [21:13:01<5:03:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 81%|████████ | 10000/12384 [21:13:09<5:03:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.95s]
Epoch 1: 81%|████████ | 10001/12384 [21:13:09<5:03:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.95s]
Epoch 1: 81%|████████ | 10001/12384 [21:13:17<5:03:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 81%|████████ | 10002/12384 [21:13:17<5:02:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 81%|████████ | 10002/12384 [21:13:24<5:02:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 81%|████████ | 10003/12384 [21:13:24<5:02:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 81%|████████ | 10003/12384 [21:13:32<5:02:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 1: 81%|████████ | 10004/12384 [21:13:32<5:02:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 1: 81%|████████ | 10004/12384 [21:13:39<5:02:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 1: 81%|████████ | 10005/12384 [21:13:39<5:02:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 1: 81%|████████ | 10005/12384 [21:13:47<5:02:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 81%|████████ | 10006/12384 [21:13:47<5:01:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 81%|████████ | 10006/12384 [21:13:55<5:01:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 81%|████████ | 10007/12384 [21:13:55<5:01:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 81%|████████ | 10007/12384 [21:14:02<5:01:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 81%|████████ | 10008/12384 [21:14:02<5:01:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 81%|████████ | 10008/12384 [21:14:10<5:01:38, 7.62s/it, loss=0.0000, acc=0.9999, iter_time=7.66s]
Epoch 1: 81%|████████ | 10009/12384 [21:14:10<5:01:36, 7.62s/it, loss=0.0000, acc=0.9999, iter_time=7.66s]
Epoch 1: 81%|████████ | 10009/12384 [21:14:17<5:01:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 81%|████████ | 10010/12384 [21:14:17<5:01:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 81%|████████ | 10010/12384 [21:14:25<5:01:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 1: 81%|████████ | 10011/12384 [21:14:25<5:01:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 1: 81%|████████ | 10011/12384 [21:14:33<5:01:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.36s]
Epoch 1: 81%|████████ | 10012/12384 [21:14:33<5:00:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.36s]
Epoch 1: 81%|████████ | 10012/12384 [21:14:40<5:00:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.90s]
Epoch 1: 81%|████████ | 10013/12384 [21:14:40<5:00:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.90s]
Epoch 1: 81%|████████ | 10013/12384 [21:14:48<5:00:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.05s]
Epoch 1: 81%|████████ | 10014/12384 [21:14:48<5:00:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.05s]
Epoch 1: 81%|████████ | 10014/12384 [21:14:56<5:00:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.15s]
Epoch 1: 81%|████████ | 10015/12384 [21:14:56<5:00:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.15s]
Epoch 1: 81%|████████ | 10015/12384 [21:15:03<5:00:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 81%|████████ | 10016/12384 [21:15:03<5:00:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 81%|████████ | 10016/12384 [21:15:11<5:00:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 1: 81%|████████ | 10017/12384 [21:15:11<5:00:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 1: 81%|████████ | 10017/12384 [21:15:18<5:00:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.91s]
Epoch 1: 81%|████████ | 10018/12384 [21:15:18<5:00:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.91s]
Epoch 1: 81%|████████ | 10018/12384 [21:15:26<5:00:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 1: 81%|████████ | 10019/12384 [21:15:26<5:00:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 1: 81%|████████ | 10019/12384 [21:15:34<5:00:24, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.98s]
Epoch 1: 81%|████████ | 10020/12384 [21:15:34<5:00:00, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.98s]
Epoch 1: 81%|████████ | 10020/12384 [21:15:42<5:00:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 1: 81%|████████ | 10021/12384 [21:15:42<5:04:00, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 1: 81%|████████ | 10021/12384 [21:15:49<5:04:00, 7.72s/it, loss=0.0002, acc=1.0000, iter_time=7.92s]
Epoch 1: 81%|████████ | 10022/12384 [21:15:49<5:02:18, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=7.92s]
Epoch 1: 81%|████████ | 10022/12384 [21:15:57<5:02:18, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 81%|████████ | 10023/12384 [21:15:57<5:01:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 81%|████████ | 10023/12384 [21:16:04<5:01:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 81%|████████ | 10024/12384 [21:16:04<5:00:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 81%|████████ | 10024/12384 [21:16:12<5:00:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 81%|████████ | 10025/12384 [21:16:12<5:00:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 81%|████████ | 10025/12384 [21:16:20<5:00:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 81%|████████ | 10026/12384 [21:16:20<4:59:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 81%|████████ | 10026/12384 [21:16:27<4:59:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 81%|████████ | 10027/12384 [21:16:27<4:59:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 81%|████████ | 10027/12384 [21:16:35<4:59:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.26s]
Epoch 1: 81%|████████ | 10028/12384 [21:16:35<4:59:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.26s]
Epoch 1: 81%|████████ | 10028/12384 [21:16:42<4:59:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.95s]
Epoch 1: 81%|████████ | 10029/12384 [21:16:42<4:58:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.95s]
Epoch 1: 81%|████████ | 10029/12384 [21:16:50<4:58:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 1: 81%|████████ | 10030/12384 [21:16:50<4:58:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 1: 81%|████████ | 10030/12384 [21:16:58<4:58:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 1: 81%|████████ | 10031/12384 [21:16:58<4:58:10, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 1: 81%|████████ | 10031/12384 [21:17:05<4:58:10, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 81%|████████ | 10032/12384 [21:17:05<4:58:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 81%|████████ | 10032/12384 [21:17:13<4:58:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 81%|████████ | 10033/12384 [21:17:13<4:58:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 81%|████████ | 10033/12384 [21:17:20<4:58:07, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 1: 81%|████████ | 10034/12384 [21:17:20<4:58:08, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 1: 81%|████████ | 10034/12384 [21:17:28<4:58:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 81%|████████ | 10035/12384 [21:17:28<4:57:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 81%|████████ | 10035/12384 [21:17:36<4:57:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 81%|████████ | 10036/12384 [21:17:36<4:57:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 81%|████████ | 10036/12384 [21:17:43<4:57:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 81%|████████ | 10037/12384 [21:17:43<4:57:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 81%|████████ | 10037/12384 [21:17:51<4:57:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 81%|████████ | 10038/12384 [21:17:51<4:56:59, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 81%|████████ | 10038/12384 [21:17:58<4:56:59, 7.60s/it, loss=0.0002, acc=1.0000, iter_time=4.82s]
Epoch 1: 81%|████████ | 10039/12384 [21:17:58<4:57:06, 7.60s/it, loss=0.0002, acc=1.0000, iter_time=4.82s]
Epoch 1: 81%|████████ | 10039/12384 [21:18:06<4:57:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.35s]
Epoch 1: 81%|████████ | 10040/12384 [21:18:06<4:57:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.35s]
Epoch 1: 81%|████████ | 10040/12384 [21:18:14<4:57:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.54s]
Epoch 1: 81%|████████ | 10041/12384 [21:18:14<4:56:44, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.54s]
Epoch 1: 81%|████████ | 10041/12384 [21:18:21<4:56:44, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.48s]
Epoch 1: 81%|████████ | 10042/12384 [21:18:21<4:56:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.48s]
Epoch 1: 81%|████████ | 10042/12384 [21:18:29<4:56:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 1: 81%|████████ | 10043/12384 [21:18:29<4:56:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 1: 81%|████████ | 10043/12384 [21:18:36<4:56:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 1: 81%|████████ | 10044/12384 [21:18:36<4:56:31, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 1: 81%|████████ | 10044/12384 [21:18:44<4:56:31, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 1: 81%|████████ | 10045/12384 [21:18:44<4:56:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 1: 81%|████████ | 10045/12384 [21:18:52<4:56:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 81%|████████ | 10046/12384 [21:18:52<4:56:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 81%|████████ | 10046/12384 [21:19:00<4:56:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.52s]
Epoch 1: 81%|████████ | 10047/12384 [21:19:00<5:00:22, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.52s]
Epoch 1: 81%|████████ | 10047/12384 [21:19:07<5:00:22, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=11.42s]
Epoch 1: 81%|████████ | 10048/12384 [21:19:07<4:59:09, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=11.42s]
Epoch 1: 81%|████████ | 10048/12384 [21:19:15<4:59:09, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 81%|████████ | 10049/12384 [21:19:15<4:57:59, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 81%|████████ | 10049/12384 [21:19:23<4:57:59, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.03s]
Epoch 1: 81%|████████ | 10050/12384 [21:19:23<4:57:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.03s]
Epoch 1: 81%|████████ | 10050/12384 [21:19:30<4:57:23, 7.65s/it, loss=0.0005, acc=0.9981, iter_time=11.21s]
Epoch 1: 81%|████████ | 10051/12384 [21:19:30<4:56:54, 7.64s/it, loss=0.0005, acc=0.9981, iter_time=11.21s]
Epoch 1: 81%|████████ | 10051/12384 [21:19:38<4:56:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 81%|████████ | 10052/12384 [21:19:38<4:56:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 81%|████████ | 10052/12384 [21:19:45<4:56:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 81%|████████ | 10053/12384 [21:19:45<4:56:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 81%|████████ | 10053/12384 [21:19:53<4:56:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 81%|████████ | 10054/12384 [21:19:53<4:56:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 81%|████████ | 10054/12384 [21:20:01<4:56:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 1: 81%|████████ | 10055/12384 [21:20:01<4:55:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 1: 81%|████████ | 10055/12384 [21:20:08<4:55:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.95s]
Epoch 1: 81%|████████ | 10056/12384 [21:20:08<4:56:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.95s]
Epoch 1: 81%|████████ | 10056/12384 [21:20:16<4:56:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.28s]
Epoch 1: 81%|████████ | 10057/12384 [21:20:16<4:56:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.28s]
Epoch 1: 81%|████████ | 10057/12384 [21:20:24<4:56:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.00s]
Epoch 1: 81%|████████ | 10058/12384 [21:20:24<4:55:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.00s]
Epoch 1: 81%|████████ | 10058/12384 [21:20:31<4:55:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 1: 81%|████████ | 10059/12384 [21:20:31<4:55:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 1: 81%|████████ | 10059/12384 [21:20:39<4:55:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.49s]
Epoch 1: 81%|████████ | 10060/12384 [21:20:39<4:55:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.49s]
Epoch 1: 81%|████████ | 10060/12384 [21:20:46<4:55:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 81%|████████ | 10061/12384 [21:20:46<4:55:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 81%|████████ | 10061/12384 [21:20:54<4:55:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 81%|████████▏ | 10062/12384 [21:20:54<4:54:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 81%|████████▏ | 10062/12384 [21:21:02<4:54:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 1: 81%|████████▏ | 10063/12384 [21:21:02<4:54:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 1: 81%|████████▏ | 10063/12384 [21:21:09<4:54:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.63s]
Epoch 1: 81%|████████▏ | 10064/12384 [21:21:09<4:55:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.63s]
Epoch 1: 81%|████████▏ | 10064/12384 [21:21:17<4:55:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 81%|████████▏ | 10065/12384 [21:21:17<4:55:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 81%|████████▏ | 10065/12384 [21:21:24<4:55:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 81%|████████▏ | 10066/12384 [21:21:24<4:54:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 81%|████████▏ | 10066/12384 [21:21:32<4:54:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 81%|████████▏ | 10067/12384 [21:21:32<4:54:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 81%|████████▏ | 10067/12384 [21:21:40<4:54:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 1: 81%|████████▏ | 10068/12384 [21:21:40<4:53:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 1: 81%|████████▏ | 10068/12384 [21:21:47<4:53:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 81%|████████▏ | 10069/12384 [21:21:47<4:53:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 81%|████████▏ | 10069/12384 [21:21:55<4:53:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 1: 81%|████████▏ | 10070/12384 [21:21:55<4:53:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 1: 81%|████████▏ | 10070/12384 [21:22:03<4:53:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 81%|████████▏ | 10071/12384 [21:22:03<4:56:34, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 81%|████████▏ | 10071/12384 [21:22:10<4:56:34, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 81%|████████▏ | 10072/12384 [21:22:10<4:55:53, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 81%|████████▏ | 10072/12384 [21:22:18<4:55:53, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 81%|████████▏ | 10073/12384 [21:22:18<4:58:27, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 81%|████████▏ | 10073/12384 [21:22:26<4:58:27, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 81%|████████▏ | 10074/12384 [21:22:26<4:56:37, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 81%|████████▏ | 10074/12384 [21:22:34<4:56:37, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 81%|████████▏ | 10075/12384 [21:22:34<4:55:24, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 81%|████████▏ | 10075/12384 [21:22:41<4:55:24, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 81%|████████▏ | 10076/12384 [21:22:41<4:54:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 81%|████████▏ | 10076/12384 [21:22:49<4:54:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 81%|████████▏ | 10077/12384 [21:22:49<4:53:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 81%|████████▏ | 10077/12384 [21:22:56<4:53:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 81%|████████▏ | 10078/12384 [21:22:56<4:53:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 81%|████████▏ | 10078/12384 [21:23:04<4:53:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 81%|████████▏ | 10079/12384 [21:23:04<4:52:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 81%|████████▏ | 10079/12384 [21:23:12<4:52:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 81%|████████▏ | 10080/12384 [21:23:12<4:52:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 81%|████████▏ | 10080/12384 [21:23:19<4:52:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 1: 81%|████████▏ | 10081/12384 [21:23:19<4:52:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 1: 81%|████████▏ | 10081/12384 [21:23:27<4:52:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 81%|████████▏ | 10082/12384 [21:23:27<4:51:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 81%|████████▏ | 10082/12384 [21:23:34<4:51:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 1: 81%|████████▏ | 10083/12384 [21:23:34<4:52:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 1: 81%|████████▏ | 10083/12384 [21:23:42<4:52:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 81%|████████▏ | 10084/12384 [21:23:42<4:51:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 81%|████████▏ | 10084/12384 [21:23:50<4:51:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 81%|████████▏ | 10085/12384 [21:23:50<4:51:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 81%|████████▏ | 10085/12384 [21:23:57<4:51:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 81%|████████▏ | 10086/12384 [21:23:57<4:51:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 81%|████████▏ | 10086/12384 [21:24:05<4:51:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 1: 81%|████████▏ | 10087/12384 [21:24:05<4:51:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 1: 81%|████████▏ | 10087/12384 [21:24:12<4:51:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 1: 81%|████████▏ | 10088/12384 [21:24:12<4:51:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 1: 81%|████████▏ | 10088/12384 [21:24:20<4:51:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.52s]
Epoch 1: 81%|████████▏ | 10089/12384 [21:24:20<4:50:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.52s]
Epoch 1: 81%|████████▏ | 10089/12384 [21:24:28<4:50:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 1: 81%|████████▏ | 10090/12384 [21:24:28<4:50:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 1: 81%|████████▏ | 10090/12384 [21:24:35<4:50:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 1: 81%|████████▏ | 10091/12384 [21:24:35<4:50:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 1: 81%|████████▏ | 10091/12384 [21:24:43<4:50:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 81%|████████▏ | 10092/12384 [21:24:43<4:50:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 81%|████████▏ | 10092/12384 [21:24:50<4:50:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 82%|████████▏ | 10093/12384 [21:24:50<4:50:17, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 82%|████████▏ | 10093/12384 [21:24:58<4:50:17, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 82%|████████▏ | 10094/12384 [21:24:58<4:50:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 82%|████████▏ | 10094/12384 [21:25:06<4:50:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 82%|████████▏ | 10095/12384 [21:25:06<4:50:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 82%|████████▏ | 10095/12384 [21:25:14<4:50:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 1: 82%|████████▏ | 10096/12384 [21:25:14<4:53:18, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 1: 82%|████████▏ | 10096/12384 [21:25:21<4:53:18, 7.69s/it, loss=0.0001, acc=0.9992, iter_time=5.41s]
Epoch 1: 82%|████████▏ | 10097/12384 [21:25:21<4:52:14, 7.67s/it, loss=0.0001, acc=0.9992, iter_time=5.41s]
Epoch 1: 82%|████████▏ | 10097/12384 [21:25:29<4:52:14, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 82%|████████▏ | 10098/12384 [21:25:29<4:51:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 82%|████████▏ | 10098/12384 [21:25:37<4:51:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 82%|████████▏ | 10099/12384 [21:25:37<4:54:21, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 82%|████████▏ | 10099/12384 [21:25:44<4:54:21, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 82%|████████▏ | 10100/12384 [21:25:44<4:53:56, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 82%|████████▏ | 10100/12384 [21:25:52<4:53:56, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 1: 82%|████████▏ | 10101/12384 [21:25:52<4:53:11, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 1: 82%|████████▏ | 10101/12384 [21:26:00<4:53:11, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.94s]
Epoch 1: 82%|████████▏ | 10102/12384 [21:26:00<4:52:02, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.94s]
Epoch 1: 82%|████████▏ | 10102/12384 [21:26:07<4:52:02, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.41s]
Epoch 1: 82%|████████▏ | 10103/12384 [21:26:07<4:51:20, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.41s]
Epoch 1: 82%|████████▏ | 10103/12384 [21:26:15<4:51:20, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 82%|████████▏ | 10104/12384 [21:26:15<4:50:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 82%|████████▏ | 10104/12384 [21:26:23<4:50:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.68s]
Epoch 1: 82%|████████▏ | 10105/12384 [21:26:23<4:49:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.68s]
Epoch 1: 82%|████████▏ | 10105/12384 [21:26:30<4:49:39, 7.63s/it, loss=0.0001, acc=0.9995, iter_time=9.10s]
Epoch 1: 82%|████████▏ | 10106/12384 [21:26:30<4:49:18, 7.62s/it, loss=0.0001, acc=0.9995, iter_time=9.10s]
Epoch 1: 82%|████████▏ | 10106/12384 [21:26:38<4:49:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 82%|████████▏ | 10107/12384 [21:26:38<4:49:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 82%|████████▏ | 10107/12384 [21:26:45<4:49:06, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=7.62s]
Epoch 1: 82%|████████▏ | 10108/12384 [21:26:45<4:49:30, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.62s]
Epoch 1: 82%|████████▏ | 10108/12384 [21:26:53<4:49:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 1: 82%|████████▏ | 10109/12384 [21:26:53<4:49:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 1: 82%|████████▏ | 10109/12384 [21:27:01<4:49:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.43s]
Epoch 1: 82%|████████▏ | 10110/12384 [21:27:01<4:49:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.43s]
Epoch 1: 82%|████████▏ | 10110/12384 [21:27:08<4:49:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 1: 82%|████████▏ | 10111/12384 [21:27:08<4:48:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 1: 82%|████████▏ | 10111/12384 [21:27:16<4:48:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 82%|████████▏ | 10112/12384 [21:27:16<4:48:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 82%|████████▏ | 10112/12384 [21:27:24<4:48:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.31s]
Epoch 1: 82%|████████▏ | 10113/12384 [21:27:24<4:48:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.31s]
Epoch 1: 82%|████████▏ | 10113/12384 [21:27:31<4:48:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 82%|████████▏ | 10114/12384 [21:27:31<4:47:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 82%|████████▏ | 10114/12384 [21:27:39<4:47:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 1: 82%|████████▏ | 10115/12384 [21:27:39<4:47:34, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 1: 82%|████████▏ | 10115/12384 [21:27:46<4:47:34, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 82%|████████▏ | 10116/12384 [21:27:47<4:50:06, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 82%|████████▏ | 10116/12384 [21:27:54<4:50:06, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.45s]
Epoch 1: 82%|████████▏ | 10117/12384 [21:27:54<4:49:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.45s]
Epoch 1: 82%|████████▏ | 10117/12384 [21:28:02<4:49:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=2.97s]
Epoch 1: 82%|████████▏ | 10118/12384 [21:28:02<4:48:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=2.97s]
Epoch 1: 82%|████████▏ | 10118/12384 [21:28:09<4:48:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=12.25s]
Epoch 1: 82%|████████▏ | 10119/12384 [21:28:09<4:48:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=12.25s]
Epoch 1: 82%|████████▏ | 10119/12384 [21:28:17<4:48:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 82%|████████▏ | 10120/12384 [21:28:17<4:48:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 82%|████████▏ | 10120/12384 [21:28:25<4:48:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 1: 82%|████████▏ | 10121/12384 [21:28:25<4:48:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 1: 82%|████████▏ | 10121/12384 [21:28:32<4:48:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 1: 82%|████████▏ | 10122/12384 [21:28:32<4:47:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 1: 82%|████████▏ | 10122/12384 [21:28:40<4:47:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 1: 82%|████████▏ | 10123/12384 [21:28:40<4:48:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 1: 82%|████████▏ | 10123/12384 [21:28:48<4:48:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 82%|████████▏ | 10124/12384 [21:28:48<4:47:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 82%|████████▏ | 10124/12384 [21:28:56<4:47:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 82%|████████▏ | 10125/12384 [21:28:56<4:52:09, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 82%|████████▏ | 10125/12384 [21:29:03<4:52:09, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 82%|████████▏ | 10126/12384 [21:29:03<4:50:31, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 82%|████████▏ | 10126/12384 [21:29:11<4:50:31, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 82%|████████▏ | 10127/12384 [21:29:11<4:49:56, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 82%|████████▏ | 10127/12384 [21:29:19<4:49:56, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 82%|████████▏ | 10128/12384 [21:29:19<4:49:07, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 82%|████████▏ | 10128/12384 [21:29:26<4:49:07, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 1: 82%|████████▏ | 10129/12384 [21:29:26<4:49:28, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 1: 82%|████████▏ | 10129/12384 [21:29:34<4:49:28, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.66s]
Epoch 1: 82%|████████▏ | 10130/12384 [21:29:34<4:48:39, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.66s]
Epoch 1: 82%|████████▏ | 10130/12384 [21:29:42<4:48:39, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 82%|████████▏ | 10131/12384 [21:29:42<4:48:13, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 82%|████████▏ | 10131/12384 [21:29:49<4:48:13, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 82%|████████▏ | 10132/12384 [21:29:49<4:47:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 82%|████████▏ | 10132/12384 [21:29:57<4:47:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 82%|████████▏ | 10133/12384 [21:29:57<4:46:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 82%|████████▏ | 10133/12384 [21:30:05<4:46:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 82%|████████▏ | 10134/12384 [21:30:05<4:47:01, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 82%|████████▏ | 10134/12384 [21:30:12<4:47:01, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 1: 82%|████████▏ | 10135/12384 [21:30:12<4:46:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 1: 82%|████████▏ | 10135/12384 [21:30:20<4:46:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 82%|████████▏ | 10136/12384 [21:30:20<4:46:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 82%|████████▏ | 10136/12384 [21:30:27<4:46:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 1: 82%|████████▏ | 10137/12384 [21:30:27<4:45:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 1: 82%|████████▏ | 10137/12384 [21:30:35<4:45:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.75s]
Epoch 1: 82%|████████▏ | 10138/12384 [21:30:35<4:44:40, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.75s]
Epoch 1: 82%|████████▏ | 10138/12384 [21:30:43<4:44:40, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.96s]
Epoch 1: 82%|████████▏ | 10139/12384 [21:30:43<4:44:27, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.96s]
Epoch 1: 82%|████████▏ | 10139/12384 [21:30:50<4:44:27, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 1: 82%|████████▏ | 10140/12384 [21:30:50<4:44:23, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 1: 82%|████████▏ | 10140/12384 [21:30:58<4:44:23, 7.60s/it, loss=0.0002, acc=0.9976, iter_time=7.61s]
Epoch 1: 82%|████████▏ | 10141/12384 [21:30:58<4:44:35, 7.61s/it, loss=0.0002, acc=0.9976, iter_time=7.61s]
Epoch 1: 82%|████████▏ | 10141/12384 [21:31:05<4:44:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 82%|████████▏ | 10142/12384 [21:31:05<4:44:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 82%|████████▏ | 10142/12384 [21:31:13<4:44:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 82%|████████▏ | 10143/12384 [21:31:13<4:44:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 82%|████████▏ | 10143/12384 [21:31:21<4:44:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 82%|████████▏ | 10144/12384 [21:31:21<4:45:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 82%|████████▏ | 10144/12384 [21:31:28<4:45:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 1: 82%|████████▏ | 10145/12384 [21:31:28<4:45:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 1: 82%|████████▏ | 10145/12384 [21:31:36<4:45:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 1: 82%|████████▏ | 10146/12384 [21:31:36<4:44:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 1: 82%|████████▏ | 10146/12384 [21:31:44<4:44:47, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=11.01s]
Epoch 1: 82%|████████▏ | 10147/12384 [21:31:44<4:45:33, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=11.01s]
Epoch 1: 82%|████████▏ | 10147/12384 [21:31:51<4:45:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.08s]
Epoch 1: 82%|████████▏ | 10148/12384 [21:31:51<4:44:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.08s]
Epoch 1: 82%|████████▏ | 10148/12384 [21:31:59<4:44:55, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=5.64s]
Epoch 1: 82%|████████▏ | 10149/12384 [21:31:59<4:44:29, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=5.64s]
Epoch 1: 82%|████████▏ | 10149/12384 [21:32:07<4:44:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.25s]
Epoch 1: 82%|████████▏ | 10150/12384 [21:32:07<4:44:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.25s]
Epoch 1: 82%|████████▏ | 10150/12384 [21:32:14<4:44:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 1: 82%|████████▏ | 10151/12384 [21:32:14<4:43:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 1: 82%|████████▏ | 10151/12384 [21:32:22<4:43:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.25s]
Epoch 1: 82%|████████▏ | 10152/12384 [21:32:22<4:47:02, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.25s]
Epoch 1: 82%|████████▏ | 10152/12384 [21:32:30<4:47:02, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.44s]
Epoch 1: 82%|████████▏ | 10153/12384 [21:32:30<4:45:39, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.44s]
Epoch 1: 82%|████████▏ | 10153/12384 [21:32:37<4:45:39, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.63s]
Epoch 1: 82%|████████▏ | 10154/12384 [21:32:37<4:44:41, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.63s]
Epoch 1: 82%|████████▏ | 10154/12384 [21:32:45<4:44:41, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 1: 82%|████████▏ | 10155/12384 [21:32:45<4:43:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 1: 82%|████████▏ | 10155/12384 [21:32:53<4:43:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 1: 82%|████████▏ | 10156/12384 [21:32:53<4:43:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 1: 82%|████████▏ | 10156/12384 [21:33:00<4:43:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 1: 82%|████████▏ | 10157/12384 [21:33:00<4:43:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 1: 82%|████████▏ | 10157/12384 [21:33:08<4:43:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 1: 82%|████████▏ | 10158/12384 [21:33:08<4:42:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 1: 82%|████████▏ | 10158/12384 [21:33:15<4:42:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 82%|████████▏ | 10159/12384 [21:33:15<4:42:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 82%|████████▏ | 10159/12384 [21:33:23<4:42:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 82%|████████▏ | 10160/12384 [21:33:23<4:41:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 82%|████████▏ | 10160/12384 [21:33:31<4:41:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 82%|████████▏ | 10161/12384 [21:33:31<4:41:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 82%|████████▏ | 10161/12384 [21:33:38<4:41:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 1: 82%|████████▏ | 10162/12384 [21:33:38<4:41:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 1: 82%|████████▏ | 10162/12384 [21:33:46<4:41:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 1: 82%|████████▏ | 10163/12384 [21:33:46<4:41:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 1: 82%|████████▏ | 10163/12384 [21:33:53<4:41:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 82%|████████▏ | 10164/12384 [21:33:53<4:41:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 82%|████████▏ | 10164/12384 [21:34:01<4:41:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 82%|████████▏ | 10165/12384 [21:34:01<4:40:58, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 82%|████████▏ | 10165/12384 [21:34:09<4:40:58, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 82%|████████▏ | 10166/12384 [21:34:09<4:41:02, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 82%|████████▏ | 10166/12384 [21:34:16<4:41:02, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 82%|████████▏ | 10167/12384 [21:34:16<4:41:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 82%|████████▏ | 10167/12384 [21:34:24<4:41:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 82%|████████▏ | 10168/12384 [21:34:24<4:41:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 82%|████████▏ | 10168/12384 [21:34:31<4:41:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 82%|████████▏ | 10169/12384 [21:34:31<4:40:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 82%|████████▏ | 10169/12384 [21:34:39<4:40:49, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 82%|████████▏ | 10170/12384 [21:34:39<4:40:53, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 82%|████████▏ | 10170/12384 [21:34:47<4:40:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 82%|████████▏ | 10171/12384 [21:34:47<4:40:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 82%|████████▏ | 10171/12384 [21:34:54<4:40:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 82%|████████▏ | 10172/12384 [21:34:54<4:40:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 82%|████████▏ | 10172/12384 [21:35:02<4:40:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 82%|████████▏ | 10173/12384 [21:35:02<4:40:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 82%|████████▏ | 10173/12384 [21:35:09<4:40:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 82%|████████▏ | 10174/12384 [21:35:09<4:40:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 82%|████████▏ | 10174/12384 [21:35:17<4:40:21, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 1: 82%|████████▏ | 10175/12384 [21:35:17<4:40:33, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 1: 82%|████████▏ | 10175/12384 [21:35:25<4:40:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.34s]
Epoch 1: 82%|████████▏ | 10176/12384 [21:35:25<4:43:45, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.34s]
Epoch 1: 82%|████████▏ | 10176/12384 [21:35:33<4:43:45, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 82%|████████▏ | 10177/12384 [21:35:33<4:42:52, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 82%|████████▏ | 10177/12384 [21:35:41<4:42:52, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.90s]
Epoch 1: 82%|████████▏ | 10178/12384 [21:35:41<4:45:36, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=4.90s]
Epoch 1: 82%|████████▏ | 10178/12384 [21:35:48<4:45:36, 7.77s/it, loss=0.0002, acc=1.0000, iter_time=10.70s]
Epoch 1: 82%|████████▏ | 10179/12384 [21:35:48<4:43:29, 7.71s/it, loss=0.0002, acc=1.0000, iter_time=10.70s]
Epoch 1: 82%|████████▏ | 10179/12384 [21:35:56<4:43:29, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=5.82s]
Epoch 1: 82%|████████▏ | 10180/12384 [21:35:56<4:42:09, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=5.82s]
Epoch 1: 82%|████████▏ | 10180/12384 [21:36:03<4:42:09, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 1: 82%|████████▏ | 10181/12384 [21:36:03<4:41:07, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 1: 82%|████████▏ | 10181/12384 [21:36:11<4:41:07, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.00s]
Epoch 1: 82%|████████▏ | 10182/12384 [21:36:11<4:40:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.00s]
Epoch 1: 82%|████████▏ | 10182/12384 [21:36:19<4:40:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.17s]
Epoch 1: 82%|████████▏ | 10183/12384 [21:36:19<4:39:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.17s]
Epoch 1: 82%|████████▏ | 10183/12384 [21:36:26<4:39:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 82%|████████▏ | 10184/12384 [21:36:26<4:40:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 82%|████████▏ | 10184/12384 [21:36:34<4:40:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 82%|████████▏ | 10185/12384 [21:36:34<4:39:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 82%|████████▏ | 10185/12384 [21:36:41<4:39:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 82%|████████▏ | 10186/12384 [21:36:41<4:39:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 82%|████████▏ | 10186/12384 [21:36:49<4:39:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 82%|████████▏ | 10187/12384 [21:36:49<4:39:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 82%|████████▏ | 10187/12384 [21:36:57<4:39:36, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 82%|████████▏ | 10188/12384 [21:36:57<4:39:12, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 82%|████████▏ | 10188/12384 [21:37:04<4:39:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 82%|████████▏ | 10189/12384 [21:37:04<4:38:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 82%|████████▏ | 10189/12384 [21:37:12<4:38:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 82%|████████▏ | 10190/12384 [21:37:12<4:38:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 82%|████████▏ | 10190/12384 [21:37:20<4:38:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 82%|████████▏ | 10191/12384 [21:37:20<4:38:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 82%|████████▏ | 10191/12384 [21:37:27<4:38:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 82%|████████▏ | 10192/12384 [21:37:27<4:38:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 82%|████████▏ | 10192/12384 [21:37:35<4:38:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 82%|████████▏ | 10193/12384 [21:37:35<4:39:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 82%|████████▏ | 10193/12384 [21:37:43<4:39:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 1: 82%|████████▏ | 10194/12384 [21:37:43<4:38:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 1: 82%|████████▏ | 10194/12384 [21:37:50<4:38:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.95s]
Epoch 1: 82%|████████▏ | 10195/12384 [21:37:50<4:38:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.95s]
Epoch 1: 82%|████████▏ | 10195/12384 [21:37:58<4:38:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.58s]
Epoch 1: 82%|████████▏ | 10196/12384 [21:37:58<4:37:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.58s]
Epoch 1: 82%|████████▏ | 10196/12384 [21:38:05<4:37:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 82%|████████▏ | 10197/12384 [21:38:05<4:37:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 82%|████████▏ | 10197/12384 [21:38:13<4:37:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 82%|████████▏ | 10198/12384 [21:38:13<4:37:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 82%|████████▏ | 10198/12384 [21:38:21<4:37:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 82%|████████▏ | 10199/12384 [21:38:21<4:37:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 82%|████████▏ | 10199/12384 [21:38:28<4:37:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 82%|████████▏ | 10200/12384 [21:38:28<4:37:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 82%|████████▏ | 10200/12384 [21:38:36<4:37:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 1: 82%|████████▏ | 10201/12384 [21:38:36<4:36:33, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 1: 82%|████████▏ | 10201/12384 [21:38:44<4:36:33, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 1: 82%|████████▏ | 10202/12384 [21:38:44<4:39:37, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 1: 82%|████████▏ | 10202/12384 [21:38:51<4:39:37, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 82%|████████▏ | 10203/12384 [21:38:51<4:38:31, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 82%|████████▏ | 10203/12384 [21:38:59<4:38:31, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=3.17s]
Epoch 1: 82%|████████▏ | 10204/12384 [21:38:59<4:38:47, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=3.17s]
Epoch 1: 82%|████████▏ | 10204/12384 [21:39:07<4:38:47, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=12.13s]
Epoch 1: 82%|████████▏ | 10205/12384 [21:39:07<4:41:29, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=12.13s]
Epoch 1: 82%|████████▏ | 10205/12384 [21:39:15<4:41:29, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=4.17s]
Epoch 1: 82%|████████▏ | 10206/12384 [21:39:15<4:39:57, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.17s]
Epoch 1: 82%|████████▏ | 10206/12384 [21:39:22<4:39:57, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=11.36s]
Epoch 1: 82%|████████▏ | 10207/12384 [21:39:22<4:38:45, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=11.36s]
Epoch 1: 82%|████████▏ | 10207/12384 [21:39:30<4:38:45, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 82%|████████▏ | 10208/12384 [21:39:30<4:38:54, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 82%|████████▏ | 10208/12384 [21:39:37<4:38:54, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 82%|████████▏ | 10209/12384 [21:39:37<4:37:37, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 82%|████████▏ | 10209/12384 [21:39:45<4:37:37, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 1: 82%|████████▏ | 10210/12384 [21:39:45<4:37:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 1: 82%|████████▏ | 10210/12384 [21:39:53<4:37:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 1: 82%|████████▏ | 10211/12384 [21:39:53<4:36:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 1: 82%|████████▏ | 10211/12384 [21:40:00<4:36:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 82%|████████▏ | 10212/12384 [21:40:00<4:35:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 82%|████████▏ | 10212/12384 [21:40:08<4:35:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 82%|████████▏ | 10213/12384 [21:40:08<4:35:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 82%|████████▏ | 10213/12384 [21:40:15<4:35:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 82%|████████▏ | 10214/12384 [21:40:15<4:35:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 82%|████████▏ | 10214/12384 [21:40:23<4:35:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 1: 82%|████████▏ | 10215/12384 [21:40:23<4:35:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 1: 82%|████████▏ | 10215/12384 [21:40:31<4:35:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.17s]
Epoch 1: 82%|████████▏ | 10216/12384 [21:40:31<4:35:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.17s]
Epoch 1: 82%|████████▏ | 10216/12384 [21:40:38<4:35:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.87s]
Epoch 1: 83%|████████▎ | 10217/12384 [21:40:38<4:34:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.87s]
Epoch 1: 83%|████████▎ | 10217/12384 [21:40:46<4:34:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 1: 83%|████████▎ | 10218/12384 [21:40:46<4:34:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 1: 83%|████████▎ | 10218/12384 [21:40:54<4:34:42, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.76s]
Epoch 1: 83%|████████▎ | 10219/12384 [21:40:54<4:34:58, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.76s]
Epoch 1: 83%|████████▎ | 10219/12384 [21:41:01<4:34:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 1: 83%|████████▎ | 10220/12384 [21:41:01<4:34:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 1: 83%|████████▎ | 10220/12384 [21:41:09<4:34:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 83%|████████▎ | 10221/12384 [21:41:09<4:34:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 83%|████████▎ | 10221/12384 [21:41:16<4:34:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 1: 83%|████████▎ | 10222/12384 [21:41:16<4:34:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 1: 83%|████████▎ | 10222/12384 [21:41:24<4:34:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 83%|████████▎ | 10223/12384 [21:41:24<4:34:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 83%|████████▎ | 10223/12384 [21:41:32<4:34:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 1: 83%|████████▎ | 10224/12384 [21:41:32<4:35:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 1: 83%|████████▎ | 10224/12384 [21:41:39<4:35:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 83%|████████▎ | 10225/12384 [21:41:39<4:34:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 83%|████████▎ | 10225/12384 [21:41:47<4:34:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 83%|████████▎ | 10226/12384 [21:41:47<4:34:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 83%|████████▎ | 10226/12384 [21:41:55<4:34:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 83%|████████▎ | 10227/12384 [21:41:55<4:34:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 83%|████████▎ | 10227/12384 [21:42:02<4:34:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 83%|████████▎ | 10228/12384 [21:42:02<4:33:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 83%|████████▎ | 10228/12384 [21:42:10<4:33:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 83%|████████▎ | 10229/12384 [21:42:10<4:36:38, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 83%|████████▎ | 10229/12384 [21:42:18<4:36:38, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 1: 83%|████████▎ | 10230/12384 [21:42:18<4:35:18, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 1: 83%|████████▎ | 10230/12384 [21:42:26<4:35:18, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.86s]
Epoch 1: 83%|████████▎ | 10231/12384 [21:42:26<4:37:52, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.86s]
Epoch 1: 83%|████████▎ | 10231/12384 [21:42:33<4:37:52, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 1: 83%|████████▎ | 10232/12384 [21:42:33<4:36:16, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 1: 83%|████████▎ | 10232/12384 [21:42:41<4:36:16, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 83%|████████▎ | 10233/12384 [21:42:41<4:34:58, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 83%|████████▎ | 10233/12384 [21:42:48<4:34:58, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 83%|████████▎ | 10234/12384 [21:42:48<4:34:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 83%|████████▎ | 10234/12384 [21:42:56<4:34:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.69s]
Epoch 1: 83%|████████▎ | 10235/12384 [21:42:56<4:33:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.69s]
Epoch 1: 83%|████████▎ | 10235/12384 [21:43:04<4:33:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 1: 83%|████████▎ | 10236/12384 [21:43:04<4:32:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 1: 83%|████████▎ | 10236/12384 [21:43:11<4:32:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.24s]
Epoch 1: 83%|████████▎ | 10237/12384 [21:43:11<4:32:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.24s]
Epoch 1: 83%|████████▎ | 10237/12384 [21:43:19<4:32:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.62s]
Epoch 1: 83%|████████▎ | 10238/12384 [21:43:19<4:33:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.62s]
Epoch 1: 83%|████████▎ | 10238/12384 [21:43:26<4:33:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 83%|████████▎ | 10239/12384 [21:43:26<4:32:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 83%|████████▎ | 10239/12384 [21:43:34<4:32:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 83%|████████▎ | 10240/12384 [21:43:34<4:32:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 83%|████████▎ | 10240/12384 [21:43:42<4:32:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 83%|████████▎ | 10241/12384 [21:43:42<4:31:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 83%|████████▎ | 10241/12384 [21:43:49<4:31:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 1: 83%|████████▎ | 10242/12384 [21:43:49<4:31:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 1: 83%|████████▎ | 10242/12384 [21:43:57<4:31:32, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.29s]
Epoch 1: 83%|████████▎ | 10243/12384 [21:43:57<4:31:20, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=8.29s]
Epoch 1: 83%|████████▎ | 10243/12384 [21:44:04<4:31:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 1: 83%|████████▎ | 10244/12384 [21:44:04<4:31:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 1: 83%|████████▎ | 10244/12384 [21:44:12<4:31:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 83%|████████▎ | 10245/12384 [21:44:12<4:31:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 83%|████████▎ | 10245/12384 [21:44:20<4:31:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 83%|████████▎ | 10246/12384 [21:44:20<4:30:58, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 83%|████████▎ | 10246/12384 [21:44:27<4:30:58, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 1: 83%|████████▎ | 10247/12384 [21:44:27<4:30:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 1: 83%|████████▎ | 10247/12384 [21:44:35<4:30:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.56s]
Epoch 1: 83%|████████▎ | 10248/12384 [21:44:35<4:30:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.56s]
Epoch 1: 83%|████████▎ | 10248/12384 [21:44:42<4:30:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 1: 83%|████████▎ | 10249/12384 [21:44:42<4:30:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 1: 83%|████████▎ | 10249/12384 [21:44:50<4:30:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 1: 83%|████████▎ | 10250/12384 [21:44:50<4:30:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 1: 83%|████████▎ | 10250/12384 [21:44:58<4:30:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 83%|████████▎ | 10251/12384 [21:44:58<4:30:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 83%|████████▎ | 10251/12384 [21:45:05<4:30:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 83%|████████▎ | 10252/12384 [21:45:05<4:30:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 83%|████████▎ | 10252/12384 [21:45:13<4:30:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 83%|████████▎ | 10253/12384 [21:45:13<4:30:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 83%|████████▎ | 10253/12384 [21:45:21<4:30:16, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=5.51s]
Epoch 1: 83%|████████▎ | 10254/12384 [21:45:21<4:30:13, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=5.51s]
Epoch 1: 83%|████████▎ | 10254/12384 [21:45:28<4:30:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.00s]
Epoch 1: 83%|████████▎ | 10255/12384 [21:45:28<4:32:59, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.00s]
Epoch 1: 83%|████████▎ | 10255/12384 [21:45:36<4:32:59, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 83%|████████▎ | 10256/12384 [21:45:36<4:32:07, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 83%|████████▎ | 10256/12384 [21:45:44<4:32:07, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 83%|████████▎ | 10257/12384 [21:45:44<4:34:46, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 83%|████████▎ | 10257/12384 [21:45:52<4:34:46, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 83%|████████▎ | 10258/12384 [21:45:52<4:33:14, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 83%|████████▎ | 10258/12384 [21:45:59<4:33:14, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 1: 83%|████████▎ | 10259/12384 [21:45:59<4:31:52, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 1: 83%|████████▎ | 10259/12384 [21:46:07<4:31:52, 7.68s/it, loss=0.0003, acc=0.9992, iter_time=8.20s]
Epoch 1: 83%|████████▎ | 10260/12384 [21:46:07<4:31:07, 7.66s/it, loss=0.0003, acc=0.9992, iter_time=8.20s]
Epoch 1: 83%|████████▎ | 10260/12384 [21:46:14<4:31:07, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 83%|████████▎ | 10261/12384 [21:46:14<4:30:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 83%|████████▎ | 10261/12384 [21:46:22<4:30:28, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 83%|████████▎ | 10262/12384 [21:46:22<4:30:05, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 83%|████████▎ | 10262/12384 [21:46:30<4:30:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 83%|████████▎ | 10263/12384 [21:46:30<4:29:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 83%|████████▎ | 10263/12384 [21:46:37<4:29:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 83%|████████▎ | 10264/12384 [21:46:37<4:29:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 83%|████████▎ | 10264/12384 [21:46:45<4:29:19, 7.62s/it, loss=0.0012, acc=0.9984, iter_time=7.20s]
Epoch 1: 83%|████████▎ | 10265/12384 [21:46:45<4:29:11, 7.62s/it, loss=0.0012, acc=0.9984, iter_time=7.20s]
Epoch 1: 83%|████████▎ | 10265/12384 [21:46:52<4:29:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 83%|████████▎ | 10266/12384 [21:46:52<4:29:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 83%|████████▎ | 10266/12384 [21:47:00<4:29:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 83%|████████▎ | 10267/12384 [21:47:00<4:28:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 83%|████████▎ | 10267/12384 [21:47:08<4:28:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 83%|████████▎ | 10268/12384 [21:47:08<4:28:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 83%|████████▎ | 10268/12384 [21:47:15<4:28:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 83%|████████▎ | 10269/12384 [21:47:15<4:28:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 83%|████████▎ | 10269/12384 [21:47:23<4:28:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 83%|████████▎ | 10270/12384 [21:47:23<4:28:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 83%|████████▎ | 10270/12384 [21:47:31<4:28:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 83%|████████▎ | 10271/12384 [21:47:31<4:27:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 83%|████████▎ | 10271/12384 [21:47:38<4:27:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 83%|████████▎ | 10272/12384 [21:47:38<4:27:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 83%|████████▎ | 10272/12384 [21:47:46<4:27:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.45s]
Epoch 1: 83%|████████▎ | 10273/12384 [21:47:46<4:27:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.45s]
Epoch 1: 83%|████████▎ | 10273/12384 [21:47:53<4:27:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 1: 83%|████████▎ | 10274/12384 [21:47:53<4:27:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 1: 83%|████████▎ | 10274/12384 [21:48:01<4:27:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 1: 83%|████████▎ | 10275/12384 [21:48:01<4:27:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 1: 83%|████████▎ | 10275/12384 [21:48:09<4:27:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 83%|████████▎ | 10276/12384 [21:48:09<4:28:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 83%|████████▎ | 10276/12384 [21:48:16<4:28:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 1: 83%|████████▎ | 10277/12384 [21:48:16<4:28:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 1: 83%|████████▎ | 10277/12384 [21:48:24<4:28:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 1: 83%|████████▎ | 10278/12384 [21:48:24<4:27:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 1: 83%|████████▎ | 10278/12384 [21:48:32<4:27:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 1: 83%|████████▎ | 10279/12384 [21:48:32<4:27:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 1: 83%|████████▎ | 10279/12384 [21:48:39<4:27:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 83%|████████▎ | 10280/12384 [21:48:39<4:27:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 83%|████████▎ | 10280/12384 [21:48:47<4:27:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 83%|████████▎ | 10281/12384 [21:48:47<4:30:10, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 83%|████████▎ | 10281/12384 [21:48:55<4:30:10, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 1: 83%|████████▎ | 10282/12384 [21:48:55<4:29:05, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 1: 83%|████████▎ | 10282/12384 [21:49:03<4:29:05, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 1: 83%|████████▎ | 10283/12384 [21:49:03<4:31:14, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 1: 83%|████████▎ | 10283/12384 [21:49:10<4:31:14, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=9.25s]
Epoch 1: 83%|████████▎ | 10284/12384 [21:49:10<4:29:45, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.25s]
Epoch 1: 83%|████████▎ | 10284/12384 [21:49:18<4:29:45, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 83%|████████▎ | 10285/12384 [21:49:18<4:28:38, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 83%|████████▎ | 10285/12384 [21:49:25<4:28:38, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 83%|████████▎ | 10286/12384 [21:49:25<4:27:41, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 83%|████████▎ | 10286/12384 [21:49:33<4:27:41, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 83%|████████▎ | 10287/12384 [21:49:33<4:26:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 83%|████████▎ | 10287/12384 [21:49:41<4:26:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 83%|████████▎ | 10288/12384 [21:49:41<4:26:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 83%|████████▎ | 10288/12384 [21:49:48<4:26:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.92s]
Epoch 1: 83%|████████▎ | 10289/12384 [21:49:48<4:26:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.92s]
Epoch 1: 83%|████████▎ | 10289/12384 [21:49:56<4:26:09, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.72s]
Epoch 1: 83%|████████▎ | 10290/12384 [21:49:56<4:25:52, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.72s]
Epoch 1: 83%|████████▎ | 10290/12384 [21:50:03<4:25:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 1: 83%|████████▎ | 10291/12384 [21:50:03<4:25:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 1: 83%|████████▎ | 10291/12384 [21:50:11<4:25:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.45s]
Epoch 1: 83%|████████▎ | 10292/12384 [21:50:11<4:25:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.45s]
Epoch 1: 83%|████████▎ | 10292/12384 [21:50:19<4:25:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 1: 83%|████████▎ | 10293/12384 [21:50:19<4:25:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 1: 83%|████████▎ | 10293/12384 [21:50:26<4:25:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 83%|████████▎ | 10294/12384 [21:50:26<4:25:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 83%|████████▎ | 10294/12384 [21:50:34<4:25:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 83%|████████▎ | 10295/12384 [21:50:34<4:25:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 83%|████████▎ | 10295/12384 [21:50:41<4:25:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 83%|████████▎ | 10296/12384 [21:50:41<4:24:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 83%|████████▎ | 10296/12384 [21:50:49<4:24:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 83%|████████▎ | 10297/12384 [21:50:49<4:24:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 83%|████████▎ | 10297/12384 [21:50:57<4:24:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 83%|████████▎ | 10298/12384 [21:50:57<4:24:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 83%|████████▎ | 10298/12384 [21:51:04<4:24:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 83%|████████▎ | 10299/12384 [21:51:04<4:25:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 83%|████████▎ | 10299/12384 [21:51:12<4:25:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.58s]
Epoch 1: 83%|████████▎ | 10300/12384 [21:51:12<4:25:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.58s]
Epoch 1: 83%|████████▎ | 10300/12384 [21:51:20<4:25:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.72s]
Epoch 1: 83%|████████▎ | 10301/12384 [21:51:20<4:24:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.72s]
Epoch 1: 83%|████████▎ | 10301/12384 [21:51:27<4:24:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 83%|████████▎ | 10302/12384 [21:51:27<4:24:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 83%|████████▎ | 10302/12384 [21:51:35<4:24:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 83%|████████▎ | 10303/12384 [21:51:35<4:24:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 83%|████████▎ | 10303/12384 [21:51:42<4:24:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 83%|████████▎ | 10304/12384 [21:51:42<4:24:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 83%|████████▎ | 10304/12384 [21:51:50<4:24:06, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=4.16s]
Epoch 1: 83%|████████▎ | 10305/12384 [21:51:50<4:24:04, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=4.16s]
Epoch 1: 83%|████████▎ | 10305/12384 [21:51:58<4:24:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 1: 83%|████████▎ | 10306/12384 [21:51:58<4:23:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 1: 83%|████████▎ | 10306/12384 [21:52:05<4:23:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 83%|████████▎ | 10307/12384 [21:52:05<4:23:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 83%|████████▎ | 10307/12384 [21:52:13<4:23:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 83%|████████▎ | 10308/12384 [21:52:13<4:23:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 83%|████████▎ | 10308/12384 [21:52:21<4:23:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 83%|████████▎ | 10309/12384 [21:52:21<4:27:12, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 83%|████████▎ | 10309/12384 [21:52:29<4:27:12, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 83%|████████▎ | 10310/12384 [21:52:29<4:26:03, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 83%|████████▎ | 10310/12384 [21:52:36<4:26:03, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 83%|████████▎ | 10311/12384 [21:52:36<4:24:57, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 83%|████████▎ | 10311/12384 [21:52:44<4:24:57, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 83%|████████▎ | 10312/12384 [21:52:44<4:24:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 83%|████████▎ | 10312/12384 [21:52:51<4:24:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 83%|████████▎ | 10313/12384 [21:52:51<4:23:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 83%|████████▎ | 10313/12384 [21:52:59<4:23:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 83%|████████▎ | 10314/12384 [21:52:59<4:22:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 83%|████████▎ | 10314/12384 [21:53:07<4:22:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 83%|████████▎ | 10315/12384 [21:53:07<4:22:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 83%|████████▎ | 10315/12384 [21:53:14<4:22:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 1: 83%|████████▎ | 10316/12384 [21:53:14<4:23:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 1: 83%|████████▎ | 10316/12384 [21:53:22<4:23:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 83%|████████▎ | 10317/12384 [21:53:22<4:22:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 83%|████████▎ | 10317/12384 [21:53:29<4:22:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 83%|████████▎ | 10318/12384 [21:53:29<4:22:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 83%|████████▎ | 10318/12384 [21:53:37<4:22:24, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 1: 83%|████████▎ | 10319/12384 [21:53:37<4:22:22, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 1: 83%|████████▎ | 10319/12384 [21:53:45<4:22:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.22s]
Epoch 1: 83%|████████▎ | 10320/12384 [21:53:45<4:22:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.22s]
Epoch 1: 83%|████████▎ | 10320/12384 [21:53:52<4:22:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 83%|████████▎ | 10321/12384 [21:53:52<4:21:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 83%|████████▎ | 10321/12384 [21:54:00<4:21:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 83%|████████▎ | 10322/12384 [21:54:00<4:21:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 83%|████████▎ | 10322/12384 [21:54:08<4:21:47, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 1: 83%|████████▎ | 10323/12384 [21:54:08<4:21:33, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 1: 83%|████████▎ | 10323/12384 [21:54:15<4:21:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.57s]
Epoch 1: 83%|████████▎ | 10324/12384 [21:54:15<4:21:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.57s]
Epoch 1: 83%|████████▎ | 10324/12384 [21:54:23<4:21:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.67s]
Epoch 1: 83%|████████▎ | 10325/12384 [21:54:23<4:21:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.67s]
Epoch 1: 83%|████████▎ | 10325/12384 [21:54:30<4:21:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 83%|████████▎ | 10326/12384 [21:54:30<4:21:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 83%|████████▎ | 10326/12384 [21:54:38<4:21:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 83%|████████▎ | 10327/12384 [21:54:38<4:21:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 83%|████████▎ | 10327/12384 [21:54:46<4:21:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 83%|████████▎ | 10328/12384 [21:54:46<4:21:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 83%|████████▎ | 10328/12384 [21:54:53<4:21:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 83%|████████▎ | 10329/12384 [21:54:53<4:20:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 83%|████████▎ | 10329/12384 [21:55:01<4:20:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 83%|████████▎ | 10330/12384 [21:55:01<4:20:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 83%|████████▎ | 10330/12384 [21:55:08<4:20:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 83%|████████▎ | 10331/12384 [21:55:08<4:20:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 83%|████████▎ | 10331/12384 [21:55:16<4:20:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 83%|████████▎ | 10332/12384 [21:55:16<4:20:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 83%|████████▎ | 10332/12384 [21:55:24<4:20:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 1: 83%|████████▎ | 10333/12384 [21:55:24<4:20:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 1: 83%|████████▎ | 10333/12384 [21:55:31<4:20:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 83%|████████▎ | 10334/12384 [21:55:31<4:20:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 83%|████████▎ | 10334/12384 [21:55:39<4:20:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 83%|████████▎ | 10335/12384 [21:55:39<4:19:35, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 83%|████████▎ | 10335/12384 [21:55:47<4:19:35, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 1: 83%|████████▎ | 10336/12384 [21:55:47<4:23:44, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 1: 83%|████████▎ | 10336/12384 [21:55:54<4:23:44, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=4.03s]
Epoch 1: 83%|████████▎ | 10337/12384 [21:55:54<4:22:16, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.03s]
Epoch 1: 83%|████████▎ | 10337/12384 [21:56:02<4:22:16, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=11.11s]
Epoch 1: 83%|████████▎ | 10338/12384 [21:56:02<4:21:32, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=11.11s]
Epoch 1: 83%|████████▎ | 10338/12384 [21:56:10<4:21:32, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 83%|████████▎ | 10339/12384 [21:56:10<4:20:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 83%|████████▎ | 10339/12384 [21:56:17<4:20:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 83%|████████▎ | 10340/12384 [21:56:17<4:20:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 83%|████████▎ | 10340/12384 [21:56:25<4:20:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 1: 84%|████████▎ | 10341/12384 [21:56:25<4:19:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 1: 84%|████████▎ | 10341/12384 [21:56:33<4:19:56, 7.63s/it, loss=0.0002, acc=0.9979, iter_time=8.82s]
Epoch 1: 84%|████████▎ | 10342/12384 [21:56:33<4:19:40, 7.63s/it, loss=0.0002, acc=0.9979, iter_time=8.82s]
Epoch 1: 84%|████████▎ | 10342/12384 [21:56:40<4:19:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 1: 84%|████████▎ | 10343/12384 [21:56:40<4:19:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 1: 84%|████████▎ | 10343/12384 [21:56:48<4:19:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.28s]
Epoch 1: 84%|████████▎ | 10344/12384 [21:56:48<4:19:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.28s]
Epoch 1: 84%|████████▎ | 10344/12384 [21:56:55<4:19:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 84%|████████▎ | 10345/12384 [21:56:55<4:20:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 84%|████████▎ | 10345/12384 [21:57:03<4:20:04, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.73s]
Epoch 1: 84%|████████▎ | 10346/12384 [21:57:03<4:19:41, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.73s]
Epoch 1: 84%|████████▎ | 10346/12384 [21:57:11<4:19:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 1: 84%|████████▎ | 10347/12384 [21:57:11<4:19:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 1: 84%|████████▎ | 10347/12384 [21:57:18<4:19:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 84%|████████▎ | 10348/12384 [21:57:18<4:19:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 84%|████████▎ | 10348/12384 [21:57:26<4:19:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 84%|████████▎ | 10349/12384 [21:57:26<4:18:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 84%|████████▎ | 10349/12384 [21:57:34<4:18:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 84%|████████▎ | 10350/12384 [21:57:34<4:18:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 84%|████████▎ | 10350/12384 [21:57:41<4:18:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 1: 84%|████████▎ | 10351/12384 [21:57:41<4:18:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 1: 84%|████████▎ | 10351/12384 [21:57:49<4:18:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.66s]
Epoch 1: 84%|████████▎ | 10352/12384 [21:57:49<4:18:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.66s]
Epoch 1: 84%|████████▎ | 10352/12384 [21:57:56<4:18:15, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.49s]
Epoch 1: 84%|████████▎ | 10353/12384 [21:57:56<4:18:02, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.49s]
Epoch 1: 84%|████████▎ | 10353/12384 [21:58:04<4:18:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 84%|████████▎ | 10354/12384 [21:58:04<4:17:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 84%|████████▎ | 10354/12384 [21:58:12<4:17:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 1: 84%|████████▎ | 10355/12384 [21:58:12<4:17:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 1: 84%|████████▎ | 10355/12384 [21:58:19<4:17:27, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.41s]
Epoch 1: 84%|████████▎ | 10356/12384 [21:58:19<4:17:20, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.41s]
Epoch 1: 84%|████████▎ | 10356/12384 [21:58:27<4:17:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 1: 84%|████████▎ | 10357/12384 [21:58:27<4:16:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 1: 84%|████████▎ | 10357/12384 [21:58:35<4:16:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 84%|████████▎ | 10358/12384 [21:58:35<4:17:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 84%|████████▎ | 10358/12384 [21:58:42<4:17:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.60s]
Epoch 1: 84%|████████▎ | 10359/12384 [21:58:42<4:16:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.60s]
Epoch 1: 84%|████████▎ | 10359/12384 [21:58:50<4:16:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.32s]
Epoch 1: 84%|████████▎ | 10360/12384 [21:58:50<4:19:34, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=11.32s]
Epoch 1: 84%|████████▎ | 10360/12384 [21:58:58<4:19:34, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 84%|████████▎ | 10361/12384 [21:58:58<4:18:40, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 84%|████████▎ | 10361/12384 [21:59:06<4:18:40, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 84%|████████▎ | 10362/12384 [21:59:06<4:21:10, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 84%|████████▎ | 10362/12384 [21:59:13<4:21:10, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=6.36s]
Epoch 1: 84%|████████▎ | 10363/12384 [21:59:13<4:19:37, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.36s]
Epoch 1: 84%|████████▎ | 10363/12384 [21:59:21<4:19:37, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.28s]
Epoch 1: 84%|████████▎ | 10364/12384 [21:59:21<4:18:35, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.28s]
Epoch 1: 84%|████████▎ | 10364/12384 [21:59:28<4:18:35, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 1: 84%|████████▎ | 10365/12384 [21:59:28<4:17:52, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 1: 84%|████████▎ | 10365/12384 [21:59:36<4:17:52, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 84%|████████▎ | 10366/12384 [21:59:36<4:17:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 84%|████████▎ | 10366/12384 [21:59:44<4:17:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 84%|████████▎ | 10367/12384 [21:59:44<4:16:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 84%|████████▎ | 10367/12384 [21:59:51<4:16:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 84%|████████▎ | 10368/12384 [21:59:51<4:16:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 84%|████████▎ | 10368/12384 [21:59:59<4:16:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 1: 84%|████████▎ | 10369/12384 [21:59:59<4:16:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 1: 84%|████████▎ | 10369/12384 [22:00:07<4:16:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 1: 84%|████████▎ | 10370/12384 [22:00:07<4:16:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 1: 84%|████████▎ | 10370/12384 [22:00:14<4:16:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 1: 84%|████████▎ | 10371/12384 [22:00:14<4:15:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 1: 84%|████████▎ | 10371/12384 [22:00:22<4:15:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 84%|████████▍ | 10372/12384 [22:00:22<4:15:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 84%|████████▍ | 10372/12384 [22:00:29<4:15:23, 7.62s/it, loss=0.0004, acc=0.9987, iter_time=5.55s]
Epoch 1: 84%|████████▍ | 10373/12384 [22:00:29<4:15:13, 7.61s/it, loss=0.0004, acc=0.9987, iter_time=5.55s]
Epoch 1: 84%|████████▍ | 10373/12384 [22:00:37<4:15:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.11s]
Epoch 1: 84%|████████▍ | 10374/12384 [22:00:37<4:15:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.11s]
Epoch 1: 84%|████████▍ | 10374/12384 [22:00:45<4:15:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 1: 84%|████████▍ | 10375/12384 [22:00:45<4:14:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 1: 84%|████████▍ | 10375/12384 [22:00:52<4:14:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 84%|████████▍ | 10376/12384 [22:00:52<4:14:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 84%|████████▍ | 10376/12384 [22:01:00<4:14:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.14s]
Epoch 1: 84%|████████▍ | 10377/12384 [22:01:00<4:14:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.14s]
Epoch 1: 84%|████████▍ | 10377/12384 [22:01:07<4:14:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 1: 84%|████████▍ | 10378/12384 [22:01:07<4:13:58, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 1: 84%|████████▍ | 10378/12384 [22:01:15<4:13:58, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.58s]
Epoch 1: 84%|████████▍ | 10379/12384 [22:01:15<4:13:44, 7.59s/it, loss=0.0001, acc=1.0000, iter_time=7.58s]
Epoch 1: 84%|████████▍ | 10379/12384 [22:01:23<4:13:44, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 84%|████████▍ | 10380/12384 [22:01:23<4:14:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 84%|████████▍ | 10380/12384 [22:01:30<4:14:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 1: 84%|████████▍ | 10381/12384 [22:01:30<4:14:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 1: 84%|████████▍ | 10381/12384 [22:01:38<4:14:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 84%|████████▍ | 10382/12384 [22:01:38<4:14:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 84%|████████▍ | 10382/12384 [22:01:45<4:14:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 1: 84%|████████▍ | 10383/12384 [22:01:45<4:14:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 1: 84%|████████▍ | 10383/12384 [22:01:53<4:14:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 1: 84%|████████▍ | 10384/12384 [22:01:53<4:14:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 1: 84%|████████▍ | 10384/12384 [22:02:01<4:14:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 84%|████████▍ | 10385/12384 [22:02:01<4:13:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 84%|████████▍ | 10385/12384 [22:02:08<4:13:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.78s]
Epoch 1: 84%|████████▍ | 10386/12384 [22:02:08<4:13:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.78s]
Epoch 1: 84%|████████▍ | 10386/12384 [22:02:16<4:13:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 1: 84%|████████▍ | 10387/12384 [22:02:16<4:13:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 1: 84%|████████▍ | 10387/12384 [22:02:23<4:13:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 1: 84%|████████▍ | 10388/12384 [22:02:23<4:13:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 1: 84%|████████▍ | 10388/12384 [22:02:31<4:13:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 84%|████████▍ | 10389/12384 [22:02:31<4:16:27, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 84%|████████▍ | 10389/12384 [22:02:39<4:16:27, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 1: 84%|████████▍ | 10390/12384 [22:02:39<4:15:18, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 1: 84%|████████▍ | 10390/12384 [22:02:47<4:15:18, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.34s]
Epoch 1: 84%|████████▍ | 10391/12384 [22:02:47<4:14:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.34s]
Epoch 1: 84%|████████▍ | 10391/12384 [22:02:54<4:14:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.58s]
Epoch 1: 84%|████████▍ | 10392/12384 [22:02:54<4:13:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.58s]
Epoch 1: 84%|████████▍ | 10392/12384 [22:03:02<4:13:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 84%|████████▍ | 10393/12384 [22:03:02<4:13:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 84%|████████▍ | 10393/12384 [22:03:09<4:13:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 84%|████████▍ | 10394/12384 [22:03:09<4:12:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 84%|████████▍ | 10394/12384 [22:03:17<4:12:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 1: 84%|████████▍ | 10395/12384 [22:03:17<4:12:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 1: 84%|████████▍ | 10395/12384 [22:03:25<4:12:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 1: 84%|████████▍ | 10396/12384 [22:03:25<4:13:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 1: 84%|████████▍ | 10396/12384 [22:03:32<4:13:17, 7.64s/it, loss=0.0013, acc=0.9984, iter_time=7.71s]
Epoch 1: 84%|████████▍ | 10397/12384 [22:03:32<4:12:41, 7.63s/it, loss=0.0013, acc=0.9984, iter_time=7.71s]
Epoch 1: 84%|████████▍ | 10397/12384 [22:03:40<4:12:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 84%|████████▍ | 10398/12384 [22:03:40<4:12:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 84%|████████▍ | 10398/12384 [22:03:48<4:12:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 1: 84%|████████▍ | 10399/12384 [22:03:48<4:11:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 1: 84%|████████▍ | 10399/12384 [22:03:55<4:11:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.77s]
Epoch 1: 84%|████████▍ | 10400/12384 [22:03:55<4:11:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.77s]
Epoch 1: 84%|████████▍ | 10400/12384 [22:04:03<4:11:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 84%|████████▍ | 10401/12384 [22:04:03<4:11:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 84%|████████▍ | 10401/12384 [22:04:10<4:11:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 84%|████████▍ | 10402/12384 [22:04:10<4:11:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 84%|████████▍ | 10402/12384 [22:04:18<4:11:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 84%|████████▍ | 10403/12384 [22:04:18<4:10:52, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 84%|████████▍ | 10403/12384 [22:04:26<4:10:52, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 1: 84%|████████▍ | 10404/12384 [22:04:26<4:10:53, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 1: 84%|████████▍ | 10404/12384 [22:04:33<4:10:53, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.21s]
Epoch 1: 84%|████████▍ | 10405/12384 [22:04:33<4:10:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.21s]
Epoch 1: 84%|████████▍ | 10405/12384 [22:04:41<4:10:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=12.49s]
Epoch 1: 84%|████████▍ | 10406/12384 [22:04:41<4:10:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=12.49s]
Epoch 1: 84%|████████▍ | 10406/12384 [22:04:48<4:10:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 84%|████████▍ | 10407/12384 [22:04:48<4:10:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 84%|████████▍ | 10407/12384 [22:04:56<4:10:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 84%|████████▍ | 10408/12384 [22:04:56<4:11:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 84%|████████▍ | 10408/12384 [22:05:04<4:11:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 84%|████████▍ | 10409/12384 [22:05:04<4:11:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 84%|████████▍ | 10409/12384 [22:05:11<4:11:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 84%|████████▍ | 10410/12384 [22:05:11<4:10:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 84%|████████▍ | 10410/12384 [22:05:19<4:10:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 1: 84%|████████▍ | 10411/12384 [22:05:19<4:10:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 1: 84%|████████▍ | 10411/12384 [22:05:27<4:10:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 1: 84%|████████▍ | 10412/12384 [22:05:27<4:10:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 1: 84%|████████▍ | 10412/12384 [22:05:34<4:10:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 84%|████████▍ | 10413/12384 [22:05:34<4:12:55, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 84%|████████▍ | 10413/12384 [22:05:42<4:12:55, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 84%|████████▍ | 10414/12384 [22:05:42<4:11:54, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 84%|████████▍ | 10414/12384 [22:05:50<4:11:54, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 84%|████████▍ | 10415/12384 [22:05:50<4:14:12, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 84%|████████▍ | 10415/12384 [22:05:58<4:14:12, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 1: 84%|████████▍ | 10416/12384 [22:05:58<4:12:37, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 1: 84%|████████▍ | 10416/12384 [22:06:05<4:12:37, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 84%|████████▍ | 10417/12384 [22:06:05<4:11:30, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 84%|████████▍ | 10417/12384 [22:06:13<4:11:30, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 84%|████████▍ | 10418/12384 [22:06:13<4:10:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 84%|████████▍ | 10418/12384 [22:06:20<4:10:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 84%|████████▍ | 10419/12384 [22:06:20<4:10:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 84%|████████▍ | 10419/12384 [22:06:28<4:10:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 84%|████████▍ | 10420/12384 [22:06:28<4:09:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 84%|████████▍ | 10420/12384 [22:06:36<4:09:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 84%|████████▍ | 10421/12384 [22:06:36<4:09:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 84%|████████▍ | 10421/12384 [22:06:43<4:09:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 84%|████████▍ | 10422/12384 [22:06:43<4:09:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 84%|████████▍ | 10422/12384 [22:06:51<4:09:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 1: 84%|████████▍ | 10423/12384 [22:06:51<4:09:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 1: 84%|████████▍ | 10423/12384 [22:06:58<4:09:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.79s]
Epoch 1: 84%|████████▍ | 10424/12384 [22:06:58<4:08:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.79s]
Epoch 1: 84%|████████▍ | 10424/12384 [22:07:06<4:08:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.73s]
Epoch 1: 84%|████████▍ | 10425/12384 [22:07:06<4:08:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.73s]
Epoch 1: 84%|████████▍ | 10425/12384 [22:07:14<4:08:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 84%|████████▍ | 10426/12384 [22:07:14<4:08:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 84%|████████▍ | 10426/12384 [22:07:21<4:08:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 1: 84%|████████▍ | 10427/12384 [22:07:21<4:09:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 1: 84%|████████▍ | 10427/12384 [22:07:29<4:09:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.82s]
Epoch 1: 84%|████████▍ | 10428/12384 [22:07:29<4:08:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.82s]
Epoch 1: 84%|████████▍ | 10428/12384 [22:07:37<4:08:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.77s]
Epoch 1: 84%|████████▍ | 10429/12384 [22:07:37<4:08:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.77s]
Epoch 1: 84%|████████▍ | 10429/12384 [22:07:44<4:08:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 84%|████████▍ | 10430/12384 [22:07:44<4:08:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 84%|████████▍ | 10430/12384 [22:07:52<4:08:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 84%|████████▍ | 10431/12384 [22:07:52<4:08:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 84%|████████▍ | 10431/12384 [22:07:59<4:08:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.35s]
Epoch 1: 84%|████████▍ | 10432/12384 [22:07:59<4:07:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.35s]
Epoch 1: 84%|████████▍ | 10432/12384 [22:08:07<4:07:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.90s]
Epoch 1: 84%|████████▍ | 10433/12384 [22:08:07<4:07:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.90s]
Epoch 1: 84%|████████▍ | 10433/12384 [22:08:15<4:07:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 84%|████████▍ | 10434/12384 [22:08:15<4:07:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 84%|████████▍ | 10434/12384 [22:08:22<4:07:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 1: 84%|████████▍ | 10435/12384 [22:08:22<4:07:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 1: 84%|████████▍ | 10435/12384 [22:08:30<4:07:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.18s]
Epoch 1: 84%|████████▍ | 10436/12384 [22:08:30<4:07:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.18s]
Epoch 1: 84%|████████▍ | 10436/12384 [22:08:37<4:07:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.54s]
Epoch 1: 84%|████████▍ | 10437/12384 [22:08:37<4:06:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.54s]
Epoch 1: 84%|████████▍ | 10437/12384 [22:08:45<4:06:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 84%|████████▍ | 10438/12384 [22:08:45<4:06:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 84%|████████▍ | 10438/12384 [22:08:53<4:06:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 84%|████████▍ | 10439/12384 [22:08:53<4:09:29, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 84%|████████▍ | 10439/12384 [22:09:01<4:09:29, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 1: 84%|████████▍ | 10440/12384 [22:09:01<4:09:22, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 1: 84%|████████▍ | 10440/12384 [22:09:09<4:09:22, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 84%|████████▍ | 10441/12384 [22:09:09<4:11:41, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 1: 84%|████████▍ | 10441/12384 [22:09:16<4:11:41, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 84%|████████▍ | 10442/12384 [22:09:16<4:09:47, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 84%|████████▍ | 10442/12384 [22:09:24<4:09:47, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 1: 84%|████████▍ | 10443/12384 [22:09:24<4:08:36, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 1: 84%|████████▍ | 10443/12384 [22:09:31<4:08:36, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 84%|████████▍ | 10444/12384 [22:09:31<4:07:50, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 84%|████████▍ | 10444/12384 [22:09:39<4:07:50, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 1: 84%|████████▍ | 10445/12384 [22:09:39<4:07:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 1: 84%|████████▍ | 10445/12384 [22:09:47<4:07:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 84%|████████▍ | 10446/12384 [22:09:47<4:06:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 84%|████████▍ | 10446/12384 [22:09:54<4:06:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 1: 84%|████████▍ | 10447/12384 [22:09:54<4:06:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 1: 84%|████████▍ | 10447/12384 [22:10:02<4:06:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 84%|████████▍ | 10448/12384 [22:10:02<4:06:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 84%|████████▍ | 10448/12384 [22:10:10<4:06:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.43s]
Epoch 1: 84%|████████▍ | 10449/12384 [22:10:10<4:06:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.43s]
Epoch 1: 84%|████████▍ | 10449/12384 [22:10:17<4:06:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 84%|████████▍ | 10450/12384 [22:10:17<4:06:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 84%|████████▍ | 10450/12384 [22:10:25<4:06:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 84%|████████▍ | 10451/12384 [22:10:25<4:05:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 84%|████████▍ | 10451/12384 [22:10:32<4:05:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=2.96s]
Epoch 1: 84%|████████▍ | 10452/12384 [22:10:32<4:05:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=2.96s]
Epoch 1: 84%|████████▍ | 10452/12384 [22:10:40<4:05:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.11s]
Epoch 1: 84%|████████▍ | 10453/12384 [22:10:40<4:05:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.11s]
Epoch 1: 84%|████████▍ | 10453/12384 [22:10:48<4:05:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 1: 84%|████████▍ | 10454/12384 [22:10:48<4:05:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 1: 84%|████████▍ | 10454/12384 [22:10:55<4:05:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 84%|████████▍ | 10455/12384 [22:10:55<4:04:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 84%|████████▍ | 10455/12384 [22:11:03<4:04:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 84%|████████▍ | 10456/12384 [22:11:03<4:04:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 84%|████████▍ | 10456/12384 [22:11:11<4:04:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 84%|████████▍ | 10457/12384 [22:11:11<4:04:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 84%|████████▍ | 10457/12384 [22:11:18<4:04:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 84%|████████▍ | 10458/12384 [22:11:18<4:04:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 84%|████████▍ | 10458/12384 [22:11:26<4:04:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 84%|████████▍ | 10459/12384 [22:11:26<4:04:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 84%|████████▍ | 10459/12384 [22:11:33<4:04:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 84%|████████▍ | 10460/12384 [22:11:33<4:04:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 84%|████████▍ | 10460/12384 [22:11:41<4:04:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 84%|████████▍ | 10461/12384 [22:11:41<4:04:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 84%|████████▍ | 10461/12384 [22:11:49<4:04:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 84%|████████▍ | 10462/12384 [22:11:49<4:04:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 84%|████████▍ | 10462/12384 [22:11:56<4:04:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 1: 84%|████████▍ | 10463/12384 [22:11:56<4:03:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 1: 84%|████████▍ | 10463/12384 [22:12:04<4:03:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 1: 84%|████████▍ | 10464/12384 [22:12:04<4:03:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 1: 84%|████████▍ | 10464/12384 [22:12:11<4:03:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 85%|████████▍ | 10465/12384 [22:12:11<4:03:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 85%|████████▍ | 10465/12384 [22:12:19<4:03:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.28s]
Epoch 1: 85%|████████▍ | 10466/12384 [22:12:19<4:03:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.28s]
Epoch 1: 85%|████████▍ | 10466/12384 [22:12:27<4:03:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 85%|████████▍ | 10467/12384 [22:12:27<4:06:07, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 85%|████████▍ | 10467/12384 [22:12:35<4:06:07, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.89s]
Epoch 1: 85%|████████▍ | 10468/12384 [22:12:35<4:04:57, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.89s]
Epoch 1: 85%|████████▍ | 10468/12384 [22:12:42<4:04:57, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=9.58s]
Epoch 1: 85%|████████▍ | 10469/12384 [22:12:42<4:04:10, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=9.58s]
Epoch 1: 85%|████████▍ | 10469/12384 [22:12:50<4:04:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 85%|████████▍ | 10470/12384 [22:12:50<4:03:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 85%|████████▍ | 10470/12384 [22:12:57<4:03:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 85%|████████▍ | 10471/12384 [22:12:57<4:03:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 85%|████████▍ | 10471/12384 [22:13:05<4:03:03, 7.62s/it, loss=0.0003, acc=0.9987, iter_time=7.99s]
Epoch 1: 85%|████████▍ | 10472/12384 [22:13:05<4:02:46, 7.62s/it, loss=0.0003, acc=0.9987, iter_time=7.99s]
Epoch 1: 85%|████████▍ | 10472/12384 [22:13:13<4:02:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 85%|████████▍ | 10473/12384 [22:13:13<4:02:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 85%|████████▍ | 10473/12384 [22:13:20<4:02:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 1: 85%|████████▍ | 10474/12384 [22:13:20<4:03:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 1: 85%|████████▍ | 10474/12384 [22:13:28<4:03:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.03s]
Epoch 1: 85%|████████▍ | 10475/12384 [22:13:28<4:02:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.03s]
Epoch 1: 85%|████████▍ | 10475/12384 [22:13:35<4:02:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 85%|████████▍ | 10476/12384 [22:13:35<4:02:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 85%|████████▍ | 10476/12384 [22:13:43<4:02:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 85%|████████▍ | 10477/12384 [22:13:43<4:01:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 85%|████████▍ | 10477/12384 [22:13:51<4:01:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 85%|████████▍ | 10478/12384 [22:13:51<4:01:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 85%|████████▍ | 10478/12384 [22:13:58<4:01:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 85%|████████▍ | 10479/12384 [22:13:58<4:01:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 85%|████████▍ | 10479/12384 [22:14:06<4:01:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 85%|████████▍ | 10480/12384 [22:14:06<4:01:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 85%|████████▍ | 10480/12384 [22:14:14<4:01:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 85%|████████▍ | 10481/12384 [22:14:14<4:01:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 85%|████████▍ | 10481/12384 [22:14:21<4:01:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 85%|████████▍ | 10482/12384 [22:14:21<4:01:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 85%|████████▍ | 10482/12384 [22:14:29<4:01:23, 7.62s/it, loss=0.0018, acc=0.9982, iter_time=7.64s]
Epoch 1: 85%|████████▍ | 10483/12384 [22:14:29<4:02:01, 7.64s/it, loss=0.0018, acc=0.9982, iter_time=7.64s]
Epoch 1: 85%|████████▍ | 10483/12384 [22:14:36<4:02:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 1: 85%|████████▍ | 10484/12384 [22:14:36<4:01:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 1: 85%|████████▍ | 10484/12384 [22:14:44<4:01:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 85%|████████▍ | 10485/12384 [22:14:44<4:01:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 85%|████████▍ | 10485/12384 [22:14:52<4:01:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 85%|████████▍ | 10486/12384 [22:14:52<4:01:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 85%|████████▍ | 10486/12384 [22:14:59<4:01:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 85%|████████▍ | 10487/12384 [22:14:59<4:00:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 85%|████████▍ | 10487/12384 [22:15:07<4:00:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 85%|████████▍ | 10488/12384 [22:15:07<4:00:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 85%|████████▍ | 10488/12384 [22:15:15<4:00:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 85%|████████▍ | 10489/12384 [22:15:15<4:00:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 85%|████████▍ | 10489/12384 [22:15:22<4:00:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 85%|████████▍ | 10490/12384 [22:15:22<4:00:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 85%|████████▍ | 10490/12384 [22:15:30<4:00:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 1: 85%|████████▍ | 10491/12384 [22:15:30<4:00:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 1: 85%|████████▍ | 10491/12384 [22:15:37<4:00:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.04s]
Epoch 1: 85%|████████▍ | 10492/12384 [22:15:37<3:59:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.04s]
Epoch 1: 85%|████████▍ | 10492/12384 [22:15:45<3:59:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.43s]
Epoch 1: 85%|████████▍ | 10493/12384 [22:15:45<4:02:48, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.43s]
Epoch 1: 85%|████████▍ | 10493/12384 [22:15:53<4:02:48, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 85%|████████▍ | 10494/12384 [22:15:53<4:01:54, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 85%|████████▍ | 10494/12384 [22:16:01<4:01:54, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 85%|████████▍ | 10495/12384 [22:16:01<4:01:25, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 85%|████████▍ | 10495/12384 [22:16:08<4:01:25, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.25s]
Epoch 1: 85%|████████▍ | 10496/12384 [22:16:08<4:00:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.25s]
Epoch 1: 85%|████████▍ | 10496/12384 [22:16:16<4:00:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 85%|████████▍ | 10497/12384 [22:16:16<4:00:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 85%|████████▍ | 10497/12384 [22:16:23<4:00:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 85%|████████▍ | 10498/12384 [22:16:23<3:59:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 85%|████████▍ | 10498/12384 [22:16:31<3:59:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 1: 85%|████████▍ | 10499/12384 [22:16:31<3:59:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 1: 85%|████████▍ | 10499/12384 [22:16:39<3:59:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 1: 85%|████████▍ | 10500/12384 [22:16:39<3:59:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 1: 85%|████████▍ | 10500/12384 [22:16:46<3:59:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 1: 85%|████████▍ | 10501/12384 [22:16:46<3:59:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 1: 85%|████████▍ | 10501/12384 [22:16:54<3:59:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 85%|████████▍ | 10502/12384 [22:16:54<3:58:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 85%|████████▍ | 10502/12384 [22:17:01<3:58:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 85%|████████▍ | 10503/12384 [22:17:01<3:58:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 85%|████████▍ | 10503/12384 [22:17:09<3:58:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 85%|████████▍ | 10504/12384 [22:17:09<3:58:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 85%|████████▍ | 10504/12384 [22:17:17<3:58:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.78s]
Epoch 1: 85%|████████▍ | 10505/12384 [22:17:17<3:58:05, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.78s]
Epoch 1: 85%|████████▍ | 10505/12384 [22:17:24<3:58:05, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 1: 85%|████████▍ | 10506/12384 [22:17:24<3:58:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 1: 85%|████████▍ | 10506/12384 [22:17:32<3:58:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 85%|████████▍ | 10507/12384 [22:17:32<3:58:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 85%|████████▍ | 10507/12384 [22:17:39<3:58:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 85%|████████▍ | 10508/12384 [22:17:39<3:57:39, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 85%|████████▍ | 10508/12384 [22:17:47<3:57:39, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 1: 85%|████████▍ | 10509/12384 [22:17:47<3:57:27, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 1: 85%|████████▍ | 10509/12384 [22:17:55<3:57:27, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 85%|████████▍ | 10510/12384 [22:17:55<3:57:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 85%|████████▍ | 10510/12384 [22:18:02<3:57:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 85%|████████▍ | 10511/12384 [22:18:02<3:57:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 85%|████████▍ | 10511/12384 [22:18:10<3:57:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 85%|████████▍ | 10512/12384 [22:18:10<3:57:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 85%|████████▍ | 10512/12384 [22:18:17<3:57:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 85%|████████▍ | 10513/12384 [22:18:17<3:57:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 85%|████████▍ | 10513/12384 [22:18:25<3:57:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 85%|████████▍ | 10514/12384 [22:18:25<3:57:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 85%|████████▍ | 10514/12384 [22:18:33<3:57:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 85%|████████▍ | 10515/12384 [22:18:33<3:57:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 85%|████████▍ | 10515/12384 [22:18:40<3:57:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 85%|████████▍ | 10516/12384 [22:18:40<3:57:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 85%|████████▍ | 10516/12384 [22:18:48<3:57:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.47s]
Epoch 1: 85%|████████▍ | 10517/12384 [22:18:48<3:59:19, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.47s]
Epoch 1: 85%|████████▍ | 10517/12384 [22:18:56<3:59:19, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.01s]
Epoch 1: 85%|████████▍ | 10518/12384 [22:18:56<3:58:25, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.01s]
Epoch 1: 85%|████████▍ | 10518/12384 [22:19:03<3:58:25, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=11.19s]
Epoch 1: 85%|████████▍ | 10519/12384 [22:19:03<3:57:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.19s]
Epoch 1: 85%|████████▍ | 10519/12384 [22:19:11<3:57:43, 7.65s/it, loss=0.0021, acc=0.9981, iter_time=8.08s]
Epoch 1: 85%|████████▍ | 10520/12384 [22:19:11<3:59:57, 7.72s/it, loss=0.0021, acc=0.9981, iter_time=8.08s]
Epoch 1: 85%|████████▍ | 10520/12384 [22:19:19<3:59:57, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.43s]
Epoch 1: 85%|████████▍ | 10521/12384 [22:19:19<3:58:41, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.43s]
Epoch 1: 85%|████████▍ | 10521/12384 [22:19:27<3:58:41, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.98s]
Epoch 1: 85%|████████▍ | 10522/12384 [22:19:27<3:58:48, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.98s]
Epoch 1: 85%|████████▍ | 10522/12384 [22:19:34<3:58:48, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.88s]
Epoch 1: 85%|████████▍ | 10523/12384 [22:19:34<3:57:56, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.88s]
Epoch 1: 85%|████████▍ | 10523/12384 [22:19:42<3:57:56, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.81s]
Epoch 1: 85%|████████▍ | 10524/12384 [22:19:42<3:57:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.81s]
Epoch 1: 85%|████████▍ | 10524/12384 [22:19:49<3:57:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.87s]
Epoch 1: 85%|████████▍ | 10525/12384 [22:19:49<3:56:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.87s]
Epoch 1: 85%|████████▍ | 10525/12384 [22:19:57<3:56:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 85%|████████▍ | 10526/12384 [22:19:57<3:56:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 85%|████████▍ | 10526/12384 [22:20:05<3:56:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 85%|████████▌ | 10527/12384 [22:20:05<3:55:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 85%|████████▌ | 10527/12384 [22:20:12<3:55:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 85%|████████▌ | 10528/12384 [22:20:12<3:55:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 85%|████████▌ | 10528/12384 [22:20:20<3:55:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 85%|████████▌ | 10529/12384 [22:20:20<3:55:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 85%|████████▌ | 10529/12384 [22:20:27<3:55:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 85%|████████▌ | 10530/12384 [22:20:27<3:55:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 85%|████████▌ | 10530/12384 [22:20:35<3:55:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 85%|████████▌ | 10531/12384 [22:20:35<3:55:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 85%|████████▌ | 10531/12384 [22:20:43<3:55:02, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.09s]
Epoch 1: 85%|████████▌ | 10532/12384 [22:20:43<3:55:28, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.09s]
Epoch 1: 85%|████████▌ | 10532/12384 [22:20:50<3:55:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.91s]
Epoch 1: 85%|████████▌ | 10533/12384 [22:20:50<3:55:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.91s]
Epoch 1: 85%|████████▌ | 10533/12384 [22:20:58<3:55:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 85%|████████▌ | 10534/12384 [22:20:58<3:55:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 85%|████████▌ | 10534/12384 [22:21:06<3:55:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 85%|████████▌ | 10535/12384 [22:21:06<3:54:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 85%|████████▌ | 10535/12384 [22:21:13<3:54:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 85%|████████▌ | 10536/12384 [22:21:13<3:54:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 85%|████████▌ | 10536/12384 [22:21:21<3:54:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 85%|████████▌ | 10537/12384 [22:21:21<3:54:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 85%|████████▌ | 10537/12384 [22:21:28<3:54:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 85%|████████▌ | 10538/12384 [22:21:28<3:54:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 85%|████████▌ | 10538/12384 [22:21:36<3:54:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 85%|████████▌ | 10539/12384 [22:21:36<3:54:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 85%|████████▌ | 10539/12384 [22:21:44<3:54:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 85%|████████▌ | 10540/12384 [22:21:44<3:54:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 85%|████████▌ | 10540/12384 [22:21:51<3:54:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 1: 85%|████████▌ | 10541/12384 [22:21:51<3:53:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 1: 85%|████████▌ | 10541/12384 [22:21:59<3:53:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 1: 85%|████████▌ | 10542/12384 [22:21:59<3:53:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 1: 85%|████████▌ | 10542/12384 [22:22:06<3:53:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 1: 85%|████████▌ | 10543/12384 [22:22:06<3:53:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 1: 85%|████████▌ | 10543/12384 [22:22:14<3:53:30, 7.61s/it, loss=0.0000, acc=0.9996, iter_time=11.43s]
Epoch 1: 85%|████████▌ | 10544/12384 [22:22:14<3:56:02, 7.70s/it, loss=0.0000, acc=0.9996, iter_time=11.43s]
Epoch 1: 85%|████████▌ | 10544/12384 [22:22:22<3:56:02, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 85%|████████▌ | 10545/12384 [22:22:22<3:55:09, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 85%|████████▌ | 10545/12384 [22:22:30<3:55:09, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 1: 85%|████████▌ | 10546/12384 [22:22:30<3:57:40, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 1: 85%|████████▌ | 10546/12384 [22:22:38<3:57:40, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 1: 85%|████████▌ | 10547/12384 [22:22:38<3:56:19, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 1: 85%|████████▌ | 10547/12384 [22:22:45<3:56:19, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 1: 85%|████████▌ | 10548/12384 [22:22:45<3:55:19, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 1: 85%|████████▌ | 10548/12384 [22:22:53<3:55:19, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 1: 85%|████████▌ | 10549/12384 [22:22:53<3:54:23, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 1: 85%|████████▌ | 10549/12384 [22:23:00<3:54:23, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 1: 85%|████████▌ | 10550/12384 [22:23:00<3:53:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 1: 85%|████████▌ | 10550/12384 [22:23:08<3:53:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 1: 85%|████████▌ | 10551/12384 [22:23:08<3:53:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 1: 85%|████████▌ | 10551/12384 [22:23:16<3:53:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 85%|████████▌ | 10552/12384 [22:23:16<3:53:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 85%|████████▌ | 10552/12384 [22:23:23<3:53:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.16s]
Epoch 1: 85%|████████▌ | 10553/12384 [22:23:23<3:52:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.16s]
Epoch 1: 85%|████████▌ | 10553/12384 [22:23:31<3:52:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 85%|████████▌ | 10554/12384 [22:23:31<3:52:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 85%|████████▌ | 10554/12384 [22:23:38<3:52:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.00s]
Epoch 1: 85%|████████▌ | 10555/12384 [22:23:38<3:51:44, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.00s]
Epoch 1: 85%|████████▌ | 10555/12384 [22:23:46<3:51:44, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 85%|████████▌ | 10556/12384 [22:23:46<3:51:24, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 85%|████████▌ | 10556/12384 [22:23:54<3:51:24, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 85%|████████▌ | 10557/12384 [22:23:54<3:51:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 85%|████████▌ | 10557/12384 [22:24:01<3:51:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 85%|████████▌ | 10558/12384 [22:24:01<3:51:23, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 85%|████████▌ | 10558/12384 [22:24:09<3:51:23, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 85%|████████▌ | 10559/12384 [22:24:09<3:51:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 85%|████████▌ | 10559/12384 [22:24:16<3:51:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 85%|████████▌ | 10560/12384 [22:24:16<3:51:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 85%|████████▌ | 10560/12384 [22:24:24<3:51:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 85%|████████▌ | 10561/12384 [22:24:24<3:51:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 85%|████████▌ | 10561/12384 [22:24:32<3:51:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 1: 85%|████████▌ | 10562/12384 [22:24:32<3:51:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 1: 85%|████████▌ | 10562/12384 [22:24:39<3:51:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 1: 85%|████████▌ | 10563/12384 [22:24:39<3:50:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 1: 85%|████████▌ | 10563/12384 [22:24:47<3:50:54, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.58s]
Epoch 1: 85%|████████▌ | 10564/12384 [22:24:47<3:50:31, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.58s]
Epoch 1: 85%|████████▌ | 10564/12384 [22:24:54<3:50:31, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 85%|████████▌ | 10565/12384 [22:24:54<3:50:32, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 85%|████████▌ | 10565/12384 [22:25:02<3:50:32, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 85%|████████▌ | 10566/12384 [22:25:02<3:50:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 85%|████████▌ | 10566/12384 [22:25:10<3:50:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 1: 85%|████████▌ | 10567/12384 [22:25:10<3:50:08, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 1: 85%|████████▌ | 10567/12384 [22:25:17<3:50:08, 7.60s/it, loss=0.0001, acc=0.9986, iter_time=10.59s]
Epoch 1: 85%|████████▌ | 10568/12384 [22:25:17<3:49:55, 7.60s/it, loss=0.0001, acc=0.9986, iter_time=10.59s]
Epoch 1: 85%|████████▌ | 10568/12384 [22:25:25<3:49:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.45s]
Epoch 1: 85%|████████▌ | 10569/12384 [22:25:25<3:49:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.45s]
Epoch 1: 85%|████████▌ | 10569/12384 [22:25:33<3:49:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 85%|████████▌ | 10570/12384 [22:25:33<3:52:31, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 85%|████████▌ | 10570/12384 [22:25:40<3:52:31, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 85%|████████▌ | 10571/12384 [22:25:40<3:51:38, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 85%|████████▌ | 10571/12384 [22:25:48<3:51:38, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 85%|████████▌ | 10572/12384 [22:25:48<3:51:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 85%|████████▌ | 10572/12384 [22:25:56<3:51:05, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=8.90s]
Epoch 1: 85%|████████▌ | 10573/12384 [22:25:56<3:53:45, 7.74s/it, loss=0.0002, acc=1.0000, iter_time=8.90s]
Epoch 1: 85%|████████▌ | 10573/12384 [22:26:04<3:53:45, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 85%|████████▌ | 10574/12384 [22:26:04<3:52:29, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 85%|████████▌ | 10574/12384 [22:26:11<3:52:29, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 85%|████████▌ | 10575/12384 [22:26:11<3:51:28, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 85%|████████▌ | 10575/12384 [22:26:19<3:51:28, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 85%|████████▌ | 10576/12384 [22:26:19<3:51:11, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 85%|████████▌ | 10576/12384 [22:26:26<3:51:11, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 85%|████████▌ | 10577/12384 [22:26:26<3:50:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 85%|████████▌ | 10577/12384 [22:26:34<3:50:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 1: 85%|████████▌ | 10578/12384 [22:26:34<3:50:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 1: 85%|████████▌ | 10578/12384 [22:26:42<3:50:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.75s]
Epoch 1: 85%|████████▌ | 10579/12384 [22:26:42<3:49:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.75s]
Epoch 1: 85%|████████▌ | 10579/12384 [22:26:49<3:49:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 85%|████████▌ | 10580/12384 [22:26:49<3:49:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 85%|████████▌ | 10580/12384 [22:26:57<3:49:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 1: 85%|████████▌ | 10581/12384 [22:26:57<3:49:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 1: 85%|████████▌ | 10581/12384 [22:27:05<3:49:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 85%|████████▌ | 10582/12384 [22:27:05<3:48:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 85%|████████▌ | 10582/12384 [22:27:12<3:48:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 85%|████████▌ | 10583/12384 [22:27:12<3:48:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 85%|████████▌ | 10583/12384 [22:27:20<3:48:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 85%|████████▌ | 10584/12384 [22:27:20<3:48:07, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 85%|████████▌ | 10584/12384 [22:27:27<3:48:07, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=3.91s]
Epoch 1: 85%|████████▌ | 10585/12384 [22:27:27<3:47:52, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=3.91s]
Epoch 1: 85%|████████▌ | 10585/12384 [22:27:35<3:47:52, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.35s]
Epoch 1: 85%|████████▌ | 10586/12384 [22:27:35<3:47:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.35s]
Epoch 1: 85%|████████▌ | 10586/12384 [22:27:43<3:47:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 85%|████████▌ | 10587/12384 [22:27:43<3:47:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 85%|████████▌ | 10587/12384 [22:27:50<3:47:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 85%|████████▌ | 10588/12384 [22:27:50<3:48:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 85%|████████▌ | 10588/12384 [22:27:58<3:48:15, 7.63s/it, loss=0.0002, acc=0.9979, iter_time=6.46s]
Epoch 1: 86%|████████▌ | 10589/12384 [22:27:58<3:48:05, 7.62s/it, loss=0.0002, acc=0.9979, iter_time=6.46s]
Epoch 1: 86%|████████▌ | 10589/12384 [22:28:05<3:48:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 86%|████████▌ | 10590/12384 [22:28:05<3:47:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 86%|████████▌ | 10590/12384 [22:28:13<3:47:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 86%|████████▌ | 10591/12384 [22:28:13<3:47:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 86%|████████▌ | 10591/12384 [22:28:21<3:47:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 1: 86%|████████▌ | 10592/12384 [22:28:21<3:47:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 1: 86%|████████▌ | 10592/12384 [22:28:28<3:47:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 86%|████████▌ | 10593/12384 [22:28:28<3:47:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 86%|████████▌ | 10593/12384 [22:28:36<3:47:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 1: 86%|████████▌ | 10594/12384 [22:28:36<3:47:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 1: 86%|████████▌ | 10594/12384 [22:28:44<3:47:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 1: 86%|████████▌ | 10595/12384 [22:28:44<3:47:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 1: 86%|████████▌ | 10595/12384 [22:28:51<3:47:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.05s]
Epoch 1: 86%|████████▌ | 10596/12384 [22:28:51<3:47:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.05s]
Epoch 1: 86%|████████▌ | 10596/12384 [22:28:59<3:47:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 1: 86%|████████▌ | 10597/12384 [22:28:59<3:47:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 1: 86%|████████▌ | 10597/12384 [22:29:06<3:47:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 86%|████████▌ | 10598/12384 [22:29:06<3:46:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 86%|████████▌ | 10598/12384 [22:29:14<3:46:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 86%|████████▌ | 10599/12384 [22:29:14<3:49:46, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 86%|████████▌ | 10599/12384 [22:29:22<3:49:46, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 1: 86%|████████▌ | 10600/12384 [22:29:22<3:48:31, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 1: 86%|████████▌ | 10600/12384 [22:29:30<3:48:31, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 86%|████████▌ | 10601/12384 [22:29:30<3:47:44, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 86%|████████▌ | 10601/12384 [22:29:37<3:47:44, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=5.27s]
Epoch 1: 86%|████████▌ | 10602/12384 [22:29:37<3:47:12, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=5.27s]
Epoch 1: 86%|████████▌ | 10602/12384 [22:29:45<3:47:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 1: 86%|████████▌ | 10603/12384 [22:29:45<3:46:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 1: 86%|████████▌ | 10603/12384 [22:29:52<3:46:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 86%|████████▌ | 10604/12384 [22:29:52<3:46:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 86%|████████▌ | 10604/12384 [22:30:00<3:46:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 86%|████████▌ | 10605/12384 [22:30:00<3:45:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 86%|████████▌ | 10605/12384 [22:30:08<3:45:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 86%|████████▌ | 10606/12384 [22:30:08<3:45:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 86%|████████▌ | 10606/12384 [22:30:15<3:45:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 86%|████████▌ | 10607/12384 [22:30:15<3:45:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 86%|████████▌ | 10607/12384 [22:30:23<3:45:18, 7.61s/it, loss=0.0015, acc=0.9943, iter_time=7.56s]
Epoch 1: 86%|████████▌ | 10608/12384 [22:30:23<3:45:19, 7.61s/it, loss=0.0015, acc=0.9943, iter_time=7.56s]
Epoch 1: 86%|████████▌ | 10608/12384 [22:30:30<3:45:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 1: 86%|████████▌ | 10609/12384 [22:30:30<3:44:57, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 1: 86%|████████▌ | 10609/12384 [22:30:38<3:44:57, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 86%|████████▌ | 10610/12384 [22:30:38<3:44:44, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 86%|████████▌ | 10610/12384 [22:30:46<3:44:44, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 1: 86%|████████▌ | 10611/12384 [22:30:46<3:44:27, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 1: 86%|████████▌ | 10611/12384 [22:30:53<3:44:27, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 1: 86%|████████▌ | 10612/12384 [22:30:53<3:44:14, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 1: 86%|████████▌ | 10612/12384 [22:31:01<3:44:14, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 86%|████████▌ | 10613/12384 [22:31:01<3:44:23, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 86%|████████▌ | 10613/12384 [22:31:08<3:44:23, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 86%|████████▌ | 10614/12384 [22:31:08<3:44:10, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 86%|████████▌ | 10614/12384 [22:31:16<3:44:10, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 1: 86%|████████▌ | 10615/12384 [22:31:16<3:44:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 1: 86%|████████▌ | 10615/12384 [22:31:24<3:44:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.62s]
Epoch 1: 86%|████████▌ | 10616/12384 [22:31:24<3:46:18, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.62s]
Epoch 1: 86%|████████▌ | 10616/12384 [22:31:31<3:46:18, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 1: 86%|████████▌ | 10617/12384 [22:31:31<3:45:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 1: 86%|████████▌ | 10617/12384 [22:31:39<3:45:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 86%|████████▌ | 10618/12384 [22:31:39<3:44:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 86%|████████▌ | 10618/12384 [22:31:47<3:44:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 86%|████████▌ | 10619/12384 [22:31:47<3:44:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 86%|████████▌ | 10619/12384 [22:31:54<3:44:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.28s]
Epoch 1: 86%|████████▌ | 10620/12384 [22:31:54<3:44:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.28s]
Epoch 1: 86%|████████▌ | 10620/12384 [22:32:02<3:44:11, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.82s]
Epoch 1: 86%|████████▌ | 10621/12384 [22:32:02<3:44:29, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.82s]
Epoch 1: 86%|████████▌ | 10621/12384 [22:32:10<3:44:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.09s]
Epoch 1: 86%|████████▌ | 10622/12384 [22:32:10<3:46:34, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=11.09s]
Epoch 1: 86%|████████▌ | 10622/12384 [22:32:17<3:46:34, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 86%|████████▌ | 10623/12384 [22:32:17<3:45:20, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 86%|████████▌ | 10623/12384 [22:32:25<3:45:20, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.91s]
Epoch 1: 86%|████████▌ | 10624/12384 [22:32:25<3:44:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.91s]
Epoch 1: 86%|████████▌ | 10624/12384 [22:32:33<3:44:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=3.72s]
Epoch 1: 86%|████████▌ | 10625/12384 [22:32:33<3:46:51, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=3.72s]
Epoch 1: 86%|████████▌ | 10625/12384 [22:32:41<3:46:51, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 1: 86%|████████▌ | 10626/12384 [22:32:41<3:45:32, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 1: 86%|████████▌ | 10626/12384 [22:32:48<3:45:32, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 1: 86%|████████▌ | 10627/12384 [22:32:48<3:44:47, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 1: 86%|████████▌ | 10627/12384 [22:32:56<3:44:47, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 86%|████████▌ | 10628/12384 [22:32:56<3:43:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 86%|████████▌ | 10628/12384 [22:33:03<3:43:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 86%|████████▌ | 10629/12384 [22:33:03<3:43:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 86%|████████▌ | 10629/12384 [22:33:11<3:43:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 1: 86%|████████▌ | 10630/12384 [22:33:11<3:43:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 1: 86%|████████▌ | 10630/12384 [22:33:19<3:43:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 1: 86%|████████▌ | 10631/12384 [22:33:19<3:43:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 1: 86%|████████▌ | 10631/12384 [22:33:26<3:43:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.03s]
Epoch 1: 86%|████████▌ | 10632/12384 [22:33:26<3:42:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.03s]
Epoch 1: 86%|████████▌ | 10632/12384 [22:33:34<3:42:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 86%|████████▌ | 10633/12384 [22:33:34<3:42:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 86%|████████▌ | 10633/12384 [22:33:42<3:42:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 1: 86%|████████▌ | 10634/12384 [22:33:42<3:42:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 1: 86%|████████▌ | 10634/12384 [22:33:49<3:42:30, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.12s]
Epoch 1: 86%|████████▌ | 10635/12384 [22:33:49<3:42:11, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.12s]
Epoch 1: 86%|████████▌ | 10635/12384 [22:33:57<3:42:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 86%|████████▌ | 10636/12384 [22:33:57<3:42:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 86%|████████▌ | 10636/12384 [22:34:04<3:42:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.56s]
Epoch 1: 86%|████████▌ | 10637/12384 [22:34:04<3:42:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.56s]
Epoch 1: 86%|████████▌ | 10637/12384 [22:34:12<3:42:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.96s]
Epoch 1: 86%|████████▌ | 10638/12384 [22:34:12<3:41:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.96s]
Epoch 1: 86%|████████▌ | 10638/12384 [22:34:20<3:41:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 1: 86%|████████▌ | 10639/12384 [22:34:20<3:41:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 1: 86%|████████▌ | 10639/12384 [22:34:27<3:41:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 86%|████████▌ | 10640/12384 [22:34:27<3:41:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 86%|████████▌ | 10640/12384 [22:34:35<3:41:39, 7.63s/it, loss=0.0003, acc=0.9992, iter_time=4.41s]
Epoch 1: 86%|████████▌ | 10641/12384 [22:34:35<3:41:16, 7.62s/it, loss=0.0003, acc=0.9992, iter_time=4.41s]
Epoch 1: 86%|████████▌ | 10641/12384 [22:34:43<3:41:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 1: 86%|████████▌ | 10642/12384 [22:34:43<3:41:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 1: 86%|████████▌ | 10642/12384 [22:34:50<3:41:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.62s]
Epoch 1: 86%|████████▌ | 10643/12384 [22:34:50<3:40:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.62s]
Epoch 1: 86%|████████▌ | 10643/12384 [22:34:58<3:40:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 1: 86%|████████▌ | 10644/12384 [22:34:58<3:40:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 1: 86%|████████▌ | 10644/12384 [22:35:05<3:40:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 86%|████████▌ | 10645/12384 [22:35:05<3:40:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 86%|████████▌ | 10645/12384 [22:35:13<3:40:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 86%|████████▌ | 10646/12384 [22:35:13<3:40:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 86%|████████▌ | 10646/12384 [22:35:21<3:40:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 86%|████████▌ | 10647/12384 [22:35:21<3:40:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 86%|████████▌ | 10647/12384 [22:35:28<3:40:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 86%|████████▌ | 10648/12384 [22:35:28<3:40:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 86%|████████▌ | 10648/12384 [22:35:36<3:40:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 86%|████████▌ | 10649/12384 [22:35:36<3:40:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 86%|████████▌ | 10649/12384 [22:35:43<3:40:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 86%|████████▌ | 10650/12384 [22:35:43<3:39:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 86%|████████▌ | 10650/12384 [22:35:51<3:39:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 1: 86%|████████▌ | 10651/12384 [22:35:51<3:42:52, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 1: 86%|████████▌ | 10651/12384 [22:35:59<3:42:52, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 1: 86%|████████▌ | 10652/12384 [22:35:59<3:41:49, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 1: 86%|████████▌ | 10652/12384 [22:36:07<3:41:49, 7.68s/it, loss=0.0001, acc=0.9999, iter_time=8.26s]
Epoch 1: 86%|████████▌ | 10653/12384 [22:36:07<3:41:01, 7.66s/it, loss=0.0001, acc=0.9999, iter_time=8.26s]
Epoch 1: 86%|████████▌ | 10653/12384 [22:36:14<3:41:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 86%|████████▌ | 10654/12384 [22:36:14<3:40:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 86%|████████▌ | 10654/12384 [22:36:22<3:40:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 86%|████████▌ | 10655/12384 [22:36:22<3:40:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 86%|████████▌ | 10655/12384 [22:36:29<3:40:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 1: 86%|████████▌ | 10656/12384 [22:36:29<3:39:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 1: 86%|████████▌ | 10656/12384 [22:36:37<3:39:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.21s]
Epoch 1: 86%|████████▌ | 10657/12384 [22:36:37<3:39:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.21s]
Epoch 1: 86%|████████▌ | 10657/12384 [22:36:45<3:39:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.69s]
Epoch 1: 86%|████████▌ | 10658/12384 [22:36:45<3:39:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.69s]
Epoch 1: 86%|████████▌ | 10658/12384 [22:36:52<3:39:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 86%|████████▌ | 10659/12384 [22:36:52<3:38:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 86%|████████▌ | 10659/12384 [22:37:00<3:38:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 86%|████████▌ | 10660/12384 [22:37:00<3:38:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 86%|████████▌ | 10660/12384 [22:37:07<3:38:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 86%|████████▌ | 10661/12384 [22:37:07<3:38:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 86%|████████▌ | 10661/12384 [22:37:15<3:38:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 86%|████████▌ | 10662/12384 [22:37:15<3:38:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 86%|████████▌ | 10662/12384 [22:37:23<3:38:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 86%|████████▌ | 10663/12384 [22:37:23<3:38:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 86%|████████▌ | 10663/12384 [22:37:30<3:38:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 86%|████████▌ | 10664/12384 [22:37:30<3:38:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 86%|████████▌ | 10664/12384 [22:37:38<3:38:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 86%|████████▌ | 10665/12384 [22:37:38<3:38:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 86%|████████▌ | 10665/12384 [22:37:46<3:38:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 86%|████████▌ | 10666/12384 [22:37:46<3:37:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 86%|████████▌ | 10666/12384 [22:37:53<3:37:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 1: 86%|████████▌ | 10667/12384 [22:37:53<3:37:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 1: 86%|████████▌ | 10667/12384 [22:38:01<3:37:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.25s]
Epoch 1: 86%|████████▌ | 10668/12384 [22:38:01<3:37:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.25s]
Epoch 1: 86%|████████▌ | 10668/12384 [22:38:08<3:37:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 86%|████████▌ | 10669/12384 [22:38:08<3:37:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 86%|████████▌ | 10669/12384 [22:38:16<3:37:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 86%|████████▌ | 10670/12384 [22:38:16<3:37:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 86%|████████▌ | 10670/12384 [22:38:24<3:37:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 86%|████████▌ | 10671/12384 [22:38:24<3:37:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 86%|████████▌ | 10671/12384 [22:38:31<3:37:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 86%|████████▌ | 10672/12384 [22:38:31<3:37:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 86%|████████▌ | 10672/12384 [22:38:39<3:37:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 86%|████████▌ | 10673/12384 [22:38:39<3:37:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 86%|████████▌ | 10673/12384 [22:38:46<3:37:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 86%|████████▌ | 10674/12384 [22:38:46<3:37:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 86%|████████▌ | 10674/12384 [22:38:54<3:37:24, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.13s]
Epoch 1: 86%|████████▌ | 10675/12384 [22:38:54<3:37:06, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.13s]
Epoch 1: 86%|████████▌ | 10675/12384 [22:39:02<3:37:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 1: 86%|████████▌ | 10676/12384 [22:39:02<3:36:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 1: 86%|████████▌ | 10676/12384 [22:39:10<3:36:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 86%|████████▌ | 10677/12384 [22:39:10<3:39:16, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 86%|████████▌ | 10677/12384 [22:39:17<3:39:16, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.58s]
Epoch 1: 86%|████████▌ | 10678/12384 [22:39:17<3:38:08, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.58s]
Epoch 1: 86%|████████▌ | 10678/12384 [22:39:25<3:38:08, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 1: 86%|████████▌ | 10679/12384 [22:39:25<3:37:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 1: 86%|████████▌ | 10679/12384 [22:39:32<3:37:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 86%|████████▌ | 10680/12384 [22:39:32<3:36:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 86%|████████▌ | 10680/12384 [22:39:40<3:36:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.41s]
Epoch 1: 86%|████████▌ | 10681/12384 [22:39:40<3:36:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.41s]
Epoch 1: 86%|████████▌ | 10681/12384 [22:39:48<3:36:30, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.89s]
Epoch 1: 86%|████████▋ | 10682/12384 [22:39:48<3:36:19, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.89s]
Epoch 1: 86%|████████▋ | 10682/12384 [22:39:55<3:36:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.20s]
Epoch 1: 86%|████████▋ | 10683/12384 [22:39:55<3:36:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.20s]
Epoch 1: 86%|████████▋ | 10683/12384 [22:40:03<3:36:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 86%|████████▋ | 10684/12384 [22:40:03<3:36:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 86%|████████▋ | 10684/12384 [22:40:11<3:36:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 86%|████████▋ | 10685/12384 [22:40:11<3:35:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 86%|████████▋ | 10685/12384 [22:40:18<3:35:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.77s]
Epoch 1: 86%|████████▋ | 10686/12384 [22:40:18<3:35:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.77s]
Epoch 1: 86%|████████▋ | 10686/12384 [22:40:26<3:35:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 1: 86%|████████▋ | 10687/12384 [22:40:26<3:35:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 1: 86%|████████▋ | 10687/12384 [22:40:33<3:35:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 86%|████████▋ | 10688/12384 [22:40:33<3:35:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 86%|████████▋ | 10688/12384 [22:40:41<3:35:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 86%|████████▋ | 10689/12384 [22:40:41<3:34:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 86%|████████▋ | 10689/12384 [22:40:49<3:34:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 1: 86%|████████▋ | 10690/12384 [22:40:49<3:34:34, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 1: 86%|████████▋ | 10690/12384 [22:40:56<3:34:34, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 1: 86%|████████▋ | 10691/12384 [22:40:56<3:35:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 1: 86%|████████▋ | 10691/12384 [22:41:04<3:35:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 1: 86%|████████▋ | 10692/12384 [22:41:04<3:34:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 1: 86%|████████▋ | 10692/12384 [22:41:11<3:34:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.04s]
Epoch 1: 86%|████████▋ | 10693/12384 [22:41:11<3:34:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.04s]
Epoch 1: 86%|████████▋ | 10693/12384 [22:41:19<3:34:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 1: 86%|████████▋ | 10694/12384 [22:41:19<3:35:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 1: 86%|████████▋ | 10694/12384 [22:41:27<3:35:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.85s]
Epoch 1: 86%|████████▋ | 10695/12384 [22:41:27<3:34:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.85s]
Epoch 1: 86%|████████▋ | 10695/12384 [22:41:34<3:34:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.85s]
Epoch 1: 86%|████████▋ | 10696/12384 [22:41:34<3:34:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.85s]
Epoch 1: 86%|████████▋ | 10696/12384 [22:41:42<3:34:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.40s]
Epoch 1: 86%|████████▋ | 10697/12384 [22:41:42<3:34:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.40s]
Epoch 1: 86%|████████▋ | 10697/12384 [22:41:50<3:34:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.43s]
Epoch 1: 86%|████████▋ | 10698/12384 [22:41:50<3:33:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.43s]
Epoch 1: 86%|████████▋ | 10698/12384 [22:41:57<3:33:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.31s]
Epoch 1: 86%|████████▋ | 10699/12384 [22:41:57<3:33:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.31s]
Epoch 1: 86%|████████▋ | 10699/12384 [22:42:05<3:33:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.59s]
Epoch 1: 86%|████████▋ | 10700/12384 [22:42:05<3:33:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.59s]
Epoch 1: 86%|████████▋ | 10700/12384 [22:42:13<3:33:41, 7.61s/it, loss=0.0001, acc=0.9993, iter_time=8.24s]
Epoch 1: 86%|████████▋ | 10701/12384 [22:42:13<3:36:03, 7.70s/it, loss=0.0001, acc=0.9993, iter_time=8.24s]
Epoch 1: 86%|████████▋ | 10701/12384 [22:42:20<3:36:03, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 86%|████████▋ | 10702/12384 [22:42:20<3:35:15, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 86%|████████▋ | 10702/12384 [22:42:28<3:35:15, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 86%|████████▋ | 10703/12384 [22:42:28<3:34:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 86%|████████▋ | 10703/12384 [22:42:36<3:34:18, 7.65s/it, loss=0.0004, acc=0.9980, iter_time=8.05s]
Epoch 1: 86%|████████▋ | 10704/12384 [22:42:36<3:36:47, 7.74s/it, loss=0.0004, acc=0.9980, iter_time=8.05s]
Epoch 1: 86%|████████▋ | 10704/12384 [22:42:43<3:36:47, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.48s]
Epoch 1: 86%|████████▋ | 10705/12384 [22:42:43<3:35:30, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.48s]
Epoch 1: 86%|████████▋ | 10705/12384 [22:42:51<3:35:30, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 86%|████████▋ | 10706/12384 [22:42:51<3:34:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 86%|████████▋ | 10706/12384 [22:42:59<3:34:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 86%|████████▋ | 10707/12384 [22:42:59<3:34:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 86%|████████▋ | 10707/12384 [22:43:06<3:34:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 86%|████████▋ | 10708/12384 [22:43:06<3:33:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 86%|████████▋ | 10708/12384 [22:43:14<3:33:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 86%|████████▋ | 10709/12384 [22:43:14<3:33:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 86%|████████▋ | 10709/12384 [22:43:22<3:33:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 1: 86%|████████▋ | 10710/12384 [22:43:22<3:32:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 1: 86%|████████▋ | 10710/12384 [22:43:29<3:32:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 1: 86%|████████▋ | 10711/12384 [22:43:29<3:33:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 1: 86%|████████▋ | 10711/12384 [22:43:37<3:33:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 86%|████████▋ | 10712/12384 [22:43:37<3:32:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 86%|████████▋ | 10712/12384 [22:43:44<3:32:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.00s]
Epoch 1: 87%|████████▋ | 10713/12384 [22:43:44<3:32:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.00s]
Epoch 1: 87%|████████▋ | 10713/12384 [22:43:52<3:32:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 87%|████████▋ | 10714/12384 [22:43:52<3:31:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 87%|████████▋ | 10714/12384 [22:44:00<3:31:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 87%|████████▋ | 10715/12384 [22:44:00<3:31:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 87%|████████▋ | 10715/12384 [22:44:07<3:31:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 87%|████████▋ | 10716/12384 [22:44:07<3:31:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 87%|████████▋ | 10716/12384 [22:44:15<3:31:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 87%|████████▋ | 10717/12384 [22:44:15<3:31:17, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 87%|████████▋ | 10717/12384 [22:44:22<3:31:17, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 87%|████████▋ | 10718/12384 [22:44:22<3:31:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 87%|████████▋ | 10718/12384 [22:44:30<3:31:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 87%|████████▋ | 10719/12384 [22:44:30<3:30:58, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 87%|████████▋ | 10719/12384 [22:44:38<3:30:58, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 87%|████████▋ | 10720/12384 [22:44:38<3:30:53, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 87%|████████▋ | 10720/12384 [22:44:45<3:30:53, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 87%|████████▋ | 10721/12384 [22:44:45<3:30:41, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 87%|████████▋ | 10721/12384 [22:44:53<3:30:41, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 87%|████████▋ | 10722/12384 [22:44:53<3:30:32, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 87%|████████▋ | 10722/12384 [22:45:00<3:30:32, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 87%|████████▋ | 10723/12384 [22:45:00<3:30:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 87%|████████▋ | 10723/12384 [22:45:08<3:30:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 87%|████████▋ | 10724/12384 [22:45:08<3:30:12, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 87%|████████▋ | 10724/12384 [22:45:16<3:30:12, 7.60s/it, loss=0.0005, acc=0.9992, iter_time=6.15s]
Epoch 1: 87%|████████▋ | 10725/12384 [22:45:16<3:29:55, 7.59s/it, loss=0.0005, acc=0.9992, iter_time=6.15s]
Epoch 1: 87%|████████▋ | 10725/12384 [22:45:23<3:29:55, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 1: 87%|████████▋ | 10726/12384 [22:45:23<3:30:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 1: 87%|████████▋ | 10726/12384 [22:45:31<3:30:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.57s]
Epoch 1: 87%|████████▋ | 10727/12384 [22:45:31<3:32:30, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.57s]
Epoch 1: 87%|████████▋ | 10727/12384 [22:45:39<3:32:30, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 87%|████████▋ | 10728/12384 [22:45:39<3:32:02, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 87%|████████▋ | 10728/12384 [22:45:46<3:32:02, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 87%|████████▋ | 10729/12384 [22:45:46<3:31:40, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 87%|████████▋ | 10729/12384 [22:45:54<3:31:40, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 1: 87%|████████▋ | 10730/12384 [22:45:54<3:33:42, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 1: 87%|████████▋ | 10730/12384 [22:46:02<3:33:42, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 87%|████████▋ | 10731/12384 [22:46:02<3:32:22, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 87%|████████▋ | 10731/12384 [22:46:10<3:32:22, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 87%|████████▋ | 10732/12384 [22:46:10<3:31:27, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 87%|████████▋ | 10732/12384 [22:46:17<3:31:27, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 87%|████████▋ | 10733/12384 [22:46:17<3:30:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 87%|████████▋ | 10733/12384 [22:46:25<3:30:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.54s]
Epoch 1: 87%|████████▋ | 10734/12384 [22:46:25<3:30:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.54s]
Epoch 1: 87%|████████▋ | 10734/12384 [22:46:32<3:30:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.34s]
Epoch 1: 87%|████████▋ | 10735/12384 [22:46:32<3:29:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.34s]
Epoch 1: 87%|████████▋ | 10735/12384 [22:46:40<3:29:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.33s]
Epoch 1: 87%|████████▋ | 10736/12384 [22:46:40<3:29:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.33s]
Epoch 1: 87%|████████▋ | 10736/12384 [22:46:48<3:29:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 87%|████████▋ | 10737/12384 [22:46:48<3:29:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 87%|████████▋ | 10737/12384 [22:46:55<3:29:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 87%|████████▋ | 10738/12384 [22:46:55<3:28:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 87%|████████▋ | 10738/12384 [22:47:03<3:28:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 87%|████████▋ | 10739/12384 [22:47:03<3:28:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 87%|████████▋ | 10739/12384 [22:47:10<3:28:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 1: 87%|████████▋ | 10740/12384 [22:47:10<3:28:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 1: 87%|████████▋ | 10740/12384 [22:47:18<3:28:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 87%|████████▋ | 10741/12384 [22:47:18<3:28:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 87%|████████▋ | 10741/12384 [22:47:26<3:28:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 1: 87%|████████▋ | 10742/12384 [22:47:26<3:28:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 1: 87%|████████▋ | 10742/12384 [22:47:33<3:28:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 87%|████████▋ | 10743/12384 [22:47:33<3:28:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 87%|████████▋ | 10743/12384 [22:47:41<3:28:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 87%|████████▋ | 10744/12384 [22:47:41<3:28:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 87%|████████▋ | 10744/12384 [22:47:49<3:28:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 87%|████████▋ | 10745/12384 [22:47:49<3:28:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 87%|████████▋ | 10745/12384 [22:47:56<3:28:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 1: 87%|████████▋ | 10746/12384 [22:47:56<3:28:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 1: 87%|████████▋ | 10746/12384 [22:48:04<3:28:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 1: 87%|████████▋ | 10747/12384 [22:48:04<3:27:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 1: 87%|████████▋ | 10747/12384 [22:48:11<3:27:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.35s]
Epoch 1: 87%|████████▋ | 10748/12384 [22:48:11<3:27:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.35s]
Epoch 1: 87%|████████▋ | 10748/12384 [22:48:19<3:27:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 87%|████████▋ | 10749/12384 [22:48:19<3:27:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 87%|████████▋ | 10749/12384 [22:48:27<3:27:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 87%|████████▋ | 10750/12384 [22:48:27<3:27:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 87%|████████▋ | 10750/12384 [22:48:34<3:27:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 87%|████████▋ | 10751/12384 [22:48:34<3:26:50, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 87%|████████▋ | 10751/12384 [22:48:42<3:26:50, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 87%|████████▋ | 10752/12384 [22:48:42<3:26:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 87%|████████▋ | 10752/12384 [22:48:49<3:26:47, 7.60s/it, loss=0.0002, acc=1.0000, iter_time=5.43s]
Epoch 1: 87%|████████▋ | 10753/12384 [22:48:49<3:26:43, 7.60s/it, loss=0.0002, acc=1.0000, iter_time=5.43s]
Epoch 1: 87%|████████▋ | 10753/12384 [22:48:57<3:26:43, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 1: 87%|████████▋ | 10754/12384 [22:48:57<3:26:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 1: 87%|████████▋ | 10754/12384 [22:49:05<3:26:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 1: 87%|████████▋ | 10755/12384 [22:49:05<3:26:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 1: 87%|████████▋ | 10755/12384 [22:49:12<3:26:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 1: 87%|████████▋ | 10756/12384 [22:49:12<3:26:12, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 1: 87%|████████▋ | 10756/12384 [22:49:20<3:26:12, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 1: 87%|████████▋ | 10757/12384 [22:49:20<3:28:52, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 1: 87%|████████▋ | 10757/12384 [22:49:28<3:28:52, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.12s]
Epoch 1: 87%|████████▋ | 10758/12384 [22:49:28<3:28:00, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.12s]
Epoch 1: 87%|████████▋ | 10758/12384 [22:49:35<3:28:00, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 1: 87%|████████▋ | 10759/12384 [22:49:35<3:27:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 1: 87%|████████▋ | 10759/12384 [22:49:43<3:27:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 87%|████████▋ | 10760/12384 [22:49:43<3:26:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 87%|████████▋ | 10760/12384 [22:49:51<3:26:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 87%|████████▋ | 10761/12384 [22:49:51<3:26:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 87%|████████▋ | 10761/12384 [22:49:58<3:26:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 87%|████████▋ | 10762/12384 [22:49:58<3:26:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 87%|████████▋ | 10762/12384 [22:50:06<3:26:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 87%|████████▋ | 10763/12384 [22:50:06<3:25:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 87%|████████▋ | 10763/12384 [22:50:13<3:25:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 1: 87%|████████▋ | 10764/12384 [22:50:13<3:25:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 1: 87%|████████▋ | 10764/12384 [22:50:21<3:25:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 87%|████████▋ | 10765/12384 [22:50:21<3:25:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 87%|████████▋ | 10765/12384 [22:50:29<3:25:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 87%|████████▋ | 10766/12384 [22:50:29<3:25:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 87%|████████▋ | 10766/12384 [22:50:36<3:25:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.71s]
Epoch 1: 87%|████████▋ | 10767/12384 [22:50:36<3:25:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.71s]
Epoch 1: 87%|████████▋ | 10767/12384 [22:50:44<3:25:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 1: 87%|████████▋ | 10768/12384 [22:50:44<3:24:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 1: 87%|████████▋ | 10768/12384 [22:50:51<3:24:52, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.20s]
Epoch 1: 87%|████████▋ | 10769/12384 [22:50:51<3:24:46, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.20s]
Epoch 1: 87%|████████▋ | 10769/12384 [22:50:59<3:24:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 1: 87%|████████▋ | 10770/12384 [22:50:59<3:24:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 1: 87%|████████▋ | 10770/12384 [22:51:07<3:24:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 1: 87%|████████▋ | 10771/12384 [22:51:07<3:24:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 1: 87%|████████▋ | 10771/12384 [22:51:14<3:24:36, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 87%|████████▋ | 10772/12384 [22:51:14<3:24:27, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 87%|████████▋ | 10772/12384 [22:51:22<3:24:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 87%|████████▋ | 10773/12384 [22:51:22<3:24:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 87%|████████▋ | 10773/12384 [22:51:30<3:24:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 87%|████████▋ | 10774/12384 [22:51:30<3:24:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 87%|████████▋ | 10774/12384 [22:51:37<3:24:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 87%|████████▋ | 10775/12384 [22:51:37<3:24:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 87%|████████▋ | 10775/12384 [22:51:45<3:24:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 1: 87%|████████▋ | 10776/12384 [22:51:45<3:24:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 1: 87%|████████▋ | 10776/12384 [22:51:52<3:24:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.89s]
Epoch 1: 87%|████████▋ | 10777/12384 [22:51:52<3:23:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.89s]
Epoch 1: 87%|████████▋ | 10777/12384 [22:52:00<3:23:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 1: 87%|████████▋ | 10778/12384 [22:52:00<3:23:32, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 1: 87%|████████▋ | 10778/12384 [22:52:08<3:23:32, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 1: 87%|████████▋ | 10779/12384 [22:52:08<3:25:44, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 1: 87%|████████▋ | 10779/12384 [22:52:15<3:25:44, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.56s]
Epoch 1: 87%|████████▋ | 10780/12384 [22:52:15<3:24:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.56s]
Epoch 1: 87%|████████▋ | 10780/12384 [22:52:23<3:24:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.62s]
Epoch 1: 87%|████████▋ | 10781/12384 [22:52:23<3:24:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.62s]
Epoch 1: 87%|████████▋ | 10781/12384 [22:52:31<3:24:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.63s]
Epoch 1: 87%|████████▋ | 10782/12384 [22:52:31<3:23:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.63s]
Epoch 1: 87%|████████▋ | 10782/12384 [22:52:39<3:23:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 87%|████████▋ | 10783/12384 [22:52:39<3:26:33, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 87%|████████▋ | 10783/12384 [22:52:46<3:26:33, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 1: 87%|████████▋ | 10784/12384 [22:52:46<3:25:28, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 1: 87%|████████▋ | 10784/12384 [22:52:54<3:25:28, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 87%|████████▋ | 10785/12384 [22:52:54<3:24:37, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 87%|████████▋ | 10785/12384 [22:53:01<3:24:37, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 87%|████████▋ | 10786/12384 [22:53:01<3:23:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 87%|████████▋ | 10786/12384 [22:53:09<3:23:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 1: 87%|████████▋ | 10787/12384 [22:53:09<3:23:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 1: 87%|████████▋ | 10787/12384 [22:53:17<3:23:10, 7.63s/it, loss=0.0002, acc=0.9982, iter_time=10.39s]
Epoch 1: 87%|████████▋ | 10788/12384 [22:53:17<3:22:57, 7.63s/it, loss=0.0002, acc=0.9982, iter_time=10.39s]
Epoch 1: 87%|████████▋ | 10788/12384 [22:53:24<3:22:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 87%|████████▋ | 10789/12384 [22:53:24<3:22:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 87%|████████▋ | 10789/12384 [22:53:32<3:22:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 87%|████████▋ | 10790/12384 [22:53:32<3:22:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 87%|████████▋ | 10790/12384 [22:53:40<3:22:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 1: 87%|████████▋ | 10791/12384 [22:53:40<3:22:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 1: 87%|████████▋ | 10791/12384 [22:53:47<3:22:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.22s]
Epoch 1: 87%|████████▋ | 10792/12384 [22:53:47<3:22:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.22s]
Epoch 1: 87%|████████▋ | 10792/12384 [22:53:55<3:22:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 87%|████████▋ | 10793/12384 [22:53:55<3:21:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 87%|████████▋ | 10793/12384 [22:54:02<3:21:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 1: 87%|████████▋ | 10794/12384 [22:54:02<3:21:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 1: 87%|████████▋ | 10794/12384 [22:54:10<3:21:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 1: 87%|████████▋ | 10795/12384 [22:54:10<3:21:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 1: 87%|████████▋ | 10795/12384 [22:54:18<3:21:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 87%|████████▋ | 10796/12384 [22:54:18<3:21:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 87%|████████▋ | 10796/12384 [22:54:25<3:21:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 87%|████████▋ | 10797/12384 [22:54:25<3:21:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 87%|████████▋ | 10797/12384 [22:54:33<3:21:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 87%|████████▋ | 10798/12384 [22:54:33<3:21:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 87%|████████▋ | 10798/12384 [22:54:40<3:21:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 1: 87%|████████▋ | 10799/12384 [22:54:40<3:21:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 1: 87%|████████▋ | 10799/12384 [22:54:48<3:21:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.76s]
Epoch 1: 87%|████████▋ | 10800/12384 [22:54:48<3:20:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.76s]
Epoch 1: 87%|████████▋ | 10800/12384 [22:54:56<3:20:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 87%|████████▋ | 10801/12384 [22:54:56<3:20:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 87%|████████▋ | 10801/12384 [22:55:03<3:20:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 87%|████████▋ | 10802/12384 [22:55:03<3:20:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 87%|████████▋ | 10802/12384 [22:55:11<3:20:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 1: 87%|████████▋ | 10803/12384 [22:55:11<3:21:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 1: 87%|████████▋ | 10803/12384 [22:55:19<3:21:04, 7.63s/it, loss=0.0011, acc=0.9973, iter_time=5.85s]
Epoch 1: 87%|████████▋ | 10804/12384 [22:55:19<3:20:38, 7.62s/it, loss=0.0011, acc=0.9973, iter_time=5.85s]
Epoch 1: 87%|████████▋ | 10804/12384 [22:55:26<3:20:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 1: 87%|████████▋ | 10805/12384 [22:55:26<3:20:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 1: 87%|████████▋ | 10805/12384 [22:55:34<3:20:18, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=7.90s]
Epoch 1: 87%|████████▋ | 10806/12384 [22:55:34<3:22:28, 7.70s/it, loss=0.0001, acc=0.9998, iter_time=7.90s]
Epoch 1: 87%|████████▋ | 10806/12384 [22:55:42<3:22:28, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 87%|████████▋ | 10807/12384 [22:55:42<3:21:39, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 87%|████████▋ | 10807/12384 [22:55:49<3:21:39, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 87%|████████▋ | 10808/12384 [22:55:49<3:21:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 87%|████████▋ | 10808/12384 [22:55:57<3:21:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 87%|████████▋ | 10809/12384 [22:55:57<3:23:02, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 87%|████████▋ | 10809/12384 [22:56:05<3:23:02, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 87%|████████▋ | 10810/12384 [22:56:05<3:21:52, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 87%|████████▋ | 10810/12384 [22:56:12<3:21:52, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 87%|████████▋ | 10811/12384 [22:56:12<3:21:04, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 87%|████████▋ | 10811/12384 [22:56:20<3:21:04, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.33s]
Epoch 1: 87%|████████▋ | 10812/12384 [22:56:20<3:20:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.33s]
Epoch 1: 87%|████████▋ | 10812/12384 [22:56:28<3:20:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 1: 87%|████████▋ | 10813/12384 [22:56:28<3:19:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 1: 87%|████████▋ | 10813/12384 [22:56:35<3:19:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 87%|████████▋ | 10814/12384 [22:56:35<3:19:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 87%|████████▋ | 10814/12384 [22:56:43<3:19:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.85s]
Epoch 1: 87%|████████▋ | 10815/12384 [22:56:43<3:19:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.85s]
Epoch 1: 87%|████████▋ | 10815/12384 [22:56:50<3:19:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 1: 87%|████████▋ | 10816/12384 [22:56:50<3:18:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 1: 87%|████████▋ | 10816/12384 [22:56:58<3:18:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 1: 87%|████████▋ | 10817/12384 [22:56:58<3:18:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 1: 87%|████████▋ | 10817/12384 [22:57:06<3:18:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 1: 87%|████████▋ | 10818/12384 [22:57:06<3:18:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 1: 87%|████████▋ | 10818/12384 [22:57:13<3:18:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 87%|████████▋ | 10819/12384 [22:57:13<3:18:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 87%|████████▋ | 10819/12384 [22:57:21<3:18:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 87%|████████▋ | 10820/12384 [22:57:21<3:18:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 87%|████████▋ | 10820/12384 [22:57:28<3:18:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 87%|████████▋ | 10821/12384 [22:57:28<3:18:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 87%|████████▋ | 10821/12384 [22:57:36<3:18:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 87%|████████▋ | 10822/12384 [22:57:36<3:18:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 87%|████████▋ | 10822/12384 [22:57:44<3:18:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 87%|████████▋ | 10823/12384 [22:57:44<3:17:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 87%|████████▋ | 10823/12384 [22:57:51<3:17:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.91s]
Epoch 1: 87%|████████▋ | 10824/12384 [22:57:51<3:17:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.91s]
Epoch 1: 87%|████████▋ | 10824/12384 [22:57:59<3:17:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 87%|████████▋ | 10825/12384 [22:57:59<3:17:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 87%|████████▋ | 10825/12384 [22:58:07<3:17:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 87%|████████▋ | 10826/12384 [22:58:07<3:17:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 87%|████████▋ | 10826/12384 [22:58:14<3:17:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 1: 87%|████████▋ | 10827/12384 [22:58:14<3:17:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 1: 87%|████████▋ | 10827/12384 [22:58:22<3:17:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.49s]
Epoch 1: 87%|████████▋ | 10828/12384 [22:58:22<3:17:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.49s]
Epoch 1: 87%|████████▋ | 10828/12384 [22:58:29<3:17:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.80s]
Epoch 1: 87%|████████▋ | 10829/12384 [22:58:29<3:17:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.80s]
Epoch 1: 87%|████████▋ | 10829/12384 [22:58:37<3:17:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 87%|████████▋ | 10830/12384 [22:58:37<3:17:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 87%|████████▋ | 10830/12384 [22:58:45<3:17:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.51s]
Epoch 1: 87%|████████▋ | 10831/12384 [22:58:45<3:17:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.51s]
Epoch 1: 87%|████████▋ | 10831/12384 [22:58:52<3:17:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.10s]
Epoch 1: 87%|████████▋ | 10832/12384 [22:58:52<3:16:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.10s]
Epoch 1: 87%|████████▋ | 10832/12384 [22:59:00<3:16:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 87%|████████▋ | 10833/12384 [22:59:00<3:16:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 87%|████████▋ | 10833/12384 [22:59:07<3:16:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.80s]
Epoch 1: 87%|████████▋ | 10834/12384 [22:59:07<3:16:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.80s]
Epoch 1: 87%|████████▋ | 10834/12384 [22:59:15<3:16:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.53s]
Epoch 1: 87%|████████▋ | 10835/12384 [22:59:15<3:19:04, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=11.53s]
Epoch 1: 87%|████████▋ | 10835/12384 [22:59:23<3:19:04, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 1: 88%|████████▊ | 10836/12384 [22:59:23<3:18:06, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 1: 88%|████████▊ | 10836/12384 [22:59:31<3:18:06, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 1: 88%|████████▊ | 10837/12384 [22:59:31<3:17:25, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 1: 88%|████████▊ | 10837/12384 [22:59:38<3:17:25, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 1: 88%|████████▊ | 10838/12384 [22:59:38<3:17:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 1: 88%|████████▊ | 10838/12384 [22:59:46<3:17:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 88%|████████▊ | 10839/12384 [22:59:46<3:16:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 88%|████████▊ | 10839/12384 [22:59:53<3:16:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 88%|████████▊ | 10840/12384 [22:59:53<3:16:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 88%|████████▊ | 10840/12384 [23:00:01<3:16:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 88%|████████▊ | 10841/12384 [23:00:01<3:15:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 88%|████████▊ | 10841/12384 [23:00:09<3:15:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 88%|████████▊ | 10842/12384 [23:00:09<3:16:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 88%|████████▊ | 10842/12384 [23:00:16<3:16:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 88%|████████▊ | 10843/12384 [23:00:16<3:15:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 88%|████████▊ | 10843/12384 [23:00:24<3:15:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 88%|████████▊ | 10844/12384 [23:00:24<3:15:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 1: 88%|████████▊ | 10844/12384 [23:00:32<3:15:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 88%|████████▊ | 10845/12384 [23:00:32<3:15:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 88%|████████▊ | 10845/12384 [23:00:39<3:15:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 88%|████████▊ | 10846/12384 [23:00:39<3:15:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 88%|████████▊ | 10846/12384 [23:00:47<3:15:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.98s]
Epoch 1: 88%|████████▊ | 10847/12384 [23:00:47<3:15:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.98s]
Epoch 1: 88%|████████▊ | 10847/12384 [23:00:54<3:15:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 1: 88%|████████▊ | 10848/12384 [23:00:54<3:14:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 1: 88%|████████▊ | 10848/12384 [23:01:02<3:14:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.29s]
Epoch 1: 88%|████████▊ | 10849/12384 [23:01:02<3:14:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.29s]
Epoch 1: 88%|████████▊ | 10849/12384 [23:01:10<3:14:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.95s]
Epoch 1: 88%|████████▊ | 10850/12384 [23:01:10<3:14:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.95s]
Epoch 1: 88%|████████▊ | 10850/12384 [23:01:17<3:14:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 88%|████████▊ | 10851/12384 [23:01:17<3:14:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 88%|████████▊ | 10851/12384 [23:01:25<3:14:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 88%|████████▊ | 10852/12384 [23:01:25<3:14:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 88%|████████▊ | 10852/12384 [23:01:32<3:14:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 88%|████████▊ | 10853/12384 [23:01:32<3:14:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 88%|████████▊ | 10853/12384 [23:01:40<3:14:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 1: 88%|████████▊ | 10854/12384 [23:01:40<3:14:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 1: 88%|████████▊ | 10854/12384 [23:01:48<3:14:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.63s]
Epoch 1: 88%|████████▊ | 10855/12384 [23:01:48<3:13:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.63s]
Epoch 1: 88%|████████▊ | 10855/12384 [23:01:55<3:13:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 88%|████████▊ | 10856/12384 [23:01:55<3:13:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 88%|████████▊ | 10856/12384 [23:02:03<3:13:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.38s]
Epoch 1: 88%|████████▊ | 10857/12384 [23:02:03<3:13:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.38s]
Epoch 1: 88%|████████▊ | 10857/12384 [23:02:10<3:13:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 1: 88%|████████▊ | 10858/12384 [23:02:10<3:13:23, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 1: 88%|████████▊ | 10858/12384 [23:02:18<3:13:23, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 88%|████████▊ | 10859/12384 [23:02:18<3:13:12, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 88%|████████▊ | 10859/12384 [23:02:26<3:13:12, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 1: 88%|████████▊ | 10860/12384 [23:02:26<3:12:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 1: 88%|████████▊ | 10860/12384 [23:02:34<3:12:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 88%|████████▊ | 10861/12384 [23:02:34<3:15:38, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 88%|████████▊ | 10861/12384 [23:02:41<3:15:38, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 88%|████████▊ | 10862/12384 [23:02:41<3:14:50, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 88%|████████▊ | 10862/12384 [23:02:49<3:14:50, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 88%|████████▊ | 10863/12384 [23:02:49<3:14:04, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 88%|████████▊ | 10863/12384 [23:02:56<3:14:04, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 88%|████████▊ | 10864/12384 [23:02:56<3:13:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 88%|████████▊ | 10864/12384 [23:03:04<3:13:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 88%|████████▊ | 10865/12384 [23:03:04<3:13:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 88%|████████▊ | 10865/12384 [23:03:12<3:13:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 88%|████████▊ | 10866/12384 [23:03:12<3:12:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 88%|████████▊ | 10866/12384 [23:03:19<3:12:42, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.20s]
Epoch 1: 88%|████████▊ | 10867/12384 [23:03:19<3:12:24, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.20s]
Epoch 1: 88%|████████▊ | 10867/12384 [23:03:27<3:12:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 1: 88%|████████▊ | 10868/12384 [23:03:27<3:12:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 1: 88%|████████▊ | 10868/12384 [23:03:34<3:12:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 1: 88%|████████▊ | 10869/12384 [23:03:34<3:12:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 1: 88%|████████▊ | 10869/12384 [23:03:42<3:12:12, 7.61s/it, loss=0.0001, acc=0.9995, iter_time=7.93s]
Epoch 1: 88%|████████▊ | 10870/12384 [23:03:42<3:12:38, 7.63s/it, loss=0.0001, acc=0.9995, iter_time=7.93s]
Epoch 1: 88%|████████▊ | 10870/12384 [23:03:50<3:12:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.54s]
Epoch 1: 88%|████████▊ | 10871/12384 [23:03:50<3:12:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.54s]
Epoch 1: 88%|████████▊ | 10871/12384 [23:03:57<3:12:32, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=9.07s]
Epoch 1: 88%|████████▊ | 10872/12384 [23:03:57<3:12:28, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=9.07s]
Epoch 1: 88%|████████▊ | 10872/12384 [23:04:05<3:12:28, 7.64s/it, loss=0.0002, acc=0.9976, iter_time=7.41s]
Epoch 1: 88%|████████▊ | 10873/12384 [23:04:05<3:12:02, 7.63s/it, loss=0.0002, acc=0.9976, iter_time=7.41s]
Epoch 1: 88%|████████▊ | 10873/12384 [23:04:13<3:12:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 1: 88%|████████▊ | 10874/12384 [23:04:13<3:11:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 1: 88%|████████▊ | 10874/12384 [23:04:20<3:11:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 1: 88%|████████▊ | 10875/12384 [23:04:20<3:11:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 1: 88%|████████▊ | 10875/12384 [23:04:28<3:11:34, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.26s]
Epoch 1: 88%|████████▊ | 10876/12384 [23:04:28<3:11:59, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=10.26s]
Epoch 1: 88%|████████▊ | 10876/12384 [23:04:36<3:11:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 1: 88%|████████▊ | 10877/12384 [23:04:36<3:11:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 1: 88%|████████▊ | 10877/12384 [23:04:43<3:11:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 1: 88%|████████▊ | 10878/12384 [23:04:43<3:11:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 1: 88%|████████▊ | 10878/12384 [23:04:51<3:11:26, 7.63s/it, loss=0.0007, acc=0.9964, iter_time=8.79s]
Epoch 1: 88%|████████▊ | 10879/12384 [23:04:51<3:11:19, 7.63s/it, loss=0.0007, acc=0.9964, iter_time=8.79s]
Epoch 1: 88%|████████▊ | 10879/12384 [23:04:58<3:11:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 88%|████████▊ | 10880/12384 [23:04:58<3:11:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 88%|████████▊ | 10880/12384 [23:05:06<3:11:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 88%|████████▊ | 10881/12384 [23:05:06<3:10:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 88%|████████▊ | 10881/12384 [23:05:14<3:10:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 88%|████████▊ | 10882/12384 [23:05:14<3:10:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 88%|████████▊ | 10882/12384 [23:05:21<3:10:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 88%|████████▊ | 10883/12384 [23:05:21<3:12:44, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 88%|████████▊ | 10883/12384 [23:05:29<3:12:44, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 88%|████████▊ | 10884/12384 [23:05:29<3:11:49, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 88%|████████▊ | 10884/12384 [23:05:37<3:11:49, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.26s]
Epoch 1: 88%|████████▊ | 10885/12384 [23:05:37<3:11:28, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.26s]
Epoch 1: 88%|████████▊ | 10885/12384 [23:05:44<3:11:28, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 88%|████████▊ | 10886/12384 [23:05:44<3:10:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 88%|████████▊ | 10886/12384 [23:05:52<3:10:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 1: 88%|████████▊ | 10887/12384 [23:05:52<3:10:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 1: 88%|████████▊ | 10887/12384 [23:06:00<3:10:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 88%|████████▊ | 10888/12384 [23:06:00<3:12:31, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 88%|████████▊ | 10888/12384 [23:06:07<3:12:31, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=4.13s]
Epoch 1: 88%|████████▊ | 10889/12384 [23:06:07<3:11:35, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.13s]
Epoch 1: 88%|████████▊ | 10889/12384 [23:06:15<3:11:35, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 1: 88%|████████▊ | 10890/12384 [23:06:15<3:10:52, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 1: 88%|████████▊ | 10890/12384 [23:06:23<3:10:52, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 88%|████████▊ | 10891/12384 [23:06:23<3:10:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 88%|████████▊ | 10891/12384 [23:06:30<3:10:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 88%|████████▊ | 10892/12384 [23:06:30<3:09:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 88%|████████▊ | 10892/12384 [23:06:38<3:09:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 88%|████████▊ | 10893/12384 [23:06:38<3:09:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 88%|████████▊ | 10893/12384 [23:06:46<3:09:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 1: 88%|████████▊ | 10894/12384 [23:06:46<3:09:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 1: 88%|████████▊ | 10894/12384 [23:06:53<3:09:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.62s]
Epoch 1: 88%|████████▊ | 10895/12384 [23:06:53<3:09:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.62s]
Epoch 1: 88%|████████▊ | 10895/12384 [23:07:01<3:09:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 88%|████████▊ | 10896/12384 [23:07:01<3:08:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 88%|████████▊ | 10896/12384 [23:07:08<3:08:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 88%|████████▊ | 10897/12384 [23:07:08<3:09:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 88%|████████▊ | 10897/12384 [23:07:16<3:09:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 1: 88%|████████▊ | 10898/12384 [23:07:16<3:09:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 1: 88%|████████▊ | 10898/12384 [23:07:24<3:09:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 88%|████████▊ | 10899/12384 [23:07:24<3:08:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 88%|████████▊ | 10899/12384 [23:07:31<3:08:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 1: 88%|████████▊ | 10900/12384 [23:07:31<3:08:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 1: 88%|████████▊ | 10900/12384 [23:07:39<3:08:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 1: 88%|████████▊ | 10901/12384 [23:07:39<3:08:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 1: 88%|████████▊ | 10901/12384 [23:07:47<3:08:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 1: 88%|████████▊ | 10902/12384 [23:07:47<3:08:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 1: 88%|████████▊ | 10902/12384 [23:07:54<3:08:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 88%|████████▊ | 10903/12384 [23:07:54<3:08:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 88%|████████▊ | 10903/12384 [23:08:02<3:08:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 88%|████████▊ | 10904/12384 [23:08:02<3:07:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 88%|████████▊ | 10904/12384 [23:08:09<3:07:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 88%|████████▊ | 10905/12384 [23:08:09<3:07:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 88%|████████▊ | 10905/12384 [23:08:17<3:07:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 88%|████████▊ | 10906/12384 [23:08:17<3:07:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 88%|████████▊ | 10906/12384 [23:08:25<3:07:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 1: 88%|████████▊ | 10907/12384 [23:08:25<3:07:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 1: 88%|████████▊ | 10907/12384 [23:08:32<3:07:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.46s]
Epoch 1: 88%|████████▊ | 10908/12384 [23:08:32<3:07:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.46s]
Epoch 1: 88%|████████▊ | 10908/12384 [23:08:40<3:07:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 88%|████████▊ | 10909/12384 [23:08:40<3:09:09, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 88%|████████▊ | 10909/12384 [23:08:48<3:09:09, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 88%|████████▊ | 10910/12384 [23:08:48<3:09:04, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 88%|████████▊ | 10910/12384 [23:08:55<3:09:04, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 88%|████████▊ | 10911/12384 [23:08:55<3:08:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 88%|████████▊ | 10911/12384 [23:09:03<3:08:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 88%|████████▊ | 10912/12384 [23:09:03<3:08:25, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 88%|████████▊ | 10912/12384 [23:09:11<3:08:25, 7.68s/it, loss=0.0002, acc=0.9999, iter_time=7.66s]
Epoch 1: 88%|████████▊ | 10913/12384 [23:09:11<3:07:46, 7.66s/it, loss=0.0002, acc=0.9999, iter_time=7.66s]
Epoch 1: 88%|████████▊ | 10913/12384 [23:09:19<3:07:46, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 88%|████████▊ | 10914/12384 [23:09:19<3:09:31, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 88%|████████▊ | 10914/12384 [23:09:26<3:09:31, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 88%|████████▊ | 10915/12384 [23:09:26<3:08:45, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 88%|████████▊ | 10915/12384 [23:09:34<3:08:45, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 88%|████████▊ | 10916/12384 [23:09:34<3:07:52, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 88%|████████▊ | 10916/12384 [23:09:42<3:07:52, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 88%|████████▊ | 10917/12384 [23:09:42<3:07:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 88%|████████▊ | 10917/12384 [23:09:49<3:07:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 88%|████████▊ | 10918/12384 [23:09:49<3:06:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 88%|████████▊ | 10918/12384 [23:09:57<3:06:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 1: 88%|████████▊ | 10919/12384 [23:09:57<3:06:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 1: 88%|████████▊ | 10919/12384 [23:10:04<3:06:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.59s]
Epoch 1: 88%|████████▊ | 10920/12384 [23:10:04<3:06:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.59s]
Epoch 1: 88%|████████▊ | 10920/12384 [23:10:12<3:06:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 88%|████████▊ | 10921/12384 [23:10:12<3:06:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 88%|████████▊ | 10921/12384 [23:10:20<3:06:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 88%|████████▊ | 10922/12384 [23:10:20<3:05:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 88%|████████▊ | 10922/12384 [23:10:27<3:05:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 88%|████████▊ | 10923/12384 [23:10:27<3:05:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 88%|████████▊ | 10923/12384 [23:10:35<3:05:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 88%|████████▊ | 10924/12384 [23:10:35<3:05:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 88%|████████▊ | 10924/12384 [23:10:42<3:05:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 88%|████████▊ | 10925/12384 [23:10:42<3:05:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 88%|████████▊ | 10925/12384 [23:10:50<3:05:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.77s]
Epoch 1: 88%|████████▊ | 10926/12384 [23:10:50<3:05:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.77s]
Epoch 1: 88%|████████▊ | 10926/12384 [23:10:58<3:05:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.46s]
Epoch 1: 88%|████████▊ | 10927/12384 [23:10:58<3:04:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.46s]
Epoch 1: 88%|████████▊ | 10927/12384 [23:11:05<3:04:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 88%|████████▊ | 10928/12384 [23:11:05<3:04:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 88%|████████▊ | 10928/12384 [23:11:13<3:04:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.40s]
Epoch 1: 88%|████████▊ | 10929/12384 [23:11:13<3:04:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.40s]
Epoch 1: 88%|████████▊ | 10929/12384 [23:11:21<3:04:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 1: 88%|████████▊ | 10930/12384 [23:11:21<3:04:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 1: 88%|████████▊ | 10930/12384 [23:11:28<3:04:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 1: 88%|████████▊ | 10931/12384 [23:11:28<3:04:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 1: 88%|████████▊ | 10931/12384 [23:11:36<3:04:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 88%|████████▊ | 10932/12384 [23:11:36<3:04:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 88%|████████▊ | 10932/12384 [23:11:43<3:04:45, 7.63s/it, loss=0.0004, acc=0.9980, iter_time=7.62s]
Epoch 1: 88%|████████▊ | 10933/12384 [23:11:43<3:04:32, 7.63s/it, loss=0.0004, acc=0.9980, iter_time=7.62s]
Epoch 1: 88%|████████▊ | 10933/12384 [23:11:51<3:04:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 88%|████████▊ | 10934/12384 [23:11:51<3:05:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 88%|████████▊ | 10934/12384 [23:11:59<3:05:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 1: 88%|████████▊ | 10935/12384 [23:11:59<3:05:20, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 1: 88%|████████▊ | 10935/12384 [23:12:07<3:05:20, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 1: 88%|████████▊ | 10936/12384 [23:12:07<3:11:10, 7.92s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 1: 88%|████████▊ | 10936/12384 [23:12:16<3:11:10, 7.92s/it, loss=0.0000, acc=1.0000, iter_time=9.00s]
Epoch 1: 88%|████████▊ | 10937/12384 [23:12:16<3:18:45, 8.24s/it, loss=0.0000, acc=1.0000, iter_time=9.00s]
Epoch 1: 88%|████████▊ | 10937/12384 [23:12:25<3:18:45, 8.24s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 88%|████████▊ | 10938/12384 [23:12:25<3:22:42, 8.41s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 88%|████████▊ | 10938/12384 [23:12:33<3:22:42, 8.41s/it, loss=0.0000, acc=1.0000, iter_time=6.35s]
Epoch 1: 88%|████████▊ | 10939/12384 [23:12:33<3:19:32, 8.29s/it, loss=0.0000, acc=1.0000, iter_time=6.35s]
Epoch 1: 88%|████████▊ | 10939/12384 [23:12:41<3:19:32, 8.29s/it, loss=0.0000, acc=1.0000, iter_time=9.55s]
Epoch 1: 88%|████████▊ | 10940/12384 [23:12:41<3:16:40, 8.17s/it, loss=0.0000, acc=1.0000, iter_time=9.55s]
Epoch 1: 88%|████████▊ | 10940/12384 [23:12:49<3:16:40, 8.17s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 88%|████████▊ | 10941/12384 [23:12:49<3:18:07, 8.24s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 88%|████████▊ | 10941/12384 [23:12:58<3:18:07, 8.24s/it, loss=0.0003, acc=1.0000, iter_time=8.62s]
Epoch 1: 88%|████████▊ | 10942/12384 [23:12:58<3:18:37, 8.26s/it, loss=0.0003, acc=1.0000, iter_time=8.62s]
Epoch 1: 88%|████████▊ | 10942/12384 [23:13:06<3:18:37, 8.26s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 88%|████████▊ | 10943/12384 [23:13:06<3:16:44, 8.19s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 88%|████████▊ | 10943/12384 [23:13:14<3:16:44, 8.19s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 1: 88%|████████▊ | 10944/12384 [23:13:14<3:15:40, 8.15s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 1: 88%|████████▊ | 10944/12384 [23:13:23<3:15:40, 8.15s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 88%|████████▊ | 10945/12384 [23:13:23<3:19:30, 8.32s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 88%|████████▊ | 10945/12384 [23:13:30<3:19:30, 8.32s/it, loss=0.0000, acc=1.0000, iter_time=8.72s]
Epoch 1: 88%|████████▊ | 10946/12384 [23:13:30<3:16:35, 8.20s/it, loss=0.0000, acc=1.0000, iter_time=8.72s]
Epoch 1: 88%|████████▊ | 10946/12384 [23:13:39<3:16:35, 8.20s/it, loss=0.0000, acc=1.0000, iter_time=8.68s]
Epoch 1: 88%|████████▊ | 10947/12384 [23:13:39<3:20:24, 8.37s/it, loss=0.0000, acc=1.0000, iter_time=8.68s]
Epoch 1: 88%|████████▊ | 10947/12384 [23:13:47<3:20:24, 8.37s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 1: 88%|████████▊ | 10948/12384 [23:13:47<3:17:49, 8.27s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 1: 88%|████████▊ | 10948/12384 [23:13:56<3:17:49, 8.27s/it, loss=0.0000, acc=1.0000, iter_time=7.46s]
Epoch 1: 88%|████████▊ | 10949/12384 [23:13:56<3:21:26, 8.42s/it, loss=0.0000, acc=1.0000, iter_time=7.46s]
Epoch 1: 88%|████████▊ | 10949/12384 [23:14:04<3:21:26, 8.42s/it, loss=0.0000, acc=1.0000, iter_time=10.81s]
Epoch 1: 88%|████████▊ | 10950/12384 [23:14:04<3:17:25, 8.26s/it, loss=0.0000, acc=1.0000, iter_time=10.81s]
Epoch 1: 88%|████████▊ | 10950/12384 [23:14:12<3:17:25, 8.26s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 1: 88%|████████▊ | 10951/12384 [23:14:12<3:15:25, 8.18s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 1: 88%|████████▊ | 10951/12384 [23:14:20<3:15:25, 8.18s/it, loss=0.0000, acc=1.0000, iter_time=9.74s]
Epoch 1: 88%|████████▊ | 10952/12384 [23:14:20<3:13:04, 8.09s/it, loss=0.0000, acc=1.0000, iter_time=9.74s]
Epoch 1: 88%|████████▊ | 10952/12384 [23:14:28<3:13:04, 8.09s/it, loss=0.0003, acc=0.9986, iter_time=7.56s]
Epoch 1: 88%|████████▊ | 10953/12384 [23:14:28<3:11:49, 8.04s/it, loss=0.0003, acc=0.9986, iter_time=7.56s]
Epoch 1: 88%|████████▊ | 10953/12384 [23:14:36<3:11:49, 8.04s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 1: 88%|████████▊ | 10954/12384 [23:14:36<3:10:14, 7.98s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 1: 88%|████████▊ | 10954/12384 [23:14:44<3:10:14, 7.98s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 1: 88%|████████▊ | 10955/12384 [23:14:44<3:09:40, 7.96s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 1: 88%|████████▊ | 10955/12384 [23:14:51<3:09:40, 7.96s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 1: 88%|████████▊ | 10956/12384 [23:14:51<3:09:21, 7.96s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 1: 88%|████████▊ | 10956/12384 [23:14:59<3:09:21, 7.96s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 1: 88%|████████▊ | 10957/12384 [23:14:59<3:08:05, 7.91s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 1: 88%|████████▊ | 10957/12384 [23:15:07<3:08:05, 7.91s/it, loss=0.0003, acc=0.9998, iter_time=5.88s]
Epoch 1: 88%|████████▊ | 10958/12384 [23:15:07<3:08:22, 7.93s/it, loss=0.0003, acc=0.9998, iter_time=5.88s]
Epoch 1: 88%|████████▊ | 10958/12384 [23:15:15<3:08:22, 7.93s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 1: 88%|████████▊ | 10959/12384 [23:15:15<3:07:37, 7.90s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 1: 88%|████████▊ | 10959/12384 [23:15:23<3:07:37, 7.90s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 1: 89%|████████▊ | 10960/12384 [23:15:23<3:07:24, 7.90s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 1: 89%|████████▊ | 10960/12384 [23:15:31<3:07:24, 7.90s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 1: 89%|████████▊ | 10961/12384 [23:15:31<3:06:41, 7.87s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 1: 89%|████████▊ | 10961/12384 [23:15:39<3:06:41, 7.87s/it, loss=0.0000, acc=1.0000, iter_time=9.84s]
Epoch 1: 89%|████████▊ | 10962/12384 [23:15:39<3:09:30, 8.00s/it, loss=0.0000, acc=1.0000, iter_time=9.84s]
Epoch 1: 89%|████████▊ | 10962/12384 [23:15:47<3:09:30, 8.00s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 1: 89%|████████▊ | 10963/12384 [23:15:47<3:08:06, 7.94s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 1: 89%|████████▊ | 10963/12384 [23:15:55<3:08:06, 7.94s/it, loss=0.0000, acc=1.0000, iter_time=4.25s]
Epoch 1: 89%|████████▊ | 10964/12384 [23:15:55<3:07:40, 7.93s/it, loss=0.0000, acc=1.0000, iter_time=4.25s]
Epoch 1: 89%|████████▊ | 10964/12384 [23:16:03<3:07:40, 7.93s/it, loss=0.0000, acc=1.0000, iter_time=11.56s]
Epoch 1: 89%|████████▊ | 10965/12384 [23:16:03<3:07:28, 7.93s/it, loss=0.0000, acc=1.0000, iter_time=11.56s]
Epoch 1: 89%|████████▊ | 10965/12384 [23:16:11<3:07:28, 7.93s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 1: 89%|████████▊ | 10966/12384 [23:16:11<3:06:32, 7.89s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 1: 89%|████████▊ | 10966/12384 [23:16:19<3:06:32, 7.89s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 89%|████████▊ | 10967/12384 [23:16:19<3:09:43, 8.03s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 89%|████████▊ | 10967/12384 [23:16:27<3:09:43, 8.03s/it, loss=0.0000, acc=1.0000, iter_time=8.64s]
Epoch 1: 89%|████████▊ | 10968/12384 [23:16:27<3:08:24, 7.98s/it, loss=0.0000, acc=1.0000, iter_time=8.64s]
Epoch 1: 89%|████████▊ | 10968/12384 [23:16:35<3:08:24, 7.98s/it, loss=0.0000, acc=1.0000, iter_time=4.06s]
Epoch 1: 89%|████████▊ | 10969/12384 [23:16:35<3:07:49, 7.96s/it, loss=0.0000, acc=1.0000, iter_time=4.06s]
Epoch 1: 89%|████████▊ | 10969/12384 [23:16:43<3:07:49, 7.96s/it, loss=0.0000, acc=1.0000, iter_time=11.31s]
Epoch 1: 89%|████████▊ | 10970/12384 [23:16:43<3:06:52, 7.93s/it, loss=0.0000, acc=1.0000, iter_time=11.31s]
Epoch 1: 89%|████████▊ | 10970/12384 [23:16:50<3:06:52, 7.93s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 89%|████████▊ | 10971/12384 [23:16:50<3:06:44, 7.93s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 1: 89%|████████▊ | 10971/12384 [23:16:58<3:06:44, 7.93s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 89%|████████▊ | 10972/12384 [23:16:58<3:04:51, 7.86s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 89%|████████▊ | 10972/12384 [23:17:06<3:04:51, 7.86s/it, loss=0.0000, acc=1.0000, iter_time=5.37s]
Epoch 1: 89%|████████▊ | 10973/12384 [23:17:06<3:03:25, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=5.37s]
Epoch 1: 89%|████████▊ | 10973/12384 [23:17:13<3:03:25, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 1: 89%|████████▊ | 10974/12384 [23:17:13<3:02:10, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 1: 89%|████████▊ | 10974/12384 [23:17:21<3:02:10, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 1: 89%|████████▊ | 10975/12384 [23:17:21<3:01:39, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 1: 89%|████████▊ | 10975/12384 [23:17:29<3:01:39, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 89%|████████▊ | 10976/12384 [23:17:29<3:00:41, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 89%|████████▊ | 10976/12384 [23:17:36<3:00:41, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 89%|████████▊ | 10977/12384 [23:17:36<2:59:52, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 89%|████████▊ | 10977/12384 [23:17:44<2:59:52, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 89%|████████▊ | 10978/12384 [23:17:44<2:59:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 89%|████████▊ | 10978/12384 [23:17:52<2:59:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 1: 89%|████████▊ | 10979/12384 [23:17:52<2:59:35, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 1: 89%|████████▊ | 10979/12384 [23:17:59<2:59:35, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 1: 89%|████████▊ | 10980/12384 [23:17:59<2:58:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 1: 89%|████████▊ | 10980/12384 [23:18:07<2:58:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 89%|████████▊ | 10981/12384 [23:18:07<2:58:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 89%|████████▊ | 10981/12384 [23:18:14<2:58:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 89%|████████▊ | 10982/12384 [23:18:14<2:58:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 89%|████████▊ | 10982/12384 [23:18:22<2:58:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 1: 89%|████████▊ | 10983/12384 [23:18:22<2:58:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 1: 89%|████████▊ | 10983/12384 [23:18:30<2:58:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 1: 89%|████████▊ | 10984/12384 [23:18:30<2:57:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 1: 89%|████████▊ | 10984/12384 [23:18:37<2:57:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 89%|████████▊ | 10985/12384 [23:18:37<2:57:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 89%|████████▊ | 10985/12384 [23:18:45<2:57:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 1: 89%|████████▊ | 10986/12384 [23:18:45<2:57:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 1: 89%|████████▊ | 10986/12384 [23:18:53<2:57:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 1: 89%|████████▊ | 10987/12384 [23:18:53<2:57:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 1: 89%|████████▊ | 10987/12384 [23:19:00<2:57:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 89%|████████▊ | 10988/12384 [23:19:00<2:56:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 89%|████████▊ | 10988/12384 [23:19:08<2:56:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 1: 89%|████████▊ | 10989/12384 [23:19:08<2:56:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 1: 89%|████████▊ | 10989/12384 [23:19:15<2:56:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.76s]
Epoch 1: 89%|████████▊ | 10990/12384 [23:19:15<2:56:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.76s]
Epoch 1: 89%|████████▊ | 10990/12384 [23:19:23<2:56:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 1: 89%|████████▉ | 10991/12384 [23:19:23<2:56:32, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 1: 89%|████████▉ | 10991/12384 [23:19:31<2:56:32, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 89%|████████▉ | 10992/12384 [23:19:31<2:57:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 89%|████████▉ | 10992/12384 [23:19:39<2:57:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 89%|████████▉ | 10993/12384 [23:19:39<2:59:09, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 89%|████████▉ | 10993/12384 [23:19:46<2:59:09, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 89%|████████▉ | 10994/12384 [23:19:46<2:58:15, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 89%|████████▉ | 10994/12384 [23:19:54<2:58:15, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 89%|████████▉ | 10995/12384 [23:19:54<2:57:36, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 89%|████████▉ | 10995/12384 [23:20:01<2:57:36, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 1: 89%|████████▉ | 10996/12384 [23:20:01<2:57:01, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 1: 89%|████████▉ | 10996/12384 [23:20:09<2:57:01, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 1: 89%|████████▉ | 10997/12384 [23:20:09<2:56:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 1: 89%|████████▉ | 10997/12384 [23:20:17<2:56:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 89%|████████▉ | 10998/12384 [23:20:17<2:56:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 89%|████████▉ | 10998/12384 [23:20:24<2:56:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 89%|████████▉ | 10999/12384 [23:20:24<2:56:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 89%|████████▉ | 10999/12384 [23:20:32<2:56:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 89%|████████▉ | 11000/12384 [23:20:32<2:55:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 89%|████████▉ | 11000/12384 [23:20:40<2:55:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.15s]
Epoch 1: 89%|████████▉ | 11001/12384 [23:20:40<2:55:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.15s]
Epoch 1: 89%|████████▉ | 11001/12384 [23:20:47<2:55:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.77s]
Epoch 1: 89%|████████▉ | 11002/12384 [23:20:47<2:56:46, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.77s]
Epoch 1: 89%|████████▉ | 11002/12384 [23:20:55<2:56:46, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 1: 89%|████████▉ | 11003/12384 [23:20:55<2:56:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 1: 89%|████████▉ | 11003/12384 [23:21:03<2:56:10, 7.65s/it, loss=0.0002, acc=0.9989, iter_time=8.03s]
Epoch 1: 89%|████████▉ | 11004/12384 [23:21:03<2:58:39, 7.77s/it, loss=0.0002, acc=0.9989, iter_time=8.03s]
Epoch 1: 89%|████████▉ | 11004/12384 [23:21:11<2:58:39, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 89%|████████▉ | 11005/12384 [23:21:11<2:57:22, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 89%|████████▉ | 11005/12384 [23:21:18<2:57:22, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 1: 89%|████████▉ | 11006/12384 [23:21:18<2:56:18, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 1: 89%|████████▉ | 11006/12384 [23:21:26<2:56:18, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 89%|████████▉ | 11007/12384 [23:21:26<2:55:59, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 89%|████████▉ | 11007/12384 [23:21:33<2:55:59, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 89%|████████▉ | 11008/12384 [23:21:33<2:55:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 89%|████████▉ | 11008/12384 [23:21:41<2:55:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 89%|████████▉ | 11009/12384 [23:21:41<2:55:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 89%|████████▉ | 11009/12384 [23:21:49<2:55:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.37s]
Epoch 1: 89%|████████▉ | 11010/12384 [23:21:49<2:55:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.37s]
Epoch 1: 89%|████████▉ | 11010/12384 [23:21:56<2:55:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 1: 89%|████████▉ | 11011/12384 [23:21:56<2:54:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 1: 89%|████████▉ | 11011/12384 [23:22:04<2:54:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 89%|████████▉ | 11012/12384 [23:22:04<2:55:02, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 89%|████████▉ | 11012/12384 [23:22:12<2:55:02, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 89%|████████▉ | 11013/12384 [23:22:12<2:54:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 89%|████████▉ | 11013/12384 [23:22:19<2:54:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 1: 89%|████████▉ | 11014/12384 [23:22:19<2:54:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 1: 89%|████████▉ | 11014/12384 [23:22:27<2:54:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 89%|████████▉ | 11015/12384 [23:22:27<2:55:46, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 89%|████████▉ | 11015/12384 [23:22:35<2:55:46, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 89%|████████▉ | 11016/12384 [23:22:35<2:55:07, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 89%|████████▉ | 11016/12384 [23:22:42<2:55:07, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.28s]
Epoch 1: 89%|████████▉ | 11017/12384 [23:22:42<2:54:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.28s]
Epoch 1: 89%|████████▉ | 11017/12384 [23:22:50<2:54:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 89%|████████▉ | 11018/12384 [23:22:50<2:53:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 89%|████████▉ | 11018/12384 [23:22:58<2:53:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 89%|████████▉ | 11019/12384 [23:22:58<2:55:48, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 89%|████████▉ | 11019/12384 [23:23:05<2:55:48, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 1: 89%|████████▉ | 11020/12384 [23:23:05<2:54:53, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 1: 89%|████████▉ | 11020/12384 [23:23:13<2:54:53, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=8.56s]
Epoch 1: 89%|████████▉ | 11021/12384 [23:23:13<2:54:46, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=8.56s]
Epoch 1: 89%|████████▉ | 11021/12384 [23:23:21<2:54:46, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 89%|████████▉ | 11022/12384 [23:23:21<2:54:05, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 89%|████████▉ | 11022/12384 [23:23:28<2:54:05, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=3.44s]
Epoch 1: 89%|████████▉ | 11023/12384 [23:23:28<2:53:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.44s]
Epoch 1: 89%|████████▉ | 11023/12384 [23:23:36<2:53:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=12.15s]
Epoch 1: 89%|████████▉ | 11024/12384 [23:23:36<2:53:51, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=12.15s]
Epoch 1: 89%|████████▉ | 11024/12384 [23:23:44<2:53:51, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 1: 89%|████████▉ | 11025/12384 [23:23:44<2:53:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 1: 89%|████████▉ | 11025/12384 [23:23:51<2:53:12, 7.65s/it, loss=0.0011, acc=0.9983, iter_time=5.82s]
Epoch 1: 89%|████████▉ | 11026/12384 [23:23:51<2:52:50, 7.64s/it, loss=0.0011, acc=0.9983, iter_time=5.82s]
Epoch 1: 89%|████████▉ | 11026/12384 [23:23:59<2:52:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 1: 89%|████████▉ | 11027/12384 [23:23:59<2:53:17, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 1: 89%|████████▉ | 11027/12384 [23:24:07<2:53:17, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=11.23s]
Epoch 1: 89%|████████▉ | 11028/12384 [23:24:07<2:52:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.23s]
Epoch 1: 89%|████████▉ | 11028/12384 [23:24:14<2:52:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=3.89s]
Epoch 1: 89%|████████▉ | 11029/12384 [23:24:14<2:52:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.89s]
Epoch 1: 89%|████████▉ | 11029/12384 [23:24:22<2:52:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.33s]
Epoch 1: 89%|████████▉ | 11030/12384 [23:24:22<2:52:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.33s]
Epoch 1: 89%|████████▉ | 11030/12384 [23:24:29<2:52:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 89%|████████▉ | 11031/12384 [23:24:29<2:51:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 89%|████████▉ | 11031/12384 [23:24:37<2:51:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 89%|████████▉ | 11032/12384 [23:24:37<2:51:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 89%|████████▉ | 11032/12384 [23:24:45<2:51:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.62s]
Epoch 1: 89%|████████▉ | 11033/12384 [23:24:45<2:51:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.62s]
Epoch 1: 89%|████████▉ | 11033/12384 [23:24:52<2:51:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 1: 89%|████████▉ | 11034/12384 [23:24:52<2:51:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 1: 89%|████████▉ | 11034/12384 [23:25:00<2:51:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 89%|████████▉ | 11035/12384 [23:25:00<2:51:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 89%|████████▉ | 11035/12384 [23:25:08<2:51:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 89%|████████▉ | 11036/12384 [23:25:08<2:51:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 89%|████████▉ | 11036/12384 [23:25:15<2:51:14, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 89%|████████▉ | 11037/12384 [23:25:15<2:51:10, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 89%|████████▉ | 11037/12384 [23:25:23<2:51:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 89%|████████▉ | 11038/12384 [23:25:23<2:50:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 89%|████████▉ | 11038/12384 [23:25:30<2:50:54, 7.62s/it, loss=0.0002, acc=0.9996, iter_time=7.60s]
Epoch 1: 89%|████████▉ | 11039/12384 [23:25:30<2:50:39, 7.61s/it, loss=0.0002, acc=0.9996, iter_time=7.60s]
Epoch 1: 89%|████████▉ | 11039/12384 [23:25:38<2:50:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 89%|████████▉ | 11040/12384 [23:25:38<2:50:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 89%|████████▉ | 11040/12384 [23:25:46<2:50:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 89%|████████▉ | 11041/12384 [23:25:46<2:52:24, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 89%|████████▉ | 11041/12384 [23:25:53<2:52:24, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 1: 89%|████████▉ | 11042/12384 [23:25:53<2:51:34, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 1: 89%|████████▉ | 11042/12384 [23:26:01<2:51:34, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.30s]
Epoch 1: 89%|████████▉ | 11043/12384 [23:26:01<2:51:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.30s]
Epoch 1: 89%|████████▉ | 11043/12384 [23:26:09<2:51:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 1: 89%|████████▉ | 11044/12384 [23:26:09<2:50:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 1: 89%|████████▉ | 11044/12384 [23:26:17<2:50:43, 7.64s/it, loss=0.0001, acc=0.9996, iter_time=8.86s]
Epoch 1: 89%|████████▉ | 11045/12384 [23:26:17<2:52:54, 7.75s/it, loss=0.0001, acc=0.9996, iter_time=8.86s]
Epoch 1: 89%|████████▉ | 11045/12384 [23:26:24<2:52:54, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 1: 89%|████████▉ | 11046/12384 [23:26:24<2:51:54, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 1: 89%|████████▉ | 11046/12384 [23:26:32<2:51:54, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 1: 89%|████████▉ | 11047/12384 [23:26:32<2:51:03, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 1: 89%|████████▉ | 11047/12384 [23:26:40<2:51:03, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 89%|████████▉ | 11048/12384 [23:26:40<2:50:34, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 89%|████████▉ | 11048/12384 [23:26:47<2:50:34, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 89%|████████▉ | 11049/12384 [23:26:47<2:50:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 89%|████████▉ | 11049/12384 [23:26:55<2:50:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 89%|████████▉ | 11050/12384 [23:26:55<2:49:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 89%|████████▉ | 11050/12384 [23:27:02<2:49:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 89%|████████▉ | 11051/12384 [23:27:02<2:49:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 89%|████████▉ | 11051/12384 [23:27:10<2:49:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.04s]
Epoch 1: 89%|████████▉ | 11052/12384 [23:27:10<2:49:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.04s]
Epoch 1: 89%|████████▉ | 11052/12384 [23:27:18<2:49:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.29s]
Epoch 1: 89%|████████▉ | 11053/12384 [23:27:18<2:49:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.29s]
Epoch 1: 89%|████████▉ | 11053/12384 [23:27:25<2:49:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.59s]
Epoch 1: 89%|████████▉ | 11054/12384 [23:27:25<2:49:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.59s]
Epoch 1: 89%|████████▉ | 11054/12384 [23:27:33<2:49:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 89%|████████▉ | 11055/12384 [23:27:33<2:49:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 89%|████████▉ | 11055/12384 [23:27:41<2:49:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 89%|████████▉ | 11056/12384 [23:27:41<2:48:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 89%|████████▉ | 11056/12384 [23:27:48<2:48:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 89%|████████▉ | 11057/12384 [23:27:48<2:48:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 89%|████████▉ | 11057/12384 [23:27:56<2:48:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 1: 89%|████████▉ | 11058/12384 [23:27:56<2:48:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 1: 89%|████████▉ | 11058/12384 [23:28:03<2:48:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 1: 89%|████████▉ | 11059/12384 [23:28:03<2:48:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 1: 89%|████████▉ | 11059/12384 [23:28:11<2:48:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 89%|████████▉ | 11060/12384 [23:28:11<2:47:48, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 89%|████████▉ | 11060/12384 [23:28:19<2:47:48, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.99s]
Epoch 1: 89%|████████▉ | 11061/12384 [23:28:19<2:47:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.99s]
Epoch 1: 89%|████████▉ | 11061/12384 [23:28:26<2:47:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 1: 89%|████████▉ | 11062/12384 [23:28:26<2:47:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 1: 89%|████████▉ | 11062/12384 [23:28:34<2:47:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 89%|████████▉ | 11063/12384 [23:28:34<2:47:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 89%|████████▉ | 11063/12384 [23:28:41<2:47:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 89%|████████▉ | 11064/12384 [23:28:41<2:47:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 89%|████████▉ | 11064/12384 [23:28:49<2:47:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 1: 89%|████████▉ | 11065/12384 [23:28:49<2:47:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 1: 89%|████████▉ | 11065/12384 [23:28:57<2:47:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.93s]
Epoch 1: 89%|████████▉ | 11066/12384 [23:28:57<2:47:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.93s]
Epoch 1: 89%|████████▉ | 11066/12384 [23:29:04<2:47:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.18s]
Epoch 1: 89%|████████▉ | 11067/12384 [23:29:04<2:47:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.18s]
Epoch 1: 89%|████████▉ | 11067/12384 [23:29:12<2:47:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 1: 89%|████████▉ | 11068/12384 [23:29:12<2:46:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 1: 89%|████████▉ | 11068/12384 [23:29:19<2:46:58, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.63s]
Epoch 1: 89%|████████▉ | 11069/12384 [23:29:19<2:46:53, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.63s]
Epoch 1: 89%|████████▉ | 11069/12384 [23:29:27<2:46:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 1: 89%|████████▉ | 11070/12384 [23:29:27<2:46:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 1: 89%|████████▉ | 11070/12384 [23:29:35<2:46:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 1: 89%|████████▉ | 11071/12384 [23:29:35<2:46:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 1: 89%|████████▉ | 11071/12384 [23:29:43<2:46:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 89%|████████▉ | 11072/12384 [23:29:43<2:48:33, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 89%|████████▉ | 11072/12384 [23:29:50<2:48:33, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.35s]
Epoch 1: 89%|████████▉ | 11073/12384 [23:29:50<2:47:50, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.35s]
Epoch 1: 89%|████████▉ | 11073/12384 [23:29:58<2:47:50, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.92s]
Epoch 1: 89%|████████▉ | 11074/12384 [23:29:58<2:47:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.92s]
Epoch 1: 89%|████████▉ | 11074/12384 [23:30:06<2:47:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 89%|████████▉ | 11075/12384 [23:30:06<2:46:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 89%|████████▉ | 11075/12384 [23:30:13<2:46:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 89%|████████▉ | 11076/12384 [23:30:13<2:46:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 89%|████████▉ | 11076/12384 [23:30:21<2:46:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 89%|████████▉ | 11077/12384 [23:30:21<2:46:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 89%|████████▉ | 11077/12384 [23:30:28<2:46:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 89%|████████▉ | 11078/12384 [23:30:28<2:45:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 89%|████████▉ | 11078/12384 [23:30:36<2:45:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.05s]
Epoch 1: 89%|████████▉ | 11079/12384 [23:30:36<2:45:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.05s]
Epoch 1: 89%|████████▉ | 11079/12384 [23:30:44<2:45:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.53s]
Epoch 1: 89%|████████▉ | 11080/12384 [23:30:44<2:45:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.53s]
Epoch 1: 89%|████████▉ | 11080/12384 [23:30:51<2:45:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 89%|████████▉ | 11081/12384 [23:30:51<2:45:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 89%|████████▉ | 11081/12384 [23:30:59<2:45:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.15s]
Epoch 1: 89%|████████▉ | 11082/12384 [23:30:59<2:45:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.15s]
Epoch 1: 89%|████████▉ | 11082/12384 [23:31:06<2:45:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.30s]
Epoch 1: 89%|████████▉ | 11083/12384 [23:31:06<2:45:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.30s]
Epoch 1: 89%|████████▉ | 11083/12384 [23:31:14<2:45:16, 7.62s/it, loss=0.0000, acc=0.9998, iter_time=9.15s]
Epoch 1: 90%|████████▉ | 11084/12384 [23:31:14<2:44:56, 7.61s/it, loss=0.0000, acc=0.9998, iter_time=9.15s]
Epoch 1: 90%|████████▉ | 11084/12384 [23:31:22<2:44:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.44s]
Epoch 1: 90%|████████▉ | 11085/12384 [23:31:22<2:44:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.44s]
Epoch 1: 90%|████████▉ | 11085/12384 [23:31:29<2:44:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.98s]
Epoch 1: 90%|████████▉ | 11086/12384 [23:31:29<2:44:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.98s]
Epoch 1: 90%|████████▉ | 11086/12384 [23:31:37<2:44:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 90%|████████▉ | 11087/12384 [23:31:37<2:44:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 90%|████████▉ | 11087/12384 [23:31:44<2:44:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 1: 90%|████████▉ | 11088/12384 [23:31:44<2:44:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 1: 90%|████████▉ | 11088/12384 [23:31:52<2:44:21, 7.61s/it, loss=0.0000, acc=0.9997, iter_time=6.29s]
Epoch 1: 90%|████████▉ | 11089/12384 [23:31:52<2:44:04, 7.60s/it, loss=0.0000, acc=0.9997, iter_time=6.29s]
Epoch 1: 90%|████████▉ | 11089/12384 [23:32:00<2:44:04, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 1: 90%|████████▉ | 11090/12384 [23:32:00<2:43:59, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 1: 90%|████████▉ | 11090/12384 [23:32:07<2:43:59, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 90%|████████▉ | 11091/12384 [23:32:07<2:44:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 90%|████████▉ | 11091/12384 [23:32:15<2:44:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 90%|████████▉ | 11092/12384 [23:32:15<2:43:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 90%|████████▉ | 11092/12384 [23:32:23<2:43:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 90%|████████▉ | 11093/12384 [23:32:23<2:45:37, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 90%|████████▉ | 11093/12384 [23:32:30<2:45:37, 7.70s/it, loss=0.0002, acc=0.9992, iter_time=7.65s]
Epoch 1: 90%|████████▉ | 11094/12384 [23:32:30<2:45:11, 7.68s/it, loss=0.0002, acc=0.9992, iter_time=7.65s]
Epoch 1: 90%|████████▉ | 11094/12384 [23:32:38<2:45:11, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 90%|████████▉ | 11095/12384 [23:32:38<2:44:54, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 90%|████████▉ | 11095/12384 [23:32:46<2:44:54, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 90%|████████▉ | 11096/12384 [23:32:46<2:44:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 90%|████████▉ | 11096/12384 [23:32:53<2:44:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 90%|████████▉ | 11097/12384 [23:32:53<2:43:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 90%|████████▉ | 11097/12384 [23:33:01<2:43:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 90%|████████▉ | 11098/12384 [23:33:01<2:45:36, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 90%|████████▉ | 11098/12384 [23:33:09<2:45:36, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 90%|████████▉ | 11099/12384 [23:33:09<2:44:40, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 90%|████████▉ | 11099/12384 [23:33:17<2:44:40, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=3.86s]
Epoch 1: 90%|████████▉ | 11100/12384 [23:33:17<2:44:04, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=3.86s]
Epoch 1: 90%|████████▉ | 11100/12384 [23:33:24<2:44:04, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=11.34s]
Epoch 1: 90%|████████▉ | 11101/12384 [23:33:24<2:43:48, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=11.34s]
Epoch 1: 90%|████████▉ | 11101/12384 [23:33:32<2:43:48, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 90%|████████▉ | 11102/12384 [23:33:32<2:43:25, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 90%|████████▉ | 11102/12384 [23:33:39<2:43:25, 7.65s/it, loss=0.0003, acc=0.9997, iter_time=7.62s]
Epoch 1: 90%|████████▉ | 11103/12384 [23:33:39<2:43:16, 7.65s/it, loss=0.0003, acc=0.9997, iter_time=7.62s]
Epoch 1: 90%|████████▉ | 11103/12384 [23:33:47<2:43:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 1: 90%|████████▉ | 11104/12384 [23:33:47<2:42:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 1: 90%|████████▉ | 11104/12384 [23:33:55<2:42:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 90%|████████▉ | 11105/12384 [23:33:55<2:42:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 90%|████████▉ | 11105/12384 [23:34:02<2:42:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 90%|████████▉ | 11106/12384 [23:34:02<2:42:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 90%|████████▉ | 11106/12384 [23:34:10<2:42:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 90%|████████▉ | 11107/12384 [23:34:10<2:42:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 90%|████████▉ | 11107/12384 [23:34:17<2:42:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 90%|████████▉ | 11108/12384 [23:34:17<2:41:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 90%|████████▉ | 11108/12384 [23:34:25<2:41:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 1: 90%|████████▉ | 11109/12384 [23:34:25<2:41:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 1: 90%|████████▉ | 11109/12384 [23:34:33<2:41:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 90%|████████▉ | 11110/12384 [23:34:33<2:41:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 90%|████████▉ | 11110/12384 [23:34:40<2:41:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 90%|████████▉ | 11111/12384 [23:34:40<2:41:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 90%|████████▉ | 11111/12384 [23:34:48<2:41:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 90%|████████▉ | 11112/12384 [23:34:48<2:41:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 90%|████████▉ | 11112/12384 [23:34:56<2:41:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 1: 90%|████████▉ | 11113/12384 [23:34:56<2:41:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 1: 90%|████████▉ | 11113/12384 [23:35:03<2:41:27, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.57s]
Epoch 1: 90%|████████▉ | 11114/12384 [23:35:03<2:41:18, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.57s]
Epoch 1: 90%|████████▉ | 11114/12384 [23:35:11<2:41:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 1: 90%|████████▉ | 11115/12384 [23:35:11<2:41:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 1: 90%|████████▉ | 11115/12384 [23:35:19<2:41:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 1: 90%|████████▉ | 11116/12384 [23:35:19<2:42:35, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 1: 90%|████████▉ | 11116/12384 [23:35:26<2:42:35, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 1: 90%|████████▉ | 11117/12384 [23:35:26<2:41:46, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 1: 90%|████████▉ | 11117/12384 [23:35:34<2:41:46, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 90%|████████▉ | 11118/12384 [23:35:34<2:41:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 90%|████████▉ | 11118/12384 [23:35:42<2:41:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 90%|████████▉ | 11119/12384 [23:35:42<2:41:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 90%|████████▉ | 11119/12384 [23:35:49<2:41:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 90%|████████▉ | 11120/12384 [23:35:49<2:40:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 1: 90%|████████▉ | 11120/12384 [23:35:57<2:40:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 90%|████████▉ | 11121/12384 [23:35:57<2:40:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 90%|████████▉ | 11121/12384 [23:36:04<2:40:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 1: 90%|████████▉ | 11122/12384 [23:36:04<2:40:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 1: 90%|████████▉ | 11122/12384 [23:36:12<2:40:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 1: 90%|████████▉ | 11123/12384 [23:36:12<2:40:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 1: 90%|████████▉ | 11123/12384 [23:36:20<2:40:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 1: 90%|████████▉ | 11124/12384 [23:36:20<2:39:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 1: 90%|████████▉ | 11124/12384 [23:36:28<2:39:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.72s]
Epoch 1: 90%|████████▉ | 11125/12384 [23:36:28<2:42:10, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=9.72s]
Epoch 1: 90%|████████▉ | 11125/12384 [23:36:35<2:42:10, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 1: 90%|████████▉ | 11126/12384 [23:36:35<2:41:09, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 1: 90%|████████▉ | 11126/12384 [23:36:43<2:41:09, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.16s]
Epoch 1: 90%|████████▉ | 11127/12384 [23:36:43<2:40:54, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.16s]
Epoch 1: 90%|████████▉ | 11127/12384 [23:36:50<2:40:54, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 90%|████████▉ | 11128/12384 [23:36:50<2:40:31, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 90%|████████▉ | 11128/12384 [23:36:58<2:40:31, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=3.63s]
Epoch 1: 90%|████████▉ | 11129/12384 [23:36:58<2:40:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=3.63s]
Epoch 1: 90%|████████▉ | 11129/12384 [23:37:06<2:40:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.23s]
Epoch 1: 90%|████████▉ | 11130/12384 [23:37:06<2:39:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.23s]
Epoch 1: 90%|████████▉ | 11130/12384 [23:37:13<2:39:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 1: 90%|████████▉ | 11131/12384 [23:37:13<2:40:00, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 1: 90%|████████▉ | 11131/12384 [23:37:21<2:40:00, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.32s]
Epoch 1: 90%|████████▉ | 11132/12384 [23:37:21<2:39:51, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.32s]
Epoch 1: 90%|████████▉ | 11132/12384 [23:37:29<2:39:51, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.04s]
Epoch 1: 90%|████████▉ | 11133/12384 [23:37:29<2:39:49, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.04s]
Epoch 1: 90%|████████▉ | 11133/12384 [23:37:36<2:39:49, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 1: 90%|████████▉ | 11134/12384 [23:37:36<2:39:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 1: 90%|████████▉ | 11134/12384 [23:37:44<2:39:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 1: 90%|████████▉ | 11135/12384 [23:37:44<2:39:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 1: 90%|████████▉ | 11135/12384 [23:37:52<2:39:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.85s]
Epoch 1: 90%|████████▉ | 11136/12384 [23:37:52<2:39:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.85s]
Epoch 1: 90%|████████▉ | 11136/12384 [23:37:59<2:39:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 90%|████████▉ | 11137/12384 [23:37:59<2:38:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 90%|████████▉ | 11137/12384 [23:38:07<2:38:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 1: 90%|████████▉ | 11138/12384 [23:38:07<2:38:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 1: 90%|████████▉ | 11138/12384 [23:38:15<2:38:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 90%|████████▉ | 11139/12384 [23:38:15<2:38:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 90%|████████▉ | 11139/12384 [23:38:22<2:38:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 90%|████████▉ | 11140/12384 [23:38:22<2:37:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 90%|████████▉ | 11140/12384 [23:38:30<2:37:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 90%|████████▉ | 11141/12384 [23:38:30<2:37:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 90%|████████▉ | 11141/12384 [23:38:37<2:37:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 90%|████████▉ | 11142/12384 [23:38:37<2:37:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 90%|████████▉ | 11142/12384 [23:38:45<2:37:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.62s]
Epoch 1: 90%|████████▉ | 11143/12384 [23:38:45<2:37:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.62s]
Epoch 1: 90%|████████▉ | 11143/12384 [23:38:53<2:37:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.94s]
Epoch 1: 90%|████████▉ | 11144/12384 [23:38:53<2:37:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.94s]
Epoch 1: 90%|████████▉ | 11144/12384 [23:39:00<2:37:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 90%|████████▉ | 11145/12384 [23:39:00<2:37:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 90%|████████▉ | 11145/12384 [23:39:08<2:37:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 90%|█████████ | 11146/12384 [23:39:08<2:38:48, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 90%|█████████ | 11146/12384 [23:39:16<2:38:48, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 1: 90%|█████████ | 11147/12384 [23:39:16<2:38:12, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 1: 90%|█████████ | 11147/12384 [23:39:23<2:38:12, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 1: 90%|█████████ | 11148/12384 [23:39:23<2:37:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 1: 90%|█████████ | 11148/12384 [23:39:31<2:37:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 1: 90%|█████████ | 11149/12384 [23:39:31<2:37:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 1: 90%|█████████ | 11149/12384 [23:39:39<2:37:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 90%|█████████ | 11150/12384 [23:39:39<2:37:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 90%|█████████ | 11150/12384 [23:39:47<2:37:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 90%|█████████ | 11151/12384 [23:39:47<2:38:56, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 90%|█████████ | 11151/12384 [23:39:54<2:38:56, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 1: 90%|█████████ | 11152/12384 [23:39:54<2:38:10, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 1: 90%|█████████ | 11152/12384 [23:40:02<2:38:10, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 90%|█████████ | 11153/12384 [23:40:02<2:37:16, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 90%|█████████ | 11153/12384 [23:40:09<2:37:16, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 90%|█████████ | 11154/12384 [23:40:09<2:37:22, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 90%|█████████ | 11154/12384 [23:40:17<2:37:22, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 90%|█████████ | 11155/12384 [23:40:17<2:36:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 90%|█████████ | 11155/12384 [23:40:25<2:36:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 1: 90%|█████████ | 11156/12384 [23:40:25<2:36:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 1: 90%|█████████ | 11156/12384 [23:40:32<2:36:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 1: 90%|█████████ | 11157/12384 [23:40:32<2:36:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 1: 90%|█████████ | 11157/12384 [23:40:40<2:36:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 90%|█████████ | 11158/12384 [23:40:40<2:35:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 90%|█████████ | 11158/12384 [23:40:47<2:35:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 1: 90%|█████████ | 11159/12384 [23:40:47<2:35:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 1: 90%|█████████ | 11159/12384 [23:40:55<2:35:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.79s]
Epoch 1: 90%|█████████ | 11160/12384 [23:40:55<2:35:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.79s]
Epoch 1: 90%|█████████ | 11160/12384 [23:41:03<2:35:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 90%|█████████ | 11161/12384 [23:41:03<2:35:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 90%|█████████ | 11161/12384 [23:41:10<2:35:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 1: 90%|█████████ | 11162/12384 [23:41:10<2:35:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 1: 90%|█████████ | 11162/12384 [23:41:18<2:35:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 90%|█████████ | 11163/12384 [23:41:18<2:35:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 90%|█████████ | 11163/12384 [23:41:26<2:35:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 90%|█████████ | 11164/12384 [23:41:26<2:35:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 90%|█████████ | 11164/12384 [23:41:33<2:35:08, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 90%|█████████ | 11165/12384 [23:41:33<2:34:46, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 1: 90%|█████████ | 11165/12384 [23:41:41<2:34:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 90%|█████████ | 11166/12384 [23:41:41<2:34:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 90%|█████████ | 11166/12384 [23:41:49<2:34:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 90%|█████████ | 11167/12384 [23:41:49<2:34:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 90%|█████████ | 11167/12384 [23:41:56<2:34:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 90%|█████████ | 11168/12384 [23:41:56<2:34:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 90%|█████████ | 11168/12384 [23:42:04<2:34:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.15s]
Epoch 1: 90%|█████████ | 11169/12384 [23:42:04<2:34:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.15s]
Epoch 1: 90%|█████████ | 11169/12384 [23:42:11<2:34:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 1: 90%|█████████ | 11170/12384 [23:42:11<2:34:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 1: 90%|█████████ | 11170/12384 [23:42:19<2:34:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 90%|█████████ | 11171/12384 [23:42:19<2:33:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 90%|█████████ | 11171/12384 [23:42:27<2:33:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.34s]
Epoch 1: 90%|█████████ | 11172/12384 [23:42:27<2:34:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.34s]
Epoch 1: 90%|█████████ | 11172/12384 [23:42:34<2:34:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.95s]
Epoch 1: 90%|█████████ | 11173/12384 [23:42:34<2:34:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.95s]
Epoch 1: 90%|█████████ | 11173/12384 [23:42:42<2:34:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 90%|█████████ | 11174/12384 [23:42:42<2:33:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 90%|█████████ | 11174/12384 [23:42:49<2:33:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 1: 90%|█████████ | 11175/12384 [23:42:49<2:33:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 1: 90%|█████████ | 11175/12384 [23:42:57<2:33:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.14s]
Epoch 1: 90%|█████████ | 11176/12384 [23:42:57<2:33:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.14s]
Epoch 1: 90%|█████████ | 11176/12384 [23:43:05<2:33:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 90%|█████████ | 11177/12384 [23:43:05<2:35:01, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 90%|█████████ | 11177/12384 [23:43:13<2:35:01, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 90%|█████████ | 11178/12384 [23:43:13<2:34:12, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 90%|█████████ | 11178/12384 [23:43:20<2:34:12, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 90%|█████████ | 11179/12384 [23:43:20<2:33:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 90%|█████████ | 11179/12384 [23:43:28<2:33:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 90%|█████████ | 11180/12384 [23:43:28<2:33:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 90%|█████████ | 11180/12384 [23:43:36<2:33:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 90%|█████████ | 11181/12384 [23:43:36<2:33:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 90%|█████████ | 11181/12384 [23:43:43<2:33:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 90%|█████████ | 11182/12384 [23:43:43<2:33:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 90%|█████████ | 11182/12384 [23:43:51<2:33:12, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 1: 90%|█████████ | 11183/12384 [23:43:51<2:32:47, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 1: 90%|█████████ | 11183/12384 [23:43:58<2:32:47, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.56s]
Epoch 1: 90%|█████████ | 11184/12384 [23:43:58<2:32:37, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.56s]
Epoch 1: 90%|█████████ | 11184/12384 [23:44:06<2:32:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 1: 90%|█████████ | 11185/12384 [23:44:06<2:32:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 1: 90%|█████████ | 11185/12384 [23:44:14<2:32:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 1: 90%|█████████ | 11186/12384 [23:44:14<2:32:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 1: 90%|█████████ | 11186/12384 [23:44:21<2:32:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.32s]
Epoch 1: 90%|█████████ | 11187/12384 [23:44:21<2:31:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.32s]
Epoch 1: 90%|█████████ | 11187/12384 [23:44:29<2:31:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 90%|█████████ | 11188/12384 [23:44:29<2:31:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 90%|█████████ | 11188/12384 [23:44:36<2:31:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 1: 90%|█████████ | 11189/12384 [23:44:36<2:31:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 1: 90%|█████████ | 11189/12384 [23:44:44<2:31:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.75s]
Epoch 1: 90%|█████████ | 11190/12384 [23:44:44<2:31:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.75s]
Epoch 1: 90%|█████████ | 11190/12384 [23:44:52<2:31:22, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.90s]
Epoch 1: 90%|█████████ | 11191/12384 [23:44:52<2:31:33, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.90s]
Epoch 1: 90%|█████████ | 11191/12384 [23:44:59<2:31:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 1: 90%|█████████ | 11192/12384 [23:44:59<2:31:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 1: 90%|█████████ | 11192/12384 [23:45:07<2:31:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 90%|█████████ | 11193/12384 [23:45:07<2:31:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 90%|█████████ | 11193/12384 [23:45:15<2:31:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 90%|█████████ | 11194/12384 [23:45:15<2:31:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 90%|█████████ | 11194/12384 [23:45:22<2:31:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 90%|█████████ | 11195/12384 [23:45:22<2:31:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 90%|█████████ | 11195/12384 [23:45:30<2:31:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 90%|█████████ | 11196/12384 [23:45:30<2:31:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 90%|█████████ | 11196/12384 [23:45:37<2:31:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 90%|█████████ | 11197/12384 [23:45:37<2:30:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 90%|█████████ | 11197/12384 [23:45:45<2:30:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 90%|█████████ | 11198/12384 [23:45:45<2:30:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 90%|█████████ | 11198/12384 [23:45:53<2:30:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 90%|█████████ | 11199/12384 [23:45:53<2:32:17, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 90%|█████████ | 11199/12384 [23:46:01<2:32:17, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 90%|█████████ | 11200/12384 [23:46:01<2:31:34, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 90%|█████████ | 11200/12384 [23:46:08<2:31:34, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 90%|█████████ | 11201/12384 [23:46:08<2:31:09, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 90%|█████████ | 11201/12384 [23:46:16<2:31:09, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.87s]
Epoch 1: 90%|█████████ | 11202/12384 [23:46:16<2:30:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.87s]
Epoch 1: 90%|█████████ | 11202/12384 [23:46:24<2:30:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.21s]
Epoch 1: 90%|█████████ | 11203/12384 [23:46:24<2:32:11, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=9.21s]
Epoch 1: 90%|█████████ | 11203/12384 [23:46:31<2:32:11, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 90%|█████████ | 11204/12384 [23:46:31<2:31:17, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 90%|█████████ | 11204/12384 [23:46:39<2:31:17, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=3.65s]
Epoch 1: 90%|█████████ | 11205/12384 [23:46:39<2:30:40, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=3.65s]
Epoch 1: 90%|█████████ | 11205/12384 [23:46:47<2:30:40, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 1: 90%|█████████ | 11206/12384 [23:46:47<2:30:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 1: 90%|█████████ | 11206/12384 [23:46:54<2:30:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 90%|█████████ | 11207/12384 [23:46:54<2:29:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 90%|█████████ | 11207/12384 [23:47:02<2:29:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 91%|█████████ | 11208/12384 [23:47:02<2:29:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 91%|█████████ | 11208/12384 [23:47:09<2:29:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 91%|█████████ | 11209/12384 [23:47:09<2:29:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 91%|█████████ | 11209/12384 [23:47:17<2:29:12, 7.62s/it, loss=0.0002, acc=0.9989, iter_time=6.98s]
Epoch 1: 91%|█████████ | 11210/12384 [23:47:17<2:29:02, 7.62s/it, loss=0.0002, acc=0.9989, iter_time=6.98s]
Epoch 1: 91%|█████████ | 11210/12384 [23:47:25<2:29:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 1: 91%|█████████ | 11211/12384 [23:47:25<2:28:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 1: 91%|█████████ | 11211/12384 [23:47:32<2:28:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 1: 91%|█████████ | 11212/12384 [23:47:32<2:28:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 1: 91%|█████████ | 11212/12384 [23:47:40<2:28:43, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 1: 91%|█████████ | 11213/12384 [23:47:40<2:28:30, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 1: 91%|█████████ | 11213/12384 [23:47:47<2:28:30, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=7.63s]
Epoch 1: 91%|█████████ | 11214/12384 [23:47:47<2:28:27, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=7.63s]
Epoch 1: 91%|█████████ | 11214/12384 [23:47:55<2:28:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 91%|█████████ | 11215/12384 [23:47:55<2:28:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 91%|█████████ | 11215/12384 [23:48:03<2:28:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 91%|█████████ | 11216/12384 [23:48:03<2:28:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 91%|█████████ | 11216/12384 [23:48:10<2:28:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.36s]
Epoch 1: 91%|█████████ | 11217/12384 [23:48:10<2:28:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.36s]
Epoch 1: 91%|█████████ | 11217/12384 [23:48:18<2:28:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 1: 91%|█████████ | 11218/12384 [23:48:18<2:28:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 1: 91%|█████████ | 11218/12384 [23:48:26<2:28:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 91%|█████████ | 11219/12384 [23:48:26<2:28:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 91%|█████████ | 11219/12384 [23:48:33<2:28:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 91%|█████████ | 11220/12384 [23:48:33<2:28:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 91%|█████████ | 11220/12384 [23:48:41<2:28:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 91%|█████████ | 11221/12384 [23:48:41<2:27:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 91%|█████████ | 11221/12384 [23:48:48<2:27:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 91%|█████████ | 11222/12384 [23:48:48<2:27:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 91%|█████████ | 11222/12384 [23:48:56<2:27:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 1: 91%|█████████ | 11223/12384 [23:48:56<2:27:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 1: 91%|█████████ | 11223/12384 [23:49:04<2:27:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 1: 91%|█████████ | 11224/12384 [23:49:04<2:27:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 1: 91%|█████████ | 11224/12384 [23:49:11<2:27:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 1: 91%|█████████ | 11225/12384 [23:49:11<2:26:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 1: 91%|█████████ | 11225/12384 [23:49:19<2:26:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 1: 91%|█████████ | 11226/12384 [23:49:19<2:26:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 1: 91%|█████████ | 11226/12384 [23:49:27<2:26:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 91%|█████████ | 11227/12384 [23:49:27<2:26:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 91%|█████████ | 11227/12384 [23:49:34<2:26:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 91%|█████████ | 11228/12384 [23:49:34<2:26:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 91%|█████████ | 11228/12384 [23:49:42<2:26:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.68s]
Epoch 1: 91%|█████████ | 11229/12384 [23:49:42<2:28:32, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=4.68s]
Epoch 1: 91%|█████████ | 11229/12384 [23:49:50<2:28:32, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.50s]
Epoch 1: 91%|█████████ | 11230/12384 [23:49:50<2:27:44, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.50s]
Epoch 1: 91%|█████████ | 11230/12384 [23:49:57<2:27:44, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 1: 91%|█████████ | 11231/12384 [23:49:57<2:27:39, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 1: 91%|█████████ | 11231/12384 [23:50:05<2:27:39, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 1: 91%|█████████ | 11232/12384 [23:50:05<2:27:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 1: 91%|█████████ | 11232/12384 [23:50:13<2:27:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 91%|█████████ | 11233/12384 [23:50:13<2:26:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 91%|█████████ | 11233/12384 [23:50:20<2:26:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 91%|█████████ | 11234/12384 [23:50:20<2:26:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 91%|█████████ | 11234/12384 [23:50:28<2:26:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 91%|█████████ | 11235/12384 [23:50:28<2:26:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 91%|█████████ | 11235/12384 [23:50:35<2:26:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 91%|█████████ | 11236/12384 [23:50:35<2:25:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 91%|█████████ | 11236/12384 [23:50:43<2:25:58, 7.63s/it, loss=0.0039, acc=0.9860, iter_time=5.88s]
Epoch 1: 91%|█████████ | 11237/12384 [23:50:43<2:25:35, 7.62s/it, loss=0.0039, acc=0.9860, iter_time=5.88s]
Epoch 1: 91%|█████████ | 11237/12384 [23:50:51<2:25:35, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.52s]
Epoch 1: 91%|█████████ | 11238/12384 [23:50:51<2:25:27, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.52s]
Epoch 1: 91%|█████████ | 11238/12384 [23:50:58<2:25:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 1: 91%|█████████ | 11239/12384 [23:50:58<2:25:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 1: 91%|█████████ | 11239/12384 [23:51:06<2:25:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 91%|█████████ | 11240/12384 [23:51:06<2:25:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 91%|█████████ | 11240/12384 [23:51:13<2:25:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.73s]
Epoch 1: 91%|█████████ | 11241/12384 [23:51:13<2:25:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.73s]
Epoch 1: 91%|█████████ | 11241/12384 [23:51:21<2:25:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 1: 91%|█████████ | 11242/12384 [23:51:21<2:24:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 1: 91%|█████████ | 11242/12384 [23:51:29<2:24:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 91%|█████████ | 11243/12384 [23:51:29<2:24:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 91%|█████████ | 11243/12384 [23:51:36<2:24:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 91%|█████████ | 11244/12384 [23:51:36<2:24:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 91%|█████████ | 11244/12384 [23:51:44<2:24:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 1: 91%|█████████ | 11245/12384 [23:51:44<2:24:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 1: 91%|█████████ | 11245/12384 [23:51:52<2:24:33, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.76s]
Epoch 1: 91%|█████████ | 11246/12384 [23:51:52<2:24:29, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.76s]
Epoch 1: 91%|█████████ | 11246/12384 [23:51:59<2:24:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 1: 91%|█████████ | 11247/12384 [23:51:59<2:24:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 1: 91%|█████████ | 11247/12384 [23:52:07<2:24:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 91%|█████████ | 11248/12384 [23:52:07<2:24:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 91%|█████████ | 11248/12384 [23:52:14<2:24:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 91%|█████████ | 11249/12384 [23:52:14<2:23:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 91%|█████████ | 11249/12384 [23:52:22<2:23:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 1: 91%|█████████ | 11250/12384 [23:52:22<2:23:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 1: 91%|█████████ | 11250/12384 [23:52:30<2:23:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 1: 91%|█████████ | 11251/12384 [23:52:30<2:23:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 1: 91%|█████████ | 11251/12384 [23:52:37<2:23:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 91%|█████████ | 11252/12384 [23:52:37<2:25:06, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 91%|█████████ | 11252/12384 [23:52:45<2:25:06, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 91%|█████████ | 11253/12384 [23:52:45<2:24:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 91%|█████████ | 11253/12384 [23:52:53<2:24:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 91%|█████████ | 11254/12384 [23:52:53<2:24:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 91%|█████████ | 11254/12384 [23:53:00<2:24:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.77s]
Epoch 1: 91%|█████████ | 11255/12384 [23:53:00<2:23:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.77s]
Epoch 1: 91%|█████████ | 11255/12384 [23:53:08<2:23:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 1: 91%|█████████ | 11256/12384 [23:53:08<2:25:17, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 1: 91%|█████████ | 11256/12384 [23:53:16<2:25:17, 7.73s/it, loss=0.0002, acc=0.9989, iter_time=7.64s]
Epoch 1: 91%|█████████ | 11257/12384 [23:53:16<2:24:24, 7.69s/it, loss=0.0002, acc=0.9989, iter_time=7.64s]
Epoch 1: 91%|█████████ | 11257/12384 [23:53:24<2:24:24, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 91%|█████████ | 11258/12384 [23:53:24<2:24:24, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 91%|█████████ | 11258/12384 [23:53:31<2:24:24, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 91%|█████████ | 11259/12384 [23:53:31<2:24:18, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 91%|█████████ | 11259/12384 [23:53:39<2:24:18, 7.70s/it, loss=0.0006, acc=0.9977, iter_time=7.68s]
Epoch 1: 91%|█████████ | 11260/12384 [23:53:39<2:23:42, 7.67s/it, loss=0.0006, acc=0.9977, iter_time=7.68s]
Epoch 1: 91%|█████████ | 11260/12384 [23:53:46<2:23:42, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 91%|█████████ | 11261/12384 [23:53:46<2:23:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 91%|█████████ | 11261/12384 [23:53:54<2:23:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 1: 91%|█████████ | 11262/12384 [23:53:54<2:22:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 1: 91%|█████████ | 11262/12384 [23:54:02<2:22:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 1: 91%|█████████ | 11263/12384 [23:54:02<2:22:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 1: 91%|█████████ | 11263/12384 [23:54:09<2:22:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 91%|█████████ | 11264/12384 [23:54:09<2:22:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 91%|█████████ | 11264/12384 [23:54:17<2:22:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 91%|█████████ | 11265/12384 [23:54:17<2:22:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 91%|█████████ | 11265/12384 [23:54:25<2:22:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 1: 91%|█████████ | 11266/12384 [23:54:25<2:22:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 1: 91%|█████████ | 11266/12384 [23:54:32<2:22:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 91%|█████████ | 11267/12384 [23:54:32<2:22:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 91%|█████████ | 11267/12384 [23:54:40<2:22:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 91%|█████████ | 11268/12384 [23:54:40<2:21:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 91%|█████████ | 11268/12384 [23:54:47<2:21:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 1: 91%|█████████ | 11269/12384 [23:54:47<2:21:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 1: 91%|█████████ | 11269/12384 [23:54:55<2:21:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.68s]
Epoch 1: 91%|█████████ | 11270/12384 [23:54:55<2:21:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.68s]
Epoch 1: 91%|█████████ | 11270/12384 [23:55:03<2:21:12, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.30s]
Epoch 1: 91%|█████████ | 11271/12384 [23:55:03<2:21:07, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.30s]
Epoch 1: 91%|█████████ | 11271/12384 [23:55:10<2:21:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.30s]
Epoch 1: 91%|█████████ | 11272/12384 [23:55:10<2:21:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.30s]
Epoch 1: 91%|█████████ | 11272/12384 [23:55:18<2:21:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.85s]
Epoch 1: 91%|█████████ | 11273/12384 [23:55:18<2:21:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.85s]
Epoch 1: 91%|█████████ | 11273/12384 [23:55:26<2:21:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.03s]
Epoch 1: 91%|█████████ | 11274/12384 [23:55:26<2:21:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.03s]
Epoch 1: 91%|█████████ | 11274/12384 [23:55:33<2:21:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 91%|█████████ | 11275/12384 [23:55:33<2:21:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 91%|█████████ | 11275/12384 [23:55:41<2:21:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 91%|█████████ | 11276/12384 [23:55:41<2:20:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 91%|█████████ | 11276/12384 [23:55:48<2:20:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 1: 91%|█████████ | 11277/12384 [23:55:48<2:20:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 1: 91%|█████████ | 11277/12384 [23:55:56<2:20:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 1: 91%|█████████ | 11278/12384 [23:55:56<2:21:58, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 1: 91%|█████████ | 11278/12384 [23:56:04<2:21:58, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 1: 91%|█████████ | 11279/12384 [23:56:04<2:21:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 1: 91%|█████████ | 11279/12384 [23:56:12<2:21:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.59s]
Epoch 1: 91%|█████████ | 11280/12384 [23:56:12<2:20:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.59s]
Epoch 1: 91%|█████████ | 11280/12384 [23:56:19<2:20:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 91%|█████████ | 11281/12384 [23:56:19<2:20:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 91%|█████████ | 11281/12384 [23:56:27<2:20:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 91%|█████████ | 11282/12384 [23:56:27<2:22:00, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 91%|█████████ | 11282/12384 [23:56:35<2:22:00, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 91%|█████████ | 11283/12384 [23:56:35<2:21:14, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 91%|█████████ | 11283/12384 [23:56:42<2:21:14, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 1: 91%|█████████ | 11284/12384 [23:56:42<2:20:41, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 1: 91%|█████████ | 11284/12384 [23:56:50<2:20:41, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.75s]
Epoch 1: 91%|█████████ | 11285/12384 [23:56:50<2:20:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.75s]
Epoch 1: 91%|█████████ | 11285/12384 [23:56:58<2:20:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.31s]
Epoch 1: 91%|█████████ | 11286/12384 [23:56:58<2:19:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.31s]
Epoch 1: 91%|█████████ | 11286/12384 [23:57:05<2:19:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 1: 91%|█████████ | 11287/12384 [23:57:05<2:19:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 1: 91%|█████████ | 11287/12384 [23:57:13<2:19:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 1: 91%|█████████ | 11288/12384 [23:57:13<2:19:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 1: 91%|█████████ | 11288/12384 [23:57:20<2:19:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.02s]
Epoch 1: 91%|█████████ | 11289/12384 [23:57:20<2:19:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.02s]
Epoch 1: 91%|█████████ | 11289/12384 [23:57:28<2:19:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.86s]
Epoch 1: 91%|█████████ | 11290/12384 [23:57:28<2:19:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.86s]
Epoch 1: 91%|█████████ | 11290/12384 [23:57:36<2:19:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 1: 91%|█████████ | 11291/12384 [23:57:36<2:19:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 1: 91%|█████████ | 11291/12384 [23:57:43<2:19:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 1: 91%|█████████ | 11292/12384 [23:57:43<2:18:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 1: 91%|█████████ | 11292/12384 [23:57:51<2:18:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 91%|█████████ | 11293/12384 [23:57:51<2:18:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 91%|█████████ | 11293/12384 [23:57:59<2:18:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 1: 91%|█████████ | 11294/12384 [23:57:59<2:18:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 1: 91%|█████████ | 11294/12384 [23:58:06<2:18:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.70s]
Epoch 1: 91%|█████████ | 11295/12384 [23:58:06<2:18:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.70s]
Epoch 1: 91%|█████████ | 11295/12384 [23:58:14<2:18:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 91%|█████████ | 11296/12384 [23:58:14<2:17:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 91%|█████████ | 11296/12384 [23:58:21<2:17:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 1: 91%|█████████ | 11297/12384 [23:58:21<2:17:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 1: 91%|█████████ | 11297/12384 [23:58:29<2:17:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 1: 91%|█████████ | 11298/12384 [23:58:29<2:17:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 1: 91%|█████████ | 11298/12384 [23:58:37<2:17:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 1: 91%|█████████ | 11299/12384 [23:58:37<2:17:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 1: 91%|█████████ | 11299/12384 [23:58:44<2:17:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 1: 91%|█████████ | 11300/12384 [23:58:44<2:17:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 1: 91%|█████████ | 11300/12384 [23:58:52<2:17:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 1: 91%|█████████▏| 11301/12384 [23:58:52<2:17:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 1: 91%|█████████▏| 11301/12384 [23:58:59<2:17:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.45s]
Epoch 1: 91%|█████████▏| 11302/12384 [23:58:59<2:17:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.45s]
Epoch 1: 91%|█████████▏| 11302/12384 [23:59:07<2:17:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 1: 91%|█████████▏| 11303/12384 [23:59:07<2:17:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 1: 91%|█████████▏| 11303/12384 [23:59:15<2:17:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 91%|█████████▏| 11304/12384 [23:59:15<2:17:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 91%|█████████▏| 11304/12384 [23:59:22<2:17:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 1: 91%|█████████▏| 11305/12384 [23:59:22<2:17:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 1: 91%|█████████▏| 11305/12384 [23:59:30<2:17:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 91%|█████████▏| 11306/12384 [23:59:30<2:16:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 91%|█████████▏| 11306/12384 [23:59:37<2:16:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 1: 91%|█████████▏| 11307/12384 [23:59:37<2:16:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 1: 91%|█████████▏| 11307/12384 [23:59:45<2:16:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 1: 91%|█████████▏| 11308/12384 [23:59:45<2:16:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 1: 91%|█████████▏| 11308/12384 [23:59:53<2:16:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 91%|█████████▏| 11309/12384 [23:59:53<2:18:13, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 91%|█████████▏| 11309/12384 [24:00:01<2:18:13, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.91s]
Epoch 1: 91%|█████████▏| 11310/12384 [24:00:01<2:17:41, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.91s]
Epoch 1: 91%|█████████▏| 11310/12384 [24:00:08<2:17:41, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 91%|█████████▏| 11311/12384 [24:00:08<2:17:06, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 91%|█████████▏| 11311/12384 [24:00:16<2:17:06, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 91%|█████████▏| 11312/12384 [24:00:16<2:16:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 91%|█████████▏| 11312/12384 [24:00:24<2:16:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 1: 91%|█████████▏| 11313/12384 [24:00:24<2:16:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 1: 91%|█████████▏| 11313/12384 [24:00:31<2:16:23, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.04s]
Epoch 1: 91%|█████████▏| 11314/12384 [24:00:31<2:16:09, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.04s]
Epoch 1: 91%|█████████▏| 11314/12384 [24:00:39<2:16:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 1: 91%|█████████▏| 11315/12384 [24:00:39<2:15:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 1: 91%|█████████▏| 11315/12384 [24:00:46<2:15:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 91%|█████████▏| 11316/12384 [24:00:46<2:15:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 91%|█████████▏| 11316/12384 [24:00:54<2:15:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.63s]
Epoch 1: 91%|█████████▏| 11317/12384 [24:00:54<2:15:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.63s]
Epoch 1: 91%|█████████▏| 11317/12384 [24:01:02<2:15:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 1: 91%|█████████▏| 11318/12384 [24:01:02<2:15:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 1: 91%|█████████▏| 11318/12384 [24:01:09<2:15:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.23s]
Epoch 1: 91%|█████████▏| 11319/12384 [24:01:09<2:15:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.23s]
Epoch 1: 91%|█████████▏| 11319/12384 [24:01:17<2:15:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.93s]
Epoch 1: 91%|█████████▏| 11320/12384 [24:01:17<2:15:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.93s]
Epoch 1: 91%|█████████▏| 11320/12384 [24:01:24<2:15:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 91%|█████████▏| 11321/12384 [24:01:24<2:14:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 91%|█████████▏| 11321/12384 [24:01:32<2:14:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.03s]
Epoch 1: 91%|█████████▏| 11322/12384 [24:01:32<2:14:34, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.03s]
Epoch 1: 91%|█████████▏| 11322/12384 [24:01:40<2:14:34, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.16s]
Epoch 1: 91%|█████████▏| 11323/12384 [24:01:40<2:14:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.16s]
Epoch 1: 91%|█████████▏| 11323/12384 [24:01:47<2:14:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 91%|█████████▏| 11324/12384 [24:01:47<2:14:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 91%|█████████▏| 11324/12384 [24:01:55<2:14:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 1: 91%|█████████▏| 11325/12384 [24:01:55<2:14:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 1: 91%|█████████▏| 11325/12384 [24:02:02<2:14:09, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.87s]
Epoch 1: 91%|█████████▏| 11326/12384 [24:02:02<2:14:00, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.87s]
Epoch 1: 91%|█████████▏| 11326/12384 [24:02:10<2:14:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 91%|█████████▏| 11327/12384 [24:02:10<2:13:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 91%|█████████▏| 11327/12384 [24:02:18<2:13:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 91%|█████████▏| 11328/12384 [24:02:18<2:13:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 91%|█████████▏| 11328/12384 [24:02:25<2:13:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.44s]
Epoch 1: 91%|█████████▏| 11329/12384 [24:02:25<2:13:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.44s]
Epoch 1: 91%|█████████▏| 11329/12384 [24:02:33<2:13:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 1: 91%|█████████▏| 11330/12384 [24:02:33<2:13:24, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 1: 91%|█████████▏| 11330/12384 [24:02:40<2:13:24, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=7.82s]
Epoch 1: 91%|█████████▏| 11331/12384 [24:02:40<2:13:14, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=7.82s]
Epoch 1: 91%|█████████▏| 11331/12384 [24:02:48<2:13:14, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 1: 92%|█████████▏| 11332/12384 [24:02:48<2:13:12, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 1: 92%|█████████▏| 11332/12384 [24:02:56<2:13:12, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 92%|█████████▏| 11333/12384 [24:02:56<2:13:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 92%|█████████▏| 11333/12384 [24:03:03<2:13:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 1: 92%|█████████▏| 11334/12384 [24:03:03<2:13:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 1: 92%|█████████▏| 11334/12384 [24:03:11<2:13:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.89s]
Epoch 1: 92%|█████████▏| 11335/12384 [24:03:11<2:14:50, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.89s]
Epoch 1: 92%|█████████▏| 11335/12384 [24:03:19<2:14:50, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 1: 92%|█████████▏| 11336/12384 [24:03:19<2:14:20, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 1: 92%|█████████▏| 11336/12384 [24:03:26<2:14:20, 7.69s/it, loss=0.0001, acc=0.9998, iter_time=7.65s]
Epoch 1: 92%|█████████▏| 11337/12384 [24:03:26<2:13:46, 7.67s/it, loss=0.0001, acc=0.9998, iter_time=7.65s]
Epoch 1: 92%|█████████▏| 11337/12384 [24:03:34<2:13:46, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 1: 92%|█████████▏| 11338/12384 [24:03:34<2:13:28, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 1: 92%|█████████▏| 11338/12384 [24:03:42<2:13:28, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 92%|█████████▏| 11339/12384 [24:03:42<2:12:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 92%|█████████▏| 11339/12384 [24:03:49<2:12:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 92%|█████████▏| 11340/12384 [24:03:49<2:12:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 92%|█████████▏| 11340/12384 [24:03:57<2:12:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 1: 92%|█████████▏| 11341/12384 [24:03:57<2:12:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 1: 92%|█████████▏| 11341/12384 [24:04:04<2:12:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 1: 92%|█████████▏| 11342/12384 [24:04:04<2:12:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 1: 92%|█████████▏| 11342/12384 [24:04:12<2:12:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.19s]
Epoch 1: 92%|█████████▏| 11343/12384 [24:04:12<2:12:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.19s]
Epoch 1: 92%|█████████▏| 11343/12384 [24:04:20<2:12:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 1: 92%|█████████▏| 11344/12384 [24:04:20<2:12:44, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 1: 92%|█████████▏| 11344/12384 [24:04:28<2:12:44, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 92%|█████████▏| 11345/12384 [24:04:28<2:12:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 92%|█████████▏| 11345/12384 [24:04:35<2:12:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 92%|█████████▏| 11346/12384 [24:04:35<2:12:36, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 92%|█████████▏| 11346/12384 [24:04:43<2:12:36, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.76s]
Epoch 1: 92%|█████████▏| 11347/12384 [24:04:43<2:12:33, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.76s]
Epoch 1: 92%|█████████▏| 11347/12384 [24:04:50<2:12:33, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 92%|█████████▏| 11348/12384 [24:04:50<2:12:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 92%|█████████▏| 11348/12384 [24:04:58<2:12:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 92%|█████████▏| 11349/12384 [24:04:58<2:11:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 92%|█████████▏| 11349/12384 [24:05:06<2:11:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 92%|█████████▏| 11350/12384 [24:05:06<2:11:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 92%|█████████▏| 11350/12384 [24:05:13<2:11:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.39s]
Epoch 1: 92%|█████████▏| 11351/12384 [24:05:13<2:11:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.39s]
Epoch 1: 92%|█████████▏| 11351/12384 [24:05:21<2:11:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.28s]
Epoch 1: 92%|█████████▏| 11352/12384 [24:05:21<2:11:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.28s]
Epoch 1: 92%|█████████▏| 11352/12384 [24:05:29<2:11:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.42s]
Epoch 1: 92%|█████████▏| 11353/12384 [24:05:29<2:11:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.42s]
Epoch 1: 92%|█████████▏| 11353/12384 [24:05:36<2:11:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.83s]
Epoch 1: 92%|█████████▏| 11354/12384 [24:05:36<2:10:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.83s]
Epoch 1: 92%|█████████▏| 11354/12384 [24:05:44<2:10:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 1: 92%|█████████▏| 11355/12384 [24:05:44<2:10:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 1: 92%|█████████▏| 11355/12384 [24:05:52<2:10:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 1: 92%|█████████▏| 11356/12384 [24:05:52<2:10:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 1: 92%|█████████▏| 11356/12384 [24:05:59<2:10:53, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.40s]
Epoch 1: 92%|█████████▏| 11357/12384 [24:05:59<2:10:48, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.40s]
Epoch 1: 92%|█████████▏| 11357/12384 [24:06:07<2:10:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.25s]
Epoch 1: 92%|█████████▏| 11358/12384 [24:06:07<2:10:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.25s]
Epoch 1: 92%|█████████▏| 11358/12384 [24:06:14<2:10:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 92%|█████████▏| 11359/12384 [24:06:14<2:10:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 92%|█████████▏| 11359/12384 [24:06:22<2:10:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 92%|█████████▏| 11360/12384 [24:06:22<2:10:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 92%|█████████▏| 11360/12384 [24:06:30<2:10:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 1: 92%|█████████▏| 11361/12384 [24:06:30<2:11:43, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 1: 92%|█████████▏| 11361/12384 [24:06:38<2:11:43, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 1: 92%|█████████▏| 11362/12384 [24:06:38<2:11:02, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 1: 92%|█████████▏| 11362/12384 [24:06:45<2:11:02, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 92%|█████████▏| 11363/12384 [24:06:45<2:10:23, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 92%|█████████▏| 11363/12384 [24:06:53<2:10:23, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 92%|█████████▏| 11364/12384 [24:06:53<2:09:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 92%|█████████▏| 11364/12384 [24:07:00<2:09:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 92%|█████████▏| 11365/12384 [24:07:00<2:09:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 92%|█████████▏| 11365/12384 [24:07:08<2:09:40, 7.64s/it, loss=0.0002, acc=0.9990, iter_time=7.99s]
Epoch 1: 92%|█████████▏| 11366/12384 [24:07:08<2:09:17, 7.62s/it, loss=0.0002, acc=0.9990, iter_time=7.99s]
Epoch 1: 92%|█████████▏| 11366/12384 [24:07:16<2:09:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.73s]
Epoch 1: 92%|█████████▏| 11367/12384 [24:07:16<2:09:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.73s]
Epoch 1: 92%|█████████▏| 11367/12384 [24:07:23<2:09:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.49s]
Epoch 1: 92%|█████████▏| 11368/12384 [24:07:23<2:08:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.49s]
Epoch 1: 92%|█████████▏| 11368/12384 [24:07:31<2:08:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.72s]
Epoch 1: 92%|█████████▏| 11369/12384 [24:07:31<2:08:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.72s]
Epoch 1: 92%|█████████▏| 11369/12384 [24:07:38<2:08:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.52s]
Epoch 1: 92%|█████████▏| 11370/12384 [24:07:38<2:08:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.52s]
Epoch 1: 92%|█████████▏| 11370/12384 [24:07:46<2:08:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 1: 92%|█████████▏| 11371/12384 [24:07:46<2:08:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 1: 92%|█████████▏| 11371/12384 [24:07:54<2:08:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 1: 92%|█████████▏| 11372/12384 [24:07:54<2:08:12, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 1: 92%|█████████▏| 11372/12384 [24:08:01<2:08:12, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 92%|█████████▏| 11373/12384 [24:08:01<2:08:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 92%|█████████▏| 11373/12384 [24:08:09<2:08:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.77s]
Epoch 1: 92%|█████████▏| 11374/12384 [24:08:09<2:08:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.77s]
Epoch 1: 92%|█████████▏| 11374/12384 [24:08:17<2:08:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 1: 92%|█████████▏| 11375/12384 [24:08:17<2:08:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 1: 92%|█████████▏| 11375/12384 [24:08:24<2:08:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 92%|█████████▏| 11376/12384 [24:08:24<2:08:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 92%|█████████▏| 11376/12384 [24:08:32<2:08:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 92%|█████████▏| 11377/12384 [24:08:32<2:07:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 92%|█████████▏| 11377/12384 [24:08:39<2:07:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 1: 92%|█████████▏| 11378/12384 [24:08:39<2:07:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 1: 92%|█████████▏| 11378/12384 [24:08:47<2:07:50, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.93s]
Epoch 1: 92%|█████████▏| 11379/12384 [24:08:47<2:07:35, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.93s]
Epoch 1: 92%|█████████▏| 11379/12384 [24:08:55<2:07:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 1: 92%|█████████▏| 11380/12384 [24:08:55<2:07:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 1: 92%|█████████▏| 11380/12384 [24:09:02<2:07:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.28s]
Epoch 1: 92%|█████████▏| 11381/12384 [24:09:02<2:07:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.28s]
Epoch 1: 92%|█████████▏| 11381/12384 [24:09:10<2:07:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 92%|█████████▏| 11382/12384 [24:09:10<2:07:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 92%|█████████▏| 11382/12384 [24:09:18<2:07:08, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.89s]
Epoch 1: 92%|█████████▏| 11383/12384 [24:09:18<2:08:24, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.89s]
Epoch 1: 92%|█████████▏| 11383/12384 [24:09:25<2:08:24, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 92%|█████████▏| 11384/12384 [24:09:25<2:08:00, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 92%|█████████▏| 11384/12384 [24:09:33<2:08:00, 7.68s/it, loss=0.0002, acc=0.9995, iter_time=5.76s]
Epoch 1: 92%|█████████▏| 11385/12384 [24:09:33<2:07:26, 7.65s/it, loss=0.0002, acc=0.9995, iter_time=5.76s]
Epoch 1: 92%|█████████▏| 11385/12384 [24:09:41<2:07:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 92%|█████████▏| 11386/12384 [24:09:41<2:07:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 92%|█████████▏| 11386/12384 [24:09:49<2:07:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.76s]
Epoch 1: 92%|█████████▏| 11387/12384 [24:09:49<2:08:25, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.76s]
Epoch 1: 92%|█████████▏| 11387/12384 [24:09:56<2:08:25, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.79s]
Epoch 1: 92%|█████████▏| 11388/12384 [24:09:56<2:07:52, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.79s]
Epoch 1: 92%|█████████▏| 11388/12384 [24:10:04<2:07:52, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.59s]
Epoch 1: 92%|█████████▏| 11389/12384 [24:10:04<2:07:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.59s]
Epoch 1: 92%|█████████▏| 11389/12384 [24:10:11<2:07:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 1: 92%|█████████▏| 11390/12384 [24:10:11<2:06:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 1: 92%|█████████▏| 11390/12384 [24:10:19<2:06:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 92%|█████████▏| 11391/12384 [24:10:19<2:06:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 1: 92%|█████████▏| 11391/12384 [24:10:27<2:06:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.90s]
Epoch 1: 92%|█████████▏| 11392/12384 [24:10:27<2:06:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.90s]
Epoch 1: 92%|█████████▏| 11392/12384 [24:10:34<2:06:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 1: 92%|█████████▏| 11393/12384 [24:10:34<2:05:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 1: 92%|█████████▏| 11393/12384 [24:10:42<2:05:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 1: 92%|█████████▏| 11394/12384 [24:10:42<2:05:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 1: 92%|█████████▏| 11394/12384 [24:10:49<2:05:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 92%|█████████▏| 11395/12384 [24:10:49<2:05:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 92%|█████████▏| 11395/12384 [24:10:57<2:05:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 92%|█████████▏| 11396/12384 [24:10:57<2:05:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 92%|█████████▏| 11396/12384 [24:11:05<2:05:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 92%|█████████▏| 11397/12384 [24:11:05<2:05:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 92%|█████████▏| 11397/12384 [24:11:12<2:05:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 92%|█████████▏| 11398/12384 [24:11:12<2:05:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 92%|█████████▏| 11398/12384 [24:11:20<2:05:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 1: 92%|█████████▏| 11399/12384 [24:11:20<2:04:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 1: 92%|█████████▏| 11399/12384 [24:11:27<2:04:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.82s]
Epoch 1: 92%|█████████▏| 11400/12384 [24:11:27<2:04:41, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.82s]
Epoch 1: 92%|█████████▏| 11400/12384 [24:11:35<2:04:41, 7.60s/it, loss=0.0005, acc=0.9974, iter_time=7.05s]
Epoch 1: 92%|█████████▏| 11401/12384 [24:11:35<2:04:36, 7.61s/it, loss=0.0005, acc=0.9974, iter_time=7.05s]
Epoch 1: 92%|█████████▏| 11401/12384 [24:11:43<2:04:36, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.21s]
Epoch 1: 92%|█████████▏| 11402/12384 [24:11:43<2:04:39, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.21s]
Epoch 1: 92%|█████████▏| 11402/12384 [24:11:50<2:04:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 92%|█████████▏| 11403/12384 [24:11:50<2:04:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 92%|█████████▏| 11403/12384 [24:11:58<2:04:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.50s]
Epoch 1: 92%|█████████▏| 11404/12384 [24:11:58<2:05:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.50s]
Epoch 1: 92%|█████████▏| 11404/12384 [24:12:06<2:05:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 1: 92%|█████████▏| 11405/12384 [24:12:06<2:04:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 1: 92%|█████████▏| 11405/12384 [24:12:13<2:04:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 92%|█████████▏| 11406/12384 [24:12:13<2:04:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 92%|█████████▏| 11406/12384 [24:12:21<2:04:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.54s]
Epoch 1: 92%|█████████▏| 11407/12384 [24:12:21<2:04:56, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.54s]
Epoch 1: 92%|█████████▏| 11407/12384 [24:12:29<2:04:56, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.23s]
Epoch 1: 92%|█████████▏| 11408/12384 [24:12:29<2:04:32, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.23s]
Epoch 1: 92%|█████████▏| 11408/12384 [24:12:37<2:04:32, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 92%|█████████▏| 11409/12384 [24:12:37<2:05:40, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 92%|█████████▏| 11409/12384 [24:12:44<2:05:40, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=4.54s]
Epoch 1: 92%|█████████▏| 11410/12384 [24:12:44<2:04:52, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.54s]
Epoch 1: 92%|█████████▏| 11410/12384 [24:12:52<2:04:52, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 1: 92%|█████████▏| 11411/12384 [24:12:52<2:04:17, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 1: 92%|█████████▏| 11411/12384 [24:12:59<2:04:17, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 92%|█████████▏| 11412/12384 [24:12:59<2:04:14, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 92%|█████████▏| 11412/12384 [24:13:07<2:04:14, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 1: 92%|█████████▏| 11413/12384 [24:13:07<2:05:25, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 1: 92%|█████████▏| 11413/12384 [24:13:15<2:05:25, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 92%|█████████▏| 11414/12384 [24:13:15<2:04:43, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 92%|█████████▏| 11414/12384 [24:13:23<2:04:43, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 92%|█████████▏| 11415/12384 [24:13:23<2:04:16, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 92%|█████████▏| 11415/12384 [24:13:30<2:04:16, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 1: 92%|█████████▏| 11416/12384 [24:13:30<2:03:48, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 1: 92%|█████████▏| 11416/12384 [24:13:38<2:03:48, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.89s]
Epoch 1: 92%|█████████▏| 11417/12384 [24:13:38<2:03:23, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.89s]
Epoch 1: 92%|█████████▏| 11417/12384 [24:13:46<2:03:23, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 1: 92%|█████████▏| 11418/12384 [24:13:46<2:03:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 1: 92%|█████████▏| 11418/12384 [24:13:53<2:03:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.38s]
Epoch 1: 92%|█████████▏| 11419/12384 [24:13:53<2:02:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.38s]
Epoch 1: 92%|█████████▏| 11419/12384 [24:14:01<2:02:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.97s]
Epoch 1: 92%|█████████▏| 11420/12384 [24:14:01<2:02:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.97s]
Epoch 1: 92%|█████████▏| 11420/12384 [24:14:08<2:02:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 92%|█████████▏| 11421/12384 [24:14:08<2:02:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 92%|█████████▏| 11421/12384 [24:14:16<2:02:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 92%|█████████▏| 11422/12384 [24:14:16<2:02:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 92%|█████████▏| 11422/12384 [24:14:24<2:02:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 1: 92%|█████████▏| 11423/12384 [24:14:24<2:01:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 1: 92%|█████████▏| 11423/12384 [24:14:31<2:01:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.35s]
Epoch 1: 92%|█████████▏| 11424/12384 [24:14:31<2:01:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.35s]
Epoch 1: 92%|█████████▏| 11424/12384 [24:14:39<2:01:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 92%|█████████▏| 11425/12384 [24:14:39<2:01:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 92%|█████████▏| 11425/12384 [24:14:46<2:01:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 1: 92%|█████████▏| 11426/12384 [24:14:46<2:01:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 1: 92%|█████████▏| 11426/12384 [24:14:54<2:01:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 92%|█████████▏| 11427/12384 [24:14:54<2:01:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 92%|█████████▏| 11427/12384 [24:15:02<2:01:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 92%|█████████▏| 11428/12384 [24:15:02<2:01:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 92%|█████████▏| 11428/12384 [24:15:09<2:01:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.89s]
Epoch 1: 92%|█████████▏| 11429/12384 [24:15:09<2:01:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.89s]
Epoch 1: 92%|█████████▏| 11429/12384 [24:15:17<2:01:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 1: 92%|█████████▏| 11430/12384 [24:15:17<2:01:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 1: 92%|█████████▏| 11430/12384 [24:15:25<2:01:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.35s]
Epoch 1: 92%|█████████▏| 11431/12384 [24:15:25<2:00:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.35s]
Epoch 1: 92%|█████████▏| 11431/12384 [24:15:32<2:00:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.80s]
Epoch 1: 92%|█████████▏| 11432/12384 [24:15:32<2:00:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.80s]
Epoch 1: 92%|█████████▏| 11432/12384 [24:15:40<2:00:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.47s]
Epoch 1: 92%|█████████▏| 11433/12384 [24:15:40<2:00:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.47s]
Epoch 1: 92%|█████████▏| 11433/12384 [24:15:47<2:00:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.37s]
Epoch 1: 92%|█████████▏| 11434/12384 [24:15:47<2:00:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.37s]
Epoch 1: 92%|█████████▏| 11434/12384 [24:15:55<2:00:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 92%|█████████▏| 11435/12384 [24:15:55<2:00:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 92%|█████████▏| 11435/12384 [24:16:03<2:00:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 92%|█████████▏| 11436/12384 [24:16:03<2:01:34, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 92%|█████████▏| 11436/12384 [24:16:10<2:01:34, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 92%|█████████▏| 11437/12384 [24:16:10<2:01:05, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 92%|█████████▏| 11437/12384 [24:16:18<2:01:05, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 1: 92%|█████████▏| 11438/12384 [24:16:18<2:00:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 1: 92%|█████████▏| 11438/12384 [24:16:26<2:00:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 1: 92%|█████████▏| 11439/12384 [24:16:26<2:00:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 1: 92%|█████████▏| 11439/12384 [24:16:34<2:00:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 1: 92%|█████████▏| 11440/12384 [24:16:34<2:01:27, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 1: 92%|█████████▏| 11440/12384 [24:16:41<2:01:27, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.43s]
Epoch 1: 92%|█████████▏| 11441/12384 [24:16:41<2:00:52, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.43s]
Epoch 1: 92%|█████████▏| 11441/12384 [24:16:49<2:00:52, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 92%|█████████▏| 11442/12384 [24:16:49<2:00:22, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 92%|█████████▏| 11442/12384 [24:16:56<2:00:22, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 1: 92%|█████████▏| 11443/12384 [24:16:56<2:00:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 1: 92%|█████████▏| 11443/12384 [24:17:04<2:00:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 92%|█████████▏| 11444/12384 [24:17:04<1:59:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 92%|█████████▏| 11444/12384 [24:17:12<1:59:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 92%|█████████▏| 11445/12384 [24:17:12<1:59:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 92%|█████████▏| 11445/12384 [24:17:19<1:59:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 1: 92%|█████████▏| 11446/12384 [24:17:19<1:59:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 1: 92%|█████████▏| 11446/12384 [24:17:27<1:59:40, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=9.21s]
Epoch 1: 92%|█████████▏| 11447/12384 [24:17:27<1:59:29, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=9.21s]
Epoch 1: 92%|█████████▏| 11447/12384 [24:17:35<1:59:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 1: 92%|█████████▏| 11448/12384 [24:17:35<1:59:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 1: 92%|█████████▏| 11448/12384 [24:17:42<1:59:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 92%|█████████▏| 11449/12384 [24:17:42<1:58:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 92%|█████████▏| 11449/12384 [24:17:50<1:58:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 1: 92%|█████████▏| 11450/12384 [24:17:50<1:59:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 1: 92%|█████████▏| 11450/12384 [24:17:58<1:59:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.94s]
Epoch 1: 92%|█████████▏| 11451/12384 [24:17:58<1:58:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.94s]
Epoch 1: 92%|█████████▏| 11451/12384 [24:18:05<1:58:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 92%|█████████▏| 11452/12384 [24:18:05<1:58:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 92%|█████████▏| 11452/12384 [24:18:13<1:58:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 1: 92%|█████████▏| 11453/12384 [24:18:13<1:58:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 1: 92%|█████████▏| 11453/12384 [24:18:20<1:58:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 92%|█████████▏| 11454/12384 [24:18:20<1:58:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 1: 92%|█████████▏| 11454/12384 [24:18:28<1:58:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.75s]
Epoch 1: 92%|█████████▏| 11455/12384 [24:18:28<1:57:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.75s]
Epoch 1: 92%|█████████▏| 11455/12384 [24:18:36<1:57:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 1: 93%|█████████▎| 11456/12384 [24:18:36<1:57:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 1: 93%|█████████▎| 11456/12384 [24:18:43<1:57:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.60s]
Epoch 1: 93%|█████████▎| 11457/12384 [24:18:43<1:57:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.60s]
Epoch 1: 93%|█████████▎| 11457/12384 [24:18:51<1:57:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 1: 93%|█████████▎| 11458/12384 [24:18:51<1:57:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 1: 93%|█████████▎| 11458/12384 [24:18:58<1:57:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 93%|█████████▎| 11459/12384 [24:18:58<1:57:14, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 93%|█████████▎| 11459/12384 [24:19:06<1:57:14, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 93%|█████████▎| 11460/12384 [24:19:06<1:57:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 93%|█████████▎| 11460/12384 [24:19:14<1:57:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 1: 93%|█████████▎| 11461/12384 [24:19:14<1:57:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 1: 93%|█████████▎| 11461/12384 [24:19:21<1:57:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.35s]
Epoch 1: 93%|█████████▎| 11462/12384 [24:19:21<1:56:50, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.35s]
Epoch 1: 93%|█████████▎| 11462/12384 [24:19:29<1:56:50, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 93%|█████████▎| 11463/12384 [24:19:29<1:56:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 93%|█████████▎| 11463/12384 [24:19:37<1:56:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 93%|█████████▎| 11464/12384 [24:19:37<1:56:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 93%|█████████▎| 11464/12384 [24:19:44<1:56:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 93%|█████████▎| 11465/12384 [24:19:44<1:56:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 93%|█████████▎| 11465/12384 [24:19:52<1:56:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.35s]
Epoch 1: 93%|█████████▎| 11466/12384 [24:19:52<1:58:02, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.35s]
Epoch 1: 93%|█████████▎| 11466/12384 [24:20:00<1:58:02, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 93%|█████████▎| 11467/12384 [24:20:00<1:57:24, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 93%|█████████▎| 11467/12384 [24:20:07<1:57:24, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 1: 93%|█████████▎| 11468/12384 [24:20:07<1:56:56, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 1: 93%|█████████▎| 11468/12384 [24:20:15<1:56:56, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 1: 93%|█████████▎| 11469/12384 [24:20:15<1:56:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 1: 93%|█████████▎| 11469/12384 [24:20:23<1:56:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 1: 93%|█████████▎| 11470/12384 [24:20:23<1:56:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 1: 93%|█████████▎| 11470/12384 [24:20:30<1:56:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 93%|█████████▎| 11471/12384 [24:20:30<1:56:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 93%|█████████▎| 11471/12384 [24:20:38<1:56:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 93%|█████████▎| 11472/12384 [24:20:38<1:56:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 93%|█████████▎| 11472/12384 [24:20:45<1:56:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.04s]
Epoch 1: 93%|█████████▎| 11473/12384 [24:20:45<1:55:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.04s]
Epoch 1: 93%|█████████▎| 11473/12384 [24:20:53<1:55:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.96s]
Epoch 1: 93%|█████████▎| 11474/12384 [24:20:53<1:55:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.96s]
Epoch 1: 93%|█████████▎| 11474/12384 [24:21:01<1:55:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.64s]
Epoch 1: 93%|█████████▎| 11475/12384 [24:21:01<1:55:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.64s]
Epoch 1: 93%|█████████▎| 11475/12384 [24:21:08<1:55:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.46s]
Epoch 1: 93%|█████████▎| 11476/12384 [24:21:08<1:55:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.46s]
Epoch 1: 93%|█████████▎| 11476/12384 [24:21:16<1:55:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 93%|█████████▎| 11477/12384 [24:21:16<1:55:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 93%|█████████▎| 11477/12384 [24:21:23<1:55:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 93%|█████████▎| 11478/12384 [24:21:23<1:54:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 93%|█████████▎| 11478/12384 [24:21:31<1:54:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 1: 93%|█████████▎| 11479/12384 [24:21:31<1:55:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 1: 93%|█████████▎| 11479/12384 [24:21:39<1:55:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.03s]
Epoch 1: 93%|█████████▎| 11480/12384 [24:21:39<1:54:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.03s]
Epoch 1: 93%|█████████▎| 11480/12384 [24:21:46<1:54:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 1: 93%|█████████▎| 11481/12384 [24:21:46<1:54:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 1: 93%|█████████▎| 11481/12384 [24:21:54<1:54:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.75s]
Epoch 1: 93%|█████████▎| 11482/12384 [24:21:54<1:54:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.75s]
Epoch 1: 93%|█████████▎| 11482/12384 [24:22:02<1:54:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 1: 93%|█████████▎| 11483/12384 [24:22:02<1:54:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 1: 93%|█████████▎| 11483/12384 [24:22:09<1:54:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 1: 93%|█████████▎| 11484/12384 [24:22:09<1:54:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 1: 93%|█████████▎| 11484/12384 [24:22:17<1:54:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.22s]
Epoch 1: 93%|█████████▎| 11485/12384 [24:22:17<1:54:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.22s]
Epoch 1: 93%|█████████▎| 11485/12384 [24:22:24<1:54:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 1: 93%|█████████▎| 11486/12384 [24:22:24<1:54:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 1: 93%|█████████▎| 11486/12384 [24:22:32<1:54:06, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=5.24s]
Epoch 1: 93%|█████████▎| 11487/12384 [24:22:32<1:54:21, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=5.24s]
Epoch 1: 93%|█████████▎| 11487/12384 [24:22:40<1:54:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 1: 93%|█████████▎| 11488/12384 [24:22:40<1:55:15, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 1: 93%|█████████▎| 11488/12384 [24:22:48<1:55:15, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 93%|█████████▎| 11489/12384 [24:22:48<1:55:03, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 93%|█████████▎| 11489/12384 [24:22:55<1:55:03, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 93%|█████████▎| 11490/12384 [24:22:55<1:54:27, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 93%|█████████▎| 11490/12384 [24:23:03<1:54:27, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 1: 93%|█████████▎| 11491/12384 [24:23:03<1:54:16, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 1: 93%|█████████▎| 11491/12384 [24:23:11<1:54:16, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 93%|█████████▎| 11492/12384 [24:23:11<1:53:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 93%|█████████▎| 11492/12384 [24:23:19<1:53:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 93%|█████████▎| 11493/12384 [24:23:19<1:54:51, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 93%|█████████▎| 11493/12384 [24:23:26<1:54:51, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 93%|█████████▎| 11494/12384 [24:23:26<1:54:05, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 93%|█████████▎| 11494/12384 [24:23:34<1:54:05, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 1: 93%|█████████▎| 11495/12384 [24:23:34<1:53:49, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 1: 93%|█████████▎| 11495/12384 [24:23:41<1:53:49, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.86s]
Epoch 1: 93%|█████████▎| 11496/12384 [24:23:41<1:53:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.86s]
Epoch 1: 93%|█████████▎| 11496/12384 [24:23:49<1:53:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 1: 93%|█████████▎| 11497/12384 [24:23:49<1:53:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 1: 93%|█████████▎| 11497/12384 [24:23:57<1:53:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 1: 93%|█████████▎| 11498/12384 [24:23:57<1:52:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 1: 93%|█████████▎| 11498/12384 [24:24:04<1:52:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.61s]
Epoch 1: 93%|█████████▎| 11499/12384 [24:24:04<1:52:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.61s]
Epoch 1: 93%|█████████▎| 11499/12384 [24:24:12<1:52:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 1: 93%|█████████▎| 11500/12384 [24:24:12<1:52:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 1: 93%|█████████▎| 11500/12384 [24:24:20<1:52:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 93%|█████████▎| 11501/12384 [24:24:20<1:52:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 93%|█████████▎| 11501/12384 [24:24:27<1:52:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 93%|█████████▎| 11502/12384 [24:24:27<1:52:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 93%|█████████▎| 11502/12384 [24:24:35<1:52:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 1: 93%|█████████▎| 11503/12384 [24:24:35<1:51:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 1: 93%|█████████▎| 11503/12384 [24:24:42<1:51:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 1: 93%|█████████▎| 11504/12384 [24:24:42<1:51:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 1: 93%|█████████▎| 11504/12384 [24:24:50<1:51:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 93%|█████████▎| 11505/12384 [24:24:50<1:51:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 93%|█████████▎| 11505/12384 [24:24:58<1:51:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 93%|█████████▎| 11506/12384 [24:24:58<1:51:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 93%|█████████▎| 11506/12384 [24:25:05<1:51:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 93%|█████████▎| 11507/12384 [24:25:05<1:51:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 93%|█████████▎| 11507/12384 [24:25:13<1:51:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 1: 93%|█████████▎| 11508/12384 [24:25:13<1:51:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 1: 93%|█████████▎| 11508/12384 [24:25:20<1:51:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.69s]
Epoch 1: 93%|█████████▎| 11509/12384 [24:25:20<1:50:53, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.69s]
Epoch 1: 93%|█████████▎| 11509/12384 [24:25:28<1:50:53, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 93%|█████████▎| 11510/12384 [24:25:28<1:50:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 93%|█████████▎| 11510/12384 [24:25:36<1:50:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 93%|█████████▎| 11511/12384 [24:25:36<1:50:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 93%|█████████▎| 11511/12384 [24:25:43<1:50:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 93%|█████████▎| 11512/12384 [24:25:43<1:50:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 93%|█████████▎| 11512/12384 [24:25:51<1:50:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 93%|█████████▎| 11513/12384 [24:25:51<1:50:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 93%|█████████▎| 11513/12384 [24:25:59<1:50:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 93%|█████████▎| 11514/12384 [24:25:59<1:51:31, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 93%|█████████▎| 11514/12384 [24:26:06<1:51:31, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 93%|█████████▎| 11515/12384 [24:26:06<1:51:17, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 93%|█████████▎| 11515/12384 [24:26:14<1:51:17, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 1: 93%|█████████▎| 11516/12384 [24:26:14<1:50:55, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 1: 93%|█████████▎| 11516/12384 [24:26:22<1:50:55, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 93%|█████████▎| 11517/12384 [24:26:22<1:50:58, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 93%|█████████▎| 11517/12384 [24:26:29<1:50:58, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 93%|█████████▎| 11518/12384 [24:26:29<1:50:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 93%|█████████▎| 11518/12384 [24:26:37<1:50:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 1: 93%|█████████▎| 11519/12384 [24:26:37<1:51:33, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 1: 93%|█████████▎| 11519/12384 [24:26:45<1:51:33, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=9.01s]
Epoch 1: 93%|█████████▎| 11520/12384 [24:26:45<1:50:47, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.01s]
Epoch 1: 93%|█████████▎| 11520/12384 [24:26:53<1:50:47, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.40s]
Epoch 1: 93%|█████████▎| 11521/12384 [24:26:53<1:50:17, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.40s]
Epoch 1: 93%|█████████▎| 11521/12384 [24:27:00<1:50:17, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.24s]
Epoch 1: 93%|█████████▎| 11522/12384 [24:27:00<1:49:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.24s]
Epoch 1: 93%|█████████▎| 11522/12384 [24:27:08<1:49:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 1: 93%|█████████▎| 11523/12384 [24:27:08<1:49:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 1: 93%|█████████▎| 11523/12384 [24:27:15<1:49:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 93%|█████████▎| 11524/12384 [24:27:15<1:49:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 93%|█████████▎| 11524/12384 [24:27:23<1:49:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 1: 93%|█████████▎| 11525/12384 [24:27:23<1:49:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 1: 93%|█████████▎| 11525/12384 [24:27:31<1:49:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.48s]
Epoch 1: 93%|█████████▎| 11526/12384 [24:27:31<1:49:28, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.48s]
Epoch 1: 93%|█████████▎| 11526/12384 [24:27:38<1:49:28, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.43s]
Epoch 1: 93%|█████████▎| 11527/12384 [24:27:38<1:49:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.43s]
Epoch 1: 93%|█████████▎| 11527/12384 [24:27:46<1:49:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.29s]
Epoch 1: 93%|█████████▎| 11528/12384 [24:27:46<1:49:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.29s]
Epoch 1: 93%|█████████▎| 11528/12384 [24:27:53<1:49:03, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=5.49s]
Epoch 1: 93%|█████████▎| 11529/12384 [24:27:53<1:48:36, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.49s]
Epoch 1: 93%|█████████▎| 11529/12384 [24:28:01<1:48:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 1: 93%|█████████▎| 11530/12384 [24:28:01<1:48:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 1: 93%|█████████▎| 11530/12384 [24:28:09<1:48:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 93%|█████████▎| 11531/12384 [24:28:09<1:48:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 93%|█████████▎| 11531/12384 [24:28:16<1:48:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 93%|█████████▎| 11532/12384 [24:28:16<1:48:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 93%|█████████▎| 11532/12384 [24:28:24<1:48:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 93%|█████████▎| 11533/12384 [24:28:24<1:48:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 93%|█████████▎| 11533/12384 [24:28:32<1:48:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 93%|█████████▎| 11534/12384 [24:28:32<1:47:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 93%|█████████▎| 11534/12384 [24:28:39<1:47:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 1: 93%|█████████▎| 11535/12384 [24:28:39<1:48:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 1: 93%|█████████▎| 11535/12384 [24:28:47<1:48:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.55s]
Epoch 1: 93%|█████████▎| 11536/12384 [24:28:47<1:48:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.55s]
Epoch 1: 93%|█████████▎| 11536/12384 [24:28:55<1:48:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 93%|█████████▎| 11537/12384 [24:28:55<1:48:21, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 93%|█████████▎| 11537/12384 [24:29:02<1:48:21, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 1: 93%|█████████▎| 11538/12384 [24:29:02<1:48:06, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 1: 93%|█████████▎| 11538/12384 [24:29:10<1:48:06, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 1: 93%|█████████▎| 11539/12384 [24:29:10<1:48:15, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 1: 93%|█████████▎| 11539/12384 [24:29:18<1:48:15, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 1: 93%|█████████▎| 11540/12384 [24:29:18<1:47:52, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 1: 93%|█████████▎| 11540/12384 [24:29:25<1:47:52, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 1: 93%|█████████▎| 11541/12384 [24:29:25<1:47:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 1: 93%|█████████▎| 11541/12384 [24:29:33<1:47:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 1: 93%|█████████▎| 11542/12384 [24:29:33<1:47:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 1: 93%|█████████▎| 11542/12384 [24:29:41<1:47:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 1: 93%|█████████▎| 11543/12384 [24:29:41<1:46:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 1: 93%|█████████▎| 11543/12384 [24:29:48<1:46:59, 7.63s/it, loss=0.0004, acc=1.0000, iter_time=7.98s]
Epoch 1: 93%|█████████▎| 11544/12384 [24:29:48<1:47:13, 7.66s/it, loss=0.0004, acc=1.0000, iter_time=7.98s]
Epoch 1: 93%|█████████▎| 11544/12384 [24:29:56<1:47:13, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 93%|█████████▎| 11545/12384 [24:29:56<1:48:04, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 93%|█████████▎| 11545/12384 [24:30:04<1:48:04, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 93%|█████████▎| 11546/12384 [24:30:04<1:47:45, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 93%|█████████▎| 11546/12384 [24:30:11<1:47:45, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 93%|█████████▎| 11547/12384 [24:30:11<1:47:07, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 93%|█████████▎| 11547/12384 [24:30:19<1:47:07, 7.68s/it, loss=0.0001, acc=0.9986, iter_time=7.60s]
Epoch 1: 93%|█████████▎| 11548/12384 [24:30:19<1:46:44, 7.66s/it, loss=0.0001, acc=0.9986, iter_time=7.60s]
Epoch 1: 93%|█████████▎| 11548/12384 [24:30:27<1:46:44, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 93%|█████████▎| 11549/12384 [24:30:27<1:46:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 93%|█████████▎| 11549/12384 [24:30:34<1:46:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 93%|█████████▎| 11550/12384 [24:30:34<1:46:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 93%|█████████▎| 11550/12384 [24:30:42<1:46:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 93%|█████████▎| 11551/12384 [24:30:42<1:45:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 93%|█████████▎| 11551/12384 [24:30:50<1:45:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 1: 93%|█████████▎| 11552/12384 [24:30:50<1:46:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 1: 93%|█████████▎| 11552/12384 [24:30:57<1:46:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 1: 93%|█████████▎| 11553/12384 [24:30:57<1:46:14, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 1: 93%|█████████▎| 11553/12384 [24:31:05<1:46:14, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 93%|█████████▎| 11554/12384 [24:31:05<1:46:00, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 93%|█████████▎| 11554/12384 [24:31:13<1:46:00, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 1: 93%|█████████▎| 11555/12384 [24:31:13<1:45:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 1: 93%|█████████▎| 11555/12384 [24:31:20<1:45:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 1: 93%|█████████▎| 11556/12384 [24:31:20<1:45:44, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 1: 93%|█████████▎| 11556/12384 [24:31:28<1:45:44, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.67s]
Epoch 1: 93%|█████████▎| 11557/12384 [24:31:28<1:45:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.67s]
Epoch 1: 93%|█████████▎| 11557/12384 [24:31:35<1:45:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.80s]
Epoch 1: 93%|█████████▎| 11558/12384 [24:31:35<1:45:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.80s]
Epoch 1: 93%|█████████▎| 11558/12384 [24:31:43<1:45:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 93%|█████████▎| 11559/12384 [24:31:43<1:44:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 93%|█████████▎| 11559/12384 [24:31:51<1:44:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 93%|█████████▎| 11560/12384 [24:31:51<1:44:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 93%|█████████▎| 11560/12384 [24:31:58<1:44:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 1: 93%|█████████▎| 11561/12384 [24:31:58<1:44:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 1: 93%|█████████▎| 11561/12384 [24:32:06<1:44:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 1: 93%|█████████▎| 11562/12384 [24:32:06<1:44:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 1: 93%|█████████▎| 11562/12384 [24:32:14<1:44:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.36s]
Epoch 1: 93%|█████████▎| 11563/12384 [24:32:14<1:44:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.36s]
Epoch 1: 93%|█████████▎| 11563/12384 [24:32:21<1:44:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 93%|█████████▎| 11564/12384 [24:32:21<1:44:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 93%|█████████▎| 11564/12384 [24:32:29<1:44:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 1: 93%|█████████▎| 11565/12384 [24:32:29<1:43:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 1: 93%|█████████▎| 11565/12384 [24:32:36<1:43:55, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.58s]
Epoch 1: 93%|█████████▎| 11566/12384 [24:32:36<1:43:59, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=10.58s]
Epoch 1: 93%|█████████▎| 11566/12384 [24:32:44<1:43:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.49s]
Epoch 1: 93%|█████████▎| 11567/12384 [24:32:44<1:43:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.49s]
Epoch 1: 93%|█████████▎| 11567/12384 [24:32:52<1:43:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 1: 93%|█████████▎| 11568/12384 [24:32:52<1:43:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 1: 93%|█████████▎| 11568/12384 [24:32:59<1:43:32, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.09s]
Epoch 1: 93%|█████████▎| 11569/12384 [24:32:59<1:43:40, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=4.09s]
Epoch 1: 93%|█████████▎| 11569/12384 [24:33:07<1:43:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.82s]
Epoch 1: 93%|█████████▎| 11570/12384 [24:33:07<1:43:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.82s]
Epoch 1: 93%|█████████▎| 11570/12384 [24:33:15<1:43:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 1: 93%|█████████▎| 11571/12384 [24:33:15<1:45:00, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 1: 93%|█████████▎| 11571/12384 [24:33:23<1:45:00, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=10.53s]
Epoch 1: 93%|█████████▎| 11572/12384 [24:33:23<1:44:19, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.53s]
Epoch 1: 93%|█████████▎| 11572/12384 [24:33:30<1:44:19, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 93%|█████████▎| 11573/12384 [24:33:30<1:44:02, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 93%|█████████▎| 11573/12384 [24:33:38<1:44:02, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.94s]
Epoch 1: 93%|█████████▎| 11574/12384 [24:33:38<1:43:35, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.94s]
Epoch 1: 93%|█████████▎| 11574/12384 [24:33:45<1:43:35, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.33s]
Epoch 1: 93%|█████████▎| 11575/12384 [24:33:45<1:43:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.33s]
Epoch 1: 93%|█████████▎| 11575/12384 [24:33:53<1:43:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 93%|█████████▎| 11576/12384 [24:33:53<1:42:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 93%|█████████▎| 11576/12384 [24:34:01<1:42:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 93%|█████████▎| 11577/12384 [24:34:01<1:42:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 93%|█████████▎| 11577/12384 [24:34:08<1:42:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.05s]
Epoch 1: 93%|█████████▎| 11578/12384 [24:34:08<1:42:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.05s]
Epoch 1: 93%|█████████▎| 11578/12384 [24:34:16<1:42:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 1: 93%|█████████▎| 11579/12384 [24:34:16<1:42:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 1: 93%|█████████▎| 11579/12384 [24:34:23<1:42:11, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 1: 94%|█████████▎| 11580/12384 [24:34:23<1:42:05, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 1: 94%|█████████▎| 11580/12384 [24:34:31<1:42:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 1: 94%|█████████▎| 11581/12384 [24:34:31<1:42:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 1: 94%|█████████▎| 11581/12384 [24:34:39<1:42:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 1: 94%|█████████▎| 11582/12384 [24:34:39<1:41:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 1: 94%|█████████▎| 11582/12384 [24:34:46<1:41:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 94%|█████████▎| 11583/12384 [24:34:46<1:42:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 94%|█████████▎| 11583/12384 [24:34:54<1:42:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.77s]
Epoch 1: 94%|█████████▎| 11584/12384 [24:34:54<1:41:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.77s]
Epoch 1: 94%|█████████▎| 11584/12384 [24:35:02<1:41:54, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.25s]
Epoch 1: 94%|█████████▎| 11585/12384 [24:35:02<1:41:39, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.25s]
Epoch 1: 94%|█████████▎| 11585/12384 [24:35:09<1:41:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 94%|█████████▎| 11586/12384 [24:35:09<1:41:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 94%|█████████▎| 11586/12384 [24:35:17<1:41:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 1: 94%|█████████▎| 11587/12384 [24:35:17<1:41:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 1: 94%|█████████▎| 11587/12384 [24:35:25<1:41:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 1: 94%|█████████▎| 11588/12384 [24:35:25<1:41:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 1: 94%|█████████▎| 11588/12384 [24:35:32<1:41:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 1: 94%|█████████▎| 11589/12384 [24:35:32<1:40:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 1: 94%|█████████▎| 11589/12384 [24:35:40<1:40:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 94%|█████████▎| 11590/12384 [24:35:40<1:41:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 94%|█████████▎| 11590/12384 [24:35:47<1:41:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 94%|█████████▎| 11591/12384 [24:35:47<1:40:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 94%|█████████▎| 11591/12384 [24:35:55<1:40:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 94%|█████████▎| 11592/12384 [24:35:55<1:40:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 94%|█████████▎| 11592/12384 [24:36:03<1:40:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.19s]
Epoch 1: 94%|█████████▎| 11593/12384 [24:36:03<1:40:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.19s]
Epoch 1: 94%|█████████▎| 11593/12384 [24:36:10<1:40:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 1: 94%|█████████▎| 11594/12384 [24:36:10<1:40:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 1: 94%|█████████▎| 11594/12384 [24:36:18<1:40:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 94%|█████████▎| 11595/12384 [24:36:18<1:40:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 94%|█████████▎| 11595/12384 [24:36:26<1:40:07, 7.61s/it, loss=0.0004, acc=0.9986, iter_time=5.52s]
Epoch 1: 94%|█████████▎| 11596/12384 [24:36:26<1:39:58, 7.61s/it, loss=0.0004, acc=0.9986, iter_time=5.52s]
Epoch 1: 94%|█████████▎| 11596/12384 [24:36:33<1:39:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.78s]
Epoch 1: 94%|█████████▎| 11597/12384 [24:36:33<1:41:06, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.78s]
Epoch 1: 94%|█████████▎| 11597/12384 [24:36:41<1:41:06, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 1: 94%|█████████▎| 11598/12384 [24:36:41<1:40:35, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 1: 94%|█████████▎| 11598/12384 [24:36:49<1:40:35, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 94%|█████████▎| 11599/12384 [24:36:49<1:40:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 94%|█████████▎| 11599/12384 [24:36:56<1:40:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 1: 94%|█████████▎| 11600/12384 [24:36:56<1:39:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 1: 94%|█████████▎| 11600/12384 [24:37:04<1:39:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.72s]
Epoch 1: 94%|█████████▎| 11601/12384 [24:37:04<1:39:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.72s]
Epoch 1: 94%|█████████▎| 11601/12384 [24:37:11<1:39:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.11s]
Epoch 1: 94%|█████████▎| 11602/12384 [24:37:11<1:39:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.11s]
Epoch 1: 94%|█████████▎| 11602/12384 [24:37:19<1:39:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 94%|█████████▎| 11603/12384 [24:37:19<1:39:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 94%|█████████▎| 11603/12384 [24:37:27<1:39:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 1: 94%|█████████▎| 11604/12384 [24:37:27<1:39:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 1: 94%|█████████▎| 11604/12384 [24:37:34<1:39:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 1: 94%|█████████▎| 11605/12384 [24:37:34<1:38:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 1: 94%|█████████▎| 11605/12384 [24:37:42<1:38:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.29s]
Epoch 1: 94%|█████████▎| 11606/12384 [24:37:42<1:38:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.29s]
Epoch 1: 94%|█████████▎| 11606/12384 [24:37:50<1:38:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.86s]
Epoch 1: 94%|█████████▎| 11607/12384 [24:37:50<1:38:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.86s]
Epoch 1: 94%|█████████▎| 11607/12384 [24:37:57<1:38:37, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=7.57s]
Epoch 1: 94%|█████████▎| 11608/12384 [24:37:57<1:38:25, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=7.57s]
Epoch 1: 94%|█████████▎| 11608/12384 [24:38:05<1:38:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 1: 94%|█████████▎| 11609/12384 [24:38:05<1:38:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 1: 94%|█████████▎| 11609/12384 [24:38:12<1:38:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 1: 94%|█████████▍| 11610/12384 [24:38:12<1:38:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 1: 94%|█████████▍| 11610/12384 [24:38:20<1:38:03, 7.60s/it, loss=0.0008, acc=0.9981, iter_time=7.61s]
Epoch 1: 94%|█████████▍| 11611/12384 [24:38:20<1:37:59, 7.61s/it, loss=0.0008, acc=0.9981, iter_time=7.61s]
Epoch 1: 94%|█████████▍| 11611/12384 [24:38:28<1:37:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 94%|█████████▍| 11612/12384 [24:38:28<1:37:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 94%|█████████▍| 11612/12384 [24:38:35<1:37:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 94%|█████████▍| 11613/12384 [24:38:35<1:37:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 94%|█████████▍| 11613/12384 [24:38:43<1:37:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 1: 94%|█████████▍| 11614/12384 [24:38:43<1:37:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 1: 94%|█████████▍| 11614/12384 [24:38:50<1:37:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.74s]
Epoch 1: 94%|█████████▍| 11615/12384 [24:38:50<1:37:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.74s]
Epoch 1: 94%|█████████▍| 11615/12384 [24:38:58<1:37:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.79s]
Epoch 1: 94%|█████████▍| 11616/12384 [24:38:58<1:38:07, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.79s]
Epoch 1: 94%|█████████▍| 11616/12384 [24:39:06<1:38:07, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.41s]
Epoch 1: 94%|█████████▍| 11617/12384 [24:39:06<1:37:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.41s]
Epoch 1: 94%|█████████▍| 11617/12384 [24:39:13<1:37:50, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=4.56s]
Epoch 1: 94%|█████████▍| 11618/12384 [24:39:13<1:37:30, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=4.56s]
Epoch 1: 94%|█████████▍| 11618/12384 [24:39:21<1:37:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 1: 94%|█████████▍| 11619/12384 [24:39:21<1:37:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 1: 94%|█████████▍| 11619/12384 [24:39:29<1:37:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.12s]
Epoch 1: 94%|█████████▍| 11620/12384 [24:39:29<1:37:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.12s]
Epoch 1: 94%|█████████▍| 11620/12384 [24:39:36<1:37:03, 7.62s/it, loss=0.0014, acc=0.9968, iter_time=10.10s]
Epoch 1: 94%|█████████▍| 11621/12384 [24:39:36<1:36:48, 7.61s/it, loss=0.0014, acc=0.9968, iter_time=10.10s]
Epoch 1: 94%|█████████▍| 11621/12384 [24:39:44<1:36:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 94%|█████████▍| 11622/12384 [24:39:44<1:36:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 94%|█████████▍| 11622/12384 [24:39:51<1:36:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 94%|█████████▍| 11623/12384 [24:39:51<1:36:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 94%|█████████▍| 11623/12384 [24:39:59<1:36:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 1: 94%|█████████▍| 11624/12384 [24:39:59<1:37:44, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 1: 94%|█████████▍| 11624/12384 [24:40:07<1:37:44, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.47s]
Epoch 1: 94%|█████████▍| 11625/12384 [24:40:07<1:37:06, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.47s]
Epoch 1: 94%|█████████▍| 11625/12384 [24:40:15<1:37:06, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 1: 94%|█████████▍| 11626/12384 [24:40:15<1:36:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 1: 94%|█████████▍| 11626/12384 [24:40:22<1:36:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.00s]
Epoch 1: 94%|█████████▍| 11627/12384 [24:40:22<1:36:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.00s]
Epoch 1: 94%|█████████▍| 11627/12384 [24:40:30<1:36:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 1: 94%|█████████▍| 11628/12384 [24:40:30<1:36:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 1: 94%|█████████▍| 11628/12384 [24:40:37<1:36:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 1: 94%|█████████▍| 11629/12384 [24:40:37<1:36:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 1: 94%|█████████▍| 11629/12384 [24:40:45<1:36:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 94%|█████████▍| 11630/12384 [24:40:45<1:36:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 94%|█████████▍| 11630/12384 [24:40:53<1:36:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.11s]
Epoch 1: 94%|█████████▍| 11631/12384 [24:40:53<1:36:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.11s]
Epoch 1: 94%|█████████▍| 11631/12384 [24:41:00<1:36:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 1: 94%|█████████▍| 11632/12384 [24:41:00<1:35:58, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 1: 94%|█████████▍| 11632/12384 [24:41:08<1:35:58, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.14s]
Epoch 1: 94%|█████████▍| 11633/12384 [24:41:08<1:35:59, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.14s]
Epoch 1: 94%|█████████▍| 11633/12384 [24:41:16<1:35:59, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.84s]
Epoch 1: 94%|█████████▍| 11634/12384 [24:41:16<1:35:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.84s]
Epoch 1: 94%|█████████▍| 11634/12384 [24:41:23<1:35:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 94%|█████████▍| 11635/12384 [24:41:23<1:35:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 94%|█████████▍| 11635/12384 [24:41:31<1:35:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 94%|█████████▍| 11636/12384 [24:41:31<1:35:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 94%|█████████▍| 11636/12384 [24:41:39<1:35:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 94%|█████████▍| 11637/12384 [24:41:39<1:34:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 94%|█████████▍| 11637/12384 [24:41:46<1:34:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 1: 94%|█████████▍| 11638/12384 [24:41:46<1:34:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 1: 94%|█████████▍| 11638/12384 [24:41:54<1:34:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.95s]
Epoch 1: 94%|█████████▍| 11639/12384 [24:41:54<1:34:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.95s]
Epoch 1: 94%|█████████▍| 11639/12384 [24:42:01<1:34:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 94%|█████████▍| 11640/12384 [24:42:01<1:34:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 94%|█████████▍| 11640/12384 [24:42:09<1:34:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 94%|█████████▍| 11641/12384 [24:42:09<1:34:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 94%|█████████▍| 11641/12384 [24:42:17<1:34:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 94%|█████████▍| 11642/12384 [24:42:17<1:34:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 94%|█████████▍| 11642/12384 [24:42:24<1:34:00, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=4.31s]
Epoch 1: 94%|█████████▍| 11643/12384 [24:42:24<1:33:58, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.31s]
Epoch 1: 94%|█████████▍| 11643/12384 [24:42:32<1:33:58, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.92s]
Epoch 1: 94%|█████████▍| 11644/12384 [24:42:32<1:33:47, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=10.92s]
Epoch 1: 94%|█████████▍| 11644/12384 [24:42:39<1:33:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 1: 94%|█████████▍| 11645/12384 [24:42:39<1:33:39, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 1: 94%|█████████▍| 11645/12384 [24:42:47<1:33:39, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.72s]
Epoch 1: 94%|█████████▍| 11646/12384 [24:42:47<1:34:40, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.72s]
Epoch 1: 94%|█████████▍| 11646/12384 [24:42:55<1:34:40, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.24s]
Epoch 1: 94%|█████████▍| 11647/12384 [24:42:55<1:34:16, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.24s]
Epoch 1: 94%|█████████▍| 11647/12384 [24:43:03<1:34:16, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=11.38s]
Epoch 1: 94%|█████████▍| 11648/12384 [24:43:03<1:34:19, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=11.38s]
Epoch 1: 94%|█████████▍| 11648/12384 [24:43:10<1:34:19, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.26s]
Epoch 1: 94%|█████████▍| 11649/12384 [24:43:10<1:33:55, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.26s]
Epoch 1: 94%|█████████▍| 11649/12384 [24:43:18<1:33:55, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 1: 94%|█████████▍| 11650/12384 [24:43:18<1:34:48, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 1: 94%|█████████▍| 11650/12384 [24:43:26<1:34:48, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 1: 94%|█████████▍| 11651/12384 [24:43:26<1:34:12, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 1: 94%|█████████▍| 11651/12384 [24:43:33<1:34:12, 7.71s/it, loss=0.0024, acc=0.9981, iter_time=10.67s]
Epoch 1: 94%|█████████▍| 11652/12384 [24:43:33<1:33:41, 7.68s/it, loss=0.0024, acc=0.9981, iter_time=10.67s]
Epoch 1: 94%|█████████▍| 11652/12384 [24:43:41<1:33:41, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 94%|█████████▍| 11653/12384 [24:43:41<1:33:15, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 94%|█████████▍| 11653/12384 [24:43:49<1:33:15, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 1: 94%|█████████▍| 11654/12384 [24:43:49<1:32:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 1: 94%|█████████▍| 11654/12384 [24:43:56<1:32:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 1: 94%|█████████▍| 11655/12384 [24:43:56<1:32:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 1: 94%|█████████▍| 11655/12384 [24:44:04<1:32:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 1: 94%|█████████▍| 11656/12384 [24:44:04<1:32:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 1: 94%|█████████▍| 11656/12384 [24:44:12<1:32:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.13s]
Epoch 1: 94%|█████████▍| 11657/12384 [24:44:12<1:32:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.13s]
Epoch 1: 94%|█████████▍| 11657/12384 [24:44:19<1:32:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 1: 94%|█████████▍| 11658/12384 [24:44:19<1:32:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 1: 94%|█████████▍| 11658/12384 [24:44:27<1:32:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.58s]
Epoch 1: 94%|█████████▍| 11659/12384 [24:44:27<1:32:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.58s]
Epoch 1: 94%|█████████▍| 11659/12384 [24:44:34<1:32:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 1: 94%|█████████▍| 11660/12384 [24:44:34<1:31:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 1: 94%|█████████▍| 11660/12384 [24:44:42<1:31:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 94%|█████████▍| 11661/12384 [24:44:42<1:31:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 94%|█████████▍| 11661/12384 [24:44:50<1:31:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 94%|█████████▍| 11662/12384 [24:44:50<1:31:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 94%|█████████▍| 11662/12384 [24:44:57<1:31:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 1: 94%|█████████▍| 11663/12384 [24:44:57<1:31:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 1: 94%|█████████▍| 11663/12384 [24:45:05<1:31:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 1: 94%|█████████▍| 11664/12384 [24:45:05<1:31:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 1: 94%|█████████▍| 11664/12384 [24:45:12<1:31:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 1: 94%|█████████▍| 11665/12384 [24:45:12<1:31:04, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 1: 94%|█████████▍| 11665/12384 [24:45:20<1:31:04, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 94%|█████████▍| 11666/12384 [24:45:20<1:31:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 94%|█████████▍| 11666/12384 [24:45:28<1:31:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.71s]
Epoch 1: 94%|█████████▍| 11667/12384 [24:45:28<1:31:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.71s]
Epoch 1: 94%|█████████▍| 11667/12384 [24:45:35<1:31:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 1: 94%|█████████▍| 11668/12384 [24:45:35<1:30:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 1: 94%|█████████▍| 11668/12384 [24:45:43<1:30:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 94%|█████████▍| 11669/12384 [24:45:43<1:30:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 94%|█████████▍| 11669/12384 [24:45:50<1:30:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 94%|█████████▍| 11670/12384 [24:45:50<1:30:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 94%|█████████▍| 11670/12384 [24:45:58<1:30:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 94%|█████████▍| 11671/12384 [24:45:58<1:30:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 94%|█████████▍| 11671/12384 [24:46:06<1:30:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 94%|█████████▍| 11672/12384 [24:46:06<1:30:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 94%|█████████▍| 11672/12384 [24:46:14<1:30:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 1: 94%|█████████▍| 11673/12384 [24:46:14<1:31:11, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 1: 94%|█████████▍| 11673/12384 [24:46:21<1:31:11, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 1: 94%|█████████▍| 11674/12384 [24:46:21<1:30:45, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 1: 94%|█████████▍| 11674/12384 [24:46:29<1:30:45, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.71s]
Epoch 1: 94%|█████████▍| 11675/12384 [24:46:29<1:30:25, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.71s]
Epoch 1: 94%|█████████▍| 11675/12384 [24:46:36<1:30:25, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 1: 94%|█████████▍| 11676/12384 [24:46:36<1:30:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 1: 94%|█████████▍| 11676/12384 [24:46:44<1:30:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 94%|█████████▍| 11677/12384 [24:46:44<1:31:01, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 94%|█████████▍| 11677/12384 [24:46:52<1:31:01, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 94%|█████████▍| 11678/12384 [24:46:52<1:30:29, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 94%|█████████▍| 11678/12384 [24:47:00<1:30:29, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 94%|█████████▍| 11679/12384 [24:47:00<1:30:00, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 94%|█████████▍| 11679/12384 [24:47:07<1:30:00, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 94%|█████████▍| 11680/12384 [24:47:07<1:29:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 94%|█████████▍| 11680/12384 [24:47:15<1:29:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 94%|█████████▍| 11681/12384 [24:47:15<1:29:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 94%|█████████▍| 11681/12384 [24:47:22<1:29:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 94%|█████████▍| 11682/12384 [24:47:22<1:29:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 94%|█████████▍| 11682/12384 [24:47:30<1:29:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 1: 94%|█████████▍| 11683/12384 [24:47:30<1:29:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 1: 94%|█████████▍| 11683/12384 [24:47:38<1:29:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 1: 94%|█████████▍| 11684/12384 [24:47:38<1:28:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 1: 94%|█████████▍| 11684/12384 [24:47:45<1:28:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 1: 94%|█████████▍| 11685/12384 [24:47:45<1:28:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 1: 94%|█████████▍| 11685/12384 [24:47:53<1:28:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 1: 94%|█████████▍| 11686/12384 [24:47:53<1:28:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 1: 94%|█████████▍| 11686/12384 [24:48:00<1:28:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 1: 94%|█████████▍| 11687/12384 [24:48:00<1:28:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 1: 94%|█████████▍| 11687/12384 [24:48:08<1:28:39, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=11.38s]
Epoch 1: 94%|█████████▍| 11688/12384 [24:48:08<1:28:44, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=11.38s]
Epoch 1: 94%|█████████▍| 11688/12384 [24:48:16<1:28:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.92s]
Epoch 1: 94%|█████████▍| 11689/12384 [24:48:16<1:28:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.92s]
Epoch 1: 94%|█████████▍| 11689/12384 [24:48:23<1:28:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 94%|█████████▍| 11690/12384 [24:48:23<1:28:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 94%|█████████▍| 11690/12384 [24:48:31<1:28:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 1: 94%|█████████▍| 11691/12384 [24:48:31<1:27:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 1: 94%|█████████▍| 11691/12384 [24:48:39<1:27:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 1: 94%|█████████▍| 11692/12384 [24:48:39<1:27:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 1: 94%|█████████▍| 11692/12384 [24:48:46<1:27:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 94%|█████████▍| 11693/12384 [24:48:46<1:27:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 94%|█████████▍| 11693/12384 [24:48:54<1:27:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 94%|█████████▍| 11694/12384 [24:48:54<1:27:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 94%|█████████▍| 11694/12384 [24:49:01<1:27:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 94%|█████████▍| 11695/12384 [24:49:01<1:27:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 94%|█████████▍| 11695/12384 [24:49:09<1:27:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 94%|█████████▍| 11696/12384 [24:49:09<1:27:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 94%|█████████▍| 11696/12384 [24:49:17<1:27:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 94%|█████████▍| 11697/12384 [24:49:17<1:27:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 94%|█████████▍| 11697/12384 [24:49:24<1:27:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 94%|█████████▍| 11698/12384 [24:49:24<1:27:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 94%|█████████▍| 11698/12384 [24:49:32<1:27:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 1: 94%|█████████▍| 11699/12384 [24:49:32<1:26:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 1: 94%|█████████▍| 11699/12384 [24:49:39<1:26:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 1: 94%|█████████▍| 11700/12384 [24:49:39<1:26:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 1: 94%|█████████▍| 11700/12384 [24:49:47<1:26:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 94%|█████████▍| 11701/12384 [24:49:47<1:27:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 94%|█████████▍| 11701/12384 [24:49:55<1:27:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 94%|█████████▍| 11702/12384 [24:49:55<1:26:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 94%|█████████▍| 11702/12384 [24:50:03<1:26:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.39s]
Epoch 1: 95%|█████████▍| 11703/12384 [24:50:03<1:27:46, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=4.39s]
Epoch 1: 95%|█████████▍| 11703/12384 [24:50:10<1:27:46, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=11.60s]
Epoch 1: 95%|█████████▍| 11704/12384 [24:50:10<1:27:32, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=11.60s]
Epoch 1: 95%|█████████▍| 11704/12384 [24:50:18<1:27:32, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 95%|█████████▍| 11705/12384 [24:50:18<1:27:05, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 95%|█████████▍| 11705/12384 [24:50:26<1:27:05, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 1: 95%|█████████▍| 11706/12384 [24:50:26<1:26:46, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 1: 95%|█████████▍| 11706/12384 [24:50:33<1:26:46, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.25s]
Epoch 1: 95%|█████████▍| 11707/12384 [24:50:33<1:26:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.25s]
Epoch 1: 95%|█████████▍| 11707/12384 [24:50:41<1:26:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 1: 95%|█████████▍| 11708/12384 [24:50:41<1:26:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 1: 95%|█████████▍| 11708/12384 [24:50:49<1:26:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 1: 95%|█████████▍| 11709/12384 [24:50:49<1:25:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 1: 95%|█████████▍| 11709/12384 [24:50:56<1:25:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 95%|█████████▍| 11710/12384 [24:50:56<1:25:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 95%|█████████▍| 11710/12384 [24:51:04<1:25:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 95%|█████████▍| 11711/12384 [24:51:04<1:25:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 95%|█████████▍| 11711/12384 [24:51:12<1:25:43, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=8.06s]
Epoch 1: 95%|█████████▍| 11712/12384 [24:51:12<1:25:33, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=8.06s]
Epoch 1: 95%|█████████▍| 11712/12384 [24:51:19<1:25:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.04s]
Epoch 1: 95%|█████████▍| 11713/12384 [24:51:19<1:25:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.04s]
Epoch 1: 95%|█████████▍| 11713/12384 [24:51:27<1:25:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 95%|█████████▍| 11714/12384 [24:51:27<1:25:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 1: 95%|█████████▍| 11714/12384 [24:51:34<1:25:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 1: 95%|█████████▍| 11715/12384 [24:51:34<1:24:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 1: 95%|█████████▍| 11715/12384 [24:51:42<1:24:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.77s]
Epoch 1: 95%|█████████▍| 11716/12384 [24:51:42<1:24:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.77s]
Epoch 1: 95%|█████████▍| 11716/12384 [24:51:50<1:24:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.92s]
Epoch 1: 95%|█████████▍| 11717/12384 [24:51:50<1:24:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.92s]
Epoch 1: 95%|█████████▍| 11717/12384 [24:51:57<1:24:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.90s]
Epoch 1: 95%|█████████▍| 11718/12384 [24:51:57<1:24:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.90s]
Epoch 1: 95%|█████████▍| 11718/12384 [24:52:05<1:24:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 95%|█████████▍| 11719/12384 [24:52:05<1:24:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 95%|█████████▍| 11719/12384 [24:52:13<1:24:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 95%|█████████▍| 11720/12384 [24:52:13<1:24:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 95%|█████████▍| 11720/12384 [24:52:20<1:24:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 1: 95%|█████████▍| 11721/12384 [24:52:20<1:24:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 1: 95%|█████████▍| 11721/12384 [24:52:28<1:24:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 1: 95%|█████████▍| 11722/12384 [24:52:28<1:24:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 1: 95%|█████████▍| 11722/12384 [24:52:35<1:24:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 1: 95%|█████████▍| 11723/12384 [24:52:35<1:23:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 1: 95%|█████████▍| 11723/12384 [24:52:43<1:23:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 95%|█████████▍| 11724/12384 [24:52:43<1:23:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 95%|█████████▍| 11724/12384 [24:52:51<1:23:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 95%|█████████▍| 11725/12384 [24:52:51<1:23:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 1: 95%|█████████▍| 11725/12384 [24:52:58<1:23:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.46s]
Epoch 1: 95%|█████████▍| 11726/12384 [24:52:58<1:23:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.46s]
Epoch 1: 95%|█████████▍| 11726/12384 [24:53:06<1:23:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.12s]
Epoch 1: 95%|█████████▍| 11727/12384 [24:53:06<1:23:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.12s]
Epoch 1: 95%|█████████▍| 11727/12384 [24:53:13<1:23:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.30s]
Epoch 1: 95%|█████████▍| 11728/12384 [24:53:13<1:23:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.30s]
Epoch 1: 95%|█████████▍| 11728/12384 [24:53:21<1:23:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 95%|█████████▍| 11729/12384 [24:53:21<1:24:08, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 95%|█████████▍| 11729/12384 [24:53:29<1:24:08, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 1: 95%|█████████▍| 11730/12384 [24:53:29<1:23:57, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 1: 95%|█████████▍| 11730/12384 [24:53:37<1:23:57, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.46s]
Epoch 1: 95%|█████████▍| 11731/12384 [24:53:37<1:23:40, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.46s]
Epoch 1: 95%|█████████▍| 11731/12384 [24:53:44<1:23:40, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 95%|█████████▍| 11732/12384 [24:53:44<1:23:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 95%|█████████▍| 11732/12384 [24:53:52<1:23:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 95%|█████████▍| 11733/12384 [24:53:52<1:22:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 95%|█████████▍| 11733/12384 [24:54:00<1:22:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 95%|█████████▍| 11734/12384 [24:54:00<1:22:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 95%|█████████▍| 11734/12384 [24:54:07<1:22:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 95%|█████████▍| 11735/12384 [24:54:07<1:22:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 95%|█████████▍| 11735/12384 [24:54:15<1:22:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 95%|█████████▍| 11736/12384 [24:54:15<1:22:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 95%|█████████▍| 11736/12384 [24:54:22<1:22:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 95%|█████████▍| 11737/12384 [24:54:22<1:22:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 95%|█████████▍| 11737/12384 [24:54:30<1:22:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 95%|█████████▍| 11738/12384 [24:54:30<1:22:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 95%|█████████▍| 11738/12384 [24:54:38<1:22:06, 7.63s/it, loss=0.0002, acc=0.9987, iter_time=7.61s]
Epoch 1: 95%|█████████▍| 11739/12384 [24:54:38<1:21:56, 7.62s/it, loss=0.0002, acc=0.9987, iter_time=7.61s]
Epoch 1: 95%|█████████▍| 11739/12384 [24:54:45<1:21:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 95%|█████████▍| 11740/12384 [24:54:45<1:21:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 95%|█████████▍| 11740/12384 [24:54:53<1:21:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 95%|█████████▍| 11741/12384 [24:54:53<1:21:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 1: 95%|█████████▍| 11741/12384 [24:55:00<1:21:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 95%|█████████▍| 11742/12384 [24:55:00<1:21:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 95%|█████████▍| 11742/12384 [24:55:08<1:21:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 95%|█████████▍| 11743/12384 [24:55:08<1:21:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 95%|█████████▍| 11743/12384 [24:55:16<1:21:31, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=8.10s]
Epoch 1: 95%|█████████▍| 11744/12384 [24:55:16<1:21:38, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=8.10s]
Epoch 1: 95%|█████████▍| 11744/12384 [24:55:23<1:21:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.78s]
Epoch 1: 95%|█████████▍| 11745/12384 [24:55:23<1:21:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.78s]
Epoch 1: 95%|█████████▍| 11745/12384 [24:55:31<1:21:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.02s]
Epoch 1: 95%|█████████▍| 11746/12384 [24:55:31<1:21:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.02s]
Epoch 1: 95%|█████████▍| 11746/12384 [24:55:39<1:21:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 95%|█████████▍| 11747/12384 [24:55:39<1:21:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 95%|█████████▍| 11747/12384 [24:55:46<1:21:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 95%|█████████▍| 11748/12384 [24:55:46<1:20:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 1: 95%|█████████▍| 11748/12384 [24:55:54<1:20:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 95%|█████████▍| 11749/12384 [24:55:54<1:20:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 95%|█████████▍| 11749/12384 [24:56:02<1:20:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 1: 95%|█████████▍| 11750/12384 [24:56:02<1:20:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 1: 95%|█████████▍| 11750/12384 [24:56:09<1:20:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.02s]
Epoch 1: 95%|█████████▍| 11751/12384 [24:56:09<1:21:13, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.02s]
Epoch 1: 95%|█████████▍| 11751/12384 [24:56:17<1:21:13, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 1: 95%|█████████▍| 11752/12384 [24:56:17<1:20:49, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 1: 95%|█████████▍| 11752/12384 [24:56:25<1:20:49, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 95%|█████████▍| 11753/12384 [24:56:25<1:20:31, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 95%|█████████▍| 11753/12384 [24:56:32<1:20:31, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 95%|█████████▍| 11754/12384 [24:56:32<1:20:29, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 95%|█████████▍| 11754/12384 [24:56:40<1:20:29, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 1: 95%|█████████▍| 11755/12384 [24:56:40<1:21:11, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 1: 95%|█████████▍| 11755/12384 [24:56:48<1:21:11, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 95%|█████████▍| 11756/12384 [24:56:48<1:20:42, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 95%|█████████▍| 11756/12384 [24:56:56<1:20:42, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 1: 95%|█████████▍| 11757/12384 [24:56:56<1:20:22, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 1: 95%|█████████▍| 11757/12384 [24:57:03<1:20:22, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 95%|█████████▍| 11758/12384 [24:57:03<1:19:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 95%|█████████▍| 11758/12384 [24:57:11<1:19:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 95%|█████████▍| 11759/12384 [24:57:11<1:19:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 95%|█████████▍| 11759/12384 [24:57:18<1:19:38, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.58s]
Epoch 1: 95%|█████████▍| 11760/12384 [24:57:18<1:19:29, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.58s]
Epoch 1: 95%|█████████▍| 11760/12384 [24:57:26<1:19:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.37s]
Epoch 1: 95%|█████████▍| 11761/12384 [24:57:26<1:19:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.37s]
Epoch 1: 95%|█████████▍| 11761/12384 [24:57:34<1:19:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.28s]
Epoch 1: 95%|█████████▍| 11762/12384 [24:57:34<1:19:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.28s]
Epoch 1: 95%|█████████▍| 11762/12384 [24:57:41<1:19:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 1: 95%|█████████▍| 11763/12384 [24:57:41<1:19:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 1: 95%|█████████▍| 11763/12384 [24:57:49<1:19:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 1: 95%|█████████▍| 11764/12384 [24:57:49<1:18:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 1: 95%|█████████▍| 11764/12384 [24:57:57<1:18:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 1: 95%|█████████▌| 11765/12384 [24:57:57<1:18:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 1: 95%|█████████▌| 11765/12384 [24:58:04<1:18:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.86s]
Epoch 1: 95%|█████████▌| 11766/12384 [24:58:04<1:18:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.86s]
Epoch 1: 95%|█████████▌| 11766/12384 [24:58:12<1:18:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.89s]
Epoch 1: 95%|█████████▌| 11767/12384 [24:58:12<1:18:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.89s]
Epoch 1: 95%|█████████▌| 11767/12384 [24:58:19<1:18:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.31s]
Epoch 1: 95%|█████████▌| 11768/12384 [24:58:19<1:18:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.31s]
Epoch 1: 95%|█████████▌| 11768/12384 [24:58:27<1:18:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 1: 95%|█████████▌| 11769/12384 [24:58:27<1:17:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 1: 95%|█████████▌| 11769/12384 [24:58:35<1:17:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.94s]
Epoch 1: 95%|█████████▌| 11770/12384 [24:58:35<1:17:48, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.94s]
Epoch 1: 95%|█████████▌| 11770/12384 [24:58:42<1:17:48, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 95%|█████████▌| 11771/12384 [24:58:42<1:17:41, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 95%|█████████▌| 11771/12384 [24:58:50<1:17:41, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 95%|█████████▌| 11772/12384 [24:58:50<1:17:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 95%|█████████▌| 11772/12384 [24:58:57<1:17:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 95%|█████████▌| 11773/12384 [24:58:57<1:17:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 95%|█████████▌| 11773/12384 [24:59:05<1:17:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 95%|█████████▌| 11774/12384 [24:59:05<1:17:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 95%|█████████▌| 11774/12384 [24:59:13<1:17:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 1: 95%|█████████▌| 11775/12384 [24:59:13<1:17:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 1: 95%|█████████▌| 11775/12384 [24:59:20<1:17:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.33s]
Epoch 1: 95%|█████████▌| 11776/12384 [24:59:20<1:17:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.33s]
Epoch 1: 95%|█████████▌| 11776/12384 [24:59:28<1:17:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 95%|█████████▌| 11777/12384 [24:59:28<1:17:47, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 95%|█████████▌| 11777/12384 [24:59:36<1:17:47, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 95%|█████████▌| 11778/12384 [24:59:36<1:17:25, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 95%|█████████▌| 11778/12384 [24:59:43<1:17:25, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=3.08s]
Epoch 1: 95%|█████████▌| 11779/12384 [24:59:43<1:17:10, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=3.08s]
Epoch 1: 95%|█████████▌| 11779/12384 [24:59:51<1:17:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=12.13s]
Epoch 1: 95%|█████████▌| 11780/12384 [24:59:51<1:16:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=12.13s]
Epoch 1: 95%|█████████▌| 11780/12384 [24:59:59<1:16:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 95%|█████████▌| 11781/12384 [24:59:59<1:17:36, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 95%|█████████▌| 11781/12384 [25:00:06<1:17:36, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 1: 95%|█████████▌| 11782/12384 [25:00:06<1:17:04, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 1: 95%|█████████▌| 11782/12384 [25:00:14<1:17:04, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.36s]
Epoch 1: 95%|█████████▌| 11783/12384 [25:00:14<1:16:40, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.36s]
Epoch 1: 95%|█████████▌| 11783/12384 [25:00:22<1:16:40, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 95%|█████████▌| 11784/12384 [25:00:22<1:16:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 95%|█████████▌| 11784/12384 [25:00:29<1:16:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 95%|█████████▌| 11785/12384 [25:00:29<1:16:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 95%|█████████▌| 11785/12384 [25:00:37<1:16:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 95%|█████████▌| 11786/12384 [25:00:37<1:15:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 95%|█████████▌| 11786/12384 [25:00:45<1:15:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 95%|█████████▌| 11787/12384 [25:00:45<1:15:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 95%|█████████▌| 11787/12384 [25:00:52<1:15:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 95%|█████████▌| 11788/12384 [25:00:52<1:15:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 95%|█████████▌| 11788/12384 [25:01:00<1:15:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 95%|█████████▌| 11789/12384 [25:01:00<1:15:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 95%|█████████▌| 11789/12384 [25:01:07<1:15:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 95%|█████████▌| 11790/12384 [25:01:07<1:15:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 95%|█████████▌| 11790/12384 [25:01:15<1:15:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 1: 95%|█████████▌| 11791/12384 [25:01:15<1:15:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 1: 95%|█████████▌| 11791/12384 [25:01:23<1:15:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 1: 95%|█████████▌| 11792/12384 [25:01:23<1:15:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 1: 95%|█████████▌| 11792/12384 [25:01:30<1:15:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 95%|█████████▌| 11793/12384 [25:01:30<1:15:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 95%|█████████▌| 11793/12384 [25:01:38<1:15:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 95%|█████████▌| 11794/12384 [25:01:38<1:14:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 1: 95%|█████████▌| 11794/12384 [25:01:45<1:14:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 95%|█████████▌| 11795/12384 [25:01:45<1:14:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 1: 95%|█████████▌| 11795/12384 [25:01:53<1:14:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 95%|█████████▌| 11796/12384 [25:01:53<1:14:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 95%|█████████▌| 11796/12384 [25:02:01<1:14:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 95%|█████████▌| 11797/12384 [25:02:01<1:14:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 95%|█████████▌| 11797/12384 [25:02:08<1:14:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 1: 95%|█████████▌| 11798/12384 [25:02:08<1:14:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 1: 95%|█████████▌| 11798/12384 [25:02:16<1:14:19, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.51s]
Epoch 1: 95%|█████████▌| 11799/12384 [25:02:16<1:14:06, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=8.51s]
Epoch 1: 95%|█████████▌| 11799/12384 [25:02:23<1:14:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 95%|█████████▌| 11800/12384 [25:02:23<1:14:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 95%|█████████▌| 11800/12384 [25:02:31<1:14:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 95%|█████████▌| 11801/12384 [25:02:31<1:14:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 95%|█████████▌| 11801/12384 [25:02:39<1:14:05, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 1: 95%|█████████▌| 11802/12384 [25:02:39<1:13:55, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 1: 95%|█████████▌| 11802/12384 [25:02:47<1:13:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 95%|█████████▌| 11803/12384 [25:02:47<1:14:34, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 95%|█████████▌| 11803/12384 [25:02:54<1:14:34, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 1: 95%|█████████▌| 11804/12384 [25:02:54<1:14:27, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 1: 95%|█████████▌| 11804/12384 [25:03:02<1:14:27, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 95%|█████████▌| 11805/12384 [25:03:02<1:14:04, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 95%|█████████▌| 11805/12384 [25:03:10<1:14:04, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=6.67s]
Epoch 1: 95%|█████████▌| 11806/12384 [25:03:10<1:13:46, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=6.67s]
Epoch 1: 95%|█████████▌| 11806/12384 [25:03:17<1:13:46, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 1: 95%|█████████▌| 11807/12384 [25:03:17<1:13:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 1: 95%|█████████▌| 11807/12384 [25:03:25<1:13:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 1: 95%|█████████▌| 11808/12384 [25:03:25<1:14:19, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 1: 95%|█████████▌| 11808/12384 [25:03:33<1:14:19, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 95%|█████████▌| 11809/12384 [25:03:33<1:13:52, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 95%|█████████▌| 11809/12384 [25:03:40<1:13:52, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 1: 95%|█████████▌| 11810/12384 [25:03:40<1:13:28, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 1: 95%|█████████▌| 11810/12384 [25:03:48<1:13:28, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 1: 95%|█████████▌| 11811/12384 [25:03:48<1:13:08, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 1: 95%|█████████▌| 11811/12384 [25:03:56<1:13:08, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 1: 95%|█████████▌| 11812/12384 [25:03:56<1:12:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 1: 95%|█████████▌| 11812/12384 [25:04:03<1:12:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 95%|█████████▌| 11813/12384 [25:04:03<1:12:56, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 95%|█████████▌| 11813/12384 [25:04:11<1:12:56, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 1: 95%|█████████▌| 11814/12384 [25:04:11<1:12:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 1: 95%|█████████▌| 11814/12384 [25:04:19<1:12:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 95%|█████████▌| 11815/12384 [25:04:19<1:12:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 95%|█████████▌| 11815/12384 [25:04:26<1:12:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 1: 95%|█████████▌| 11816/12384 [25:04:26<1:12:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 1: 95%|█████████▌| 11816/12384 [25:04:34<1:12:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 95%|█████████▌| 11817/12384 [25:04:34<1:12:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 95%|█████████▌| 11817/12384 [25:04:41<1:12:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 95%|█████████▌| 11818/12384 [25:04:41<1:11:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 95%|█████████▌| 11818/12384 [25:04:49<1:11:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 95%|█████████▌| 11819/12384 [25:04:49<1:11:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 95%|█████████▌| 11819/12384 [25:04:57<1:11:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 1: 95%|█████████▌| 11820/12384 [25:04:57<1:11:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 1: 95%|█████████▌| 11820/12384 [25:05:04<1:11:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 95%|█████████▌| 11821/12384 [25:05:04<1:11:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 95%|█████████▌| 11821/12384 [25:05:12<1:11:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.97s]
Epoch 1: 95%|█████████▌| 11822/12384 [25:05:12<1:11:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.97s]
Epoch 1: 95%|█████████▌| 11822/12384 [25:05:20<1:11:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 95%|█████████▌| 11823/12384 [25:05:20<1:11:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 95%|█████████▌| 11823/12384 [25:05:27<1:11:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 95%|█████████▌| 11824/12384 [25:05:27<1:11:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 95%|█████████▌| 11824/12384 [25:05:35<1:11:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.26s]
Epoch 1: 95%|█████████▌| 11825/12384 [25:05:35<1:10:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.26s]
Epoch 1: 95%|█████████▌| 11825/12384 [25:05:42<1:10:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 1: 95%|█████████▌| 11826/12384 [25:05:42<1:10:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 1: 95%|█████████▌| 11826/12384 [25:05:50<1:10:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 1: 96%|█████████▌| 11827/12384 [25:05:50<1:10:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 1: 96%|█████████▌| 11827/12384 [25:05:58<1:10:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 96%|█████████▌| 11828/12384 [25:05:58<1:10:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 96%|█████████▌| 11828/12384 [25:06:05<1:10:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 1: 96%|█████████▌| 11829/12384 [25:06:05<1:10:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 1: 96%|█████████▌| 11829/12384 [25:06:13<1:10:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 96%|█████████▌| 11830/12384 [25:06:13<1:10:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 96%|█████████▌| 11830/12384 [25:06:20<1:10:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 1: 96%|█████████▌| 11831/12384 [25:06:20<1:10:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 1: 96%|█████████▌| 11831/12384 [25:06:28<1:10:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 1: 96%|█████████▌| 11832/12384 [25:06:28<1:09:57, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 1: 96%|█████████▌| 11832/12384 [25:06:36<1:09:57, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=3.68s]
Epoch 1: 96%|█████████▌| 11833/12384 [25:06:36<1:09:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.68s]
Epoch 1: 96%|█████████▌| 11833/12384 [25:06:44<1:09:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.62s]
Epoch 1: 96%|█████████▌| 11834/12384 [25:06:44<1:10:51, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.62s]
Epoch 1: 96%|█████████▌| 11834/12384 [25:06:51<1:10:51, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=10.54s]
Epoch 1: 96%|█████████▌| 11835/12384 [25:06:51<1:10:24, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.54s]
Epoch 1: 96%|█████████▌| 11835/12384 [25:06:59<1:10:24, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 1: 96%|█████████▌| 11836/12384 [25:06:59<1:10:06, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 1: 96%|█████████▌| 11836/12384 [25:07:07<1:10:06, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 96%|█████████▌| 11837/12384 [25:07:07<1:10:05, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 96%|█████████▌| 11837/12384 [25:07:14<1:10:05, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.22s]
Epoch 1: 96%|█████████▌| 11838/12384 [25:07:14<1:09:48, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.22s]
Epoch 1: 96%|█████████▌| 11838/12384 [25:07:22<1:09:48, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.16s]
Epoch 1: 96%|█████████▌| 11839/12384 [25:07:22<1:09:48, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.16s]
Epoch 1: 96%|█████████▌| 11839/12384 [25:07:29<1:09:48, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 1: 96%|█████████▌| 11840/12384 [25:07:29<1:09:25, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 1: 96%|█████████▌| 11840/12384 [25:07:37<1:09:25, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 1: 96%|█████████▌| 11841/12384 [25:07:37<1:09:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 1: 96%|█████████▌| 11841/12384 [25:07:45<1:09:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.53s]
Epoch 1: 96%|█████████▌| 11842/12384 [25:07:45<1:09:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.53s]
Epoch 1: 96%|█████████▌| 11842/12384 [25:07:52<1:09:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 1: 96%|█████████▌| 11843/12384 [25:07:52<1:08:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 1: 96%|█████████▌| 11843/12384 [25:08:00<1:08:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 1: 96%|█████████▌| 11844/12384 [25:08:00<1:08:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 1: 96%|█████████▌| 11844/12384 [25:08:08<1:08:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.49s]
Epoch 1: 96%|█████████▌| 11845/12384 [25:08:08<1:08:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.49s]
Epoch 1: 96%|█████████▌| 11845/12384 [25:08:15<1:08:21, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.07s]
Epoch 1: 96%|█████████▌| 11846/12384 [25:08:15<1:08:14, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.07s]
Epoch 1: 96%|█████████▌| 11846/12384 [25:08:23<1:08:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 1: 96%|█████████▌| 11847/12384 [25:08:23<1:08:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 1: 96%|█████████▌| 11847/12384 [25:08:30<1:08:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 96%|█████████▌| 11848/12384 [25:08:30<1:08:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 96%|█████████▌| 11848/12384 [25:08:38<1:08:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 96%|█████████▌| 11849/12384 [25:08:38<1:07:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 96%|█████████▌| 11849/12384 [25:08:46<1:07:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 96%|█████████▌| 11850/12384 [25:08:46<1:07:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 96%|█████████▌| 11850/12384 [25:08:53<1:07:46, 7.62s/it, loss=0.0002, acc=0.9999, iter_time=7.65s]
Epoch 1: 96%|█████████▌| 11851/12384 [25:08:53<1:07:38, 7.61s/it, loss=0.0002, acc=0.9999, iter_time=7.65s]
Epoch 1: 96%|█████████▌| 11851/12384 [25:09:01<1:07:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 96%|█████████▌| 11852/12384 [25:09:01<1:07:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 96%|█████████▌| 11852/12384 [25:09:08<1:07:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 1: 96%|█████████▌| 11853/12384 [25:09:08<1:07:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 1: 96%|█████████▌| 11853/12384 [25:09:16<1:07:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 1: 96%|█████████▌| 11854/12384 [25:09:16<1:07:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 1: 96%|█████████▌| 11854/12384 [25:09:24<1:07:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 96%|█████████▌| 11855/12384 [25:09:24<1:07:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 96%|█████████▌| 11855/12384 [25:09:31<1:07:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 96%|█████████▌| 11856/12384 [25:09:31<1:06:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 96%|█████████▌| 11856/12384 [25:09:39<1:06:56, 7.61s/it, loss=0.0004, acc=0.9994, iter_time=6.13s]
Epoch 1: 96%|█████████▌| 11857/12384 [25:09:39<1:06:51, 7.61s/it, loss=0.0004, acc=0.9994, iter_time=6.13s]
Epoch 1: 96%|█████████▌| 11857/12384 [25:09:46<1:06:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 1: 96%|█████████▌| 11858/12384 [25:09:46<1:06:39, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 1: 96%|█████████▌| 11858/12384 [25:09:54<1:06:39, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 96%|█████████▌| 11859/12384 [25:09:54<1:06:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 96%|█████████▌| 11859/12384 [25:10:02<1:06:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 1: 96%|█████████▌| 11860/12384 [25:10:02<1:06:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 1: 96%|█████████▌| 11860/12384 [25:10:10<1:06:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 1: 96%|█████████▌| 11861/12384 [25:10:10<1:07:07, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 1: 96%|█████████▌| 11861/12384 [25:10:17<1:07:07, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 96%|█████████▌| 11862/12384 [25:10:17<1:06:45, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 96%|█████████▌| 11862/12384 [25:10:25<1:06:45, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 96%|█████████▌| 11863/12384 [25:10:25<1:06:25, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 96%|█████████▌| 11863/12384 [25:10:32<1:06:25, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 96%|█████████▌| 11864/12384 [25:10:32<1:06:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 96%|█████████▌| 11864/12384 [25:10:40<1:06:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 96%|█████████▌| 11865/12384 [25:10:40<1:05:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 96%|█████████▌| 11865/12384 [25:10:48<1:05:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 96%|█████████▌| 11866/12384 [25:10:48<1:05:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 96%|█████████▌| 11866/12384 [25:10:55<1:05:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 96%|█████████▌| 11867/12384 [25:10:55<1:05:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 96%|█████████▌| 11867/12384 [25:11:03<1:05:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 96%|█████████▌| 11868/12384 [25:11:03<1:05:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 96%|█████████▌| 11868/12384 [25:11:10<1:05:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 96%|█████████▌| 11869/12384 [25:11:10<1:05:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 96%|█████████▌| 11869/12384 [25:11:18<1:05:21, 7.61s/it, loss=0.0002, acc=0.9995, iter_time=7.59s]
Epoch 1: 96%|█████████▌| 11870/12384 [25:11:18<1:05:12, 7.61s/it, loss=0.0002, acc=0.9995, iter_time=7.59s]
Epoch 1: 96%|█████████▌| 11870/12384 [25:11:26<1:05:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 96%|█████████▌| 11871/12384 [25:11:26<1:05:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 96%|█████████▌| 11871/12384 [25:11:33<1:05:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 96%|█████████▌| 11872/12384 [25:11:33<1:04:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 96%|█████████▌| 11872/12384 [25:11:41<1:04:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 96%|█████████▌| 11873/12384 [25:11:41<1:04:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 96%|█████████▌| 11873/12384 [25:11:48<1:04:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 96%|█████████▌| 11874/12384 [25:11:48<1:04:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 96%|█████████▌| 11874/12384 [25:11:56<1:04:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 96%|█████████▌| 11875/12384 [25:11:56<1:04:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 96%|█████████▌| 11875/12384 [25:12:04<1:04:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 1: 96%|█████████▌| 11876/12384 [25:12:04<1:04:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 1: 96%|█████████▌| 11876/12384 [25:12:11<1:04:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 96%|█████████▌| 11877/12384 [25:12:11<1:04:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 96%|█████████▌| 11877/12384 [25:12:19<1:04:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 96%|█████████▌| 11878/12384 [25:12:19<1:04:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 1: 96%|█████████▌| 11878/12384 [25:12:27<1:04:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.21s]
Epoch 1: 96%|█████████▌| 11879/12384 [25:12:27<1:04:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.21s]
Epoch 1: 96%|█████████▌| 11879/12384 [25:12:34<1:04:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.95s]
Epoch 1: 96%|█████████▌| 11880/12384 [25:12:34<1:03:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.95s]
Epoch 1: 96%|█████████▌| 11880/12384 [25:12:42<1:03:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 96%|█████████▌| 11881/12384 [25:12:42<1:03:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 96%|█████████▌| 11881/12384 [25:12:49<1:03:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 96%|█████████▌| 11882/12384 [25:12:49<1:03:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 1: 96%|█████████▌| 11882/12384 [25:12:57<1:03:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 1: 96%|█████████▌| 11883/12384 [25:12:57<1:04:14, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 1: 96%|█████████▌| 11883/12384 [25:13:05<1:04:14, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.99s]
Epoch 1: 96%|█████████▌| 11884/12384 [25:13:05<1:03:50, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.99s]
Epoch 1: 96%|█████████▌| 11884/12384 [25:13:12<1:03:50, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 1: 96%|█████████▌| 11885/12384 [25:13:12<1:03:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 1: 96%|█████████▌| 11885/12384 [25:13:20<1:03:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 96%|█████████▌| 11886/12384 [25:13:20<1:03:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 96%|█████████▌| 11886/12384 [25:13:28<1:03:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 96%|█████████▌| 11887/12384 [25:13:28<1:04:03, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 96%|█████████▌| 11887/12384 [25:13:36<1:04:03, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 1: 96%|█████████▌| 11888/12384 [25:13:36<1:03:38, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 1: 96%|█████████▌| 11888/12384 [25:13:43<1:03:38, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 96%|█████████▌| 11889/12384 [25:13:43<1:03:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 96%|█████████▌| 11889/12384 [25:13:51<1:03:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.33s]
Epoch 1: 96%|█████████▌| 11890/12384 [25:13:51<1:02:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.33s]
Epoch 1: 96%|█████████▌| 11890/12384 [25:13:58<1:02:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 1: 96%|█████████▌| 11891/12384 [25:13:58<1:02:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 1: 96%|█████████▌| 11891/12384 [25:14:06<1:02:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 96%|█████████▌| 11892/12384 [25:14:06<1:02:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 96%|█████████▌| 11892/12384 [25:14:14<1:02:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 1: 96%|█████████▌| 11893/12384 [25:14:14<1:02:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 1: 96%|█████████▌| 11893/12384 [25:14:21<1:02:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 1: 96%|█████████▌| 11894/12384 [25:14:21<1:02:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 1: 96%|█████████▌| 11894/12384 [25:14:29<1:02:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 96%|█████████▌| 11895/12384 [25:14:29<1:02:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 96%|█████████▌| 11895/12384 [25:14:37<1:02:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 96%|█████████▌| 11896/12384 [25:14:37<1:01:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 1: 96%|█████████▌| 11896/12384 [25:14:44<1:01:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 96%|█████████▌| 11897/12384 [25:14:44<1:01:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 96%|█████████▌| 11897/12384 [25:14:52<1:01:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 96%|█████████▌| 11898/12384 [25:14:52<1:01:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 96%|█████████▌| 11898/12384 [25:14:59<1:01:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 96%|█████████▌| 11899/12384 [25:14:59<1:01:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 96%|█████████▌| 11899/12384 [25:15:07<1:01:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.87s]
Epoch 1: 96%|█████████▌| 11900/12384 [25:15:07<1:01:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=3.87s]
Epoch 1: 96%|█████████▌| 11900/12384 [25:15:15<1:01:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.64s]
Epoch 1: 96%|█████████▌| 11901/12384 [25:15:15<1:01:12, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.64s]
Epoch 1: 96%|█████████▌| 11901/12384 [25:15:22<1:01:12, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 96%|█████████▌| 11902/12384 [25:15:22<1:01:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 96%|█████████▌| 11902/12384 [25:15:30<1:01:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 96%|█████████▌| 11903/12384 [25:15:30<1:01:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 96%|█████████▌| 11903/12384 [25:15:37<1:01:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 96%|█████████▌| 11904/12384 [25:15:37<1:00:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 96%|█████████▌| 11904/12384 [25:15:45<1:00:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 96%|█████████▌| 11905/12384 [25:15:45<1:00:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 96%|█████████▌| 11905/12384 [25:15:53<1:00:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 96%|█████████▌| 11906/12384 [25:15:53<1:00:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 96%|█████████▌| 11906/12384 [25:16:00<1:00:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 96%|█████████▌| 11907/12384 [25:16:00<1:00:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 96%|█████████▌| 11907/12384 [25:16:08<1:00:29, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.07s]
Epoch 1: 96%|█████████▌| 11908/12384 [25:16:08<1:00:20, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.07s]
Epoch 1: 96%|█████████▌| 11908/12384 [25:16:15<1:00:20, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.67s]
Epoch 1: 96%|█████████▌| 11909/12384 [25:16:15<1:00:13, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.67s]
Epoch 1: 96%|█████████▌| 11909/12384 [25:16:23<1:00:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 1: 96%|█████████▌| 11910/12384 [25:16:23<1:00:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 1: 96%|█████████▌| 11910/12384 [25:16:31<1:00:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 96%|█████████▌| 11911/12384 [25:16:31<1:00:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 96%|█████████▌| 11911/12384 [25:16:38<1:00:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 96%|█████████▌| 11912/12384 [25:16:38<59:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 96%|█████████▌| 11912/12384 [25:16:46<59:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 96%|█████████▌| 11913/12384 [25:16:46<1:00:26, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 96%|█████████▌| 11913/12384 [25:16:54<1:00:26, 7.70s/it, loss=0.0009, acc=0.9961, iter_time=4.26s]
Epoch 1: 96%|█████████▌| 11914/12384 [25:16:54<1:00:06, 7.67s/it, loss=0.0009, acc=0.9961, iter_time=4.26s]
Epoch 1: 96%|█████████▌| 11914/12384 [25:17:01<1:00:06, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=11.23s]
Epoch 1: 96%|█████████▌| 11915/12384 [25:17:01<59:58, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=11.23s]
Epoch 1: 96%|█████████▌| 11915/12384 [25:17:09<59:58, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=8.01s]
Epoch 1: 96%|█████████▌| 11916/12384 [25:17:09<59:40, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.01s]
Epoch 1: 96%|█████████▌| 11916/12384 [25:17:17<59:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 96%|█████████▌| 11917/12384 [25:17:17<59:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 1: 96%|█████████▌| 11917/12384 [25:17:24<59:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 1: 96%|█████████▌| 11918/12384 [25:17:24<59:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 1: 96%|█████████▌| 11918/12384 [25:17:32<59:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.72s]
Epoch 1: 96%|█████████▌| 11919/12384 [25:17:32<59:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.72s]
Epoch 1: 96%|█████████▌| 11919/12384 [25:17:40<59:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 96%|█████████▋| 11920/12384 [25:17:40<58:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 96%|█████████▋| 11920/12384 [25:17:47<58:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 96%|█████████▋| 11921/12384 [25:17:47<58:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 96%|█████████▋| 11921/12384 [25:17:55<58:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 96%|█████████▋| 11922/12384 [25:17:55<58:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 96%|█████████▋| 11922/12384 [25:18:02<58:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 96%|█████████▋| 11923/12384 [25:18:02<58:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 96%|█████████▋| 11923/12384 [25:18:10<58:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 1: 96%|█████████▋| 11924/12384 [25:18:10<58:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 1: 96%|█████████▋| 11924/12384 [25:18:18<58:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 96%|█████████▋| 11925/12384 [25:18:18<58:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 96%|█████████▋| 11925/12384 [25:18:25<58:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.12s]
Epoch 1: 96%|█████████▋| 11926/12384 [25:18:25<58:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.12s]
Epoch 1: 96%|█████████▋| 11926/12384 [25:18:33<58:07, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.32s]
Epoch 1: 96%|█████████▋| 11927/12384 [25:18:33<58:13, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=4.32s]
Epoch 1: 96%|█████████▋| 11927/12384 [25:18:41<58:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.41s]
Epoch 1: 96%|█████████▋| 11928/12384 [25:18:41<58:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.41s]
Epoch 1: 96%|█████████▋| 11928/12384 [25:18:48<58:02, 7.64s/it, loss=0.0003, acc=0.9986, iter_time=4.65s]
Epoch 1: 96%|█████████▋| 11929/12384 [25:18:48<57:50, 7.63s/it, loss=0.0003, acc=0.9986, iter_time=4.65s]
Epoch 1: 96%|█████████▋| 11929/12384 [25:18:56<57:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.58s]
Epoch 1: 96%|█████████▋| 11930/12384 [25:18:56<57:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.58s]
Epoch 1: 96%|█████████▋| 11930/12384 [25:19:03<57:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 96%|█████████▋| 11931/12384 [25:19:03<57:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 1: 96%|█████████▋| 11931/12384 [25:19:11<57:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 96%|█████████▋| 11932/12384 [25:19:11<57:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 96%|█████████▋| 11932/12384 [25:19:19<57:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 1: 96%|█████████▋| 11933/12384 [25:19:19<57:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 1: 96%|█████████▋| 11933/12384 [25:19:26<57:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 1: 96%|█████████▋| 11934/12384 [25:19:26<57:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 1: 96%|█████████▋| 11934/12384 [25:19:34<57:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 1: 96%|█████████▋| 11935/12384 [25:19:34<56:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 1: 96%|█████████▋| 11935/12384 [25:19:41<56:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.06s]
Epoch 1: 96%|█████████▋| 11936/12384 [25:19:41<56:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.06s]
Epoch 1: 96%|█████████▋| 11936/12384 [25:19:49<56:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 96%|█████████▋| 11937/12384 [25:19:49<56:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 96%|█████████▋| 11937/12384 [25:19:57<56:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 96%|█████████▋| 11938/12384 [25:19:57<56:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 96%|█████████▋| 11938/12384 [25:20:05<56:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 96%|█████████▋| 11939/12384 [25:20:05<57:17, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 96%|█████████▋| 11939/12384 [25:20:12<57:17, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 96%|█████████▋| 11940/12384 [25:20:12<56:53, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 96%|█████████▋| 11940/12384 [25:20:20<56:53, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 96%|█████████▋| 11941/12384 [25:20:20<56:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 96%|█████████▋| 11941/12384 [25:20:28<56:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 1: 96%|█████████▋| 11942/12384 [25:20:28<56:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 1: 96%|█████████▋| 11942/12384 [25:20:35<56:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.11s]
Epoch 1: 96%|█████████▋| 11943/12384 [25:20:35<56:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.11s]
Epoch 1: 96%|█████████▋| 11943/12384 [25:20:43<56:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.31s]
Epoch 1: 96%|█████████▋| 11944/12384 [25:20:43<56:10, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.31s]
Epoch 1: 96%|█████████▋| 11944/12384 [25:20:50<56:10, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 96%|█████████▋| 11945/12384 [25:20:50<55:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 96%|█████████▋| 11945/12384 [25:20:58<55:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 96%|█████████▋| 11946/12384 [25:20:58<55:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 96%|█████████▋| 11946/12384 [25:21:06<55:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 1: 96%|█████████▋| 11947/12384 [25:21:06<55:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 1: 96%|█████████▋| 11947/12384 [25:21:13<55:30, 7.62s/it, loss=0.0002, acc=0.9999, iter_time=8.46s]
Epoch 1: 96%|█████████▋| 11948/12384 [25:21:13<55:24, 7.63s/it, loss=0.0002, acc=0.9999, iter_time=8.46s]
Epoch 1: 96%|█████████▋| 11948/12384 [25:21:21<55:24, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.21s]
Epoch 1: 96%|█████████▋| 11949/12384 [25:21:21<55:17, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.21s]
Epoch 1: 96%|█████████▋| 11949/12384 [25:21:29<55:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.04s]
Epoch 1: 96%|█████████▋| 11950/12384 [25:21:29<55:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.04s]
Epoch 1: 96%|█████████▋| 11950/12384 [25:21:36<55:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 97%|█████████▋| 11951/12384 [25:21:36<54:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 97%|█████████▋| 11951/12384 [25:21:44<54:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 97%|█████████▋| 11952/12384 [25:21:44<54:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 97%|█████████▋| 11952/12384 [25:21:51<54:50, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 1: 97%|█████████▋| 11953/12384 [25:21:51<54:43, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 1: 97%|█████████▋| 11953/12384 [25:21:59<54:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 1: 97%|█████████▋| 11954/12384 [25:21:59<54:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 1: 97%|█████████▋| 11954/12384 [25:22:07<54:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.33s]
Epoch 1: 97%|█████████▋| 11955/12384 [25:22:07<54:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.33s]
Epoch 1: 97%|█████████▋| 11955/12384 [25:22:14<54:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 97%|█████████▋| 11956/12384 [25:22:14<54:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 97%|█████████▋| 11956/12384 [25:22:22<54:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.50s]
Epoch 1: 97%|█████████▋| 11957/12384 [25:22:22<54:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.50s]
Epoch 1: 97%|█████████▋| 11957/12384 [25:22:29<54:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 1: 97%|█████████▋| 11958/12384 [25:22:29<54:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 1: 97%|█████████▋| 11958/12384 [25:22:37<54:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 97%|█████████▋| 11959/12384 [25:22:37<53:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 97%|█████████▋| 11959/12384 [25:22:45<53:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 97%|█████████▋| 11960/12384 [25:22:45<53:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 97%|█████████▋| 11960/12384 [25:22:53<53:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 97%|█████████▋| 11961/12384 [25:22:53<54:17, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 1: 97%|█████████▋| 11961/12384 [25:23:00<54:17, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.00s]
Epoch 1: 97%|█████████▋| 11962/12384 [25:23:00<54:00, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.00s]
Epoch 1: 97%|█████████▋| 11962/12384 [25:23:08<54:00, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.24s]
Epoch 1: 97%|█████████▋| 11963/12384 [25:23:08<53:45, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.24s]
Epoch 1: 97%|█████████▋| 11963/12384 [25:23:15<53:45, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 97%|█████████▋| 11964/12384 [25:23:15<53:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 97%|█████████▋| 11964/12384 [25:23:23<53:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 97%|█████████▋| 11965/12384 [25:23:23<53:59, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 97%|█████████▋| 11965/12384 [25:23:31<53:59, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 1: 97%|█████████▋| 11966/12384 [25:23:31<53:36, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 1: 97%|█████████▋| 11966/12384 [25:23:39<53:36, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 97%|█████████▋| 11967/12384 [25:23:39<53:17, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 97%|█████████▋| 11967/12384 [25:23:46<53:17, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 97%|█████████▋| 11968/12384 [25:23:46<53:01, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 97%|█████████▋| 11968/12384 [25:23:54<53:01, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 97%|█████████▋| 11969/12384 [25:23:54<52:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 97%|█████████▋| 11969/12384 [25:24:01<52:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.51s]
Epoch 1: 97%|█████████▋| 11970/12384 [25:24:01<52:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.51s]
Epoch 1: 97%|█████████▋| 11970/12384 [25:24:09<52:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 97%|█████████▋| 11971/12384 [25:24:09<52:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 97%|█████████▋| 11971/12384 [25:24:17<52:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.45s]
Epoch 1: 97%|█████████▋| 11972/12384 [25:24:17<52:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.45s]
Epoch 1: 97%|█████████▋| 11972/12384 [25:24:24<52:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 97%|█████████▋| 11973/12384 [25:24:24<52:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 97%|█████████▋| 11973/12384 [25:24:32<52:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.49s]
Epoch 1: 97%|█████████▋| 11974/12384 [25:24:32<52:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.49s]
Epoch 1: 97%|█████████▋| 11974/12384 [25:24:39<52:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 97%|█████████▋| 11975/12384 [25:24:39<51:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 97%|█████████▋| 11975/12384 [25:24:47<51:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.80s]
Epoch 1: 97%|█████████▋| 11976/12384 [25:24:47<51:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.80s]
Epoch 1: 97%|█████████▋| 11976/12384 [25:24:55<51:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 97%|█████████▋| 11977/12384 [25:24:55<51:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 97%|█████████▋| 11977/12384 [25:25:02<51:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 97%|█████████▋| 11978/12384 [25:25:02<51:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 97%|█████████▋| 11978/12384 [25:25:10<51:36, 7.63s/it, loss=0.0001, acc=0.9994, iter_time=7.61s]
Epoch 1: 97%|█████████▋| 11979/12384 [25:25:10<51:26, 7.62s/it, loss=0.0001, acc=0.9994, iter_time=7.61s]
Epoch 1: 97%|█████████▋| 11979/12384 [25:25:18<51:26, 7.62s/it, loss=0.0001, acc=0.9991, iter_time=7.60s]
Epoch 1: 97%|█████████▋| 11980/12384 [25:25:18<51:27, 7.64s/it, loss=0.0001, acc=0.9991, iter_time=7.60s]
Epoch 1: 97%|█████████▋| 11980/12384 [25:25:25<51:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 97%|█████████▋| 11981/12384 [25:25:25<51:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 97%|█████████▋| 11981/12384 [25:25:33<51:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 97%|█████████▋| 11982/12384 [25:25:33<51:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 97%|█████████▋| 11982/12384 [25:25:41<51:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 1: 97%|█████████▋| 11983/12384 [25:25:41<50:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 1: 97%|█████████▋| 11983/12384 [25:25:48<50:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.25s]
Epoch 1: 97%|█████████▋| 11984/12384 [25:25:48<50:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.25s]
Epoch 1: 97%|█████████▋| 11984/12384 [25:25:56<50:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 1: 97%|█████████▋| 11985/12384 [25:25:56<50:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 1: 97%|█████████▋| 11985/12384 [25:26:03<50:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.46s]
Epoch 1: 97%|█████████▋| 11986/12384 [25:26:03<50:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.46s]
Epoch 1: 97%|█████████▋| 11986/12384 [25:26:11<50:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 97%|█████████▋| 11987/12384 [25:26:11<51:04, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 97%|█████████▋| 11987/12384 [25:26:19<51:04, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 97%|█████████▋| 11988/12384 [25:26:19<50:48, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 97%|█████████▋| 11988/12384 [25:26:27<50:48, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 97%|█████████▋| 11989/12384 [25:26:27<50:30, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 97%|█████████▋| 11989/12384 [25:26:34<50:30, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 97%|█████████▋| 11990/12384 [25:26:34<50:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 97%|█████████▋| 11990/12384 [25:26:42<50:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 97%|█████████▋| 11991/12384 [25:26:42<50:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 97%|█████████▋| 11991/12384 [25:26:50<50:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 1: 97%|█████████▋| 11992/12384 [25:26:50<50:28, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 1: 97%|█████████▋| 11992/12384 [25:26:57<50:28, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=4.85s]
Epoch 1: 97%|█████████▋| 11993/12384 [25:26:57<50:05, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.85s]
Epoch 1: 97%|█████████▋| 11993/12384 [25:27:05<50:05, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 1: 97%|█████████▋| 11994/12384 [25:27:05<49:46, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 1: 97%|█████████▋| 11994/12384 [25:27:13<49:46, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 97%|█████████▋| 11995/12384 [25:27:13<49:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 97%|█████████▋| 11995/12384 [25:27:20<49:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 97%|█████████▋| 11996/12384 [25:27:20<49:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 97%|█████████▋| 11996/12384 [25:27:28<49:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 97%|█████████▋| 11997/12384 [25:27:28<49:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 97%|█████████▋| 11997/12384 [25:27:35<49:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 97%|█████████▋| 11998/12384 [25:27:35<49:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 1: 97%|█████████▋| 11998/12384 [25:27:43<49:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 1: 97%|█████████▋| 11999/12384 [25:27:43<48:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 1: 97%|█████████▋| 11999/12384 [25:27:51<48:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 97%|█████████▋| 12000/12384 [25:27:51<48:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 97%|█████████▋| 12000/12384 [25:27:58<48:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.42s]
Epoch 1: 97%|█████████▋| 12001/12384 [25:27:58<48:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.42s]
Epoch 1: 97%|█████████▋| 12001/12384 [25:28:06<48:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 1: 97%|█████████▋| 12002/12384 [25:28:06<48:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 1: 97%|█████████▋| 12002/12384 [25:28:13<48:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 97%|█████████▋| 12003/12384 [25:28:13<48:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 97%|█████████▋| 12003/12384 [25:28:21<48:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 1: 97%|█████████▋| 12004/12384 [25:28:21<48:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 1: 97%|█████████▋| 12004/12384 [25:28:29<48:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 1: 97%|█████████▋| 12005/12384 [25:28:29<48:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 1: 97%|█████████▋| 12005/12384 [25:28:36<48:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 1: 97%|█████████▋| 12006/12384 [25:28:36<47:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 1: 97%|█████████▋| 12006/12384 [25:28:44<47:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 1: 97%|█████████▋| 12007/12384 [25:28:44<47:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 1: 97%|█████████▋| 12007/12384 [25:28:51<47:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 97%|█████████▋| 12008/12384 [25:28:51<47:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 97%|█████████▋| 12008/12384 [25:28:59<47:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 97%|█████████▋| 12009/12384 [25:28:59<47:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 97%|█████████▋| 12009/12384 [25:29:07<47:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 97%|█████████▋| 12010/12384 [25:29:07<47:23, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 97%|█████████▋| 12010/12384 [25:29:14<47:23, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 97%|█████████▋| 12011/12384 [25:29:14<47:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 97%|█████████▋| 12011/12384 [25:29:22<47:17, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=7.61s]
Epoch 1: 97%|█████████▋| 12012/12384 [25:29:22<47:10, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=7.61s]
Epoch 1: 97%|█████████▋| 12012/12384 [25:29:29<47:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 97%|█████████▋| 12013/12384 [25:29:29<47:01, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 97%|█████████▋| 12013/12384 [25:29:37<47:01, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 97%|█████████▋| 12014/12384 [25:29:37<47:25, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 97%|█████████▋| 12014/12384 [25:29:45<47:25, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 97%|█████████▋| 12015/12384 [25:29:45<47:08, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 97%|█████████▋| 12015/12384 [25:29:53<47:08, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 97%|█████████▋| 12016/12384 [25:29:53<46:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 97%|█████████▋| 12016/12384 [25:30:00<46:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 97%|█████████▋| 12017/12384 [25:30:00<46:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 97%|█████████▋| 12017/12384 [25:30:08<46:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 97%|█████████▋| 12018/12384 [25:30:08<47:08, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 97%|█████████▋| 12018/12384 [25:30:16<47:08, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 1: 97%|█████████▋| 12019/12384 [25:30:16<46:44, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 1: 97%|█████████▋| 12019/12384 [25:30:23<46:44, 7.68s/it, loss=0.0000, acc=0.9999, iter_time=7.61s]
Epoch 1: 97%|█████████▋| 12020/12384 [25:30:23<46:29, 7.66s/it, loss=0.0000, acc=0.9999, iter_time=7.61s]
Epoch 1: 97%|█████████▋| 12020/12384 [25:30:31<46:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 97%|█████████▋| 12021/12384 [25:30:31<46:24, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 97%|█████████▋| 12021/12384 [25:30:39<46:24, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 97%|█████████▋| 12022/12384 [25:30:39<46:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 97%|█████████▋| 12022/12384 [25:30:46<46:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 97%|█████████▋| 12023/12384 [25:30:46<45:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 97%|█████████▋| 12023/12384 [25:30:54<45:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 97%|█████████▋| 12024/12384 [25:30:54<45:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 1: 97%|█████████▋| 12024/12384 [25:31:01<45:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 97%|█████████▋| 12025/12384 [25:31:01<45:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 97%|█████████▋| 12025/12384 [25:31:09<45:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 97%|█████████▋| 12026/12384 [25:31:09<45:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 97%|█████████▋| 12026/12384 [25:31:17<45:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 97%|█████████▋| 12027/12384 [25:31:17<45:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 97%|█████████▋| 12027/12384 [25:31:24<45:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 1: 97%|█████████▋| 12028/12384 [25:31:24<45:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 1: 97%|█████████▋| 12028/12384 [25:31:32<45:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 1: 97%|█████████▋| 12029/12384 [25:31:32<45:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 1: 97%|█████████▋| 12029/12384 [25:31:40<45:02, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=7.61s]
Epoch 1: 97%|█████████▋| 12030/12384 [25:31:40<44:57, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=7.61s]
Epoch 1: 97%|█████████▋| 12030/12384 [25:31:47<44:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 97%|█████████▋| 12031/12384 [25:31:47<44:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 97%|█████████▋| 12031/12384 [25:31:55<44:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 97%|█████████▋| 12032/12384 [25:31:55<44:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 97%|█████████▋| 12032/12384 [25:32:02<44:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 97%|█████████▋| 12033/12384 [25:32:02<44:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 97%|█████████▋| 12033/12384 [25:32:10<44:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 1: 97%|█████████▋| 12034/12384 [25:32:10<44:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 1: 97%|█████████▋| 12034/12384 [25:32:18<44:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 1: 97%|█████████▋| 12035/12384 [25:32:18<44:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 1: 97%|█████████▋| 12035/12384 [25:32:25<44:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 97%|█████████▋| 12036/12384 [25:32:25<44:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 97%|█████████▋| 12036/12384 [25:32:33<44:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 97%|█████████▋| 12037/12384 [25:32:33<44:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 97%|█████████▋| 12037/12384 [25:32:40<44:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 97%|█████████▋| 12038/12384 [25:32:40<43:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 97%|█████████▋| 12038/12384 [25:32:48<43:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 97%|█████████▋| 12039/12384 [25:32:48<43:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 97%|█████████▋| 12039/12384 [25:32:56<43:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 1: 97%|█████████▋| 12040/12384 [25:32:56<43:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 1: 97%|█████████▋| 12040/12384 [25:33:04<43:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 1: 97%|█████████▋| 12041/12384 [25:33:04<44:05, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 1: 97%|█████████▋| 12041/12384 [25:33:11<44:05, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 1: 97%|█████████▋| 12042/12384 [25:33:11<43:45, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 1: 97%|█████████▋| 12042/12384 [25:33:19<43:45, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 1: 97%|█████████▋| 12043/12384 [25:33:19<43:32, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 1: 97%|█████████▋| 12043/12384 [25:33:26<43:32, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 97%|█████████▋| 12044/12384 [25:33:26<43:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 97%|█████████▋| 12044/12384 [25:33:34<43:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.35s]
Epoch 1: 97%|█████████▋| 12045/12384 [25:33:34<43:42, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=4.35s]
Epoch 1: 97%|█████████▋| 12045/12384 [25:33:42<43:42, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=11.20s]
Epoch 1: 97%|█████████▋| 12046/12384 [25:33:42<43:23, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=11.20s]
Epoch 1: 97%|█████████▋| 12046/12384 [25:33:50<43:23, 7.70s/it, loss=0.0005, acc=0.9979, iter_time=7.61s]
Epoch 1: 97%|█████████▋| 12047/12384 [25:33:50<43:05, 7.67s/it, loss=0.0005, acc=0.9979, iter_time=7.61s]
Epoch 1: 97%|█████████▋| 12047/12384 [25:33:57<43:05, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 97%|█████████▋| 12048/12384 [25:33:57<42:56, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 97%|█████████▋| 12048/12384 [25:34:05<42:56, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 97%|█████████▋| 12049/12384 [25:34:05<42:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 97%|█████████▋| 12049/12384 [25:34:13<42:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 97%|█████████▋| 12050/12384 [25:34:13<42:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 97%|█████████▋| 12050/12384 [25:34:20<42:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 97%|█████████▋| 12051/12384 [25:34:20<42:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 97%|█████████▋| 12051/12384 [25:34:28<42:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 1: 97%|█████████▋| 12052/12384 [25:34:28<42:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 1: 97%|█████████▋| 12052/12384 [25:34:35<42:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 97%|█████████▋| 12053/12384 [25:34:35<42:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 97%|█████████▋| 12053/12384 [25:34:43<42:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 1: 97%|█████████▋| 12054/12384 [25:34:43<41:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 1: 97%|█████████▋| 12054/12384 [25:34:51<41:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 97%|█████████▋| 12055/12384 [25:34:51<41:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 97%|█████████▋| 12055/12384 [25:34:58<41:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 97%|█████████▋| 12056/12384 [25:34:58<41:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 97%|█████████▋| 12056/12384 [25:35:06<41:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 97%|█████████▋| 12057/12384 [25:35:06<41:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 97%|█████████▋| 12057/12384 [25:35:13<41:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 97%|█████████▋| 12058/12384 [25:35:13<41:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 97%|█████████▋| 12058/12384 [25:35:21<41:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 1: 97%|█████████▋| 12059/12384 [25:35:21<41:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 1: 97%|█████████▋| 12059/12384 [25:35:29<41:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 97%|█████████▋| 12060/12384 [25:35:29<41:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 97%|█████████▋| 12060/12384 [25:35:36<41:18, 7.65s/it, loss=0.0004, acc=1.0000, iter_time=9.77s]
Epoch 1: 97%|█████████▋| 12061/12384 [25:35:36<41:06, 7.64s/it, loss=0.0004, acc=1.0000, iter_time=9.77s]
Epoch 1: 97%|█████████▋| 12061/12384 [25:35:44<41:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 97%|█████████▋| 12062/12384 [25:35:44<40:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 97%|█████████▋| 12062/12384 [25:35:52<40:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 1: 97%|█████████▋| 12063/12384 [25:35:52<40:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 1: 97%|█████████▋| 12063/12384 [25:35:59<40:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 1: 97%|█████████▋| 12064/12384 [25:35:59<40:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 1: 97%|█████████▋| 12064/12384 [25:36:07<40:38, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.19s]
Epoch 1: 97%|█████████▋| 12065/12384 [25:36:07<40:27, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.19s]
Epoch 1: 97%|█████████▋| 12065/12384 [25:36:14<40:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 97%|█████████▋| 12066/12384 [25:36:14<40:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 97%|█████████▋| 12066/12384 [25:36:22<40:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 1: 97%|█████████▋| 12067/12384 [25:36:22<40:38, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 1: 97%|█████████▋| 12067/12384 [25:36:30<40:38, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 1: 97%|█████████▋| 12068/12384 [25:36:30<40:20, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 1: 97%|█████████▋| 12068/12384 [25:36:38<40:20, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 1: 97%|█████████▋| 12069/12384 [25:36:38<40:17, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 1: 97%|█████████▋| 12069/12384 [25:36:45<40:17, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.01s]
Epoch 1: 97%|█████████▋| 12070/12384 [25:36:45<40:04, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.01s]
Epoch 1: 97%|█████████▋| 12070/12384 [25:36:53<40:04, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.61s]
Epoch 1: 97%|█████████▋| 12071/12384 [25:36:53<40:25, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=4.61s]
Epoch 1: 97%|█████████▋| 12071/12384 [25:37:01<40:25, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=11.37s]
Epoch 1: 97%|█████████▋| 12072/12384 [25:37:01<40:07, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=11.37s]
Epoch 1: 97%|█████████▋| 12072/12384 [25:37:08<40:07, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 97%|█████████▋| 12073/12384 [25:37:08<39:49, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 97%|█████████▋| 12073/12384 [25:37:16<39:49, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 97%|█████████▋| 12074/12384 [25:37:16<39:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 1: 97%|█████████▋| 12074/12384 [25:37:24<39:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 98%|█████████▊| 12075/12384 [25:37:24<39:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 1: 98%|█████████▊| 12075/12384 [25:37:31<39:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 98%|█████████▊| 12076/12384 [25:37:31<39:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 98%|█████████▊| 12076/12384 [25:37:39<39:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 98%|█████████▊| 12077/12384 [25:37:39<38:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 98%|█████████▊| 12077/12384 [25:37:46<38:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 1: 98%|█████████▊| 12078/12384 [25:37:46<38:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 1: 98%|█████████▊| 12078/12384 [25:37:54<38:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 1: 98%|█████████▊| 12079/12384 [25:37:54<38:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 1: 98%|█████████▊| 12079/12384 [25:38:02<38:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 98%|█████████▊| 12080/12384 [25:38:02<38:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 98%|█████████▊| 12080/12384 [25:38:09<38:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.85s]
Epoch 1: 98%|█████████▊| 12081/12384 [25:38:09<38:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=3.85s]
Epoch 1: 98%|█████████▊| 12081/12384 [25:38:17<38:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 1: 98%|█████████▊| 12082/12384 [25:38:17<38:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 1: 98%|█████████▊| 12082/12384 [25:38:24<38:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 98%|█████████▊| 12083/12384 [25:38:24<38:06, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 98%|█████████▊| 12083/12384 [25:38:32<38:06, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 1: 98%|█████████▊| 12084/12384 [25:38:32<38:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 1: 98%|█████████▊| 12084/12384 [25:38:40<38:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 98%|█████████▊| 12085/12384 [25:38:40<37:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 98%|█████████▊| 12085/12384 [25:38:47<37:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 1: 98%|█████████▊| 12086/12384 [25:38:47<37:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 1: 98%|█████████▊| 12086/12384 [25:38:55<37:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 98%|█████████▊| 12087/12384 [25:38:55<37:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 98%|█████████▊| 12087/12384 [25:39:02<37:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 98%|█████████▊| 12088/12384 [25:39:02<37:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 98%|█████████▊| 12088/12384 [25:39:10<37:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.61s]
Epoch 1: 98%|█████████▊| 12089/12384 [25:39:10<37:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.61s]
Epoch 1: 98%|█████████▊| 12089/12384 [25:39:18<37:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 1: 98%|█████████▊| 12090/12384 [25:39:18<37:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 1: 98%|█████████▊| 12090/12384 [25:39:25<37:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 98%|█████████▊| 12091/12384 [25:39:25<37:08, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 98%|█████████▊| 12091/12384 [25:39:33<37:08, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 98%|█████████▊| 12092/12384 [25:39:33<37:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 98%|█████████▊| 12092/12384 [25:39:41<37:01, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.91s]
Epoch 1: 98%|█████████▊| 12093/12384 [25:39:41<37:18, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.91s]
Epoch 1: 98%|█████████▊| 12093/12384 [25:39:48<37:18, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 98%|█████████▊| 12094/12384 [25:39:48<37:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 98%|█████████▊| 12094/12384 [25:39:56<37:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 98%|█████████▊| 12095/12384 [25:39:56<36:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 1: 98%|█████████▊| 12095/12384 [25:40:04<36:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 1: 98%|█████████▊| 12096/12384 [25:40:04<36:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 1: 98%|█████████▊| 12096/12384 [25:40:12<36:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.91s]
Epoch 1: 98%|█████████▊| 12097/12384 [25:40:12<36:56, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=4.91s]
Epoch 1: 98%|█████████▊| 12097/12384 [25:40:19<36:56, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.38s]
Epoch 1: 98%|█████████▊| 12098/12384 [25:40:19<36:40, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.38s]
Epoch 1: 98%|█████████▊| 12098/12384 [25:40:27<36:40, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 98%|█████████▊| 12099/12384 [25:40:27<36:24, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 98%|█████████▊| 12099/12384 [25:40:34<36:24, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 98%|█████████▊| 12100/12384 [25:40:34<36:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 1: 98%|█████████▊| 12100/12384 [25:40:42<36:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 98%|█████████▊| 12101/12384 [25:40:42<36:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 98%|█████████▊| 12101/12384 [25:40:50<36:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 1: 98%|█████████▊| 12102/12384 [25:40:50<35:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 1: 98%|█████████▊| 12102/12384 [25:40:57<35:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 98%|█████████▊| 12103/12384 [25:40:57<35:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 1: 98%|█████████▊| 12103/12384 [25:41:05<35:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 1: 98%|█████████▊| 12104/12384 [25:41:05<35:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 1: 98%|█████████▊| 12104/12384 [25:41:12<35:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.29s]
Epoch 1: 98%|█████████▊| 12105/12384 [25:41:12<35:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.29s]
Epoch 1: 98%|█████████▊| 12105/12384 [25:41:20<35:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.41s]
Epoch 1: 98%|█████████▊| 12106/12384 [25:41:20<35:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.41s]
Epoch 1: 98%|█████████▊| 12106/12384 [25:41:28<35:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 1: 98%|█████████▊| 12107/12384 [25:41:28<35:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 1: 98%|█████████▊| 12107/12384 [25:41:35<35:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 1: 98%|█████████▊| 12108/12384 [25:41:35<35:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 1: 98%|█████████▊| 12108/12384 [25:41:43<35:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 1: 98%|█████████▊| 12109/12384 [25:41:43<34:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 1: 98%|█████████▊| 12109/12384 [25:41:50<34:54, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 1: 98%|█████████▊| 12110/12384 [25:41:50<34:45, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 1: 98%|█████████▊| 12110/12384 [25:41:58<34:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 98%|█████████▊| 12111/12384 [25:41:58<34:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 98%|█████████▊| 12111/12384 [25:42:06<34:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 98%|█████████▊| 12112/12384 [25:42:06<34:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 98%|█████████▊| 12112/12384 [25:42:13<34:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 98%|█████████▊| 12113/12384 [25:42:13<34:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 98%|█████████▊| 12113/12384 [25:42:21<34:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 98%|█████████▊| 12114/12384 [25:42:21<34:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 1: 98%|█████████▊| 12114/12384 [25:42:29<34:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 98%|█████████▊| 12115/12384 [25:42:29<34:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 98%|█████████▊| 12115/12384 [25:42:36<34:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 98%|█████████▊| 12116/12384 [25:42:36<34:16, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 98%|█████████▊| 12116/12384 [25:42:44<34:16, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 1: 98%|█████████▊| 12117/12384 [25:42:44<34:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 1: 98%|█████████▊| 12117/12384 [25:42:52<34:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.00s]
Epoch 1: 98%|█████████▊| 12118/12384 [25:42:52<34:14, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.00s]
Epoch 1: 98%|█████████▊| 12118/12384 [25:42:59<34:14, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 98%|█████████▊| 12119/12384 [25:42:59<33:55, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 98%|█████████▊| 12119/12384 [25:43:07<33:55, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 98%|█████████▊| 12120/12384 [25:43:07<33:49, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 98%|█████████▊| 12120/12384 [25:43:15<33:49, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 1: 98%|█████████▊| 12121/12384 [25:43:15<33:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 1: 98%|█████████▊| 12121/12384 [25:43:22<33:35, 7.66s/it, loss=0.0003, acc=1.0000, iter_time=7.85s]
Epoch 1: 98%|█████████▊| 12122/12384 [25:43:22<33:22, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=7.85s]
Epoch 1: 98%|█████████▊| 12122/12384 [25:43:30<33:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 1: 98%|█████████▊| 12123/12384 [25:43:30<33:46, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 1: 98%|█████████▊| 12123/12384 [25:43:38<33:46, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=10.09s]
Epoch 1: 98%|█████████▊| 12124/12384 [25:43:38<33:25, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.09s]
Epoch 1: 98%|█████████▊| 12124/12384 [25:43:46<33:25, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=3.87s]
Epoch 1: 98%|█████████▊| 12125/12384 [25:43:46<33:09, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=3.87s]
Epoch 1: 98%|█████████▊| 12125/12384 [25:43:53<33:09, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=11.33s]
Epoch 1: 98%|█████████▊| 12126/12384 [25:43:53<32:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=11.33s]
Epoch 1: 98%|█████████▊| 12126/12384 [25:44:01<32:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 98%|█████████▊| 12127/12384 [25:44:01<32:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 98%|█████████▊| 12127/12384 [25:44:08<32:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 98%|█████████▊| 12128/12384 [25:44:08<32:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 98%|█████████▊| 12128/12384 [25:44:16<32:32, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 1: 98%|█████████▊| 12129/12384 [25:44:16<32:26, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 1: 98%|█████████▊| 12129/12384 [25:44:24<32:26, 7.63s/it, loss=0.0003, acc=0.9984, iter_time=7.66s]
Epoch 1: 98%|█████████▊| 12130/12384 [25:44:24<32:16, 7.63s/it, loss=0.0003, acc=0.9984, iter_time=7.66s]
Epoch 1: 98%|█████████▊| 12130/12384 [25:44:31<32:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 1: 98%|█████████▊| 12131/12384 [25:44:31<32:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 1: 98%|█████████▊| 12131/12384 [25:44:39<32:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 1: 98%|█████████▊| 12132/12384 [25:44:39<32:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 1: 98%|█████████▊| 12132/12384 [25:44:47<32:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.69s]
Epoch 1: 98%|█████████▊| 12133/12384 [25:44:47<31:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.69s]
Epoch 1: 98%|█████████▊| 12133/12384 [25:44:54<31:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 1: 98%|█████████▊| 12134/12384 [25:44:54<31:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 1: 98%|█████████▊| 12134/12384 [25:45:02<31:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 98%|█████████▊| 12135/12384 [25:45:02<31:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 1: 98%|█████████▊| 12135/12384 [25:45:09<31:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 98%|█████████▊| 12136/12384 [25:45:09<31:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 98%|█████████▊| 12136/12384 [25:45:17<31:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 98%|█████████▊| 12137/12384 [25:45:17<31:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 98%|█████████▊| 12137/12384 [25:45:25<31:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 98%|█████████▊| 12138/12384 [25:45:25<31:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 98%|█████████▊| 12138/12384 [25:45:32<31:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 1: 98%|█████████▊| 12139/12384 [25:45:32<31:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 1: 98%|█████████▊| 12139/12384 [25:45:40<31:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.70s]
Epoch 1: 98%|█████████▊| 12140/12384 [25:45:40<30:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.70s]
Epoch 1: 98%|█████████▊| 12140/12384 [25:45:48<30:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.03s]
Epoch 1: 98%|█████████▊| 12141/12384 [25:45:48<30:58, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.03s]
Epoch 1: 98%|█████████▊| 12141/12384 [25:45:55<30:58, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 1: 98%|█████████▊| 12142/12384 [25:45:55<30:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 1: 98%|█████████▊| 12142/12384 [25:46:03<30:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 1: 98%|█████████▊| 12143/12384 [25:46:03<30:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 1: 98%|█████████▊| 12143/12384 [25:46:11<30:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.21s]
Epoch 1: 98%|█████████▊| 12144/12384 [25:46:11<30:50, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.21s]
Epoch 1: 98%|█████████▊| 12144/12384 [25:46:18<30:50, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.40s]
Epoch 1: 98%|█████████▊| 12145/12384 [25:46:18<30:35, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.40s]
Epoch 1: 98%|█████████▊| 12145/12384 [25:46:26<30:35, 7.68s/it, loss=0.0001, acc=0.9997, iter_time=5.13s]
Epoch 1: 98%|█████████▊| 12146/12384 [25:46:26<30:23, 7.66s/it, loss=0.0001, acc=0.9997, iter_time=5.13s]
Epoch 1: 98%|█████████▊| 12146/12384 [25:46:34<30:23, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=11.91s]
Epoch 1: 98%|█████████▊| 12147/12384 [25:46:34<30:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.91s]
Epoch 1: 98%|█████████▊| 12147/12384 [25:46:41<30:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 98%|█████████▊| 12148/12384 [25:46:41<30:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 98%|█████████▊| 12148/12384 [25:46:49<30:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.55s]
Epoch 1: 98%|█████████▊| 12149/12384 [25:46:49<30:17, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.55s]
Epoch 1: 98%|█████████▊| 12149/12384 [25:46:57<30:17, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=9.02s]
Epoch 1: 98%|█████████▊| 12150/12384 [25:46:57<30:04, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.02s]
Epoch 1: 98%|█████████▊| 12150/12384 [25:47:04<30:04, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 98%|█████████▊| 12151/12384 [25:47:04<29:49, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 98%|█████████▊| 12151/12384 [25:47:12<29:49, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 98%|█████████▊| 12152/12384 [25:47:12<29:37, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 98%|█████████▊| 12152/12384 [25:47:20<29:37, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 98%|█████████▊| 12153/12384 [25:47:20<29:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 98%|█████████▊| 12153/12384 [25:47:27<29:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 98%|█████████▊| 12154/12384 [25:47:27<29:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 98%|█████████▊| 12154/12384 [25:47:35<29:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 98%|█████████▊| 12155/12384 [25:47:35<29:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 98%|█████████▊| 12155/12384 [25:47:42<29:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 98%|█████████▊| 12156/12384 [25:47:42<28:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 98%|█████████▊| 12156/12384 [25:47:50<28:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 98%|█████████▊| 12157/12384 [25:47:50<28:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 98%|█████████▊| 12157/12384 [25:47:58<28:51, 7.63s/it, loss=0.0001, acc=0.9999, iter_time=6.76s]
Epoch 1: 98%|█████████▊| 12158/12384 [25:47:58<28:42, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=6.76s]
Epoch 1: 98%|█████████▊| 12158/12384 [25:48:05<28:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 1: 98%|█████████▊| 12159/12384 [25:48:05<28:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 1: 98%|█████████▊| 12159/12384 [25:48:13<28:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 98%|█████████▊| 12160/12384 [25:48:13<28:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 98%|█████████▊| 12160/12384 [25:48:20<28:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 1: 98%|█████████▊| 12161/12384 [25:48:20<28:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 1: 98%|█████████▊| 12161/12384 [25:48:28<28:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 98%|█████████▊| 12162/12384 [25:48:28<28:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 98%|█████████▊| 12162/12384 [25:48:36<28:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 98%|█████████▊| 12163/12384 [25:48:36<28:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 98%|█████████▊| 12163/12384 [25:48:44<28:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 98%|█████████▊| 12164/12384 [25:48:44<28:06, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 1: 98%|█████████▊| 12164/12384 [25:48:51<28:06, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 98%|█████████▊| 12165/12384 [25:48:51<27:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 98%|█████████▊| 12165/12384 [25:48:59<27:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 98%|█████████▊| 12166/12384 [25:48:59<27:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 98%|█████████▊| 12166/12384 [25:49:06<27:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 98%|█████████▊| 12167/12384 [25:49:06<27:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 98%|█████████▊| 12167/12384 [25:49:14<27:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 98%|█████████▊| 12168/12384 [25:49:14<27:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 98%|█████████▊| 12168/12384 [25:49:22<27:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 98%|█████████▊| 12169/12384 [25:49:22<27:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 98%|█████████▊| 12169/12384 [25:49:29<27:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 1: 98%|█████████▊| 12170/12384 [25:49:29<27:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 1: 98%|█████████▊| 12170/12384 [25:49:37<27:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 98%|█████████▊| 12171/12384 [25:49:37<27:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 1: 98%|█████████▊| 12171/12384 [25:49:45<27:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.19s]
Epoch 1: 98%|█████████▊| 12172/12384 [25:49:45<26:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.19s]
Epoch 1: 98%|█████████▊| 12172/12384 [25:49:52<26:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 1: 98%|█████████▊| 12173/12384 [25:49:52<26:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 1: 98%|█████████▊| 12173/12384 [25:50:00<26:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 98%|█████████▊| 12174/12384 [25:50:00<26:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 98%|█████████▊| 12174/12384 [25:50:07<26:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 1: 98%|█████████▊| 12175/12384 [25:50:07<26:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 1: 98%|█████████▊| 12175/12384 [25:50:15<26:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 1: 98%|█████████▊| 12176/12384 [25:50:15<26:46, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 1: 98%|█████████▊| 12176/12384 [25:50:23<26:46, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 1: 98%|█████████▊| 12177/12384 [25:50:23<26:32, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 1: 98%|█████████▊| 12177/12384 [25:50:31<26:32, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 1: 98%|█████████▊| 12178/12384 [25:50:31<26:20, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 1: 98%|█████████▊| 12178/12384 [25:50:38<26:20, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 1: 98%|█████████▊| 12179/12384 [25:50:38<26:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 1: 98%|█████████▊| 12179/12384 [25:50:46<26:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 1: 98%|█████████▊| 12180/12384 [25:50:46<25:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 1: 98%|█████████▊| 12180/12384 [25:50:53<25:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.11s]
Epoch 1: 98%|█████████▊| 12181/12384 [25:50:53<25:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.11s]
Epoch 1: 98%|█████████▊| 12181/12384 [25:51:01<25:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 98%|█████████▊| 12182/12384 [25:51:01<25:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 98%|█████████▊| 12182/12384 [25:51:09<25:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 1: 98%|█████████▊| 12183/12384 [25:51:09<25:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 1: 98%|█████████▊| 12183/12384 [25:51:16<25:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.49s]
Epoch 1: 98%|█████████▊| 12184/12384 [25:51:16<25:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.49s]
Epoch 1: 98%|█████████▊| 12184/12384 [25:51:24<25:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.21s]
Epoch 1: 98%|█████████▊| 12185/12384 [25:51:24<25:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.21s]
Epoch 1: 98%|█████████▊| 12185/12384 [25:51:31<25:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.63s]
Epoch 1: 98%|█████████▊| 12186/12384 [25:51:31<25:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.63s]
Epoch 1: 98%|█████████▊| 12186/12384 [25:51:39<25:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 98%|█████████▊| 12187/12384 [25:51:39<25:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 98%|█████████▊| 12187/12384 [25:51:47<25:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 98%|█████████▊| 12188/12384 [25:51:47<24:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 98%|█████████▊| 12188/12384 [25:51:54<24:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 98%|█████████▊| 12189/12384 [25:51:54<24:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 98%|█████████▊| 12189/12384 [25:52:02<24:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 98%|█████████▊| 12190/12384 [25:52:02<24:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 1: 98%|█████████▊| 12190/12384 [25:52:10<24:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 1: 98%|█████████▊| 12191/12384 [25:52:10<24:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 1: 98%|█████████▊| 12191/12384 [25:52:17<24:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 1: 98%|█████████▊| 12192/12384 [25:52:17<24:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 1: 98%|█████████▊| 12192/12384 [25:52:25<24:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 98%|█████████▊| 12193/12384 [25:52:25<24:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 98%|█████████▊| 12193/12384 [25:52:32<24:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 98%|█████████▊| 12194/12384 [25:52:32<24:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 1: 98%|█████████▊| 12194/12384 [25:52:40<24:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 1: 98%|█████████▊| 12195/12384 [25:52:40<23:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 1: 98%|█████████▊| 12195/12384 [25:52:48<23:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 98%|█████████▊| 12196/12384 [25:52:48<24:06, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 1: 98%|█████████▊| 12196/12384 [25:52:56<24:06, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=3.85s]
Epoch 1: 98%|█████████▊| 12197/12384 [25:52:56<23:54, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=3.85s]
Epoch 1: 98%|█████████▊| 12197/12384 [25:53:03<23:54, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=11.35s]
Epoch 1: 98%|█████████▊| 12198/12384 [25:53:03<23:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.35s]
Epoch 1: 98%|█████████▊| 12198/12384 [25:53:11<23:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 99%|█████████▊| 12199/12384 [25:53:11<23:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 99%|█████████▊| 12199/12384 [25:53:18<23:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 99%|█████████▊| 12200/12384 [25:53:18<23:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 99%|█████████▊| 12200/12384 [25:53:26<23:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 99%|█████████▊| 12201/12384 [25:53:26<23:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 99%|█████████▊| 12201/12384 [25:53:34<23:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 99%|█████████▊| 12202/12384 [25:53:34<23:24, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 99%|█████████▊| 12202/12384 [25:53:42<23:24, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 1: 99%|█████████▊| 12203/12384 [25:53:42<23:12, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 1: 99%|█████████▊| 12203/12384 [25:53:49<23:12, 7.70s/it, loss=0.0001, acc=0.9999, iter_time=9.10s]
Epoch 1: 99%|█████████▊| 12204/12384 [25:53:49<23:00, 7.67s/it, loss=0.0001, acc=0.9999, iter_time=9.10s]
Epoch 1: 99%|█████████▊| 12204/12384 [25:53:57<23:00, 7.67s/it, loss=0.0002, acc=0.9995, iter_time=7.62s]
Epoch 1: 99%|█████████▊| 12205/12384 [25:53:57<22:56, 7.69s/it, loss=0.0002, acc=0.9995, iter_time=7.62s]
Epoch 1: 99%|█████████▊| 12205/12384 [25:54:05<22:56, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 1: 99%|█████████▊| 12206/12384 [25:54:05<22:45, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 1: 99%|█████████▊| 12206/12384 [25:54:12<22:45, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 99%|█████████▊| 12207/12384 [25:54:12<22:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 99%|█████████▊| 12207/12384 [25:54:20<22:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 99%|█████████▊| 12208/12384 [25:54:20<22:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 99%|█████████▊| 12208/12384 [25:54:27<22:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 99%|█████████▊| 12209/12384 [25:54:27<22:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 99%|█████████▊| 12209/12384 [25:54:35<22:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 99%|█████████▊| 12210/12384 [25:54:35<22:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 99%|█████████▊| 12210/12384 [25:54:43<22:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 99%|█████████▊| 12211/12384 [25:54:43<21:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 99%|█████████▊| 12211/12384 [25:54:50<21:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 99%|█████████▊| 12212/12384 [25:54:50<21:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 99%|█████████▊| 12212/12384 [25:54:58<21:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 99%|█████████▊| 12213/12384 [25:54:58<21:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 99%|█████████▊| 12213/12384 [25:55:05<21:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 1: 99%|█████████▊| 12214/12384 [25:55:05<21:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 1: 99%|█████████▊| 12214/12384 [25:55:13<21:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 1: 99%|█████████▊| 12215/12384 [25:55:13<21:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 1: 99%|█████████▊| 12215/12384 [25:55:21<21:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 99%|█████████▊| 12216/12384 [25:55:21<21:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 1: 99%|█████████▊| 12216/12384 [25:55:28<21:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.49s]
Epoch 1: 99%|█████████▊| 12217/12384 [25:55:28<21:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.49s]
Epoch 1: 99%|█████████▊| 12217/12384 [25:55:36<21:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.33s]
Epoch 1: 99%|█████████▊| 12218/12384 [25:55:36<21:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.33s]
Epoch 1: 99%|█████████▊| 12218/12384 [25:55:43<21:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 99%|█████████▊| 12219/12384 [25:55:43<20:54, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 99%|█████████▊| 12219/12384 [25:55:51<20:54, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 99%|█████████▊| 12220/12384 [25:55:51<20:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 99%|█████████▊| 12220/12384 [25:55:59<20:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 1: 99%|█████████▊| 12221/12384 [25:55:59<20:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 1: 99%|█████████▊| 12221/12384 [25:56:06<20:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 99%|█████████▊| 12222/12384 [25:56:06<20:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 1: 99%|█████████▊| 12222/12384 [25:56:14<20:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.60s]
Epoch 1: 99%|█████████▊| 12223/12384 [25:56:14<20:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.60s]
Epoch 1: 99%|█████████▊| 12223/12384 [25:56:21<20:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 99%|█████████▊| 12224/12384 [25:56:21<20:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 99%|█████████▊| 12224/12384 [25:56:29<20:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 99%|█████████▊| 12225/12384 [25:56:29<20:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 1: 99%|█████████▊| 12225/12384 [25:56:37<20:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 99%|█████████▊| 12226/12384 [25:56:37<20:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 99%|█████████▊| 12226/12384 [25:56:44<20:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 1: 99%|█████████▊| 12227/12384 [25:56:44<19:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 1: 99%|█████████▊| 12227/12384 [25:56:52<19:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 99%|█████████▊| 12228/12384 [25:56:52<19:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 99%|█████████▊| 12228/12384 [25:57:00<19:46, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=9.36s]
Epoch 1: 99%|█████████▊| 12229/12384 [25:57:00<19:54, 7.71s/it, loss=0.0002, acc=1.0000, iter_time=9.36s]
Epoch 1: 99%|█████████▊| 12229/12384 [25:57:08<19:54, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=5.38s]
Epoch 1: 99%|█████████▉| 12230/12384 [25:57:08<19:42, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=5.38s]
Epoch 1: 99%|█████████▉| 12230/12384 [25:57:15<19:42, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 1: 99%|█████████▉| 12231/12384 [25:57:15<19:33, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 1: 99%|█████████▉| 12231/12384 [25:57:23<19:33, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 99%|█████████▉| 12232/12384 [25:57:23<19:25, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 1: 99%|█████████▉| 12232/12384 [25:57:30<19:25, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 99%|█████████▉| 12233/12384 [25:57:30<19:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 1: 99%|█████████▉| 12233/12384 [25:57:38<19:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 99%|█████████▉| 12234/12384 [25:57:38<19:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 99%|█████████▉| 12234/12384 [25:57:46<19:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 1: 99%|█████████▉| 12235/12384 [25:57:46<18:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 1: 99%|█████████▉| 12235/12384 [25:57:53<18:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 1: 99%|█████████▉| 12236/12384 [25:57:53<18:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 1: 99%|█████████▉| 12236/12384 [25:58:01<18:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 1: 99%|█████████▉| 12237/12384 [25:58:01<18:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 1: 99%|█████████▉| 12237/12384 [25:58:08<18:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.12s]
Epoch 1: 99%|█████████▉| 12238/12384 [25:58:08<18:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.12s]
Epoch 1: 99%|█████████▉| 12238/12384 [25:58:16<18:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 99%|█████████▉| 12239/12384 [25:58:16<18:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 99%|█████████▉| 12239/12384 [25:58:24<18:22, 7.60s/it, loss=0.0002, acc=1.0000, iter_time=7.54s]
Epoch 1: 99%|█████████▉| 12240/12384 [25:58:24<18:14, 7.60s/it, loss=0.0002, acc=1.0000, iter_time=7.54s]
Epoch 1: 99%|█████████▉| 12240/12384 [25:58:31<18:14, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 1: 99%|█████████▉| 12241/12384 [25:58:31<18:07, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 1: 99%|█████████▉| 12241/12384 [25:58:39<18:07, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 1: 99%|█████████▉| 12242/12384 [25:58:39<17:59, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 1: 99%|█████████▉| 12242/12384 [25:58:46<17:59, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 99%|█████████▉| 12243/12384 [25:58:46<17:52, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 99%|█████████▉| 12243/12384 [25:58:54<17:52, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 99%|█████████▉| 12244/12384 [25:58:54<17:44, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 99%|█████████▉| 12244/12384 [25:59:00<17:44, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.21s]
Epoch 1: 99%|█████████▉| 12245/12384 [25:59:00<16:27, 7.10s/it, loss=0.0000, acc=1.0000, iter_time=5.21s]
Epoch 1: 99%|█████████▉| 12245/12384 [25:59:08<16:27, 7.10s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 1: 99%|█████████▉| 12246/12384 [25:59:08<16:40, 7.25s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 1: 99%|█████████▉| 12246/12384 [25:59:15<16:40, 7.25s/it, loss=0.0000, acc=1.0000, iter_time=4.24s]
Epoch 1: 99%|█████████▉| 12247/12384 [25:59:15<16:47, 7.35s/it, loss=0.0000, acc=1.0000, iter_time=4.24s]
Epoch 1: 99%|█████████▉| 12247/12384 [25:59:23<16:47, 7.35s/it, loss=0.0000, acc=1.0000, iter_time=11.34s]
Epoch 1: 99%|█████████▉| 12248/12384 [25:59:23<16:50, 7.43s/it, loss=0.0000, acc=1.0000, iter_time=11.34s]
Epoch 1: 99%|█████████▉| 12248/12384 [25:59:31<16:50, 7.43s/it, loss=0.0000, acc=1.0000, iter_time=7.49s]
Epoch 1: 99%|█████████▉| 12249/12384 [25:59:31<17:00, 7.56s/it, loss=0.0000, acc=1.0000, iter_time=7.49s]
Epoch 1: 99%|█████████▉| 12249/12384 [25:59:38<17:00, 7.56s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 99%|█████████▉| 12250/12384 [25:59:38<16:55, 7.58s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 99%|█████████▉| 12250/12384 [25:59:46<16:55, 7.58s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 99%|█████████▉| 12251/12384 [25:59:46<16:50, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 99%|█████████▉| 12251/12384 [25:59:54<16:50, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 99%|█████████▉| 12252/12384 [25:59:54<16:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 99%|█████████▉| 12252/12384 [26:00:01<16:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 99%|█████████▉| 12253/12384 [26:00:01<16:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 99%|█████████▉| 12253/12384 [26:00:09<16:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 99%|█████████▉| 12254/12384 [26:00:09<16:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 1: 99%|█████████▉| 12254/12384 [26:00:17<16:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 99%|█████████▉| 12255/12384 [26:00:17<16:34, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 99%|█████████▉| 12255/12384 [26:00:24<16:34, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 1: 99%|█████████▉| 12256/12384 [26:00:24<16:24, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 1: 99%|█████████▉| 12256/12384 [26:00:32<16:24, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=3.65s]
Epoch 1: 99%|█████████▉| 12257/12384 [26:00:32<16:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=3.65s]
Epoch 1: 99%|█████████▉| 12257/12384 [26:00:40<16:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 1: 99%|█████████▉| 12258/12384 [26:00:40<16:06, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 1: 99%|█████████▉| 12258/12384 [26:00:47<16:06, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.74s]
Epoch 1: 99%|█████████▉| 12259/12384 [26:00:47<15:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.74s]
Epoch 1: 99%|█████████▉| 12259/12384 [26:00:55<15:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 99%|█████████▉| 12260/12384 [26:00:55<15:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 99%|█████████▉| 12260/12384 [26:01:03<15:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.48s]
Epoch 1: 99%|█████████▉| 12261/12384 [26:01:03<15:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.48s]
Epoch 1: 99%|█████████▉| 12261/12384 [26:01:10<15:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 99%|█████████▉| 12262/12384 [26:01:10<15:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 99%|█████████▉| 12262/12384 [26:01:18<15:29, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 1: 99%|█████████▉| 12263/12384 [26:01:18<15:21, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 1: 99%|█████████▉| 12263/12384 [26:01:25<15:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 1: 99%|█████████▉| 12264/12384 [26:01:25<15:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 1: 99%|█████████▉| 12264/12384 [26:01:33<15:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.45s]
Epoch 1: 99%|█████████▉| 12265/12384 [26:01:33<15:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.45s]
Epoch 1: 99%|█████████▉| 12265/12384 [26:01:41<15:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 99%|█████████▉| 12266/12384 [26:01:41<14:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 1: 99%|█████████▉| 12266/12384 [26:01:48<14:58, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.29s]
Epoch 1: 99%|█████████▉| 12267/12384 [26:01:48<14:49, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.29s]
Epoch 1: 99%|█████████▉| 12267/12384 [26:01:56<14:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 99%|█████████▉| 12268/12384 [26:01:56<14:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 99%|█████████▉| 12268/12384 [26:02:03<14:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 1: 99%|█████████▉| 12269/12384 [26:02:03<14:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 1: 99%|█████████▉| 12269/12384 [26:02:11<14:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 99%|█████████▉| 12270/12384 [26:02:11<14:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 99%|█████████▉| 12270/12384 [26:02:19<14:28, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.14s]
Epoch 1: 99%|█████████▉| 12271/12384 [26:02:19<14:21, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.14s]
Epoch 1: 99%|█████████▉| 12271/12384 [26:02:26<14:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.51s]
Epoch 1: 99%|█████████▉| 12272/12384 [26:02:26<14:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.51s]
Epoch 1: 99%|█████████▉| 12272/12384 [26:02:34<14:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 99%|█████████▉| 12273/12384 [26:02:34<14:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 99%|█████████▉| 12273/12384 [26:02:42<14:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 1: 99%|█████████▉| 12274/12384 [26:02:42<13:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 1: 99%|█████████▉| 12274/12384 [26:02:49<13:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 1: 99%|█████████▉| 12275/12384 [26:02:49<13:59, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 1: 99%|█████████▉| 12275/12384 [26:02:57<13:59, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 1: 99%|█████████▉| 12276/12384 [26:02:57<13:49, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 1: 99%|█████████▉| 12276/12384 [26:03:05<13:49, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.86s]
Epoch 1: 99%|█████████▉| 12277/12384 [26:03:05<13:39, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.86s]
Epoch 1: 99%|█████████▉| 12277/12384 [26:03:12<13:39, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 99%|█████████▉| 12278/12384 [26:03:12<13:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 1: 99%|█████████▉| 12278/12384 [26:03:20<13:30, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=5.83s]
Epoch 1: 99%|█████████▉| 12279/12384 [26:03:20<13:22, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=5.83s]
Epoch 1: 99%|█████████▉| 12279/12384 [26:03:28<13:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.77s]
Epoch 1: 99%|█████████▉| 12280/12384 [26:03:28<13:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.77s]
Epoch 1: 99%|█████████▉| 12280/12384 [26:03:35<13:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.50s]
Epoch 1: 99%|█████████▉| 12281/12384 [26:03:35<13:15, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.50s]
Epoch 1: 99%|█████████▉| 12281/12384 [26:03:43<13:15, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 1: 99%|█████████▉| 12282/12384 [26:03:43<13:04, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 1: 99%|█████████▉| 12282/12384 [26:03:51<13:04, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 99%|█████████▉| 12283/12384 [26:03:51<12:53, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 99%|█████████▉| 12283/12384 [26:03:58<12:53, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 99%|█████████▉| 12284/12384 [26:03:58<12:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 99%|█████████▉| 12284/12384 [26:04:06<12:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 99%|█████████▉| 12285/12384 [26:04:06<12:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 99%|█████████▉| 12285/12384 [26:04:13<12:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 1: 99%|█████████▉| 12286/12384 [26:04:13<12:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 1: 99%|█████████▉| 12286/12384 [26:04:21<12:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 1: 99%|█████████▉| 12287/12384 [26:04:21<12:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 1: 99%|█████████▉| 12287/12384 [26:04:29<12:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 1: 99%|█████████▉| 12288/12384 [26:04:29<12:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 1: 99%|█████████▉| 12288/12384 [26:04:36<12:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.35s]
Epoch 1: 99%|█████████▉| 12289/12384 [26:04:36<12:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.35s]
Epoch 1: 99%|█████████▉| 12289/12384 [26:04:44<12:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.44s]
Epoch 1: 99%|█████████▉| 12290/12384 [26:04:44<11:54, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.44s]
Epoch 1: 99%|█████████▉| 12290/12384 [26:04:51<11:54, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 99%|█████████▉| 12291/12384 [26:04:51<11:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 99%|█████████▉| 12291/12384 [26:04:59<11:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 99%|█████████▉| 12292/12384 [26:04:59<11:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 99%|█████████▉| 12292/12384 [26:05:07<11:39, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=3.38s]
Epoch 1: 99%|█████████▉| 12293/12384 [26:05:07<11:32, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=3.38s]
Epoch 1: 99%|█████████▉| 12293/12384 [26:05:14<11:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.83s]
Epoch 1: 99%|█████████▉| 12294/12384 [26:05:14<11:24, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.83s]
Epoch 1: 99%|█████████▉| 12294/12384 [26:05:22<11:24, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 99%|█████████▉| 12295/12384 [26:05:22<11:16, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 99%|█████████▉| 12295/12384 [26:05:29<11:16, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 99%|█████████▉| 12296/12384 [26:05:29<11:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 1: 99%|█████████▉| 12296/12384 [26:05:37<11:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 1: 99%|█████████▉| 12297/12384 [26:05:37<11:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 1: 99%|█████████▉| 12297/12384 [26:05:45<11:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.62s]
Epoch 1: 99%|█████████▉| 12298/12384 [26:05:45<10:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.62s]
Epoch 1: 99%|█████████▉| 12298/12384 [26:05:52<10:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 99%|█████████▉| 12299/12384 [26:05:52<10:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 1: 99%|█████████▉| 12299/12384 [26:06:00<10:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 1: 99%|█████████▉| 12300/12384 [26:06:00<10:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 1: 99%|█████████▉| 12300/12384 [26:06:08<10:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.61s]
Epoch 1: 99%|█████████▉| 12301/12384 [26:06:08<10:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.61s]
Epoch 1: 99%|█████████▉| 12301/12384 [26:06:15<10:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 99%|█████████▉| 12302/12384 [26:06:15<10:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 1: 99%|█████████▉| 12302/12384 [26:06:23<10:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 1: 99%|█████████▉| 12303/12384 [26:06:23<10:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 1: 99%|█████████▉| 12303/12384 [26:06:30<10:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 99%|█████████▉| 12304/12384 [26:06:30<10:08, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 1: 99%|█████████▉| 12304/12384 [26:06:38<10:08, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 99%|█████████▉| 12305/12384 [26:06:38<10:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 1: 99%|█████████▉| 12305/12384 [26:06:46<10:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 99%|█████████▉| 12306/12384 [26:06:46<09:52, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 99%|█████████▉| 12306/12384 [26:06:54<09:52, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.46s]
Epoch 1: 99%|█████████▉| 12307/12384 [26:06:54<09:52, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.46s]
Epoch 1: 99%|█████████▉| 12307/12384 [26:07:01<09:52, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.01s]
Epoch 1: 99%|█████████▉| 12308/12384 [26:07:01<09:43, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.01s]
Epoch 1: 99%|█████████▉| 12308/12384 [26:07:09<09:43, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.67s]
Epoch 1: 99%|█████████▉| 12309/12384 [26:07:09<09:34, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.67s]
Epoch 1: 99%|█████████▉| 12309/12384 [26:07:16<09:34, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 99%|█████████▉| 12310/12384 [26:07:16<09:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 99%|█████████▉| 12310/12384 [26:07:24<09:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 99%|█████████▉| 12311/12384 [26:07:24<09:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 1: 99%|█████████▉| 12311/12384 [26:07:32<09:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 1: 99%|█████████▉| 12312/12384 [26:07:32<09:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 1: 99%|█████████▉| 12312/12384 [26:07:39<09:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 99%|█████████▉| 12313/12384 [26:07:39<09:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 1: 99%|█████████▉| 12313/12384 [26:07:47<09:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.33s]
Epoch 1: 99%|█████████▉| 12314/12384 [26:07:47<08:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.33s]
Epoch 1: 99%|█████████▉| 12314/12384 [26:07:54<08:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.90s]
Epoch 1: 99%|█████████▉| 12315/12384 [26:07:54<08:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.90s]
Epoch 1: 99%|█████████▉| 12315/12384 [26:08:02<08:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 99%|█████████▉| 12316/12384 [26:08:02<08:36, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 99%|█████████▉| 12316/12384 [26:08:10<08:36, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 99%|█████████▉| 12317/12384 [26:08:10<08:29, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 1: 99%|█████████▉| 12317/12384 [26:08:17<08:29, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.49s]
Epoch 1: 99%|█████████▉| 12318/12384 [26:08:17<08:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.49s]
Epoch 1: 99%|█████████▉| 12318/12384 [26:08:25<08:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.74s]
Epoch 1: 99%|█████████▉| 12319/12384 [26:08:25<08:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.74s]
Epoch 1: 99%|█████████▉| 12319/12384 [26:08:32<08:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 99%|█████████▉| 12320/12384 [26:08:32<08:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 1: 99%|█████████▉| 12320/12384 [26:08:40<08:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 99%|█████████▉| 12321/12384 [26:08:40<07:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 1: 99%|█████████▉| 12321/12384 [26:08:48<07:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 99%|█████████▉| 12322/12384 [26:08:48<07:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 99%|█████████▉| 12322/12384 [26:08:55<07:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 1: 100%|█████████▉| 12323/12384 [26:08:55<07:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 1: 100%|█████████▉| 12323/12384 [26:09:03<07:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 1: 100%|█████████▉| 12324/12384 [26:09:03<07:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 1: 100%|█████████▉| 12324/12384 [26:09:11<07:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 100%|█████████▉| 12325/12384 [26:09:11<07:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 1: 100%|█████████▉| 12325/12384 [26:09:18<07:29, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 1: 100%|█████████▉| 12326/12384 [26:09:18<07:21, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 1: 100%|█████████▉| 12326/12384 [26:09:26<07:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 100%|█████████▉| 12327/12384 [26:09:26<07:18, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 100%|█████████▉| 12327/12384 [26:09:34<07:18, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 100%|█████████▉| 12328/12384 [26:09:34<07:09, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 1: 100%|█████████▉| 12328/12384 [26:09:41<07:09, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 100%|█████████▉| 12329/12384 [26:09:41<07:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 1: 100%|█████████▉| 12329/12384 [26:09:49<07:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 1: 100%|█████████▉| 12330/12384 [26:09:49<06:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 1: 100%|█████████▉| 12330/12384 [26:09:56<06:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.57s]
Epoch 1: 100%|█████████▉| 12331/12384 [26:09:56<06:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.57s]
Epoch 1: 100%|█████████▉| 12331/12384 [26:10:04<06:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 100%|█████████▉| 12332/12384 [26:10:04<06:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 1: 100%|█████████▉| 12332/12384 [26:10:12<06:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 1: 100%|█████████▉| 12333/12384 [26:10:12<06:33, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 1: 100%|█████████▉| 12333/12384 [26:10:20<06:33, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 1: 100%|█████████▉| 12334/12384 [26:10:20<06:24, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 1: 100%|█████████▉| 12334/12384 [26:10:27<06:24, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 1: 100%|█████████▉| 12335/12384 [26:10:27<06:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 1: 100%|█████████▉| 12335/12384 [26:10:35<06:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 100%|█████████▉| 12336/12384 [26:10:35<06:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 1: 100%|█████████▉| 12336/12384 [26:10:42<06:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.14s]
Epoch 1: 100%|█████████▉| 12337/12384 [26:10:42<05:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.14s]
Epoch 1: 100%|█████████▉| 12337/12384 [26:10:50<05:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 1: 100%|█████████▉| 12338/12384 [26:10:50<05:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 1: 100%|█████████▉| 12338/12384 [26:10:58<05:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 1: 100%|█████████▉| 12339/12384 [26:10:58<05:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 1: 100%|█████████▉| 12339/12384 [26:11:05<05:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 100%|█████████▉| 12340/12384 [26:11:05<05:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 1: 100%|█████████▉| 12340/12384 [26:11:13<05:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 1: 100%|█████████▉| 12341/12384 [26:11:13<05:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 1: 100%|█████████▉| 12341/12384 [26:11:20<05:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 100%|█████████▉| 12342/12384 [26:11:20<05:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 1: 100%|█████████▉| 12342/12384 [26:11:28<05:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 100%|█████████▉| 12343/12384 [26:11:28<05:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 1: 100%|█████████▉| 12343/12384 [26:11:36<05:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 100%|█████████▉| 12344/12384 [26:11:36<05:04, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 1: 100%|█████████▉| 12344/12384 [26:11:43<05:04, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 100%|█████████▉| 12345/12384 [26:11:43<04:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 1: 100%|█████████▉| 12345/12384 [26:11:51<04:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 100%|█████████▉| 12346/12384 [26:11:51<04:48, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 100%|█████████▉| 12346/12384 [26:11:58<04:48, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 1: 100%|█████████▉| 12347/12384 [26:11:58<04:41, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 1: 100%|█████████▉| 12347/12384 [26:12:06<04:41, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.39s]
Epoch 1: 100%|█████████▉| 12348/12384 [26:12:06<04:33, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.39s]
Epoch 1: 100%|█████████▉| 12348/12384 [26:12:14<04:33, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 1: 100%|█████████▉| 12349/12384 [26:12:14<04:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 1: 100%|█████████▉| 12349/12384 [26:12:21<04:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 1: 100%|█████████▉| 12350/12384 [26:12:21<04:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 1: 100%|█████████▉| 12350/12384 [26:12:29<04:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.89s]
Epoch 1: 100%|█████████▉| 12351/12384 [26:12:29<04:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.89s]
Epoch 1: 100%|█████████▉| 12351/12384 [26:12:37<04:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 1: 100%|█████████▉| 12352/12384 [26:12:37<04:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 1: 100%|█████████▉| 12352/12384 [26:12:44<04:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.96s]
Epoch 1: 100%|█████████▉| 12353/12384 [26:12:44<03:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.96s]
Epoch 1: 100%|█████████▉| 12353/12384 [26:12:52<03:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 1: 100%|█████████▉| 12354/12384 [26:12:52<03:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 1: 100%|█████████▉| 12354/12384 [26:12:59<03:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.89s]
Epoch 1: 100%|█████████▉| 12355/12384 [26:12:59<03:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.89s]
Epoch 1: 100%|█████████▉| 12355/12384 [26:13:07<03:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.94s]
Epoch 1: 100%|█████████▉| 12356/12384 [26:13:07<03:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.94s]
Epoch 1: 100%|█████████▉| 12356/12384 [26:13:15<03:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 1: 100%|█████████▉| 12357/12384 [26:13:15<03:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 1: 100%|█████████▉| 12357/12384 [26:13:22<03:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.26s]
Epoch 1: 100%|█████████▉| 12358/12384 [26:13:22<03:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.26s]
Epoch 1: 100%|█████████▉| 12358/12384 [26:13:30<03:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.28s]
Epoch 1: 100%|█████████▉| 12359/12384 [26:13:30<03:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.28s]
Epoch 1: 100%|█████████▉| 12359/12384 [26:13:38<03:10, 7.64s/it, loss=0.0019, acc=0.9956, iter_time=11.17s]
Epoch 1: 100%|█████████▉| 12360/12384 [26:13:38<03:04, 7.70s/it, loss=0.0019, acc=0.9956, iter_time=11.17s]
Epoch 1: 100%|█████████▉| 12360/12384 [26:13:45<03:04, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 1: 100%|█████████▉| 12361/12384 [26:13:45<02:56, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 1: 100%|█████████▉| 12361/12384 [26:13:53<02:56, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 100%|█████████▉| 12362/12384 [26:13:53<02:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 1: 100%|█████████▉| 12362/12384 [26:14:01<02:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 100%|█████████▉| 12363/12384 [26:14:01<02:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 100%|█████████▉| 12363/12384 [26:14:08<02:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 100%|█████████▉| 12364/12384 [26:14:08<02:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 100%|█████████▉| 12364/12384 [26:14:16<02:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 100%|█████████▉| 12365/12384 [26:14:16<02:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 100%|█████████▉| 12365/12384 [26:14:23<02:24, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=8.01s]
Epoch 1: 100%|█████████▉| 12366/12384 [26:14:23<02:17, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=8.01s]
Epoch 1: 100%|█████████▉| 12366/12384 [26:14:31<02:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.35s]
Epoch 1: 100%|█████████▉| 12367/12384 [26:14:31<02:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.35s]
Epoch 1: 100%|█████████▉| 12367/12384 [26:14:39<02:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.87s]
Epoch 1: 100%|█████████▉| 12368/12384 [26:14:39<02:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.87s]
Epoch 1: 100%|█████████▉| 12368/12384 [26:14:46<02:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 1: 100%|█████████▉| 12369/12384 [26:14:46<01:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 1: 100%|█████████▉| 12369/12384 [26:14:54<01:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 100%|█████████▉| 12370/12384 [26:14:54<01:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 1: 100%|█████████▉| 12370/12384 [26:15:02<01:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 100%|█████████▉| 12371/12384 [26:15:02<01:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 100%|█████████▉| 12371/12384 [26:15:09<01:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 100%|█████████▉| 12372/12384 [26:15:09<01:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 100%|█████████▉| 12372/12384 [26:15:17<01:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 100%|█████████▉| 12373/12384 [26:15:17<01:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 100%|█████████▉| 12373/12384 [26:15:24<01:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 1: 100%|█████████▉| 12374/12384 [26:15:24<01:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 1: 100%|█████████▉| 12374/12384 [26:15:32<01:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.54s]
Epoch 1: 100%|█████████▉| 12375/12384 [26:15:32<01:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.54s]
Epoch 1: 100%|█████████▉| 12375/12384 [26:15:40<01:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.11s]
Epoch 1: 100%|█████████▉| 12376/12384 [26:15:40<01:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.11s]
Epoch 1: 100%|█████████▉| 12376/12384 [26:15:47<01:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 100%|█████████▉| 12377/12384 [26:15:47<00:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 1: 100%|█████████▉| 12377/12384 [26:15:55<00:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 100%|█████████▉| 12378/12384 [26:15:55<00:45, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 100%|█████████▉| 12378/12384 [26:16:03<00:45, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 100%|█████████▉| 12379/12384 [26:16:03<00:38, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 1: 100%|█████████▉| 12379/12384 [26:16:10<00:38, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 100%|█████████▉| 12380/12384 [26:16:10<00:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 1: 100%|█████████▉| 12380/12384 [26:16:18<00:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 100%|█████████▉| 12381/12384 [26:16:18<00:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 1: 100%|█████████▉| 12381/12384 [26:16:25<00:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 100%|█████████▉| 12382/12384 [26:16:25<00:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 1: 100%|█████████▉| 12382/12384 [26:16:33<00:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 1: 100%|█████████▉| 12383/12384 [26:16:33<00:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 1: 100%|█████████▉| 12383/12384 [26:16:41<00:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.84s]
Epoch 1: 100%|██████████| 12384/12384 [26:16:41<00:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.84s]
Epoch 1: 100%|██████████| 12384/12384 [26:16:41<00:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.84s]
+
Epoch 2: 0%| | 0/12384 [00:00, ?it/s]
Epoch 2: 0%| | 0/12384 [00:07, ?it/s, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 2: 0%| | 1/12384 [00:07<26:15:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 2: 0%| | 1/12384 [00:15<26:15:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 2: 0%| | 2/12384 [00:15<26:57:36, 7.84s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 2: 0%| | 2/12384 [00:23<26:57:36, 7.84s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 0%| | 3/12384 [00:23<26:35:46, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 0%| | 3/12384 [00:30<26:35:46, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 2: 0%| | 4/12384 [00:30<26:25:58, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 2: 0%| | 4/12384 [00:38<26:25:58, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 2: 0%| | 5/12384 [00:38<26:19:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 2: 0%| | 5/12384 [00:46<26:19:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 0%| | 6/12384 [00:46<26:15:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 0%| | 6/12384 [00:53<26:15:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 0%| | 7/12384 [00:53<26:12:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 0%| | 7/12384 [01:01<26:12:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 0%| | 8/12384 [01:01<26:11:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 0%| | 8/12384 [01:08<26:11:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.77s]
Epoch 2: 0%| | 9/12384 [01:08<26:11:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.77s]
Epoch 2: 0%| | 9/12384 [01:16<26:11:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 0%| | 10/12384 [01:16<26:10:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 0%| | 10/12384 [01:24<26:10:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 2: 0%| | 11/12384 [01:24<26:10:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 2: 0%| | 11/12384 [01:31<26:10:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 2: 0%| | 12/12384 [01:31<26:11:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 2: 0%| | 12/12384 [01:39<26:11:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 0%| | 13/12384 [01:39<26:10:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 0%| | 13/12384 [01:46<26:10:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.81s]
Epoch 2: 0%| | 14/12384 [01:46<26:12:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.81s]
Epoch 2: 0%| | 14/12384 [01:54<26:12:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.86s]
Epoch 2: 0%| | 15/12384 [01:54<26:10:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.86s]
Epoch 2: 0%| | 15/12384 [02:02<26:10:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.50s]
Epoch 2: 0%| | 16/12384 [02:02<26:08:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.50s]
Epoch 2: 0%| | 16/12384 [02:09<26:08:30, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.69s]
Epoch 2: 0%| | 17/12384 [02:09<26:06:12, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=5.69s]
Epoch 2: 0%| | 17/12384 [02:17<26:06:12, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 2: 0%| | 18/12384 [02:17<26:06:57, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 2: 0%| | 18/12384 [02:24<26:06:57, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 0%| | 19/12384 [02:24<26:06:35, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 0%| | 19/12384 [02:32<26:06:35, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 2: 0%| | 20/12384 [02:32<26:05:46, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 2: 0%| | 20/12384 [02:40<26:05:46, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.72s]
Epoch 2: 0%| | 21/12384 [02:40<26:10:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.72s]
Epoch 2: 0%| | 21/12384 [02:47<26:10:43, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.42s]
Epoch 2: 0%| | 22/12384 [02:47<26:14:47, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=5.42s]
Epoch 2: 0%| | 22/12384 [02:55<26:14:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.63s]
Epoch 2: 0%| | 23/12384 [02:55<26:12:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.63s]
Epoch 2: 0%| | 23/12384 [03:03<26:12:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 2: 0%| | 24/12384 [03:03<26:11:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 2: 0%| | 24/12384 [03:10<26:11:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.92s]
Epoch 2: 0%| | 25/12384 [03:10<26:09:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.92s]
Epoch 2: 0%| | 25/12384 [03:18<26:09:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 2: 0%| | 26/12384 [03:18<26:09:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 2: 0%| | 26/12384 [03:25<26:09:06, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.74s]
Epoch 2: 0%| | 27/12384 [03:25<26:07:52, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.74s]
Epoch 2: 0%| | 27/12384 [03:33<26:07:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 0%| | 28/12384 [03:33<26:07:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 0%| | 28/12384 [03:41<26:07:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 0%| | 29/12384 [03:41<26:27:13, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 0%| | 29/12384 [03:49<26:27:13, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 2: 0%| | 30/12384 [03:49<26:20:19, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 2: 0%| | 30/12384 [03:56<26:20:19, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 2: 0%| | 31/12384 [03:56<26:17:52, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 2: 0%| | 31/12384 [04:04<26:17:52, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.61s]
Epoch 2: 0%| | 32/12384 [04:04<26:13:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.61s]
Epoch 2: 0%| | 32/12384 [04:12<26:13:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 0%| | 33/12384 [04:12<26:16:49, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 0%| | 33/12384 [04:19<26:16:49, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 0%| | 34/12384 [04:19<26:12:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 0%| | 34/12384 [04:27<26:12:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 0%| | 35/12384 [04:27<26:09:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 0%| | 35/12384 [04:34<26:09:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 0%| | 36/12384 [04:34<26:09:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 0%| | 36/12384 [04:42<26:09:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 2: 0%| | 37/12384 [04:42<26:09:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 2: 0%| | 37/12384 [04:50<26:09:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 0%| | 38/12384 [04:50<26:08:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 0%| | 38/12384 [04:57<26:08:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 0%| | 39/12384 [04:57<26:08:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 0%| | 39/12384 [05:05<26:08:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 0%| | 40/12384 [05:05<26:14:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 0%| | 40/12384 [05:13<26:14:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 0%| | 41/12384 [05:13<26:11:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 0%| | 41/12384 [05:20<26:11:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 0%| | 42/12384 [05:20<26:08:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 0%| | 42/12384 [05:28<26:08:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 2: 0%| | 43/12384 [05:28<26:07:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 2: 0%| | 43/12384 [05:35<26:07:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 2: 0%| | 44/12384 [05:35<26:07:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 2: 0%| | 44/12384 [05:43<26:07:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 0%| | 45/12384 [05:43<26:06:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 0%| | 45/12384 [05:51<26:06:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 0%| | 46/12384 [05:51<26:06:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 0%| | 46/12384 [05:58<26:06:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 2: 0%| | 47/12384 [05:58<26:05:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 2: 0%| | 47/12384 [06:06<26:05:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.05s]
Epoch 2: 0%| | 48/12384 [06:06<26:06:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.05s]
Epoch 2: 0%| | 48/12384 [06:14<26:06:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 2: 0%| | 49/12384 [06:14<26:21:43, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 2: 0%| | 49/12384 [06:21<26:21:43, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 0%| | 50/12384 [06:21<26:16:34, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 0%| | 50/12384 [06:29<26:16:34, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 0%| | 51/12384 [06:29<26:11:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 0%| | 51/12384 [06:37<26:11:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 0%| | 52/12384 [06:37<26:14:51, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 0%| | 52/12384 [06:44<26:14:51, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 0%| | 53/12384 [06:44<26:11:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 0%| | 53/12384 [06:52<26:11:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 0%| | 54/12384 [06:52<26:08:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 0%| | 54/12384 [07:00<26:08:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 0%| | 55/12384 [07:00<26:25:07, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 0%| | 55/12384 [07:07<26:25:07, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.82s]
Epoch 2: 0%| | 56/12384 [07:07<26:18:34, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.82s]
Epoch 2: 0%| | 56/12384 [07:15<26:18:34, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 2: 0%| | 57/12384 [07:15<26:12:48, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 2: 0%| | 57/12384 [07:23<26:12:48, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 0%| | 58/12384 [07:23<26:08:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 0%| | 58/12384 [07:30<26:08:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.54s]
Epoch 2: 0%| | 59/12384 [07:30<26:07:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.54s]
Epoch 2: 0%| | 59/12384 [07:38<26:07:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.97s]
Epoch 2: 0%| | 60/12384 [07:38<26:04:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.97s]
Epoch 2: 0%| | 60/12384 [07:45<26:04:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 0%| | 61/12384 [07:45<26:03:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 0%| | 61/12384 [07:53<26:03:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 1%| | 62/12384 [07:53<26:03:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 1%| | 62/12384 [08:01<26:03:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 1%| | 63/12384 [08:01<26:03:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 1%| | 63/12384 [08:08<26:03:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 1%| | 64/12384 [08:08<26:04:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 1%| | 64/12384 [08:16<26:04:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 1%| | 65/12384 [08:16<26:04:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 1%| | 65/12384 [08:23<26:04:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 2: 1%| | 66/12384 [08:23<26:02:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 2: 1%| | 66/12384 [08:31<26:02:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 2: 1%| | 67/12384 [08:31<26:02:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 2: 1%| | 67/12384 [08:39<26:02:06, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 2: 1%| | 68/12384 [08:39<26:01:49, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 2: 1%| | 68/12384 [08:46<26:01:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 1%| | 69/12384 [08:46<26:00:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 1%| | 69/12384 [08:54<26:00:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 1%| | 70/12384 [08:54<26:01:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 1%| | 70/12384 [09:01<26:01:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 2: 1%| | 71/12384 [09:01<26:01:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 2: 1%| | 71/12384 [09:09<26:01:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 2: 1%| | 72/12384 [09:09<26:07:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 2: 1%| | 72/12384 [09:17<26:07:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 1%| | 73/12384 [09:17<26:05:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 1%| | 73/12384 [09:24<26:05:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 2: 1%| | 74/12384 [09:24<26:05:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 2: 1%| | 74/12384 [09:32<26:05:27, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.92s]
Epoch 2: 1%| | 75/12384 [09:32<26:21:21, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.92s]
Epoch 2: 1%| | 75/12384 [09:40<26:21:21, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 1%| | 76/12384 [09:40<26:15:21, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 1%| | 76/12384 [09:47<26:15:21, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 1%| | 77/12384 [09:47<26:10:23, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 1%| | 77/12384 [09:55<26:10:23, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 1%| | 78/12384 [09:55<26:07:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 1%| | 78/12384 [10:03<26:07:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 2: 1%| | 79/12384 [10:03<26:05:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 2: 1%| | 79/12384 [10:10<26:05:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.70s]
Epoch 2: 1%| | 80/12384 [10:10<26:03:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.70s]
Epoch 2: 1%| | 80/12384 [10:18<26:03:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 1%| | 81/12384 [10:18<26:23:57, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 1%| | 81/12384 [10:26<26:23:57, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.37s]
Epoch 2: 1%| | 82/12384 [10:26<26:19:48, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.37s]
Epoch 2: 1%| | 82/12384 [10:34<26:19:48, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.63s]
Epoch 2: 1%| | 83/12384 [10:34<26:12:38, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.63s]
Epoch 2: 1%| | 83/12384 [10:41<26:12:38, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 2: 1%| | 84/12384 [10:41<26:08:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 2: 1%| | 84/12384 [10:49<26:08:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 2: 1%| | 85/12384 [10:49<26:05:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 2: 1%| | 85/12384 [10:56<26:05:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.44s]
Epoch 2: 1%| | 86/12384 [10:56<26:06:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.44s]
Epoch 2: 1%| | 86/12384 [11:04<26:06:01, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=6.06s]
Epoch 2: 1%| | 87/12384 [11:04<26:07:42, 7.65s/it, loss=0.0001, acc=0.9998, iter_time=6.06s]
Epoch 2: 1%| | 87/12384 [11:12<26:07:42, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=10.85s]
Epoch 2: 1%| | 88/12384 [11:12<26:04:49, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=10.85s]
Epoch 2: 1%| | 88/12384 [11:19<26:04:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 1%| | 89/12384 [11:19<26:01:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 1%| | 89/12384 [11:27<26:01:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 1%| | 90/12384 [11:27<26:02:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 1%| | 90/12384 [11:34<26:02:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 1%| | 91/12384 [11:34<26:01:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 1%| | 91/12384 [11:42<26:01:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 1%| | 92/12384 [11:42<26:04:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 1%| | 92/12384 [11:50<26:04:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 1%| | 93/12384 [11:50<26:02:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 1%| | 93/12384 [11:57<26:02:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 1%| | 94/12384 [11:57<26:01:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 1%| | 94/12384 [12:05<26:01:47, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.87s]
Epoch 2: 1%| | 95/12384 [12:05<25:59:04, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.87s]
Epoch 2: 1%| | 95/12384 [12:13<25:59:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.43s]
Epoch 2: 1%| | 96/12384 [12:13<25:58:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.43s]
Epoch 2: 1%| | 96/12384 [12:20<25:58:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 2: 1%| | 97/12384 [12:20<25:58:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 2: 1%| | 97/12384 [12:28<25:58:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 1%| | 98/12384 [12:28<25:57:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 1%| | 98/12384 [12:35<25:57:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 1%| | 99/12384 [12:35<25:59:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 1%| | 99/12384 [12:43<25:59:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 2: 1%| | 100/12384 [12:43<25:57:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 2: 1%| | 100/12384 [12:51<25:57:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 2: 1%| | 101/12384 [12:51<26:14:00, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 2: 1%| | 101/12384 [12:58<26:14:00, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 1%| | 102/12384 [12:58<26:09:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 1%| | 102/12384 [13:06<26:09:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 1%| | 103/12384 [13:06<26:06:53, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 1%| | 103/12384 [13:14<26:06:53, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 1%| | 104/12384 [13:14<26:02:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 1%| | 104/12384 [13:21<26:02:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 1%| | 105/12384 [13:21<26:01:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 1%| | 105/12384 [13:29<26:01:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 1%| | 106/12384 [13:29<25:59:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 1%| | 106/12384 [13:37<25:59:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 1%| | 107/12384 [13:37<26:18:07, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 1%| | 107/12384 [13:44<26:18:07, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 1%| | 108/12384 [13:44<26:10:50, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 1%| | 108/12384 [13:52<26:10:50, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 1%| | 109/12384 [13:52<26:12:12, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 1%| | 109/12384 [14:00<26:12:12, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 1%| | 110/12384 [14:00<26:06:12, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 1%| | 110/12384 [14:07<26:06:12, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 1%| | 111/12384 [14:07<26:03:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 1%| | 111/12384 [14:15<26:03:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 1%| | 112/12384 [14:15<26:06:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 1%| | 112/12384 [14:23<26:06:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 1%| | 113/12384 [14:23<26:08:32, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 1%| | 113/12384 [14:30<26:08:32, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 1%| | 114/12384 [14:30<26:07:25, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 1%| | 114/12384 [14:38<26:07:25, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.05s]
Epoch 2: 1%| | 115/12384 [14:38<26:08:22, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.05s]
Epoch 2: 1%| | 115/12384 [14:46<26:08:22, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.27s]
Epoch 2: 1%| | 116/12384 [14:46<26:06:15, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.27s]
Epoch 2: 1%| | 116/12384 [14:53<26:06:15, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 2: 1%| | 117/12384 [14:53<26:03:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 2: 1%| | 117/12384 [15:01<26:03:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 1%| | 118/12384 [15:01<26:01:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 1%| | 118/12384 [15:09<26:01:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 2: 1%| | 119/12384 [15:09<25:58:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 2: 1%| | 119/12384 [15:16<25:58:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 1%| | 120/12384 [15:16<25:58:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 1%| | 120/12384 [15:24<25:58:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 2: 1%| | 121/12384 [15:24<25:57:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 2: 1%| | 121/12384 [15:31<25:57:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.21s]
Epoch 2: 1%| | 122/12384 [15:31<25:57:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.21s]
Epoch 2: 1%| | 122/12384 [15:39<25:57:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 2: 1%| | 123/12384 [15:39<26:01:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 2: 1%| | 123/12384 [15:47<26:01:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 1%| | 124/12384 [15:47<26:00:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 1%| | 124/12384 [15:54<26:00:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.85s]
Epoch 2: 1%| | 125/12384 [15:54<25:57:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.85s]
Epoch 2: 1%| | 125/12384 [16:02<25:57:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.37s]
Epoch 2: 1%| | 126/12384 [16:02<25:56:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.37s]
Epoch 2: 1%| | 126/12384 [16:10<25:56:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 1%| | 127/12384 [16:10<26:13:53, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 1%| | 127/12384 [16:17<26:13:53, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 2: 1%| | 128/12384 [16:17<26:07:11, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 2: 1%| | 128/12384 [16:25<26:07:11, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 1%| | 129/12384 [16:25<26:05:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 1%| | 129/12384 [16:33<26:05:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 2: 1%| | 130/12384 [16:33<26:02:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 2: 1%| | 130/12384 [16:40<26:02:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 2: 1%| | 131/12384 [16:40<26:00:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 2: 1%| | 131/12384 [16:48<26:00:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 1%| | 132/12384 [16:48<25:59:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 1%| | 132/12384 [16:56<25:59:16, 7.64s/it, loss=0.0002, acc=0.9989, iter_time=7.27s]
Epoch 2: 1%| | 133/12384 [16:56<26:17:14, 7.72s/it, loss=0.0002, acc=0.9989, iter_time=7.27s]
Epoch 2: 1%| | 133/12384 [17:03<26:17:14, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.93s]
Epoch 2: 1%| | 134/12384 [17:03<26:08:21, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.93s]
Epoch 2: 1%| | 134/12384 [17:11<26:08:21, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 2: 1%| | 135/12384 [17:11<26:02:49, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 2: 1%| | 135/12384 [17:19<26:02:49, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 1%| | 136/12384 [17:19<26:00:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 1%| | 136/12384 [17:26<26:00:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 1%| | 137/12384 [17:26<25:58:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 1%| | 137/12384 [17:34<25:58:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.25s]
Epoch 2: 1%| | 138/12384 [17:34<25:56:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.25s]
Epoch 2: 1%| | 138/12384 [17:42<25:56:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.67s]
Epoch 2: 1%| | 139/12384 [17:42<25:56:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.67s]
Epoch 2: 1%| | 139/12384 [17:49<25:56:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 2: 1%| | 140/12384 [17:49<25:55:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 2: 1%| | 140/12384 [17:57<25:55:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 1%| | 141/12384 [17:57<25:55:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 1%| | 141/12384 [18:04<25:55:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 1%| | 142/12384 [18:04<25:54:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 1%| | 142/12384 [18:12<25:54:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 2: 1%| | 143/12384 [18:12<25:55:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 2: 1%| | 143/12384 [18:20<25:55:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 2: 1%| | 144/12384 [18:20<25:54:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 2: 1%| | 144/12384 [18:27<25:54:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 1%| | 145/12384 [18:27<25:55:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 1%| | 145/12384 [18:35<25:55:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 1%| | 146/12384 [18:35<25:53:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 1%| | 146/12384 [18:42<25:53:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 2: 1%| | 147/12384 [18:42<25:53:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 2: 1%| | 147/12384 [18:50<25:53:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 2: 1%| | 148/12384 [18:50<25:55:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 2: 1%| | 148/12384 [18:58<25:55:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 1%| | 149/12384 [18:58<25:55:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 1%| | 149/12384 [19:05<25:55:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 2: 1%| | 150/12384 [19:05<25:59:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 2: 1%| | 150/12384 [19:13<25:59:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 1%| | 151/12384 [19:13<25:57:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 1%| | 151/12384 [19:21<25:57:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 1%| | 152/12384 [19:21<25:55:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 1%| | 152/12384 [19:28<25:55:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.90s]
Epoch 2: 1%| | 153/12384 [19:28<25:52:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.90s]
Epoch 2: 1%| | 153/12384 [19:36<25:52:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.35s]
Epoch 2: 1%| | 154/12384 [19:36<25:51:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.35s]
Epoch 2: 1%| | 154/12384 [19:43<25:51:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 2: 1%|▏ | 155/12384 [19:43<25:54:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 2: 1%|▏ | 155/12384 [19:51<25:54:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 2: 1%|▏ | 156/12384 [19:51<25:54:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 2: 1%|▏ | 156/12384 [19:59<25:54:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.05s]
Epoch 2: 1%|▏ | 157/12384 [19:59<25:53:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.05s]
Epoch 2: 1%|▏ | 157/12384 [20:06<25:53:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 2: 1%|▏ | 158/12384 [20:06<25:51:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 2: 1%|▏ | 158/12384 [20:14<25:51:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 1%|▏ | 159/12384 [20:14<25:50:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 1%|▏ | 159/12384 [20:22<25:50:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 1%|▏ | 160/12384 [20:22<26:10:14, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 1%|▏ | 160/12384 [20:29<26:10:14, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 1%|▏ | 161/12384 [20:29<26:03:52, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 1%|▏ | 161/12384 [20:37<26:03:52, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 2: 1%|▏ | 162/12384 [20:37<25:58:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 2: 1%|▏ | 162/12384 [20:45<25:58:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.98s]
Epoch 2: 1%|▏ | 163/12384 [20:45<25:55:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.98s]
Epoch 2: 1%|▏ | 163/12384 [20:52<25:55:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.98s]
Epoch 2: 1%|▏ | 164/12384 [20:52<25:53:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.98s]
Epoch 2: 1%|▏ | 164/12384 [21:00<25:53:46, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.39s]
Epoch 2: 1%|▏ | 165/12384 [21:00<25:52:13, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.39s]
Epoch 2: 1%|▏ | 165/12384 [21:07<25:52:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 2: 1%|▏ | 166/12384 [21:07<25:50:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 2: 1%|▏ | 166/12384 [21:15<25:50:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 2: 1%|▏ | 167/12384 [21:15<25:50:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 2: 1%|▏ | 167/12384 [21:23<25:50:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 1%|▏ | 168/12384 [21:23<25:55:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 1%|▏ | 168/12384 [21:30<25:55:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 2: 1%|▏ | 169/12384 [21:30<25:53:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 2: 1%|▏ | 169/12384 [21:38<25:53:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 2: 1%|▏ | 170/12384 [21:38<25:52:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 2: 1%|▏ | 170/12384 [21:46<25:52:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 1%|▏ | 171/12384 [21:46<25:51:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 1%|▏ | 171/12384 [21:53<25:51:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 1%|▏ | 172/12384 [21:53<25:53:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 1%|▏ | 172/12384 [22:01<25:53:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.80s]
Epoch 2: 1%|▏ | 173/12384 [22:01<25:52:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.80s]
Epoch 2: 1%|▏ | 173/12384 [22:09<25:52:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.48s]
Epoch 2: 1%|▏ | 174/12384 [22:09<25:51:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.48s]
Epoch 2: 1%|▏ | 174/12384 [22:16<25:51:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 2: 1%|▏ | 175/12384 [22:16<25:51:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 2: 1%|▏ | 175/12384 [22:24<25:51:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 2: 1%|▏ | 176/12384 [22:24<25:51:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 2: 1%|▏ | 176/12384 [22:31<25:51:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 2: 1%|▏ | 177/12384 [22:31<25:49:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 2: 1%|▏ | 177/12384 [22:39<25:49:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.80s]
Epoch 2: 1%|▏ | 178/12384 [22:39<25:48:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.80s]
Epoch 2: 1%|▏ | 178/12384 [22:47<25:48:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 2: 1%|▏ | 179/12384 [22:47<26:05:55, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 2: 1%|▏ | 179/12384 [22:54<26:05:55, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 1%|▏ | 180/12384 [22:54<26:00:49, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 1%|▏ | 180/12384 [23:02<26:00:49, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 2: 1%|▏ | 181/12384 [23:02<25:57:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 2: 1%|▏ | 181/12384 [23:10<25:57:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 1%|▏ | 182/12384 [23:10<25:54:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 1%|▏ | 182/12384 [23:17<25:54:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 1%|▏ | 183/12384 [23:17<25:53:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 1%|▏ | 183/12384 [23:25<25:53:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 1%|▏ | 184/12384 [23:25<25:51:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 1%|▏ | 184/12384 [23:33<25:51:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.70s]
Epoch 2: 1%|▏ | 185/12384 [23:33<25:51:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.70s]
Epoch 2: 1%|▏ | 185/12384 [23:41<25:51:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 2: 2%|▏ | 186/12384 [23:41<26:10:31, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 2: 2%|▏ | 186/12384 [23:48<26:10:31, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 2%|▏ | 187/12384 [23:48<26:07:25, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 2%|▏ | 187/12384 [23:56<26:07:25, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 2%|▏ | 188/12384 [23:56<26:00:56, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 2%|▏ | 188/12384 [24:03<26:00:56, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 2%|▏ | 189/12384 [24:03<25:56:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 2%|▏ | 189/12384 [24:11<25:56:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 2: 2%|▏ | 190/12384 [24:11<25:54:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 2: 2%|▏ | 190/12384 [24:19<25:54:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.37s]
Epoch 2: 2%|▏ | 191/12384 [24:19<25:51:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.37s]
Epoch 2: 2%|▏ | 191/12384 [24:26<25:51:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 2%|▏ | 192/12384 [24:26<25:51:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 2%|▏ | 192/12384 [24:34<25:51:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 2%|▏ | 193/12384 [24:34<25:51:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 2%|▏ | 193/12384 [24:42<25:51:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 2%|▏ | 194/12384 [24:42<25:49:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 2%|▏ | 194/12384 [24:49<25:49:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 2: 2%|▏ | 195/12384 [24:49<25:48:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 2: 2%|▏ | 195/12384 [24:57<25:48:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 2: 2%|▏ | 196/12384 [24:57<25:47:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 2: 2%|▏ | 196/12384 [25:04<25:47:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 2: 2%|▏ | 197/12384 [25:04<25:45:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 2: 2%|▏ | 197/12384 [25:12<25:45:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 2: 2%|▏ | 198/12384 [25:12<25:44:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 2: 2%|▏ | 198/12384 [25:20<25:44:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 2%|▏ | 199/12384 [25:20<25:45:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 2%|▏ | 199/12384 [25:27<25:45:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.94s]
Epoch 2: 2%|▏ | 200/12384 [25:27<25:46:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.94s]
Epoch 2: 2%|▏ | 200/12384 [25:35<25:46:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 2%|▏ | 201/12384 [25:35<25:46:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 2%|▏ | 201/12384 [25:42<25:46:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 2%|▏ | 202/12384 [25:42<25:45:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 2%|▏ | 202/12384 [25:50<25:45:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 2%|▏ | 203/12384 [25:50<25:44:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 2%|▏ | 203/12384 [25:58<25:44:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 2%|▏ | 204/12384 [25:58<25:43:32, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 2%|▏ | 204/12384 [26:05<25:43:32, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 2%|▏ | 205/12384 [26:05<25:42:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 2%|▏ | 205/12384 [26:13<25:42:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 2: 2%|▏ | 206/12384 [26:13<25:43:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 2: 2%|▏ | 206/12384 [26:20<25:43:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 2%|▏ | 207/12384 [26:20<25:43:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 2%|▏ | 207/12384 [26:28<25:43:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.37s]
Epoch 2: 2%|▏ | 208/12384 [26:28<25:47:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.37s]
Epoch 2: 2%|▏ | 208/12384 [26:36<25:47:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 2%|▏ | 209/12384 [26:36<25:46:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 2%|▏ | 209/12384 [26:43<25:46:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.29s]
Epoch 2: 2%|▏ | 210/12384 [26:43<25:49:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.29s]
Epoch 2: 2%|▏ | 210/12384 [26:51<25:49:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.97s]
Epoch 2: 2%|▏ | 211/12384 [26:51<25:48:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.97s]
Epoch 2: 2%|▏ | 211/12384 [26:59<25:48:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 2%|▏ | 212/12384 [26:59<25:46:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 2%|▏ | 212/12384 [27:07<25:46:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 2%|▏ | 213/12384 [27:07<26:05:18, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 2%|▏ | 213/12384 [27:14<26:05:18, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 2: 2%|▏ | 214/12384 [27:14<25:59:15, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 2: 2%|▏ | 214/12384 [27:22<25:59:15, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 2: 2%|▏ | 215/12384 [27:22<25:54:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 2: 2%|▏ | 215/12384 [27:29<25:54:26, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=9.08s]
Epoch 2: 2%|▏ | 216/12384 [27:29<25:52:34, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=9.08s]
Epoch 2: 2%|▏ | 216/12384 [27:37<25:52:34, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 2%|▏ | 217/12384 [27:37<25:49:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 2%|▏ | 217/12384 [27:45<25:49:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 2: 2%|▏ | 218/12384 [27:45<25:47:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 2: 2%|▏ | 218/12384 [27:52<25:47:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 2: 2%|▏ | 219/12384 [27:52<25:47:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 2: 2%|▏ | 219/12384 [28:00<25:47:19, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.89s]
Epoch 2: 2%|▏ | 220/12384 [28:00<25:46:39, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.89s]
Epoch 2: 2%|▏ | 220/12384 [28:07<25:46:39, 7.63s/it, loss=0.0002, acc=0.9975, iter_time=7.26s]
Epoch 2: 2%|▏ | 221/12384 [28:07<25:45:28, 7.62s/it, loss=0.0002, acc=0.9975, iter_time=7.26s]
Epoch 2: 2%|▏ | 221/12384 [28:15<25:45:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 2: 2%|▏ | 222/12384 [28:15<25:43:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 2: 2%|▏ | 222/12384 [28:23<25:43:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 2%|▏ | 223/12384 [28:23<25:45:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 2%|▏ | 223/12384 [28:30<25:45:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 2%|▏ | 224/12384 [28:30<25:43:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 2%|▏ | 224/12384 [28:38<25:43:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.70s]
Epoch 2: 2%|▏ | 225/12384 [28:38<25:44:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.70s]
Epoch 2: 2%|▏ | 225/12384 [28:46<25:44:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.14s]
Epoch 2: 2%|▏ | 226/12384 [28:46<25:45:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.14s]
Epoch 2: 2%|▏ | 226/12384 [28:52<25:45:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.45s]
Epoch 2: 2%|▏ | 227/12384 [28:52<24:39:43, 7.30s/it, loss=0.0000, acc=1.0000, iter_time=4.45s]
Epoch 2: 2%|▏ | 227/12384 [29:00<24:39:43, 7.30s/it, loss=0.0000, acc=1.0000, iter_time=9.74s]
Epoch 2: 2%|▏ | 228/12384 [29:00<24:57:46, 7.39s/it, loss=0.0000, acc=1.0000, iter_time=9.74s]
Epoch 2: 2%|▏ | 228/12384 [29:07<24:57:46, 7.39s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 2: 2%|▏ | 229/12384 [29:07<25:11:51, 7.46s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 2: 2%|▏ | 229/12384 [29:15<25:11:51, 7.46s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 2%|▏ | 230/12384 [29:15<25:21:04, 7.51s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 2%|▏ | 230/12384 [29:23<25:21:04, 7.51s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 2: 2%|▏ | 231/12384 [29:23<25:26:07, 7.53s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 2: 2%|▏ | 231/12384 [29:30<25:26:07, 7.53s/it, loss=0.0000, acc=1.0000, iter_time=10.94s]
Epoch 2: 2%|▏ | 232/12384 [29:30<25:47:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.94s]
Epoch 2: 2%|▏ | 232/12384 [29:38<25:47:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 2: 2%|▏ | 233/12384 [29:38<25:45:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 2: 2%|▏ | 233/12384 [29:46<25:45:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.91s]
Epoch 2: 2%|▏ | 234/12384 [29:46<25:48:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.91s]
Epoch 2: 2%|▏ | 234/12384 [29:53<25:48:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 2%|▏ | 235/12384 [29:53<25:45:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 2%|▏ | 235/12384 [30:01<25:45:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 2%|▏ | 236/12384 [30:01<25:44:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 2%|▏ | 236/12384 [30:09<25:44:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 2%|▏ | 237/12384 [30:09<25:42:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 2%|▏ | 237/12384 [30:16<25:42:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 2: 2%|▏ | 238/12384 [30:16<25:42:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 2: 2%|▏ | 238/12384 [30:24<25:42:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 2: 2%|▏ | 239/12384 [30:24<26:02:49, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 2: 2%|▏ | 239/12384 [30:32<26:02:49, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 2%|▏ | 240/12384 [30:32<25:57:17, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 2%|▏ | 240/12384 [30:39<25:57:17, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 2%|▏ | 241/12384 [30:39<25:51:40, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 2%|▏ | 241/12384 [30:47<25:51:40, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 2: 2%|▏ | 242/12384 [30:47<25:47:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 2: 2%|▏ | 242/12384 [30:55<25:47:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.28s]
Epoch 2: 2%|▏ | 243/12384 [30:55<25:43:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.28s]
Epoch 2: 2%|▏ | 243/12384 [31:02<25:43:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.38s]
Epoch 2: 2%|▏ | 244/12384 [31:02<25:49:34, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.38s]
Epoch 2: 2%|▏ | 244/12384 [31:10<25:49:34, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.78s]
Epoch 2: 2%|▏ | 245/12384 [31:10<25:45:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.78s]
Epoch 2: 2%|▏ | 245/12384 [31:17<25:45:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.23s]
Epoch 2: 2%|▏ | 246/12384 [31:17<25:42:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.23s]
Epoch 2: 2%|▏ | 246/12384 [31:25<25:42:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.93s]
Epoch 2: 2%|▏ | 247/12384 [31:25<25:44:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.93s]
Epoch 2: 2%|▏ | 247/12384 [31:33<25:44:07, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.00s]
Epoch 2: 2%|▏ | 248/12384 [31:33<25:43:16, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.00s]
Epoch 2: 2%|▏ | 248/12384 [31:40<25:43:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.70s]
Epoch 2: 2%|▏ | 249/12384 [31:40<25:40:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.70s]
Epoch 2: 2%|▏ | 249/12384 [31:48<25:40:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 2: 2%|▏ | 250/12384 [31:48<25:46:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 2: 2%|▏ | 250/12384 [31:56<25:46:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.70s]
Epoch 2: 2%|▏ | 251/12384 [31:56<25:47:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.70s]
Epoch 2: 2%|▏ | 251/12384 [32:03<25:47:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.43s]
Epoch 2: 2%|▏ | 252/12384 [32:03<25:43:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.43s]
Epoch 2: 2%|▏ | 252/12384 [32:11<25:43:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.85s]
Epoch 2: 2%|▏ | 253/12384 [32:11<25:42:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.85s]
Epoch 2: 2%|▏ | 253/12384 [32:19<25:42:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 2%|▏ | 254/12384 [32:19<25:41:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 2%|▏ | 254/12384 [32:26<25:41:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 2%|▏ | 255/12384 [32:26<25:40:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 2%|▏ | 255/12384 [32:34<25:40:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 2%|▏ | 256/12384 [32:34<25:40:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 2%|▏ | 256/12384 [32:41<25:40:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 2%|▏ | 257/12384 [32:41<25:39:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 2%|▏ | 257/12384 [32:49<25:39:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 2%|▏ | 258/12384 [32:49<25:39:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 2%|▏ | 258/12384 [32:57<25:39:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 2%|▏ | 259/12384 [32:57<25:38:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 2%|▏ | 259/12384 [33:04<25:38:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 2%|▏ | 260/12384 [33:04<25:53:09, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 2%|▏ | 260/12384 [33:12<25:53:09, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 2: 2%|▏ | 261/12384 [33:12<25:47:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 2: 2%|▏ | 261/12384 [33:20<25:47:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.21s]
Epoch 2: 2%|▏ | 262/12384 [33:20<25:44:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.21s]
Epoch 2: 2%|▏ | 262/12384 [33:27<25:44:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 2: 2%|▏ | 263/12384 [33:27<25:42:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 2: 2%|▏ | 263/12384 [33:35<25:42:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 2%|▏ | 264/12384 [33:35<25:42:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 2%|▏ | 264/12384 [33:43<25:42:18, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=4.33s]
Epoch 2: 2%|▏ | 265/12384 [33:43<26:00:48, 7.73s/it, loss=0.0001, acc=1.0000, iter_time=4.33s]
Epoch 2: 2%|▏ | 265/12384 [33:50<26:00:48, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=11.27s]
Epoch 2: 2%|▏ | 266/12384 [33:50<25:54:48, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=11.27s]
Epoch 2: 2%|▏ | 266/12384 [33:58<25:54:48, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 2: 2%|▏ | 267/12384 [33:58<25:51:31, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 2: 2%|▏ | 267/12384 [34:06<25:51:31, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 2: 2%|▏ | 268/12384 [34:06<25:49:02, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 2: 2%|▏ | 268/12384 [34:13<25:49:02, 7.67s/it, loss=0.0003, acc=0.9982, iter_time=7.64s]
Epoch 2: 2%|▏ | 269/12384 [34:13<25:45:47, 7.66s/it, loss=0.0003, acc=0.9982, iter_time=7.64s]
Epoch 2: 2%|▏ | 269/12384 [34:21<25:45:47, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 2%|▏ | 270/12384 [34:21<25:42:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 2%|▏ | 270/12384 [34:29<25:42:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 2: 2%|▏ | 271/12384 [34:29<25:39:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 2: 2%|▏ | 271/12384 [34:36<25:39:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 2: 2%|▏ | 272/12384 [34:36<25:38:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 2: 2%|▏ | 272/12384 [34:44<25:38:32, 7.62s/it, loss=0.0004, acc=0.9975, iter_time=4.92s]
Epoch 2: 2%|▏ | 273/12384 [34:44<25:43:17, 7.65s/it, loss=0.0004, acc=0.9975, iter_time=4.92s]
Epoch 2: 2%|▏ | 273/12384 [34:52<25:43:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.00s]
Epoch 2: 2%|▏ | 274/12384 [34:52<25:41:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.00s]
Epoch 2: 2%|▏ | 274/12384 [34:59<25:41:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 2%|▏ | 275/12384 [34:59<25:44:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 2%|▏ | 275/12384 [35:07<25:44:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 2: 2%|▏ | 276/12384 [35:07<25:42:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 2: 2%|▏ | 276/12384 [35:14<25:42:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 2: 2%|▏ | 277/12384 [35:14<25:40:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 2: 2%|▏ | 277/12384 [35:22<25:40:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 2%|▏ | 278/12384 [35:22<25:38:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 2%|▏ | 278/12384 [35:30<25:38:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 2%|▏ | 279/12384 [35:30<25:39:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 2%|▏ | 279/12384 [35:37<25:39:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 2: 2%|▏ | 280/12384 [35:37<25:43:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 2: 2%|▏ | 280/12384 [35:45<25:43:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 2%|▏ | 281/12384 [35:45<25:41:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 2%|▏ | 281/12384 [35:53<25:41:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 2%|▏ | 282/12384 [35:53<25:38:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 2%|▏ | 282/12384 [36:00<25:38:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.72s]
Epoch 2: 2%|▏ | 283/12384 [36:00<25:36:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.72s]
Epoch 2: 2%|▏ | 283/12384 [36:08<25:36:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.84s]
Epoch 2: 2%|▏ | 284/12384 [36:08<25:34:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.84s]
Epoch 2: 2%|▏ | 284/12384 [36:15<25:34:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 2%|▏ | 285/12384 [36:15<25:34:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 2%|▏ | 285/12384 [36:23<25:34:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 2: 2%|▏ | 286/12384 [36:23<25:51:17, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 2: 2%|▏ | 286/12384 [36:31<25:51:17, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 2: 2%|▏ | 287/12384 [36:31<25:45:30, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 2: 2%|▏ | 287/12384 [36:39<25:45:30, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 2%|▏ | 288/12384 [36:39<25:42:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 2%|▏ | 288/12384 [36:46<25:42:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 2%|▏ | 289/12384 [36:46<25:45:32, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 2%|▏ | 289/12384 [36:54<25:45:32, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 2: 2%|▏ | 290/12384 [36:54<25:41:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 2: 2%|▏ | 290/12384 [37:02<25:41:06, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=6.79s]
Epoch 2: 2%|▏ | 291/12384 [37:02<25:59:54, 7.74s/it, loss=0.0001, acc=1.0000, iter_time=6.79s]
Epoch 2: 2%|▏ | 291/12384 [37:09<25:59:54, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 2%|▏ | 292/12384 [37:09<25:52:45, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 2%|▏ | 292/12384 [37:17<25:52:45, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 2: 2%|▏ | 293/12384 [37:17<25:45:43, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 2: 2%|▏ | 293/12384 [37:25<25:45:43, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 2%|▏ | 294/12384 [37:25<25:40:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 2%|▏ | 294/12384 [37:32<25:40:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 2: 2%|▏ | 295/12384 [37:32<25:39:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 2: 2%|▏ | 295/12384 [37:40<25:39:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.22s]
Epoch 2: 2%|▏ | 296/12384 [37:40<25:37:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.22s]
Epoch 2: 2%|▏ | 296/12384 [37:47<25:37:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 2%|▏ | 297/12384 [37:47<25:36:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 2%|▏ | 297/12384 [37:55<25:36:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.37s]
Epoch 2: 2%|▏ | 298/12384 [37:55<25:36:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.37s]
Epoch 2: 2%|▏ | 298/12384 [38:03<25:36:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.82s]
Epoch 2: 2%|▏ | 299/12384 [38:03<25:38:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.82s]
Epoch 2: 2%|▏ | 299/12384 [38:10<25:38:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.99s]
Epoch 2: 2%|▏ | 300/12384 [38:10<25:38:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.99s]
Epoch 2: 2%|▏ | 300/12384 [38:18<25:38:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 2: 2%|▏ | 301/12384 [38:18<25:35:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 2: 2%|▏ | 301/12384 [38:26<25:35:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 2%|▏ | 302/12384 [38:26<25:40:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 2%|▏ | 302/12384 [38:33<25:40:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 2%|▏ | 303/12384 [38:33<25:36:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 2%|▏ | 303/12384 [38:41<25:36:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 2%|▏ | 304/12384 [38:41<25:35:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 2%|▏ | 304/12384 [38:48<25:35:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 2%|▏ | 305/12384 [38:48<25:33:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 2%|▏ | 305/12384 [38:56<25:33:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 2%|▏ | 306/12384 [38:56<25:32:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 2%|▏ | 306/12384 [39:04<25:32:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 2%|▏ | 307/12384 [39:04<25:33:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 2%|▏ | 307/12384 [39:11<25:33:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.85s]
Epoch 2: 2%|▏ | 308/12384 [39:11<25:31:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.85s]
Epoch 2: 2%|▏ | 308/12384 [39:19<25:31:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.36s]
Epoch 2: 2%|▏ | 309/12384 [39:19<25:31:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.36s]
Epoch 2: 2%|▏ | 309/12384 [39:27<25:31:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 3%|▎ | 310/12384 [39:27<25:31:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 3%|▎ | 310/12384 [39:34<25:31:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 3%|▎ | 311/12384 [39:34<25:30:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 3%|▎ | 311/12384 [39:42<25:30:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 2: 3%|▎ | 312/12384 [39:42<25:48:39, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 2: 3%|▎ | 312/12384 [39:50<25:48:39, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 3%|▎ | 313/12384 [39:50<25:43:50, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 3%|▎ | 313/12384 [39:57<25:43:50, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 2: 3%|▎ | 314/12384 [39:57<25:40:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 2: 3%|▎ | 314/12384 [40:05<25:40:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.48s]
Epoch 2: 3%|▎ | 315/12384 [40:05<25:38:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.48s]
Epoch 2: 3%|▎ | 315/12384 [40:12<25:38:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 3%|▎ | 316/12384 [40:12<25:34:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 3%|▎ | 316/12384 [40:20<25:34:57, 7.63s/it, loss=0.0003, acc=0.9990, iter_time=5.40s]
Epoch 2: 3%|▎ | 317/12384 [40:20<25:55:21, 7.73s/it, loss=0.0003, acc=0.9990, iter_time=5.40s]
Epoch 2: 3%|▎ | 317/12384 [40:28<25:55:21, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 2: 3%|▎ | 318/12384 [40:28<25:46:51, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 2: 3%|▎ | 318/12384 [40:36<25:46:51, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 3%|▎ | 319/12384 [40:36<25:42:16, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 3%|▎ | 319/12384 [40:43<25:42:16, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 3%|▎ | 320/12384 [40:43<25:43:29, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 3%|▎ | 320/12384 [40:51<25:43:29, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 3%|▎ | 321/12384 [40:51<25:44:25, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 3%|▎ | 321/12384 [40:59<25:44:25, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 3%|▎ | 322/12384 [40:59<25:44:08, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 3%|▎ | 322/12384 [41:06<25:44:08, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 3%|▎ | 323/12384 [41:06<25:39:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 3%|▎ | 323/12384 [41:14<25:39:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 3%|▎ | 324/12384 [41:14<25:36:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 3%|▎ | 324/12384 [41:22<25:36:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.10s]
Epoch 2: 3%|▎ | 325/12384 [41:22<25:34:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.10s]
Epoch 2: 3%|▎ | 325/12384 [41:29<25:34:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 2: 3%|▎ | 326/12384 [41:29<25:32:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 2: 3%|▎ | 326/12384 [41:37<25:32:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 3%|▎ | 327/12384 [41:37<25:33:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 3%|▎ | 327/12384 [41:44<25:33:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 3%|▎ | 328/12384 [41:44<25:32:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 3%|▎ | 328/12384 [41:52<25:32:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 3%|▎ | 329/12384 [41:52<25:30:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 3%|▎ | 329/12384 [42:00<25:30:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.64s]
Epoch 2: 3%|▎ | 330/12384 [42:00<25:33:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.64s]
Epoch 2: 3%|▎ | 330/12384 [42:07<25:33:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.64s]
Epoch 2: 3%|▎ | 331/12384 [42:07<25:37:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.64s]
Epoch 2: 3%|▎ | 331/12384 [42:15<25:37:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 2: 3%|▎ | 332/12384 [42:15<25:38:53, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 2: 3%|▎ | 332/12384 [42:23<25:38:53, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 3%|▎ | 333/12384 [42:23<25:34:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 3%|▎ | 333/12384 [42:30<25:34:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 3%|▎ | 334/12384 [42:30<25:32:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 3%|▎ | 334/12384 [42:38<25:32:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 3%|▎ | 335/12384 [42:38<25:31:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 3%|▎ | 335/12384 [42:45<25:31:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 2: 3%|▎ | 336/12384 [42:45<25:30:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 2: 3%|▎ | 336/12384 [42:53<25:30:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 3%|▎ | 337/12384 [42:53<25:47:16, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 3%|▎ | 337/12384 [43:01<25:47:16, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 3%|▎ | 338/12384 [43:01<25:41:47, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 3%|▎ | 338/12384 [43:09<25:41:47, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.60s]
Epoch 2: 3%|▎ | 339/12384 [43:09<25:38:07, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.60s]
Epoch 2: 3%|▎ | 339/12384 [43:16<25:38:07, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.66s]
Epoch 2: 3%|▎ | 340/12384 [43:16<25:35:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.66s]
Epoch 2: 3%|▎ | 340/12384 [43:24<25:35:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 2: 3%|▎ | 341/12384 [43:24<25:32:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 2: 3%|▎ | 341/12384 [43:31<25:32:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 2: 3%|▎ | 342/12384 [43:31<25:31:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 2: 3%|▎ | 342/12384 [43:39<25:31:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 3%|▎ | 343/12384 [43:39<25:29:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 3%|▎ | 343/12384 [43:47<25:29:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 3%|▎ | 344/12384 [43:47<25:49:59, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 3%|▎ | 344/12384 [43:55<25:49:59, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 2: 3%|▎ | 345/12384 [43:55<25:41:55, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 2: 3%|▎ | 345/12384 [44:02<25:41:55, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 2: 3%|▎ | 346/12384 [44:02<25:38:04, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 2: 3%|▎ | 346/12384 [44:10<25:38:04, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 3%|▎ | 347/12384 [44:10<25:35:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 3%|▎ | 347/12384 [44:18<25:35:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 2: 3%|▎ | 348/12384 [44:18<25:33:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 2: 3%|▎ | 348/12384 [44:25<25:33:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 2: 3%|▎ | 349/12384 [44:25<25:31:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 2: 3%|▎ | 349/12384 [44:33<25:31:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 3%|▎ | 350/12384 [44:33<25:30:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 3%|▎ | 350/12384 [44:40<25:30:22, 7.63s/it, loss=0.0002, acc=0.9983, iter_time=7.08s]
Epoch 2: 3%|▎ | 351/12384 [44:40<25:31:41, 7.64s/it, loss=0.0002, acc=0.9983, iter_time=7.08s]
Epoch 2: 3%|▎ | 351/12384 [44:48<25:31:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 2: 3%|▎ | 352/12384 [44:48<25:37:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 2: 3%|▎ | 352/12384 [44:56<25:37:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 3%|▎ | 353/12384 [44:56<25:33:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 3%|▎ | 353/12384 [45:03<25:33:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 3%|▎ | 354/12384 [45:03<25:30:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 3%|▎ | 354/12384 [45:11<25:30:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 3%|▎ | 355/12384 [45:11<25:27:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 3%|▎ | 355/12384 [45:19<25:27:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 2: 3%|▎ | 356/12384 [45:19<25:27:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 2: 3%|▎ | 356/12384 [45:26<25:27:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 2: 3%|▎ | 357/12384 [45:26<25:29:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 2: 3%|▎ | 357/12384 [45:34<25:29:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 2: 3%|▎ | 358/12384 [45:34<25:29:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 2: 3%|▎ | 358/12384 [45:41<25:29:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 3%|▎ | 359/12384 [45:41<25:28:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 3%|▎ | 359/12384 [45:49<25:28:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 3%|▎ | 360/12384 [45:49<25:28:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 3%|▎ | 360/12384 [45:57<25:28:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 3%|▎ | 361/12384 [45:57<25:27:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 3%|▎ | 361/12384 [46:04<25:27:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.61s]
Epoch 2: 3%|▎ | 362/12384 [46:04<25:26:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.61s]
Epoch 2: 3%|▎ | 362/12384 [46:12<25:26:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.49s]
Epoch 2: 3%|▎ | 363/12384 [46:12<25:27:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.49s]
Epoch 2: 3%|▎ | 363/12384 [46:20<25:27:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 2: 3%|▎ | 364/12384 [46:20<25:28:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 2: 3%|▎ | 364/12384 [46:27<25:28:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 2: 3%|▎ | 365/12384 [46:27<25:26:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 2: 3%|▎ | 365/12384 [46:35<25:26:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 2: 3%|▎ | 366/12384 [46:35<25:27:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 2: 3%|▎ | 366/12384 [46:42<25:27:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.77s]
Epoch 2: 3%|▎ | 367/12384 [46:42<25:26:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.77s]
Epoch 2: 3%|▎ | 367/12384 [46:50<25:26:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 3%|▎ | 368/12384 [46:50<25:26:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 3%|▎ | 368/12384 [46:58<25:26:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.24s]
Epoch 2: 3%|▎ | 369/12384 [46:58<25:26:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.24s]
Epoch 2: 3%|▎ | 369/12384 [47:06<25:26:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 2: 3%|▎ | 370/12384 [47:06<25:50:37, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 2: 3%|▎ | 370/12384 [47:13<25:50:37, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 3%|▎ | 371/12384 [47:13<25:43:37, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 3%|▎ | 371/12384 [47:21<25:43:37, 7.71s/it, loss=0.0002, acc=0.9991, iter_time=7.65s]
Epoch 2: 3%|▎ | 372/12384 [47:21<25:37:12, 7.68s/it, loss=0.0002, acc=0.9991, iter_time=7.65s]
Epoch 2: 3%|▎ | 372/12384 [47:29<25:37:12, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 2: 3%|▎ | 373/12384 [47:29<25:32:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 2: 3%|▎ | 373/12384 [47:36<25:32:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 2: 3%|▎ | 374/12384 [47:36<25:30:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 2: 3%|▎ | 374/12384 [47:44<25:30:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.63s]
Epoch 2: 3%|▎ | 375/12384 [47:44<25:29:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.63s]
Epoch 2: 3%|▎ | 375/12384 [47:51<25:29:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.57s]
Epoch 2: 3%|▎ | 376/12384 [47:51<25:26:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.57s]
Epoch 2: 3%|▎ | 376/12384 [47:59<25:26:57, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 2: 3%|▎ | 377/12384 [47:59<25:24:23, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 2: 3%|▎ | 377/12384 [48:07<25:24:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 3%|▎ | 378/12384 [48:07<25:26:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 3%|▎ | 378/12384 [48:14<25:26:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 3%|▎ | 379/12384 [48:14<25:32:31, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 3%|▎ | 379/12384 [48:22<25:32:31, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 3%|▎ | 380/12384 [48:22<25:30:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 3%|▎ | 380/12384 [48:30<25:30:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 3%|▎ | 381/12384 [48:30<25:31:25, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 3%|▎ | 381/12384 [48:37<25:31:25, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 3%|▎ | 382/12384 [48:37<25:27:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 3%|▎ | 382/12384 [48:45<25:27:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.61s]
Epoch 2: 3%|▎ | 383/12384 [48:45<25:25:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.61s]
Epoch 2: 3%|▎ | 383/12384 [48:52<25:25:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.61s]
Epoch 2: 3%|▎ | 384/12384 [48:52<25:25:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.61s]
Epoch 2: 3%|▎ | 384/12384 [49:00<25:25:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.41s]
Epoch 2: 3%|▎ | 385/12384 [49:00<25:23:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.41s]
Epoch 2: 3%|▎ | 385/12384 [49:08<25:23:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 2: 3%|▎ | 386/12384 [49:08<25:23:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 2: 3%|▎ | 386/12384 [49:15<25:23:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 3%|▎ | 387/12384 [49:15<25:23:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 3%|▎ | 387/12384 [49:23<25:23:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 3%|▎ | 388/12384 [49:23<25:40:35, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 3%|▎ | 388/12384 [49:31<25:40:35, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 3%|▎ | 389/12384 [49:31<25:33:59, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 3%|▎ | 389/12384 [49:38<25:33:59, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 3%|▎ | 390/12384 [49:38<25:33:59, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 3%|▎ | 390/12384 [49:46<25:33:59, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.65s]
Epoch 2: 3%|▎ | 391/12384 [49:46<25:30:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.65s]
Epoch 2: 3%|▎ | 391/12384 [49:54<25:30:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.57s]
Epoch 2: 3%|▎ | 392/12384 [49:54<25:26:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.57s]
Epoch 2: 3%|▎ | 392/12384 [50:01<25:26:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 3%|▎ | 393/12384 [50:01<25:30:41, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 3%|▎ | 393/12384 [50:09<25:30:41, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.12s]
Epoch 2: 3%|▎ | 394/12384 [50:09<25:27:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.12s]
Epoch 2: 3%|▎ | 394/12384 [50:17<25:27:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.99s]
Epoch 2: 3%|▎ | 395/12384 [50:17<25:25:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.99s]
Epoch 2: 3%|▎ | 395/12384 [50:24<25:25:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 2: 3%|▎ | 396/12384 [50:24<25:23:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 2: 3%|▎ | 396/12384 [50:32<25:23:01, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.54s]
Epoch 2: 3%|▎ | 397/12384 [50:32<25:41:37, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=5.54s]
Epoch 2: 3%|▎ | 397/12384 [50:40<25:41:37, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.86s]
Epoch 2: 3%|▎ | 398/12384 [50:40<25:33:55, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.86s]
Epoch 2: 3%|▎ | 398/12384 [50:47<25:33:55, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.72s]
Epoch 2: 3%|▎ | 399/12384 [50:47<25:32:55, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.72s]
Epoch 2: 3%|▎ | 399/12384 [50:55<25:32:55, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 3%|▎ | 400/12384 [50:55<25:31:22, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 3%|▎ | 400/12384 [51:03<25:31:22, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 2: 3%|▎ | 401/12384 [51:03<25:33:20, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 2: 3%|▎ | 401/12384 [51:10<25:33:20, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.33s]
Epoch 2: 3%|▎ | 402/12384 [51:10<25:31:02, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.33s]
Epoch 2: 3%|▎ | 402/12384 [51:18<25:31:02, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.86s]
Epoch 2: 3%|▎ | 403/12384 [51:18<25:38:16, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.86s]
Epoch 2: 3%|▎ | 403/12384 [51:26<25:38:16, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 2: 3%|▎ | 404/12384 [51:26<25:40:31, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 2: 3%|▎ | 404/12384 [51:34<25:40:31, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 3%|▎ | 405/12384 [51:34<25:35:26, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 3%|▎ | 405/12384 [51:41<25:35:26, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 3%|▎ | 406/12384 [51:41<25:30:53, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 3%|▎ | 406/12384 [51:49<25:30:53, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 3%|▎ | 407/12384 [51:49<25:28:50, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 3%|▎ | 407/12384 [51:56<25:28:50, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 3%|▎ | 408/12384 [51:56<25:25:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 3%|▎ | 408/12384 [52:04<25:25:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 3%|▎ | 409/12384 [52:04<25:23:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 3%|▎ | 409/12384 [52:12<25:23:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 2: 3%|▎ | 410/12384 [52:12<25:22:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 2: 3%|▎ | 410/12384 [52:19<25:22:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 3%|▎ | 411/12384 [52:19<25:22:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 3%|▎ | 411/12384 [52:27<25:22:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 2: 3%|▎ | 412/12384 [52:27<25:21:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 2: 3%|▎ | 412/12384 [52:35<25:21:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 3%|▎ | 413/12384 [52:35<25:19:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 3%|▎ | 413/12384 [52:42<25:19:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 3%|▎ | 414/12384 [52:42<25:37:01, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 3%|▎ | 414/12384 [52:50<25:37:01, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 3%|▎ | 415/12384 [52:50<25:31:09, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 3%|▎ | 415/12384 [52:58<25:31:09, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 3%|▎ | 416/12384 [52:58<25:26:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 3%|▎ | 416/12384 [53:05<25:26:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 3%|▎ | 417/12384 [53:05<25:23:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 3%|▎ | 417/12384 [53:13<25:23:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 3%|▎ | 418/12384 [53:13<25:21:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 3%|▎ | 418/12384 [53:20<25:21:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 2: 3%|▎ | 419/12384 [53:20<25:19:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 2: 3%|▎ | 419/12384 [53:28<25:19:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 2: 3%|▎ | 420/12384 [53:28<25:16:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 2: 3%|▎ | 420/12384 [53:36<25:16:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.36s]
Epoch 2: 3%|▎ | 421/12384 [53:36<25:18:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.36s]
Epoch 2: 3%|▎ | 421/12384 [53:43<25:18:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 3%|▎ | 422/12384 [53:43<25:21:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 3%|▎ | 422/12384 [53:51<25:21:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 3%|▎ | 423/12384 [53:51<25:43:51, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 3%|▎ | 423/12384 [53:59<25:43:51, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.36s]
Epoch 2: 3%|▎ | 424/12384 [53:59<25:37:41, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.36s]
Epoch 2: 3%|▎ | 424/12384 [54:07<25:37:41, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 3%|▎ | 425/12384 [54:07<25:31:30, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 3%|▎ | 425/12384 [54:14<25:31:30, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 3%|▎ | 426/12384 [54:14<25:26:10, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 3%|▎ | 426/12384 [54:22<25:26:10, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 3%|▎ | 427/12384 [54:22<25:26:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 3%|▎ | 427/12384 [54:29<25:26:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.37s]
Epoch 2: 3%|▎ | 428/12384 [54:29<25:24:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.37s]
Epoch 2: 3%|▎ | 428/12384 [54:37<25:24:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.06s]
Epoch 2: 3%|▎ | 429/12384 [54:37<25:21:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.06s]
Epoch 2: 3%|▎ | 429/12384 [54:45<25:21:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 2: 3%|▎ | 430/12384 [54:45<25:22:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 2: 3%|▎ | 430/12384 [54:52<25:22:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.64s]
Epoch 2: 3%|▎ | 431/12384 [54:52<25:21:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.64s]
Epoch 2: 3%|▎ | 431/12384 [55:00<25:21:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.04s]
Epoch 2: 3%|▎ | 432/12384 [55:00<25:20:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.04s]
Epoch 2: 3%|▎ | 432/12384 [55:08<25:20:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.40s]
Epoch 2: 3%|▎ | 433/12384 [55:08<25:21:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.40s]
Epoch 2: 3%|▎ | 433/12384 [55:15<25:21:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.44s]
Epoch 2: 4%|▎ | 434/12384 [55:15<25:20:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.44s]
Epoch 2: 4%|▎ | 434/12384 [55:23<25:20:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 2: 4%|▎ | 435/12384 [55:23<25:19:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 2: 4%|▎ | 435/12384 [55:30<25:19:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 4%|▎ | 436/12384 [55:30<25:17:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 4%|▎ | 436/12384 [55:38<25:17:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 4%|▎ | 437/12384 [55:38<25:15:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 4%|▎ | 437/12384 [55:46<25:15:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 4%|▎ | 438/12384 [55:46<25:16:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 4%|▎ | 438/12384 [55:53<25:16:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 4%|▎ | 439/12384 [55:53<25:14:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 4%|▎ | 439/12384 [56:01<25:14:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 2: 4%|▎ | 440/12384 [56:01<25:14:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 2: 4%|▎ | 440/12384 [56:09<25:14:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 2: 4%|▎ | 441/12384 [56:09<25:30:07, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 2: 4%|▎ | 441/12384 [56:16<25:30:07, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 2: 4%|▎ | 442/12384 [56:16<25:25:07, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 2: 4%|▎ | 442/12384 [56:24<25:25:07, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.38s]
Epoch 2: 4%|▎ | 443/12384 [56:24<25:20:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.38s]
Epoch 2: 4%|▎ | 443/12384 [56:32<25:20:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 2: 4%|▎ | 444/12384 [56:32<25:18:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 2: 4%|▎ | 444/12384 [56:39<25:18:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 2: 4%|▎ | 445/12384 [56:39<25:18:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 2: 4%|▎ | 445/12384 [56:47<25:18:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 4%|▎ | 446/12384 [56:47<25:17:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 4%|▎ | 446/12384 [56:54<25:17:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 4%|▎ | 447/12384 [56:54<25:16:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 4%|▎ | 447/12384 [57:02<25:16:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 4%|▎ | 448/12384 [57:02<25:16:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 4%|▎ | 448/12384 [57:10<25:16:03, 7.62s/it, loss=0.0004, acc=0.9979, iter_time=7.29s]
Epoch 2: 4%|▎ | 449/12384 [57:10<25:35:04, 7.72s/it, loss=0.0004, acc=0.9979, iter_time=7.29s]
Epoch 2: 4%|▎ | 449/12384 [57:18<25:35:04, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 4%|▎ | 450/12384 [57:18<25:29:58, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 4%|▎ | 450/12384 [57:25<25:29:58, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=3.89s]
Epoch 2: 4%|▎ | 451/12384 [57:25<25:25:20, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=3.89s]
Epoch 2: 4%|▎ | 451/12384 [57:33<25:25:20, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=11.38s]
Epoch 2: 4%|▎ | 452/12384 [57:33<25:23:31, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=11.38s]
Epoch 2: 4%|▎ | 452/12384 [57:40<25:23:31, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 2: 4%|▎ | 453/12384 [57:40<25:19:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 2: 4%|▎ | 453/12384 [57:48<25:19:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 2: 4%|▎ | 454/12384 [57:48<25:17:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 2: 4%|▎ | 454/12384 [57:56<25:17:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 2: 4%|▎ | 455/12384 [57:56<25:15:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 2: 4%|▎ | 455/12384 [58:03<25:15:16, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=8.32s]
Epoch 2: 4%|▎ | 456/12384 [58:03<25:18:00, 7.64s/it, loss=0.0001, acc=0.9999, iter_time=8.32s]
Epoch 2: 4%|▎ | 456/12384 [58:11<25:18:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.25s]
Epoch 2: 4%|▎ | 457/12384 [58:11<25:16:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.25s]
Epoch 2: 4%|▎ | 457/12384 [58:19<25:16:14, 7.63s/it, loss=0.0007, acc=1.0000, iter_time=10.64s]
Epoch 2: 4%|▎ | 458/12384 [58:19<25:15:38, 7.63s/it, loss=0.0007, acc=1.0000, iter_time=10.64s]
Epoch 2: 4%|▎ | 458/12384 [58:26<25:15:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 4%|▎ | 459/12384 [58:26<25:14:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 4%|▎ | 459/12384 [58:34<25:14:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 4%|▎ | 460/12384 [58:34<25:13:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 4%|▎ | 460/12384 [58:41<25:13:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 4%|▎ | 461/12384 [58:41<25:16:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 4%|▎ | 461/12384 [58:49<25:16:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 2: 4%|▎ | 462/12384 [58:49<25:14:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 2: 4%|▎ | 462/12384 [58:57<25:14:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 2: 4%|▎ | 463/12384 [58:57<25:12:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 2: 4%|▎ | 463/12384 [59:04<25:12:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 4%|▎ | 464/12384 [59:04<25:11:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 4%|▎ | 464/12384 [59:12<25:11:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 2: 4%|▍ | 465/12384 [59:12<25:11:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 2: 4%|▍ | 465/12384 [59:19<25:11:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 4%|▍ | 466/12384 [59:19<25:12:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 4%|▍ | 466/12384 [59:27<25:12:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 4%|▍ | 467/12384 [59:27<25:28:44, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 4%|▍ | 467/12384 [59:35<25:28:44, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 2: 4%|▍ | 468/12384 [59:35<25:24:34, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 2: 4%|▍ | 468/12384 [59:43<25:24:34, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 2: 4%|▍ | 469/12384 [59:43<25:20:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 2: 4%|▍ | 469/12384 [59:50<25:20:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 4%|▍ | 470/12384 [59:50<25:17:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 4%|▍ | 470/12384 [59:58<25:17:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 4%|▍ | 471/12384 [59:58<25:16:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 4%|▍ | 471/12384 [1:00:05<25:16:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 4%|▍ | 472/12384 [1:00:05<25:14:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 4%|▍ | 472/12384 [1:00:13<25:14:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 4%|▍ | 473/12384 [1:00:13<25:16:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 4%|▍ | 473/12384 [1:00:21<25:16:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 4%|▍ | 474/12384 [1:00:21<25:15:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 4%|▍ | 474/12384 [1:00:29<25:15:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 4%|▍ | 475/12384 [1:00:29<25:33:44, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 4%|▍ | 475/12384 [1:00:36<25:33:44, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 2: 4%|▍ | 476/12384 [1:00:36<25:27:15, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 2: 4%|▍ | 476/12384 [1:00:44<25:27:15, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.33s]
Epoch 2: 4%|▍ | 477/12384 [1:00:44<25:21:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.33s]
Epoch 2: 4%|▍ | 477/12384 [1:00:52<25:21:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 2: 4%|▍ | 478/12384 [1:00:52<25:19:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 2: 4%|▍ | 478/12384 [1:00:59<25:19:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.74s]
Epoch 2: 4%|▍ | 479/12384 [1:00:59<25:19:13, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.74s]
Epoch 2: 4%|▍ | 479/12384 [1:01:07<25:19:13, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 4%|▍ | 480/12384 [1:01:07<25:20:58, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 4%|▍ | 480/12384 [1:01:14<25:20:58, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 2: 4%|▍ | 481/12384 [1:01:14<25:17:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 2: 4%|▍ | 481/12384 [1:01:22<25:17:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.10s]
Epoch 2: 4%|▍ | 482/12384 [1:01:22<25:14:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.10s]
Epoch 2: 4%|▍ | 482/12384 [1:01:30<25:14:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.28s]
Epoch 2: 4%|▍ | 483/12384 [1:01:30<25:13:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.28s]
Epoch 2: 4%|▍ | 483/12384 [1:01:37<25:13:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 2: 4%|▍ | 484/12384 [1:01:37<25:12:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 2: 4%|▍ | 484/12384 [1:01:45<25:12:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 4%|▍ | 485/12384 [1:01:45<25:12:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 4%|▍ | 485/12384 [1:01:53<25:12:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 2: 4%|▍ | 486/12384 [1:01:53<25:09:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 2: 4%|▍ | 486/12384 [1:02:00<25:09:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 2: 4%|▍ | 487/12384 [1:02:00<25:08:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 2: 4%|▍ | 487/12384 [1:02:08<25:08:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 4%|▍ | 488/12384 [1:02:08<25:09:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 4%|▍ | 488/12384 [1:02:15<25:09:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.16s]
Epoch 2: 4%|▍ | 489/12384 [1:02:15<25:09:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.16s]
Epoch 2: 4%|▍ | 489/12384 [1:02:23<25:09:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 2: 4%|▍ | 490/12384 [1:02:23<25:08:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 2: 4%|▍ | 490/12384 [1:02:31<25:08:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 4%|▍ | 491/12384 [1:02:31<25:07:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 4%|▍ | 491/12384 [1:02:38<25:07:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 2: 4%|▍ | 492/12384 [1:02:38<25:06:57, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 2: 4%|▍ | 492/12384 [1:02:46<25:06:57, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 2: 4%|▍ | 493/12384 [1:02:46<25:22:46, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 2: 4%|▍ | 493/12384 [1:02:54<25:22:46, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 2: 4%|▍ | 494/12384 [1:02:54<25:16:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 2: 4%|▍ | 494/12384 [1:03:01<25:16:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 2: 4%|▍ | 495/12384 [1:03:01<25:14:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 2: 4%|▍ | 495/12384 [1:03:09<25:14:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.49s]
Epoch 2: 4%|▍ | 496/12384 [1:03:09<25:11:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.49s]
Epoch 2: 4%|▍ | 496/12384 [1:03:16<25:11:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.47s]
Epoch 2: 4%|▍ | 497/12384 [1:03:16<25:11:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.47s]
Epoch 2: 4%|▍ | 497/12384 [1:03:24<25:11:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.36s]
Epoch 2: 4%|▍ | 498/12384 [1:03:24<25:10:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.36s]
Epoch 2: 4%|▍ | 498/12384 [1:03:32<25:10:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 4%|▍ | 499/12384 [1:03:32<25:10:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 4%|▍ | 499/12384 [1:03:39<25:10:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.33s]
Epoch 2: 4%|▍ | 500/12384 [1:03:39<25:08:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.33s]
Epoch 2: 4%|▍ | 500/12384 [1:03:47<25:08:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.37s]
Epoch 2: 4%|▍ | 501/12384 [1:03:47<25:34:11, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=10.37s]
Epoch 2: 4%|▍ | 501/12384 [1:03:55<25:34:11, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 2: 4%|▍ | 502/12384 [1:03:55<25:30:21, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 2: 4%|▍ | 502/12384 [1:04:03<25:30:21, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 4%|▍ | 503/12384 [1:04:03<25:23:43, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 4%|▍ | 503/12384 [1:04:10<25:23:43, 7.69s/it, loss=0.0002, acc=0.9994, iter_time=8.00s]
Epoch 2: 4%|▍ | 504/12384 [1:04:10<25:18:48, 7.67s/it, loss=0.0002, acc=0.9994, iter_time=8.00s]
Epoch 2: 4%|▍ | 504/12384 [1:04:18<25:18:48, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 4%|▍ | 505/12384 [1:04:18<25:15:40, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 4%|▍ | 505/12384 [1:04:26<25:15:40, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.08s]
Epoch 2: 4%|▍ | 506/12384 [1:04:26<25:14:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.08s]
Epoch 2: 4%|▍ | 506/12384 [1:04:33<25:14:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 2: 4%|▍ | 507/12384 [1:04:33<25:12:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 2: 4%|▍ | 507/12384 [1:04:41<25:12:10, 7.64s/it, loss=0.0002, acc=0.9993, iter_time=7.63s]
Epoch 2: 4%|▍ | 508/12384 [1:04:41<25:10:59, 7.63s/it, loss=0.0002, acc=0.9993, iter_time=7.63s]
Epoch 2: 4%|▍ | 508/12384 [1:04:48<25:10:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 4%|▍ | 509/12384 [1:04:48<25:09:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 4%|▍ | 509/12384 [1:04:56<25:09:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 4%|▍ | 510/12384 [1:04:56<25:08:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 4%|▍ | 510/12384 [1:05:04<25:08:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 4%|▍ | 511/12384 [1:05:04<25:08:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 4%|▍ | 511/12384 [1:05:11<25:08:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 4%|▍ | 512/12384 [1:05:11<25:07:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 4%|▍ | 512/12384 [1:05:19<25:07:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 4%|▍ | 513/12384 [1:05:19<25:07:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 4%|▍ | 513/12384 [1:05:26<25:07:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 2: 4%|▍ | 514/12384 [1:05:26<25:07:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 2: 4%|▍ | 514/12384 [1:05:34<25:07:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 2: 4%|▍ | 515/12384 [1:05:34<25:09:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 2: 4%|▍ | 515/12384 [1:05:42<25:09:21, 7.63s/it, loss=0.0013, acc=0.9963, iter_time=7.66s]
Epoch 2: 4%|▍ | 516/12384 [1:05:42<25:07:39, 7.62s/it, loss=0.0013, acc=0.9963, iter_time=7.66s]
Epoch 2: 4%|▍ | 516/12384 [1:05:49<25:07:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 4%|▍ | 517/12384 [1:05:49<25:05:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 4%|▍ | 517/12384 [1:05:57<25:05:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 4%|▍ | 518/12384 [1:05:57<25:09:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 4%|▍ | 518/12384 [1:06:05<25:09:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.44s]
Epoch 2: 4%|▍ | 519/12384 [1:06:05<25:07:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.44s]
Epoch 2: 4%|▍ | 519/12384 [1:06:12<25:07:42, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.24s]
Epoch 2: 4%|▍ | 520/12384 [1:06:12<25:08:08, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=10.24s]
Epoch 2: 4%|▍ | 520/12384 [1:06:20<25:08:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 4%|▍ | 521/12384 [1:06:20<25:06:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 4%|▍ | 521/12384 [1:06:27<25:06:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 4%|▍ | 522/12384 [1:06:27<25:07:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 4%|▍ | 522/12384 [1:06:35<25:07:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 4%|▍ | 523/12384 [1:06:35<25:07:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 4%|▍ | 523/12384 [1:06:43<25:07:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 4%|▍ | 524/12384 [1:06:43<25:07:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 4%|▍ | 524/12384 [1:06:50<25:07:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 2: 4%|▍ | 525/12384 [1:06:50<25:05:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 2: 4%|▍ | 525/12384 [1:06:58<25:05:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 2: 4%|▍ | 526/12384 [1:06:58<25:05:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 2: 4%|▍ | 526/12384 [1:07:06<25:05:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 2: 4%|▍ | 527/12384 [1:07:06<25:06:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 2: 4%|▍ | 527/12384 [1:07:14<25:06:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 2: 4%|▍ | 528/12384 [1:07:14<25:24:58, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 2: 4%|▍ | 528/12384 [1:07:21<25:24:58, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.45s]
Epoch 2: 4%|▍ | 529/12384 [1:07:21<25:17:39, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.45s]
Epoch 2: 4%|▍ | 529/12384 [1:07:29<25:17:39, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 4%|▍ | 530/12384 [1:07:29<25:12:42, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 4%|▍ | 530/12384 [1:07:36<25:12:42, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 4%|▍ | 531/12384 [1:07:36<25:09:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 4%|▍ | 531/12384 [1:07:44<25:09:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.40s]
Epoch 2: 4%|▍ | 532/12384 [1:07:44<25:11:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.40s]
Epoch 2: 4%|▍ | 532/12384 [1:07:52<25:11:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.16s]
Epoch 2: 4%|▍ | 533/12384 [1:07:52<25:08:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.16s]
Epoch 2: 4%|▍ | 533/12384 [1:07:59<25:08:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 2: 4%|▍ | 534/12384 [1:07:59<25:05:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 2: 4%|▍ | 534/12384 [1:08:07<25:05:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 4%|▍ | 535/12384 [1:08:07<25:04:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 4%|▍ | 535/12384 [1:08:14<25:04:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 4%|▍ | 536/12384 [1:08:14<25:04:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 4%|▍ | 536/12384 [1:08:22<25:04:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 4%|▍ | 537/12384 [1:08:22<25:04:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 4%|▍ | 537/12384 [1:08:30<25:04:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 4%|▍ | 538/12384 [1:08:30<25:04:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 4%|▍ | 538/12384 [1:08:37<25:04:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 2: 4%|▍ | 539/12384 [1:08:37<25:04:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 2: 4%|▍ | 539/12384 [1:08:45<25:04:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 4%|▍ | 540/12384 [1:08:45<25:02:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 4%|▍ | 540/12384 [1:08:52<25:02:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 2: 4%|▍ | 541/12384 [1:08:52<25:02:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 2: 4%|▍ | 541/12384 [1:09:00<25:02:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 2: 4%|▍ | 542/12384 [1:09:00<25:01:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 2: 4%|▍ | 542/12384 [1:09:08<25:01:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 4%|▍ | 543/12384 [1:09:08<25:00:31, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 4%|▍ | 543/12384 [1:09:15<25:00:31, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 4%|▍ | 544/12384 [1:09:15<25:01:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 4%|▍ | 544/12384 [1:09:23<25:01:47, 7.61s/it, loss=0.0004, acc=1.0000, iter_time=7.91s]
Epoch 2: 4%|▍ | 545/12384 [1:09:23<25:15:29, 7.68s/it, loss=0.0004, acc=1.0000, iter_time=7.91s]
Epoch 2: 4%|▍ | 545/12384 [1:09:31<25:15:29, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 4%|▍ | 546/12384 [1:09:31<25:11:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 4%|▍ | 546/12384 [1:09:38<25:11:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 2: 4%|▍ | 547/12384 [1:09:38<25:07:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 2: 4%|▍ | 547/12384 [1:09:46<25:07:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 2: 4%|▍ | 548/12384 [1:09:46<25:04:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 2: 4%|▍ | 548/12384 [1:09:54<25:04:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 2: 4%|▍ | 549/12384 [1:09:54<25:03:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 2: 4%|▍ | 549/12384 [1:10:01<25:03:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 2: 4%|▍ | 550/12384 [1:10:01<25:02:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 2: 4%|▍ | 550/12384 [1:10:09<25:02:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 2: 4%|▍ | 551/12384 [1:10:09<25:02:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 2: 4%|▍ | 551/12384 [1:10:16<25:02:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 4%|▍ | 552/12384 [1:10:16<25:03:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 4%|▍ | 552/12384 [1:10:24<25:03:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 4%|▍ | 553/12384 [1:10:24<25:02:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 4%|▍ | 553/12384 [1:10:32<25:02:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 4%|▍ | 554/12384 [1:10:32<25:20:49, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 4%|▍ | 554/12384 [1:10:40<25:20:49, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 4%|▍ | 555/12384 [1:10:40<25:14:53, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 4%|▍ | 555/12384 [1:10:47<25:14:53, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 4%|▍ | 556/12384 [1:10:47<25:09:41, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 4%|▍ | 556/12384 [1:10:55<25:09:41, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 2: 4%|▍ | 557/12384 [1:10:55<25:06:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 2: 4%|▍ | 557/12384 [1:11:02<25:06:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 5%|▍ | 558/12384 [1:11:02<25:03:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 5%|▍ | 558/12384 [1:11:10<25:03:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 5%|▍ | 559/12384 [1:11:10<25:01:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 5%|▍ | 559/12384 [1:11:18<25:01:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 5%|▍ | 560/12384 [1:11:18<25:04:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 5%|▍ | 560/12384 [1:11:25<25:04:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 2: 5%|▍ | 561/12384 [1:11:25<25:01:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 2: 5%|▍ | 561/12384 [1:11:33<25:01:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 2: 5%|▍ | 562/12384 [1:11:33<25:06:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 2: 5%|▍ | 562/12384 [1:11:41<25:06:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 2: 5%|▍ | 563/12384 [1:11:41<25:04:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 2: 5%|▍ | 563/12384 [1:11:48<25:04:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 2: 5%|▍ | 564/12384 [1:11:48<25:06:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 2: 5%|▍ | 564/12384 [1:11:56<25:06:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 5%|▍ | 565/12384 [1:11:56<25:08:37, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 5%|▍ | 565/12384 [1:12:04<25:08:37, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 5%|▍ | 566/12384 [1:12:04<25:04:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 5%|▍ | 566/12384 [1:12:11<25:04:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 2: 5%|▍ | 567/12384 [1:12:11<25:01:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 2: 5%|▍ | 567/12384 [1:12:19<25:01:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.67s]
Epoch 2: 5%|▍ | 568/12384 [1:12:19<25:01:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.67s]
Epoch 2: 5%|▍ | 568/12384 [1:12:26<25:01:34, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=5.40s]
Epoch 2: 5%|▍ | 569/12384 [1:12:26<25:00:09, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=5.40s]
Epoch 2: 5%|▍ | 569/12384 [1:12:34<25:00:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.86s]
Epoch 2: 5%|▍ | 570/12384 [1:12:34<24:59:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.86s]
Epoch 2: 5%|▍ | 570/12384 [1:12:42<24:59:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 5%|▍ | 571/12384 [1:12:42<25:16:15, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 5%|▍ | 571/12384 [1:12:49<25:16:15, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 2: 5%|▍ | 572/12384 [1:12:49<25:12:12, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 2: 5%|▍ | 572/12384 [1:12:57<25:12:12, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 2: 5%|▍ | 573/12384 [1:12:57<25:09:01, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 2: 5%|▍ | 573/12384 [1:13:05<25:09:01, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 2: 5%|▍ | 574/12384 [1:13:05<25:06:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 2: 5%|▍ | 574/12384 [1:13:12<25:06:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 5%|▍ | 575/12384 [1:13:12<25:04:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 5%|▍ | 575/12384 [1:13:20<25:04:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.49s]
Epoch 2: 5%|▍ | 576/12384 [1:13:20<25:02:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.49s]
Epoch 2: 5%|▍ | 576/12384 [1:13:28<25:02:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 5%|▍ | 577/12384 [1:13:28<25:00:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 5%|▍ | 577/12384 [1:13:35<25:00:20, 7.62s/it, loss=0.0011, acc=0.9971, iter_time=5.59s]
Epoch 2: 5%|▍ | 578/12384 [1:13:35<25:01:13, 7.63s/it, loss=0.0011, acc=0.9971, iter_time=5.59s]
Epoch 2: 5%|▍ | 578/12384 [1:13:43<25:01:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 2: 5%|▍ | 579/12384 [1:13:43<24:58:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 2: 5%|▍ | 579/12384 [1:13:50<24:58:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 2: 5%|▍ | 580/12384 [1:13:50<24:57:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 2: 5%|▍ | 580/12384 [1:13:58<24:57:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 5%|▍ | 581/12384 [1:13:58<25:17:47, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 5%|▍ | 581/12384 [1:14:06<25:17:47, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.38s]
Epoch 2: 5%|▍ | 582/12384 [1:14:06<25:15:12, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.38s]
Epoch 2: 5%|▍ | 582/12384 [1:14:14<25:15:12, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 5%|▍ | 583/12384 [1:14:14<25:10:33, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 5%|▍ | 583/12384 [1:14:21<25:10:33, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 5%|▍ | 584/12384 [1:14:21<25:06:06, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 5%|▍ | 584/12384 [1:14:29<25:06:06, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.35s]
Epoch 2: 5%|▍ | 585/12384 [1:14:29<25:09:20, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.35s]
Epoch 2: 5%|▍ | 585/12384 [1:14:37<25:09:20, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.61s]
Epoch 2: 5%|▍ | 586/12384 [1:14:37<25:06:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.61s]
Epoch 2: 5%|▍ | 586/12384 [1:14:44<25:06:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 5%|▍ | 587/12384 [1:14:44<25:03:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 5%|▍ | 587/12384 [1:14:52<25:03:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 5%|▍ | 588/12384 [1:14:52<25:02:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 5%|▍ | 588/12384 [1:14:59<25:02:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 2: 5%|▍ | 589/12384 [1:14:59<25:00:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 2: 5%|▍ | 589/12384 [1:15:07<25:00:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 2: 5%|▍ | 590/12384 [1:15:07<24:58:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 2: 5%|▍ | 590/12384 [1:15:15<24:58:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 5%|▍ | 591/12384 [1:15:15<24:56:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 5%|▍ | 591/12384 [1:15:22<24:56:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 5%|▍ | 592/12384 [1:15:22<24:55:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 5%|▍ | 592/12384 [1:15:30<24:55:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.01s]
Epoch 2: 5%|▍ | 593/12384 [1:15:30<24:56:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.01s]
Epoch 2: 5%|▍ | 593/12384 [1:15:38<24:56:01, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.82s]
Epoch 2: 5%|▍ | 594/12384 [1:15:38<24:58:06, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.82s]
Epoch 2: 5%|▍ | 594/12384 [1:15:45<24:58:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 5%|▍ | 595/12384 [1:15:45<24:56:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 5%|▍ | 595/12384 [1:15:53<24:56:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 5%|▍ | 596/12384 [1:15:53<24:56:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 5%|▍ | 596/12384 [1:16:00<24:56:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 2: 5%|▍ | 597/12384 [1:16:00<24:54:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 2: 5%|▍ | 597/12384 [1:16:08<24:54:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.33s]
Epoch 2: 5%|▍ | 598/12384 [1:16:08<25:10:57, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.33s]
Epoch 2: 5%|▍ | 598/12384 [1:16:16<25:10:57, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.50s]
Epoch 2: 5%|▍ | 599/12384 [1:16:16<25:04:37, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.50s]
Epoch 2: 5%|▍ | 599/12384 [1:16:24<25:04:37, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.08s]
Epoch 2: 5%|▍ | 600/12384 [1:16:24<25:07:07, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.08s]
Epoch 2: 5%|▍ | 600/12384 [1:16:31<25:07:07, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 2: 5%|▍ | 601/12384 [1:16:31<25:08:43, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 2: 5%|▍ | 601/12384 [1:16:39<25:08:43, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.63s]
Epoch 2: 5%|▍ | 602/12384 [1:16:39<25:04:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.63s]
Epoch 2: 5%|▍ | 602/12384 [1:16:46<25:04:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 2: 5%|▍ | 603/12384 [1:16:46<25:01:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 2: 5%|▍ | 603/12384 [1:16:54<25:01:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.95s]
Epoch 2: 5%|▍ | 604/12384 [1:16:54<24:58:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.95s]
Epoch 2: 5%|▍ | 604/12384 [1:17:02<24:58:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 5%|▍ | 605/12384 [1:17:02<25:01:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 5%|▍ | 605/12384 [1:17:09<25:01:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 5%|▍ | 606/12384 [1:17:09<24:59:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 5%|▍ | 606/12384 [1:17:17<24:59:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 5%|▍ | 607/12384 [1:17:17<25:17:12, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 5%|▍ | 607/12384 [1:17:25<25:17:12, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 2: 5%|▍ | 608/12384 [1:17:25<25:10:19, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 2: 5%|▍ | 608/12384 [1:17:32<25:10:19, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 5%|▍ | 609/12384 [1:17:32<25:03:51, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 5%|▍ | 609/12384 [1:17:40<25:03:51, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 5%|▍ | 610/12384 [1:17:40<24:59:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 5%|▍ | 610/12384 [1:17:48<24:59:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 5%|▍ | 611/12384 [1:17:48<24:57:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 5%|▍ | 611/12384 [1:17:55<24:57:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 5%|▍ | 612/12384 [1:17:55<24:57:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 5%|▍ | 612/12384 [1:18:03<24:57:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 2: 5%|▍ | 613/12384 [1:18:03<24:55:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 2: 5%|▍ | 613/12384 [1:18:11<24:55:32, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=9.91s]
Epoch 2: 5%|▍ | 614/12384 [1:18:11<24:54:22, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=9.91s]
Epoch 2: 5%|▍ | 614/12384 [1:18:18<24:54:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 5%|▍ | 615/12384 [1:18:18<24:54:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 5%|▍ | 615/12384 [1:18:26<24:54:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 5%|▍ | 616/12384 [1:18:26<24:54:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 5%|▍ | 616/12384 [1:18:33<24:54:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 5%|▍ | 617/12384 [1:18:33<24:54:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 5%|▍ | 617/12384 [1:18:41<24:54:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 5%|▍ | 618/12384 [1:18:41<24:53:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 5%|▍ | 618/12384 [1:18:49<24:53:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 5%|▍ | 619/12384 [1:18:49<24:52:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 5%|▍ | 619/12384 [1:18:56<24:52:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 5%|▌ | 620/12384 [1:18:56<24:51:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 5%|▌ | 620/12384 [1:19:04<24:51:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 5%|▌ | 621/12384 [1:19:04<24:51:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 5%|▌ | 621/12384 [1:19:11<24:51:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 2: 5%|▌ | 622/12384 [1:19:11<24:50:33, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 2: 5%|▌ | 622/12384 [1:19:19<24:50:33, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 2: 5%|▌ | 623/12384 [1:19:19<24:50:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 2: 5%|▌ | 623/12384 [1:19:27<24:50:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 2: 5%|▌ | 624/12384 [1:19:27<24:56:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 2: 5%|▌ | 624/12384 [1:19:35<24:56:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 5%|▌ | 625/12384 [1:19:35<25:09:56, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 5%|▌ | 625/12384 [1:19:42<25:09:56, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 5%|▌ | 626/12384 [1:19:42<25:03:43, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 5%|▌ | 626/12384 [1:19:50<25:03:43, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 2: 5%|▌ | 627/12384 [1:19:50<24:58:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 2: 5%|▌ | 627/12384 [1:19:57<24:58:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.93s]
Epoch 2: 5%|▌ | 628/12384 [1:19:57<24:56:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.93s]
Epoch 2: 5%|▌ | 628/12384 [1:20:05<24:56:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 2: 5%|▌ | 629/12384 [1:20:05<24:54:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 2: 5%|▌ | 629/12384 [1:20:13<24:54:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 5%|▌ | 630/12384 [1:20:13<24:54:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 5%|▌ | 630/12384 [1:20:20<24:54:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 5%|▌ | 631/12384 [1:20:20<24:53:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 5%|▌ | 631/12384 [1:20:28<24:53:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 2: 5%|▌ | 632/12384 [1:20:28<24:54:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 2: 5%|▌ | 632/12384 [1:20:36<24:54:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 5%|▌ | 633/12384 [1:20:36<25:13:32, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 5%|▌ | 633/12384 [1:20:43<25:13:32, 7.73s/it, loss=0.0006, acc=0.9981, iter_time=7.89s]
Epoch 2: 5%|▌ | 634/12384 [1:20:43<25:05:25, 7.69s/it, loss=0.0006, acc=0.9981, iter_time=7.89s]
Epoch 2: 5%|▌ | 634/12384 [1:20:51<25:05:25, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 5%|▌ | 635/12384 [1:20:51<25:00:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 5%|▌ | 635/12384 [1:20:59<25:00:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 5%|▌ | 636/12384 [1:20:59<24:57:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 5%|▌ | 636/12384 [1:21:06<24:57:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 5%|▌ | 637/12384 [1:21:06<24:54:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 5%|▌ | 637/12384 [1:21:14<24:54:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 2: 5%|▌ | 638/12384 [1:21:14<24:53:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 2: 5%|▌ | 638/12384 [1:21:21<24:53:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 2: 5%|▌ | 639/12384 [1:21:21<24:52:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 2: 5%|▌ | 639/12384 [1:21:29<24:52:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 2: 5%|▌ | 640/12384 [1:21:29<24:51:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 2: 5%|▌ | 640/12384 [1:21:37<24:51:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.28s]
Epoch 2: 5%|▌ | 641/12384 [1:21:37<24:50:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.28s]
Epoch 2: 5%|▌ | 641/12384 [1:21:44<24:50:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 2: 5%|▌ | 642/12384 [1:21:44<24:50:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 2: 5%|▌ | 642/12384 [1:21:52<24:50:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 5%|▌ | 643/12384 [1:21:52<24:49:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 5%|▌ | 643/12384 [1:22:00<24:49:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 5%|▌ | 644/12384 [1:22:00<24:52:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 5%|▌ | 644/12384 [1:22:07<24:52:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 5%|▌ | 645/12384 [1:22:07<24:54:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 5%|▌ | 645/12384 [1:22:15<24:54:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.08s]
Epoch 2: 5%|▌ | 646/12384 [1:22:15<24:51:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.08s]
Epoch 2: 5%|▌ | 646/12384 [1:22:22<24:51:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 2: 5%|▌ | 647/12384 [1:22:22<24:51:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 2: 5%|▌ | 647/12384 [1:22:30<24:51:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 5%|▌ | 648/12384 [1:22:30<24:51:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 5%|▌ | 648/12384 [1:22:38<24:51:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 5%|▌ | 649/12384 [1:22:38<24:50:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 5%|▌ | 649/12384 [1:22:45<24:50:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 5%|▌ | 650/12384 [1:22:45<24:49:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 5%|▌ | 650/12384 [1:22:53<24:49:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 5%|▌ | 651/12384 [1:22:53<25:05:55, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 5%|▌ | 651/12384 [1:23:01<25:05:55, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.31s]
Epoch 2: 5%|▌ | 652/12384 [1:23:01<25:01:13, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.31s]
Epoch 2: 5%|▌ | 652/12384 [1:23:09<25:01:13, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.92s]
Epoch 2: 5%|▌ | 653/12384 [1:23:09<25:03:55, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.92s]
Epoch 2: 5%|▌ | 653/12384 [1:23:16<25:03:55, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 2: 5%|▌ | 654/12384 [1:23:16<24:59:58, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 2: 5%|▌ | 654/12384 [1:23:24<24:59:58, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 5%|▌ | 655/12384 [1:23:24<24:58:25, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 5%|▌ | 655/12384 [1:23:31<24:58:25, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 5%|▌ | 656/12384 [1:23:31<24:55:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 5%|▌ | 656/12384 [1:23:39<24:55:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 5%|▌ | 657/12384 [1:23:39<24:53:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 5%|▌ | 657/12384 [1:23:47<24:53:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 2: 5%|▌ | 658/12384 [1:23:47<24:51:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 2: 5%|▌ | 658/12384 [1:23:55<24:51:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 2: 5%|▌ | 659/12384 [1:23:55<25:10:08, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 2: 5%|▌ | 659/12384 [1:24:02<25:10:08, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 5%|▌ | 660/12384 [1:24:02<25:03:41, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 5%|▌ | 660/12384 [1:24:10<25:03:41, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=3.94s]
Epoch 2: 5%|▌ | 661/12384 [1:24:10<25:07:24, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=3.94s]
Epoch 2: 5%|▌ | 661/12384 [1:24:18<25:07:24, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=11.15s]
Epoch 2: 5%|▌ | 662/12384 [1:24:18<25:00:55, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=11.15s]
Epoch 2: 5%|▌ | 662/12384 [1:24:25<25:00:55, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 5%|▌ | 663/12384 [1:24:25<24:56:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 5%|▌ | 663/12384 [1:24:33<24:56:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 5%|▌ | 664/12384 [1:24:33<24:54:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 5%|▌ | 664/12384 [1:24:40<24:54:45, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 2: 5%|▌ | 665/12384 [1:24:40<24:53:22, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 2: 5%|▌ | 665/12384 [1:24:48<24:53:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 5%|▌ | 666/12384 [1:24:48<24:51:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 5%|▌ | 666/12384 [1:24:56<24:51:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 2: 5%|▌ | 667/12384 [1:24:56<24:50:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 2: 5%|▌ | 667/12384 [1:25:03<24:50:20, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=9.71s]
Epoch 2: 5%|▌ | 668/12384 [1:25:03<24:48:50, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=9.71s]
Epoch 2: 5%|▌ | 668/12384 [1:25:11<24:48:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 2: 5%|▌ | 669/12384 [1:25:11<24:48:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 2: 5%|▌ | 669/12384 [1:25:19<24:48:07, 7.62s/it, loss=0.0005, acc=0.9998, iter_time=7.90s]
Epoch 2: 5%|▌ | 670/12384 [1:25:19<24:47:42, 7.62s/it, loss=0.0005, acc=0.9998, iter_time=7.90s]
Epoch 2: 5%|▌ | 670/12384 [1:25:26<24:47:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.78s]
Epoch 2: 5%|▌ | 671/12384 [1:25:26<24:45:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.78s]
Epoch 2: 5%|▌ | 671/12384 [1:25:34<24:45:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.81s]
Epoch 2: 5%|▌ | 672/12384 [1:25:34<24:47:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.81s]
Epoch 2: 5%|▌ | 672/12384 [1:25:41<24:47:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 5%|▌ | 673/12384 [1:25:41<24:45:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 5%|▌ | 673/12384 [1:25:49<24:45:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 5%|▌ | 674/12384 [1:25:49<24:46:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 5%|▌ | 674/12384 [1:25:57<24:46:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 2: 5%|▌ | 675/12384 [1:25:57<24:50:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 2: 5%|▌ | 675/12384 [1:26:04<24:50:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.50s]
Epoch 2: 5%|▌ | 676/12384 [1:26:04<24:48:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.50s]
Epoch 2: 5%|▌ | 676/12384 [1:26:12<24:48:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 2: 5%|▌ | 677/12384 [1:26:12<24:47:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 2: 5%|▌ | 677/12384 [1:26:20<24:47:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 2: 5%|▌ | 678/12384 [1:26:20<24:44:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 2: 5%|▌ | 678/12384 [1:26:27<24:44:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 5%|▌ | 679/12384 [1:26:27<24:45:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 5%|▌ | 679/12384 [1:26:35<24:45:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 5%|▌ | 680/12384 [1:26:35<24:46:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 5%|▌ | 680/12384 [1:26:42<24:46:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 5%|▌ | 681/12384 [1:26:42<24:47:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 5%|▌ | 681/12384 [1:26:50<24:47:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 2: 6%|▌ | 682/12384 [1:26:50<24:48:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 2: 6%|▌ | 682/12384 [1:26:58<24:48:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.56s]
Epoch 2: 6%|▌ | 683/12384 [1:26:58<24:47:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.56s]
Epoch 2: 6%|▌ | 683/12384 [1:27:05<24:47:54, 7.63s/it, loss=0.0002, acc=0.9997, iter_time=8.25s]
Epoch 2: 6%|▌ | 684/12384 [1:27:05<24:47:16, 7.63s/it, loss=0.0002, acc=0.9997, iter_time=8.25s]
Epoch 2: 6%|▌ | 684/12384 [1:27:13<24:47:16, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=6.16s]
Epoch 2: 6%|▌ | 685/12384 [1:27:13<25:06:40, 7.73s/it, loss=0.0001, acc=0.9998, iter_time=6.16s]
Epoch 2: 6%|▌ | 685/12384 [1:27:21<25:06:40, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 2: 6%|▌ | 686/12384 [1:27:21<25:01:49, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 2: 6%|▌ | 686/12384 [1:27:29<25:01:49, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.98s]
Epoch 2: 6%|▌ | 687/12384 [1:27:29<24:56:31, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.98s]
Epoch 2: 6%|▌ | 687/12384 [1:27:36<24:56:31, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 6%|▌ | 688/12384 [1:27:36<24:52:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 6%|▌ | 688/12384 [1:27:44<24:52:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 6%|▌ | 689/12384 [1:27:44<24:54:56, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 6%|▌ | 689/12384 [1:27:51<24:54:56, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 6%|▌ | 690/12384 [1:27:51<24:50:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 6%|▌ | 690/12384 [1:27:59<24:50:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 6%|▌ | 691/12384 [1:27:59<24:50:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 6%|▌ | 691/12384 [1:28:07<24:50:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 2: 6%|▌ | 692/12384 [1:28:07<24:46:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 2: 6%|▌ | 692/12384 [1:28:14<24:46:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 2: 6%|▌ | 693/12384 [1:28:14<24:44:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 2: 6%|▌ | 693/12384 [1:28:22<24:44:52, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 2: 6%|▌ | 694/12384 [1:28:22<24:45:12, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 2: 6%|▌ | 694/12384 [1:28:30<24:45:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 2: 6%|▌ | 695/12384 [1:28:30<24:49:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 2: 6%|▌ | 695/12384 [1:28:37<24:49:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 2: 6%|▌ | 696/12384 [1:28:37<24:50:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 2: 6%|▌ | 696/12384 [1:28:45<24:50:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 6%|▌ | 697/12384 [1:28:45<24:48:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 6%|▌ | 697/12384 [1:28:52<24:48:09, 7.64s/it, loss=0.0003, acc=0.9983, iter_time=7.63s]
Epoch 2: 6%|▌ | 698/12384 [1:28:52<24:46:56, 7.63s/it, loss=0.0003, acc=0.9983, iter_time=7.63s]
Epoch 2: 6%|▌ | 698/12384 [1:29:00<24:46:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 6%|▌ | 699/12384 [1:29:00<24:45:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 6%|▌ | 699/12384 [1:29:08<24:45:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 6%|▌ | 700/12384 [1:29:08<24:44:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 6%|▌ | 700/12384 [1:29:15<24:44:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 6%|▌ | 701/12384 [1:29:15<24:42:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 6%|▌ | 701/12384 [1:29:23<24:42:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 2: 6%|▌ | 702/12384 [1:29:23<24:42:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 2: 6%|▌ | 702/12384 [1:29:31<24:42:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 2: 6%|▌ | 703/12384 [1:29:31<24:42:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 2: 6%|▌ | 703/12384 [1:29:38<24:42:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.54s]
Epoch 2: 6%|▌ | 704/12384 [1:29:38<24:42:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.54s]
Epoch 2: 6%|▌ | 704/12384 [1:29:46<24:42:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.94s]
Epoch 2: 6%|▌ | 705/12384 [1:29:46<24:41:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.94s]
Epoch 2: 6%|▌ | 705/12384 [1:29:53<24:41:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 6%|▌ | 706/12384 [1:29:53<24:40:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 6%|▌ | 706/12384 [1:30:01<24:40:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 6%|▌ | 707/12384 [1:30:01<24:41:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 6%|▌ | 707/12384 [1:30:09<24:41:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 6%|▌ | 708/12384 [1:30:09<24:41:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 6%|▌ | 708/12384 [1:30:16<24:41:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 6%|▌ | 709/12384 [1:30:16<24:40:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 6%|▌ | 709/12384 [1:30:24<24:40:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 6%|▌ | 710/12384 [1:30:24<24:40:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 6%|▌ | 710/12384 [1:30:31<24:40:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 6%|▌ | 711/12384 [1:30:31<24:39:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 6%|▌ | 711/12384 [1:30:39<24:39:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 2: 6%|▌ | 712/12384 [1:30:39<24:59:56, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 2: 6%|▌ | 712/12384 [1:30:47<24:59:56, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.49s]
Epoch 2: 6%|▌ | 713/12384 [1:30:47<24:57:25, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.49s]
Epoch 2: 6%|▌ | 713/12384 [1:30:55<24:57:25, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 2: 6%|▌ | 714/12384 [1:30:55<24:52:26, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 2: 6%|▌ | 714/12384 [1:31:02<24:52:26, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.00s]
Epoch 2: 6%|▌ | 715/12384 [1:31:02<24:48:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.00s]
Epoch 2: 6%|▌ | 715/12384 [1:31:10<24:48:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.99s]
Epoch 2: 6%|▌ | 716/12384 [1:31:10<24:45:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.99s]
Epoch 2: 6%|▌ | 716/12384 [1:31:17<24:45:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 2: 6%|▌ | 717/12384 [1:31:17<24:42:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 2: 6%|▌ | 717/12384 [1:31:25<24:42:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 2: 6%|▌ | 718/12384 [1:31:25<24:45:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 2: 6%|▌ | 718/12384 [1:31:33<24:45:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.64s]
Epoch 2: 6%|▌ | 719/12384 [1:31:33<24:44:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.64s]
Epoch 2: 6%|▌ | 719/12384 [1:31:40<24:44:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.18s]
Epoch 2: 6%|▌ | 720/12384 [1:31:40<24:44:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.18s]
Epoch 2: 6%|▌ | 720/12384 [1:31:48<24:44:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 2: 6%|▌ | 721/12384 [1:31:48<24:43:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 2: 6%|▌ | 721/12384 [1:31:56<24:43:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.46s]
Epoch 2: 6%|▌ | 722/12384 [1:31:56<24:42:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.46s]
Epoch 2: 6%|▌ | 722/12384 [1:32:03<24:42:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.77s]
Epoch 2: 6%|▌ | 723/12384 [1:32:03<24:40:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.77s]
Epoch 2: 6%|▌ | 723/12384 [1:32:11<24:40:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 2: 6%|▌ | 724/12384 [1:32:11<24:40:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 2: 6%|▌ | 724/12384 [1:32:18<24:40:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.64s]
Epoch 2: 6%|▌ | 725/12384 [1:32:18<24:40:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.64s]
Epoch 2: 6%|▌ | 725/12384 [1:32:26<24:40:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 2: 6%|▌ | 726/12384 [1:32:26<24:38:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 2: 6%|▌ | 726/12384 [1:32:34<24:38:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 6%|▌ | 727/12384 [1:32:34<24:39:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 6%|▌ | 727/12384 [1:32:41<24:39:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 6%|▌ | 728/12384 [1:32:41<24:40:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 6%|▌ | 728/12384 [1:32:49<24:40:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 6%|▌ | 729/12384 [1:32:49<24:46:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 6%|▌ | 729/12384 [1:32:57<24:46:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.18s]
Epoch 2: 6%|▌ | 730/12384 [1:32:57<24:45:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.18s]
Epoch 2: 6%|▌ | 730/12384 [1:33:04<24:45:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.49s]
Epoch 2: 6%|▌ | 731/12384 [1:33:04<24:42:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.49s]
Epoch 2: 6%|▌ | 731/12384 [1:33:12<24:42:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 2: 6%|▌ | 732/12384 [1:33:12<24:51:45, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 2: 6%|▌ | 732/12384 [1:33:20<24:51:45, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.21s]
Epoch 2: 6%|▌ | 733/12384 [1:33:20<24:46:31, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.21s]
Epoch 2: 6%|▌ | 733/12384 [1:33:27<24:46:31, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 2: 6%|▌ | 734/12384 [1:33:27<24:43:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 2: 6%|▌ | 734/12384 [1:33:35<24:43:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 6%|▌ | 735/12384 [1:33:35<24:41:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 6%|▌ | 735/12384 [1:33:42<24:41:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 6%|▌ | 736/12384 [1:33:42<24:40:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 6%|▌ | 736/12384 [1:33:50<24:40:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.91s]
Epoch 2: 6%|▌ | 737/12384 [1:33:50<24:39:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.91s]
Epoch 2: 6%|▌ | 737/12384 [1:33:58<24:39:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 2: 6%|▌ | 738/12384 [1:33:58<24:58:32, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 2: 6%|▌ | 738/12384 [1:34:06<24:58:32, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 2: 6%|▌ | 739/12384 [1:34:06<24:52:58, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 2: 6%|▌ | 739/12384 [1:34:13<24:52:58, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 2: 6%|▌ | 740/12384 [1:34:13<24:48:54, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 2: 6%|▌ | 740/12384 [1:34:21<24:48:54, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 6%|▌ | 741/12384 [1:34:21<24:44:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 6%|▌ | 741/12384 [1:34:29<24:44:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.05s]
Epoch 2: 6%|▌ | 742/12384 [1:34:29<24:42:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.05s]
Epoch 2: 6%|▌ | 742/12384 [1:34:36<24:42:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.85s]
Epoch 2: 6%|▌ | 743/12384 [1:34:36<24:40:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.85s]
Epoch 2: 6%|▌ | 743/12384 [1:34:44<24:40:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 6%|▌ | 744/12384 [1:34:44<24:39:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 6%|▌ | 744/12384 [1:34:51<24:39:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 6%|▌ | 745/12384 [1:34:51<24:38:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 6%|▌ | 745/12384 [1:34:59<24:38:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 6%|▌ | 746/12384 [1:34:59<24:36:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 6%|▌ | 746/12384 [1:35:07<24:36:36, 7.61s/it, loss=0.0002, acc=0.9989, iter_time=6.47s]
Epoch 2: 6%|▌ | 747/12384 [1:35:07<24:41:03, 7.64s/it, loss=0.0002, acc=0.9989, iter_time=6.47s]
Epoch 2: 6%|▌ | 747/12384 [1:35:14<24:41:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 2: 6%|▌ | 748/12384 [1:35:14<24:38:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 2: 6%|▌ | 748/12384 [1:35:22<24:38:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 2: 6%|▌ | 749/12384 [1:35:22<24:38:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 2: 6%|▌ | 749/12384 [1:35:29<24:38:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 2: 6%|▌ | 750/12384 [1:35:29<24:36:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 2: 6%|▌ | 750/12384 [1:35:37<24:36:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 2: 6%|▌ | 751/12384 [1:35:37<24:33:59, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 2: 6%|▌ | 751/12384 [1:35:45<24:33:59, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 6%|▌ | 752/12384 [1:35:45<24:35:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 6%|▌ | 752/12384 [1:35:52<24:35:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 6%|▌ | 753/12384 [1:35:52<24:35:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 6%|▌ | 753/12384 [1:36:00<24:35:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 2: 6%|▌ | 754/12384 [1:36:00<24:35:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 2: 6%|▌ | 754/12384 [1:36:08<24:35:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 2: 6%|▌ | 755/12384 [1:36:08<24:50:48, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 2: 6%|▌ | 755/12384 [1:36:15<24:50:48, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 6%|▌ | 756/12384 [1:36:15<24:44:39, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 6%|▌ | 756/12384 [1:36:23<24:44:39, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 6%|▌ | 757/12384 [1:36:23<24:41:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 6%|▌ | 757/12384 [1:36:31<24:41:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 6%|▌ | 758/12384 [1:36:31<24:39:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 6%|▌ | 758/12384 [1:36:38<24:39:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 6%|▌ | 759/12384 [1:36:38<24:37:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 6%|▌ | 759/12384 [1:36:46<24:37:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 6%|▌ | 760/12384 [1:36:46<24:36:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 6%|▌ | 760/12384 [1:36:53<24:36:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 6%|▌ | 761/12384 [1:36:53<24:41:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 6%|▌ | 761/12384 [1:37:01<24:41:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 6%|▌ | 762/12384 [1:37:01<24:39:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 6%|▌ | 762/12384 [1:37:09<24:39:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 6%|▌ | 763/12384 [1:37:09<24:37:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 6%|▌ | 763/12384 [1:37:16<24:37:43, 7.63s/it, loss=0.0001, acc=0.9997, iter_time=7.62s]
Epoch 2: 6%|▌ | 764/12384 [1:37:16<24:36:40, 7.62s/it, loss=0.0001, acc=0.9997, iter_time=7.62s]
Epoch 2: 6%|▌ | 764/12384 [1:37:24<24:36:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 2: 6%|▌ | 765/12384 [1:37:24<24:58:27, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 2: 6%|▌ | 765/12384 [1:37:32<24:58:27, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.89s]
Epoch 2: 6%|▌ | 766/12384 [1:37:32<24:51:11, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.89s]
Epoch 2: 6%|▌ | 766/12384 [1:37:40<24:51:11, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.10s]
Epoch 2: 6%|▌ | 767/12384 [1:37:40<24:45:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.10s]
Epoch 2: 6%|▌ | 767/12384 [1:37:47<24:45:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=11.19s]
Epoch 2: 6%|▌ | 768/12384 [1:37:47<24:41:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.19s]
Epoch 2: 6%|▌ | 768/12384 [1:37:55<24:41:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 2: 6%|▌ | 769/12384 [1:37:55<24:38:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 2: 6%|▌ | 769/12384 [1:38:02<24:38:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 6%|▌ | 770/12384 [1:38:02<24:37:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 6%|▌ | 770/12384 [1:38:10<24:37:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 6%|▌ | 771/12384 [1:38:10<24:35:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 6%|▌ | 771/12384 [1:38:18<24:35:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 6%|▌ | 772/12384 [1:38:18<24:34:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 6%|▌ | 772/12384 [1:38:25<24:34:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 2: 6%|▌ | 773/12384 [1:38:25<24:32:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 2: 6%|▌ | 773/12384 [1:38:33<24:32:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 2: 6%|▋ | 774/12384 [1:38:33<24:32:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 2: 6%|▋ | 774/12384 [1:38:40<24:32:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 6%|▋ | 775/12384 [1:38:40<24:31:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 6%|▋ | 775/12384 [1:38:48<24:31:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 2: 6%|▋ | 776/12384 [1:38:48<24:34:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 2: 6%|▋ | 776/12384 [1:38:56<24:34:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.02s]
Epoch 2: 6%|▋ | 777/12384 [1:38:56<24:33:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.02s]
Epoch 2: 6%|▋ | 777/12384 [1:39:03<24:33:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 6%|▋ | 778/12384 [1:39:03<24:31:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 6%|▋ | 778/12384 [1:39:11<24:31:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 2: 6%|▋ | 779/12384 [1:39:11<24:30:42, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 2: 6%|▋ | 779/12384 [1:39:18<24:30:42, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.93s]
Epoch 2: 6%|▋ | 780/12384 [1:39:18<24:30:16, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.93s]
Epoch 2: 6%|▋ | 780/12384 [1:39:26<24:30:16, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 2: 6%|▋ | 781/12384 [1:39:26<24:47:05, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 2: 6%|▋ | 781/12384 [1:39:34<24:47:05, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 2: 6%|▋ | 782/12384 [1:39:34<24:47:20, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 2: 6%|▋ | 782/12384 [1:39:42<24:47:20, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 6%|▋ | 783/12384 [1:39:42<24:42:22, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 6%|▋ | 783/12384 [1:39:49<24:42:22, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 6%|▋ | 784/12384 [1:39:49<24:40:31, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 6%|▋ | 784/12384 [1:39:57<24:40:31, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 6%|▋ | 785/12384 [1:39:57<24:36:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 6%|▋ | 785/12384 [1:40:04<24:36:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 2: 6%|▋ | 786/12384 [1:40:04<24:34:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 2: 6%|▋ | 786/12384 [1:40:12<24:34:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 2: 6%|▋ | 787/12384 [1:40:12<24:34:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 2: 6%|▋ | 787/12384 [1:40:20<24:34:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 2: 6%|▋ | 788/12384 [1:40:20<24:34:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 2: 6%|▋ | 788/12384 [1:40:27<24:34:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 2: 6%|▋ | 789/12384 [1:40:27<24:32:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 2: 6%|▋ | 789/12384 [1:40:35<24:32:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 6%|▋ | 790/12384 [1:40:35<24:32:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 6%|▋ | 790/12384 [1:40:43<24:32:06, 7.62s/it, loss=0.0001, acc=0.9989, iter_time=7.68s]
Epoch 2: 6%|▋ | 791/12384 [1:40:43<24:50:52, 7.72s/it, loss=0.0001, acc=0.9989, iter_time=7.68s]
Epoch 2: 6%|▋ | 791/12384 [1:40:51<24:50:52, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 2: 6%|▋ | 792/12384 [1:40:51<24:45:52, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 2: 6%|▋ | 792/12384 [1:40:58<24:45:52, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 6%|▋ | 793/12384 [1:40:58<24:42:20, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 6%|▋ | 793/12384 [1:41:06<24:42:20, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 6%|▋ | 794/12384 [1:41:06<24:39:27, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 6%|▋ | 794/12384 [1:41:13<24:39:27, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 6%|▋ | 795/12384 [1:41:13<24:38:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 6%|▋ | 795/12384 [1:41:21<24:38:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 6%|▋ | 796/12384 [1:41:21<24:35:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 6%|▋ | 796/12384 [1:41:29<24:35:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 6%|▋ | 797/12384 [1:41:29<24:39:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 6%|▋ | 797/12384 [1:41:36<24:39:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.95s]
Epoch 2: 6%|▋ | 798/12384 [1:41:36<24:35:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.95s]
Epoch 2: 6%|▋ | 798/12384 [1:41:44<24:35:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 2: 6%|▋ | 799/12384 [1:41:44<24:33:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 2: 6%|▋ | 799/12384 [1:41:52<24:33:29, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=10.32s]
Epoch 2: 6%|▋ | 800/12384 [1:41:52<24:31:13, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.32s]
Epoch 2: 6%|▋ | 800/12384 [1:41:59<24:31:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.10s]
Epoch 2: 6%|▋ | 801/12384 [1:41:59<24:31:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.10s]
Epoch 2: 6%|▋ | 801/12384 [1:42:07<24:31:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.85s]
Epoch 2: 6%|▋ | 802/12384 [1:42:07<24:35:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.85s]
Epoch 2: 6%|▋ | 802/12384 [1:42:14<24:35:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 6%|▋ | 803/12384 [1:42:14<24:33:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 6%|▋ | 803/12384 [1:42:22<24:33:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 6%|▋ | 804/12384 [1:42:22<24:31:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 6%|▋ | 804/12384 [1:42:30<24:31:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 7%|▋ | 805/12384 [1:42:30<24:33:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 7%|▋ | 805/12384 [1:42:37<24:33:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 7%|▋ | 806/12384 [1:42:37<24:31:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 7%|▋ | 806/12384 [1:42:45<24:31:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 7%|▋ | 807/12384 [1:42:45<24:31:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 7%|▋ | 807/12384 [1:42:53<24:31:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 7%|▋ | 808/12384 [1:42:53<24:31:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 7%|▋ | 808/12384 [1:43:00<24:31:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.59s]
Epoch 2: 7%|▋ | 809/12384 [1:43:00<24:29:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.59s]
Epoch 2: 7%|▋ | 809/12384 [1:43:08<24:29:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 2: 7%|▋ | 810/12384 [1:43:08<24:29:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 2: 7%|▋ | 810/12384 [1:43:15<24:29:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 7%|▋ | 811/12384 [1:43:15<24:28:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 7%|▋ | 811/12384 [1:43:23<24:28:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 7%|▋ | 812/12384 [1:43:23<24:28:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 7%|▋ | 812/12384 [1:43:31<24:28:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 7%|▋ | 813/12384 [1:43:31<24:27:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 7%|▋ | 813/12384 [1:43:38<24:27:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 7%|▋ | 814/12384 [1:43:38<24:27:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 7%|▋ | 814/12384 [1:43:46<24:27:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 2: 7%|▋ | 815/12384 [1:43:46<24:26:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 2: 7%|▋ | 815/12384 [1:43:54<24:26:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.51s]
Epoch 2: 7%|▋ | 816/12384 [1:43:54<24:31:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.51s]
Epoch 2: 7%|▋ | 816/12384 [1:44:01<24:31:12, 7.63s/it, loss=0.0000, acc=0.9998, iter_time=7.34s]
Epoch 2: 7%|▋ | 817/12384 [1:44:01<24:51:29, 7.74s/it, loss=0.0000, acc=0.9998, iter_time=7.34s]
Epoch 2: 7%|▋ | 817/12384 [1:44:09<24:51:29, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 7%|▋ | 818/12384 [1:44:09<24:45:21, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 7%|▋ | 818/12384 [1:44:17<24:45:21, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 7%|▋ | 819/12384 [1:44:17<24:39:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 7%|▋ | 819/12384 [1:44:24<24:39:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 7%|▋ | 820/12384 [1:44:24<24:41:36, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 7%|▋ | 820/12384 [1:44:32<24:41:36, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 7%|▋ | 821/12384 [1:44:32<24:36:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 7%|▋ | 821/12384 [1:44:40<24:36:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.53s]
Epoch 2: 7%|▋ | 822/12384 [1:44:40<24:33:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.53s]
Epoch 2: 7%|▋ | 822/12384 [1:44:47<24:33:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.77s]
Epoch 2: 7%|▋ | 823/12384 [1:44:47<24:37:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.77s]
Epoch 2: 7%|▋ | 823/12384 [1:44:55<24:37:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 7%|▋ | 824/12384 [1:44:55<24:34:01, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 7%|▋ | 824/12384 [1:45:03<24:34:01, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 7%|▋ | 825/12384 [1:45:03<24:35:50, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 7%|▋ | 825/12384 [1:45:10<24:35:50, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 7%|▋ | 826/12384 [1:45:10<24:32:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 7%|▋ | 826/12384 [1:45:18<24:32:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 7%|▋ | 827/12384 [1:45:18<24:31:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 7%|▋ | 827/12384 [1:45:26<24:31:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 2: 7%|▋ | 828/12384 [1:45:26<24:30:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 2: 7%|▋ | 828/12384 [1:45:33<24:30:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 2: 7%|▋ | 829/12384 [1:45:33<24:29:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 2: 7%|▋ | 829/12384 [1:45:41<24:29:16, 7.63s/it, loss=0.0009, acc=0.9962, iter_time=10.74s]
Epoch 2: 7%|▋ | 830/12384 [1:45:41<24:27:26, 7.62s/it, loss=0.0009, acc=0.9962, iter_time=10.74s]
Epoch 2: 7%|▋ | 830/12384 [1:45:48<24:27:26, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 2: 7%|▋ | 831/12384 [1:45:48<24:27:05, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 2: 7%|▋ | 831/12384 [1:45:56<24:27:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 7%|▋ | 832/12384 [1:45:56<24:27:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 7%|▋ | 832/12384 [1:46:04<24:27:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.83s]
Epoch 2: 7%|▋ | 833/12384 [1:46:04<24:25:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.83s]
Epoch 2: 7%|▋ | 833/12384 [1:46:11<24:25:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.25s]
Epoch 2: 7%|▋ | 834/12384 [1:46:11<24:40:37, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=11.25s]
Epoch 2: 7%|▋ | 834/12384 [1:46:19<24:40:37, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 2: 7%|▋ | 835/12384 [1:46:19<24:36:04, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 2: 7%|▋ | 835/12384 [1:46:27<24:36:04, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 2: 7%|▋ | 836/12384 [1:46:27<24:33:50, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 2: 7%|▋ | 836/12384 [1:46:34<24:33:50, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 7%|▋ | 837/12384 [1:46:34<24:31:25, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 7%|▋ | 837/12384 [1:46:42<24:31:25, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 7%|▋ | 838/12384 [1:46:42<24:28:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 7%|▋ | 838/12384 [1:46:50<24:28:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.97s]
Epoch 2: 7%|▋ | 839/12384 [1:46:50<24:27:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.97s]
Epoch 2: 7%|▋ | 839/12384 [1:46:57<24:27:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.62s]
Epoch 2: 7%|▋ | 840/12384 [1:46:57<24:28:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.62s]
Epoch 2: 7%|▋ | 840/12384 [1:47:05<24:28:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.67s]
Epoch 2: 7%|▋ | 841/12384 [1:47:05<24:25:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.67s]
Epoch 2: 7%|▋ | 841/12384 [1:47:12<24:25:58, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.19s]
Epoch 2: 7%|▋ | 842/12384 [1:47:12<24:26:33, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.19s]
Epoch 2: 7%|▋ | 842/12384 [1:47:20<24:26:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 2: 7%|▋ | 843/12384 [1:47:20<24:45:45, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 2: 7%|▋ | 843/12384 [1:47:28<24:45:45, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 2: 7%|▋ | 844/12384 [1:47:28<24:37:43, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 2: 7%|▋ | 844/12384 [1:47:36<24:37:43, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 2: 7%|▋ | 845/12384 [1:47:36<24:34:08, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 2: 7%|▋ | 845/12384 [1:47:43<24:34:08, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 2: 7%|▋ | 846/12384 [1:47:43<24:30:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 2: 7%|▋ | 846/12384 [1:47:51<24:30:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 2: 7%|▋ | 847/12384 [1:47:51<24:29:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 2: 7%|▋ | 847/12384 [1:47:58<24:29:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 7%|▋ | 848/12384 [1:47:58<24:27:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 7%|▋ | 848/12384 [1:48:06<24:27:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 7%|▋ | 849/12384 [1:48:06<24:26:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 7%|▋ | 849/12384 [1:48:14<24:26:49, 7.63s/it, loss=0.0002, acc=0.9999, iter_time=7.64s]
Epoch 2: 7%|▋ | 850/12384 [1:48:14<24:26:05, 7.63s/it, loss=0.0002, acc=0.9999, iter_time=7.64s]
Epoch 2: 7%|▋ | 850/12384 [1:48:21<24:26:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 2: 7%|▋ | 851/12384 [1:48:21<24:26:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 2: 7%|▋ | 851/12384 [1:48:29<24:26:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 2: 7%|▋ | 852/12384 [1:48:29<24:26:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 2: 7%|▋ | 852/12384 [1:48:37<24:26:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 7%|▋ | 853/12384 [1:48:37<24:24:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 7%|▋ | 853/12384 [1:48:44<24:24:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 2: 7%|▋ | 854/12384 [1:48:44<24:23:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 2: 7%|▋ | 854/12384 [1:48:52<24:23:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 2: 7%|▋ | 855/12384 [1:48:52<24:23:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 2: 7%|▋ | 855/12384 [1:48:59<24:23:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.92s]
Epoch 2: 7%|▋ | 856/12384 [1:48:59<24:22:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.92s]
Epoch 2: 7%|▋ | 856/12384 [1:49:07<24:22:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 7%|▋ | 857/12384 [1:49:07<24:24:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 7%|▋ | 857/12384 [1:49:15<24:24:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 7%|▋ | 858/12384 [1:49:15<24:24:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 7%|▋ | 858/12384 [1:49:22<24:24:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 2: 7%|▋ | 859/12384 [1:49:22<24:23:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 2: 7%|▋ | 859/12384 [1:49:30<24:23:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.71s]
Epoch 2: 7%|▋ | 860/12384 [1:49:30<24:38:47, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.71s]
Epoch 2: 7%|▋ | 860/12384 [1:49:38<24:38:47, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 2: 7%|▋ | 861/12384 [1:49:38<24:32:47, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 2: 7%|▋ | 861/12384 [1:49:45<24:32:47, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 2: 7%|▋ | 862/12384 [1:49:45<24:30:07, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 2: 7%|▋ | 862/12384 [1:49:53<24:30:07, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 2: 7%|▋ | 863/12384 [1:49:53<24:27:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 2: 7%|▋ | 863/12384 [1:50:01<24:27:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.40s]
Epoch 2: 7%|▋ | 864/12384 [1:50:01<24:24:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.40s]
Epoch 2: 7%|▋ | 864/12384 [1:50:08<24:24:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 7%|▋ | 865/12384 [1:50:08<24:23:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 7%|▋ | 865/12384 [1:50:16<24:23:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 7%|▋ | 866/12384 [1:50:16<24:22:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 7%|▋ | 866/12384 [1:50:23<24:22:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 7%|▋ | 867/12384 [1:50:23<24:21:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 7%|▋ | 867/12384 [1:50:31<24:21:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 2: 7%|▋ | 868/12384 [1:50:31<24:22:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 2: 7%|▋ | 868/12384 [1:50:39<24:22:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 2: 7%|▋ | 869/12384 [1:50:39<24:41:28, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 2: 7%|▋ | 869/12384 [1:50:47<24:41:28, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.44s]
Epoch 2: 7%|▋ | 870/12384 [1:50:47<24:39:19, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.44s]
Epoch 2: 7%|▋ | 870/12384 [1:50:54<24:39:19, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.82s]
Epoch 2: 7%|▋ | 871/12384 [1:50:54<24:34:14, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.82s]
Epoch 2: 7%|▋ | 871/12384 [1:51:02<24:34:14, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.44s]
Epoch 2: 7%|▋ | 872/12384 [1:51:02<24:30:45, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.44s]
Epoch 2: 7%|▋ | 872/12384 [1:51:09<24:30:45, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 2: 7%|▋ | 873/12384 [1:51:09<24:26:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 2: 7%|▋ | 873/12384 [1:51:17<24:26:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.91s]
Epoch 2: 7%|▋ | 874/12384 [1:51:17<24:25:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.91s]
Epoch 2: 7%|▋ | 874/12384 [1:51:25<24:25:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 2: 7%|▋ | 875/12384 [1:51:25<24:25:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 2: 7%|▋ | 875/12384 [1:51:32<24:25:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 2: 7%|▋ | 876/12384 [1:51:32<24:23:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 2: 7%|▋ | 876/12384 [1:51:40<24:23:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 2: 7%|▋ | 877/12384 [1:51:40<24:22:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 2: 7%|▋ | 877/12384 [1:51:48<24:22:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.58s]
Epoch 2: 7%|▋ | 878/12384 [1:51:48<24:20:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.58s]
Epoch 2: 7%|▋ | 878/12384 [1:51:55<24:20:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 2: 7%|▋ | 879/12384 [1:51:55<24:19:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 2: 7%|▋ | 879/12384 [1:52:03<24:19:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 7%|▋ | 880/12384 [1:52:03<24:19:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 7%|▋ | 880/12384 [1:52:10<24:19:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 7%|▋ | 881/12384 [1:52:10<24:18:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 7%|▋ | 881/12384 [1:52:18<24:18:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 7%|▋ | 882/12384 [1:52:18<24:17:48, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 7%|▋ | 882/12384 [1:52:26<24:17:48, 7.60s/it, loss=0.0001, acc=0.9994, iter_time=7.21s]
Epoch 2: 7%|▋ | 883/12384 [1:52:26<24:18:39, 7.61s/it, loss=0.0001, acc=0.9994, iter_time=7.21s]
Epoch 2: 7%|▋ | 883/12384 [1:52:33<24:18:39, 7.61s/it, loss=0.0001, acc=0.9997, iter_time=7.62s]
Epoch 2: 7%|▋ | 884/12384 [1:52:33<24:19:39, 7.62s/it, loss=0.0001, acc=0.9997, iter_time=7.62s]
Epoch 2: 7%|▋ | 884/12384 [1:52:41<24:19:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 7%|▋ | 885/12384 [1:52:41<24:19:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 7%|▋ | 885/12384 [1:52:49<24:19:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 7%|▋ | 886/12384 [1:52:49<24:35:42, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 7%|▋ | 886/12384 [1:52:56<24:35:42, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 7%|▋ | 887/12384 [1:52:56<24:36:39, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 7%|▋ | 887/12384 [1:53:04<24:36:39, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 7%|▋ | 888/12384 [1:53:04<24:32:43, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 7%|▋ | 888/12384 [1:53:12<24:32:43, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 2: 7%|▋ | 889/12384 [1:53:12<24:27:20, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 2: 7%|▋ | 889/12384 [1:53:19<24:27:20, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.36s]
Epoch 2: 7%|▋ | 890/12384 [1:53:19<24:24:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.36s]
Epoch 2: 7%|▋ | 890/12384 [1:53:27<24:24:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 2: 7%|▋ | 891/12384 [1:53:27<24:21:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 2: 7%|▋ | 891/12384 [1:53:35<24:21:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 7%|▋ | 892/12384 [1:53:35<24:20:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 7%|▋ | 892/12384 [1:53:42<24:20:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 7%|▋ | 893/12384 [1:53:42<24:20:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 7%|▋ | 893/12384 [1:53:50<24:20:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 2: 7%|▋ | 894/12384 [1:53:50<24:19:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 2: 7%|▋ | 894/12384 [1:53:57<24:19:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 2: 7%|▋ | 895/12384 [1:53:57<24:19:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 2: 7%|▋ | 895/12384 [1:54:05<24:19:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.75s]
Epoch 2: 7%|▋ | 896/12384 [1:54:05<24:36:55, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.75s]
Epoch 2: 7%|▋ | 896/12384 [1:54:13<24:36:55, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 2: 7%|▋ | 897/12384 [1:54:13<24:31:07, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 2: 7%|▋ | 897/12384 [1:54:21<24:31:07, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 2: 7%|▋ | 898/12384 [1:54:21<24:29:23, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 2: 7%|▋ | 898/12384 [1:54:28<24:29:23, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.55s]
Epoch 2: 7%|▋ | 899/12384 [1:54:28<24:26:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.55s]
Epoch 2: 7%|▋ | 899/12384 [1:54:36<24:26:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.75s]
Epoch 2: 7%|▋ | 900/12384 [1:54:36<24:24:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.75s]
Epoch 2: 7%|▋ | 900/12384 [1:54:43<24:24:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 7%|▋ | 901/12384 [1:54:43<24:20:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 7%|▋ | 901/12384 [1:54:51<24:20:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 7%|▋ | 902/12384 [1:54:51<24:20:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 7%|▋ | 902/12384 [1:54:59<24:20:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 2: 7%|▋ | 903/12384 [1:54:59<24:17:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 2: 7%|▋ | 903/12384 [1:55:06<24:17:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 2: 7%|▋ | 904/12384 [1:55:06<24:16:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 2: 7%|▋ | 904/12384 [1:55:14<24:16:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 7%|▋ | 905/12384 [1:55:14<24:16:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 7%|▋ | 905/12384 [1:55:21<24:16:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 7%|▋ | 906/12384 [1:55:21<24:17:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 7%|▋ | 906/12384 [1:55:29<24:17:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 2: 7%|▋ | 907/12384 [1:55:29<24:15:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 2: 7%|▋ | 907/12384 [1:55:37<24:15:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 2: 7%|▋ | 908/12384 [1:55:37<24:16:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 2: 7%|▋ | 908/12384 [1:55:44<24:16:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 7%|▋ | 909/12384 [1:55:44<24:16:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 7%|▋ | 909/12384 [1:55:52<24:16:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 7%|▋ | 910/12384 [1:55:52<24:16:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 7%|▋ | 910/12384 [1:56:00<24:16:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.87s]
Epoch 2: 7%|▋ | 911/12384 [1:56:00<24:15:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.87s]
Epoch 2: 7%|▋ | 911/12384 [1:56:07<24:15:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=12.00s]
Epoch 2: 7%|▋ | 912/12384 [1:56:07<24:30:08, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=12.00s]
Epoch 2: 7%|▋ | 912/12384 [1:56:15<24:30:08, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 7%|▋ | 913/12384 [1:56:15<24:25:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 7%|▋ | 913/12384 [1:56:23<24:25:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 7%|▋ | 914/12384 [1:56:23<24:20:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 7%|▋ | 914/12384 [1:56:30<24:20:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 7%|▋ | 915/12384 [1:56:30<24:19:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 7%|▋ | 915/12384 [1:56:38<24:19:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 2: 7%|▋ | 916/12384 [1:56:38<24:18:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 2: 7%|▋ | 916/12384 [1:56:45<24:18:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 2: 7%|▋ | 917/12384 [1:56:45<24:15:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 2: 7%|▋ | 917/12384 [1:56:53<24:15:43, 7.62s/it, loss=0.0001, acc=0.9988, iter_time=6.13s]
Epoch 2: 7%|▋ | 918/12384 [1:56:53<24:15:51, 7.62s/it, loss=0.0001, acc=0.9988, iter_time=6.13s]
Epoch 2: 7%|▋ | 918/12384 [1:57:01<24:15:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.95s]
Epoch 2: 7%|▋ | 919/12384 [1:57:01<24:15:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.95s]
Epoch 2: 7%|▋ | 919/12384 [1:57:08<24:15:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 7%|▋ | 920/12384 [1:57:08<24:14:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 7%|▋ | 920/12384 [1:57:16<24:14:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 7%|▋ | 921/12384 [1:57:16<24:14:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 7%|▋ | 921/12384 [1:57:24<24:14:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 7%|▋ | 922/12384 [1:57:24<24:35:11, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 7%|▋ | 922/12384 [1:57:31<24:35:11, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 7%|▋ | 923/12384 [1:57:31<24:30:37, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 7%|▋ | 923/12384 [1:57:39<24:30:37, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 7%|▋ | 924/12384 [1:57:39<24:26:14, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 7%|▋ | 924/12384 [1:57:47<24:26:14, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 7%|▋ | 925/12384 [1:57:47<24:21:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 7%|▋ | 925/12384 [1:57:54<24:21:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 7%|▋ | 926/12384 [1:57:54<24:19:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 7%|▋ | 926/12384 [1:58:02<24:19:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 2: 7%|▋ | 927/12384 [1:58:02<24:23:40, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 2: 7%|▋ | 927/12384 [1:58:10<24:23:40, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 7%|▋ | 928/12384 [1:58:10<24:22:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 7%|▋ | 928/12384 [1:58:17<24:22:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 8%|▊ | 929/12384 [1:58:17<24:19:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 8%|▊ | 929/12384 [1:58:25<24:19:08, 7.64s/it, loss=0.0002, acc=0.9998, iter_time=7.59s]
Epoch 2: 8%|▊ | 930/12384 [1:58:25<24:15:58, 7.63s/it, loss=0.0002, acc=0.9998, iter_time=7.59s]
Epoch 2: 8%|▊ | 930/12384 [1:58:33<24:15:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 8%|▊ | 931/12384 [1:58:33<24:15:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 8%|▊ | 931/12384 [1:58:40<24:15:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 8%|▊ | 932/12384 [1:58:40<24:14:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 8%|▊ | 932/12384 [1:58:48<24:14:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 8%|▊ | 933/12384 [1:58:48<24:12:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 8%|▊ | 933/12384 [1:58:55<24:12:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 8%|▊ | 934/12384 [1:58:55<24:12:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 8%|▊ | 934/12384 [1:59:03<24:12:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 2: 8%|▊ | 935/12384 [1:59:03<24:12:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 2: 8%|▊ | 935/12384 [1:59:11<24:12:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.21s]
Epoch 2: 8%|▊ | 936/12384 [1:59:11<24:14:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.21s]
Epoch 2: 8%|▊ | 936/12384 [1:59:18<24:14:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 8%|▊ | 937/12384 [1:59:18<24:14:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 8%|▊ | 937/12384 [1:59:26<24:14:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 8%|▊ | 938/12384 [1:59:26<24:30:44, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 8%|▊ | 938/12384 [1:59:34<24:30:44, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 8%|▊ | 939/12384 [1:59:34<24:24:47, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 8%|▊ | 939/12384 [1:59:41<24:24:47, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 2: 8%|▊ | 940/12384 [1:59:41<24:21:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 2: 8%|▊ | 940/12384 [1:59:49<24:21:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 2: 8%|▊ | 941/12384 [1:59:49<24:18:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 2: 8%|▊ | 941/12384 [1:59:57<24:18:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 8%|▊ | 942/12384 [1:59:57<24:16:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 8%|▊ | 942/12384 [2:00:04<24:16:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 8%|▊ | 943/12384 [2:00:04<24:15:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 8%|▊ | 943/12384 [2:00:12<24:15:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 8%|▊ | 944/12384 [2:00:12<24:12:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 8%|▊ | 944/12384 [2:00:19<24:12:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 2: 8%|▊ | 945/12384 [2:00:19<24:14:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 2: 8%|▊ | 945/12384 [2:00:27<24:14:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 2: 8%|▊ | 946/12384 [2:00:27<24:11:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 2: 8%|▊ | 946/12384 [2:00:35<24:11:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 8%|▊ | 947/12384 [2:00:35<24:11:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 8%|▊ | 947/12384 [2:00:42<24:11:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 2: 8%|▊ | 948/12384 [2:00:42<24:11:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 2: 8%|▊ | 948/12384 [2:00:50<24:11:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 2: 8%|▊ | 949/12384 [2:00:50<24:32:18, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 2: 8%|▊ | 949/12384 [2:00:58<24:32:18, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 2: 8%|▊ | 950/12384 [2:00:58<24:27:40, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 2: 8%|▊ | 950/12384 [2:01:05<24:27:40, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.62s]
Epoch 2: 8%|▊ | 951/12384 [2:01:05<24:22:18, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.62s]
Epoch 2: 8%|▊ | 951/12384 [2:01:13<24:22:18, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=10.59s]
Epoch 2: 8%|▊ | 952/12384 [2:01:13<24:18:35, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=10.59s]
Epoch 2: 8%|▊ | 952/12384 [2:01:21<24:18:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 8%|▊ | 953/12384 [2:01:21<24:19:27, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 8%|▊ | 953/12384 [2:01:28<24:19:27, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 2: 8%|▊ | 954/12384 [2:01:28<24:17:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 2: 8%|▊ | 954/12384 [2:01:36<24:17:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 2: 8%|▊ | 955/12384 [2:01:36<24:16:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 2: 8%|▊ | 955/12384 [2:01:44<24:16:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 2: 8%|▊ | 956/12384 [2:01:44<24:13:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 2: 8%|▊ | 956/12384 [2:01:51<24:13:44, 7.63s/it, loss=0.0004, acc=0.9979, iter_time=8.57s]
Epoch 2: 8%|▊ | 957/12384 [2:01:51<24:12:27, 7.63s/it, loss=0.0004, acc=0.9979, iter_time=8.57s]
Epoch 2: 8%|▊ | 957/12384 [2:01:59<24:12:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 8%|▊ | 958/12384 [2:01:59<24:11:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 8%|▊ | 958/12384 [2:02:06<24:11:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 2: 8%|▊ | 959/12384 [2:02:06<24:08:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 2: 8%|▊ | 959/12384 [2:02:14<24:08:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 2: 8%|▊ | 960/12384 [2:02:14<24:11:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 2: 8%|▊ | 960/12384 [2:02:22<24:11:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 8%|▊ | 961/12384 [2:02:22<24:09:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 8%|▊ | 961/12384 [2:02:29<24:09:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 2: 8%|▊ | 962/12384 [2:02:29<24:07:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 2: 8%|▊ | 962/12384 [2:02:37<24:07:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.88s]
Epoch 2: 8%|▊ | 963/12384 [2:02:37<24:08:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.88s]
Epoch 2: 8%|▊ | 963/12384 [2:02:45<24:08:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.20s]
Epoch 2: 8%|▊ | 964/12384 [2:02:45<24:23:27, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=11.20s]
Epoch 2: 8%|▊ | 964/12384 [2:02:52<24:23:27, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 8%|▊ | 965/12384 [2:02:52<24:18:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 8%|▊ | 965/12384 [2:03:00<24:18:11, 7.66s/it, loss=0.0002, acc=0.9998, iter_time=7.61s]
Epoch 2: 8%|▊ | 966/12384 [2:03:00<24:19:58, 7.67s/it, loss=0.0002, acc=0.9998, iter_time=7.61s]
Epoch 2: 8%|▊ | 966/12384 [2:03:08<24:19:58, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.69s]
Epoch 2: 8%|▊ | 967/12384 [2:03:08<24:17:17, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.69s]
Epoch 2: 8%|▊ | 967/12384 [2:03:15<24:17:17, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 8%|▊ | 968/12384 [2:03:15<24:14:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 8%|▊ | 968/12384 [2:03:23<24:14:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 8%|▊ | 969/12384 [2:03:23<24:12:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 8%|▊ | 969/12384 [2:03:31<24:12:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 8%|▊ | 970/12384 [2:03:31<24:12:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 8%|▊ | 970/12384 [2:03:38<24:12:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 2: 8%|▊ | 971/12384 [2:03:38<24:09:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 2: 8%|▊ | 971/12384 [2:03:46<24:09:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 2: 8%|▊ | 972/12384 [2:03:46<24:08:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 2: 8%|▊ | 972/12384 [2:03:53<24:08:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 2: 8%|▊ | 973/12384 [2:03:53<24:10:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 2: 8%|▊ | 973/12384 [2:04:01<24:10:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.86s]
Epoch 2: 8%|▊ | 974/12384 [2:04:01<24:08:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.86s]
Epoch 2: 8%|▊ | 974/12384 [2:04:09<24:08:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.79s]
Epoch 2: 8%|▊ | 975/12384 [2:04:09<24:26:55, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.79s]
Epoch 2: 8%|▊ | 975/12384 [2:04:17<24:26:55, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 2: 8%|▊ | 976/12384 [2:04:17<24:24:53, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 2: 8%|▊ | 976/12384 [2:04:24<24:24:53, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 8%|▊ | 977/12384 [2:04:24<24:19:13, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 8%|▊ | 977/12384 [2:04:32<24:19:13, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 8%|▊ | 978/12384 [2:04:32<24:14:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 8%|▊ | 978/12384 [2:04:39<24:14:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.31s]
Epoch 2: 8%|▊ | 979/12384 [2:04:39<24:11:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.31s]
Epoch 2: 8%|▊ | 979/12384 [2:04:47<24:11:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.88s]
Epoch 2: 8%|▊ | 980/12384 [2:04:47<24:09:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.88s]
Epoch 2: 8%|▊ | 980/12384 [2:04:55<24:09:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 8%|▊ | 981/12384 [2:04:55<24:07:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 8%|▊ | 981/12384 [2:05:02<24:07:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 2: 8%|▊ | 982/12384 [2:05:02<24:11:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 2: 8%|▊ | 982/12384 [2:05:10<24:11:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 8%|▊ | 983/12384 [2:05:10<24:10:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 8%|▊ | 983/12384 [2:05:18<24:10:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 8%|▊ | 984/12384 [2:05:18<24:09:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 8%|▊ | 984/12384 [2:05:25<24:09:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 8%|▊ | 985/12384 [2:05:25<24:08:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 8%|▊ | 985/12384 [2:05:33<24:08:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 2: 8%|▊ | 986/12384 [2:05:33<24:08:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 2: 8%|▊ | 986/12384 [2:05:40<24:08:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 2: 8%|▊ | 987/12384 [2:05:40<24:12:25, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 2: 8%|▊ | 987/12384 [2:05:48<24:12:25, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 8%|▊ | 988/12384 [2:05:48<24:12:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 8%|▊ | 988/12384 [2:05:56<24:12:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 8%|▊ | 989/12384 [2:05:56<24:10:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 8%|▊ | 989/12384 [2:06:04<24:10:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 8%|▊ | 990/12384 [2:06:04<24:26:24, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 8%|▊ | 990/12384 [2:06:11<24:26:24, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 2: 8%|▊ | 991/12384 [2:06:11<24:20:50, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 2: 8%|▊ | 991/12384 [2:06:19<24:20:50, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 2: 8%|▊ | 992/12384 [2:06:19<24:23:15, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 2: 8%|▊ | 992/12384 [2:06:27<24:23:15, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 2: 8%|▊ | 993/12384 [2:06:27<24:17:44, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 2: 8%|▊ | 993/12384 [2:06:34<24:17:44, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 2: 8%|▊ | 994/12384 [2:06:34<24:13:50, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 2: 8%|▊ | 994/12384 [2:06:42<24:13:50, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 2: 8%|▊ | 995/12384 [2:06:42<24:11:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 2: 8%|▊ | 995/12384 [2:06:49<24:11:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 2: 8%|▊ | 996/12384 [2:06:49<24:09:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 2: 8%|▊ | 996/12384 [2:06:57<24:09:06, 7.63s/it, loss=0.0001, acc=0.9996, iter_time=7.60s]
Epoch 2: 8%|▊ | 997/12384 [2:06:57<24:06:44, 7.62s/it, loss=0.0001, acc=0.9996, iter_time=7.60s]
Epoch 2: 8%|▊ | 997/12384 [2:07:05<24:06:44, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.86s]
Epoch 2: 8%|▊ | 998/12384 [2:07:05<24:05:08, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.86s]
Epoch 2: 8%|▊ | 998/12384 [2:07:12<24:05:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 2: 8%|▊ | 999/12384 [2:07:12<24:05:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 2: 8%|▊ | 999/12384 [2:07:20<24:05:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 8%|▊ | 1000/12384 [2:07:20<24:03:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 8%|▊ | 1000/12384 [2:07:28<24:03:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.64s]
Epoch 2: 8%|▊ | 1001/12384 [2:07:28<24:22:00, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.64s]
Epoch 2: 8%|▊ | 1001/12384 [2:07:35<24:22:00, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.96s]
Epoch 2: 8%|▊ | 1002/12384 [2:07:35<24:15:32, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.96s]
Epoch 2: 8%|▊ | 1002/12384 [2:07:43<24:15:32, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 8%|▊ | 1003/12384 [2:07:43<24:11:57, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 8%|▊ | 1003/12384 [2:07:51<24:11:57, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 8%|▊ | 1004/12384 [2:07:51<24:08:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 8%|▊ | 1004/12384 [2:07:58<24:08:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 8%|▊ | 1005/12384 [2:07:58<24:07:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 8%|▊ | 1005/12384 [2:08:06<24:07:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.03s]
Epoch 2: 8%|▊ | 1006/12384 [2:08:06<24:06:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.03s]
Epoch 2: 8%|▊ | 1006/12384 [2:08:13<24:06:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 2: 8%|▊ | 1007/12384 [2:08:13<24:03:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 2: 8%|▊ | 1007/12384 [2:08:21<24:03:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 8%|▊ | 1008/12384 [2:08:21<24:04:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 8%|▊ | 1008/12384 [2:08:29<24:04:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 8%|▊ | 1009/12384 [2:08:29<24:03:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 8%|▊ | 1009/12384 [2:08:36<24:03:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 8%|▊ | 1010/12384 [2:08:36<24:03:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 8%|▊ | 1010/12384 [2:08:44<24:03:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 8%|▊ | 1011/12384 [2:08:44<24:02:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 8%|▊ | 1011/12384 [2:08:51<24:02:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 2: 8%|▊ | 1012/12384 [2:08:51<24:02:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 2: 8%|▊ | 1012/12384 [2:08:59<24:02:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.92s]
Epoch 2: 8%|▊ | 1013/12384 [2:08:59<24:01:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.92s]
Epoch 2: 8%|▊ | 1013/12384 [2:09:07<24:01:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 2: 8%|▊ | 1014/12384 [2:09:07<24:08:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 2: 8%|▊ | 1014/12384 [2:09:14<24:08:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.88s]
Epoch 2: 8%|▊ | 1015/12384 [2:09:14<24:05:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.88s]
Epoch 2: 8%|▊ | 1015/12384 [2:09:22<24:05:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.32s]
Epoch 2: 8%|▊ | 1016/12384 [2:09:22<24:04:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.32s]
Epoch 2: 8%|▊ | 1016/12384 [2:09:30<24:04:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.40s]
Epoch 2: 8%|▊ | 1017/12384 [2:09:30<24:02:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.40s]
Epoch 2: 8%|▊ | 1017/12384 [2:09:37<24:02:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.85s]
Epoch 2: 8%|▊ | 1018/12384 [2:09:37<24:02:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.85s]
Epoch 2: 8%|▊ | 1018/12384 [2:09:45<24:02:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 2: 8%|▊ | 1019/12384 [2:09:45<24:01:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 2: 8%|▊ | 1019/12384 [2:09:52<24:01:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.75s]
Epoch 2: 8%|▊ | 1020/12384 [2:09:52<24:00:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.75s]
Epoch 2: 8%|▊ | 1020/12384 [2:10:00<24:00:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 2: 8%|▊ | 1021/12384 [2:10:00<24:01:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 2: 8%|▊ | 1021/12384 [2:10:08<24:01:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 8%|▊ | 1022/12384 [2:10:08<23:59:35, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 8%|▊ | 1022/12384 [2:10:15<23:59:35, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 2: 8%|▊ | 1023/12384 [2:10:15<23:59:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 2: 8%|▊ | 1023/12384 [2:10:23<23:59:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 8%|▊ | 1024/12384 [2:10:23<24:00:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 8%|▊ | 1024/12384 [2:10:30<24:00:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 8%|▊ | 1025/12384 [2:10:30<24:00:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 8%|▊ | 1025/12384 [2:10:38<24:00:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 8%|▊ | 1026/12384 [2:10:38<24:00:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 8%|▊ | 1026/12384 [2:10:46<24:00:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 8%|▊ | 1027/12384 [2:10:46<24:20:36, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 8%|▊ | 1027/12384 [2:10:54<24:20:36, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 8%|▊ | 1028/12384 [2:10:54<24:13:31, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 8%|▊ | 1028/12384 [2:11:01<24:13:31, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 2: 8%|▊ | 1029/12384 [2:11:01<24:09:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 2: 8%|▊ | 1029/12384 [2:11:09<24:09:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 8%|▊ | 1030/12384 [2:11:09<24:08:01, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 8%|▊ | 1030/12384 [2:11:16<24:08:01, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.48s]
Epoch 2: 8%|▊ | 1031/12384 [2:11:16<24:05:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.48s]
Epoch 2: 8%|▊ | 1031/12384 [2:11:24<24:05:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 8%|▊ | 1032/12384 [2:11:24<24:03:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 8%|▊ | 1032/12384 [2:11:32<24:03:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 8%|▊ | 1033/12384 [2:11:32<24:02:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 8%|▊ | 1033/12384 [2:11:39<24:02:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.89s]
Epoch 2: 8%|▊ | 1034/12384 [2:11:39<24:06:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.89s]
Epoch 2: 8%|▊ | 1034/12384 [2:11:47<24:06:41, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=9.42s]
Epoch 2: 8%|▊ | 1035/12384 [2:11:47<24:04:46, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=9.42s]
Epoch 2: 8%|▊ | 1035/12384 [2:11:55<24:04:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.51s]
Epoch 2: 8%|▊ | 1036/12384 [2:11:55<24:03:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.51s]
Epoch 2: 8%|▊ | 1036/12384 [2:12:02<24:03:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.63s]
Epoch 2: 8%|▊ | 1037/12384 [2:12:02<24:01:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.63s]
Epoch 2: 8%|▊ | 1037/12384 [2:12:10<24:01:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.72s]
Epoch 2: 8%|▊ | 1038/12384 [2:12:10<24:01:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.72s]
Epoch 2: 8%|▊ | 1038/12384 [2:12:18<24:01:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 8%|▊ | 1039/12384 [2:12:18<24:02:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 8%|▊ | 1039/12384 [2:12:25<24:02:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 8%|▊ | 1040/12384 [2:12:25<24:05:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 8%|▊ | 1040/12384 [2:12:33<24:05:29, 7.65s/it, loss=0.0004, acc=0.9987, iter_time=7.29s]
Epoch 2: 8%|▊ | 1041/12384 [2:12:33<24:02:46, 7.63s/it, loss=0.0004, acc=0.9987, iter_time=7.29s]
Epoch 2: 8%|▊ | 1041/12384 [2:12:40<24:02:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 2: 8%|▊ | 1042/12384 [2:12:40<24:01:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 2: 8%|▊ | 1042/12384 [2:12:48<24:01:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.49s]
Epoch 2: 8%|▊ | 1043/12384 [2:12:48<24:16:12, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.49s]
Epoch 2: 8%|▊ | 1043/12384 [2:12:56<24:16:12, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 2: 8%|▊ | 1044/12384 [2:12:56<24:12:42, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 2: 8%|▊ | 1044/12384 [2:13:04<24:12:42, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 2: 8%|▊ | 1045/12384 [2:13:04<24:08:06, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 2: 8%|▊ | 1045/12384 [2:13:11<24:08:06, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 2: 8%|▊ | 1046/12384 [2:13:11<24:05:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 2: 8%|▊ | 1046/12384 [2:13:19<24:05:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 2: 8%|▊ | 1047/12384 [2:13:19<24:02:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 2: 8%|▊ | 1047/12384 [2:13:26<24:02:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 8%|▊ | 1048/12384 [2:13:26<24:01:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 8%|▊ | 1048/12384 [2:13:34<24:01:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 2: 8%|▊ | 1049/12384 [2:13:34<24:01:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 2: 8%|▊ | 1049/12384 [2:13:42<24:01:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 2: 8%|▊ | 1050/12384 [2:13:42<24:00:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 2: 8%|▊ | 1050/12384 [2:13:49<24:00:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 8%|▊ | 1051/12384 [2:13:49<23:59:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 8%|▊ | 1051/12384 [2:13:57<23:59:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 2: 8%|▊ | 1052/12384 [2:13:57<23:57:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 2: 8%|▊ | 1052/12384 [2:14:05<23:57:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 2: 9%|▊ | 1053/12384 [2:14:05<24:16:21, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 2: 9%|▊ | 1053/12384 [2:14:12<24:16:21, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 9%|▊ | 1054/12384 [2:14:12<24:11:39, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 9%|▊ | 1054/12384 [2:14:20<24:11:39, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 9%|▊ | 1055/12384 [2:14:20<24:06:45, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 9%|▊ | 1055/12384 [2:14:28<24:06:45, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 9%|▊ | 1056/12384 [2:14:28<24:04:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 9%|▊ | 1056/12384 [2:14:35<24:04:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 9%|▊ | 1057/12384 [2:14:35<24:01:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 9%|▊ | 1057/12384 [2:14:43<24:01:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 9%|▊ | 1058/12384 [2:14:43<24:00:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 9%|▊ | 1058/12384 [2:14:50<24:00:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 9%|▊ | 1059/12384 [2:14:50<23:58:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 9%|▊ | 1059/12384 [2:14:58<23:58:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 9%|▊ | 1060/12384 [2:14:58<23:57:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 9%|▊ | 1060/12384 [2:15:06<23:57:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 2: 9%|▊ | 1061/12384 [2:15:06<23:57:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 2: 9%|▊ | 1061/12384 [2:15:13<23:57:07, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.21s]
Epoch 2: 9%|▊ | 1062/12384 [2:15:13<23:56:46, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.21s]
Epoch 2: 9%|▊ | 1062/12384 [2:15:21<23:56:46, 7.61s/it, loss=0.0004, acc=0.9963, iter_time=4.07s]
Epoch 2: 9%|▊ | 1063/12384 [2:15:21<23:55:01, 7.61s/it, loss=0.0004, acc=0.9963, iter_time=4.07s]
Epoch 2: 9%|▊ | 1063/12384 [2:15:28<23:55:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.05s]
Epoch 2: 9%|▊ | 1064/12384 [2:15:28<23:54:23, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.05s]
Epoch 2: 9%|▊ | 1064/12384 [2:15:36<23:54:23, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 9%|▊ | 1065/12384 [2:15:36<23:55:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 9%|▊ | 1065/12384 [2:15:44<23:55:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 9%|▊ | 1066/12384 [2:15:44<23:55:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 9%|▊ | 1066/12384 [2:15:51<23:55:58, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.11s]
Epoch 2: 9%|▊ | 1067/12384 [2:15:51<23:54:56, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.11s]
Epoch 2: 9%|▊ | 1067/12384 [2:15:59<23:54:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 2: 9%|▊ | 1068/12384 [2:15:59<23:58:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 2: 9%|▊ | 1068/12384 [2:16:07<23:58:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 9%|▊ | 1069/12384 [2:16:07<23:57:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 9%|▊ | 1069/12384 [2:16:14<23:57:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.44s]
Epoch 2: 9%|▊ | 1070/12384 [2:16:14<23:56:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.44s]
Epoch 2: 9%|▊ | 1070/12384 [2:16:22<23:56:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.82s]
Epoch 2: 9%|▊ | 1071/12384 [2:16:22<23:55:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.82s]
Epoch 2: 9%|▊ | 1071/12384 [2:16:29<23:55:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 9%|▊ | 1072/12384 [2:16:29<23:54:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 9%|▊ | 1072/12384 [2:16:37<23:54:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 9%|▊ | 1073/12384 [2:16:37<23:57:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 9%|▊ | 1073/12384 [2:16:45<23:57:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 9%|▊ | 1074/12384 [2:16:45<23:55:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 9%|▊ | 1074/12384 [2:16:52<23:55:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 9%|▊ | 1075/12384 [2:16:52<23:53:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 9%|▊ | 1075/12384 [2:17:00<23:53:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 2: 9%|▊ | 1076/12384 [2:17:00<23:53:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 2: 9%|▊ | 1076/12384 [2:17:07<23:53:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.05s]
Epoch 2: 9%|▊ | 1077/12384 [2:17:07<23:55:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.05s]
Epoch 2: 9%|▊ | 1077/12384 [2:17:15<23:55:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 2: 9%|▊ | 1078/12384 [2:17:15<23:54:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 2: 9%|▊ | 1078/12384 [2:17:23<23:54:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 9%|▊ | 1079/12384 [2:17:23<23:54:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 9%|▊ | 1079/12384 [2:17:31<23:54:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 9%|▊ | 1080/12384 [2:17:31<24:19:08, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 9%|▊ | 1080/12384 [2:17:38<24:19:08, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 2: 9%|▊ | 1081/12384 [2:17:38<24:12:16, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 2: 9%|▊ | 1081/12384 [2:17:46<24:12:16, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.68s]
Epoch 2: 9%|▊ | 1082/12384 [2:17:46<24:06:46, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.68s]
Epoch 2: 9%|▊ | 1082/12384 [2:17:54<24:06:46, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 9%|▊ | 1083/12384 [2:17:54<24:01:56, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 9%|▊ | 1083/12384 [2:18:01<24:01:56, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 9%|▉ | 1084/12384 [2:18:01<24:00:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 9%|▉ | 1084/12384 [2:18:09<24:00:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 9%|▉ | 1085/12384 [2:18:09<23:58:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 9%|▉ | 1085/12384 [2:18:16<23:58:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 9%|▉ | 1086/12384 [2:18:16<23:57:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 9%|▉ | 1086/12384 [2:18:24<23:57:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 2: 9%|▉ | 1087/12384 [2:18:24<23:56:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 2: 9%|▉ | 1087/12384 [2:18:32<23:56:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 9%|▉ | 1088/12384 [2:18:32<23:56:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 9%|▉ | 1088/12384 [2:18:39<23:56:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 9%|▉ | 1089/12384 [2:18:39<23:54:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 9%|▉ | 1089/12384 [2:18:47<23:54:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 9%|▉ | 1090/12384 [2:18:47<23:54:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 9%|▉ | 1090/12384 [2:18:55<23:54:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 9%|▉ | 1091/12384 [2:18:55<23:54:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 9%|▉ | 1091/12384 [2:19:02<23:54:05, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.63s]
Epoch 2: 9%|▉ | 1092/12384 [2:19:02<23:54:05, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.63s]
Epoch 2: 9%|▉ | 1092/12384 [2:19:10<23:54:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 9%|▉ | 1093/12384 [2:19:10<23:52:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 9%|▉ | 1093/12384 [2:19:17<23:52:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 9%|▉ | 1094/12384 [2:19:17<23:52:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 9%|▉ | 1094/12384 [2:19:25<23:52:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 9%|▉ | 1095/12384 [2:19:25<24:09:46, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 9%|▉ | 1095/12384 [2:19:33<24:09:46, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 9%|▉ | 1096/12384 [2:19:33<24:05:19, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 9%|▉ | 1096/12384 [2:19:41<24:05:19, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 9%|▉ | 1097/12384 [2:19:41<23:59:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 9%|▉ | 1097/12384 [2:19:48<23:59:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 9%|▉ | 1098/12384 [2:19:48<23:57:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 9%|▉ | 1098/12384 [2:19:56<23:57:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 9%|▉ | 1099/12384 [2:19:56<23:55:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 9%|▉ | 1099/12384 [2:20:03<23:55:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 2: 9%|▉ | 1100/12384 [2:20:03<23:55:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 2: 9%|▉ | 1100/12384 [2:20:11<23:55:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.88s]
Epoch 2: 9%|▉ | 1101/12384 [2:20:11<23:54:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.88s]
Epoch 2: 9%|▉ | 1101/12384 [2:20:19<23:54:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 9%|▉ | 1102/12384 [2:20:19<23:53:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 9%|▉ | 1102/12384 [2:20:26<23:53:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 9%|▉ | 1103/12384 [2:20:26<23:52:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 9%|▉ | 1103/12384 [2:20:34<23:52:28, 7.62s/it, loss=0.0001, acc=0.9996, iter_time=7.99s]
Epoch 2: 9%|▉ | 1104/12384 [2:20:34<23:51:28, 7.61s/it, loss=0.0001, acc=0.9996, iter_time=7.99s]
Epoch 2: 9%|▉ | 1104/12384 [2:20:41<23:51:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 9%|▉ | 1105/12384 [2:20:41<23:50:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 9%|▉ | 1105/12384 [2:20:49<23:50:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 9%|▉ | 1106/12384 [2:20:49<24:09:21, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 9%|▉ | 1106/12384 [2:20:57<24:09:21, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 9%|▉ | 1107/12384 [2:20:57<24:02:32, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 9%|▉ | 1107/12384 [2:21:05<24:02:32, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 2: 9%|▉ | 1108/12384 [2:21:05<24:04:05, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 2: 9%|▉ | 1108/12384 [2:21:12<24:04:05, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 9%|▉ | 1109/12384 [2:21:12<23:58:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 9%|▉ | 1109/12384 [2:21:20<23:58:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 9%|▉ | 1110/12384 [2:21:20<23:55:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 9%|▉ | 1110/12384 [2:21:27<23:55:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 9%|▉ | 1111/12384 [2:21:27<23:52:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 9%|▉ | 1111/12384 [2:21:35<23:52:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 2: 9%|▉ | 1112/12384 [2:21:35<23:53:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 2: 9%|▉ | 1112/12384 [2:21:43<23:53:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 2: 9%|▉ | 1113/12384 [2:21:43<23:54:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 2: 9%|▉ | 1113/12384 [2:21:50<23:54:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 2: 9%|▉ | 1114/12384 [2:21:50<23:51:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 2: 9%|▉ | 1114/12384 [2:21:58<23:51:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 9%|▉ | 1115/12384 [2:21:58<23:50:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 9%|▉ | 1115/12384 [2:22:06<23:50:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 9%|▉ | 1116/12384 [2:22:06<23:50:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 9%|▉ | 1116/12384 [2:22:13<23:50:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 9%|▉ | 1117/12384 [2:22:13<23:53:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 9%|▉ | 1117/12384 [2:22:21<23:53:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 2: 9%|▉ | 1118/12384 [2:22:21<23:53:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 2: 9%|▉ | 1118/12384 [2:22:29<23:53:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.50s]
Epoch 2: 9%|▉ | 1119/12384 [2:22:29<23:58:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.50s]
Epoch 2: 9%|▉ | 1119/12384 [2:22:36<23:58:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 2: 9%|▉ | 1120/12384 [2:22:36<23:55:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 2: 9%|▉ | 1120/12384 [2:22:44<23:55:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 9%|▉ | 1121/12384 [2:22:44<24:13:31, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 9%|▉ | 1121/12384 [2:22:52<24:13:31, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 2: 9%|▉ | 1122/12384 [2:22:52<24:05:17, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 2: 9%|▉ | 1122/12384 [2:22:59<24:05:17, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 2: 9%|▉ | 1123/12384 [2:22:59<23:59:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 2: 9%|▉ | 1123/12384 [2:23:07<23:59:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 9%|▉ | 1124/12384 [2:23:07<23:56:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 9%|▉ | 1124/12384 [2:23:15<23:56:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 2: 9%|▉ | 1125/12384 [2:23:15<23:54:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 2: 9%|▉ | 1125/12384 [2:23:22<23:54:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 2: 9%|▉ | 1126/12384 [2:23:22<23:52:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 2: 9%|▉ | 1126/12384 [2:23:30<23:52:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 9%|▉ | 1127/12384 [2:23:30<23:50:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 9%|▉ | 1127/12384 [2:23:37<23:50:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 9%|▉ | 1128/12384 [2:23:37<23:53:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 9%|▉ | 1128/12384 [2:23:45<23:53:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 9%|▉ | 1129/12384 [2:23:45<23:51:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 9%|▉ | 1129/12384 [2:23:53<23:51:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 2: 9%|▉ | 1130/12384 [2:23:53<23:50:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 2: 9%|▉ | 1130/12384 [2:24:00<23:50:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 2: 9%|▉ | 1131/12384 [2:24:00<23:50:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 2: 9%|▉ | 1131/12384 [2:24:08<23:50:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.96s]
Epoch 2: 9%|▉ | 1132/12384 [2:24:08<23:49:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.96s]
Epoch 2: 9%|▉ | 1132/12384 [2:24:16<23:49:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 9%|▉ | 1133/12384 [2:24:16<24:04:47, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 9%|▉ | 1133/12384 [2:24:23<24:04:47, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 2: 9%|▉ | 1134/12384 [2:24:23<24:01:19, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 2: 9%|▉ | 1134/12384 [2:24:31<24:01:19, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 2: 9%|▉ | 1135/12384 [2:24:31<23:56:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 2: 9%|▉ | 1135/12384 [2:24:39<23:56:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 9%|▉ | 1136/12384 [2:24:39<23:53:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 9%|▉ | 1136/12384 [2:24:46<23:53:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 9%|▉ | 1137/12384 [2:24:46<23:54:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 9%|▉ | 1137/12384 [2:24:54<23:54:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.26s]
Epoch 2: 9%|▉ | 1138/12384 [2:24:54<23:52:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.26s]
Epoch 2: 9%|▉ | 1138/12384 [2:25:02<23:52:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.04s]
Epoch 2: 9%|▉ | 1139/12384 [2:25:02<23:51:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.04s]
Epoch 2: 9%|▉ | 1139/12384 [2:25:09<23:51:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 2: 9%|▉ | 1140/12384 [2:25:09<23:50:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 2: 9%|▉ | 1140/12384 [2:25:17<23:50:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 9%|▉ | 1141/12384 [2:25:17<23:48:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 9%|▉ | 1141/12384 [2:25:24<23:48:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 2: 9%|▉ | 1142/12384 [2:25:24<23:47:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 2: 9%|▉ | 1142/12384 [2:25:32<23:47:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 9%|▉ | 1143/12384 [2:25:32<23:48:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 9%|▉ | 1143/12384 [2:25:40<23:48:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 2: 9%|▉ | 1144/12384 [2:25:40<23:46:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 2: 9%|▉ | 1144/12384 [2:25:47<23:46:34, 7.62s/it, loss=0.0003, acc=0.9984, iter_time=7.65s]
Epoch 2: 9%|▉ | 1145/12384 [2:25:47<23:46:33, 7.62s/it, loss=0.0003, acc=0.9984, iter_time=7.65s]
Epoch 2: 9%|▉ | 1145/12384 [2:25:55<23:46:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 9%|▉ | 1146/12384 [2:25:55<23:46:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 9%|▉ | 1146/12384 [2:26:03<23:46:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 9%|▉ | 1147/12384 [2:26:03<24:02:56, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 9%|▉ | 1147/12384 [2:26:10<24:02:56, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 9%|▉ | 1148/12384 [2:26:10<23:58:40, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 9%|▉ | 1148/12384 [2:26:18<23:58:40, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 2: 9%|▉ | 1149/12384 [2:26:18<23:57:53, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 2: 9%|▉ | 1149/12384 [2:26:26<23:57:53, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 2: 9%|▉ | 1150/12384 [2:26:26<23:53:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 2: 9%|▉ | 1150/12384 [2:26:33<23:53:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 2: 9%|▉ | 1151/12384 [2:26:33<23:52:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 2: 9%|▉ | 1151/12384 [2:26:41<23:52:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.99s]
Epoch 2: 9%|▉ | 1152/12384 [2:26:41<23:51:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.99s]
Epoch 2: 9%|▉ | 1152/12384 [2:26:49<23:51:06, 7.64s/it, loss=0.0002, acc=0.9991, iter_time=7.21s]
Epoch 2: 9%|▉ | 1153/12384 [2:26:49<23:48:46, 7.63s/it, loss=0.0002, acc=0.9991, iter_time=7.21s]
Epoch 2: 9%|▉ | 1153/12384 [2:26:56<23:48:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 2: 9%|▉ | 1154/12384 [2:26:56<23:48:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 2: 9%|▉ | 1154/12384 [2:27:04<23:48:37, 7.63s/it, loss=0.0001, acc=0.9993, iter_time=9.30s]
Epoch 2: 9%|▉ | 1155/12384 [2:27:04<23:47:44, 7.63s/it, loss=0.0001, acc=0.9993, iter_time=9.30s]
Epoch 2: 9%|▉ | 1155/12384 [2:27:11<23:47:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 2: 9%|▉ | 1156/12384 [2:27:11<23:47:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 2: 9%|▉ | 1156/12384 [2:27:19<23:47:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 9%|▉ | 1157/12384 [2:27:19<23:46:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 9%|▉ | 1157/12384 [2:27:27<23:46:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 9%|▉ | 1158/12384 [2:27:27<23:48:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 9%|▉ | 1158/12384 [2:27:35<23:48:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 9%|▉ | 1159/12384 [2:27:35<24:07:35, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 9%|▉ | 1159/12384 [2:27:42<24:07:35, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 2: 9%|▉ | 1160/12384 [2:27:42<24:01:04, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 2: 9%|▉ | 1160/12384 [2:27:50<24:01:04, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 9%|▉ | 1161/12384 [2:27:50<23:56:36, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 9%|▉ | 1161/12384 [2:27:58<23:56:36, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 2: 9%|▉ | 1162/12384 [2:27:58<23:51:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 2: 9%|▉ | 1162/12384 [2:28:05<23:51:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 2: 9%|▉ | 1163/12384 [2:28:05<23:48:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 2: 9%|▉ | 1163/12384 [2:28:13<23:48:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.54s]
Epoch 2: 9%|▉ | 1164/12384 [2:28:13<23:46:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.54s]
Epoch 2: 9%|▉ | 1164/12384 [2:28:20<23:46:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 9%|▉ | 1165/12384 [2:28:20<23:45:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 9%|▉ | 1165/12384 [2:28:28<23:45:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 2: 9%|▉ | 1166/12384 [2:28:28<23:44:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 2: 9%|▉ | 1166/12384 [2:28:36<23:44:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 9%|▉ | 1167/12384 [2:28:36<23:44:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 9%|▉ | 1167/12384 [2:28:43<23:44:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 9%|▉ | 1168/12384 [2:28:43<23:43:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 9%|▉ | 1168/12384 [2:28:51<23:43:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.92s]
Epoch 2: 9%|▉ | 1169/12384 [2:28:51<23:45:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.92s]
Epoch 2: 9%|▉ | 1169/12384 [2:28:58<23:45:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 2: 9%|▉ | 1170/12384 [2:28:58<23:43:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 2: 9%|▉ | 1170/12384 [2:29:06<23:43:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 2: 9%|▉ | 1171/12384 [2:29:06<23:43:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 2: 9%|▉ | 1171/12384 [2:29:14<23:43:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 2: 9%|▉ | 1172/12384 [2:29:14<23:42:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 2: 9%|▉ | 1172/12384 [2:29:21<23:42:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 9%|▉ | 1173/12384 [2:29:21<23:41:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 9%|▉ | 1173/12384 [2:29:29<23:41:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 2: 9%|▉ | 1174/12384 [2:29:29<23:42:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 2: 9%|▉ | 1174/12384 [2:29:37<23:42:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.24s]
Epoch 2: 9%|▉ | 1175/12384 [2:29:37<23:41:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.24s]
Epoch 2: 9%|▉ | 1175/12384 [2:29:44<23:41:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 2: 9%|▉ | 1176/12384 [2:29:44<23:42:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 2: 9%|▉ | 1176/12384 [2:29:52<23:42:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 10%|▉ | 1177/12384 [2:29:52<23:40:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 10%|▉ | 1177/12384 [2:29:59<23:40:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 10%|▉ | 1178/12384 [2:29:59<23:40:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 10%|▉ | 1178/12384 [2:30:07<23:40:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 2: 10%|▉ | 1179/12384 [2:30:07<23:39:02, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 2: 10%|▉ | 1179/12384 [2:30:15<23:39:02, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.52s]
Epoch 2: 10%|▉ | 1180/12384 [2:30:15<23:39:58, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.52s]
Epoch 2: 10%|▉ | 1180/12384 [2:30:22<23:39:58, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 2: 10%|▉ | 1181/12384 [2:30:22<23:40:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 2: 10%|▉ | 1181/12384 [2:30:30<23:40:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.44s]
Epoch 2: 10%|▉ | 1182/12384 [2:30:30<23:42:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.44s]
Epoch 2: 10%|▉ | 1182/12384 [2:30:37<23:42:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.01s]
Epoch 2: 10%|▉ | 1183/12384 [2:30:37<23:40:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.01s]
Epoch 2: 10%|▉ | 1183/12384 [2:30:45<23:40:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 2: 10%|▉ | 1184/12384 [2:30:45<23:42:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 2: 10%|▉ | 1184/12384 [2:30:53<23:42:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.65s]
Epoch 2: 10%|▉ | 1185/12384 [2:30:53<24:00:46, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.65s]
Epoch 2: 10%|▉ | 1185/12384 [2:31:01<24:00:46, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=9.97s]
Epoch 2: 10%|▉ | 1186/12384 [2:31:01<24:00:57, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=9.97s]
Epoch 2: 10%|▉ | 1186/12384 [2:31:08<24:00:57, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 10%|▉ | 1187/12384 [2:31:08<23:54:00, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 10%|▉ | 1187/12384 [2:31:16<23:54:00, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 10%|▉ | 1188/12384 [2:31:16<23:49:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 10%|▉ | 1188/12384 [2:31:24<23:49:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 2: 10%|▉ | 1189/12384 [2:31:24<23:46:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 2: 10%|▉ | 1189/12384 [2:31:31<23:46:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.62s]
Epoch 2: 10%|▉ | 1190/12384 [2:31:31<23:43:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.62s]
Epoch 2: 10%|▉ | 1190/12384 [2:31:39<23:43:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 10%|▉ | 1191/12384 [2:31:39<23:42:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 10%|▉ | 1191/12384 [2:31:46<23:42:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 10%|▉ | 1192/12384 [2:31:46<23:41:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 10%|▉ | 1192/12384 [2:31:54<23:41:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 10%|▉ | 1193/12384 [2:31:54<23:41:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 10%|▉ | 1193/12384 [2:32:02<23:41:20, 7.62s/it, loss=0.0001, acc=0.9997, iter_time=7.63s]
Epoch 2: 10%|▉ | 1194/12384 [2:32:02<23:40:12, 7.62s/it, loss=0.0001, acc=0.9997, iter_time=7.63s]
Epoch 2: 10%|▉ | 1194/12384 [2:32:09<23:40:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 10%|▉ | 1195/12384 [2:32:09<23:40:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 10%|▉ | 1195/12384 [2:32:17<23:40:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 2: 10%|▉ | 1196/12384 [2:32:17<23:40:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 2: 10%|▉ | 1196/12384 [2:32:24<23:40:29, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 2: 10%|▉ | 1197/12384 [2:32:24<23:39:53, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 2: 10%|▉ | 1197/12384 [2:32:32<23:39:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 10%|▉ | 1198/12384 [2:32:32<23:40:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 10%|▉ | 1198/12384 [2:32:40<23:40:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 10%|▉ | 1199/12384 [2:32:40<23:39:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 10%|▉ | 1199/12384 [2:32:47<23:39:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 2: 10%|▉ | 1200/12384 [2:32:47<23:37:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 2: 10%|▉ | 1200/12384 [2:32:55<23:37:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 2: 10%|▉ | 1201/12384 [2:32:55<23:38:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 2: 10%|▉ | 1201/12384 [2:33:02<23:38:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.99s]
Epoch 2: 10%|▉ | 1202/12384 [2:33:02<23:39:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.99s]
Epoch 2: 10%|▉ | 1202/12384 [2:33:10<23:39:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 10%|▉ | 1203/12384 [2:33:10<23:39:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 10%|▉ | 1203/12384 [2:33:18<23:39:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 10%|▉ | 1204/12384 [2:33:18<23:40:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 10%|▉ | 1204/12384 [2:33:25<23:40:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 10%|▉ | 1205/12384 [2:33:25<23:41:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 10%|▉ | 1205/12384 [2:33:33<23:41:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 10%|▉ | 1206/12384 [2:33:33<23:40:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 10%|▉ | 1206/12384 [2:33:41<23:40:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 10%|▉ | 1207/12384 [2:33:41<23:39:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 10%|▉ | 1207/12384 [2:33:48<23:39:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 2: 10%|▉ | 1208/12384 [2:33:48<23:38:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 2: 10%|▉ | 1208/12384 [2:33:56<23:38:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.60s]
Epoch 2: 10%|▉ | 1209/12384 [2:33:56<23:38:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.60s]
Epoch 2: 10%|▉ | 1209/12384 [2:34:03<23:38:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 2: 10%|▉ | 1210/12384 [2:34:03<23:37:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 2: 10%|▉ | 1210/12384 [2:34:11<23:37:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 10%|▉ | 1211/12384 [2:34:11<23:57:32, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 10%|▉ | 1211/12384 [2:34:19<23:57:32, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 10%|▉ | 1212/12384 [2:34:19<23:51:21, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 10%|▉ | 1212/12384 [2:34:27<23:51:21, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 10%|▉ | 1213/12384 [2:34:27<23:46:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 10%|▉ | 1213/12384 [2:34:34<23:46:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 10%|▉ | 1214/12384 [2:34:34<23:42:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 10%|▉ | 1214/12384 [2:34:42<23:42:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 10%|▉ | 1215/12384 [2:34:42<23:40:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 10%|▉ | 1215/12384 [2:34:49<23:40:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 10%|▉ | 1216/12384 [2:34:49<23:38:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 10%|▉ | 1216/12384 [2:34:57<23:38:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 10%|▉ | 1217/12384 [2:34:57<23:43:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 10%|▉ | 1217/12384 [2:35:05<23:43:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 10%|▉ | 1218/12384 [2:35:05<23:41:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 10%|▉ | 1218/12384 [2:35:12<23:41:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 2: 10%|▉ | 1219/12384 [2:35:12<23:40:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 2: 10%|▉ | 1219/12384 [2:35:20<23:40:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.44s]
Epoch 2: 10%|▉ | 1220/12384 [2:35:20<23:40:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.44s]
Epoch 2: 10%|▉ | 1220/12384 [2:35:28<23:40:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 2: 10%|▉ | 1221/12384 [2:35:28<23:38:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 2: 10%|▉ | 1221/12384 [2:35:35<23:38:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 10%|▉ | 1222/12384 [2:35:35<23:38:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 10%|▉ | 1222/12384 [2:35:43<23:38:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 2: 10%|▉ | 1223/12384 [2:35:43<23:43:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 2: 10%|▉ | 1223/12384 [2:35:51<23:43:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 10%|▉ | 1224/12384 [2:35:51<23:41:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 10%|▉ | 1224/12384 [2:35:58<23:41:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 2: 10%|▉ | 1225/12384 [2:35:58<23:44:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 2: 10%|▉ | 1225/12384 [2:36:06<23:44:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 10%|▉ | 1226/12384 [2:36:06<23:42:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 10%|▉ | 1226/12384 [2:36:14<23:42:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 10%|▉ | 1227/12384 [2:36:14<23:55:24, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 10%|▉ | 1227/12384 [2:36:21<23:55:24, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 10%|▉ | 1228/12384 [2:36:21<23:51:35, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 10%|▉ | 1228/12384 [2:36:29<23:51:35, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.78s]
Epoch 2: 10%|▉ | 1229/12384 [2:36:29<23:46:53, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.78s]
Epoch 2: 10%|▉ | 1229/12384 [2:36:37<23:46:53, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 2: 10%|▉ | 1230/12384 [2:36:37<23:43:07, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 2: 10%|▉ | 1230/12384 [2:36:44<23:43:07, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 2: 10%|▉ | 1231/12384 [2:36:44<23:39:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 2: 10%|▉ | 1231/12384 [2:36:52<23:39:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.20s]
Epoch 2: 10%|▉ | 1232/12384 [2:36:52<23:50:50, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.20s]
Epoch 2: 10%|▉ | 1232/12384 [2:37:00<23:50:50, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.42s]
Epoch 2: 10%|▉ | 1233/12384 [2:37:00<23:45:11, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.42s]
Epoch 2: 10%|▉ | 1233/12384 [2:37:07<23:45:11, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 2: 10%|▉ | 1234/12384 [2:37:07<23:41:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 2: 10%|▉ | 1234/12384 [2:37:15<23:41:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.63s]
Epoch 2: 10%|▉ | 1235/12384 [2:37:15<23:39:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.63s]
Epoch 2: 10%|▉ | 1235/12384 [2:37:23<23:39:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 10%|▉ | 1236/12384 [2:37:23<23:38:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 10%|▉ | 1236/12384 [2:37:30<23:38:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 2: 10%|▉ | 1237/12384 [2:37:30<23:55:59, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 2: 10%|▉ | 1237/12384 [2:37:38<23:55:59, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 2: 10%|▉ | 1238/12384 [2:37:38<23:47:38, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 2: 10%|▉ | 1238/12384 [2:37:46<23:47:38, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 10%|█ | 1239/12384 [2:37:46<23:43:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 10%|█ | 1239/12384 [2:37:53<23:43:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 10%|█ | 1240/12384 [2:37:53<23:40:25, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 10%|█ | 1240/12384 [2:38:01<23:40:25, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.14s]
Epoch 2: 10%|█ | 1241/12384 [2:38:01<23:38:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.14s]
Epoch 2: 10%|█ | 1241/12384 [2:38:08<23:38:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 2: 10%|█ | 1242/12384 [2:38:08<23:36:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 2: 10%|█ | 1242/12384 [2:38:16<23:36:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 10%|█ | 1243/12384 [2:38:16<23:36:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 10%|█ | 1243/12384 [2:38:24<23:36:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 10%|█ | 1244/12384 [2:38:24<23:35:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 10%|█ | 1244/12384 [2:38:31<23:35:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 2: 10%|█ | 1245/12384 [2:38:31<23:35:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 2: 10%|█ | 1245/12384 [2:38:39<23:35:17, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.54s]
Epoch 2: 10%|█ | 1246/12384 [2:38:39<23:34:59, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.54s]
Epoch 2: 10%|█ | 1246/12384 [2:38:47<23:34:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 2: 10%|█ | 1247/12384 [2:38:47<23:35:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 2: 10%|█ | 1247/12384 [2:38:54<23:35:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.36s]
Epoch 2: 10%|█ | 1248/12384 [2:38:54<23:34:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.36s]
Epoch 2: 10%|█ | 1248/12384 [2:39:02<23:34:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.44s]
Epoch 2: 10%|█ | 1249/12384 [2:39:02<23:33:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.44s]
Epoch 2: 10%|█ | 1249/12384 [2:39:09<23:33:28, 7.62s/it, loss=0.0001, acc=0.9993, iter_time=7.31s]
Epoch 2: 10%|█ | 1250/12384 [2:39:09<23:32:29, 7.61s/it, loss=0.0001, acc=0.9993, iter_time=7.31s]
Epoch 2: 10%|█ | 1250/12384 [2:39:17<23:32:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 2: 10%|█ | 1251/12384 [2:39:17<23:33:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 2: 10%|█ | 1251/12384 [2:39:25<23:33:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.73s]
Epoch 2: 10%|█ | 1252/12384 [2:39:25<23:32:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.73s]
Epoch 2: 10%|█ | 1252/12384 [2:39:32<23:32:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.60s]
Epoch 2: 10%|█ | 1253/12384 [2:39:32<23:32:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.60s]
Epoch 2: 10%|█ | 1253/12384 [2:39:40<23:32:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 2: 10%|█ | 1254/12384 [2:39:40<23:32:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 2: 10%|█ | 1254/12384 [2:39:48<23:32:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 2: 10%|█ | 1255/12384 [2:39:48<23:32:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 2: 10%|█ | 1255/12384 [2:39:55<23:32:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 10%|█ | 1256/12384 [2:39:55<23:33:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 10%|█ | 1256/12384 [2:40:03<23:33:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 10%|█ | 1257/12384 [2:40:03<23:32:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 10%|█ | 1257/12384 [2:40:10<23:32:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 10%|█ | 1258/12384 [2:40:10<23:31:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 10%|█ | 1258/12384 [2:40:18<23:31:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 10%|█ | 1259/12384 [2:40:18<23:30:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 10%|█ | 1259/12384 [2:40:26<23:30:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 10%|█ | 1260/12384 [2:40:26<23:30:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 10%|█ | 1260/12384 [2:40:33<23:30:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 10%|█ | 1261/12384 [2:40:33<23:31:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 10%|█ | 1261/12384 [2:40:41<23:31:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 10%|█ | 1262/12384 [2:40:41<23:31:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 10%|█ | 1262/12384 [2:40:48<23:31:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 2: 10%|█ | 1263/12384 [2:40:48<23:31:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 2: 10%|█ | 1263/12384 [2:40:56<23:31:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 2: 10%|█ | 1264/12384 [2:40:56<23:49:27, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 2: 10%|█ | 1264/12384 [2:41:04<23:49:27, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 10%|█ | 1265/12384 [2:41:04<23:49:57, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 10%|█ | 1265/12384 [2:41:12<23:49:57, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 10%|█ | 1266/12384 [2:41:12<23:42:49, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 10%|█ | 1266/12384 [2:41:19<23:42:49, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 10%|█ | 1267/12384 [2:41:19<23:39:31, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 10%|█ | 1267/12384 [2:41:27<23:39:31, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 10%|█ | 1268/12384 [2:41:27<23:35:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 10%|█ | 1268/12384 [2:41:34<23:35:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 10%|█ | 1269/12384 [2:41:34<23:33:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 10%|█ | 1269/12384 [2:41:42<23:33:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 2: 10%|█ | 1270/12384 [2:41:42<23:30:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 2: 10%|█ | 1270/12384 [2:41:50<23:30:27, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.36s]
Epoch 2: 10%|█ | 1271/12384 [2:41:50<23:30:42, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.36s]
Epoch 2: 10%|█ | 1271/12384 [2:41:57<23:30:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 10%|█ | 1272/12384 [2:41:57<23:30:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 10%|█ | 1272/12384 [2:42:05<23:30:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.23s]
Epoch 2: 10%|█ | 1273/12384 [2:42:05<23:31:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.23s]
Epoch 2: 10%|█ | 1273/12384 [2:42:13<23:31:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.61s]
Epoch 2: 10%|█ | 1274/12384 [2:42:13<23:30:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.61s]
Epoch 2: 10%|█ | 1274/12384 [2:42:20<23:30:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 2: 10%|█ | 1275/12384 [2:42:20<23:30:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 2: 10%|█ | 1275/12384 [2:42:28<23:30:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 2: 10%|█ | 1276/12384 [2:42:28<23:30:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 2: 10%|█ | 1276/12384 [2:42:35<23:30:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 2: 10%|█ | 1277/12384 [2:42:35<23:30:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 2: 10%|█ | 1277/12384 [2:42:43<23:30:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 2: 10%|█ | 1278/12384 [2:42:43<23:45:48, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 2: 10%|█ | 1278/12384 [2:42:51<23:45:48, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 10%|█ | 1279/12384 [2:42:51<23:39:47, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 10%|█ | 1279/12384 [2:42:59<23:39:47, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 10%|█ | 1280/12384 [2:42:59<23:40:11, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 10%|█ | 1280/12384 [2:43:06<23:40:11, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 10%|█ | 1281/12384 [2:43:06<23:38:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 10%|█ | 1281/12384 [2:43:14<23:38:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 2: 10%|█ | 1282/12384 [2:43:14<23:37:44, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 2: 10%|█ | 1282/12384 [2:43:22<23:37:44, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.45s]
Epoch 2: 10%|█ | 1283/12384 [2:43:22<23:37:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.45s]
Epoch 2: 10%|█ | 1283/12384 [2:43:29<23:37:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 2: 10%|█ | 1284/12384 [2:43:29<23:32:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 2: 10%|█ | 1284/12384 [2:43:37<23:32:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 2: 10%|█ | 1285/12384 [2:43:37<23:30:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 2: 10%|█ | 1285/12384 [2:43:44<23:30:00, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.19s]
Epoch 2: 10%|█ | 1286/12384 [2:43:44<23:28:23, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.19s]
Epoch 2: 10%|█ | 1286/12384 [2:43:52<23:28:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 10%|█ | 1287/12384 [2:43:52<23:34:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 10%|█ | 1287/12384 [2:44:00<23:34:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 10%|█ | 1288/12384 [2:44:00<23:38:25, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 10%|█ | 1288/12384 [2:44:07<23:38:25, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 10%|█ | 1289/12384 [2:44:07<23:34:57, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 10%|█ | 1289/12384 [2:44:15<23:34:57, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 10%|█ | 1290/12384 [2:44:15<23:51:55, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 10%|█ | 1290/12384 [2:44:23<23:51:55, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 10%|█ | 1291/12384 [2:44:23<23:44:15, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 10%|█ | 1291/12384 [2:44:31<23:44:15, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 10%|█ | 1292/12384 [2:44:31<23:38:33, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 10%|█ | 1292/12384 [2:44:38<23:38:33, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 10%|█ | 1293/12384 [2:44:38<23:34:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 10%|█ | 1293/12384 [2:44:46<23:34:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 10%|█ | 1294/12384 [2:44:46<23:32:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 10%|█ | 1294/12384 [2:44:53<23:32:26, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 2: 10%|█ | 1295/12384 [2:44:53<23:29:59, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 2: 10%|█ | 1295/12384 [2:45:01<23:29:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 10%|█ | 1296/12384 [2:45:01<23:32:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 10%|█ | 1296/12384 [2:45:09<23:32:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 2: 10%|█ | 1297/12384 [2:45:09<23:30:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 2: 10%|█ | 1297/12384 [2:45:16<23:30:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 10%|█ | 1298/12384 [2:45:16<23:27:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 10%|█ | 1298/12384 [2:45:24<23:27:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 10%|█ | 1299/12384 [2:45:24<23:27:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 10%|█ | 1299/12384 [2:45:31<23:27:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 10%|█ | 1300/12384 [2:45:31<23:27:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 10%|█ | 1300/12384 [2:45:39<23:27:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.10s]
Epoch 2: 11%|█ | 1301/12384 [2:45:39<23:27:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.10s]
Epoch 2: 11%|█ | 1301/12384 [2:45:47<23:27:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 2: 11%|█ | 1302/12384 [2:45:47<23:28:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 2: 11%|█ | 1302/12384 [2:45:54<23:28:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 11%|█ | 1303/12384 [2:45:54<23:28:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 11%|█ | 1303/12384 [2:46:02<23:28:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 2: 11%|█ | 1304/12384 [2:46:02<23:42:48, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 2: 11%|█ | 1304/12384 [2:46:10<23:42:48, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.89s]
Epoch 2: 11%|█ | 1305/12384 [2:46:10<23:36:07, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.89s]
Epoch 2: 11%|█ | 1305/12384 [2:46:17<23:36:07, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 2: 11%|█ | 1306/12384 [2:46:17<23:33:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 2: 11%|█ | 1306/12384 [2:46:25<23:33:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 2: 11%|█ | 1307/12384 [2:46:25<23:37:07, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 2: 11%|█ | 1307/12384 [2:46:33<23:37:07, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.79s]
Epoch 2: 11%|█ | 1308/12384 [2:46:33<23:33:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.79s]
Epoch 2: 11%|█ | 1308/12384 [2:46:40<23:33:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 2: 11%|█ | 1309/12384 [2:46:40<23:29:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 2: 11%|█ | 1309/12384 [2:46:48<23:29:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 11%|█ | 1310/12384 [2:46:48<23:32:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 11%|█ | 1310/12384 [2:46:56<23:32:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 11%|█ | 1311/12384 [2:46:56<23:29:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 11%|█ | 1311/12384 [2:47:03<23:29:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 11%|█ | 1312/12384 [2:47:03<23:26:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 11%|█ | 1312/12384 [2:47:11<23:26:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.36s]
Epoch 2: 11%|█ | 1313/12384 [2:47:11<23:24:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.36s]
Epoch 2: 11%|█ | 1313/12384 [2:47:18<23:24:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 11%|█ | 1314/12384 [2:47:18<23:24:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 11%|█ | 1314/12384 [2:47:26<23:24:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.51s]
Epoch 2: 11%|█ | 1315/12384 [2:47:26<23:22:42, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.51s]
Epoch 2: 11%|█ | 1315/12384 [2:47:34<23:22:42, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 2: 11%|█ | 1316/12384 [2:47:34<23:22:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 2: 11%|█ | 1316/12384 [2:47:42<23:22:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 11%|█ | 1317/12384 [2:47:42<23:40:48, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 11%|█ | 1317/12384 [2:47:49<23:40:48, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 11%|█ | 1318/12384 [2:47:49<23:36:47, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 11%|█ | 1318/12384 [2:47:57<23:36:47, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 11%|█ | 1319/12384 [2:47:57<23:33:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 11%|█ | 1319/12384 [2:48:04<23:33:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 11%|█ | 1320/12384 [2:48:04<23:29:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 11%|█ | 1320/12384 [2:48:12<23:29:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.92s]
Epoch 2: 11%|█ | 1321/12384 [2:48:12<23:26:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.92s]
Epoch 2: 11%|█ | 1321/12384 [2:48:20<23:26:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.33s]
Epoch 2: 11%|█ | 1322/12384 [2:48:20<23:25:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.33s]
Epoch 2: 11%|█ | 1322/12384 [2:48:27<23:25:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 2: 11%|█ | 1323/12384 [2:48:27<23:23:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 2: 11%|█ | 1323/12384 [2:48:35<23:23:32, 7.61s/it, loss=0.0054, acc=0.9826, iter_time=11.13s]
Epoch 2: 11%|█ | 1324/12384 [2:48:35<23:23:29, 7.61s/it, loss=0.0054, acc=0.9826, iter_time=11.13s]
Epoch 2: 11%|█ | 1324/12384 [2:48:42<23:23:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 11%|█ | 1325/12384 [2:48:42<23:23:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 11%|█ | 1325/12384 [2:48:50<23:23:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 11%|█ | 1326/12384 [2:48:50<23:22:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 11%|█ | 1326/12384 [2:48:58<23:22:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 11%|█ | 1327/12384 [2:48:58<23:24:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 11%|█ | 1327/12384 [2:49:05<23:24:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.63s]
Epoch 2: 11%|█ | 1328/12384 [2:49:05<23:26:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.63s]
Epoch 2: 11%|█ | 1328/12384 [2:49:13<23:26:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 11%|█ | 1329/12384 [2:49:13<23:27:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 11%|█ | 1329/12384 [2:49:21<23:27:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 2: 11%|█ | 1330/12384 [2:49:21<23:44:12, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 2: 11%|█ | 1330/12384 [2:49:29<23:44:12, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 11%|█ | 1331/12384 [2:49:29<23:36:37, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 11%|█ | 1331/12384 [2:49:36<23:36:37, 7.69s/it, loss=0.0002, acc=0.9996, iter_time=8.01s]
Epoch 2: 11%|█ | 1332/12384 [2:49:36<23:32:29, 7.67s/it, loss=0.0002, acc=0.9996, iter_time=8.01s]
Epoch 2: 11%|█ | 1332/12384 [2:49:44<23:32:29, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.34s]
Epoch 2: 11%|█ | 1333/12384 [2:49:44<23:29:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.34s]
Epoch 2: 11%|█ | 1333/12384 [2:49:51<23:29:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 2: 11%|█ | 1334/12384 [2:49:51<23:27:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 2: 11%|█ | 1334/12384 [2:49:59<23:27:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.59s]
Epoch 2: 11%|█ | 1335/12384 [2:49:59<23:25:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.59s]
Epoch 2: 11%|█ | 1335/12384 [2:50:07<23:25:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.03s]
Epoch 2: 11%|█ | 1336/12384 [2:50:07<23:24:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.03s]
Epoch 2: 11%|█ | 1336/12384 [2:50:14<23:24:34, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.45s]
Epoch 2: 11%|█ | 1337/12384 [2:50:14<23:26:18, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=5.45s]
Epoch 2: 11%|█ | 1337/12384 [2:50:22<23:26:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 2: 11%|█ | 1338/12384 [2:50:22<23:24:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 2: 11%|█ | 1338/12384 [2:50:30<23:24:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 11%|█ | 1339/12384 [2:50:30<23:23:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 11%|█ | 1339/12384 [2:50:37<23:23:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 11%|█ | 1340/12384 [2:50:37<23:21:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 11%|█ | 1340/12384 [2:50:45<23:21:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 11%|█ | 1341/12384 [2:50:45<23:26:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 11%|█ | 1341/12384 [2:50:52<23:26:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 2: 11%|█ | 1342/12384 [2:50:52<23:25:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 2: 11%|█ | 1342/12384 [2:51:00<23:25:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.86s]
Epoch 2: 11%|█ | 1343/12384 [2:51:00<23:42:41, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.86s]
Epoch 2: 11%|█ | 1343/12384 [2:51:08<23:42:41, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.33s]
Epoch 2: 11%|█ | 1344/12384 [2:51:08<23:36:46, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.33s]
Epoch 2: 11%|█ | 1344/12384 [2:51:16<23:36:46, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.00s]
Epoch 2: 11%|█ | 1345/12384 [2:51:16<23:31:26, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.00s]
Epoch 2: 11%|█ | 1345/12384 [2:51:23<23:31:26, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 2: 11%|█ | 1346/12384 [2:51:23<23:27:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 2: 11%|█ | 1346/12384 [2:51:31<23:27:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 2: 11%|█ | 1347/12384 [2:51:31<23:25:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 2: 11%|█ | 1347/12384 [2:51:38<23:25:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 11%|█ | 1348/12384 [2:51:38<23:23:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 11%|█ | 1348/12384 [2:51:46<23:23:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.31s]
Epoch 2: 11%|█ | 1349/12384 [2:51:46<23:22:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.31s]
Epoch 2: 11%|█ | 1349/12384 [2:51:54<23:22:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.91s]
Epoch 2: 11%|█ | 1350/12384 [2:51:54<23:21:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.91s]
Epoch 2: 11%|█ | 1350/12384 [2:52:01<23:21:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 11%|█ | 1351/12384 [2:52:01<23:19:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 11%|█ | 1351/12384 [2:52:09<23:19:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.49s]
Epoch 2: 11%|█ | 1352/12384 [2:52:09<23:16:12, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=7.49s]
Epoch 2: 11%|█ | 1352/12384 [2:52:16<23:16:12, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 11%|█ | 1353/12384 [2:52:16<23:17:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 11%|█ | 1353/12384 [2:52:24<23:17:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 11%|█ | 1354/12384 [2:52:24<23:16:44, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 11%|█ | 1354/12384 [2:52:32<23:16:44, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 2: 11%|█ | 1355/12384 [2:52:32<23:16:34, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 2: 11%|█ | 1355/12384 [2:52:39<23:16:34, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 2: 11%|█ | 1356/12384 [2:52:39<23:32:06, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 2: 11%|█ | 1356/12384 [2:52:47<23:32:06, 7.68s/it, loss=0.0005, acc=0.9968, iter_time=7.60s]
Epoch 2: 11%|█ | 1357/12384 [2:52:47<23:28:23, 7.66s/it, loss=0.0005, acc=0.9968, iter_time=7.60s]
Epoch 2: 11%|█ | 1357/12384 [2:52:55<23:28:23, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 11%|█ | 1358/12384 [2:52:55<23:23:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 11%|█ | 1358/12384 [2:53:02<23:23:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 11%|█ | 1359/12384 [2:53:02<23:22:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 11%|█ | 1359/12384 [2:53:10<23:22:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 11%|█ | 1360/12384 [2:53:10<23:20:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 11%|█ | 1360/12384 [2:53:18<23:20:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 2: 11%|█ | 1361/12384 [2:53:18<23:19:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 2: 11%|█ | 1361/12384 [2:53:25<23:19:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 11%|█ | 1362/12384 [2:53:25<23:18:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 11%|█ | 1362/12384 [2:53:33<23:18:46, 7.61s/it, loss=0.0004, acc=0.9991, iter_time=6.68s]
Epoch 2: 11%|█ | 1363/12384 [2:53:33<23:20:06, 7.62s/it, loss=0.0004, acc=0.9991, iter_time=6.68s]
Epoch 2: 11%|█ | 1363/12384 [2:53:40<23:20:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 2: 11%|█ | 1364/12384 [2:53:40<23:20:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 2: 11%|█ | 1364/12384 [2:53:48<23:20:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 11%|█ | 1365/12384 [2:53:48<23:21:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 11%|█ | 1365/12384 [2:53:56<23:21:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 11%|█ | 1366/12384 [2:53:56<23:21:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 11%|█ | 1366/12384 [2:54:03<23:21:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 11%|█ | 1367/12384 [2:54:03<23:20:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 11%|█ | 1367/12384 [2:54:11<23:20:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 11%|█ | 1368/12384 [2:54:11<23:20:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 11%|█ | 1368/12384 [2:54:19<23:20:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.78s]
Epoch 2: 11%|█ | 1369/12384 [2:54:19<23:36:06, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.78s]
Epoch 2: 11%|█ | 1369/12384 [2:54:26<23:36:06, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 2: 11%|█ | 1370/12384 [2:54:26<23:30:51, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 2: 11%|█ | 1370/12384 [2:54:34<23:30:51, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 2: 11%|█ | 1371/12384 [2:54:34<23:29:05, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 2: 11%|█ | 1371/12384 [2:54:42<23:29:05, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 11%|█ | 1372/12384 [2:54:42<23:24:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 11%|█ | 1372/12384 [2:54:49<23:24:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 11%|█ | 1373/12384 [2:54:49<23:22:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 11%|█ | 1373/12384 [2:54:57<23:22:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 2: 11%|█ | 1374/12384 [2:54:57<23:20:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 2: 11%|█ | 1374/12384 [2:55:05<23:20:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 2: 11%|█ | 1375/12384 [2:55:05<23:18:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 2: 11%|█ | 1375/12384 [2:55:12<23:18:33, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.54s]
Epoch 2: 11%|█ | 1376/12384 [2:55:12<23:17:21, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.54s]
Epoch 2: 11%|█ | 1376/12384 [2:55:20<23:17:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 2: 11%|█ | 1377/12384 [2:55:20<23:16:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 2: 11%|█ | 1377/12384 [2:55:27<23:16:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 2: 11%|█ | 1378/12384 [2:55:27<23:14:57, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 2: 11%|█ | 1378/12384 [2:55:35<23:14:57, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 2: 11%|█ | 1379/12384 [2:55:35<23:14:27, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 2: 11%|█ | 1379/12384 [2:55:42<23:14:27, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 2: 11%|█ | 1380/12384 [2:55:42<23:13:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 2: 11%|█ | 1380/12384 [2:55:50<23:13:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.99s]
Epoch 2: 11%|█ | 1381/12384 [2:55:50<23:14:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.99s]
Epoch 2: 11%|█ | 1381/12384 [2:55:58<23:14:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.83s]
Epoch 2: 11%|█ | 1382/12384 [2:55:58<23:30:20, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.83s]
Epoch 2: 11%|█ | 1382/12384 [2:56:06<23:30:20, 7.69s/it, loss=0.0004, acc=0.9978, iter_time=7.21s]
Epoch 2: 11%|█ | 1383/12384 [2:56:06<23:24:52, 7.66s/it, loss=0.0004, acc=0.9978, iter_time=7.21s]
Epoch 2: 11%|█ | 1383/12384 [2:56:13<23:24:52, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 11%|█ | 1384/12384 [2:56:13<23:22:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 11%|█ | 1384/12384 [2:56:21<23:22:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 2: 11%|█ | 1385/12384 [2:56:21<23:19:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 2: 11%|█ | 1385/12384 [2:56:28<23:19:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.14s]
Epoch 2: 11%|█ | 1386/12384 [2:56:28<23:16:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.14s]
Epoch 2: 11%|█ | 1386/12384 [2:56:36<23:16:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.36s]
Epoch 2: 11%|█ | 1387/12384 [2:56:36<23:14:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.36s]
Epoch 2: 11%|█ | 1387/12384 [2:56:44<23:14:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 11%|█ | 1388/12384 [2:56:44<23:15:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 11%|█ | 1388/12384 [2:56:51<23:15:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 11%|█ | 1389/12384 [2:56:51<23:14:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 11%|█ | 1389/12384 [2:56:59<23:14:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.56s]
Epoch 2: 11%|█ | 1390/12384 [2:56:59<23:15:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.56s]
Epoch 2: 11%|█ | 1390/12384 [2:57:06<23:15:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 2: 11%|█ | 1391/12384 [2:57:06<23:14:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 2: 11%|█ | 1391/12384 [2:57:14<23:14:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.20s]
Epoch 2: 11%|█ | 1392/12384 [2:57:14<23:13:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.20s]
Epoch 2: 11%|█ | 1392/12384 [2:57:22<23:13:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 11%|█ | 1393/12384 [2:57:22<23:13:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 11%|█ | 1393/12384 [2:57:29<23:13:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 11%|█▏ | 1394/12384 [2:57:29<23:12:53, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 11%|█▏ | 1394/12384 [2:57:37<23:12:53, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 2: 11%|█▏ | 1395/12384 [2:57:37<23:30:51, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 2: 11%|█▏ | 1395/12384 [2:57:45<23:30:51, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 2: 11%|█▏ | 1396/12384 [2:57:45<23:24:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 2: 11%|█▏ | 1396/12384 [2:57:52<23:24:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 11%|█▏ | 1397/12384 [2:57:52<23:20:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 11%|█▏ | 1397/12384 [2:58:00<23:20:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 11%|█▏ | 1398/12384 [2:58:00<23:17:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 11%|█▏ | 1398/12384 [2:58:08<23:17:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 2: 11%|█▏ | 1399/12384 [2:58:08<23:15:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 2: 11%|█▏ | 1399/12384 [2:58:15<23:15:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 2: 11%|█▏ | 1400/12384 [2:58:15<23:14:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 2: 11%|█▏ | 1400/12384 [2:58:23<23:14:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 2: 11%|█▏ | 1401/12384 [2:58:23<23:13:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 2: 11%|█▏ | 1401/12384 [2:58:30<23:13:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.68s]
Epoch 2: 11%|█▏ | 1402/12384 [2:58:30<23:13:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.68s]
Epoch 2: 11%|█▏ | 1402/12384 [2:58:38<23:13:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 2: 11%|█▏ | 1403/12384 [2:58:38<23:13:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 2: 11%|█▏ | 1403/12384 [2:58:46<23:13:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 2: 11%|█▏ | 1404/12384 [2:58:46<23:12:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 2: 11%|█▏ | 1404/12384 [2:58:53<23:12:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 11%|█▏ | 1405/12384 [2:58:53<23:12:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 11%|█▏ | 1405/12384 [2:59:01<23:12:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 2: 11%|█▏ | 1406/12384 [2:59:01<23:11:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 2: 11%|█▏ | 1406/12384 [2:59:08<23:11:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 2: 11%|█▏ | 1407/12384 [2:59:08<23:11:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 2: 11%|█▏ | 1407/12384 [2:59:16<23:11:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 11%|█▏ | 1408/12384 [2:59:16<23:13:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 11%|█▏ | 1408/12384 [2:59:24<23:13:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 2: 11%|█▏ | 1409/12384 [2:59:24<23:28:32, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 2: 11%|█▏ | 1409/12384 [2:59:32<23:28:32, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.88s]
Epoch 2: 11%|█▏ | 1410/12384 [2:59:32<23:24:30, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.88s]
Epoch 2: 11%|█▏ | 1410/12384 [2:59:39<23:24:30, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.10s]
Epoch 2: 11%|█▏ | 1411/12384 [2:59:39<23:22:25, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.10s]
Epoch 2: 11%|█▏ | 1411/12384 [2:59:47<23:22:25, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 11%|█▏ | 1412/12384 [2:59:47<23:17:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 11%|█▏ | 1412/12384 [2:59:54<23:17:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 11%|█▏ | 1413/12384 [2:59:54<23:16:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 11%|█▏ | 1413/12384 [3:00:02<23:16:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 2: 11%|█▏ | 1414/12384 [3:00:02<23:13:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 2: 11%|█▏ | 1414/12384 [3:00:10<23:13:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 2: 11%|█▏ | 1415/12384 [3:00:10<23:11:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 2: 11%|█▏ | 1415/12384 [3:00:17<23:11:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 2: 11%|█▏ | 1416/12384 [3:00:17<23:11:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 2: 11%|█▏ | 1416/12384 [3:00:25<23:11:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 2: 11%|█▏ | 1417/12384 [3:00:25<23:11:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 2: 11%|█▏ | 1417/12384 [3:00:32<23:11:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 11%|█▏ | 1418/12384 [3:00:32<23:11:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 11%|█▏ | 1418/12384 [3:00:40<23:11:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 11%|█▏ | 1419/12384 [3:00:40<23:10:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 11%|█▏ | 1419/12384 [3:00:48<23:10:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 2: 11%|█▏ | 1420/12384 [3:00:48<23:10:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 2: 11%|█▏ | 1420/12384 [3:00:56<23:10:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 2: 11%|█▏ | 1421/12384 [3:00:56<23:27:45, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 2: 11%|█▏ | 1421/12384 [3:01:03<23:27:45, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 2: 11%|█▏ | 1422/12384 [3:01:03<23:22:25, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 2: 11%|█▏ | 1422/12384 [3:01:11<23:22:25, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.37s]
Epoch 2: 11%|█▏ | 1423/12384 [3:01:11<23:18:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.37s]
Epoch 2: 11%|█▏ | 1423/12384 [3:01:18<23:18:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 11%|█▏ | 1424/12384 [3:01:18<23:15:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 11%|█▏ | 1424/12384 [3:01:26<23:15:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.20s]
Epoch 2: 12%|█▏ | 1425/12384 [3:01:26<23:14:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.20s]
Epoch 2: 12%|█▏ | 1425/12384 [3:01:34<23:14:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.67s]
Epoch 2: 12%|█▏ | 1426/12384 [3:01:34<23:16:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.67s]
Epoch 2: 12%|█▏ | 1426/12384 [3:01:41<23:16:30, 7.65s/it, loss=0.0011, acc=0.9981, iter_time=5.10s]
Epoch 2: 12%|█▏ | 1427/12384 [3:01:41<23:15:14, 7.64s/it, loss=0.0011, acc=0.9981, iter_time=5.10s]
Epoch 2: 12%|█▏ | 1427/12384 [3:01:49<23:15:14, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=10.18s]
Epoch 2: 12%|█▏ | 1428/12384 [3:01:49<23:14:29, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=10.18s]
Epoch 2: 12%|█▏ | 1428/12384 [3:01:57<23:14:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 12%|█▏ | 1429/12384 [3:01:57<23:13:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 12%|█▏ | 1429/12384 [3:02:04<23:13:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 12%|█▏ | 1430/12384 [3:02:04<23:12:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 12%|█▏ | 1430/12384 [3:02:12<23:12:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 2: 12%|█▏ | 1431/12384 [3:02:12<23:12:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 2: 12%|█▏ | 1431/12384 [3:02:19<23:12:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.19s]
Epoch 2: 12%|█▏ | 1432/12384 [3:02:19<23:13:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.19s]
Epoch 2: 12%|█▏ | 1432/12384 [3:02:27<23:13:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 12%|█▏ | 1433/12384 [3:02:27<23:11:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 12%|█▏ | 1433/12384 [3:02:35<23:11:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 12%|█▏ | 1434/12384 [3:02:35<23:11:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 12%|█▏ | 1434/12384 [3:02:42<23:11:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 12%|█▏ | 1435/12384 [3:02:42<23:12:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 12%|█▏ | 1435/12384 [3:02:50<23:12:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 2: 12%|█▏ | 1436/12384 [3:02:50<23:11:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 2: 12%|█▏ | 1436/12384 [3:02:58<23:11:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 2: 12%|█▏ | 1437/12384 [3:02:58<23:10:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 2: 12%|█▏ | 1437/12384 [3:03:05<23:10:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 12%|█▏ | 1438/12384 [3:03:05<23:09:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 12%|█▏ | 1438/12384 [3:03:13<23:09:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 2: 12%|█▏ | 1439/12384 [3:03:13<23:09:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 2: 12%|█▏ | 1439/12384 [3:03:20<23:09:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 12%|█▏ | 1440/12384 [3:03:20<23:11:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 12%|█▏ | 1440/12384 [3:03:28<23:11:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 12%|█▏ | 1441/12384 [3:03:28<23:09:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 12%|█▏ | 1441/12384 [3:03:36<23:09:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 2: 12%|█▏ | 1442/12384 [3:03:36<23:08:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 2: 12%|█▏ | 1442/12384 [3:03:43<23:08:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 12%|█▏ | 1443/12384 [3:03:43<23:07:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 12%|█▏ | 1443/12384 [3:03:51<23:07:39, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.71s]
Epoch 2: 12%|█▏ | 1444/12384 [3:03:51<23:07:48, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.71s]
Epoch 2: 12%|█▏ | 1444/12384 [3:03:58<23:07:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 2: 12%|█▏ | 1445/12384 [3:03:58<23:06:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 2: 12%|█▏ | 1445/12384 [3:04:06<23:06:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 2: 12%|█▏ | 1446/12384 [3:04:06<23:07:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 2: 12%|█▏ | 1446/12384 [3:04:14<23:07:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 2: 12%|█▏ | 1447/12384 [3:04:14<23:07:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 2: 12%|█▏ | 1447/12384 [3:04:22<23:07:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 2: 12%|█▏ | 1448/12384 [3:04:22<23:29:30, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 2: 12%|█▏ | 1448/12384 [3:04:29<23:29:30, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 12%|█▏ | 1449/12384 [3:04:29<23:21:31, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 12%|█▏ | 1449/12384 [3:04:37<23:21:31, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 12%|█▏ | 1450/12384 [3:04:37<23:17:09, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 12%|█▏ | 1450/12384 [3:04:44<23:17:09, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 12%|█▏ | 1451/12384 [3:04:44<23:12:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 12%|█▏ | 1451/12384 [3:04:52<23:12:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 12%|█▏ | 1452/12384 [3:04:52<23:13:25, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 12%|█▏ | 1452/12384 [3:05:00<23:13:25, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=6.68s]
Epoch 2: 12%|█▏ | 1453/12384 [3:05:00<23:11:59, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.68s]
Epoch 2: 12%|█▏ | 1453/12384 [3:05:07<23:11:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 2: 12%|█▏ | 1454/12384 [3:05:07<23:09:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 2: 12%|█▏ | 1454/12384 [3:05:15<23:09:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 2: 12%|█▏ | 1455/12384 [3:05:15<23:07:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 2: 12%|█▏ | 1455/12384 [3:05:23<23:07:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.74s]
Epoch 2: 12%|█▏ | 1456/12384 [3:05:23<23:07:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.74s]
Epoch 2: 12%|█▏ | 1456/12384 [3:05:30<23:07:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 12%|█▏ | 1457/12384 [3:05:30<23:07:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 12%|█▏ | 1457/12384 [3:05:38<23:07:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 12%|█▏ | 1458/12384 [3:05:38<23:07:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 12%|█▏ | 1458/12384 [3:05:45<23:07:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 2: 12%|█▏ | 1459/12384 [3:05:45<23:06:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 2: 12%|█▏ | 1459/12384 [3:05:53<23:06:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.46s]
Epoch 2: 12%|█▏ | 1460/12384 [3:05:53<23:06:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.46s]
Epoch 2: 12%|█▏ | 1460/12384 [3:06:01<23:06:30, 7.62s/it, loss=0.0003, acc=0.9993, iter_time=7.91s]
Epoch 2: 12%|█▏ | 1461/12384 [3:06:01<23:20:51, 7.69s/it, loss=0.0003, acc=0.9993, iter_time=7.91s]
Epoch 2: 12%|█▏ | 1461/12384 [3:06:09<23:20:51, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 2: 12%|█▏ | 1462/12384 [3:06:09<23:16:42, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 2: 12%|█▏ | 1462/12384 [3:06:16<23:16:42, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 2: 12%|█▏ | 1463/12384 [3:06:16<23:13:58, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 2: 12%|█▏ | 1463/12384 [3:06:24<23:13:58, 7.66s/it, loss=0.0003, acc=0.9996, iter_time=9.39s]
Epoch 2: 12%|█▏ | 1464/12384 [3:06:24<23:12:04, 7.65s/it, loss=0.0003, acc=0.9996, iter_time=9.39s]
Epoch 2: 12%|█▏ | 1464/12384 [3:06:31<23:12:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 2: 12%|█▏ | 1465/12384 [3:06:31<23:10:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 2: 12%|█▏ | 1465/12384 [3:06:39<23:10:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 2: 12%|█▏ | 1466/12384 [3:06:39<23:07:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 2: 12%|█▏ | 1466/12384 [3:06:47<23:07:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 2: 12%|█▏ | 1467/12384 [3:06:47<23:06:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 2: 12%|█▏ | 1467/12384 [3:06:54<23:06:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 2: 12%|█▏ | 1468/12384 [3:06:54<23:05:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 2: 12%|█▏ | 1468/12384 [3:07:02<23:05:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.31s]
Epoch 2: 12%|█▏ | 1469/12384 [3:07:02<23:05:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.31s]
Epoch 2: 12%|█▏ | 1469/12384 [3:07:09<23:05:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.91s]
Epoch 2: 12%|█▏ | 1470/12384 [3:07:09<23:04:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.91s]
Epoch 2: 12%|█▏ | 1470/12384 [3:07:17<23:04:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 12%|█▏ | 1471/12384 [3:07:17<23:03:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 12%|█▏ | 1471/12384 [3:07:25<23:03:50, 7.61s/it, loss=0.0008, acc=0.9976, iter_time=8.01s]
Epoch 2: 12%|█▏ | 1472/12384 [3:07:25<23:03:29, 7.61s/it, loss=0.0008, acc=0.9976, iter_time=8.01s]
Epoch 2: 12%|█▏ | 1472/12384 [3:07:32<23:03:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 2: 12%|█▏ | 1473/12384 [3:07:32<23:07:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 2: 12%|█▏ | 1473/12384 [3:07:40<23:07:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 2: 12%|█▏ | 1474/12384 [3:07:40<23:23:59, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 2: 12%|█▏ | 1474/12384 [3:07:48<23:23:59, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 2: 12%|█▏ | 1475/12384 [3:07:48<23:16:33, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 2: 12%|█▏ | 1475/12384 [3:07:55<23:16:33, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 2: 12%|█▏ | 1476/12384 [3:07:55<23:12:37, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 2: 12%|█▏ | 1476/12384 [3:08:03<23:12:37, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 2: 12%|█▏ | 1477/12384 [3:08:03<23:09:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 2: 12%|█▏ | 1477/12384 [3:08:11<23:09:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 2: 12%|█▏ | 1478/12384 [3:08:11<23:07:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 2: 12%|█▏ | 1478/12384 [3:08:18<23:07:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 12%|█▏ | 1479/12384 [3:08:18<23:05:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 12%|█▏ | 1479/12384 [3:08:26<23:05:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 12%|█▏ | 1480/12384 [3:08:26<23:05:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 12%|█▏ | 1480/12384 [3:08:34<23:05:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 2: 12%|█▏ | 1481/12384 [3:08:34<23:10:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 2: 12%|█▏ | 1481/12384 [3:08:41<23:10:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 12%|█▏ | 1482/12384 [3:08:41<23:08:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 12%|█▏ | 1482/12384 [3:08:49<23:08:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 12%|█▏ | 1483/12384 [3:08:49<23:06:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 12%|█▏ | 1483/12384 [3:08:56<23:06:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 12%|█▏ | 1484/12384 [3:08:56<23:03:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 12%|█▏ | 1484/12384 [3:09:04<23:03:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.47s]
Epoch 2: 12%|█▏ | 1485/12384 [3:09:04<22:59:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.47s]
Epoch 2: 12%|█▏ | 1485/12384 [3:09:12<22:59:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.60s]
Epoch 2: 12%|█▏ | 1486/12384 [3:09:12<23:00:57, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.60s]
Epoch 2: 12%|█▏ | 1486/12384 [3:09:19<23:00:57, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 12%|█▏ | 1487/12384 [3:09:19<23:16:50, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 12%|█▏ | 1487/12384 [3:09:27<23:16:50, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 2: 12%|█▏ | 1488/12384 [3:09:27<23:18:43, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 2: 12%|█▏ | 1488/12384 [3:09:35<23:18:43, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.90s]
Epoch 2: 12%|█▏ | 1489/12384 [3:09:35<23:12:44, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.90s]
Epoch 2: 12%|█▏ | 1489/12384 [3:09:42<23:12:44, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=9.07s]
Epoch 2: 12%|█▏ | 1490/12384 [3:09:42<23:09:21, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=9.07s]
Epoch 2: 12%|█▏ | 1490/12384 [3:09:50<23:09:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 2: 12%|█▏ | 1491/12384 [3:09:50<23:05:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 2: 12%|█▏ | 1491/12384 [3:09:58<23:05:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 12%|█▏ | 1492/12384 [3:09:58<23:03:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 12%|█▏ | 1492/12384 [3:10:05<23:03:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 2: 12%|█▏ | 1493/12384 [3:10:05<23:07:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 2: 12%|█▏ | 1493/12384 [3:10:13<23:07:56, 7.65s/it, loss=0.0008, acc=0.9969, iter_time=6.35s]
Epoch 2: 12%|█▏ | 1494/12384 [3:10:13<23:04:05, 7.63s/it, loss=0.0008, acc=0.9969, iter_time=6.35s]
Epoch 2: 12%|█▏ | 1494/12384 [3:10:21<23:04:05, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.70s]
Epoch 2: 12%|█▏ | 1495/12384 [3:10:21<23:03:56, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.70s]
Epoch 2: 12%|█▏ | 1495/12384 [3:10:28<23:03:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.76s]
Epoch 2: 12%|█▏ | 1496/12384 [3:10:28<23:03:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.76s]
Epoch 2: 12%|█▏ | 1496/12384 [3:10:36<23:03:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 12%|█▏ | 1497/12384 [3:10:36<23:02:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 12%|█▏ | 1497/12384 [3:10:43<23:02:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 2: 12%|█▏ | 1498/12384 [3:10:43<23:02:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 2: 12%|█▏ | 1498/12384 [3:10:51<23:02:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.60s]
Epoch 2: 12%|█▏ | 1499/12384 [3:10:51<23:02:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.60s]
Epoch 2: 12%|█▏ | 1499/12384 [3:10:59<23:02:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.26s]
Epoch 2: 12%|█▏ | 1500/12384 [3:10:59<23:07:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.26s]
Epoch 2: 12%|█▏ | 1500/12384 [3:11:07<23:07:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 2: 12%|█▏ | 1501/12384 [3:11:07<23:23:16, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 2: 12%|█▏ | 1501/12384 [3:11:14<23:23:16, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 12%|█▏ | 1502/12384 [3:11:14<23:19:28, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 12%|█▏ | 1502/12384 [3:11:22<23:19:28, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 2: 12%|█▏ | 1503/12384 [3:11:22<23:13:32, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 2: 12%|█▏ | 1503/12384 [3:11:30<23:13:32, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 2: 12%|█▏ | 1504/12384 [3:11:30<23:09:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 2: 12%|█▏ | 1504/12384 [3:11:37<23:09:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 12%|█▏ | 1505/12384 [3:11:37<23:06:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 12%|█▏ | 1505/12384 [3:11:45<23:06:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 12%|█▏ | 1506/12384 [3:11:45<23:04:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 12%|█▏ | 1506/12384 [3:11:52<23:04:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 12%|█▏ | 1507/12384 [3:11:52<23:01:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 12%|█▏ | 1507/12384 [3:12:00<23:01:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 12%|█▏ | 1508/12384 [3:12:00<23:04:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 12%|█▏ | 1508/12384 [3:12:08<23:04:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 2: 12%|█▏ | 1509/12384 [3:12:08<23:05:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 2: 12%|█▏ | 1509/12384 [3:12:15<23:05:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.48s]
Epoch 2: 12%|█▏ | 1510/12384 [3:12:15<23:03:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.48s]
Epoch 2: 12%|█▏ | 1510/12384 [3:12:23<23:03:17, 7.63s/it, loss=0.0002, acc=0.9989, iter_time=7.92s]
Epoch 2: 12%|█▏ | 1511/12384 [3:12:23<23:02:59, 7.63s/it, loss=0.0002, acc=0.9989, iter_time=7.92s]
Epoch 2: 12%|█▏ | 1511/12384 [3:12:31<23:02:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 12%|█▏ | 1512/12384 [3:12:31<23:01:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 12%|█▏ | 1512/12384 [3:12:38<23:01:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.49s]
Epoch 2: 12%|█▏ | 1513/12384 [3:12:38<23:15:06, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.49s]
Epoch 2: 12%|█▏ | 1513/12384 [3:12:46<23:15:06, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 12%|█▏ | 1514/12384 [3:12:46<23:10:21, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 12%|█▏ | 1514/12384 [3:12:54<23:10:21, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 12%|█▏ | 1515/12384 [3:12:54<23:06:42, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 12%|█▏ | 1515/12384 [3:13:01<23:06:42, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=6.69s]
Epoch 2: 12%|█▏ | 1516/12384 [3:13:01<23:03:35, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.69s]
Epoch 2: 12%|█▏ | 1516/12384 [3:13:09<23:03:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 2: 12%|█▏ | 1517/12384 [3:13:09<23:07:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 2: 12%|█▏ | 1517/12384 [3:13:17<23:07:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.15s]
Epoch 2: 12%|█▏ | 1518/12384 [3:13:17<23:05:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.15s]
Epoch 2: 12%|█▏ | 1518/12384 [3:13:24<23:05:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 2: 12%|█▏ | 1519/12384 [3:13:24<23:02:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 2: 12%|█▏ | 1519/12384 [3:13:32<23:02:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 12%|█▏ | 1520/12384 [3:13:32<23:04:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 12%|█▏ | 1520/12384 [3:13:39<23:04:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.67s]
Epoch 2: 12%|█▏ | 1521/12384 [3:13:39<23:01:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.67s]
Epoch 2: 12%|█▏ | 1521/12384 [3:13:47<23:01:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 2: 12%|█▏ | 1522/12384 [3:13:47<23:00:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 2: 12%|█▏ | 1522/12384 [3:13:55<23:00:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 12%|█▏ | 1523/12384 [3:13:55<22:58:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 12%|█▏ | 1523/12384 [3:14:02<22:58:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 12%|█▏ | 1524/12384 [3:14:02<22:57:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 12%|█▏ | 1524/12384 [3:14:10<22:57:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 2: 12%|█▏ | 1525/12384 [3:14:10<22:57:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 2: 12%|█▏ | 1525/12384 [3:14:17<22:57:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 2: 12%|█▏ | 1526/12384 [3:14:17<22:57:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 2: 12%|█▏ | 1526/12384 [3:14:25<22:57:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 2: 12%|█▏ | 1527/12384 [3:14:25<23:16:16, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 2: 12%|█▏ | 1527/12384 [3:14:33<23:16:16, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=11.19s]
Epoch 2: 12%|█▏ | 1528/12384 [3:14:33<23:11:04, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=11.19s]
Epoch 2: 12%|█▏ | 1528/12384 [3:14:41<23:11:04, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 12%|█▏ | 1529/12384 [3:14:41<23:06:56, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 12%|█▏ | 1529/12384 [3:14:48<23:06:56, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.56s]
Epoch 2: 12%|█▏ | 1530/12384 [3:14:48<23:03:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.56s]
Epoch 2: 12%|█▏ | 1530/12384 [3:14:56<23:03:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.35s]
Epoch 2: 12%|█▏ | 1531/12384 [3:14:56<23:00:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.35s]
Epoch 2: 12%|█▏ | 1531/12384 [3:15:03<23:00:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.31s]
Epoch 2: 12%|█▏ | 1532/12384 [3:15:03<22:59:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.31s]
Epoch 2: 12%|█▏ | 1532/12384 [3:15:11<22:59:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.92s]
Epoch 2: 12%|█▏ | 1533/12384 [3:15:11<22:59:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.92s]
Epoch 2: 12%|█▏ | 1533/12384 [3:15:19<22:59:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 12%|█▏ | 1534/12384 [3:15:19<22:58:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 12%|█▏ | 1534/12384 [3:15:26<22:58:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 12%|█▏ | 1535/12384 [3:15:26<23:00:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 12%|█▏ | 1535/12384 [3:15:34<23:00:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 2: 12%|█▏ | 1536/12384 [3:15:34<22:57:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 2: 12%|█▏ | 1536/12384 [3:15:42<22:57:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 12%|█▏ | 1537/12384 [3:15:42<22:57:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 12%|█▏ | 1537/12384 [3:15:49<22:57:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 12%|█▏ | 1538/12384 [3:15:49<22:56:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 12%|█▏ | 1538/12384 [3:15:57<22:56:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 12%|█▏ | 1539/12384 [3:15:57<23:11:50, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 12%|█▏ | 1539/12384 [3:16:05<23:11:50, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 12%|█▏ | 1540/12384 [3:16:05<23:06:50, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 12%|█▏ | 1540/12384 [3:16:12<23:06:50, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 12%|█▏ | 1541/12384 [3:16:12<23:03:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 12%|█▏ | 1541/12384 [3:16:20<23:03:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 2: 12%|█▏ | 1542/12384 [3:16:20<22:59:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 2: 12%|█▏ | 1542/12384 [3:16:28<22:59:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 2: 12%|█▏ | 1543/12384 [3:16:28<22:59:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 2: 12%|█▏ | 1543/12384 [3:16:35<22:59:43, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.15s]
Epoch 2: 12%|█▏ | 1544/12384 [3:16:35<22:56:59, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.15s]
Epoch 2: 12%|█▏ | 1544/12384 [3:16:43<22:56:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 12%|█▏ | 1545/12384 [3:16:43<22:56:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 12%|█▏ | 1545/12384 [3:16:50<22:56:44, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.16s]
Epoch 2: 12%|█▏ | 1546/12384 [3:16:50<22:56:10, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.16s]
Epoch 2: 12%|█▏ | 1546/12384 [3:16:58<22:56:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 2: 12%|█▏ | 1547/12384 [3:16:58<22:54:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 2: 12%|█▏ | 1547/12384 [3:17:06<22:54:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 12%|█▎ | 1548/12384 [3:17:06<22:54:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 12%|█▎ | 1548/12384 [3:17:13<22:54:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 13%|█▎ | 1549/12384 [3:17:13<22:55:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 13%|█▎ | 1549/12384 [3:17:21<22:55:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 13%|█▎ | 1550/12384 [3:17:21<22:54:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 13%|█▎ | 1550/12384 [3:17:28<22:54:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 13%|█▎ | 1551/12384 [3:17:28<22:55:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 13%|█▎ | 1551/12384 [3:17:36<22:55:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 13%|█▎ | 1552/12384 [3:17:36<22:54:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 13%|█▎ | 1552/12384 [3:17:44<22:54:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 2: 13%|█▎ | 1553/12384 [3:17:44<23:12:57, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 2: 13%|█▎ | 1553/12384 [3:17:52<23:12:57, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=4.87s]
Epoch 2: 13%|█▎ | 1554/12384 [3:17:52<23:07:10, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.87s]
Epoch 2: 13%|█▎ | 1554/12384 [3:17:59<23:07:10, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 2: 13%|█▎ | 1555/12384 [3:17:59<23:09:10, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 2: 13%|█▎ | 1555/12384 [3:18:07<23:09:10, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 13%|█▎ | 1556/12384 [3:18:07<23:04:00, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 13%|█▎ | 1556/12384 [3:18:15<23:04:00, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 13%|█▎ | 1557/12384 [3:18:15<23:00:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 13%|█▎ | 1557/12384 [3:18:22<23:00:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 13%|█▎ | 1558/12384 [3:18:22<22:58:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 13%|█▎ | 1558/12384 [3:18:30<22:58:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 2: 13%|█▎ | 1559/12384 [3:18:30<22:57:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 2: 13%|█▎ | 1559/12384 [3:18:37<22:57:49, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.20s]
Epoch 2: 13%|█▎ | 1560/12384 [3:18:37<22:56:00, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.20s]
Epoch 2: 13%|█▎ | 1560/12384 [3:18:45<22:56:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 13%|█▎ | 1561/12384 [3:18:45<22:53:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 13%|█▎ | 1561/12384 [3:18:53<22:53:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 2: 13%|█▎ | 1562/12384 [3:18:53<22:51:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 2: 13%|█▎ | 1562/12384 [3:19:00<22:51:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 2: 13%|█▎ | 1563/12384 [3:19:00<22:52:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 2: 13%|█▎ | 1563/12384 [3:19:08<22:52:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 2: 13%|█▎ | 1564/12384 [3:19:08<22:50:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 2: 13%|█▎ | 1564/12384 [3:19:15<22:50:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 2: 13%|█▎ | 1565/12384 [3:19:15<22:49:57, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 2: 13%|█▎ | 1565/12384 [3:19:23<22:49:57, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 2: 13%|█▎ | 1566/12384 [3:19:23<23:08:12, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 2: 13%|█▎ | 1566/12384 [3:19:31<23:08:12, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 13%|█▎ | 1567/12384 [3:19:31<23:02:16, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 13%|█▎ | 1567/12384 [3:19:39<23:02:16, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 13%|█▎ | 1568/12384 [3:19:39<23:02:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 13%|█▎ | 1568/12384 [3:19:46<23:02:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 13%|█▎ | 1569/12384 [3:19:46<22:59:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 13%|█▎ | 1569/12384 [3:19:54<22:59:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 13%|█▎ | 1570/12384 [3:19:54<22:57:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 13%|█▎ | 1570/12384 [3:20:01<22:57:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 13%|█▎ | 1571/12384 [3:20:01<22:55:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 13%|█▎ | 1571/12384 [3:20:09<22:55:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 13%|█▎ | 1572/12384 [3:20:09<22:53:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 13%|█▎ | 1572/12384 [3:20:17<22:53:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.39s]
Epoch 2: 13%|█▎ | 1573/12384 [3:20:17<22:51:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.39s]
Epoch 2: 13%|█▎ | 1573/12384 [3:20:24<22:51:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 2: 13%|█▎ | 1574/12384 [3:20:24<22:50:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 2: 13%|█▎ | 1574/12384 [3:20:32<22:50:28, 7.61s/it, loss=0.0002, acc=0.9998, iter_time=7.30s]
Epoch 2: 13%|█▎ | 1575/12384 [3:20:32<22:49:41, 7.60s/it, loss=0.0002, acc=0.9998, iter_time=7.30s]
Epoch 2: 13%|█▎ | 1575/12384 [3:20:39<22:49:41, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 2: 13%|█▎ | 1576/12384 [3:20:39<22:49:27, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 2: 13%|█▎ | 1576/12384 [3:20:47<22:49:27, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 2: 13%|█▎ | 1577/12384 [3:20:47<22:48:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 2: 13%|█▎ | 1577/12384 [3:20:55<22:48:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 2: 13%|█▎ | 1578/12384 [3:20:55<22:48:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 2: 13%|█▎ | 1578/12384 [3:21:03<22:48:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 2: 13%|█▎ | 1579/12384 [3:21:03<23:18:02, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 2: 13%|█▎ | 1579/12384 [3:21:10<23:18:02, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 2: 13%|█▎ | 1580/12384 [3:21:10<23:12:09, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 2: 13%|█▎ | 1580/12384 [3:21:18<23:12:09, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 13%|█▎ | 1581/12384 [3:21:18<23:05:32, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 13%|█▎ | 1581/12384 [3:21:26<23:05:32, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 13%|█▎ | 1582/12384 [3:21:26<23:01:14, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 13%|█▎ | 1582/12384 [3:21:33<23:01:14, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 13%|█▎ | 1583/12384 [3:21:33<22:56:57, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 13%|█▎ | 1583/12384 [3:21:41<22:56:57, 7.65s/it, loss=0.0003, acc=0.9999, iter_time=8.00s]
Epoch 2: 13%|█▎ | 1584/12384 [3:21:41<22:55:39, 7.64s/it, loss=0.0003, acc=0.9999, iter_time=8.00s]
Epoch 2: 13%|█▎ | 1584/12384 [3:21:48<22:55:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 13%|█▎ | 1585/12384 [3:21:48<22:54:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 13%|█▎ | 1585/12384 [3:21:56<22:54:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 2: 13%|█▎ | 1586/12384 [3:21:56<22:52:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 2: 13%|█▎ | 1586/12384 [3:22:04<22:52:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.68s]
Epoch 2: 13%|█▎ | 1587/12384 [3:22:04<22:51:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.68s]
Epoch 2: 13%|█▎ | 1587/12384 [3:22:11<22:51:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 2: 13%|█▎ | 1588/12384 [3:22:11<22:51:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 2: 13%|█▎ | 1588/12384 [3:22:19<22:51:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 13%|█▎ | 1589/12384 [3:22:19<22:50:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 13%|█▎ | 1589/12384 [3:22:26<22:50:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 2: 13%|█▎ | 1590/12384 [3:22:26<22:48:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 2: 13%|█▎ | 1590/12384 [3:22:34<22:48:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 13%|█▎ | 1591/12384 [3:22:34<22:48:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 13%|█▎ | 1591/12384 [3:22:42<22:48:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.42s]
Epoch 2: 13%|█▎ | 1592/12384 [3:22:42<22:52:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.42s]
Epoch 2: 13%|█▎ | 1592/12384 [3:22:49<22:52:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.75s]
Epoch 2: 13%|█▎ | 1593/12384 [3:22:49<22:48:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.75s]
Epoch 2: 13%|█▎ | 1593/12384 [3:22:57<22:48:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.41s]
Epoch 2: 13%|█▎ | 1594/12384 [3:22:57<22:48:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.41s]
Epoch 2: 13%|█▎ | 1594/12384 [3:23:05<22:48:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 2: 13%|█▎ | 1595/12384 [3:23:05<22:48:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 2: 13%|█▎ | 1595/12384 [3:23:12<22:48:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 13%|█▎ | 1596/12384 [3:23:12<22:48:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 13%|█▎ | 1596/12384 [3:23:20<22:48:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 13%|█▎ | 1597/12384 [3:23:20<22:47:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 13%|█▎ | 1597/12384 [3:23:27<22:47:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 13%|█▎ | 1598/12384 [3:23:27<22:47:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 13%|█▎ | 1598/12384 [3:23:35<22:47:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 13%|█▎ | 1599/12384 [3:23:35<22:48:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 13%|█▎ | 1599/12384 [3:23:43<22:48:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 13%|█▎ | 1600/12384 [3:23:43<22:48:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 13%|█▎ | 1600/12384 [3:23:50<22:48:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.61s]
Epoch 2: 13%|█▎ | 1601/12384 [3:23:50<22:48:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.61s]
Epoch 2: 13%|█▎ | 1601/12384 [3:23:58<22:48:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 2: 13%|█▎ | 1602/12384 [3:23:58<22:55:48, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 2: 13%|█▎ | 1602/12384 [3:24:06<22:55:48, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.72s]
Epoch 2: 13%|█▎ | 1603/12384 [3:24:06<22:52:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.72s]
Epoch 2: 13%|█▎ | 1603/12384 [3:24:13<22:52:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 2: 13%|█▎ | 1604/12384 [3:24:13<22:50:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 2: 13%|█▎ | 1604/12384 [3:24:21<22:50:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 2: 13%|█▎ | 1605/12384 [3:24:21<23:05:56, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 2: 13%|█▎ | 1605/12384 [3:24:29<23:05:56, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 2: 13%|█▎ | 1606/12384 [3:24:29<23:03:13, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 2: 13%|█▎ | 1606/12384 [3:24:36<23:03:13, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 2: 13%|█▎ | 1607/12384 [3:24:36<22:59:01, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 2: 13%|█▎ | 1607/12384 [3:24:44<22:59:01, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.76s]
Epoch 2: 13%|█▎ | 1608/12384 [3:24:44<22:55:58, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.76s]
Epoch 2: 13%|█▎ | 1608/12384 [3:24:52<22:55:58, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 13%|█▎ | 1609/12384 [3:24:52<22:53:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 13%|█▎ | 1609/12384 [3:24:59<22:53:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 13%|█▎ | 1610/12384 [3:24:59<22:50:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 13%|█▎ | 1610/12384 [3:25:07<22:50:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 2: 13%|█▎ | 1611/12384 [3:25:07<22:50:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 2: 13%|█▎ | 1611/12384 [3:25:14<22:50:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.86s]
Epoch 2: 13%|█▎ | 1612/12384 [3:25:14<22:52:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.86s]
Epoch 2: 13%|█▎ | 1612/12384 [3:25:22<22:52:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 2: 13%|█▎ | 1613/12384 [3:25:22<22:49:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 2: 13%|█▎ | 1613/12384 [3:25:30<22:49:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 13%|█▎ | 1614/12384 [3:25:30<22:48:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 13%|█▎ | 1614/12384 [3:25:37<22:48:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 2: 13%|█▎ | 1615/12384 [3:25:37<22:47:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 2: 13%|█▎ | 1615/12384 [3:25:45<22:47:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 2: 13%|█▎ | 1616/12384 [3:25:45<22:48:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 2: 13%|█▎ | 1616/12384 [3:25:53<22:48:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 13%|█▎ | 1617/12384 [3:25:53<22:47:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 13%|█▎ | 1617/12384 [3:26:00<22:47:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 13%|█▎ | 1618/12384 [3:26:00<22:47:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 13%|█▎ | 1618/12384 [3:26:08<22:47:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 13%|█▎ | 1619/12384 [3:26:08<23:02:02, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 13%|█▎ | 1619/12384 [3:26:16<23:02:02, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 13%|█▎ | 1620/12384 [3:26:16<22:55:58, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 13%|█▎ | 1620/12384 [3:26:23<22:55:58, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 2: 13%|█▎ | 1621/12384 [3:26:23<22:55:30, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 2: 13%|█▎ | 1621/12384 [3:26:31<22:55:30, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.63s]
Epoch 2: 13%|█▎ | 1622/12384 [3:26:31<22:55:58, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.63s]
Epoch 2: 13%|█▎ | 1622/12384 [3:26:39<22:55:58, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 2: 13%|█▎ | 1623/12384 [3:26:39<22:54:48, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 2: 13%|█▎ | 1623/12384 [3:26:46<22:54:48, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 13%|█▎ | 1624/12384 [3:26:46<22:54:13, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 13%|█▎ | 1624/12384 [3:26:54<22:54:13, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 13%|█▎ | 1625/12384 [3:26:54<22:51:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 13%|█▎ | 1625/12384 [3:27:02<22:51:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 2: 13%|█▎ | 1626/12384 [3:27:02<22:50:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 2: 13%|█▎ | 1626/12384 [3:27:09<22:50:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 13%|█▎ | 1627/12384 [3:27:09<22:47:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 13%|█▎ | 1627/12384 [3:27:17<22:47:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.97s]
Epoch 2: 13%|█▎ | 1628/12384 [3:27:17<22:45:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.97s]
Epoch 2: 13%|█▎ | 1628/12384 [3:27:24<22:45:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.79s]
Epoch 2: 13%|█▎ | 1629/12384 [3:27:24<22:45:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.79s]
Epoch 2: 13%|█▎ | 1629/12384 [3:27:32<22:45:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.30s]
Epoch 2: 13%|█▎ | 1630/12384 [3:27:32<22:44:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.30s]
Epoch 2: 13%|█▎ | 1630/12384 [3:27:40<22:44:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 2: 13%|█▎ | 1631/12384 [3:27:40<22:43:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 2: 13%|█▎ | 1631/12384 [3:27:48<22:43:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.36s]
Epoch 2: 13%|█▎ | 1632/12384 [3:27:48<23:02:22, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.36s]
Epoch 2: 13%|█▎ | 1632/12384 [3:27:55<23:02:22, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 13%|█▎ | 1633/12384 [3:27:55<22:56:59, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 13%|█▎ | 1633/12384 [3:28:03<22:56:59, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=5.52s]
Epoch 2: 13%|█▎ | 1634/12384 [3:28:03<22:52:55, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=5.52s]
Epoch 2: 13%|█▎ | 1634/12384 [3:28:10<22:52:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 2: 13%|█▎ | 1635/12384 [3:28:10<22:50:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 2: 13%|█▎ | 1635/12384 [3:28:18<22:50:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 13%|█▎ | 1636/12384 [3:28:18<22:54:02, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 13%|█▎ | 1636/12384 [3:28:26<22:54:02, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 13%|█▎ | 1637/12384 [3:28:26<22:50:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 13%|█▎ | 1637/12384 [3:28:33<22:50:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 13%|█▎ | 1638/12384 [3:28:33<22:47:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 13%|█▎ | 1638/12384 [3:28:41<22:47:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 13%|█▎ | 1639/12384 [3:28:41<22:45:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 13%|█▎ | 1639/12384 [3:28:49<22:45:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 13%|█▎ | 1640/12384 [3:28:49<22:45:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 13%|█▎ | 1640/12384 [3:28:56<22:45:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.95s]
Epoch 2: 13%|█▎ | 1641/12384 [3:28:56<22:44:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.95s]
Epoch 2: 13%|█▎ | 1641/12384 [3:29:04<22:44:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 2: 13%|█▎ | 1642/12384 [3:29:04<22:43:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 2: 13%|█▎ | 1642/12384 [3:29:11<22:43:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.56s]
Epoch 2: 13%|█▎ | 1643/12384 [3:29:11<22:44:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.56s]
Epoch 2: 13%|█▎ | 1643/12384 [3:29:19<22:44:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.93s]
Epoch 2: 13%|█▎ | 1644/12384 [3:29:19<22:41:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.93s]
Epoch 2: 13%|█▎ | 1644/12384 [3:29:27<22:41:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.60s]
Epoch 2: 13%|█▎ | 1645/12384 [3:29:27<22:55:17, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=11.60s]
Epoch 2: 13%|█▎ | 1645/12384 [3:29:34<22:55:17, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 13%|█▎ | 1646/12384 [3:29:34<22:50:59, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 13%|█▎ | 1646/12384 [3:29:42<22:50:59, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 13%|█▎ | 1647/12384 [3:29:42<22:48:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 13%|█▎ | 1647/12384 [3:29:50<22:48:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 13%|█▎ | 1648/12384 [3:29:50<22:45:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 13%|█▎ | 1648/12384 [3:29:57<22:45:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.15s]
Epoch 2: 13%|█▎ | 1649/12384 [3:29:57<22:42:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.15s]
Epoch 2: 13%|█▎ | 1649/12384 [3:30:05<22:42:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 2: 13%|█▎ | 1650/12384 [3:30:05<22:42:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 2: 13%|█▎ | 1650/12384 [3:30:12<22:42:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 13%|█▎ | 1651/12384 [3:30:12<22:41:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 13%|█▎ | 1651/12384 [3:30:20<22:41:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 13%|█▎ | 1652/12384 [3:30:20<22:40:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 13%|█▎ | 1652/12384 [3:30:28<22:40:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 13%|█▎ | 1653/12384 [3:30:28<22:39:59, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 13%|█▎ | 1653/12384 [3:30:35<22:39:59, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 13%|█▎ | 1654/12384 [3:30:35<22:40:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 13%|█▎ | 1654/12384 [3:30:43<22:40:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 13%|█▎ | 1655/12384 [3:30:43<22:40:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 13%|█▎ | 1655/12384 [3:30:50<22:40:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 13%|█▎ | 1656/12384 [3:30:50<22:40:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 13%|█▎ | 1656/12384 [3:30:58<22:40:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.35s]
Epoch 2: 13%|█▎ | 1657/12384 [3:30:58<22:41:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.35s]
Epoch 2: 13%|█▎ | 1657/12384 [3:31:06<22:41:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 2: 13%|█▎ | 1658/12384 [3:31:06<22:58:32, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 2: 13%|█▎ | 1658/12384 [3:31:14<22:58:32, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.67s]
Epoch 2: 13%|█▎ | 1659/12384 [3:31:14<22:58:31, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.67s]
Epoch 2: 13%|█▎ | 1659/12384 [3:31:21<22:58:31, 7.71s/it, loss=0.0001, acc=0.9992, iter_time=10.78s]
Epoch 2: 13%|█▎ | 1660/12384 [3:31:21<22:53:45, 7.69s/it, loss=0.0001, acc=0.9992, iter_time=10.78s]
Epoch 2: 13%|█▎ | 1660/12384 [3:31:29<22:53:45, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 13%|█▎ | 1661/12384 [3:31:29<22:49:12, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 13%|█▎ | 1661/12384 [3:31:37<22:49:12, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 13%|█▎ | 1662/12384 [3:31:37<22:46:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 13%|█▎ | 1662/12384 [3:31:44<22:46:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 13%|█▎ | 1663/12384 [3:31:44<22:45:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 13%|█▎ | 1663/12384 [3:31:52<22:45:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 13%|█▎ | 1664/12384 [3:31:52<22:44:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 13%|█▎ | 1664/12384 [3:31:59<22:44:08, 7.64s/it, loss=0.0001, acc=0.9996, iter_time=7.66s]
Epoch 2: 13%|█▎ | 1665/12384 [3:31:59<22:44:29, 7.64s/it, loss=0.0001, acc=0.9996, iter_time=7.66s]
Epoch 2: 13%|█▎ | 1665/12384 [3:32:07<22:44:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.37s]
Epoch 2: 13%|█▎ | 1666/12384 [3:32:07<22:40:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.37s]
Epoch 2: 13%|█▎ | 1666/12384 [3:32:15<22:40:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 2: 13%|█▎ | 1667/12384 [3:32:15<22:41:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 2: 13%|█▎ | 1667/12384 [3:32:22<22:41:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 2: 13%|█▎ | 1668/12384 [3:32:22<22:42:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 2: 13%|█▎ | 1668/12384 [3:32:30<22:42:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 13%|█▎ | 1669/12384 [3:32:30<22:40:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 13%|█▎ | 1669/12384 [3:32:38<22:40:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 2: 13%|█▎ | 1670/12384 [3:32:38<22:38:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 2: 13%|█▎ | 1670/12384 [3:32:45<22:38:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 2: 13%|█▎ | 1671/12384 [3:32:45<22:55:40, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 2: 13%|█▎ | 1671/12384 [3:32:53<22:55:40, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 14%|█▎ | 1672/12384 [3:32:53<22:54:02, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 14%|█▎ | 1672/12384 [3:33:01<22:54:02, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 14%|█▎ | 1673/12384 [3:33:01<22:48:46, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 14%|█▎ | 1673/12384 [3:33:08<22:48:46, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 14%|█▎ | 1674/12384 [3:33:08<22:44:58, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 14%|█▎ | 1674/12384 [3:33:16<22:44:58, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 14%|█▎ | 1675/12384 [3:33:16<22:42:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 14%|█▎ | 1675/12384 [3:33:24<22:42:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 14%|█▎ | 1676/12384 [3:33:24<22:43:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 14%|█▎ | 1676/12384 [3:33:31<22:43:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 14%|█▎ | 1677/12384 [3:33:31<22:41:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 14%|█▎ | 1677/12384 [3:33:39<22:41:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 2: 14%|█▎ | 1678/12384 [3:33:39<22:41:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 2: 14%|█▎ | 1678/12384 [3:33:46<22:41:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 2: 14%|█▎ | 1679/12384 [3:33:46<22:45:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 2: 14%|█▎ | 1679/12384 [3:33:54<22:45:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 2: 14%|█▎ | 1680/12384 [3:33:54<22:43:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 2: 14%|█▎ | 1680/12384 [3:34:02<22:43:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.93s]
Epoch 2: 14%|█▎ | 1681/12384 [3:34:02<22:41:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.93s]
Epoch 2: 14%|█▎ | 1681/12384 [3:34:09<22:41:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.31s]
Epoch 2: 14%|█▎ | 1682/12384 [3:34:09<22:39:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.31s]
Epoch 2: 14%|█▎ | 1682/12384 [3:34:17<22:39:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 14%|█▎ | 1683/12384 [3:34:17<22:38:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 14%|█▎ | 1683/12384 [3:34:25<22:38:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 14%|█▎ | 1684/12384 [3:34:25<22:37:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 14%|█▎ | 1684/12384 [3:34:33<22:37:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 2: 14%|█▎ | 1685/12384 [3:34:33<22:59:24, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 2: 14%|█▎ | 1685/12384 [3:34:40<22:59:24, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 2: 14%|█▎ | 1686/12384 [3:34:40<22:51:59, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 2: 14%|█▎ | 1686/12384 [3:34:48<22:51:59, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 14%|█▎ | 1687/12384 [3:34:48<22:46:46, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 14%|█▎ | 1687/12384 [3:34:55<22:46:46, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 14%|█▎ | 1688/12384 [3:34:55<22:44:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 14%|█▎ | 1688/12384 [3:35:03<22:44:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 2: 14%|█▎ | 1689/12384 [3:35:03<22:42:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 2: 14%|█▎ | 1689/12384 [3:35:11<22:42:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 2: 14%|█▎ | 1690/12384 [3:35:11<22:39:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 2: 14%|█▎ | 1690/12384 [3:35:18<22:39:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 14%|█▎ | 1691/12384 [3:35:18<22:37:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 14%|█▎ | 1691/12384 [3:35:26<22:37:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 14%|█▎ | 1692/12384 [3:35:26<22:39:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 14%|█▎ | 1692/12384 [3:35:33<22:39:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 2: 14%|█▎ | 1693/12384 [3:35:33<22:41:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 2: 14%|█▎ | 1693/12384 [3:35:41<22:41:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 14%|█▎ | 1694/12384 [3:35:41<22:41:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 14%|█▎ | 1694/12384 [3:35:49<22:41:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 2: 14%|█▎ | 1695/12384 [3:35:49<22:37:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 2: 14%|█▎ | 1695/12384 [3:35:56<22:37:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.75s]
Epoch 2: 14%|█▎ | 1696/12384 [3:35:56<22:43:53, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.75s]
Epoch 2: 14%|█▎ | 1696/12384 [3:36:04<22:43:53, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 2: 14%|█▎ | 1697/12384 [3:36:04<22:55:19, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 2: 14%|█▎ | 1697/12384 [3:36:12<22:55:19, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 2: 14%|█▎ | 1698/12384 [3:36:12<22:51:50, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 2: 14%|█▎ | 1698/12384 [3:36:20<22:51:50, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.23s]
Epoch 2: 14%|█▎ | 1699/12384 [3:36:20<22:46:52, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.23s]
Epoch 2: 14%|█▎ | 1699/12384 [3:36:27<22:46:52, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 2: 14%|█▎ | 1700/12384 [3:36:27<22:43:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 2: 14%|█▎ | 1700/12384 [3:36:35<22:43:05, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 2: 14%|█▎ | 1701/12384 [3:36:35<22:40:31, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 2: 14%|█▎ | 1701/12384 [3:36:42<22:40:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 14%|█▎ | 1702/12384 [3:36:42<22:39:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 14%|█▎ | 1702/12384 [3:36:50<22:39:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 2: 14%|█▍ | 1703/12384 [3:36:50<22:43:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 2: 14%|█▍ | 1703/12384 [3:36:58<22:43:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 2: 14%|█▍ | 1704/12384 [3:36:58<22:40:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 2: 14%|█▍ | 1704/12384 [3:37:05<22:40:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.91s]
Epoch 2: 14%|█▍ | 1705/12384 [3:37:05<22:37:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.91s]
Epoch 2: 14%|█▍ | 1705/12384 [3:37:13<22:37:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.80s]
Epoch 2: 14%|█▍ | 1706/12384 [3:37:13<22:36:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.80s]
Epoch 2: 14%|█▍ | 1706/12384 [3:37:21<22:36:34, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.71s]
Epoch 2: 14%|█▍ | 1707/12384 [3:37:21<22:38:16, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.71s]
Epoch 2: 14%|█▍ | 1707/12384 [3:37:28<22:38:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.63s]
Epoch 2: 14%|█▍ | 1708/12384 [3:37:28<22:36:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.63s]
Epoch 2: 14%|█▍ | 1708/12384 [3:37:36<22:36:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 2: 14%|█▍ | 1709/12384 [3:37:36<22:41:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 2: 14%|█▍ | 1709/12384 [3:37:44<22:41:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 2: 14%|█▍ | 1710/12384 [3:37:44<22:39:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 2: 14%|█▍ | 1710/12384 [3:37:51<22:39:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 2: 14%|█▍ | 1711/12384 [3:37:51<22:54:30, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 2: 14%|█▍ | 1711/12384 [3:37:59<22:54:30, 7.73s/it, loss=0.0001, acc=1.0000, iter_time=7.85s]
Epoch 2: 14%|█▍ | 1712/12384 [3:37:59<22:47:55, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.85s]
Epoch 2: 14%|█▍ | 1712/12384 [3:38:07<22:47:55, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 2: 14%|█▍ | 1713/12384 [3:38:07<22:43:45, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 2: 14%|█▍ | 1713/12384 [3:38:14<22:43:45, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 2: 14%|█▍ | 1714/12384 [3:38:14<22:40:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 2: 14%|█▍ | 1714/12384 [3:38:22<22:40:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 14%|█▍ | 1715/12384 [3:38:22<22:37:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 14%|█▍ | 1715/12384 [3:38:30<22:37:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 14%|█▍ | 1716/12384 [3:38:30<22:36:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 14%|█▍ | 1716/12384 [3:38:37<22:36:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 14%|█▍ | 1717/12384 [3:38:37<22:36:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 14%|█▍ | 1717/12384 [3:38:45<22:36:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 14%|█▍ | 1718/12384 [3:38:45<22:34:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 14%|█▍ | 1718/12384 [3:38:52<22:34:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 14%|█▍ | 1719/12384 [3:38:52<22:35:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 14%|█▍ | 1719/12384 [3:39:00<22:35:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 14%|█▍ | 1720/12384 [3:39:00<22:34:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 14%|█▍ | 1720/12384 [3:39:08<22:34:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 14%|█▍ | 1721/12384 [3:39:08<22:33:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 14%|█▍ | 1721/12384 [3:39:15<22:33:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 14%|█▍ | 1722/12384 [3:39:15<22:33:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 14%|█▍ | 1722/12384 [3:39:23<22:33:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.78s]
Epoch 2: 14%|█▍ | 1723/12384 [3:39:23<22:33:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.78s]
Epoch 2: 14%|█▍ | 1723/12384 [3:39:30<22:33:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 2: 14%|█▍ | 1724/12384 [3:39:30<22:32:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 2: 14%|█▍ | 1724/12384 [3:39:38<22:32:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 14%|█▍ | 1725/12384 [3:39:38<22:32:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 14%|█▍ | 1725/12384 [3:39:46<22:32:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 14%|█▍ | 1726/12384 [3:39:46<22:31:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 14%|█▍ | 1726/12384 [3:39:53<22:31:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 2: 14%|█▍ | 1727/12384 [3:39:53<22:31:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 2: 14%|█▍ | 1727/12384 [3:40:01<22:31:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.94s]
Epoch 2: 14%|█▍ | 1728/12384 [3:40:01<22:31:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.94s]
Epoch 2: 14%|█▍ | 1728/12384 [3:40:08<22:31:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.02s]
Epoch 2: 14%|█▍ | 1729/12384 [3:40:08<22:29:04, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.02s]
Epoch 2: 14%|█▍ | 1729/12384 [3:40:16<22:29:04, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 2: 14%|█▍ | 1730/12384 [3:40:16<22:29:10, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 2: 14%|█▍ | 1730/12384 [3:40:24<22:29:10, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 14%|█▍ | 1731/12384 [3:40:24<22:34:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 14%|█▍ | 1731/12384 [3:40:31<22:34:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 14%|█▍ | 1732/12384 [3:40:32<22:45:06, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 14%|█▍ | 1732/12384 [3:40:39<22:45:06, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 2: 14%|█▍ | 1733/12384 [3:40:39<22:40:12, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 2: 14%|█▍ | 1733/12384 [3:40:47<22:40:12, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 14%|█▍ | 1734/12384 [3:40:47<22:39:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 14%|█▍ | 1734/12384 [3:40:54<22:39:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.52s]
Epoch 2: 14%|█▍ | 1735/12384 [3:40:54<22:36:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.52s]
Epoch 2: 14%|█▍ | 1735/12384 [3:41:02<22:36:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.72s]
Epoch 2: 14%|█▍ | 1736/12384 [3:41:02<22:35:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.72s]
Epoch 2: 14%|█▍ | 1736/12384 [3:41:10<22:35:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.35s]
Epoch 2: 14%|█▍ | 1737/12384 [3:41:10<22:49:37, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.35s]
Epoch 2: 14%|█▍ | 1737/12384 [3:41:18<22:49:37, 7.72s/it, loss=0.0002, acc=1.0000, iter_time=5.74s]
Epoch 2: 14%|█▍ | 1738/12384 [3:41:18<22:43:22, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=5.74s]
Epoch 2: 14%|█▍ | 1738/12384 [3:41:25<22:43:22, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.66s]
Epoch 2: 14%|█▍ | 1739/12384 [3:41:25<22:40:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.66s]
Epoch 2: 14%|█▍ | 1739/12384 [3:41:33<22:40:15, 7.67s/it, loss=0.0005, acc=0.9976, iter_time=7.62s]
Epoch 2: 14%|█▍ | 1740/12384 [3:41:33<22:37:29, 7.65s/it, loss=0.0005, acc=0.9976, iter_time=7.62s]
Epoch 2: 14%|█▍ | 1740/12384 [3:41:40<22:37:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.12s]
Epoch 2: 14%|█▍ | 1741/12384 [3:41:40<22:35:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.12s]
Epoch 2: 14%|█▍ | 1741/12384 [3:41:48<22:35:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 2: 14%|█▍ | 1742/12384 [3:41:48<22:33:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 2: 14%|█▍ | 1742/12384 [3:41:56<22:33:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 14%|█▍ | 1743/12384 [3:41:56<22:35:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 14%|█▍ | 1743/12384 [3:42:03<22:35:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 2: 14%|█▍ | 1744/12384 [3:42:03<22:33:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 2: 14%|█▍ | 1744/12384 [3:42:11<22:33:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 14%|█▍ | 1745/12384 [3:42:11<22:32:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 14%|█▍ | 1745/12384 [3:42:19<22:32:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 14%|█▍ | 1746/12384 [3:42:19<22:31:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 14%|█▍ | 1746/12384 [3:42:26<22:31:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 14%|█▍ | 1747/12384 [3:42:26<22:30:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 14%|█▍ | 1747/12384 [3:42:34<22:30:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.37s]
Epoch 2: 14%|█▍ | 1748/12384 [3:42:34<22:31:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.37s]
Epoch 2: 14%|█▍ | 1748/12384 [3:42:41<22:31:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 2: 14%|█▍ | 1749/12384 [3:42:41<22:30:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 2: 14%|█▍ | 1749/12384 [3:42:49<22:30:06, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.46s]
Epoch 2: 14%|█▍ | 1750/12384 [3:42:49<22:28:33, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.46s]
Epoch 2: 14%|█▍ | 1750/12384 [3:42:57<22:28:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 2: 14%|█▍ | 1751/12384 [3:42:57<22:26:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 2: 14%|█▍ | 1751/12384 [3:43:04<22:26:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 14%|█▍ | 1752/12384 [3:43:04<22:26:29, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 14%|█▍ | 1752/12384 [3:43:12<22:26:29, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.26s]
Epoch 2: 14%|█▍ | 1753/12384 [3:43:12<22:31:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.26s]
Epoch 2: 14%|█▍ | 1753/12384 [3:43:19<22:31:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.44s]
Epoch 2: 14%|█▍ | 1754/12384 [3:43:19<22:30:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.44s]
Epoch 2: 14%|█▍ | 1754/12384 [3:43:27<22:30:56, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.81s]
Epoch 2: 14%|█▍ | 1755/12384 [3:43:27<22:29:39, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.81s]
Epoch 2: 14%|█▍ | 1755/12384 [3:43:35<22:29:39, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.49s]
Epoch 2: 14%|█▍ | 1756/12384 [3:43:35<22:29:07, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.49s]
Epoch 2: 14%|█▍ | 1756/12384 [3:43:42<22:29:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 2: 14%|█▍ | 1757/12384 [3:43:42<22:29:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 2: 14%|█▍ | 1757/12384 [3:43:50<22:29:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 14%|█▍ | 1758/12384 [3:43:50<22:32:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 14%|█▍ | 1758/12384 [3:43:58<22:32:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 14%|█▍ | 1759/12384 [3:43:58<22:30:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 14%|█▍ | 1759/12384 [3:44:05<22:30:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 14%|█▍ | 1760/12384 [3:44:05<22:28:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 14%|█▍ | 1760/12384 [3:44:13<22:28:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 14%|█▍ | 1761/12384 [3:44:13<22:27:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 14%|█▍ | 1761/12384 [3:44:20<22:27:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 14%|█▍ | 1762/12384 [3:44:20<22:25:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 14%|█▍ | 1762/12384 [3:44:28<22:25:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 2: 14%|█▍ | 1763/12384 [3:44:28<22:44:47, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 2: 14%|█▍ | 1763/12384 [3:44:36<22:44:47, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 2: 14%|█▍ | 1764/12384 [3:44:36<22:39:19, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 2: 14%|█▍ | 1764/12384 [3:44:44<22:39:19, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 14%|█▍ | 1765/12384 [3:44:44<22:34:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 14%|█▍ | 1765/12384 [3:44:51<22:34:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 2: 14%|█▍ | 1766/12384 [3:44:51<22:32:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 2: 14%|█▍ | 1766/12384 [3:44:59<22:32:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 2: 14%|█▍ | 1767/12384 [3:44:59<22:30:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 2: 14%|█▍ | 1767/12384 [3:45:06<22:30:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.63s]
Epoch 2: 14%|█▍ | 1768/12384 [3:45:06<22:28:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.63s]
Epoch 2: 14%|█▍ | 1768/12384 [3:45:14<22:28:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 14%|█▍ | 1769/12384 [3:45:14<22:27:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 14%|█▍ | 1769/12384 [3:45:22<22:27:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 14%|█▍ | 1770/12384 [3:45:22<22:26:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 14%|█▍ | 1770/12384 [3:45:29<22:26:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 14%|█▍ | 1771/12384 [3:45:29<22:27:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 14%|█▍ | 1771/12384 [3:45:37<22:27:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 14%|█▍ | 1772/12384 [3:45:37<22:27:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 14%|█▍ | 1772/12384 [3:45:44<22:27:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 2: 14%|█▍ | 1773/12384 [3:45:44<22:25:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 2: 14%|█▍ | 1773/12384 [3:45:52<22:25:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 2: 14%|█▍ | 1774/12384 [3:45:52<22:31:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 2: 14%|█▍ | 1774/12384 [3:46:00<22:31:21, 7.64s/it, loss=0.0001, acc=0.9995, iter_time=4.30s]
Epoch 2: 14%|█▍ | 1775/12384 [3:46:00<22:28:48, 7.63s/it, loss=0.0001, acc=0.9995, iter_time=4.30s]
Epoch 2: 14%|█▍ | 1775/12384 [3:46:07<22:28:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.84s]
Epoch 2: 14%|█▍ | 1776/12384 [3:46:07<22:27:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.84s]
Epoch 2: 14%|█▍ | 1776/12384 [3:46:15<22:27:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 2: 14%|█▍ | 1777/12384 [3:46:15<22:41:34, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 2: 14%|█▍ | 1777/12384 [3:46:23<22:41:34, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 14%|█▍ | 1778/12384 [3:46:23<22:36:18, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 14%|█▍ | 1778/12384 [3:46:30<22:36:18, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 2: 14%|█▍ | 1779/12384 [3:46:30<22:33:08, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 2: 14%|█▍ | 1779/12384 [3:46:38<22:33:08, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 2: 14%|█▍ | 1780/12384 [3:46:38<22:29:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 2: 14%|█▍ | 1780/12384 [3:46:46<22:29:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 14%|█▍ | 1781/12384 [3:46:46<22:27:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 14%|█▍ | 1781/12384 [3:46:53<22:27:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 14%|█▍ | 1782/12384 [3:46:53<22:26:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 14%|█▍ | 1782/12384 [3:47:01<22:26:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 14%|█▍ | 1783/12384 [3:47:01<22:25:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 14%|█▍ | 1783/12384 [3:47:09<22:25:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 14%|█▍ | 1784/12384 [3:47:09<22:30:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 14%|█▍ | 1784/12384 [3:47:16<22:30:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 2: 14%|█▍ | 1785/12384 [3:47:16<22:27:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 2: 14%|█▍ | 1785/12384 [3:47:24<22:27:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 2: 14%|█▍ | 1786/12384 [3:47:24<22:27:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 2: 14%|█▍ | 1786/12384 [3:47:31<22:27:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 2: 14%|█▍ | 1787/12384 [3:47:31<22:26:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 2: 14%|█▍ | 1787/12384 [3:47:39<22:26:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.79s]
Epoch 2: 14%|█▍ | 1788/12384 [3:47:39<22:26:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.79s]
Epoch 2: 14%|█▍ | 1788/12384 [3:47:47<22:26:28, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=9.10s]
Epoch 2: 14%|█▍ | 1789/12384 [3:47:47<22:41:27, 7.71s/it, loss=0.0002, acc=1.0000, iter_time=9.10s]
Epoch 2: 14%|█▍ | 1789/12384 [3:47:55<22:41:27, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.94s]
Epoch 2: 14%|█▍ | 1790/12384 [3:47:55<22:40:46, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.94s]
Epoch 2: 14%|█▍ | 1790/12384 [3:48:02<22:40:46, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 2: 14%|█▍ | 1791/12384 [3:48:02<22:35:46, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 2: 14%|█▍ | 1791/12384 [3:48:10<22:35:46, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.55s]
Epoch 2: 14%|█▍ | 1792/12384 [3:48:10<22:32:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.55s]
Epoch 2: 14%|█▍ | 1792/12384 [3:48:17<22:32:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 2: 14%|█▍ | 1793/12384 [3:48:17<22:30:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 2: 14%|█▍ | 1793/12384 [3:48:25<22:30:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 2: 14%|█▍ | 1794/12384 [3:48:25<22:27:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 2: 14%|█▍ | 1794/12384 [3:48:33<22:27:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 14%|█▍ | 1795/12384 [3:48:33<22:27:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 14%|█▍ | 1795/12384 [3:48:40<22:27:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 15%|█▍ | 1796/12384 [3:48:40<22:28:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 15%|█▍ | 1796/12384 [3:48:48<22:28:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 2: 15%|█▍ | 1797/12384 [3:48:48<22:26:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 2: 15%|█▍ | 1797/12384 [3:48:56<22:26:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 2: 15%|█▍ | 1798/12384 [3:48:56<22:25:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 2: 15%|█▍ | 1798/12384 [3:49:03<22:25:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 15%|█▍ | 1799/12384 [3:49:03<22:24:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 15%|█▍ | 1799/12384 [3:49:11<22:24:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 15%|█▍ | 1800/12384 [3:49:11<22:23:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 15%|█▍ | 1800/12384 [3:49:18<22:23:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 15%|█▍ | 1801/12384 [3:49:18<22:22:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 15%|█▍ | 1801/12384 [3:49:26<22:22:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.42s]
Epoch 2: 15%|█▍ | 1802/12384 [3:49:26<22:23:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.42s]
Epoch 2: 15%|█▍ | 1802/12384 [3:49:34<22:23:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.35s]
Epoch 2: 15%|█▍ | 1803/12384 [3:49:34<22:21:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.35s]
Epoch 2: 15%|█▍ | 1803/12384 [3:49:41<22:21:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.30s]
Epoch 2: 15%|█▍ | 1804/12384 [3:49:41<22:33:31, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.30s]
Epoch 2: 15%|█▍ | 1804/12384 [3:49:49<22:33:31, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 15%|█▍ | 1805/12384 [3:49:49<22:32:50, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 15%|█▍ | 1805/12384 [3:49:57<22:32:50, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 15%|█▍ | 1806/12384 [3:49:57<22:28:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 15%|█▍ | 1806/12384 [3:50:04<22:28:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 15%|█▍ | 1807/12384 [3:50:04<22:26:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 15%|█▍ | 1807/12384 [3:50:12<22:26:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 15%|█▍ | 1808/12384 [3:50:12<22:23:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 15%|█▍ | 1808/12384 [3:50:19<22:23:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 2: 15%|█▍ | 1809/12384 [3:50:19<22:22:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 2: 15%|█▍ | 1809/12384 [3:50:27<22:22:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 2: 15%|█▍ | 1810/12384 [3:50:27<22:20:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 2: 15%|█▍ | 1810/12384 [3:50:35<22:20:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.60s]
Epoch 2: 15%|█▍ | 1811/12384 [3:50:35<22:19:17, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.60s]
Epoch 2: 15%|█▍ | 1811/12384 [3:50:42<22:19:17, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 15%|█▍ | 1812/12384 [3:50:42<22:17:44, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 15%|█▍ | 1812/12384 [3:50:50<22:17:44, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 15%|█▍ | 1813/12384 [3:50:50<22:17:39, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 15%|█▍ | 1813/12384 [3:50:57<22:17:39, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 2: 15%|█▍ | 1814/12384 [3:50:57<22:17:38, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 2: 15%|█▍ | 1814/12384 [3:51:05<22:17:38, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 2: 15%|█▍ | 1815/12384 [3:51:05<22:16:21, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 2: 15%|█▍ | 1815/12384 [3:51:13<22:16:21, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=10.88s]
Epoch 2: 15%|█▍ | 1816/12384 [3:51:13<22:33:16, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.88s]
Epoch 2: 15%|█▍ | 1816/12384 [3:51:20<22:33:16, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 15%|█▍ | 1817/12384 [3:51:20<22:28:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 15%|█▍ | 1817/12384 [3:51:28<22:28:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 2: 15%|█▍ | 1818/12384 [3:51:28<22:25:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 2: 15%|█▍ | 1818/12384 [3:51:36<22:25:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 2: 15%|█▍ | 1819/12384 [3:51:36<22:24:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 2: 15%|█▍ | 1819/12384 [3:51:43<22:24:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 15%|█▍ | 1820/12384 [3:51:43<22:22:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 15%|█▍ | 1820/12384 [3:51:51<22:22:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 15%|█▍ | 1821/12384 [3:51:51<22:20:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 15%|█▍ | 1821/12384 [3:51:59<22:20:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 15%|█▍ | 1822/12384 [3:51:59<22:20:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 15%|█▍ | 1822/12384 [3:52:06<22:20:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.01s]
Epoch 2: 15%|█▍ | 1823/12384 [3:52:06<22:19:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.01s]
Epoch 2: 15%|█▍ | 1823/12384 [3:52:14<22:19:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.60s]
Epoch 2: 15%|█▍ | 1824/12384 [3:52:14<22:21:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.60s]
Epoch 2: 15%|█▍ | 1824/12384 [3:52:21<22:21:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 15%|█▍ | 1825/12384 [3:52:21<22:20:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 15%|█▍ | 1825/12384 [3:52:29<22:20:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 15%|█▍ | 1826/12384 [3:52:29<22:19:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 15%|█▍ | 1826/12384 [3:52:37<22:19:01, 7.61s/it, loss=0.0008, acc=0.9979, iter_time=7.61s]
Epoch 2: 15%|█▍ | 1827/12384 [3:52:37<22:19:39, 7.61s/it, loss=0.0008, acc=0.9979, iter_time=7.61s]
Epoch 2: 15%|█▍ | 1827/12384 [3:52:44<22:19:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 2: 15%|█▍ | 1828/12384 [3:52:44<22:19:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 2: 15%|█▍ | 1828/12384 [3:52:52<22:19:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 2: 15%|█▍ | 1829/12384 [3:52:52<22:23:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 2: 15%|█▍ | 1829/12384 [3:53:00<22:23:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.78s]
Epoch 2: 15%|█▍ | 1830/12384 [3:53:00<22:21:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.78s]
Epoch 2: 15%|█▍ | 1830/12384 [3:53:07<22:21:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 15%|█▍ | 1831/12384 [3:53:07<22:20:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 15%|█▍ | 1831/12384 [3:53:15<22:20:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.98s]
Epoch 2: 15%|█▍ | 1832/12384 [3:53:15<22:20:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.98s]
Epoch 2: 15%|█▍ | 1832/12384 [3:53:22<22:20:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.26s]
Epoch 2: 15%|█▍ | 1833/12384 [3:53:22<22:20:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.26s]
Epoch 2: 15%|█▍ | 1833/12384 [3:53:30<22:20:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 2: 15%|█▍ | 1834/12384 [3:53:30<22:21:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 2: 15%|█▍ | 1834/12384 [3:53:38<22:21:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 2: 15%|█▍ | 1835/12384 [3:53:38<22:20:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 2: 15%|█▍ | 1835/12384 [3:53:45<22:20:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.18s]
Epoch 2: 15%|█▍ | 1836/12384 [3:53:45<22:20:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.18s]
Epoch 2: 15%|█▍ | 1836/12384 [3:53:53<22:20:12, 7.62s/it, loss=0.0012, acc=0.9985, iter_time=12.37s]
Epoch 2: 15%|█▍ | 1837/12384 [3:53:53<22:19:48, 7.62s/it, loss=0.0012, acc=0.9985, iter_time=12.37s]
Epoch 2: 15%|█▍ | 1837/12384 [3:54:00<22:19:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 15%|█▍ | 1838/12384 [3:54:00<22:19:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 15%|█▍ | 1838/12384 [3:54:08<22:19:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 2: 15%|█▍ | 1839/12384 [3:54:08<22:17:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 2: 15%|█▍ | 1839/12384 [3:54:16<22:17:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 2: 15%|█▍ | 1840/12384 [3:54:16<22:17:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 2: 15%|█▍ | 1840/12384 [3:54:23<22:17:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 15%|█▍ | 1841/12384 [3:54:23<22:20:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 15%|█▍ | 1841/12384 [3:54:31<22:20:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 15%|█▍ | 1842/12384 [3:54:31<22:37:26, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 15%|█▍ | 1842/12384 [3:54:39<22:37:26, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 15%|█▍ | 1843/12384 [3:54:39<22:30:55, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 15%|█▍ | 1843/12384 [3:54:47<22:30:55, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 2: 15%|█▍ | 1844/12384 [3:54:47<22:27:21, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 2: 15%|█▍ | 1844/12384 [3:54:54<22:27:21, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 2: 15%|█▍ | 1845/12384 [3:54:54<22:23:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 2: 15%|█▍ | 1845/12384 [3:55:02<22:23:02, 7.65s/it, loss=0.0002, acc=0.9990, iter_time=10.89s]
Epoch 2: 15%|█▍ | 1846/12384 [3:55:02<22:21:32, 7.64s/it, loss=0.0002, acc=0.9990, iter_time=10.89s]
Epoch 2: 15%|█▍ | 1846/12384 [3:55:09<22:21:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 2: 15%|█▍ | 1847/12384 [3:55:09<22:19:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 2: 15%|█▍ | 1847/12384 [3:55:17<22:19:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 2: 15%|█▍ | 1848/12384 [3:55:17<22:18:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 2: 15%|█▍ | 1848/12384 [3:55:25<22:18:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 2: 15%|█▍ | 1849/12384 [3:55:25<22:17:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 2: 15%|█▍ | 1849/12384 [3:55:32<22:17:58, 7.62s/it, loss=0.0008, acc=1.0000, iter_time=7.83s]
Epoch 2: 15%|█▍ | 1850/12384 [3:55:32<22:17:13, 7.62s/it, loss=0.0008, acc=1.0000, iter_time=7.83s]
Epoch 2: 15%|█▍ | 1850/12384 [3:55:40<22:17:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 15%|█▍ | 1851/12384 [3:55:40<22:17:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 15%|█▍ | 1851/12384 [3:55:47<22:17:03, 7.62s/it, loss=0.0001, acc=0.9989, iter_time=7.61s]
Epoch 2: 15%|█▍ | 1852/12384 [3:55:47<22:16:32, 7.61s/it, loss=0.0001, acc=0.9989, iter_time=7.61s]
Epoch 2: 15%|█▍ | 1852/12384 [3:55:55<22:16:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 2: 15%|█▍ | 1853/12384 [3:55:55<22:17:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 2: 15%|█▍ | 1853/12384 [3:56:03<22:17:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.92s]
Epoch 2: 15%|█▍ | 1854/12384 [3:56:03<22:17:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.92s]
Epoch 2: 15%|█▍ | 1854/12384 [3:56:10<22:17:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.23s]
Epoch 2: 15%|█▍ | 1855/12384 [3:56:10<22:15:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.23s]
Epoch 2: 15%|█▍ | 1855/12384 [3:56:18<22:15:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.70s]
Epoch 2: 15%|█▍ | 1856/12384 [3:56:18<22:31:56, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=11.70s]
Epoch 2: 15%|█▍ | 1856/12384 [3:56:26<22:31:56, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 2: 15%|█▍ | 1857/12384 [3:56:26<22:34:47, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 2: 15%|█▍ | 1857/12384 [3:56:34<22:34:47, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 15%|█▌ | 1858/12384 [3:56:34<22:29:29, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 15%|█▌ | 1858/12384 [3:56:41<22:29:29, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 15%|█▌ | 1859/12384 [3:56:41<22:24:39, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 15%|█▌ | 1859/12384 [3:56:49<22:24:39, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.53s]
Epoch 2: 15%|█▌ | 1860/12384 [3:56:49<22:23:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.53s]
Epoch 2: 15%|█▌ | 1860/12384 [3:56:56<22:23:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.70s]
Epoch 2: 15%|█▌ | 1861/12384 [3:56:56<22:20:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.70s]
Epoch 2: 15%|█▌ | 1861/12384 [3:57:04<22:20:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 15%|█▌ | 1862/12384 [3:57:04<22:18:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 15%|█▌ | 1862/12384 [3:57:12<22:18:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 15%|█▌ | 1863/12384 [3:57:12<22:17:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 15%|█▌ | 1863/12384 [3:57:19<22:17:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 15%|█▌ | 1864/12384 [3:57:19<22:17:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 15%|█▌ | 1864/12384 [3:57:27<22:17:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.17s]
Epoch 2: 15%|█▌ | 1865/12384 [3:57:27<22:16:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.17s]
Epoch 2: 15%|█▌ | 1865/12384 [3:57:34<22:16:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 2: 15%|█▌ | 1866/12384 [3:57:34<22:15:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 2: 15%|█▌ | 1866/12384 [3:57:42<22:15:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 15%|█▌ | 1867/12384 [3:57:42<22:13:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 15%|█▌ | 1867/12384 [3:57:50<22:13:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 15%|█▌ | 1868/12384 [3:57:50<22:12:51, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 15%|█▌ | 1868/12384 [3:57:58<22:12:51, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 2: 15%|█▌ | 1869/12384 [3:57:58<22:31:01, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 2: 15%|█▌ | 1869/12384 [3:58:05<22:31:01, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 2: 15%|█▌ | 1870/12384 [3:58:05<22:26:18, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 2: 15%|█▌ | 1870/12384 [3:58:13<22:26:18, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 2: 15%|█▌ | 1871/12384 [3:58:13<22:21:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 2: 15%|█▌ | 1871/12384 [3:58:20<22:21:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 15%|█▌ | 1872/12384 [3:58:20<22:18:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 15%|█▌ | 1872/12384 [3:58:28<22:18:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.02s]
Epoch 2: 15%|█▌ | 1873/12384 [3:58:28<22:18:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.02s]
Epoch 2: 15%|█▌ | 1873/12384 [3:58:36<22:18:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 2: 15%|█▌ | 1874/12384 [3:58:36<22:17:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 2: 15%|█▌ | 1874/12384 [3:58:43<22:17:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 15%|█▌ | 1875/12384 [3:58:43<22:15:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 15%|█▌ | 1875/12384 [3:58:51<22:15:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 15%|█▌ | 1876/12384 [3:58:51<22:14:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 15%|█▌ | 1876/12384 [3:58:58<22:14:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 15%|█▌ | 1877/12384 [3:58:58<22:12:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 15%|█▌ | 1877/12384 [3:59:06<22:12:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 15%|█▌ | 1878/12384 [3:59:06<22:11:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 15%|█▌ | 1878/12384 [3:59:14<22:11:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 15%|█▌ | 1879/12384 [3:59:14<22:18:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 15%|█▌ | 1879/12384 [3:59:21<22:18:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 15%|█▌ | 1880/12384 [3:59:21<22:15:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 15%|█▌ | 1880/12384 [3:59:29<22:15:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 2: 15%|█▌ | 1881/12384 [3:59:29<22:13:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 2: 15%|█▌ | 1881/12384 [3:59:37<22:13:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.34s]
Epoch 2: 15%|█▌ | 1882/12384 [3:59:37<22:14:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.34s]
Epoch 2: 15%|█▌ | 1882/12384 [3:59:44<22:14:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.41s]
Epoch 2: 15%|█▌ | 1883/12384 [3:59:44<22:14:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.41s]
Epoch 2: 15%|█▌ | 1883/12384 [3:59:52<22:14:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 2: 15%|█▌ | 1884/12384 [3:59:52<22:13:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 2: 15%|█▌ | 1884/12384 [3:59:59<22:13:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 2: 15%|█▌ | 1885/12384 [3:59:59<22:12:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 2: 15%|█▌ | 1885/12384 [4:00:07<22:12:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.70s]
Epoch 2: 15%|█▌ | 1886/12384 [4:00:07<22:11:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.70s]
Epoch 2: 15%|█▌ | 1886/12384 [4:00:15<22:11:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 2: 15%|█▌ | 1887/12384 [4:00:15<22:12:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 2: 15%|█▌ | 1887/12384 [4:00:22<22:12:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 15%|█▌ | 1888/12384 [4:00:22<22:12:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 15%|█▌ | 1888/12384 [4:00:30<22:12:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.48s]
Epoch 2: 15%|█▌ | 1889/12384 [4:00:30<22:11:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.48s]
Epoch 2: 15%|█▌ | 1889/12384 [4:00:38<22:11:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.21s]
Epoch 2: 15%|█▌ | 1890/12384 [4:00:38<22:10:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.21s]
Epoch 2: 15%|█▌ | 1890/12384 [4:00:45<22:10:42, 7.61s/it, loss=0.0018, acc=0.9961, iter_time=10.73s]
Epoch 2: 15%|█▌ | 1891/12384 [4:00:45<22:09:28, 7.60s/it, loss=0.0018, acc=0.9961, iter_time=10.73s]
Epoch 2: 15%|█▌ | 1891/12384 [4:00:53<22:09:28, 7.60s/it, loss=0.0004, acc=0.9984, iter_time=7.61s]
Epoch 2: 15%|█▌ | 1892/12384 [4:00:53<22:09:25, 7.60s/it, loss=0.0004, acc=0.9984, iter_time=7.61s]
Epoch 2: 15%|█▌ | 1892/12384 [4:01:00<22:09:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 15%|█▌ | 1893/12384 [4:01:00<22:09:12, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 15%|█▌ | 1893/12384 [4:01:08<22:09:12, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 2: 15%|█▌ | 1894/12384 [4:01:08<22:10:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 2: 15%|█▌ | 1894/12384 [4:01:16<22:10:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.43s]
Epoch 2: 15%|█▌ | 1895/12384 [4:01:16<22:30:31, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=10.43s]
Epoch 2: 15%|█▌ | 1895/12384 [4:01:24<22:30:31, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 15%|█▌ | 1896/12384 [4:01:24<22:23:47, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 15%|█▌ | 1896/12384 [4:01:31<22:23:47, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 15%|█▌ | 1897/12384 [4:01:31<22:24:20, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 15%|█▌ | 1897/12384 [4:01:39<22:24:20, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.91s]
Epoch 2: 15%|█▌ | 1898/12384 [4:01:39<22:20:36, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.91s]
Epoch 2: 15%|█▌ | 1898/12384 [4:01:47<22:20:36, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 2: 15%|█▌ | 1899/12384 [4:01:47<22:23:38, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 2: 15%|█▌ | 1899/12384 [4:01:54<22:23:38, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 15%|█▌ | 1900/12384 [4:01:54<22:24:43, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 15%|█▌ | 1900/12384 [4:02:02<22:24:43, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.96s]
Epoch 2: 15%|█▌ | 1901/12384 [4:02:02<22:21:49, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.96s]
Epoch 2: 15%|█▌ | 1901/12384 [4:02:10<22:21:49, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 2: 15%|█▌ | 1902/12384 [4:02:10<22:18:17, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 2: 15%|█▌ | 1902/12384 [4:02:17<22:18:17, 7.66s/it, loss=0.0001, acc=0.9999, iter_time=7.60s]
Epoch 2: 15%|█▌ | 1903/12384 [4:02:17<22:16:09, 7.65s/it, loss=0.0001, acc=0.9999, iter_time=7.60s]
Epoch 2: 15%|█▌ | 1903/12384 [4:02:25<22:16:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 15%|█▌ | 1904/12384 [4:02:25<22:14:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 15%|█▌ | 1904/12384 [4:02:32<22:14:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 15%|█▌ | 1905/12384 [4:02:32<22:12:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 15%|█▌ | 1905/12384 [4:02:40<22:12:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 2: 15%|█▌ | 1906/12384 [4:02:40<22:10:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 2: 15%|█▌ | 1906/12384 [4:02:48<22:10:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 2: 15%|█▌ | 1907/12384 [4:02:48<22:09:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 2: 15%|█▌ | 1907/12384 [4:02:55<22:09:09, 7.61s/it, loss=0.0001, acc=0.9985, iter_time=5.08s]
Epoch 2: 15%|█▌ | 1908/12384 [4:02:55<22:12:58, 7.63s/it, loss=0.0001, acc=0.9985, iter_time=5.08s]
Epoch 2: 15%|█▌ | 1908/12384 [4:03:03<22:12:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 2: 15%|█▌ | 1909/12384 [4:03:03<22:11:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 2: 15%|█▌ | 1909/12384 [4:03:11<22:11:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.61s]
Epoch 2: 15%|█▌ | 1910/12384 [4:03:11<22:09:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.61s]
Epoch 2: 15%|█▌ | 1910/12384 [4:03:18<22:09:55, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.60s]
Epoch 2: 15%|█▌ | 1911/12384 [4:03:18<22:09:14, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.60s]
Epoch 2: 15%|█▌ | 1911/12384 [4:03:26<22:09:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 15%|█▌ | 1912/12384 [4:03:26<22:09:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 15%|█▌ | 1912/12384 [4:03:33<22:09:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 2: 15%|█▌ | 1913/12384 [4:03:33<22:07:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 2: 15%|█▌ | 1913/12384 [4:03:41<22:07:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 2: 15%|█▌ | 1914/12384 [4:03:41<22:07:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 2: 15%|█▌ | 1914/12384 [4:03:49<22:07:55, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 2: 15%|█▌ | 1915/12384 [4:03:49<22:08:21, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 2: 15%|█▌ | 1915/12384 [4:03:56<22:08:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 15%|█▌ | 1916/12384 [4:03:56<22:08:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 15%|█▌ | 1916/12384 [4:04:04<22:08:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 2: 15%|█▌ | 1917/12384 [4:04:04<22:09:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 2: 15%|█▌ | 1917/12384 [4:04:11<22:09:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.15s]
Epoch 2: 15%|█▌ | 1918/12384 [4:04:11<22:09:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.15s]
Epoch 2: 15%|█▌ | 1918/12384 [4:04:19<22:09:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 15%|█▌ | 1919/12384 [4:04:19<22:09:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 15%|█▌ | 1919/12384 [4:04:27<22:09:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 16%|█▌ | 1920/12384 [4:04:27<22:08:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 16%|█▌ | 1920/12384 [4:04:35<22:08:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.37s]
Epoch 2: 16%|█▌ | 1921/12384 [4:04:35<22:33:14, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=5.37s]
Epoch 2: 16%|█▌ | 1921/12384 [4:04:42<22:33:14, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 2: 16%|█▌ | 1922/12384 [4:04:42<22:25:28, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 2: 16%|█▌ | 1922/12384 [4:04:50<22:25:28, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 2: 16%|█▌ | 1923/12384 [4:04:50<22:19:03, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 2: 16%|█▌ | 1923/12384 [4:04:58<22:19:03, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 2: 16%|█▌ | 1924/12384 [4:04:58<22:14:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 2: 16%|█▌ | 1924/12384 [4:05:05<22:14:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 16%|█▌ | 1925/12384 [4:05:05<22:11:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 16%|█▌ | 1925/12384 [4:05:13<22:11:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 16%|█▌ | 1926/12384 [4:05:13<22:10:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 16%|█▌ | 1926/12384 [4:05:20<22:10:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 16%|█▌ | 1927/12384 [4:05:20<22:08:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 16%|█▌ | 1927/12384 [4:05:28<22:08:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 16%|█▌ | 1928/12384 [4:05:28<22:07:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 16%|█▌ | 1928/12384 [4:05:36<22:07:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 16%|█▌ | 1929/12384 [4:05:36<22:08:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 16%|█▌ | 1929/12384 [4:05:43<22:08:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 16%|█▌ | 1930/12384 [4:05:43<22:07:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 16%|█▌ | 1930/12384 [4:05:51<22:07:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 16%|█▌ | 1931/12384 [4:05:51<22:06:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 16%|█▌ | 1931/12384 [4:05:59<22:06:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 2: 16%|█▌ | 1932/12384 [4:05:59<22:22:12, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 2: 16%|█▌ | 1932/12384 [4:06:06<22:22:12, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 16%|█▌ | 1933/12384 [4:06:06<22:17:07, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 16%|█▌ | 1933/12384 [4:06:14<22:17:07, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 2: 16%|█▌ | 1934/12384 [4:06:14<22:13:52, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 2: 16%|█▌ | 1934/12384 [4:06:22<22:13:52, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=11.11s]
Epoch 2: 16%|█▌ | 1935/12384 [4:06:22<22:10:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.11s]
Epoch 2: 16%|█▌ | 1935/12384 [4:06:29<22:10:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 16%|█▌ | 1936/12384 [4:06:29<22:08:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 16%|█▌ | 1936/12384 [4:06:37<22:08:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 16%|█▌ | 1937/12384 [4:06:37<22:06:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 16%|█▌ | 1937/12384 [4:06:44<22:06:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 16%|█▌ | 1938/12384 [4:06:44<22:05:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 16%|█▌ | 1938/12384 [4:06:52<22:05:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 16%|█▌ | 1939/12384 [4:06:52<22:06:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 16%|█▌ | 1939/12384 [4:07:00<22:06:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 2: 16%|█▌ | 1940/12384 [4:07:00<22:06:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 2: 16%|█▌ | 1940/12384 [4:07:07<22:06:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 2: 16%|█▌ | 1941/12384 [4:07:07<22:06:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 2: 16%|█▌ | 1941/12384 [4:07:15<22:06:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 16%|█▌ | 1942/12384 [4:07:15<22:06:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 16%|█▌ | 1942/12384 [4:07:23<22:06:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 16%|█▌ | 1943/12384 [4:07:23<22:10:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 16%|█▌ | 1943/12384 [4:07:30<22:10:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 16%|█▌ | 1944/12384 [4:07:30<22:08:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 16%|█▌ | 1944/12384 [4:07:38<22:08:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 16%|█▌ | 1945/12384 [4:07:38<22:09:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 16%|█▌ | 1945/12384 [4:07:45<22:09:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 16%|█▌ | 1946/12384 [4:07:45<22:08:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 16%|█▌ | 1946/12384 [4:07:53<22:08:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 2: 16%|█▌ | 1947/12384 [4:07:53<22:25:30, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 2: 16%|█▌ | 1947/12384 [4:08:01<22:25:30, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=10.00s]
Epoch 2: 16%|█▌ | 1948/12384 [4:08:01<22:19:15, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.00s]
Epoch 2: 16%|█▌ | 1948/12384 [4:08:09<22:19:15, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 16%|█▌ | 1949/12384 [4:08:09<22:13:58, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 16%|█▌ | 1949/12384 [4:08:16<22:13:58, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 16%|█▌ | 1950/12384 [4:08:16<22:09:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 16%|█▌ | 1950/12384 [4:08:24<22:09:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 16%|█▌ | 1951/12384 [4:08:24<22:07:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 16%|█▌ | 1951/12384 [4:08:31<22:07:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 16%|█▌ | 1952/12384 [4:08:31<22:05:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 16%|█▌ | 1952/12384 [4:08:39<22:05:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 16%|█▌ | 1953/12384 [4:08:39<22:04:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 16%|█▌ | 1953/12384 [4:08:47<22:04:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 2: 16%|█▌ | 1954/12384 [4:08:47<22:04:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 2: 16%|█▌ | 1954/12384 [4:08:54<22:04:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.40s]
Epoch 2: 16%|█▌ | 1955/12384 [4:08:54<22:05:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.40s]
Epoch 2: 16%|█▌ | 1955/12384 [4:09:02<22:05:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.84s]
Epoch 2: 16%|█▌ | 1956/12384 [4:09:02<22:04:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.84s]
Epoch 2: 16%|█▌ | 1956/12384 [4:09:10<22:04:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.42s]
Epoch 2: 16%|█▌ | 1957/12384 [4:09:10<22:06:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.42s]
Epoch 2: 16%|█▌ | 1957/12384 [4:09:17<22:06:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 2: 16%|█▌ | 1958/12384 [4:09:17<22:19:15, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 2: 16%|█▌ | 1958/12384 [4:09:25<22:19:15, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 16%|█▌ | 1959/12384 [4:09:25<22:14:04, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 16%|█▌ | 1959/12384 [4:09:33<22:14:04, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 16%|█▌ | 1960/12384 [4:09:33<22:10:37, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 16%|█▌ | 1960/12384 [4:09:40<22:10:37, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.26s]
Epoch 2: 16%|█▌ | 1961/12384 [4:09:40<22:07:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.26s]
Epoch 2: 16%|█▌ | 1961/12384 [4:09:48<22:07:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.98s]
Epoch 2: 16%|█▌ | 1962/12384 [4:09:48<22:07:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.98s]
Epoch 2: 16%|█▌ | 1962/12384 [4:09:56<22:07:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 16%|█▌ | 1963/12384 [4:09:56<22:05:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 16%|█▌ | 1963/12384 [4:10:03<22:05:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 16%|█▌ | 1964/12384 [4:10:03<22:03:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 16%|█▌ | 1964/12384 [4:10:11<22:03:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 16%|█▌ | 1965/12384 [4:10:11<22:12:12, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 16%|█▌ | 1965/12384 [4:10:19<22:12:12, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 16%|█▌ | 1966/12384 [4:10:19<22:09:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 16%|█▌ | 1966/12384 [4:10:26<22:09:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 2: 16%|█▌ | 1967/12384 [4:10:26<22:05:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 2: 16%|█▌ | 1967/12384 [4:10:34<22:05:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.47s]
Epoch 2: 16%|█▌ | 1968/12384 [4:10:34<22:03:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.47s]
Epoch 2: 16%|█▌ | 1968/12384 [4:10:41<22:03:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 2: 16%|█▌ | 1969/12384 [4:10:41<22:02:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 2: 16%|█▌ | 1969/12384 [4:10:49<22:02:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 16%|█▌ | 1970/12384 [4:10:49<22:02:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 16%|█▌ | 1970/12384 [4:10:57<22:02:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 16%|█▌ | 1971/12384 [4:10:57<22:00:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 16%|█▌ | 1971/12384 [4:11:04<22:00:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 16%|█▌ | 1972/12384 [4:11:04<22:06:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 16%|█▌ | 1972/12384 [4:11:12<22:06:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 16%|█▌ | 1973/12384 [4:11:12<22:23:12, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 16%|█▌ | 1973/12384 [4:11:20<22:23:12, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 16%|█▌ | 1974/12384 [4:11:20<22:15:31, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 16%|█▌ | 1974/12384 [4:11:28<22:15:31, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 2: 16%|█▌ | 1975/12384 [4:11:28<22:14:47, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 2: 16%|█▌ | 1975/12384 [4:11:35<22:14:47, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.85s]
Epoch 2: 16%|█▌ | 1976/12384 [4:11:35<22:10:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.85s]
Epoch 2: 16%|█▌ | 1976/12384 [4:11:43<22:10:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 16%|█▌ | 1977/12384 [4:11:43<22:06:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 16%|█▌ | 1977/12384 [4:11:50<22:06:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 16%|█▌ | 1978/12384 [4:11:50<22:03:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 16%|█▌ | 1978/12384 [4:11:58<22:03:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 16%|█▌ | 1979/12384 [4:11:58<22:02:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 16%|█▌ | 1979/12384 [4:12:06<22:02:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 16%|█▌ | 1980/12384 [4:12:06<22:00:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 16%|█▌ | 1980/12384 [4:12:13<22:00:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 2: 16%|█▌ | 1981/12384 [4:12:13<22:00:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 2: 16%|█▌ | 1981/12384 [4:12:21<22:00:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 16%|█▌ | 1982/12384 [4:12:21<21:59:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 16%|█▌ | 1982/12384 [4:12:28<21:59:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 16%|█▌ | 1983/12384 [4:12:28<21:59:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 16%|█▌ | 1983/12384 [4:12:36<21:59:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 16%|█▌ | 1984/12384 [4:12:36<22:00:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 16%|█▌ | 1984/12384 [4:12:44<22:00:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 16%|█▌ | 1985/12384 [4:12:44<22:13:54, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 16%|█▌ | 1985/12384 [4:12:51<22:13:54, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 2: 16%|█▌ | 1986/12384 [4:12:51<22:08:52, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 2: 16%|█▌ | 1986/12384 [4:12:59<22:08:52, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 2: 16%|█▌ | 1987/12384 [4:12:59<22:05:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 2: 16%|█▌ | 1987/12384 [4:13:07<22:05:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 16%|█▌ | 1988/12384 [4:13:07<22:02:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 16%|█▌ | 1988/12384 [4:13:14<22:02:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 2: 16%|█▌ | 1989/12384 [4:13:14<22:00:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 2: 16%|█▌ | 1989/12384 [4:13:22<22:00:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.44s]
Epoch 2: 16%|█▌ | 1990/12384 [4:13:22<21:59:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.44s]
Epoch 2: 16%|█▌ | 1990/12384 [4:13:29<21:59:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 2: 16%|█▌ | 1991/12384 [4:13:29<21:59:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 2: 16%|█▌ | 1991/12384 [4:13:37<21:59:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.09s]
Epoch 2: 16%|█▌ | 1992/12384 [4:13:37<21:58:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.09s]
Epoch 2: 16%|█▌ | 1992/12384 [4:13:45<21:58:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.46s]
Epoch 2: 16%|█▌ | 1993/12384 [4:13:45<21:57:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.46s]
Epoch 2: 16%|█▌ | 1993/12384 [4:13:52<21:57:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 2: 16%|█▌ | 1994/12384 [4:13:52<21:57:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 2: 16%|█▌ | 1994/12384 [4:14:00<21:57:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 16%|█▌ | 1995/12384 [4:14:00<21:57:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 16%|█▌ | 1995/12384 [4:14:07<21:57:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 16%|█▌ | 1996/12384 [4:14:07<21:56:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 16%|█▌ | 1996/12384 [4:14:15<21:56:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 2: 16%|█▌ | 1997/12384 [4:14:15<21:57:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 2: 16%|█▌ | 1997/12384 [4:14:23<21:57:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.11s]
Epoch 2: 16%|█▌ | 1998/12384 [4:14:23<21:57:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.11s]
Epoch 2: 16%|█▌ | 1998/12384 [4:14:30<21:57:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.40s]
Epoch 2: 16%|█▌ | 1999/12384 [4:14:30<21:58:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.40s]
Epoch 2: 16%|█▌ | 1999/12384 [4:14:38<21:58:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.75s]
Epoch 2: 16%|█▌ | 2000/12384 [4:14:38<22:14:09, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.75s]
Epoch 2: 16%|█▌ | 2000/12384 [4:14:46<22:14:09, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.44s]
Epoch 2: 16%|█▌ | 2001/12384 [4:14:46<22:08:32, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.44s]
Epoch 2: 16%|█▌ | 2001/12384 [4:14:54<22:08:32, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 2: 16%|█▌ | 2002/12384 [4:14:54<22:06:35, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 2: 16%|█▌ | 2002/12384 [4:15:01<22:06:35, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 2: 16%|█▌ | 2003/12384 [4:15:01<22:03:58, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 2: 16%|█▌ | 2003/12384 [4:15:09<22:03:58, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 2: 16%|█▌ | 2004/12384 [4:15:09<22:02:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 2: 16%|█▌ | 2004/12384 [4:15:16<22:02:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 16%|█▌ | 2005/12384 [4:15:16<22:01:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 16%|█▌ | 2005/12384 [4:15:24<22:01:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 2: 16%|█▌ | 2006/12384 [4:15:24<21:59:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 2: 16%|█▌ | 2006/12384 [4:15:32<21:59:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.79s]
Epoch 2: 16%|█▌ | 2007/12384 [4:15:32<21:57:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.79s]
Epoch 2: 16%|█▌ | 2007/12384 [4:15:39<21:57:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 2: 16%|█▌ | 2008/12384 [4:15:39<21:57:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 2: 16%|█▌ | 2008/12384 [4:15:47<21:57:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.19s]
Epoch 2: 16%|█▌ | 2009/12384 [4:15:47<22:00:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.19s]
Epoch 2: 16%|█▌ | 2009/12384 [4:15:55<22:00:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.74s]
Epoch 2: 16%|█▌ | 2010/12384 [4:15:55<21:59:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.74s]
Epoch 2: 16%|█▌ | 2010/12384 [4:16:02<21:59:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 16%|█▌ | 2011/12384 [4:16:02<22:12:06, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 16%|█▌ | 2011/12384 [4:16:10<22:12:06, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.73s]
Epoch 2: 16%|█▌ | 2012/12384 [4:16:10<22:08:11, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.73s]
Epoch 2: 16%|█▌ | 2012/12384 [4:16:18<22:08:11, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.50s]
Epoch 2: 16%|█▋ | 2013/12384 [4:16:18<22:03:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.50s]
Epoch 2: 16%|█▋ | 2013/12384 [4:16:25<22:03:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 16%|█▋ | 2014/12384 [4:16:25<22:00:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 16%|█▋ | 2014/12384 [4:16:33<22:00:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 16%|█▋ | 2015/12384 [4:16:33<21:58:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 16%|█▋ | 2015/12384 [4:16:40<21:58:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 16%|█▋ | 2016/12384 [4:16:40<21:57:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 16%|█▋ | 2016/12384 [4:16:48<21:57:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 16%|█▋ | 2017/12384 [4:16:48<21:56:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 16%|█▋ | 2017/12384 [4:16:56<21:56:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 16%|█▋ | 2018/12384 [4:16:56<21:54:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 16%|█▋ | 2018/12384 [4:17:03<21:54:47, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.66s]
Epoch 2: 16%|█▋ | 2019/12384 [4:17:03<21:54:46, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.66s]
Epoch 2: 16%|█▋ | 2019/12384 [4:17:11<21:54:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 2: 16%|█▋ | 2020/12384 [4:17:11<21:53:31, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 2: 16%|█▋ | 2020/12384 [4:17:19<21:53:31, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 16%|█▋ | 2021/12384 [4:17:19<21:57:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 16%|█▋ | 2021/12384 [4:17:26<21:57:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 16%|█▋ | 2022/12384 [4:17:26<21:56:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 16%|█▋ | 2022/12384 [4:17:34<21:56:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 2: 16%|█▋ | 2023/12384 [4:17:34<22:01:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 2: 16%|█▋ | 2023/12384 [4:17:41<22:01:36, 7.65s/it, loss=0.0002, acc=0.9986, iter_time=8.02s]
Epoch 2: 16%|█▋ | 2024/12384 [4:17:41<22:00:03, 7.65s/it, loss=0.0002, acc=0.9986, iter_time=8.02s]
Epoch 2: 16%|█▋ | 2024/12384 [4:17:49<22:00:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 16%|█▋ | 2025/12384 [4:17:49<21:57:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 16%|█▋ | 2025/12384 [4:17:57<21:57:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 16%|█▋ | 2026/12384 [4:17:57<22:14:11, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 16%|█▋ | 2026/12384 [4:18:05<22:14:11, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 2: 16%|█▋ | 2027/12384 [4:18:05<22:12:10, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 2: 16%|█▋ | 2027/12384 [4:18:12<22:12:10, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.91s]
Epoch 2: 16%|█▋ | 2028/12384 [4:18:12<22:05:43, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.91s]
Epoch 2: 16%|█▋ | 2028/12384 [4:18:20<22:05:43, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.61s]
Epoch 2: 16%|█▋ | 2029/12384 [4:18:20<22:00:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.61s]
Epoch 2: 16%|█▋ | 2029/12384 [4:18:28<22:00:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 2: 16%|█▋ | 2030/12384 [4:18:28<21:59:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 2: 16%|█▋ | 2030/12384 [4:18:35<21:59:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.56s]
Epoch 2: 16%|█▋ | 2031/12384 [4:18:35<21:57:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.56s]
Epoch 2: 16%|█▋ | 2031/12384 [4:18:43<21:57:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 2: 16%|█▋ | 2032/12384 [4:18:43<21:55:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 2: 16%|█▋ | 2032/12384 [4:18:50<21:55:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 16%|█▋ | 2033/12384 [4:18:50<21:55:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 16%|█▋ | 2033/12384 [4:18:58<21:55:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.51s]
Epoch 2: 16%|█▋ | 2034/12384 [4:18:58<21:54:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.51s]
Epoch 2: 16%|█▋ | 2034/12384 [4:19:06<21:54:30, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.72s]
Epoch 2: 16%|█▋ | 2035/12384 [4:19:06<21:53:56, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.72s]
Epoch 2: 16%|█▋ | 2035/12384 [4:19:13<21:53:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 16%|█▋ | 2036/12384 [4:19:13<21:53:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 16%|█▋ | 2036/12384 [4:19:21<21:53:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 16%|█▋ | 2037/12384 [4:19:21<22:06:19, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 16%|█▋ | 2037/12384 [4:19:29<22:06:19, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.29s]
Epoch 2: 16%|█▋ | 2038/12384 [4:19:29<22:01:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.29s]
Epoch 2: 16%|█▋ | 2038/12384 [4:19:36<22:01:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 2: 16%|█▋ | 2039/12384 [4:19:36<21:57:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 2: 16%|█▋ | 2039/12384 [4:19:44<21:57:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.02s]
Epoch 2: 16%|█▋ | 2040/12384 [4:19:44<21:55:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.02s]
Epoch 2: 16%|█▋ | 2040/12384 [4:19:51<21:55:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.44s]
Epoch 2: 16%|█▋ | 2041/12384 [4:19:51<21:54:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.44s]
Epoch 2: 16%|█▋ | 2041/12384 [4:19:59<21:54:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.41s]
Epoch 2: 16%|█▋ | 2042/12384 [4:19:59<21:54:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.41s]
Epoch 2: 16%|█▋ | 2042/12384 [4:20:07<21:54:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 16%|█▋ | 2043/12384 [4:20:07<21:53:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 16%|█▋ | 2043/12384 [4:20:14<21:53:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 17%|█▋ | 2044/12384 [4:20:14<21:52:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 17%|█▋ | 2044/12384 [4:20:22<21:52:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 17%|█▋ | 2045/12384 [4:20:22<21:51:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 17%|█▋ | 2045/12384 [4:20:30<21:51:04, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.79s]
Epoch 2: 17%|█▋ | 2046/12384 [4:20:30<21:50:51, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.79s]
Epoch 2: 17%|█▋ | 2046/12384 [4:20:37<21:50:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 2: 17%|█▋ | 2047/12384 [4:20:37<21:50:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 2: 17%|█▋ | 2047/12384 [4:20:45<21:50:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 17%|█▋ | 2048/12384 [4:20:45<21:50:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 17%|█▋ | 2048/12384 [4:20:52<21:50:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.77s]
Epoch 2: 17%|█▋ | 2049/12384 [4:20:52<21:49:23, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.77s]
Epoch 2: 17%|█▋ | 2049/12384 [4:21:00<21:49:23, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=10.48s]
Epoch 2: 17%|█▋ | 2050/12384 [4:21:00<21:49:25, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=10.48s]
Epoch 2: 17%|█▋ | 2050/12384 [4:21:08<21:49:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 2: 17%|█▋ | 2051/12384 [4:21:08<21:48:44, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 2: 17%|█▋ | 2051/12384 [4:21:15<21:48:44, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 17%|█▋ | 2052/12384 [4:21:15<21:53:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 17%|█▋ | 2052/12384 [4:21:23<21:53:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 2: 17%|█▋ | 2053/12384 [4:21:23<22:07:10, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 2: 17%|█▋ | 2053/12384 [4:21:31<22:07:10, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 2: 17%|█▋ | 2054/12384 [4:21:31<22:01:35, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 2: 17%|█▋ | 2054/12384 [4:21:38<22:01:35, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.86s]
Epoch 2: 17%|█▋ | 2055/12384 [4:21:38<21:57:58, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.86s]
Epoch 2: 17%|█▋ | 2055/12384 [4:21:46<21:57:58, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 17%|█▋ | 2056/12384 [4:21:46<21:56:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 17%|█▋ | 2056/12384 [4:21:54<21:56:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 17%|█▋ | 2057/12384 [4:21:54<21:53:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 17%|█▋ | 2057/12384 [4:22:01<21:53:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.03s]
Epoch 2: 17%|█▋ | 2058/12384 [4:22:01<21:52:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.03s]
Epoch 2: 17%|█▋ | 2058/12384 [4:22:09<21:52:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.19s]
Epoch 2: 17%|█▋ | 2059/12384 [4:22:09<21:52:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.19s]
Epoch 2: 17%|█▋ | 2059/12384 [4:22:16<21:52:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 17%|█▋ | 2060/12384 [4:22:16<21:51:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 17%|█▋ | 2060/12384 [4:22:24<21:51:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 17%|█▋ | 2061/12384 [4:22:24<21:51:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 17%|█▋ | 2061/12384 [4:22:32<21:51:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.63s]
Epoch 2: 17%|█▋ | 2062/12384 [4:22:32<21:50:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.63s]
Epoch 2: 17%|█▋ | 2062/12384 [4:22:40<21:50:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 2: 17%|█▋ | 2063/12384 [4:22:40<22:04:08, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 2: 17%|█▋ | 2063/12384 [4:22:47<22:04:08, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.55s]
Epoch 2: 17%|█▋ | 2064/12384 [4:22:47<21:59:37, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.55s]
Epoch 2: 17%|█▋ | 2064/12384 [4:22:55<21:59:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 17%|█▋ | 2065/12384 [4:22:55<21:56:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 17%|█▋ | 2065/12384 [4:23:02<21:56:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 17%|█▋ | 2066/12384 [4:23:02<21:52:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 17%|█▋ | 2066/12384 [4:23:10<21:52:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 2: 17%|█▋ | 2067/12384 [4:23:10<21:54:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 2: 17%|█▋ | 2067/12384 [4:23:18<21:54:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.38s]
Epoch 2: 17%|█▋ | 2068/12384 [4:23:18<21:51:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.38s]
Epoch 2: 17%|█▋ | 2068/12384 [4:23:25<21:51:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.50s]
Epoch 2: 17%|█▋ | 2069/12384 [4:23:25<21:54:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.50s]
Epoch 2: 17%|█▋ | 2069/12384 [4:23:33<21:54:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 17%|█▋ | 2070/12384 [4:23:33<21:55:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 17%|█▋ | 2070/12384 [4:23:41<21:55:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.44s]
Epoch 2: 17%|█▋ | 2071/12384 [4:23:41<21:52:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.44s]
Epoch 2: 17%|█▋ | 2071/12384 [4:23:48<21:52:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 17%|█▋ | 2072/12384 [4:23:48<21:49:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 17%|█▋ | 2072/12384 [4:23:56<21:49:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.00s]
Epoch 2: 17%|█▋ | 2073/12384 [4:23:56<21:48:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.00s]
Epoch 2: 17%|█▋ | 2073/12384 [4:24:03<21:48:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 2: 17%|█▋ | 2074/12384 [4:24:03<21:47:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 2: 17%|█▋ | 2074/12384 [4:24:11<21:47:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 17%|█▋ | 2075/12384 [4:24:11<21:46:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 17%|█▋ | 2075/12384 [4:24:19<21:46:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 2: 17%|█▋ | 2076/12384 [4:24:19<21:47:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 2: 17%|█▋ | 2076/12384 [4:24:26<21:47:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 17%|█▋ | 2077/12384 [4:24:26<21:47:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 17%|█▋ | 2077/12384 [4:24:34<21:47:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 17%|█▋ | 2078/12384 [4:24:34<21:51:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 17%|█▋ | 2078/12384 [4:24:42<21:51:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 17%|█▋ | 2079/12384 [4:24:42<22:10:06, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 17%|█▋ | 2079/12384 [4:24:49<22:10:06, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.33s]
Epoch 2: 17%|█▋ | 2080/12384 [4:24:49<22:01:50, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.33s]
Epoch 2: 17%|█▋ | 2080/12384 [4:24:57<22:01:50, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 17%|█▋ | 2081/12384 [4:24:57<21:56:18, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 17%|█▋ | 2081/12384 [4:25:05<21:56:18, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 17%|█▋ | 2082/12384 [4:25:05<21:52:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 17%|█▋ | 2082/12384 [4:25:12<21:52:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 17%|█▋ | 2083/12384 [4:25:12<21:50:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 17%|█▋ | 2083/12384 [4:25:20<21:50:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 17%|█▋ | 2084/12384 [4:25:20<21:49:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 17%|█▋ | 2084/12384 [4:25:27<21:49:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 17%|█▋ | 2085/12384 [4:25:27<21:47:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 17%|█▋ | 2085/12384 [4:25:35<21:47:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.78s]
Epoch 2: 17%|█▋ | 2086/12384 [4:25:35<21:47:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.78s]
Epoch 2: 17%|█▋ | 2086/12384 [4:25:43<21:47:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 2: 17%|█▋ | 2087/12384 [4:25:43<21:46:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 2: 17%|█▋ | 2087/12384 [4:25:50<21:46:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 17%|█▋ | 2088/12384 [4:25:50<21:45:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 17%|█▋ | 2088/12384 [4:25:58<21:45:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 17%|█▋ | 2089/12384 [4:25:58<21:57:45, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 17%|█▋ | 2089/12384 [4:26:06<21:57:45, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 17%|█▋ | 2090/12384 [4:26:06<21:53:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 17%|█▋ | 2090/12384 [4:26:13<21:53:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 17%|█▋ | 2091/12384 [4:26:13<21:50:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 17%|█▋ | 2091/12384 [4:26:21<21:50:14, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 2: 17%|█▋ | 2092/12384 [4:26:21<21:49:20, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 2: 17%|█▋ | 2092/12384 [4:26:28<21:49:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 17%|█▋ | 2093/12384 [4:26:28<21:47:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 17%|█▋ | 2093/12384 [4:26:36<21:47:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.48s]
Epoch 2: 17%|█▋ | 2094/12384 [4:26:36<21:45:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.48s]
Epoch 2: 17%|█▋ | 2094/12384 [4:26:44<21:45:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 17%|█▋ | 2095/12384 [4:26:44<21:44:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 17%|█▋ | 2095/12384 [4:26:51<21:44:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.07s]
Epoch 2: 17%|█▋ | 2096/12384 [4:26:51<21:45:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.07s]
Epoch 2: 17%|█▋ | 2096/12384 [4:26:59<21:45:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 17%|█▋ | 2097/12384 [4:26:59<21:46:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 17%|█▋ | 2097/12384 [4:27:06<21:46:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 2: 17%|█▋ | 2098/12384 [4:27:06<21:27:52, 7.51s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 2: 17%|█▋ | 2098/12384 [4:27:14<21:27:52, 7.51s/it, loss=0.0000, acc=1.0000, iter_time=9.62s]
Epoch 2: 17%|█▋ | 2099/12384 [4:27:14<21:31:51, 7.54s/it, loss=0.0000, acc=1.0000, iter_time=9.62s]
Epoch 2: 17%|█▋ | 2099/12384 [4:27:21<21:31:51, 7.54s/it, loss=0.0002, acc=0.9999, iter_time=7.61s]
Epoch 2: 17%|█▋ | 2100/12384 [4:27:21<21:35:35, 7.56s/it, loss=0.0002, acc=0.9999, iter_time=7.61s]
Epoch 2: 17%|█▋ | 2100/12384 [4:27:29<21:35:35, 7.56s/it, loss=0.0008, acc=0.9983, iter_time=5.81s]
Epoch 2: 17%|█▋ | 2101/12384 [4:27:29<21:37:45, 7.57s/it, loss=0.0008, acc=0.9983, iter_time=5.81s]
Epoch 2: 17%|█▋ | 2101/12384 [4:27:37<21:37:45, 7.57s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 17%|█▋ | 2102/12384 [4:27:37<21:37:59, 7.57s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 17%|█▋ | 2102/12384 [4:27:44<21:37:59, 7.57s/it, loss=0.0000, acc=1.0000, iter_time=5.69s]
Epoch 2: 17%|█▋ | 2103/12384 [4:27:44<21:37:55, 7.57s/it, loss=0.0000, acc=1.0000, iter_time=5.69s]
Epoch 2: 17%|█▋ | 2103/12384 [4:27:52<21:37:55, 7.57s/it, loss=0.0000, acc=1.0000, iter_time=11.34s]
Epoch 2: 17%|█▋ | 2104/12384 [4:27:52<21:39:46, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=11.34s]
Epoch 2: 17%|█▋ | 2104/12384 [4:28:00<21:39:46, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 17%|█▋ | 2105/12384 [4:28:00<21:56:14, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 17%|█▋ | 2105/12384 [4:28:07<21:56:14, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 2: 17%|█▋ | 2106/12384 [4:28:07<21:55:48, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 2: 17%|█▋ | 2106/12384 [4:28:15<21:55:48, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 2: 17%|█▋ | 2107/12384 [4:28:15<21:51:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 2: 17%|█▋ | 2107/12384 [4:28:23<21:51:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 17%|█▋ | 2108/12384 [4:28:23<21:49:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 17%|█▋ | 2108/12384 [4:28:30<21:49:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 17%|█▋ | 2109/12384 [4:28:30<21:48:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 17%|█▋ | 2109/12384 [4:28:38<21:48:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 17%|█▋ | 2110/12384 [4:28:38<21:45:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 17%|█▋ | 2110/12384 [4:28:45<21:45:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 17%|█▋ | 2111/12384 [4:28:45<21:44:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 17%|█▋ | 2111/12384 [4:28:53<21:44:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.04s]
Epoch 2: 17%|█▋ | 2112/12384 [4:28:53<21:43:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.04s]
Epoch 2: 17%|█▋ | 2112/12384 [4:29:01<21:43:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 17%|█▋ | 2113/12384 [4:29:01<21:45:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 17%|█▋ | 2113/12384 [4:29:08<21:45:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 17%|█▋ | 2114/12384 [4:29:08<21:43:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 17%|█▋ | 2114/12384 [4:29:16<21:43:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 2: 17%|█▋ | 2115/12384 [4:29:16<21:58:42, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 2: 17%|█▋ | 2115/12384 [4:29:24<21:58:42, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.63s]
Epoch 2: 17%|█▋ | 2116/12384 [4:29:24<21:52:36, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.63s]
Epoch 2: 17%|█▋ | 2116/12384 [4:29:31<21:52:36, 7.67s/it, loss=0.0003, acc=0.9987, iter_time=8.56s]
Epoch 2: 17%|█▋ | 2117/12384 [4:29:31<21:49:32, 7.65s/it, loss=0.0003, acc=0.9987, iter_time=8.56s]
Epoch 2: 17%|█▋ | 2117/12384 [4:29:39<21:49:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 2: 17%|█▋ | 2118/12384 [4:29:39<21:44:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 2: 17%|█▋ | 2118/12384 [4:29:47<21:44:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 2: 17%|█▋ | 2119/12384 [4:29:47<21:42:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 2: 17%|█▋ | 2119/12384 [4:29:54<21:42:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 17%|█▋ | 2120/12384 [4:29:54<21:42:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 17%|█▋ | 2120/12384 [4:30:02<21:42:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 17%|█▋ | 2121/12384 [4:30:02<21:41:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 17%|█▋ | 2121/12384 [4:30:09<21:41:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 17%|█▋ | 2122/12384 [4:30:09<21:40:33, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 17%|█▋ | 2122/12384 [4:30:17<21:40:33, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 17%|█▋ | 2123/12384 [4:30:17<21:39:33, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 17%|█▋ | 2123/12384 [4:30:25<21:39:33, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 17%|█▋ | 2124/12384 [4:30:25<21:39:51, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 17%|█▋ | 2124/12384 [4:30:32<21:39:51, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 17%|█▋ | 2125/12384 [4:30:32<21:39:48, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 17%|█▋ | 2125/12384 [4:30:40<21:39:48, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 2: 17%|█▋ | 2126/12384 [4:30:40<21:42:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 2: 17%|█▋ | 2126/12384 [4:30:47<21:42:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 2: 17%|█▋ | 2127/12384 [4:30:47<21:41:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 2: 17%|█▋ | 2127/12384 [4:30:55<21:41:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 17%|█▋ | 2128/12384 [4:30:55<21:41:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 17%|█▋ | 2128/12384 [4:31:03<21:41:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.69s]
Epoch 2: 17%|█▋ | 2129/12384 [4:31:03<21:41:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.69s]
Epoch 2: 17%|█▋ | 2129/12384 [4:31:10<21:41:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 17%|█▋ | 2130/12384 [4:31:10<21:41:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 17%|█▋ | 2130/12384 [4:31:18<21:41:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.88s]
Epoch 2: 17%|█▋ | 2131/12384 [4:31:18<21:58:06, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.88s]
Epoch 2: 17%|█▋ | 2131/12384 [4:31:26<21:58:06, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 2: 17%|█▋ | 2132/12384 [4:31:26<21:53:14, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 2: 17%|█▋ | 2132/12384 [4:31:33<21:53:14, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 2: 17%|█▋ | 2133/12384 [4:31:33<21:49:48, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 2: 17%|█▋ | 2133/12384 [4:31:41<21:49:48, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 17%|█▋ | 2134/12384 [4:31:41<21:46:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 17%|█▋ | 2134/12384 [4:31:49<21:46:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 17%|█▋ | 2135/12384 [4:31:49<21:43:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 17%|█▋ | 2135/12384 [4:31:56<21:43:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 17%|█▋ | 2136/12384 [4:31:56<21:42:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 17%|█▋ | 2136/12384 [4:32:04<21:42:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 2: 17%|█▋ | 2137/12384 [4:32:04<21:42:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 2: 17%|█▋ | 2137/12384 [4:32:12<21:42:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 2: 17%|█▋ | 2138/12384 [4:32:12<21:44:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 2: 17%|█▋ | 2138/12384 [4:32:19<21:44:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 17%|█▋ | 2139/12384 [4:32:19<21:43:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 17%|█▋ | 2139/12384 [4:32:27<21:43:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 2: 17%|█▋ | 2140/12384 [4:32:27<21:40:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 2: 17%|█▋ | 2140/12384 [4:32:34<21:40:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 2: 17%|█▋ | 2141/12384 [4:32:34<21:41:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 2: 17%|█▋ | 2141/12384 [4:32:42<21:41:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.53s]
Epoch 2: 17%|█▋ | 2142/12384 [4:32:42<21:43:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.53s]
Epoch 2: 17%|█▋ | 2142/12384 [4:32:50<21:43:24, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=10.74s]
Epoch 2: 17%|█▋ | 2143/12384 [4:32:50<21:41:02, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=10.74s]
Epoch 2: 17%|█▋ | 2143/12384 [4:32:57<21:41:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 17%|█▋ | 2144/12384 [4:32:57<21:43:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 17%|█▋ | 2144/12384 [4:33:05<21:43:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 17%|█▋ | 2145/12384 [4:33:05<21:41:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 17%|█▋ | 2145/12384 [4:33:12<21:41:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 17%|█▋ | 2146/12384 [4:33:12<21:40:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 17%|█▋ | 2146/12384 [4:33:20<21:40:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 2: 17%|█▋ | 2147/12384 [4:33:20<21:39:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 2: 17%|█▋ | 2147/12384 [4:33:28<21:39:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 2: 17%|█▋ | 2148/12384 [4:33:28<21:38:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 2: 17%|█▋ | 2148/12384 [4:33:35<21:38:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.66s]
Epoch 2: 17%|█▋ | 2149/12384 [4:33:35<21:37:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.66s]
Epoch 2: 17%|█▋ | 2149/12384 [4:33:43<21:37:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 2: 17%|█▋ | 2150/12384 [4:33:43<21:36:34, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 2: 17%|█▋ | 2150/12384 [4:33:50<21:36:34, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 17%|█▋ | 2151/12384 [4:33:50<21:35:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 17%|█▋ | 2151/12384 [4:33:58<21:35:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 2: 17%|█▋ | 2152/12384 [4:33:58<21:36:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 2: 17%|█▋ | 2152/12384 [4:34:06<21:36:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 17%|█▋ | 2153/12384 [4:34:06<21:36:08, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 17%|█▋ | 2153/12384 [4:34:13<21:36:08, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 17%|█▋ | 2154/12384 [4:34:13<21:37:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 17%|█▋ | 2154/12384 [4:34:21<21:37:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 17%|█▋ | 2155/12384 [4:34:21<21:37:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 17%|█▋ | 2155/12384 [4:34:29<21:37:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 2: 17%|█▋ | 2156/12384 [4:34:29<21:36:02, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 2: 17%|█▋ | 2156/12384 [4:34:36<21:36:02, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.72s]
Epoch 2: 17%|█▋ | 2157/12384 [4:34:36<21:50:38, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.72s]
Epoch 2: 17%|█▋ | 2157/12384 [4:34:44<21:50:38, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 17%|█▋ | 2158/12384 [4:34:44<21:50:05, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 17%|█▋ | 2158/12384 [4:34:52<21:50:05, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 17%|█▋ | 2159/12384 [4:34:52<21:46:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 17%|█▋ | 2159/12384 [4:34:59<21:46:37, 7.67s/it, loss=0.0002, acc=0.9993, iter_time=8.01s]
Epoch 2: 17%|█▋ | 2160/12384 [4:34:59<21:43:42, 7.65s/it, loss=0.0002, acc=0.9993, iter_time=8.01s]
Epoch 2: 17%|█▋ | 2160/12384 [4:35:07<21:43:42, 7.65s/it, loss=0.0001, acc=0.9997, iter_time=7.21s]
Epoch 2: 17%|█▋ | 2161/12384 [4:35:07<21:41:21, 7.64s/it, loss=0.0001, acc=0.9997, iter_time=7.21s]
Epoch 2: 17%|█▋ | 2161/12384 [4:35:15<21:41:21, 7.64s/it, loss=0.0001, acc=0.9995, iter_time=7.61s]
Epoch 2: 17%|█▋ | 2162/12384 [4:35:15<21:40:20, 7.63s/it, loss=0.0001, acc=0.9995, iter_time=7.61s]
Epoch 2: 17%|█▋ | 2162/12384 [4:35:22<21:40:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 17%|█▋ | 2163/12384 [4:35:22<21:39:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 17%|█▋ | 2163/12384 [4:35:30<21:39:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 17%|█▋ | 2164/12384 [4:35:30<21:38:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 17%|█▋ | 2164/12384 [4:35:37<21:38:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 17%|█▋ | 2165/12384 [4:35:37<21:37:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 17%|█▋ | 2165/12384 [4:35:45<21:37:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.24s]
Epoch 2: 17%|█▋ | 2166/12384 [4:35:45<21:37:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.24s]
Epoch 2: 17%|█▋ | 2166/12384 [4:35:53<21:37:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.25s]
Epoch 2: 17%|█▋ | 2167/12384 [4:35:53<21:37:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.25s]
Epoch 2: 17%|█▋ | 2167/12384 [4:36:00<21:37:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 2: 18%|█▊ | 2168/12384 [4:36:00<21:41:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 2: 18%|█▊ | 2168/12384 [4:36:08<21:41:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 2: 18%|█▊ | 2169/12384 [4:36:08<21:38:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 2: 18%|█▊ | 2169/12384 [4:36:16<21:38:49, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=9.65s]
Epoch 2: 18%|█▊ | 2170/12384 [4:36:16<21:41:42, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=9.65s]
Epoch 2: 18%|█▊ | 2170/12384 [4:36:23<21:41:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.47s]
Epoch 2: 18%|█▊ | 2171/12384 [4:36:23<21:39:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.47s]
Epoch 2: 18%|█▊ | 2171/12384 [4:36:31<21:39:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.91s]
Epoch 2: 18%|█▊ | 2172/12384 [4:36:31<21:36:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.91s]
Epoch 2: 18%|█▊ | 2172/12384 [4:36:38<21:36:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 2: 18%|█▊ | 2173/12384 [4:36:38<21:36:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 2: 18%|█▊ | 2173/12384 [4:36:46<21:36:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 2: 18%|█▊ | 2174/12384 [4:36:46<21:36:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 2: 18%|█▊ | 2174/12384 [4:36:54<21:36:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 2: 18%|█▊ | 2175/12384 [4:36:54<21:35:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 2: 18%|█▊ | 2175/12384 [4:37:01<21:35:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 18%|█▊ | 2176/12384 [4:37:01<21:34:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 18%|█▊ | 2176/12384 [4:37:09<21:34:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 18%|█▊ | 2177/12384 [4:37:09<21:34:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 18%|█▊ | 2177/12384 [4:37:16<21:34:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 2: 18%|█▊ | 2178/12384 [4:37:16<21:33:24, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 2: 18%|█▊ | 2178/12384 [4:37:24<21:33:24, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 2: 18%|█▊ | 2179/12384 [4:37:24<21:34:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 2: 18%|█▊ | 2179/12384 [4:37:32<21:34:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 18%|█▊ | 2180/12384 [4:37:32<21:33:14, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 18%|█▊ | 2180/12384 [4:37:39<21:33:14, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 18%|█▊ | 2181/12384 [4:37:39<21:32:53, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 18%|█▊ | 2181/12384 [4:37:47<21:32:53, 7.60s/it, loss=0.0042, acc=0.9983, iter_time=8.00s]
Epoch 2: 18%|█▊ | 2182/12384 [4:37:47<21:33:17, 7.61s/it, loss=0.0042, acc=0.9983, iter_time=8.00s]
Epoch 2: 18%|█▊ | 2182/12384 [4:37:55<21:33:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 18%|█▊ | 2183/12384 [4:37:55<21:38:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 18%|█▊ | 2183/12384 [4:38:02<21:38:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.12s]
Epoch 2: 18%|█▊ | 2184/12384 [4:38:02<21:51:09, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.12s]
Epoch 2: 18%|█▊ | 2184/12384 [4:38:10<21:51:09, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.44s]
Epoch 2: 18%|█▊ | 2185/12384 [4:38:10<21:45:20, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.44s]
Epoch 2: 18%|█▊ | 2185/12384 [4:38:18<21:45:20, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 18%|█▊ | 2186/12384 [4:38:18<21:41:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 18%|█▊ | 2186/12384 [4:38:25<21:41:30, 7.66s/it, loss=0.0008, acc=0.9990, iter_time=7.61s]
Epoch 2: 18%|█▊ | 2187/12384 [4:38:25<21:38:49, 7.64s/it, loss=0.0008, acc=0.9990, iter_time=7.61s]
Epoch 2: 18%|█▊ | 2187/12384 [4:38:33<21:38:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 18%|█▊ | 2188/12384 [4:38:33<21:38:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 18%|█▊ | 2188/12384 [4:38:41<21:38:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 18%|█▊ | 2189/12384 [4:38:41<21:39:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 18%|█▊ | 2189/12384 [4:38:48<21:39:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 2: 18%|█▊ | 2190/12384 [4:38:48<21:37:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 2: 18%|█▊ | 2190/12384 [4:38:56<21:37:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 2: 18%|█▊ | 2191/12384 [4:38:56<21:35:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 2: 18%|█▊ | 2191/12384 [4:39:03<21:35:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 18%|█▊ | 2192/12384 [4:39:03<21:35:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 18%|█▊ | 2192/12384 [4:39:11<21:35:07, 7.62s/it, loss=0.0001, acc=0.9992, iter_time=5.09s]
Epoch 2: 18%|█▊ | 2193/12384 [4:39:11<21:33:16, 7.61s/it, loss=0.0001, acc=0.9992, iter_time=5.09s]
Epoch 2: 18%|█▊ | 2193/12384 [4:39:19<21:33:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 2: 18%|█▊ | 2194/12384 [4:39:19<21:32:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 2: 18%|█▊ | 2194/12384 [4:39:26<21:32:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 18%|█▊ | 2195/12384 [4:39:26<21:46:18, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 18%|█▊ | 2195/12384 [4:39:34<21:46:18, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 18%|█▊ | 2196/12384 [4:39:34<21:42:22, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 18%|█▊ | 2196/12384 [4:39:42<21:42:22, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 18%|█▊ | 2197/12384 [4:39:42<21:38:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 18%|█▊ | 2197/12384 [4:39:49<21:38:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 18%|█▊ | 2198/12384 [4:39:49<21:37:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 18%|█▊ | 2198/12384 [4:39:57<21:37:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 18%|█▊ | 2199/12384 [4:39:57<21:35:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 18%|█▊ | 2199/12384 [4:40:05<21:35:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.94s]
Epoch 2: 18%|█▊ | 2200/12384 [4:40:05<21:34:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.94s]
Epoch 2: 18%|█▊ | 2200/12384 [4:40:12<21:34:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 18%|█▊ | 2201/12384 [4:40:12<21:33:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 18%|█▊ | 2201/12384 [4:40:20<21:33:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 18%|█▊ | 2202/12384 [4:40:20<21:33:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 18%|█▊ | 2202/12384 [4:40:27<21:33:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 2: 18%|█▊ | 2203/12384 [4:40:27<21:33:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 2: 18%|█▊ | 2203/12384 [4:40:35<21:33:07, 7.62s/it, loss=0.0006, acc=0.9992, iter_time=8.19s]
Epoch 2: 18%|█▊ | 2204/12384 [4:40:35<21:33:05, 7.62s/it, loss=0.0006, acc=0.9992, iter_time=8.19s]
Epoch 2: 18%|█▊ | 2204/12384 [4:40:43<21:33:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 18%|█▊ | 2205/12384 [4:40:43<21:33:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 18%|█▊ | 2205/12384 [4:40:50<21:33:25, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.10s]
Epoch 2: 18%|█▊ | 2206/12384 [4:40:50<21:33:31, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.10s]
Epoch 2: 18%|█▊ | 2206/12384 [4:40:58<21:33:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 2: 18%|█▊ | 2207/12384 [4:40:58<21:32:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 2: 18%|█▊ | 2207/12384 [4:41:06<21:32:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 18%|█▊ | 2208/12384 [4:41:06<21:33:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 18%|█▊ | 2208/12384 [4:41:13<21:33:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.80s]
Epoch 2: 18%|█▊ | 2209/12384 [4:41:13<21:31:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.80s]
Epoch 2: 18%|█▊ | 2209/12384 [4:41:21<21:31:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.50s]
Epoch 2: 18%|█▊ | 2210/12384 [4:41:21<21:48:55, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.50s]
Epoch 2: 18%|█▊ | 2210/12384 [4:41:29<21:48:55, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 18%|█▊ | 2211/12384 [4:41:29<21:44:21, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 18%|█▊ | 2211/12384 [4:41:36<21:44:21, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 18%|█▊ | 2212/12384 [4:41:36<21:39:07, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 18%|█▊ | 2212/12384 [4:41:44<21:39:07, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 2: 18%|█▊ | 2213/12384 [4:41:44<21:37:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 2: 18%|█▊ | 2213/12384 [4:41:51<21:37:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 2: 18%|█▊ | 2214/12384 [4:41:51<21:33:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 2: 18%|█▊ | 2214/12384 [4:41:59<21:33:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 18%|█▊ | 2215/12384 [4:41:59<21:33:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 18%|█▊ | 2215/12384 [4:42:07<21:33:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.50s]
Epoch 2: 18%|█▊ | 2216/12384 [4:42:07<21:31:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.50s]
Epoch 2: 18%|█▊ | 2216/12384 [4:42:14<21:31:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 18%|█▊ | 2217/12384 [4:42:14<21:32:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 18%|█▊ | 2217/12384 [4:42:22<21:32:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 18%|█▊ | 2218/12384 [4:42:22<21:30:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 18%|█▊ | 2218/12384 [4:42:30<21:30:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.98s]
Epoch 2: 18%|█▊ | 2219/12384 [4:42:30<21:30:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.98s]
Epoch 2: 18%|█▊ | 2219/12384 [4:42:37<21:30:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.25s]
Epoch 2: 18%|█▊ | 2220/12384 [4:42:37<21:30:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.25s]
Epoch 2: 18%|█▊ | 2220/12384 [4:42:45<21:30:12, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.90s]
Epoch 2: 18%|█▊ | 2221/12384 [4:42:45<21:43:42, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.90s]
Epoch 2: 18%|█▊ | 2221/12384 [4:42:53<21:43:42, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 2: 18%|█▊ | 2222/12384 [4:42:53<21:37:31, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 2: 18%|█▊ | 2222/12384 [4:43:00<21:37:31, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 2: 18%|█▊ | 2223/12384 [4:43:00<21:34:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 2: 18%|█▊ | 2223/12384 [4:43:08<21:34:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.83s]
Epoch 2: 18%|█▊ | 2224/12384 [4:43:08<21:31:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.83s]
Epoch 2: 18%|█▊ | 2224/12384 [4:43:15<21:31:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.57s]
Epoch 2: 18%|█▊ | 2225/12384 [4:43:15<21:30:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.57s]
Epoch 2: 18%|█▊ | 2225/12384 [4:43:23<21:30:48, 7.62s/it, loss=0.0011, acc=0.9986, iter_time=8.27s]
Epoch 2: 18%|█▊ | 2226/12384 [4:43:23<21:33:52, 7.64s/it, loss=0.0011, acc=0.9986, iter_time=8.27s]
Epoch 2: 18%|█▊ | 2226/12384 [4:43:31<21:33:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.19s]
Epoch 2: 18%|█▊ | 2227/12384 [4:43:31<21:38:08, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.19s]
Epoch 2: 18%|█▊ | 2227/12384 [4:43:38<21:38:08, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.23s]
Epoch 2: 18%|█▊ | 2228/12384 [4:43:38<21:35:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.23s]
Epoch 2: 18%|█▊ | 2228/12384 [4:43:46<21:35:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.99s]
Epoch 2: 18%|█▊ | 2229/12384 [4:43:46<21:32:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.99s]
Epoch 2: 18%|█▊ | 2229/12384 [4:43:54<21:32:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 2: 18%|█▊ | 2230/12384 [4:43:54<21:29:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 2: 18%|█▊ | 2230/12384 [4:44:01<21:29:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 18%|█▊ | 2231/12384 [4:44:01<21:29:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 18%|█▊ | 2231/12384 [4:44:09<21:29:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 18%|█▊ | 2232/12384 [4:44:09<21:39:37, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 18%|█▊ | 2232/12384 [4:44:17<21:39:37, 7.68s/it, loss=0.0004, acc=1.0000, iter_time=7.38s]
Epoch 2: 18%|█▊ | 2233/12384 [4:44:17<21:35:57, 7.66s/it, loss=0.0004, acc=1.0000, iter_time=7.38s]
Epoch 2: 18%|█▊ | 2233/12384 [4:44:24<21:35:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 18%|█▊ | 2234/12384 [4:44:24<21:33:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 18%|█▊ | 2234/12384 [4:44:32<21:33:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 2: 18%|█▊ | 2235/12384 [4:44:32<21:31:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 2: 18%|█▊ | 2235/12384 [4:44:40<21:31:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 2: 18%|█▊ | 2236/12384 [4:44:40<21:30:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 2: 18%|█▊ | 2236/12384 [4:44:47<21:30:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 18%|█▊ | 2237/12384 [4:44:47<21:45:01, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 18%|█▊ | 2237/12384 [4:44:55<21:45:01, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 18%|█▊ | 2238/12384 [4:44:55<21:38:39, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 18%|█▊ | 2238/12384 [4:45:03<21:38:39, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 18%|█▊ | 2239/12384 [4:45:03<21:41:54, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 18%|█▊ | 2239/12384 [4:45:10<21:41:54, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 2: 18%|█▊ | 2240/12384 [4:45:10<21:38:00, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 2: 18%|█▊ | 2240/12384 [4:45:18<21:38:00, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 18%|█▊ | 2241/12384 [4:45:18<21:34:41, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 18%|█▊ | 2241/12384 [4:45:26<21:34:41, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 2: 18%|█▊ | 2242/12384 [4:45:26<21:32:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 2: 18%|█▊ | 2242/12384 [4:45:33<21:32:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 2: 18%|█▊ | 2243/12384 [4:45:33<21:29:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 2: 18%|█▊ | 2243/12384 [4:45:41<21:29:56, 7.63s/it, loss=0.0000, acc=0.9996, iter_time=10.46s]
Epoch 2: 18%|█▊ | 2244/12384 [4:45:41<21:29:19, 7.63s/it, loss=0.0000, acc=0.9996, iter_time=10.46s]
Epoch 2: 18%|█▊ | 2244/12384 [4:45:49<21:29:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 18%|█▊ | 2245/12384 [4:45:49<21:28:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 18%|█▊ | 2245/12384 [4:45:56<21:28:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 18%|█▊ | 2246/12384 [4:45:56<21:42:58, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 18%|█▊ | 2246/12384 [4:46:04<21:42:58, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 2: 18%|█▊ | 2247/12384 [4:46:04<21:40:10, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 2: 18%|█▊ | 2247/12384 [4:46:12<21:40:10, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 2: 18%|█▊ | 2248/12384 [4:46:12<21:35:08, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 2: 18%|█▊ | 2248/12384 [4:46:19<21:35:08, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 18%|█▊ | 2249/12384 [4:46:19<21:31:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 18%|█▊ | 2249/12384 [4:46:27<21:31:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 18%|█▊ | 2250/12384 [4:46:27<21:28:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 18%|█▊ | 2250/12384 [4:46:35<21:28:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 18%|█▊ | 2251/12384 [4:46:35<21:28:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 18%|█▊ | 2251/12384 [4:46:42<21:28:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 2: 18%|█▊ | 2252/12384 [4:46:42<21:26:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 2: 18%|█▊ | 2252/12384 [4:46:50<21:26:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 2: 18%|█▊ | 2253/12384 [4:46:50<21:26:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 2: 18%|█▊ | 2253/12384 [4:46:57<21:26:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 2: 18%|█▊ | 2254/12384 [4:46:57<21:26:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 2: 18%|█▊ | 2254/12384 [4:47:05<21:26:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 2: 18%|█▊ | 2255/12384 [4:47:05<21:25:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 2: 18%|█▊ | 2255/12384 [4:47:13<21:25:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 18%|█▊ | 2256/12384 [4:47:13<21:24:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 18%|█▊ | 2256/12384 [4:47:20<21:24:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 18%|█▊ | 2257/12384 [4:47:20<21:23:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 18%|█▊ | 2257/12384 [4:47:28<21:23:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 2: 18%|█▊ | 2258/12384 [4:47:28<21:22:48, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 2: 18%|█▊ | 2258/12384 [4:47:35<21:22:48, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 18%|█▊ | 2259/12384 [4:47:35<21:23:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 18%|█▊ | 2259/12384 [4:47:43<21:23:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 2: 18%|█▊ | 2260/12384 [4:47:43<21:24:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 2: 18%|█▊ | 2260/12384 [4:47:51<21:24:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 18%|█▊ | 2261/12384 [4:47:51<21:24:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 18%|█▊ | 2261/12384 [4:47:58<21:24:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 18%|█▊ | 2262/12384 [4:47:58<21:24:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 18%|█▊ | 2262/12384 [4:48:06<21:24:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 2: 18%|█▊ | 2263/12384 [4:48:06<21:42:04, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 2: 18%|█▊ | 2263/12384 [4:48:14<21:42:04, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.80s]
Epoch 2: 18%|█▊ | 2264/12384 [4:48:14<21:36:26, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.80s]
Epoch 2: 18%|█▊ | 2264/12384 [4:48:21<21:36:26, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 18%|█▊ | 2265/12384 [4:48:21<21:31:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 18%|█▊ | 2265/12384 [4:48:29<21:31:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 18%|█▊ | 2266/12384 [4:48:29<21:29:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 18%|█▊ | 2266/12384 [4:48:37<21:29:15, 7.65s/it, loss=0.0014, acc=0.9981, iter_time=7.38s]
Epoch 2: 18%|█▊ | 2267/12384 [4:48:37<21:27:56, 7.64s/it, loss=0.0014, acc=0.9981, iter_time=7.38s]
Epoch 2: 18%|█▊ | 2267/12384 [4:48:44<21:27:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 2: 18%|█▊ | 2268/12384 [4:48:44<21:27:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 2: 18%|█▊ | 2268/12384 [4:48:52<21:27:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 2: 18%|█▊ | 2269/12384 [4:48:52<21:26:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 2: 18%|█▊ | 2269/12384 [4:48:59<21:26:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 2: 18%|█▊ | 2270/12384 [4:48:59<21:25:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 2: 18%|█▊ | 2270/12384 [4:49:07<21:25:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 2: 18%|█▊ | 2271/12384 [4:49:07<21:25:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 2: 18%|█▊ | 2271/12384 [4:49:15<21:25:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 2: 18%|█▊ | 2272/12384 [4:49:15<21:39:29, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 2: 18%|█▊ | 2272/12384 [4:49:23<21:39:29, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=3.67s]
Epoch 2: 18%|█▊ | 2273/12384 [4:49:23<21:34:38, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=3.67s]
Epoch 2: 18%|█▊ | 2273/12384 [4:49:30<21:34:38, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=11.14s]
Epoch 2: 18%|█▊ | 2274/12384 [4:49:30<21:32:56, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=11.14s]
Epoch 2: 18%|█▊ | 2274/12384 [4:49:38<21:32:56, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.85s]
Epoch 2: 18%|█▊ | 2275/12384 [4:49:38<21:29:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.85s]
Epoch 2: 18%|█▊ | 2275/12384 [4:49:46<21:29:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 2: 18%|█▊ | 2276/12384 [4:49:46<21:27:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 2: 18%|█▊ | 2276/12384 [4:49:53<21:27:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 18%|█▊ | 2277/12384 [4:49:53<21:25:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 18%|█▊ | 2277/12384 [4:50:01<21:25:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 2: 18%|█▊ | 2278/12384 [4:50:01<21:26:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 2: 18%|█▊ | 2278/12384 [4:50:08<21:26:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.92s]
Epoch 2: 18%|█▊ | 2279/12384 [4:50:08<21:24:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.92s]
Epoch 2: 18%|█▊ | 2279/12384 [4:50:16<21:24:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 18%|█▊ | 2280/12384 [4:50:16<21:22:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 18%|█▊ | 2280/12384 [4:50:24<21:22:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 18%|█▊ | 2281/12384 [4:50:24<21:21:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 18%|█▊ | 2281/12384 [4:50:31<21:21:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 18%|█▊ | 2282/12384 [4:50:31<21:21:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 18%|█▊ | 2282/12384 [4:50:39<21:21:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 2: 18%|█▊ | 2283/12384 [4:50:39<21:21:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 2: 18%|█▊ | 2283/12384 [4:50:46<21:21:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.23s]
Epoch 2: 18%|█▊ | 2284/12384 [4:50:46<21:20:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.23s]
Epoch 2: 18%|█▊ | 2284/12384 [4:50:54<21:20:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 18%|█▊ | 2285/12384 [4:50:54<21:20:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 18%|█▊ | 2285/12384 [4:51:02<21:20:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.54s]
Epoch 2: 18%|█▊ | 2286/12384 [4:51:02<21:21:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.54s]
Epoch 2: 18%|█▊ | 2286/12384 [4:51:09<21:21:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.67s]
Epoch 2: 18%|█▊ | 2287/12384 [4:51:09<21:19:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.67s]
Epoch 2: 18%|█▊ | 2287/12384 [4:51:17<21:19:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 2: 18%|█▊ | 2288/12384 [4:51:17<21:18:57, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 2: 18%|█▊ | 2288/12384 [4:51:25<21:18:57, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 18%|█▊ | 2289/12384 [4:51:25<21:34:27, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 18%|█▊ | 2289/12384 [4:51:32<21:34:27, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 18%|█▊ | 2290/12384 [4:51:32<21:31:55, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 18%|█▊ | 2290/12384 [4:51:40<21:31:55, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 2: 18%|█▊ | 2291/12384 [4:51:40<21:30:33, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 2: 18%|█▊ | 2291/12384 [4:51:48<21:30:33, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.46s]
Epoch 2: 19%|█▊ | 2292/12384 [4:51:48<21:28:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.46s]
Epoch 2: 19%|█▊ | 2292/12384 [4:51:55<21:28:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 19%|█▊ | 2293/12384 [4:51:55<21:28:12, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 19%|█▊ | 2293/12384 [4:52:03<21:28:12, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 2: 19%|█▊ | 2294/12384 [4:52:03<21:28:42, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 2: 19%|█▊ | 2294/12384 [4:52:11<21:28:42, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.74s]
Epoch 2: 19%|█▊ | 2295/12384 [4:52:11<21:26:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.74s]
Epoch 2: 19%|█▊ | 2295/12384 [4:52:18<21:26:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 19%|█▊ | 2296/12384 [4:52:18<21:24:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 19%|█▊ | 2296/12384 [4:52:26<21:24:33, 7.64s/it, loss=0.0014, acc=0.9935, iter_time=7.65s]
Epoch 2: 19%|█▊ | 2297/12384 [4:52:26<21:22:49, 7.63s/it, loss=0.0014, acc=0.9935, iter_time=7.65s]
Epoch 2: 19%|█▊ | 2297/12384 [4:52:34<21:22:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 19%|█▊ | 2298/12384 [4:52:34<21:36:48, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 19%|█▊ | 2298/12384 [4:52:41<21:36:48, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 19%|█▊ | 2299/12384 [4:52:41<21:30:56, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 19%|█▊ | 2299/12384 [4:52:49<21:30:56, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 2: 19%|█▊ | 2300/12384 [4:52:49<21:27:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 2: 19%|█▊ | 2300/12384 [4:52:57<21:27:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 2: 19%|█▊ | 2301/12384 [4:52:57<21:24:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 2: 19%|█▊ | 2301/12384 [4:53:04<21:24:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 2: 19%|█▊ | 2302/12384 [4:53:04<21:22:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 2: 19%|█▊ | 2302/12384 [4:53:12<21:22:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 2: 19%|█▊ | 2303/12384 [4:53:12<21:22:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 2: 19%|█▊ | 2303/12384 [4:53:19<21:22:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 19%|█▊ | 2304/12384 [4:53:19<21:20:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 19%|█▊ | 2304/12384 [4:53:27<21:20:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 2: 19%|█▊ | 2305/12384 [4:53:27<21:20:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 2: 19%|█▊ | 2305/12384 [4:53:35<21:20:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 2: 19%|█▊ | 2306/12384 [4:53:35<21:19:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 2: 19%|█▊ | 2306/12384 [4:53:42<21:19:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 19%|█▊ | 2307/12384 [4:53:42<21:18:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 19%|█▊ | 2307/12384 [4:53:50<21:18:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 2: 19%|█▊ | 2308/12384 [4:53:50<21:17:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 2: 19%|█▊ | 2308/12384 [4:53:57<21:17:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 2: 19%|█▊ | 2309/12384 [4:53:57<21:15:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 2: 19%|█▊ | 2309/12384 [4:54:05<21:15:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 2: 19%|█▊ | 2310/12384 [4:54:05<21:16:08, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 2: 19%|█▊ | 2310/12384 [4:54:13<21:16:08, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 2: 19%|█▊ | 2311/12384 [4:54:13<21:16:35, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 2: 19%|█▊ | 2311/12384 [4:54:20<21:16:35, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 19%|█▊ | 2312/12384 [4:54:20<21:16:17, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 19%|█▊ | 2312/12384 [4:54:28<21:16:17, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 19%|█▊ | 2313/12384 [4:54:28<21:16:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 19%|█▊ | 2313/12384 [4:54:35<21:16:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 19%|█▊ | 2314/12384 [4:54:35<21:15:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 19%|█▊ | 2314/12384 [4:54:43<21:15:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 19%|█▊ | 2315/12384 [4:54:43<21:33:00, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 19%|█▊ | 2315/12384 [4:54:51<21:33:00, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 19%|█▊ | 2316/12384 [4:54:51<21:27:52, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 19%|█▊ | 2316/12384 [4:54:59<21:27:52, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 19%|█▊ | 2317/12384 [4:54:59<21:22:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 19%|█▊ | 2317/12384 [4:55:06<21:22:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 19%|█▊ | 2318/12384 [4:55:06<21:19:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 19%|█▊ | 2318/12384 [4:55:14<21:19:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.95s]
Epoch 2: 19%|█▊ | 2319/12384 [4:55:14<21:21:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.95s]
Epoch 2: 19%|█▊ | 2319/12384 [4:55:21<21:21:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.98s]
Epoch 2: 19%|█▊ | 2320/12384 [4:55:21<21:20:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.98s]
Epoch 2: 19%|█▊ | 2320/12384 [4:55:29<21:20:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 19%|█▊ | 2321/12384 [4:55:29<21:18:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 19%|█▊ | 2321/12384 [4:55:37<21:18:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 19%|█▉ | 2322/12384 [4:55:37<21:17:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 19%|█▉ | 2322/12384 [4:55:44<21:17:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 19%|█▉ | 2323/12384 [4:55:44<21:17:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 19%|█▉ | 2323/12384 [4:55:52<21:17:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.24s]
Epoch 2: 19%|█▉ | 2324/12384 [4:55:52<21:16:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.24s]
Epoch 2: 19%|█▉ | 2324/12384 [4:55:59<21:16:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 2: 19%|█▉ | 2325/12384 [4:55:59<21:17:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 2: 19%|█▉ | 2325/12384 [4:56:07<21:17:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.48s]
Epoch 2: 19%|█▉ | 2326/12384 [4:56:07<21:19:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.48s]
Epoch 2: 19%|█▉ | 2326/12384 [4:56:15<21:19:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 2: 19%|█▉ | 2327/12384 [4:56:15<21:19:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 2: 19%|█▉ | 2327/12384 [4:56:22<21:19:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 2: 19%|█▉ | 2328/12384 [4:56:22<21:20:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 2: 19%|█▉ | 2328/12384 [4:56:30<21:20:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 19%|█▉ | 2329/12384 [4:56:30<21:19:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 19%|█▉ | 2329/12384 [4:56:38<21:19:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 2: 19%|█▉ | 2330/12384 [4:56:38<21:18:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 2: 19%|█▉ | 2330/12384 [4:56:45<21:18:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.76s]
Epoch 2: 19%|█▉ | 2331/12384 [4:56:45<21:19:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.76s]
Epoch 2: 19%|█▉ | 2331/12384 [4:56:53<21:19:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 2: 19%|█▉ | 2332/12384 [4:56:53<21:20:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 2: 19%|█▉ | 2332/12384 [4:57:01<21:20:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.90s]
Epoch 2: 19%|█▉ | 2333/12384 [4:57:01<21:20:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.90s]
Epoch 2: 19%|█▉ | 2333/12384 [4:57:08<21:20:39, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.96s]
Epoch 2: 19%|█▉ | 2334/12384 [4:57:08<21:21:51, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.96s]
Epoch 2: 19%|█▉ | 2334/12384 [4:57:16<21:21:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 19%|█▉ | 2335/12384 [4:57:16<21:18:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 19%|█▉ | 2335/12384 [4:57:23<21:18:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 19%|█▉ | 2336/12384 [4:57:23<21:18:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 19%|█▉ | 2336/12384 [4:57:31<21:18:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 2: 19%|█▉ | 2337/12384 [4:57:31<21:18:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 2: 19%|█▉ | 2337/12384 [4:57:39<21:18:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.83s]
Epoch 2: 19%|█▉ | 2338/12384 [4:57:39<21:20:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.83s]
Epoch 2: 19%|█▉ | 2338/12384 [4:57:46<21:20:51, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=9.70s]
Epoch 2: 19%|█▉ | 2339/12384 [4:57:46<21:18:50, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=9.70s]
Epoch 2: 19%|█▉ | 2339/12384 [4:57:54<21:18:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 19%|█▉ | 2340/12384 [4:57:54<21:16:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 19%|█▉ | 2340/12384 [4:58:02<21:16:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 19%|█▉ | 2341/12384 [4:58:02<21:28:20, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 19%|█▉ | 2341/12384 [4:58:09<21:28:20, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.79s]
Epoch 2: 19%|█▉ | 2342/12384 [4:58:09<21:22:07, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.79s]
Epoch 2: 19%|█▉ | 2342/12384 [4:58:17<21:22:07, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 2: 19%|█▉ | 2343/12384 [4:58:17<21:19:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 2: 19%|█▉ | 2343/12384 [4:58:25<21:19:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.07s]
Epoch 2: 19%|█▉ | 2344/12384 [4:58:25<21:19:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.07s]
Epoch 2: 19%|█▉ | 2344/12384 [4:58:32<21:19:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 19%|█▉ | 2345/12384 [4:58:32<21:16:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 19%|█▉ | 2345/12384 [4:58:40<21:16:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 2: 19%|█▉ | 2346/12384 [4:58:40<21:18:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 2: 19%|█▉ | 2346/12384 [4:58:48<21:18:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 2: 19%|█▉ | 2347/12384 [4:58:48<21:16:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 2: 19%|█▉ | 2347/12384 [4:58:55<21:16:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 19%|█▉ | 2348/12384 [4:58:55<21:16:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 19%|█▉ | 2348/12384 [4:59:03<21:16:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 19%|█▉ | 2349/12384 [4:59:03<21:14:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 19%|█▉ | 2349/12384 [4:59:11<21:14:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 19%|█▉ | 2350/12384 [4:59:11<21:28:04, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 19%|█▉ | 2350/12384 [4:59:18<21:28:04, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 2: 19%|█▉ | 2351/12384 [4:59:18<21:22:42, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 2: 19%|█▉ | 2351/12384 [4:59:26<21:22:42, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 19%|█▉ | 2352/12384 [4:59:26<21:19:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 19%|█▉ | 2352/12384 [4:59:34<21:19:23, 7.65s/it, loss=0.0001, acc=0.9999, iter_time=5.24s]
Epoch 2: 19%|█▉ | 2353/12384 [4:59:34<21:16:28, 7.64s/it, loss=0.0001, acc=0.9999, iter_time=5.24s]
Epoch 2: 19%|█▉ | 2353/12384 [4:59:41<21:16:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.84s]
Epoch 2: 19%|█▉ | 2354/12384 [4:59:41<21:15:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.84s]
Epoch 2: 19%|█▉ | 2354/12384 [4:59:49<21:15:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 2: 19%|█▉ | 2355/12384 [4:59:49<21:14:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 2: 19%|█▉ | 2355/12384 [4:59:56<21:14:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 2: 19%|█▉ | 2356/12384 [4:59:56<21:12:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 2: 19%|█▉ | 2356/12384 [5:00:04<21:12:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 19%|█▉ | 2357/12384 [5:00:04<21:12:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 19%|█▉ | 2357/12384 [5:00:12<21:12:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 19%|█▉ | 2358/12384 [5:00:12<21:11:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 19%|█▉ | 2358/12384 [5:00:19<21:11:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 19%|█▉ | 2359/12384 [5:00:19<21:10:39, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 19%|█▉ | 2359/12384 [5:00:27<21:10:39, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 19%|█▉ | 2360/12384 [5:00:27<21:10:31, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 19%|█▉ | 2360/12384 [5:00:34<21:10:31, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 19%|█▉ | 2361/12384 [5:00:34<21:10:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 19%|█▉ | 2361/12384 [5:00:42<21:10:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 2: 19%|█▉ | 2362/12384 [5:00:42<21:10:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 2: 19%|█▉ | 2362/12384 [5:00:50<21:10:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 2: 19%|█▉ | 2363/12384 [5:00:50<21:11:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 2: 19%|█▉ | 2363/12384 [5:00:57<21:11:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 19%|█▉ | 2364/12384 [5:00:57<21:11:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 19%|█▉ | 2364/12384 [5:01:05<21:11:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 2: 19%|█▉ | 2365/12384 [5:01:05<21:11:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 2: 19%|█▉ | 2365/12384 [5:01:13<21:11:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 2: 19%|█▉ | 2366/12384 [5:01:13<21:14:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 2: 19%|█▉ | 2366/12384 [5:01:20<21:14:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.39s]
Epoch 2: 19%|█▉ | 2367/12384 [5:01:20<21:14:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.39s]
Epoch 2: 19%|█▉ | 2367/12384 [5:01:28<21:14:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.45s]
Epoch 2: 19%|█▉ | 2368/12384 [5:01:28<21:26:41, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=11.45s]
Epoch 2: 19%|█▉ | 2368/12384 [5:01:36<21:26:41, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 19%|█▉ | 2369/12384 [5:01:36<21:21:49, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 19%|█▉ | 2369/12384 [5:01:43<21:21:49, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 2: 19%|█▉ | 2370/12384 [5:01:43<21:18:42, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 2: 19%|█▉ | 2370/12384 [5:01:51<21:18:42, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 2: 19%|█▉ | 2371/12384 [5:01:51<21:18:51, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 2: 19%|█▉ | 2371/12384 [5:01:58<21:18:51, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.56s]
Epoch 2: 19%|█▉ | 2372/12384 [5:01:58<21:14:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.56s]
Epoch 2: 19%|█▉ | 2372/12384 [5:02:06<21:14:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.16s]
Epoch 2: 19%|█▉ | 2373/12384 [5:02:06<21:13:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.16s]
Epoch 2: 19%|█▉ | 2373/12384 [5:02:14<21:13:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.77s]
Epoch 2: 19%|█▉ | 2374/12384 [5:02:14<21:11:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.77s]
Epoch 2: 19%|█▉ | 2374/12384 [5:02:21<21:11:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.98s]
Epoch 2: 19%|█▉ | 2375/12384 [5:02:21<21:13:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.98s]
Epoch 2: 19%|█▉ | 2375/12384 [5:02:29<21:13:53, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.07s]
Epoch 2: 19%|█▉ | 2376/12384 [5:02:29<21:12:46, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.07s]
Epoch 2: 19%|█▉ | 2376/12384 [5:02:37<21:12:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.61s]
Epoch 2: 19%|█▉ | 2377/12384 [5:02:37<21:10:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.61s]
Epoch 2: 19%|█▉ | 2377/12384 [5:02:44<21:10:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.24s]
Epoch 2: 19%|█▉ | 2378/12384 [5:02:44<21:12:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.24s]
Epoch 2: 19%|█▉ | 2378/12384 [5:02:52<21:12:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 19%|█▉ | 2379/12384 [5:02:52<21:11:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 19%|█▉ | 2379/12384 [5:02:59<21:11:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 19%|█▉ | 2380/12384 [5:02:59<21:10:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 19%|█▉ | 2380/12384 [5:03:07<21:10:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 19%|█▉ | 2381/12384 [5:03:07<21:09:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 19%|█▉ | 2381/12384 [5:03:15<21:09:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 19%|█▉ | 2382/12384 [5:03:15<21:09:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 19%|█▉ | 2382/12384 [5:03:22<21:09:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.16s]
Epoch 2: 19%|█▉ | 2383/12384 [5:03:22<21:10:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.16s]
Epoch 2: 19%|█▉ | 2383/12384 [5:03:30<21:10:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.63s]
Epoch 2: 19%|█▉ | 2384/12384 [5:03:30<21:09:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.63s]
Epoch 2: 19%|█▉ | 2384/12384 [5:03:38<21:09:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 19%|█▉ | 2385/12384 [5:03:38<21:07:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 19%|█▉ | 2385/12384 [5:03:45<21:07:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.88s]
Epoch 2: 19%|█▉ | 2386/12384 [5:03:45<21:08:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.88s]
Epoch 2: 19%|█▉ | 2386/12384 [5:03:53<21:08:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 2: 19%|█▉ | 2387/12384 [5:03:53<21:07:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 2: 19%|█▉ | 2387/12384 [5:04:00<21:07:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 19%|█▉ | 2388/12384 [5:04:00<21:07:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 19%|█▉ | 2388/12384 [5:04:08<21:07:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.52s]
Epoch 2: 19%|█▉ | 2389/12384 [5:04:08<21:08:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.52s]
Epoch 2: 19%|█▉ | 2389/12384 [5:04:16<21:08:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.72s]
Epoch 2: 19%|█▉ | 2390/12384 [5:04:16<21:08:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.72s]
Epoch 2: 19%|█▉ | 2390/12384 [5:04:23<21:08:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 19%|█▉ | 2391/12384 [5:04:23<21:06:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 19%|█▉ | 2391/12384 [5:04:31<21:06:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 19%|█▉ | 2392/12384 [5:04:31<21:10:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 19%|█▉ | 2392/12384 [5:04:38<21:10:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 19%|█▉ | 2393/12384 [5:04:38<21:09:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 19%|█▉ | 2393/12384 [5:04:46<21:09:07, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=7.68s]
Epoch 2: 19%|█▉ | 2394/12384 [5:04:46<21:26:58, 7.73s/it, loss=0.0001, acc=0.9999, iter_time=7.68s]
Epoch 2: 19%|█▉ | 2394/12384 [5:04:54<21:26:58, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 19%|█▉ | 2395/12384 [5:04:54<21:20:12, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 19%|█▉ | 2395/12384 [5:05:02<21:20:12, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 19%|█▉ | 2396/12384 [5:05:02<21:17:16, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 19%|█▉ | 2396/12384 [5:05:09<21:17:16, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 2: 19%|█▉ | 2397/12384 [5:05:09<21:12:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 2: 19%|█▉ | 2397/12384 [5:05:17<21:12:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 2: 19%|█▉ | 2398/12384 [5:05:17<21:10:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 2: 19%|█▉ | 2398/12384 [5:05:25<21:10:03, 7.63s/it, loss=0.0002, acc=0.9985, iter_time=10.43s]
Epoch 2: 19%|█▉ | 2399/12384 [5:05:25<21:13:17, 7.65s/it, loss=0.0002, acc=0.9985, iter_time=10.43s]
Epoch 2: 19%|█▉ | 2399/12384 [5:05:32<21:13:17, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.67s]
Epoch 2: 19%|█▉ | 2400/12384 [5:05:32<21:11:05, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.67s]
Epoch 2: 19%|█▉ | 2400/12384 [5:05:40<21:11:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 19%|█▉ | 2401/12384 [5:05:40<21:09:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 19%|█▉ | 2401/12384 [5:05:47<21:09:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 19%|█▉ | 2402/12384 [5:05:47<21:08:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 19%|█▉ | 2402/12384 [5:05:55<21:08:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 19%|█▉ | 2403/12384 [5:05:55<21:22:18, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 19%|█▉ | 2403/12384 [5:06:03<21:22:18, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 19%|█▉ | 2404/12384 [5:06:03<21:17:26, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 19%|█▉ | 2404/12384 [5:06:11<21:17:26, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 19%|█▉ | 2405/12384 [5:06:11<21:14:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 19%|█▉ | 2405/12384 [5:06:18<21:14:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.23s]
Epoch 2: 19%|█▉ | 2406/12384 [5:06:18<21:14:41, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.23s]
Epoch 2: 19%|█▉ | 2406/12384 [5:06:26<21:14:41, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=11.04s]
Epoch 2: 19%|█▉ | 2407/12384 [5:06:26<21:12:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.04s]
Epoch 2: 19%|█▉ | 2407/12384 [5:06:33<21:12:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 19%|█▉ | 2408/12384 [5:06:33<21:09:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 19%|█▉ | 2408/12384 [5:06:41<21:09:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 2: 19%|█▉ | 2409/12384 [5:06:41<21:08:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 2: 19%|█▉ | 2409/12384 [5:06:49<21:08:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 2: 19%|█▉ | 2410/12384 [5:06:49<21:07:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 2: 19%|█▉ | 2410/12384 [5:06:56<21:07:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 19%|█▉ | 2411/12384 [5:06:56<21:10:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 19%|█▉ | 2411/12384 [5:07:04<21:10:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 19%|█▉ | 2412/12384 [5:07:04<21:10:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 19%|█▉ | 2412/12384 [5:07:12<21:10:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.42s]
Epoch 2: 19%|█▉ | 2413/12384 [5:07:12<21:08:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.42s]
Epoch 2: 19%|█▉ | 2413/12384 [5:07:19<21:08:17, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=4.77s]
Epoch 2: 19%|█▉ | 2414/12384 [5:07:19<21:07:10, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=4.77s]
Epoch 2: 19%|█▉ | 2414/12384 [5:07:27<21:07:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.08s]
Epoch 2: 20%|█▉ | 2415/12384 [5:07:27<21:06:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.08s]
Epoch 2: 20%|█▉ | 2415/12384 [5:07:34<21:06:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 2: 20%|█▉ | 2416/12384 [5:07:34<21:04:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 2: 20%|█▉ | 2416/12384 [5:07:42<21:04:35, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.87s]
Epoch 2: 20%|█▉ | 2417/12384 [5:07:42<21:04:17, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.87s]
Epoch 2: 20%|█▉ | 2417/12384 [5:07:50<21:04:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.85s]
Epoch 2: 20%|█▉ | 2418/12384 [5:07:50<21:04:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.85s]
Epoch 2: 20%|█▉ | 2418/12384 [5:07:57<21:04:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 2: 20%|█▉ | 2419/12384 [5:07:57<21:05:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 2: 20%|█▉ | 2419/12384 [5:08:05<21:05:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 20%|█▉ | 2420/12384 [5:08:05<21:07:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 20%|█▉ | 2420/12384 [5:08:13<21:07:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.94s]
Epoch 2: 20%|█▉ | 2421/12384 [5:08:13<21:22:44, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=5.94s]
Epoch 2: 20%|█▉ | 2421/12384 [5:08:20<21:22:44, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.36s]
Epoch 2: 20%|█▉ | 2422/12384 [5:08:20<21:15:21, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.36s]
Epoch 2: 20%|█▉ | 2422/12384 [5:08:28<21:15:21, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 20%|█▉ | 2423/12384 [5:08:28<21:10:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 20%|█▉ | 2423/12384 [5:08:36<21:10:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.39s]
Epoch 2: 20%|█▉ | 2424/12384 [5:08:36<21:08:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.39s]
Epoch 2: 20%|█▉ | 2424/12384 [5:08:43<21:08:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 20%|█▉ | 2425/12384 [5:08:43<21:07:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 20%|█▉ | 2425/12384 [5:08:51<21:07:24, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.04s]
Epoch 2: 20%|█▉ | 2426/12384 [5:08:51<21:05:28, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.04s]
Epoch 2: 20%|█▉ | 2426/12384 [5:08:59<21:05:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 2: 20%|█▉ | 2427/12384 [5:08:59<21:08:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 2: 20%|█▉ | 2427/12384 [5:09:06<21:08:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 2: 20%|█▉ | 2428/12384 [5:09:06<21:06:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 2: 20%|█▉ | 2428/12384 [5:09:14<21:06:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.94s]
Epoch 2: 20%|█▉ | 2429/12384 [5:09:14<21:04:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.94s]
Epoch 2: 20%|█▉ | 2429/12384 [5:09:21<21:04:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.46s]
Epoch 2: 20%|█▉ | 2430/12384 [5:09:21<21:02:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.46s]
Epoch 2: 20%|█▉ | 2430/12384 [5:09:29<21:02:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.37s]
Epoch 2: 20%|█▉ | 2431/12384 [5:09:29<21:00:46, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.37s]
Epoch 2: 20%|█▉ | 2431/12384 [5:09:37<21:00:46, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 20%|█▉ | 2432/12384 [5:09:37<21:02:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 20%|█▉ | 2432/12384 [5:09:44<21:02:42, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=7.18s]
Epoch 2: 20%|█▉ | 2433/12384 [5:09:44<21:02:26, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=7.18s]
Epoch 2: 20%|█▉ | 2433/12384 [5:09:52<21:02:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 2: 20%|█▉ | 2434/12384 [5:09:52<21:02:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 2: 20%|█▉ | 2434/12384 [5:09:59<21:02:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 2: 20%|█▉ | 2435/12384 [5:09:59<21:04:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 2: 20%|█▉ | 2435/12384 [5:10:07<21:04:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 2: 20%|█▉ | 2436/12384 [5:10:07<21:02:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 2: 20%|█▉ | 2436/12384 [5:10:15<21:02:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 2: 20%|█▉ | 2437/12384 [5:10:15<21:02:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 2: 20%|█▉ | 2437/12384 [5:10:22<21:02:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 20%|█▉ | 2438/12384 [5:10:22<21:02:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 20%|█▉ | 2438/12384 [5:10:30<21:02:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 2: 20%|█▉ | 2439/12384 [5:10:30<21:02:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 2: 20%|█▉ | 2439/12384 [5:10:37<21:02:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.76s]
Epoch 2: 20%|█▉ | 2440/12384 [5:10:37<21:00:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.76s]
Epoch 2: 20%|█▉ | 2440/12384 [5:10:45<21:00:56, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.22s]
Epoch 2: 20%|█▉ | 2441/12384 [5:10:45<21:07:16, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.22s]
Epoch 2: 20%|█▉ | 2441/12384 [5:10:53<21:07:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 2: 20%|█▉ | 2442/12384 [5:10:53<21:05:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 2: 20%|█▉ | 2442/12384 [5:11:00<21:05:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 20%|█▉ | 2443/12384 [5:11:00<21:04:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 20%|█▉ | 2443/12384 [5:11:08<21:04:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 20%|█▉ | 2444/12384 [5:11:08<21:04:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 20%|█▉ | 2444/12384 [5:11:16<21:04:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 20%|█▉ | 2445/12384 [5:11:16<21:02:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 20%|█▉ | 2445/12384 [5:11:23<21:02:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 20%|█▉ | 2446/12384 [5:11:23<21:02:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 20%|█▉ | 2446/12384 [5:11:31<21:02:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 2: 20%|█▉ | 2447/12384 [5:11:31<21:16:00, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 2: 20%|█▉ | 2447/12384 [5:11:39<21:16:00, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.44s]
Epoch 2: 20%|█▉ | 2448/12384 [5:11:39<21:11:32, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.44s]
Epoch 2: 20%|█▉ | 2448/12384 [5:11:47<21:11:32, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.87s]
Epoch 2: 20%|█▉ | 2449/12384 [5:11:47<21:13:45, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.87s]
Epoch 2: 20%|█▉ | 2449/12384 [5:11:54<21:13:45, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.52s]
Epoch 2: 20%|█▉ | 2450/12384 [5:11:54<21:09:11, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.52s]
Epoch 2: 20%|█▉ | 2450/12384 [5:12:02<21:09:11, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 2: 20%|█▉ | 2451/12384 [5:12:02<21:05:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 2: 20%|█▉ | 2451/12384 [5:12:09<21:05:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 2: 20%|█▉ | 2452/12384 [5:12:09<21:04:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 2: 20%|█▉ | 2452/12384 [5:12:17<21:04:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 2: 20%|█▉ | 2453/12384 [5:12:17<21:02:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 2: 20%|█▉ | 2453/12384 [5:12:25<21:02:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 20%|█▉ | 2454/12384 [5:12:25<21:02:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 20%|█▉ | 2454/12384 [5:12:32<21:02:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 2: 20%|█▉ | 2455/12384 [5:12:32<21:15:53, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 2: 20%|█▉ | 2455/12384 [5:12:40<21:15:53, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.54s]
Epoch 2: 20%|█▉ | 2456/12384 [5:12:40<21:10:43, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.54s]
Epoch 2: 20%|█▉ | 2456/12384 [5:12:48<21:10:43, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 2: 20%|█▉ | 2457/12384 [5:12:48<21:06:41, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 2: 20%|█▉ | 2457/12384 [5:12:55<21:06:41, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 2: 20%|█▉ | 2458/12384 [5:12:55<21:04:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 2: 20%|█▉ | 2458/12384 [5:13:03<21:04:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 20%|█▉ | 2459/12384 [5:13:03<21:02:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 20%|█▉ | 2459/12384 [5:13:11<21:02:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 2: 20%|█▉ | 2460/12384 [5:13:11<21:01:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 2: 20%|█▉ | 2460/12384 [5:13:18<21:01:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 2: 20%|█▉ | 2461/12384 [5:13:18<21:00:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 2: 20%|█▉ | 2461/12384 [5:13:26<21:00:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 2: 20%|█▉ | 2462/12384 [5:13:26<20:59:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 2: 20%|█▉ | 2462/12384 [5:13:33<20:59:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 2: 20%|█▉ | 2463/12384 [5:13:33<20:57:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 2: 20%|█▉ | 2463/12384 [5:13:41<20:57:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.11s]
Epoch 2: 20%|█▉ | 2464/12384 [5:13:41<20:57:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.11s]
Epoch 2: 20%|█▉ | 2464/12384 [5:13:49<20:57:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.65s]
Epoch 2: 20%|█▉ | 2465/12384 [5:13:49<20:56:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.65s]
Epoch 2: 20%|█▉ | 2465/12384 [5:13:56<20:56:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 2: 20%|█▉ | 2466/12384 [5:13:56<20:56:27, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 2: 20%|█▉ | 2466/12384 [5:14:04<20:56:27, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 2: 20%|█▉ | 2467/12384 [5:14:04<20:57:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 2: 20%|█▉ | 2467/12384 [5:14:11<20:57:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 20%|█▉ | 2468/12384 [5:14:11<20:56:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 20%|█▉ | 2468/12384 [5:14:19<20:56:52, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 2: 20%|█▉ | 2469/12384 [5:14:19<21:00:09, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 2: 20%|█▉ | 2469/12384 [5:14:27<21:00:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 20%|█▉ | 2470/12384 [5:14:27<20:58:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 20%|█▉ | 2470/12384 [5:14:34<20:58:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 2: 20%|█▉ | 2471/12384 [5:14:34<20:57:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 2: 20%|█▉ | 2471/12384 [5:14:42<20:57:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 20%|█▉ | 2472/12384 [5:14:42<20:56:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 20%|█▉ | 2472/12384 [5:14:50<20:56:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 20%|█▉ | 2473/12384 [5:14:50<21:13:38, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 20%|█▉ | 2473/12384 [5:14:57<21:13:38, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 20%|█▉ | 2474/12384 [5:14:57<21:08:34, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 20%|█▉ | 2474/12384 [5:15:05<21:08:34, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.12s]
Epoch 2: 20%|█▉ | 2475/12384 [5:15:05<21:05:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.12s]
Epoch 2: 20%|█▉ | 2475/12384 [5:15:13<21:05:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 2: 20%|█▉ | 2476/12384 [5:15:13<21:02:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 2: 20%|█▉ | 2476/12384 [5:15:20<21:02:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 2: 20%|██ | 2477/12384 [5:15:20<21:00:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 2: 20%|██ | 2477/12384 [5:15:28<21:00:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.42s]
Epoch 2: 20%|██ | 2478/12384 [5:15:28<20:58:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.42s]
Epoch 2: 20%|██ | 2478/12384 [5:15:35<20:58:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.11s]
Epoch 2: 20%|██ | 2479/12384 [5:15:35<21:02:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.11s]
Epoch 2: 20%|██ | 2479/12384 [5:15:43<21:02:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 2: 20%|██ | 2480/12384 [5:15:43<21:00:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 2: 20%|██ | 2480/12384 [5:15:51<21:00:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 20%|██ | 2481/12384 [5:15:51<21:00:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 20%|██ | 2481/12384 [5:15:58<21:00:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 2: 20%|██ | 2482/12384 [5:15:58<20:58:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 2: 20%|██ | 2482/12384 [5:16:06<20:58:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 20%|██ | 2483/12384 [5:16:06<20:57:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 20%|██ | 2483/12384 [5:16:14<20:57:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 20%|██ | 2484/12384 [5:16:14<20:57:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 20%|██ | 2484/12384 [5:16:21<20:57:38, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.33s]
Epoch 2: 20%|██ | 2485/12384 [5:16:21<20:56:41, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.33s]
Epoch 2: 20%|██ | 2485/12384 [5:16:29<20:56:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 2: 20%|██ | 2486/12384 [5:16:29<20:56:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 2: 20%|██ | 2486/12384 [5:16:36<20:56:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 20%|██ | 2487/12384 [5:16:36<21:00:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 20%|██ | 2487/12384 [5:16:44<21:00:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 2: 20%|██ | 2488/12384 [5:16:44<20:58:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 2: 20%|██ | 2488/12384 [5:16:52<20:58:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 20%|██ | 2489/12384 [5:16:52<21:02:50, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 20%|██ | 2489/12384 [5:16:59<21:02:50, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.40s]
Epoch 2: 20%|██ | 2490/12384 [5:16:59<21:01:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.40s]
Epoch 2: 20%|██ | 2490/12384 [5:17:07<21:01:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 20%|██ | 2491/12384 [5:17:07<20:59:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 20%|██ | 2491/12384 [5:17:15<20:59:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 2: 20%|██ | 2492/12384 [5:17:15<20:57:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 2: 20%|██ | 2492/12384 [5:17:22<20:57:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 2: 20%|██ | 2493/12384 [5:17:22<20:55:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 2: 20%|██ | 2493/12384 [5:17:30<20:55:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 20%|██ | 2494/12384 [5:17:30<20:54:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 20%|██ | 2494/12384 [5:17:37<20:54:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 20%|██ | 2495/12384 [5:17:37<20:55:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 20%|██ | 2495/12384 [5:17:45<20:55:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 20%|██ | 2496/12384 [5:17:45<20:55:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 20%|██ | 2496/12384 [5:17:53<20:55:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 2: 20%|██ | 2497/12384 [5:17:53<20:55:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 2: 20%|██ | 2497/12384 [5:18:00<20:55:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 2: 20%|██ | 2498/12384 [5:18:00<20:54:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 2: 20%|██ | 2498/12384 [5:18:08<20:54:46, 7.62s/it, loss=0.0000, acc=0.9997, iter_time=7.67s]
Epoch 2: 20%|██ | 2499/12384 [5:18:08<21:13:35, 7.73s/it, loss=0.0000, acc=0.9997, iter_time=7.67s]
Epoch 2: 20%|██ | 2499/12384 [5:18:16<21:13:35, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 20%|██ | 2500/12384 [5:18:16<21:06:54, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 20%|██ | 2500/12384 [5:18:24<21:06:54, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 20%|██ | 2501/12384 [5:18:24<21:05:01, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 20%|██ | 2501/12384 [5:18:31<21:05:01, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 2: 20%|██ | 2502/12384 [5:18:31<21:02:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 2: 20%|██ | 2502/12384 [5:18:39<21:02:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.26s]
Epoch 2: 20%|██ | 2503/12384 [5:18:39<20:59:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.26s]
Epoch 2: 20%|██ | 2503/12384 [5:18:46<20:59:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 2: 20%|██ | 2504/12384 [5:18:46<20:57:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 2: 20%|██ | 2504/12384 [5:18:54<20:57:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 2: 20%|██ | 2505/12384 [5:18:54<20:55:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 2: 20%|██ | 2505/12384 [5:19:02<20:55:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 2: 20%|██ | 2506/12384 [5:19:02<20:54:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 2: 20%|██ | 2506/12384 [5:19:10<20:54:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 20%|██ | 2507/12384 [5:19:10<21:07:55, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 20%|██ | 2507/12384 [5:19:17<21:07:55, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 2: 20%|██ | 2508/12384 [5:19:17<21:03:10, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 2: 20%|██ | 2508/12384 [5:19:25<21:03:10, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 2: 20%|██ | 2509/12384 [5:19:25<21:00:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 2: 20%|██ | 2509/12384 [5:19:32<21:00:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 20%|██ | 2510/12384 [5:19:32<20:58:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 20%|██ | 2510/12384 [5:19:40<20:58:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 2: 20%|██ | 2511/12384 [5:19:40<20:59:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 2: 20%|██ | 2511/12384 [5:19:48<20:59:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 2: 20%|██ | 2512/12384 [5:19:48<20:56:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 2: 20%|██ | 2512/12384 [5:19:55<20:56:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 20%|██ | 2513/12384 [5:19:55<20:56:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 20%|██ | 2513/12384 [5:20:03<20:56:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 2: 20%|██ | 2514/12384 [5:20:03<20:55:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 2: 20%|██ | 2514/12384 [5:20:11<20:55:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.30s]
Epoch 2: 20%|██ | 2515/12384 [5:20:11<20:53:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.30s]
Epoch 2: 20%|██ | 2515/12384 [5:20:18<20:53:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 2: 20%|██ | 2516/12384 [5:20:18<20:52:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 2: 20%|██ | 2516/12384 [5:20:26<20:52:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 20%|██ | 2517/12384 [5:20:26<20:54:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 20%|██ | 2517/12384 [5:20:33<20:54:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 20%|██ | 2518/12384 [5:20:33<20:53:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 20%|██ | 2518/12384 [5:20:41<20:53:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 20%|██ | 2519/12384 [5:20:41<20:53:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 20%|██ | 2519/12384 [5:20:49<20:53:24, 7.62s/it, loss=0.0006, acc=0.9975, iter_time=8.00s]
Epoch 2: 20%|██ | 2520/12384 [5:20:49<20:53:28, 7.62s/it, loss=0.0006, acc=0.9975, iter_time=8.00s]
Epoch 2: 20%|██ | 2520/12384 [5:20:56<20:53:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 20%|██ | 2521/12384 [5:20:56<20:51:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 20%|██ | 2521/12384 [5:21:04<20:51:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.73s]
Epoch 2: 20%|██ | 2522/12384 [5:21:04<20:51:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.73s]
Epoch 2: 20%|██ | 2522/12384 [5:21:11<20:51:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 20%|██ | 2523/12384 [5:21:11<20:51:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 20%|██ | 2523/12384 [5:21:19<20:51:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 2: 20%|██ | 2524/12384 [5:21:19<20:51:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 2: 20%|██ | 2524/12384 [5:21:27<20:51:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 20%|██ | 2525/12384 [5:21:27<21:07:58, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 20%|██ | 2525/12384 [5:21:35<21:07:58, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 20%|██ | 2526/12384 [5:21:35<21:02:08, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 20%|██ | 2526/12384 [5:21:42<21:02:08, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 20%|██ | 2527/12384 [5:21:42<20:57:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 20%|██ | 2527/12384 [5:21:50<20:57:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 2: 20%|██ | 2528/12384 [5:21:50<20:55:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 2: 20%|██ | 2528/12384 [5:21:57<20:55:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 20%|██ | 2529/12384 [5:21:57<20:52:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 20%|██ | 2529/12384 [5:22:05<20:52:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 20%|██ | 2530/12384 [5:22:05<20:51:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 20%|██ | 2530/12384 [5:22:13<20:51:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 20%|██ | 2531/12384 [5:22:13<20:50:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 20%|██ | 2531/12384 [5:22:20<20:50:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 20%|██ | 2532/12384 [5:22:20<20:50:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 20%|██ | 2532/12384 [5:22:28<20:50:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 20%|██ | 2533/12384 [5:22:28<20:50:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 20%|██ | 2533/12384 [5:22:35<20:50:06, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.11s]
Epoch 2: 20%|██ | 2534/12384 [5:22:35<20:49:18, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.11s]
Epoch 2: 20%|██ | 2534/12384 [5:22:43<20:49:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.98s]
Epoch 2: 20%|██ | 2535/12384 [5:22:43<20:48:08, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.98s]
Epoch 2: 20%|██ | 2535/12384 [5:22:51<20:48:08, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 2: 20%|██ | 2536/12384 [5:22:51<20:48:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 2: 20%|██ | 2536/12384 [5:22:58<20:48:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 20%|██ | 2537/12384 [5:22:58<20:49:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 20%|██ | 2537/12384 [5:23:06<20:49:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.10s]
Epoch 2: 20%|██ | 2538/12384 [5:23:06<20:49:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.10s]
Epoch 2: 20%|██ | 2538/12384 [5:23:14<20:49:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 2: 21%|██ | 2539/12384 [5:23:14<20:48:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 2: 21%|██ | 2539/12384 [5:23:21<20:48:27, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=5.83s]
Epoch 2: 21%|██ | 2540/12384 [5:23:21<20:48:32, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=5.83s]
Epoch 2: 21%|██ | 2540/12384 [5:23:29<20:48:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 2: 21%|██ | 2541/12384 [5:23:29<20:52:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 2: 21%|██ | 2541/12384 [5:23:36<20:52:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 21%|██ | 2542/12384 [5:23:36<20:50:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 21%|██ | 2542/12384 [5:23:44<20:50:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 21%|██ | 2543/12384 [5:23:44<20:50:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 21%|██ | 2543/12384 [5:23:52<20:50:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 21%|██ | 2544/12384 [5:23:52<20:49:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 21%|██ | 2544/12384 [5:23:59<20:49:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.46s]
Epoch 2: 21%|██ | 2545/12384 [5:23:59<20:49:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.46s]
Epoch 2: 21%|██ | 2545/12384 [5:24:07<20:49:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 2: 21%|██ | 2546/12384 [5:24:07<20:48:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 2: 21%|██ | 2546/12384 [5:24:14<20:48:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 2: 21%|██ | 2547/12384 [5:24:14<20:46:24, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 2: 21%|██ | 2547/12384 [5:24:22<20:46:24, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 2: 21%|██ | 2548/12384 [5:24:22<20:45:57, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 2: 21%|██ | 2548/12384 [5:24:30<20:45:57, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 21%|██ | 2549/12384 [5:24:30<20:51:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 21%|██ | 2549/12384 [5:24:37<20:51:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 21%|██ | 2550/12384 [5:24:37<20:50:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 21%|██ | 2550/12384 [5:24:45<20:50:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 21%|██ | 2551/12384 [5:24:45<20:51:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 21%|██ | 2551/12384 [5:24:53<20:51:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 2: 21%|██ | 2552/12384 [5:24:53<21:05:06, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 2: 21%|██ | 2552/12384 [5:25:01<21:05:06, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.44s]
Epoch 2: 21%|██ | 2553/12384 [5:25:01<20:58:45, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.44s]
Epoch 2: 21%|██ | 2553/12384 [5:25:08<20:58:45, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 21%|██ | 2554/12384 [5:25:08<20:53:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 21%|██ | 2554/12384 [5:25:16<20:53:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 21%|██ | 2555/12384 [5:25:16<20:54:31, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 21%|██ | 2555/12384 [5:25:23<20:54:31, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 21%|██ | 2556/12384 [5:25:23<20:52:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 21%|██ | 2556/12384 [5:25:31<20:52:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 21%|██ | 2557/12384 [5:25:31<20:50:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 21%|██ | 2557/12384 [5:25:39<20:50:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 21%|██ | 2558/12384 [5:25:39<20:48:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 21%|██ | 2558/12384 [5:25:46<20:48:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 21%|██ | 2559/12384 [5:25:46<20:50:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 21%|██ | 2559/12384 [5:25:54<20:50:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 21%|██ | 2560/12384 [5:25:54<20:48:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 21%|██ | 2560/12384 [5:26:02<20:48:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 21%|██ | 2561/12384 [5:26:02<21:00:28, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 21%|██ | 2561/12384 [5:26:09<21:00:28, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 21%|██ | 2562/12384 [5:26:09<20:55:57, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 21%|██ | 2562/12384 [5:26:17<20:55:57, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 21%|██ | 2563/12384 [5:26:17<20:52:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 21%|██ | 2563/12384 [5:26:25<20:52:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 21%|██ | 2564/12384 [5:26:25<20:50:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 21%|██ | 2564/12384 [5:26:32<20:50:38, 7.64s/it, loss=0.0003, acc=0.9995, iter_time=7.61s]
Epoch 2: 21%|██ | 2565/12384 [5:26:32<20:49:23, 7.63s/it, loss=0.0003, acc=0.9995, iter_time=7.61s]
Epoch 2: 21%|██ | 2565/12384 [5:26:40<20:49:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 2: 21%|██ | 2566/12384 [5:26:40<20:47:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 2: 21%|██ | 2566/12384 [5:26:47<20:47:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 2: 21%|██ | 2567/12384 [5:26:47<20:46:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 2: 21%|██ | 2567/12384 [5:26:55<20:46:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 21%|██ | 2568/12384 [5:26:55<20:48:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 21%|██ | 2568/12384 [5:27:03<20:48:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 2: 21%|██ | 2569/12384 [5:27:03<20:47:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 2: 21%|██ | 2569/12384 [5:27:10<20:47:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 21%|██ | 2570/12384 [5:27:10<20:45:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 21%|██ | 2570/12384 [5:27:18<20:45:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 2: 21%|██ | 2571/12384 [5:27:18<20:44:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 2: 21%|██ | 2571/12384 [5:27:25<20:44:52, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 2: 21%|██ | 2572/12384 [5:27:25<20:43:53, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 2: 21%|██ | 2572/12384 [5:27:33<20:43:53, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=3.86s]
Epoch 2: 21%|██ | 2573/12384 [5:27:33<20:43:53, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=3.86s]
Epoch 2: 21%|██ | 2573/12384 [5:27:41<20:43:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.33s]
Epoch 2: 21%|██ | 2574/12384 [5:27:41<20:44:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.33s]
Epoch 2: 21%|██ | 2574/12384 [5:27:48<20:44:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 21%|██ | 2575/12384 [5:27:48<20:44:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 21%|██ | 2575/12384 [5:27:56<20:44:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 21%|██ | 2576/12384 [5:27:56<20:45:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 21%|██ | 2576/12384 [5:28:04<20:45:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 2: 21%|██ | 2577/12384 [5:28:04<20:44:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 2: 21%|██ | 2577/12384 [5:28:11<20:44:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 2: 21%|██ | 2578/12384 [5:28:11<21:00:52, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 2: 21%|██ | 2578/12384 [5:28:19<21:00:52, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 2: 21%|██ | 2579/12384 [5:28:19<20:55:08, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 2: 21%|██ | 2579/12384 [5:28:27<20:55:08, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=9.11s]
Epoch 2: 21%|██ | 2580/12384 [5:28:27<20:51:55, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=9.11s]
Epoch 2: 21%|██ | 2580/12384 [5:28:34<20:51:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 21%|██ | 2581/12384 [5:28:34<20:48:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 21%|██ | 2581/12384 [5:28:42<20:48:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.53s]
Epoch 2: 21%|██ | 2582/12384 [5:28:42<20:47:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.53s]
Epoch 2: 21%|██ | 2582/12384 [5:28:50<20:47:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 21%|██ | 2583/12384 [5:28:50<20:46:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 21%|██ | 2583/12384 [5:28:57<20:46:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 21%|██ | 2584/12384 [5:28:57<20:44:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 21%|██ | 2584/12384 [5:29:05<20:44:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 21%|██ | 2585/12384 [5:29:05<20:43:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 21%|██ | 2585/12384 [5:29:12<20:43:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 21%|██ | 2586/12384 [5:29:12<20:42:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 21%|██ | 2586/12384 [5:29:20<20:42:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 2: 21%|██ | 2587/12384 [5:29:20<20:41:31, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 2: 21%|██ | 2587/12384 [5:29:28<20:41:31, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 2: 21%|██ | 2588/12384 [5:29:28<20:41:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 2: 21%|██ | 2588/12384 [5:29:35<20:41:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 21%|██ | 2589/12384 [5:29:35<20:42:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 21%|██ | 2589/12384 [5:29:43<20:42:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.06s]
Epoch 2: 21%|██ | 2590/12384 [5:29:43<20:40:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.06s]
Epoch 2: 21%|██ | 2590/12384 [5:29:50<20:40:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.11s]
Epoch 2: 21%|██ | 2591/12384 [5:29:50<20:41:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.11s]
Epoch 2: 21%|██ | 2591/12384 [5:29:58<20:41:16, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=8.02s]
Epoch 2: 21%|██ | 2592/12384 [5:29:58<20:42:13, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=8.02s]
Epoch 2: 21%|██ | 2592/12384 [5:30:06<20:42:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.94s]
Epoch 2: 21%|██ | 2593/12384 [5:30:06<20:42:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.94s]
Epoch 2: 21%|██ | 2593/12384 [5:30:13<20:42:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 2: 21%|██ | 2594/12384 [5:30:13<20:41:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 2: 21%|██ | 2594/12384 [5:30:21<20:41:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 21%|██ | 2595/12384 [5:30:21<20:41:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 21%|██ | 2595/12384 [5:30:28<20:41:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 21%|██ | 2596/12384 [5:30:28<20:41:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 21%|██ | 2596/12384 [5:30:36<20:41:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.05s]
Epoch 2: 21%|██ | 2597/12384 [5:30:36<20:46:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.05s]
Epoch 2: 21%|██ | 2597/12384 [5:30:44<20:46:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.26s]
Epoch 2: 21%|██ | 2598/12384 [5:30:44<20:45:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.26s]
Epoch 2: 21%|██ | 2598/12384 [5:30:51<20:45:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 21%|██ | 2599/12384 [5:30:51<20:44:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 21%|██ | 2599/12384 [5:30:59<20:44:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 21%|██ | 2600/12384 [5:30:59<20:43:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 21%|██ | 2600/12384 [5:31:07<20:43:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 21%|██ | 2601/12384 [5:31:07<20:41:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 21%|██ | 2601/12384 [5:31:14<20:41:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 21%|██ | 2602/12384 [5:31:14<20:41:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 21%|██ | 2602/12384 [5:31:22<20:41:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 21%|██ | 2603/12384 [5:31:22<20:41:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 21%|██ | 2603/12384 [5:31:29<20:41:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 2: 21%|██ | 2604/12384 [5:31:29<20:41:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 2: 21%|██ | 2604/12384 [5:31:37<20:41:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 2: 21%|██ | 2605/12384 [5:31:37<20:55:38, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 2: 21%|██ | 2605/12384 [5:31:45<20:55:38, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 2: 21%|██ | 2606/12384 [5:31:45<20:51:17, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 2: 21%|██ | 2606/12384 [5:31:53<20:51:17, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 21%|██ | 2607/12384 [5:31:53<20:49:28, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 21%|██ | 2607/12384 [5:32:00<20:49:28, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 21%|██ | 2608/12384 [5:32:00<20:45:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 21%|██ | 2608/12384 [5:32:08<20:45:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 21%|██ | 2609/12384 [5:32:08<20:42:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 21%|██ | 2609/12384 [5:32:15<20:42:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 21%|██ | 2610/12384 [5:32:15<20:42:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 21%|██ | 2610/12384 [5:32:23<20:42:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 2: 21%|██ | 2611/12384 [5:32:23<20:42:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 2: 21%|██ | 2611/12384 [5:32:31<20:42:28, 7.63s/it, loss=0.0002, acc=0.9985, iter_time=8.26s]
Epoch 2: 21%|██ | 2612/12384 [5:32:31<20:41:09, 7.62s/it, loss=0.0002, acc=0.9985, iter_time=8.26s]
Epoch 2: 21%|██ | 2612/12384 [5:32:39<20:41:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 21%|██ | 2613/12384 [5:32:39<20:53:20, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 21%|██ | 2613/12384 [5:32:46<20:53:20, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 21%|██ | 2614/12384 [5:32:46<20:49:42, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 21%|██ | 2614/12384 [5:32:54<20:49:42, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=8.55s]
Epoch 2: 21%|██ | 2615/12384 [5:32:54<20:46:45, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=8.55s]
Epoch 2: 21%|██ | 2615/12384 [5:33:01<20:46:45, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 21%|██ | 2616/12384 [5:33:01<20:45:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 21%|██ | 2616/12384 [5:33:09<20:45:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.45s]
Epoch 2: 21%|██ | 2617/12384 [5:33:09<20:46:56, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.45s]
Epoch 2: 21%|██ | 2617/12384 [5:33:17<20:46:56, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 2: 21%|██ | 2618/12384 [5:33:17<20:43:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 2: 21%|██ | 2618/12384 [5:33:24<20:43:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 21%|██ | 2619/12384 [5:33:24<20:41:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 21%|██ | 2619/12384 [5:33:32<20:41:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 21%|██ | 2620/12384 [5:33:32<20:39:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 21%|██ | 2620/12384 [5:33:39<20:39:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 21%|██ | 2621/12384 [5:33:39<20:38:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 21%|██ | 2621/12384 [5:33:47<20:38:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 21%|██ | 2622/12384 [5:33:47<20:38:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 21%|██ | 2622/12384 [5:33:55<20:38:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 21%|██ | 2623/12384 [5:33:55<20:38:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 21%|██ | 2623/12384 [5:34:02<20:38:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 21%|██ | 2624/12384 [5:34:02<20:38:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 21%|██ | 2624/12384 [5:34:10<20:38:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 2: 21%|██ | 2625/12384 [5:34:10<20:37:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 2: 21%|██ | 2625/12384 [5:34:18<20:37:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 2: 21%|██ | 2626/12384 [5:34:18<20:37:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 2: 21%|██ | 2626/12384 [5:34:25<20:37:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.90s]
Epoch 2: 21%|██ | 2627/12384 [5:34:25<20:36:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.90s]
Epoch 2: 21%|██ | 2627/12384 [5:34:33<20:36:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 2: 21%|██ | 2628/12384 [5:34:33<20:37:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 2: 21%|██ | 2628/12384 [5:34:40<20:37:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.33s]
Epoch 2: 21%|██ | 2629/12384 [5:34:40<20:36:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.33s]
Epoch 2: 21%|██ | 2629/12384 [5:34:48<20:36:22, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.88s]
Epoch 2: 21%|██ | 2630/12384 [5:34:48<20:37:08, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.88s]
Epoch 2: 21%|██ | 2630/12384 [5:34:56<20:37:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 21%|██ | 2631/12384 [5:34:56<20:53:27, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 21%|██ | 2631/12384 [5:35:03<20:53:27, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 2: 21%|██▏ | 2632/12384 [5:35:03<20:48:38, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 2: 21%|██▏ | 2632/12384 [5:35:11<20:48:38, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 21%|██▏ | 2633/12384 [5:35:11<20:44:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 21%|██▏ | 2633/12384 [5:35:19<20:44:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 21%|██▏ | 2634/12384 [5:35:19<20:40:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 21%|██▏ | 2634/12384 [5:35:26<20:40:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 2: 21%|██▏ | 2635/12384 [5:35:26<20:41:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 2: 21%|██▏ | 2635/12384 [5:35:34<20:41:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 2: 21%|██▏ | 2636/12384 [5:35:34<20:42:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 2: 21%|██▏ | 2636/12384 [5:35:42<20:42:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.01s]
Epoch 2: 21%|██▏ | 2637/12384 [5:35:42<20:45:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.01s]
Epoch 2: 21%|██▏ | 2637/12384 [5:35:49<20:45:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 2: 21%|██▏ | 2638/12384 [5:35:49<20:42:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 2: 21%|██▏ | 2638/12384 [5:35:57<20:42:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 21%|██▏ | 2639/12384 [5:35:57<20:54:53, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 21%|██▏ | 2639/12384 [5:36:05<20:54:53, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 21%|██▏ | 2640/12384 [5:36:05<20:48:58, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 21%|██▏ | 2640/12384 [5:36:12<20:48:58, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 2: 21%|██▏ | 2641/12384 [5:36:12<20:45:43, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 2: 21%|██▏ | 2641/12384 [5:36:20<20:45:43, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.64s]
Epoch 2: 21%|██▏ | 2642/12384 [5:36:20<20:42:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.64s]
Epoch 2: 21%|██▏ | 2642/12384 [5:36:28<20:42:36, 7.65s/it, loss=0.0002, acc=0.9987, iter_time=8.98s]
Epoch 2: 21%|██▏ | 2643/12384 [5:36:28<20:41:29, 7.65s/it, loss=0.0002, acc=0.9987, iter_time=8.98s]
Epoch 2: 21%|██▏ | 2643/12384 [5:36:35<20:41:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 2: 21%|██▏ | 2644/12384 [5:36:35<20:39:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 2: 21%|██▏ | 2644/12384 [5:36:43<20:39:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 2: 21%|██▏ | 2645/12384 [5:36:43<20:38:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 2: 21%|██▏ | 2645/12384 [5:36:51<20:38:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 2: 21%|██▏ | 2646/12384 [5:36:51<20:38:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 2: 21%|██▏ | 2646/12384 [5:36:58<20:38:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 21%|██▏ | 2647/12384 [5:36:58<20:38:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 21%|██▏ | 2647/12384 [5:37:06<20:38:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 21%|██▏ | 2648/12384 [5:37:06<20:37:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 21%|██▏ | 2648/12384 [5:37:13<20:37:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 21%|██▏ | 2649/12384 [5:37:13<20:34:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 21%|██▏ | 2649/12384 [5:37:21<20:34:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 2: 21%|██▏ | 2650/12384 [5:37:21<20:34:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 2: 21%|██▏ | 2650/12384 [5:37:29<20:34:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 2: 21%|██▏ | 2651/12384 [5:37:29<20:34:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 2: 21%|██▏ | 2651/12384 [5:37:36<20:34:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 21%|██▏ | 2652/12384 [5:37:36<20:36:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 21%|██▏ | 2652/12384 [5:37:44<20:36:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.64s]
Epoch 2: 21%|██▏ | 2653/12384 [5:37:44<20:35:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.64s]
Epoch 2: 21%|██▏ | 2653/12384 [5:37:51<20:35:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.60s]
Epoch 2: 21%|██▏ | 2654/12384 [5:37:51<20:34:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.60s]
Epoch 2: 21%|██▏ | 2654/12384 [5:37:59<20:34:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 21%|██▏ | 2655/12384 [5:37:59<20:35:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 21%|██▏ | 2655/12384 [5:38:07<20:35:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 21%|██▏ | 2656/12384 [5:38:07<20:38:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 21%|██▏ | 2656/12384 [5:38:15<20:38:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 21%|██▏ | 2657/12384 [5:38:15<20:47:37, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 21%|██▏ | 2657/12384 [5:38:22<20:47:37, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.80s]
Epoch 2: 21%|██▏ | 2658/12384 [5:38:22<20:43:54, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.80s]
Epoch 2: 21%|██▏ | 2658/12384 [5:38:30<20:43:54, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 21%|██▏ | 2659/12384 [5:38:30<20:40:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 21%|██▏ | 2659/12384 [5:38:37<20:40:30, 7.65s/it, loss=0.0001, acc=0.9997, iter_time=7.59s]
Epoch 2: 21%|██▏ | 2660/12384 [5:38:37<20:37:16, 7.63s/it, loss=0.0001, acc=0.9997, iter_time=7.59s]
Epoch 2: 21%|██▏ | 2660/12384 [5:38:45<20:37:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 21%|██▏ | 2661/12384 [5:38:45<20:36:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 21%|██▏ | 2661/12384 [5:38:53<20:36:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 21%|██▏ | 2662/12384 [5:38:53<20:35:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 21%|██▏ | 2662/12384 [5:39:00<20:35:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 22%|██▏ | 2663/12384 [5:39:00<20:34:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 22%|██▏ | 2663/12384 [5:39:08<20:34:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 22%|██▏ | 2664/12384 [5:39:08<20:33:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 22%|██▏ | 2664/12384 [5:39:16<20:33:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 2: 22%|██▏ | 2665/12384 [5:39:16<20:46:32, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 2: 22%|██▏ | 2665/12384 [5:39:23<20:46:32, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 2: 22%|██▏ | 2666/12384 [5:39:23<20:41:23, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 2: 22%|██▏ | 2666/12384 [5:39:31<20:41:23, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 2: 22%|██▏ | 2667/12384 [5:39:31<20:39:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 2: 22%|██▏ | 2667/12384 [5:39:39<20:39:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.15s]
Epoch 2: 22%|██▏ | 2668/12384 [5:39:39<20:36:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.15s]
Epoch 2: 22%|██▏ | 2668/12384 [5:39:46<20:36:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 2: 22%|██▏ | 2669/12384 [5:39:46<20:39:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 2: 22%|██▏ | 2669/12384 [5:39:54<20:39:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 2: 22%|██▏ | 2670/12384 [5:39:54<20:37:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 2: 22%|██▏ | 2670/12384 [5:40:01<20:37:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 2: 22%|██▏ | 2671/12384 [5:40:01<20:35:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 2: 22%|██▏ | 2671/12384 [5:40:09<20:35:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.72s]
Epoch 2: 22%|██▏ | 2672/12384 [5:40:09<20:36:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.72s]
Epoch 2: 22%|██▏ | 2672/12384 [5:40:17<20:36:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.85s]
Epoch 2: 22%|██▏ | 2673/12384 [5:40:17<20:35:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.85s]
Epoch 2: 22%|██▏ | 2673/12384 [5:40:24<20:35:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.43s]
Epoch 2: 22%|██▏ | 2674/12384 [5:40:24<20:34:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.43s]
Epoch 2: 22%|██▏ | 2674/12384 [5:40:32<20:34:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.36s]
Epoch 2: 22%|██▏ | 2675/12384 [5:40:32<20:34:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.36s]
Epoch 2: 22%|██▏ | 2675/12384 [5:40:40<20:34:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.90s]
Epoch 2: 22%|██▏ | 2676/12384 [5:40:40<20:33:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.90s]
Epoch 2: 22%|██▏ | 2676/12384 [5:40:47<20:33:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 22%|██▏ | 2677/12384 [5:40:47<20:32:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 22%|██▏ | 2677/12384 [5:40:55<20:32:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 22%|██▏ | 2678/12384 [5:40:55<20:31:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 22%|██▏ | 2678/12384 [5:41:02<20:31:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 2: 22%|██▏ | 2679/12384 [5:41:02<20:27:40, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 2: 22%|██▏ | 2679/12384 [5:41:10<20:27:40, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 2: 22%|██▏ | 2680/12384 [5:41:10<20:28:20, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 2: 22%|██▏ | 2680/12384 [5:41:18<20:28:20, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 22%|██▏ | 2681/12384 [5:41:18<20:28:16, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 22%|██▏ | 2681/12384 [5:41:25<20:28:16, 7.60s/it, loss=0.0005, acc=1.0000, iter_time=8.01s]
Epoch 2: 22%|██▏ | 2682/12384 [5:41:25<20:28:39, 7.60s/it, loss=0.0005, acc=1.0000, iter_time=8.01s]
Epoch 2: 22%|██▏ | 2682/12384 [5:41:33<20:28:39, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 22%|██▏ | 2683/12384 [5:41:33<20:45:11, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 22%|██▏ | 2683/12384 [5:41:41<20:45:11, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 2: 22%|██▏ | 2684/12384 [5:41:41<20:39:16, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 2: 22%|██▏ | 2684/12384 [5:41:48<20:39:16, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.32s]
Epoch 2: 22%|██▏ | 2685/12384 [5:41:48<20:35:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.32s]
Epoch 2: 22%|██▏ | 2685/12384 [5:41:56<20:35:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 2: 22%|██▏ | 2686/12384 [5:41:56<20:32:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 2: 22%|██▏ | 2686/12384 [5:42:03<20:32:49, 7.63s/it, loss=0.0002, acc=0.9989, iter_time=10.72s]
Epoch 2: 22%|██▏ | 2687/12384 [5:42:03<20:30:55, 7.62s/it, loss=0.0002, acc=0.9989, iter_time=10.72s]
Epoch 2: 22%|██▏ | 2687/12384 [5:42:11<20:30:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 22%|██▏ | 2688/12384 [5:42:11<20:30:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 22%|██▏ | 2688/12384 [5:42:19<20:30:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 22%|██▏ | 2689/12384 [5:42:19<20:30:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 22%|██▏ | 2689/12384 [5:42:26<20:30:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 22%|██▏ | 2690/12384 [5:42:26<20:29:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 22%|██▏ | 2690/12384 [5:42:34<20:29:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 22%|██▏ | 2691/12384 [5:42:34<20:44:32, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 22%|██▏ | 2691/12384 [5:42:42<20:44:32, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 22%|██▏ | 2692/12384 [5:42:42<20:39:04, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 22%|██▏ | 2692/12384 [5:42:49<20:39:04, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 22%|██▏ | 2693/12384 [5:42:49<20:35:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 22%|██▏ | 2693/12384 [5:42:57<20:35:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.28s]
Epoch 2: 22%|██▏ | 2694/12384 [5:42:57<20:33:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.28s]
Epoch 2: 22%|██▏ | 2694/12384 [5:43:05<20:33:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 22%|██▏ | 2695/12384 [5:43:05<20:32:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 22%|██▏ | 2695/12384 [5:43:12<20:32:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.33s]
Epoch 2: 22%|██▏ | 2696/12384 [5:43:12<20:30:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.33s]
Epoch 2: 22%|██▏ | 2696/12384 [5:43:20<20:30:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 22%|██▏ | 2697/12384 [5:43:20<20:30:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 22%|██▏ | 2697/12384 [5:43:27<20:30:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 22%|██▏ | 2698/12384 [5:43:27<20:30:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 22%|██▏ | 2698/12384 [5:43:35<20:30:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 22%|██▏ | 2699/12384 [5:43:35<20:29:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 22%|██▏ | 2699/12384 [5:43:43<20:29:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 22%|██▏ | 2700/12384 [5:43:43<20:29:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 22%|██▏ | 2700/12384 [5:43:50<20:29:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 2: 22%|██▏ | 2701/12384 [5:43:50<20:28:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 2: 22%|██▏ | 2701/12384 [5:43:58<20:28:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 22%|██▏ | 2702/12384 [5:43:58<20:27:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 22%|██▏ | 2702/12384 [5:44:06<20:27:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 2: 22%|██▏ | 2703/12384 [5:44:06<20:27:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 2: 22%|██▏ | 2703/12384 [5:44:13<20:27:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 22%|██▏ | 2704/12384 [5:44:13<20:27:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 22%|██▏ | 2704/12384 [5:44:21<20:27:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 2: 22%|██▏ | 2705/12384 [5:44:21<20:27:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 2: 22%|██▏ | 2705/12384 [5:44:28<20:27:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 22%|██▏ | 2706/12384 [5:44:28<20:27:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 22%|██▏ | 2706/12384 [5:44:36<20:27:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 22%|██▏ | 2707/12384 [5:44:36<20:27:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 22%|██▏ | 2707/12384 [5:44:44<20:27:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 2: 22%|██▏ | 2708/12384 [5:44:44<20:27:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 2: 22%|██▏ | 2708/12384 [5:44:52<20:27:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 2: 22%|██▏ | 2709/12384 [5:44:52<20:42:57, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 2: 22%|██▏ | 2709/12384 [5:44:59<20:42:57, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 22%|██▏ | 2710/12384 [5:44:59<20:37:23, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 22%|██▏ | 2710/12384 [5:45:07<20:37:23, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 22%|██▏ | 2711/12384 [5:45:07<20:33:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 22%|██▏ | 2711/12384 [5:45:14<20:33:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 22%|██▏ | 2712/12384 [5:45:14<20:32:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 22%|██▏ | 2712/12384 [5:45:22<20:32:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 22%|██▏ | 2713/12384 [5:45:22<20:30:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 22%|██▏ | 2713/12384 [5:45:30<20:30:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 22%|██▏ | 2714/12384 [5:45:30<20:29:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 22%|██▏ | 2714/12384 [5:45:37<20:29:00, 7.63s/it, loss=0.0035, acc=0.9945, iter_time=7.60s]
Epoch 2: 22%|██▏ | 2715/12384 [5:45:37<20:27:29, 7.62s/it, loss=0.0035, acc=0.9945, iter_time=7.60s]
Epoch 2: 22%|██▏ | 2715/12384 [5:45:45<20:27:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 22%|██▏ | 2716/12384 [5:45:45<20:26:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 22%|██▏ | 2716/12384 [5:45:52<20:26:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 22%|██▏ | 2717/12384 [5:45:52<20:26:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 22%|██▏ | 2717/12384 [5:46:00<20:26:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 2: 22%|██▏ | 2718/12384 [5:46:00<20:26:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 2: 22%|██▏ | 2718/12384 [5:46:08<20:26:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.67s]
Epoch 2: 22%|██▏ | 2719/12384 [5:46:08<20:26:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.67s]
Epoch 2: 22%|██▏ | 2719/12384 [5:46:15<20:26:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.76s]
Epoch 2: 22%|██▏ | 2720/12384 [5:46:15<20:26:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.76s]
Epoch 2: 22%|██▏ | 2720/12384 [5:46:23<20:26:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.58s]
Epoch 2: 22%|██▏ | 2721/12384 [5:46:23<20:25:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.58s]
Epoch 2: 22%|██▏ | 2721/12384 [5:46:30<20:25:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 2: 22%|██▏ | 2722/12384 [5:46:30<20:25:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 2: 22%|██▏ | 2722/12384 [5:46:38<20:25:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 22%|██▏ | 2723/12384 [5:46:38<20:28:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 22%|██▏ | 2723/12384 [5:46:46<20:28:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.40s]
Epoch 2: 22%|██▏ | 2724/12384 [5:46:46<20:27:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.40s]
Epoch 2: 22%|██▏ | 2724/12384 [5:46:53<20:27:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.87s]
Epoch 2: 22%|██▏ | 2725/12384 [5:46:53<20:27:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.87s]
Epoch 2: 22%|██▏ | 2725/12384 [5:47:01<20:27:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 22%|██▏ | 2726/12384 [5:47:01<20:25:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 22%|██▏ | 2726/12384 [5:47:09<20:25:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 22%|██▏ | 2727/12384 [5:47:09<20:25:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 22%|██▏ | 2727/12384 [5:47:16<20:25:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 2: 22%|██▏ | 2728/12384 [5:47:16<20:29:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 2: 22%|██▏ | 2728/12384 [5:47:24<20:29:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 22%|██▏ | 2729/12384 [5:47:24<20:28:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 22%|██▏ | 2729/12384 [5:47:31<20:28:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.57s]
Epoch 2: 22%|██▏ | 2730/12384 [5:47:31<20:26:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.57s]
Epoch 2: 22%|██▏ | 2730/12384 [5:47:39<20:26:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.67s]
Epoch 2: 22%|██▏ | 2731/12384 [5:47:39<20:25:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.67s]
Epoch 2: 22%|██▏ | 2731/12384 [5:47:47<20:25:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 22%|██▏ | 2732/12384 [5:47:47<20:34:48, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 22%|██▏ | 2732/12384 [5:47:54<20:34:48, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.62s]
Epoch 2: 22%|██▏ | 2733/12384 [5:47:54<20:30:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.62s]
Epoch 2: 22%|██▏ | 2733/12384 [5:48:02<20:30:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 2: 22%|██▏ | 2734/12384 [5:48:02<20:30:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 2: 22%|██▏ | 2734/12384 [5:48:10<20:30:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 2: 22%|██▏ | 2735/12384 [5:48:10<20:27:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 2: 22%|██▏ | 2735/12384 [5:48:18<20:27:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 22%|██▏ | 2736/12384 [5:48:18<20:42:52, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 22%|██▏ | 2736/12384 [5:48:25<20:42:52, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 22%|██▏ | 2737/12384 [5:48:25<20:37:11, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 22%|██▏ | 2737/12384 [5:48:33<20:37:11, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 22%|██▏ | 2738/12384 [5:48:33<20:34:22, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 22%|██▏ | 2738/12384 [5:48:41<20:34:22, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 22%|██▏ | 2739/12384 [5:48:41<20:34:28, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 22%|██▏ | 2739/12384 [5:48:48<20:34:28, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 22%|██▏ | 2740/12384 [5:48:48<20:31:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 22%|██▏ | 2740/12384 [5:48:56<20:31:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 22%|██▏ | 2741/12384 [5:48:56<20:27:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 22%|██▏ | 2741/12384 [5:49:03<20:27:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 2: 22%|██▏ | 2742/12384 [5:49:03<20:26:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 2: 22%|██▏ | 2742/12384 [5:49:11<20:26:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.68s]
Epoch 2: 22%|██▏ | 2743/12384 [5:49:11<20:23:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.68s]
Epoch 2: 22%|██▏ | 2743/12384 [5:49:19<20:23:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.04s]
Epoch 2: 22%|██▏ | 2744/12384 [5:49:19<20:23:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.04s]
Epoch 2: 22%|██▏ | 2744/12384 [5:49:26<20:23:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 22%|██▏ | 2745/12384 [5:49:26<20:23:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 22%|██▏ | 2745/12384 [5:49:34<20:23:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 2: 22%|██▏ | 2746/12384 [5:49:34<20:23:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 2: 22%|██▏ | 2746/12384 [5:49:41<20:23:01, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=7.29s]
Epoch 2: 22%|██▏ | 2747/12384 [5:49:41<20:21:01, 7.60s/it, loss=0.0001, acc=0.9998, iter_time=7.29s]
Epoch 2: 22%|██▏ | 2747/12384 [5:49:49<20:21:01, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 2: 22%|██▏ | 2748/12384 [5:49:49<20:21:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 2: 22%|██▏ | 2748/12384 [5:49:57<20:21:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 2: 22%|██▏ | 2749/12384 [5:49:57<20:20:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 2: 22%|██▏ | 2749/12384 [5:50:04<20:20:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.46s]
Epoch 2: 22%|██▏ | 2750/12384 [5:50:04<20:19:23, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=6.46s]
Epoch 2: 22%|██▏ | 2750/12384 [5:50:12<20:19:23, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 2: 22%|██▏ | 2751/12384 [5:50:12<20:20:14, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 2: 22%|██▏ | 2751/12384 [5:50:19<20:20:14, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 22%|██▏ | 2752/12384 [5:50:19<20:20:01, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 22%|██▏ | 2752/12384 [5:50:27<20:20:01, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.71s]
Epoch 2: 22%|██▏ | 2753/12384 [5:50:27<20:20:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.71s]
Epoch 2: 22%|██▏ | 2753/12384 [5:50:35<20:20:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 2: 22%|██▏ | 2754/12384 [5:50:35<20:21:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 2: 22%|██▏ | 2754/12384 [5:50:42<20:21:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 2: 22%|██▏ | 2755/12384 [5:50:42<20:21:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 2: 22%|██▏ | 2755/12384 [5:50:50<20:21:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.62s]
Epoch 2: 22%|██▏ | 2756/12384 [5:50:50<20:21:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.62s]
Epoch 2: 22%|██▏ | 2756/12384 [5:50:57<20:21:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 2: 22%|██▏ | 2757/12384 [5:50:57<20:22:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 2: 22%|██▏ | 2757/12384 [5:51:05<20:22:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 2: 22%|██▏ | 2758/12384 [5:51:05<20:21:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 2: 22%|██▏ | 2758/12384 [5:51:13<20:21:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 22%|██▏ | 2759/12384 [5:51:13<20:21:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 22%|██▏ | 2759/12384 [5:51:20<20:21:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 2: 22%|██▏ | 2760/12384 [5:51:20<20:22:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 2: 22%|██▏ | 2760/12384 [5:51:28<20:22:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 22%|██▏ | 2761/12384 [5:51:28<20:22:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 22%|██▏ | 2761/12384 [5:51:36<20:22:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 22%|██▏ | 2762/12384 [5:51:36<20:38:51, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 22%|██▏ | 2762/12384 [5:51:44<20:38:51, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 22%|██▏ | 2763/12384 [5:51:44<20:32:20, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 22%|██▏ | 2763/12384 [5:51:51<20:32:20, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 22%|██▏ | 2764/12384 [5:51:51<20:28:00, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 22%|██▏ | 2764/12384 [5:51:59<20:28:00, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 22%|██▏ | 2765/12384 [5:51:59<20:25:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 22%|██▏ | 2765/12384 [5:52:06<20:25:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 22%|██▏ | 2766/12384 [5:52:06<20:23:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 22%|██▏ | 2766/12384 [5:52:14<20:23:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 22%|██▏ | 2767/12384 [5:52:14<20:22:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 22%|██▏ | 2767/12384 [5:52:22<20:22:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 22%|██▏ | 2768/12384 [5:52:22<20:23:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 22%|██▏ | 2768/12384 [5:52:29<20:23:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 22%|██▏ | 2769/12384 [5:52:29<20:21:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 22%|██▏ | 2769/12384 [5:52:37<20:21:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 2: 22%|██▏ | 2770/12384 [5:52:37<20:36:53, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 2: 22%|██▏ | 2770/12384 [5:52:45<20:36:53, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 22%|██▏ | 2771/12384 [5:52:45<20:31:36, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 22%|██▏ | 2771/12384 [5:52:52<20:31:36, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 22%|██▏ | 2772/12384 [5:52:52<20:27:25, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 22%|██▏ | 2772/12384 [5:53:00<20:27:25, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 22%|██▏ | 2773/12384 [5:53:00<20:25:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 22%|██▏ | 2773/12384 [5:53:08<20:25:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.57s]
Epoch 2: 22%|██▏ | 2774/12384 [5:53:08<20:23:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.57s]
Epoch 2: 22%|██▏ | 2774/12384 [5:53:15<20:23:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 2: 22%|██▏ | 2775/12384 [5:53:15<20:22:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 2: 22%|██▏ | 2775/12384 [5:53:23<20:22:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 22%|██▏ | 2776/12384 [5:53:23<20:21:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 22%|██▏ | 2776/12384 [5:53:30<20:21:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.70s]
Epoch 2: 22%|██▏ | 2777/12384 [5:53:30<20:19:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.70s]
Epoch 2: 22%|██▏ | 2777/12384 [5:53:38<20:19:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 2: 22%|██▏ | 2778/12384 [5:53:38<20:19:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 2: 22%|██▏ | 2778/12384 [5:53:46<20:19:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 22%|██▏ | 2779/12384 [5:53:46<20:18:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 22%|██▏ | 2779/12384 [5:53:53<20:18:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 22%|██▏ | 2780/12384 [5:53:53<20:20:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 22%|██▏ | 2780/12384 [5:54:01<20:20:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 22%|██▏ | 2781/12384 [5:54:01<20:18:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 22%|██▏ | 2781/12384 [5:54:08<20:18:54, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 2: 22%|██▏ | 2782/12384 [5:54:08<20:18:03, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 2: 22%|██▏ | 2782/12384 [5:54:16<20:18:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 22%|██▏ | 2783/12384 [5:54:16<20:17:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 22%|██▏ | 2783/12384 [5:54:24<20:17:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 22%|██▏ | 2784/12384 [5:54:24<20:17:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 22%|██▏ | 2784/12384 [5:54:31<20:17:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 22%|██▏ | 2785/12384 [5:54:31<20:17:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 22%|██▏ | 2785/12384 [5:54:39<20:17:00, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 2: 22%|██▏ | 2786/12384 [5:54:39<20:17:34, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 2: 22%|██▏ | 2786/12384 [5:54:47<20:17:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 23%|██▎ | 2787/12384 [5:54:47<20:16:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 23%|██▎ | 2787/12384 [5:54:54<20:16:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.25s]
Epoch 2: 23%|██▎ | 2788/12384 [5:54:54<20:16:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.25s]
Epoch 2: 23%|██▎ | 2788/12384 [5:55:02<20:16:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 2: 23%|██▎ | 2789/12384 [5:55:02<20:32:31, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 2: 23%|██▎ | 2789/12384 [5:55:10<20:32:31, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 23%|██▎ | 2790/12384 [5:55:10<20:27:07, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 23%|██▎ | 2790/12384 [5:55:17<20:27:07, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 23%|██▎ | 2791/12384 [5:55:17<20:23:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 23%|██▎ | 2791/12384 [5:55:25<20:23:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 2: 23%|██▎ | 2792/12384 [5:55:25<20:22:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 2: 23%|██▎ | 2792/12384 [5:55:33<20:22:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 23%|██▎ | 2793/12384 [5:55:33<20:19:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 23%|██▎ | 2793/12384 [5:55:40<20:19:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 23%|██▎ | 2794/12384 [5:55:40<20:18:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 23%|██▎ | 2794/12384 [5:55:48<20:18:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 23%|██▎ | 2795/12384 [5:55:48<20:18:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 23%|██▎ | 2795/12384 [5:55:56<20:18:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 23%|██▎ | 2796/12384 [5:55:56<20:31:26, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 23%|██▎ | 2796/12384 [5:56:03<20:31:26, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 23%|██▎ | 2797/12384 [5:56:03<20:26:29, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 23%|██▎ | 2797/12384 [5:56:11<20:26:29, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 23%|██▎ | 2798/12384 [5:56:11<20:22:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 23%|██▎ | 2798/12384 [5:56:18<20:22:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 23%|██▎ | 2799/12384 [5:56:18<20:20:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 23%|██▎ | 2799/12384 [5:56:26<20:20:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 23%|██▎ | 2800/12384 [5:56:26<20:18:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 23%|██▎ | 2800/12384 [5:56:34<20:18:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.18s]
Epoch 2: 23%|██▎ | 2801/12384 [5:56:34<20:17:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.18s]
Epoch 2: 23%|██▎ | 2801/12384 [5:56:41<20:17:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.63s]
Epoch 2: 23%|██▎ | 2802/12384 [5:56:41<20:16:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.63s]
Epoch 2: 23%|██▎ | 2802/12384 [5:56:49<20:16:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 23%|██▎ | 2803/12384 [5:56:49<20:15:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 23%|██▎ | 2803/12384 [5:56:56<20:15:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 2: 23%|██▎ | 2804/12384 [5:56:56<20:13:31, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 2: 23%|██▎ | 2804/12384 [5:57:04<20:13:31, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 2: 23%|██▎ | 2805/12384 [5:57:04<20:14:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 2: 23%|██▎ | 2805/12384 [5:57:12<20:14:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 23%|██▎ | 2806/12384 [5:57:12<20:14:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 23%|██▎ | 2806/12384 [5:57:19<20:14:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 2: 23%|██▎ | 2807/12384 [5:57:19<20:14:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 2: 23%|██▎ | 2807/12384 [5:57:27<20:14:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.79s]
Epoch 2: 23%|██▎ | 2808/12384 [5:57:27<20:15:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.79s]
Epoch 2: 23%|██▎ | 2808/12384 [5:57:35<20:15:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.98s]
Epoch 2: 23%|██▎ | 2809/12384 [5:57:35<20:15:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.98s]
Epoch 2: 23%|██▎ | 2809/12384 [5:57:42<20:15:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 2: 23%|██▎ | 2810/12384 [5:57:42<20:15:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 2: 23%|██▎ | 2810/12384 [5:57:50<20:15:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 23%|██▎ | 2811/12384 [5:57:50<20:14:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 23%|██▎ | 2811/12384 [5:57:57<20:14:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 23%|██▎ | 2812/12384 [5:57:57<20:13:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 23%|██▎ | 2812/12384 [5:58:05<20:13:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 23%|██▎ | 2813/12384 [5:58:05<20:12:36, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 23%|██▎ | 2813/12384 [5:58:13<20:12:36, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 23%|██▎ | 2814/12384 [5:58:13<20:11:51, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 23%|██▎ | 2814/12384 [5:58:20<20:11:51, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 23%|██▎ | 2815/12384 [5:58:20<20:29:07, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 23%|██▎ | 2815/12384 [5:58:28<20:29:07, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 2: 23%|██▎ | 2816/12384 [5:58:28<20:24:15, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 2: 23%|██▎ | 2816/12384 [5:58:36<20:24:15, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 2: 23%|██▎ | 2817/12384 [5:58:36<20:21:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 2: 23%|██▎ | 2817/12384 [5:58:43<20:21:09, 7.66s/it, loss=0.0003, acc=0.9986, iter_time=9.25s]
Epoch 2: 23%|██▎ | 2818/12384 [5:58:43<20:17:45, 7.64s/it, loss=0.0003, acc=0.9986, iter_time=9.25s]
Epoch 2: 23%|██▎ | 2818/12384 [5:58:51<20:17:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 2: 23%|██▎ | 2819/12384 [5:58:51<20:20:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 2: 23%|██▎ | 2819/12384 [5:58:59<20:20:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 23%|██▎ | 2820/12384 [5:58:59<20:17:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 23%|██▎ | 2820/12384 [5:59:06<20:17:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 2: 23%|██▎ | 2821/12384 [5:59:06<20:17:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 2: 23%|██▎ | 2821/12384 [5:59:14<20:17:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 2: 23%|██▎ | 2822/12384 [5:59:14<20:29:18, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 2: 23%|██▎ | 2822/12384 [5:59:22<20:29:18, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 23%|██▎ | 2823/12384 [5:59:22<20:24:08, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 23%|██▎ | 2823/12384 [5:59:29<20:24:08, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 23%|██▎ | 2824/12384 [5:59:29<20:20:02, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 23%|██▎ | 2824/12384 [5:59:37<20:20:02, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 23%|██▎ | 2825/12384 [5:59:37<20:17:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 23%|██▎ | 2825/12384 [5:59:45<20:17:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 2: 23%|██▎ | 2826/12384 [5:59:45<20:15:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 2: 23%|██▎ | 2826/12384 [5:59:52<20:15:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 2: 23%|██▎ | 2827/12384 [5:59:52<20:15:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 2: 23%|██▎ | 2827/12384 [6:00:00<20:15:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 2: 23%|██▎ | 2828/12384 [6:00:00<20:14:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 2: 23%|██▎ | 2828/12384 [6:00:07<20:14:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 23%|██▎ | 2829/12384 [6:00:07<20:14:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 23%|██▎ | 2829/12384 [6:00:15<20:14:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 23%|██▎ | 2830/12384 [6:00:15<20:13:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 23%|██▎ | 2830/12384 [6:00:23<20:13:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 23%|██▎ | 2831/12384 [6:00:23<20:12:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 23%|██▎ | 2831/12384 [6:00:30<20:12:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 23%|██▎ | 2832/12384 [6:00:30<20:12:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 23%|██▎ | 2832/12384 [6:00:38<20:12:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 23%|██▎ | 2833/12384 [6:00:38<20:12:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 23%|██▎ | 2833/12384 [6:00:45<20:12:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 2: 23%|██▎ | 2834/12384 [6:00:45<20:11:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 2: 23%|██▎ | 2834/12384 [6:00:53<20:11:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 2: 23%|██▎ | 2835/12384 [6:00:53<20:14:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 2: 23%|██▎ | 2835/12384 [6:01:01<20:14:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 23%|██▎ | 2836/12384 [6:01:01<20:13:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 23%|██▎ | 2836/12384 [6:01:08<20:13:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 23%|██▎ | 2837/12384 [6:01:08<20:13:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 23%|██▎ | 2837/12384 [6:01:16<20:13:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 23%|██▎ | 2838/12384 [6:01:16<20:13:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 23%|██▎ | 2838/12384 [6:01:24<20:13:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 23%|██▎ | 2839/12384 [6:01:24<20:13:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 23%|██▎ | 2839/12384 [6:01:31<20:13:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 23%|██▎ | 2840/12384 [6:01:31<20:13:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 23%|██▎ | 2840/12384 [6:01:39<20:13:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 23%|██▎ | 2841/12384 [6:01:39<20:28:04, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 23%|██▎ | 2841/12384 [6:01:47<20:28:04, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 23%|██▎ | 2842/12384 [6:01:47<20:22:48, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 23%|██▎ | 2842/12384 [6:01:54<20:22:48, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=6.76s]
Epoch 2: 23%|██▎ | 2843/12384 [6:01:54<20:19:17, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=6.76s]
Epoch 2: 23%|██▎ | 2843/12384 [6:02:02<20:19:17, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 2: 23%|██▎ | 2844/12384 [6:02:02<20:16:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 2: 23%|██▎ | 2844/12384 [6:02:10<20:16:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 23%|██▎ | 2845/12384 [6:02:10<20:15:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 23%|██▎ | 2845/12384 [6:02:17<20:15:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 23%|██▎ | 2846/12384 [6:02:17<20:12:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 23%|██▎ | 2846/12384 [6:02:25<20:12:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 2: 23%|██▎ | 2847/12384 [6:02:25<20:11:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 2: 23%|██▎ | 2847/12384 [6:02:33<20:11:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 2: 23%|██▎ | 2848/12384 [6:02:33<20:24:18, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 2: 23%|██▎ | 2848/12384 [6:02:40<20:24:18, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.26s]
Epoch 2: 23%|██▎ | 2849/12384 [6:02:40<20:18:52, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.26s]
Epoch 2: 23%|██▎ | 2849/12384 [6:02:48<20:18:52, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 2: 23%|██▎ | 2850/12384 [6:02:48<20:16:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 2: 23%|██▎ | 2850/12384 [6:02:56<20:16:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 2: 23%|██▎ | 2851/12384 [6:02:56<20:13:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 2: 23%|██▎ | 2851/12384 [6:03:03<20:13:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 23%|██▎ | 2852/12384 [6:03:03<20:11:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 23%|██▎ | 2852/12384 [6:03:11<20:11:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 23%|██▎ | 2853/12384 [6:03:11<20:10:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 23%|██▎ | 2853/12384 [6:03:18<20:10:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 23%|██▎ | 2854/12384 [6:03:18<20:10:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 23%|██▎ | 2854/12384 [6:03:26<20:10:11, 7.62s/it, loss=0.0009, acc=0.9978, iter_time=7.60s]
Epoch 2: 23%|██▎ | 2855/12384 [6:03:26<20:09:20, 7.61s/it, loss=0.0009, acc=0.9978, iter_time=7.60s]
Epoch 2: 23%|██▎ | 2855/12384 [6:03:34<20:09:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 23%|██▎ | 2856/12384 [6:03:34<20:08:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 23%|██▎ | 2856/12384 [6:03:41<20:08:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 23%|██▎ | 2857/12384 [6:03:41<20:12:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 23%|██▎ | 2857/12384 [6:03:49<20:12:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 2: 23%|██▎ | 2858/12384 [6:03:49<20:11:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 2: 23%|██▎ | 2858/12384 [6:03:57<20:11:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 2: 23%|██▎ | 2859/12384 [6:03:57<20:13:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 2: 23%|██▎ | 2859/12384 [6:04:04<20:13:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 2: 23%|██▎ | 2860/12384 [6:04:04<20:12:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 2: 23%|██▎ | 2860/12384 [6:04:12<20:12:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 2: 23%|██▎ | 2861/12384 [6:04:12<20:10:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 2: 23%|██▎ | 2861/12384 [6:04:19<20:10:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 2: 23%|██▎ | 2862/12384 [6:04:19<20:08:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 2: 23%|██▎ | 2862/12384 [6:04:27<20:08:45, 7.62s/it, loss=0.0018, acc=0.9973, iter_time=4.80s]
Epoch 2: 23%|██▎ | 2863/12384 [6:04:27<20:08:03, 7.61s/it, loss=0.0018, acc=0.9973, iter_time=4.80s]
Epoch 2: 23%|██▎ | 2863/12384 [6:04:35<20:08:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.79s]
Epoch 2: 23%|██▎ | 2864/12384 [6:04:35<20:07:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.79s]
Epoch 2: 23%|██▎ | 2864/12384 [6:04:42<20:07:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.26s]
Epoch 2: 23%|██▎ | 2865/12384 [6:04:42<20:05:42, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.26s]
Epoch 2: 23%|██▎ | 2865/12384 [6:04:50<20:05:42, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 23%|██▎ | 2866/12384 [6:04:50<20:05:43, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 23%|██▎ | 2866/12384 [6:04:58<20:05:43, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 2: 23%|██▎ | 2867/12384 [6:04:58<20:20:52, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 2: 23%|██▎ | 2867/12384 [6:05:05<20:20:52, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 23%|██▎ | 2868/12384 [6:05:05<20:15:45, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 23%|██▎ | 2868/12384 [6:05:13<20:15:45, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=3.85s]
Epoch 2: 23%|██▎ | 2869/12384 [6:05:13<20:12:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=3.85s]
Epoch 2: 23%|██▎ | 2869/12384 [6:05:21<20:12:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 2: 23%|██▎ | 2870/12384 [6:05:21<20:10:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 2: 23%|██▎ | 2870/12384 [6:05:28<20:10:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 2: 23%|██▎ | 2871/12384 [6:05:28<20:10:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 2: 23%|██▎ | 2871/12384 [6:05:36<20:10:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.67s]
Epoch 2: 23%|██▎ | 2872/12384 [6:05:36<20:09:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.67s]
Epoch 2: 23%|██▎ | 2872/12384 [6:05:43<20:09:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 23%|██▎ | 2873/12384 [6:05:43<20:12:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 23%|██▎ | 2873/12384 [6:05:51<20:12:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 23%|██▎ | 2874/12384 [6:05:51<20:24:02, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 23%|██▎ | 2874/12384 [6:05:59<20:24:02, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 2: 23%|██▎ | 2875/12384 [6:05:59<20:17:29, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 2: 23%|██▎ | 2875/12384 [6:06:07<20:17:29, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=8.88s]
Epoch 2: 23%|██▎ | 2876/12384 [6:06:07<20:13:14, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=8.88s]
Epoch 2: 23%|██▎ | 2876/12384 [6:06:14<20:13:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 2: 23%|██▎ | 2877/12384 [6:06:14<20:09:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 2: 23%|██▎ | 2877/12384 [6:06:22<20:09:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 23%|██▎ | 2878/12384 [6:06:22<20:11:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 23%|██▎ | 2878/12384 [6:06:29<20:11:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 23%|██▎ | 2879/12384 [6:06:29<20:11:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 23%|██▎ | 2879/12384 [6:06:37<20:11:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 23%|██▎ | 2880/12384 [6:06:37<20:09:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 23%|██▎ | 2880/12384 [6:06:45<20:09:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.55s]
Epoch 2: 23%|██▎ | 2881/12384 [6:06:45<20:10:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.55s]
Epoch 2: 23%|██▎ | 2881/12384 [6:06:52<20:10:04, 7.64s/it, loss=0.0003, acc=0.9998, iter_time=9.18s]
Epoch 2: 23%|██▎ | 2882/12384 [6:06:52<20:08:50, 7.63s/it, loss=0.0003, acc=0.9998, iter_time=9.18s]
Epoch 2: 23%|██▎ | 2882/12384 [6:07:00<20:08:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 23%|██▎ | 2883/12384 [6:07:00<20:10:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 23%|██▎ | 2883/12384 [6:07:08<20:10:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 23%|██▎ | 2884/12384 [6:07:08<20:11:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 23%|██▎ | 2884/12384 [6:07:15<20:11:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 2: 23%|██▎ | 2885/12384 [6:07:15<20:10:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 2: 23%|██▎ | 2885/12384 [6:07:23<20:10:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.87s]
Epoch 2: 23%|██▎ | 2886/12384 [6:07:23<20:08:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.87s]
Epoch 2: 23%|██▎ | 2886/12384 [6:07:31<20:08:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 23%|██▎ | 2887/12384 [6:07:31<20:07:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 23%|██▎ | 2887/12384 [6:07:38<20:07:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 23%|██▎ | 2888/12384 [6:07:38<20:06:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 23%|██▎ | 2888/12384 [6:07:46<20:06:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 23%|██▎ | 2889/12384 [6:07:46<20:05:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 23%|██▎ | 2889/12384 [6:07:53<20:05:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 23%|██▎ | 2890/12384 [6:07:53<20:05:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 23%|██▎ | 2890/12384 [6:08:01<20:05:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 23%|██▎ | 2891/12384 [6:08:01<20:03:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 23%|██▎ | 2891/12384 [6:08:09<20:03:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 23%|██▎ | 2892/12384 [6:08:09<20:03:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 23%|██▎ | 2892/12384 [6:08:17<20:03:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 23%|██▎ | 2893/12384 [6:08:17<20:20:15, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 23%|██▎ | 2893/12384 [6:08:24<20:20:15, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 23%|██▎ | 2894/12384 [6:08:24<20:15:12, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 23%|██▎ | 2894/12384 [6:08:32<20:15:12, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 23%|██▎ | 2895/12384 [6:08:32<20:11:17, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 23%|██▎ | 2895/12384 [6:08:39<20:11:17, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 2: 23%|██▎ | 2896/12384 [6:08:39<20:08:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 2: 23%|██▎ | 2896/12384 [6:08:47<20:08:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 23%|██▎ | 2897/12384 [6:08:47<20:06:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 23%|██▎ | 2897/12384 [6:08:55<20:06:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 2: 23%|██▎ | 2898/12384 [6:08:55<20:04:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 2: 23%|██▎ | 2898/12384 [6:09:02<20:04:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 2: 23%|██▎ | 2899/12384 [6:09:02<20:03:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 2: 23%|██▎ | 2899/12384 [6:09:10<20:03:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 2: 23%|██▎ | 2900/12384 [6:09:10<20:03:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 2: 23%|██▎ | 2900/12384 [6:09:17<20:03:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 2: 23%|██▎ | 2901/12384 [6:09:17<20:03:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 2: 23%|██▎ | 2901/12384 [6:09:25<20:03:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 2: 23%|██▎ | 2902/12384 [6:09:25<20:03:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 2: 23%|██▎ | 2902/12384 [6:09:33<20:03:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 2: 23%|██▎ | 2903/12384 [6:09:33<20:03:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 2: 23%|██▎ | 2903/12384 [6:09:40<20:03:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 23%|██▎ | 2904/12384 [6:09:40<20:02:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 23%|██▎ | 2904/12384 [6:09:48<20:02:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 2: 23%|██▎ | 2905/12384 [6:09:48<20:01:24, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 2: 23%|██▎ | 2905/12384 [6:09:55<20:01:24, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 2: 23%|██▎ | 2906/12384 [6:09:55<20:02:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 2: 23%|██▎ | 2906/12384 [6:10:03<20:02:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.25s]
Epoch 2: 23%|██▎ | 2907/12384 [6:10:03<20:01:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.25s]
Epoch 2: 23%|██▎ | 2907/12384 [6:10:11<20:01:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 23%|██▎ | 2908/12384 [6:10:11<20:01:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 23%|██▎ | 2908/12384 [6:10:18<20:01:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 2: 23%|██▎ | 2909/12384 [6:10:18<20:00:40, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 2: 23%|██▎ | 2909/12384 [6:10:26<20:00:40, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 2: 23%|██▎ | 2910/12384 [6:10:26<20:00:07, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 2: 23%|██▎ | 2910/12384 [6:10:33<20:00:07, 7.60s/it, loss=0.0001, acc=0.9990, iter_time=7.62s]
Epoch 2: 24%|██▎ | 2911/12384 [6:10:33<20:00:13, 7.60s/it, loss=0.0001, acc=0.9990, iter_time=7.62s]
Epoch 2: 24%|██▎ | 2911/12384 [6:10:41<20:00:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 24%|██▎ | 2912/12384 [6:10:41<20:01:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 24%|██▎ | 2912/12384 [6:10:49<20:01:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 2: 24%|██▎ | 2913/12384 [6:10:49<20:04:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 2: 24%|██▎ | 2913/12384 [6:10:56<20:04:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 24%|██▎ | 2914/12384 [6:10:56<20:03:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 24%|██▎ | 2914/12384 [6:11:04<20:03:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 24%|██▎ | 2915/12384 [6:11:04<20:06:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 24%|██▎ | 2915/12384 [6:11:12<20:06:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 2: 24%|██▎ | 2916/12384 [6:11:12<20:04:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 2: 24%|██▎ | 2916/12384 [6:11:19<20:04:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 2: 24%|██▎ | 2917/12384 [6:11:19<20:03:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 2: 24%|██▎ | 2917/12384 [6:11:27<20:03:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 24%|██▎ | 2918/12384 [6:11:27<20:01:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 24%|██▎ | 2918/12384 [6:11:34<20:01:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 2: 24%|██▎ | 2919/12384 [6:11:34<20:02:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 2: 24%|██▎ | 2919/12384 [6:11:42<20:02:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.39s]
Epoch 2: 24%|██▎ | 2920/12384 [6:11:42<20:17:21, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.39s]
Epoch 2: 24%|██▎ | 2920/12384 [6:11:50<20:17:21, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 2: 24%|██▎ | 2921/12384 [6:11:50<20:13:19, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 2: 24%|██▎ | 2921/12384 [6:11:58<20:13:19, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=4.10s]
Epoch 2: 24%|██▎ | 2922/12384 [6:11:58<20:09:09, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=4.10s]
Epoch 2: 24%|██▎ | 2922/12384 [6:12:05<20:09:09, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 2: 24%|██▎ | 2923/12384 [6:12:05<20:08:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 2: 24%|██▎ | 2923/12384 [6:12:13<20:08:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.55s]
Epoch 2: 24%|██▎ | 2924/12384 [6:12:13<20:05:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.55s]
Epoch 2: 24%|██▎ | 2924/12384 [6:12:21<20:05:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 2: 24%|██▎ | 2925/12384 [6:12:21<20:03:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 2: 24%|██▎ | 2925/12384 [6:12:28<20:03:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.95s]
Epoch 2: 24%|██▎ | 2926/12384 [6:12:28<20:14:40, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.95s]
Epoch 2: 24%|██▎ | 2926/12384 [6:12:36<20:14:40, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 24%|██▎ | 2927/12384 [6:12:36<20:09:40, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 24%|██▎ | 2927/12384 [6:12:44<20:09:40, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 24%|██▎ | 2928/12384 [6:12:44<20:06:41, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 24%|██▎ | 2928/12384 [6:12:51<20:06:41, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 2: 24%|██▎ | 2929/12384 [6:12:51<20:04:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 2: 24%|██▎ | 2929/12384 [6:12:59<20:04:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 2: 24%|██▎ | 2930/12384 [6:12:59<20:04:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 2: 24%|██▎ | 2930/12384 [6:13:06<20:04:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.97s]
Epoch 2: 24%|██▎ | 2931/12384 [6:13:06<20:03:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.97s]
Epoch 2: 24%|██▎ | 2931/12384 [6:13:14<20:03:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.90s]
Epoch 2: 24%|██▎ | 2932/12384 [6:13:14<20:01:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.90s]
Epoch 2: 24%|██▎ | 2932/12384 [6:13:22<20:01:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.91s]
Epoch 2: 24%|██▎ | 2933/12384 [6:13:22<19:58:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.91s]
Epoch 2: 24%|██▎ | 2933/12384 [6:13:29<19:58:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 24%|██▎ | 2934/12384 [6:13:29<19:58:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 24%|██▎ | 2934/12384 [6:13:37<19:58:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 2: 24%|██▎ | 2935/12384 [6:13:37<19:59:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 2: 24%|██▎ | 2935/12384 [6:13:45<19:59:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 24%|██▎ | 2936/12384 [6:13:45<19:59:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 24%|██▎ | 2936/12384 [6:13:52<19:59:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 2: 24%|██▎ | 2937/12384 [6:13:52<19:59:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 2: 24%|██▎ | 2937/12384 [6:14:00<19:59:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 24%|██▎ | 2938/12384 [6:14:00<19:58:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 24%|██▎ | 2938/12384 [6:14:07<19:58:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 24%|██▎ | 2939/12384 [6:14:07<19:58:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 24%|██▎ | 2939/12384 [6:14:15<19:58:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 2: 24%|██▎ | 2940/12384 [6:14:15<19:58:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 2: 24%|██▎ | 2940/12384 [6:14:23<19:58:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 2: 24%|██▎ | 2941/12384 [6:14:23<19:58:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 2: 24%|██▎ | 2941/12384 [6:14:30<19:58:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.98s]
Epoch 2: 24%|██▍ | 2942/12384 [6:14:30<19:56:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.98s]
Epoch 2: 24%|██▍ | 2942/12384 [6:14:38<19:56:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 2: 24%|██▍ | 2943/12384 [6:14:38<19:56:16, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 2: 24%|██▍ | 2943/12384 [6:14:45<19:56:16, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 24%|██▍ | 2944/12384 [6:14:45<19:56:24, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 24%|██▍ | 2944/12384 [6:14:53<19:56:24, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 24%|██▍ | 2945/12384 [6:14:53<19:57:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 24%|██▍ | 2945/12384 [6:15:01<19:57:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.37s]
Epoch 2: 24%|██▍ | 2946/12384 [6:15:01<20:14:00, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.37s]
Epoch 2: 24%|██▍ | 2946/12384 [6:15:09<20:14:00, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 2: 24%|██▍ | 2947/12384 [6:15:09<20:09:55, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 2: 24%|██▍ | 2947/12384 [6:15:16<20:09:55, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 24%|██▍ | 2948/12384 [6:15:16<20:06:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 24%|██▍ | 2948/12384 [6:15:24<20:06:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 2: 24%|██▍ | 2949/12384 [6:15:24<20:03:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 2: 24%|██▍ | 2949/12384 [6:15:32<20:03:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.25s]
Epoch 2: 24%|██▍ | 2950/12384 [6:15:32<20:05:25, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.25s]
Epoch 2: 24%|██▍ | 2950/12384 [6:15:39<20:05:25, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.28s]
Epoch 2: 24%|██▍ | 2951/12384 [6:15:39<20:02:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.28s]
Epoch 2: 24%|██▍ | 2951/12384 [6:15:47<20:02:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 24%|██▍ | 2952/12384 [6:15:47<20:00:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 24%|██▍ | 2952/12384 [6:15:55<20:00:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 24%|██▍ | 2953/12384 [6:15:55<20:11:36, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 24%|██▍ | 2953/12384 [6:16:02<20:11:36, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 2: 24%|██▍ | 2954/12384 [6:16:02<20:06:51, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 2: 24%|██▍ | 2954/12384 [6:16:10<20:06:51, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 24%|██▍ | 2955/12384 [6:16:10<20:02:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 24%|██▍ | 2955/12384 [6:16:17<20:02:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.01s]
Epoch 2: 24%|██▍ | 2956/12384 [6:16:17<20:00:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.01s]
Epoch 2: 24%|██▍ | 2956/12384 [6:16:25<20:00:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 2: 24%|██▍ | 2957/12384 [6:16:25<20:03:47, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 2: 24%|██▍ | 2957/12384 [6:16:33<20:03:47, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.24s]
Epoch 2: 24%|██▍ | 2958/12384 [6:16:33<20:01:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.24s]
Epoch 2: 24%|██▍ | 2958/12384 [6:16:40<20:01:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 24%|██▍ | 2959/12384 [6:16:40<19:58:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 24%|██▍ | 2959/12384 [6:16:48<19:58:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 24%|██▍ | 2960/12384 [6:16:48<19:57:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 24%|██▍ | 2960/12384 [6:16:56<19:57:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.42s]
Epoch 2: 24%|██▍ | 2961/12384 [6:16:56<19:55:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.42s]
Epoch 2: 24%|██▍ | 2961/12384 [6:17:03<19:55:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 2: 24%|██▍ | 2962/12384 [6:17:03<19:54:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 2: 24%|██▍ | 2962/12384 [6:17:11<19:54:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 24%|██▍ | 2963/12384 [6:17:11<19:56:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 24%|██▍ | 2963/12384 [6:17:18<19:56:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 24%|██▍ | 2964/12384 [6:17:18<19:56:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 24%|██▍ | 2964/12384 [6:17:26<19:56:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 24%|██▍ | 2965/12384 [6:17:26<19:55:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 24%|██▍ | 2965/12384 [6:17:34<19:55:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 2: 24%|██▍ | 2966/12384 [6:17:34<19:54:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 2: 24%|██▍ | 2966/12384 [6:17:41<19:54:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.62s]
Epoch 2: 24%|██▍ | 2967/12384 [6:17:41<19:54:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.62s]
Epoch 2: 24%|██▍ | 2967/12384 [6:17:49<19:54:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 24%|██▍ | 2968/12384 [6:17:49<19:53:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 24%|██▍ | 2968/12384 [6:17:56<19:53:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 24%|██▍ | 2969/12384 [6:17:56<19:54:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 24%|██▍ | 2969/12384 [6:18:04<19:54:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 2: 24%|██▍ | 2970/12384 [6:18:04<19:54:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 2: 24%|██▍ | 2970/12384 [6:18:12<19:54:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.39s]
Epoch 2: 24%|██▍ | 2971/12384 [6:18:12<19:54:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.39s]
Epoch 2: 24%|██▍ | 2971/12384 [6:18:19<19:54:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 2: 24%|██▍ | 2972/12384 [6:18:19<19:53:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 2: 24%|██▍ | 2972/12384 [6:18:27<19:53:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 24%|██▍ | 2973/12384 [6:18:27<20:08:47, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 24%|██▍ | 2973/12384 [6:18:35<20:08:47, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 2: 24%|██▍ | 2974/12384 [6:18:35<20:04:39, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 2: 24%|██▍ | 2974/12384 [6:18:42<20:04:39, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.77s]
Epoch 2: 24%|██▍ | 2975/12384 [6:18:42<20:01:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.77s]
Epoch 2: 24%|██▍ | 2975/12384 [6:18:50<20:01:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 24%|██▍ | 2976/12384 [6:18:50<19:59:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 24%|██▍ | 2976/12384 [6:18:58<19:59:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 24%|██▍ | 2977/12384 [6:18:58<20:00:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 24%|██▍ | 2977/12384 [6:19:05<20:00:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 24%|██▍ | 2978/12384 [6:19:05<19:58:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 24%|██▍ | 2978/12384 [6:19:13<19:58:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 24%|██▍ | 2979/12384 [6:19:13<20:09:17, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 24%|██▍ | 2979/12384 [6:19:21<20:09:17, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 24%|██▍ | 2980/12384 [6:19:21<20:03:24, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 24%|██▍ | 2980/12384 [6:19:28<20:03:24, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 2: 24%|██▍ | 2981/12384 [6:19:28<20:01:38, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 2: 24%|██▍ | 2981/12384 [6:19:36<20:01:38, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 24%|██▍ | 2982/12384 [6:19:36<19:58:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 24%|██▍ | 2982/12384 [6:19:44<19:58:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.35s]
Epoch 2: 24%|██▍ | 2983/12384 [6:19:44<19:56:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.35s]
Epoch 2: 24%|██▍ | 2983/12384 [6:19:51<19:56:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.85s]
Epoch 2: 24%|██▍ | 2984/12384 [6:19:51<19:55:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.85s]
Epoch 2: 24%|██▍ | 2984/12384 [6:19:59<19:55:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 24%|██▍ | 2985/12384 [6:19:59<19:54:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 24%|██▍ | 2985/12384 [6:20:07<19:54:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 24%|██▍ | 2986/12384 [6:20:07<19:53:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 24%|██▍ | 2986/12384 [6:20:14<19:53:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 2: 24%|██▍ | 2987/12384 [6:20:14<19:53:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 2: 24%|██▍ | 2987/12384 [6:20:22<19:53:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 2: 24%|██▍ | 2988/12384 [6:20:22<19:52:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 2: 24%|██▍ | 2988/12384 [6:20:29<19:52:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 2: 24%|██▍ | 2989/12384 [6:20:29<19:50:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 2: 24%|██▍ | 2989/12384 [6:20:37<19:50:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 24%|██▍ | 2990/12384 [6:20:37<19:56:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 24%|██▍ | 2990/12384 [6:20:45<19:56:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.86s]
Epoch 2: 24%|██▍ | 2991/12384 [6:20:45<19:55:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.86s]
Epoch 2: 24%|██▍ | 2991/12384 [6:20:52<19:55:11, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=10.85s]
Epoch 2: 24%|██▍ | 2992/12384 [6:20:52<19:54:11, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=10.85s]
Epoch 2: 24%|██▍ | 2992/12384 [6:21:00<19:54:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 24%|██▍ | 2993/12384 [6:21:00<19:53:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 24%|██▍ | 2993/12384 [6:21:07<19:53:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 24%|██▍ | 2994/12384 [6:21:07<19:51:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 24%|██▍ | 2994/12384 [6:21:15<19:51:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 2: 24%|██▍ | 2995/12384 [6:21:15<19:54:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 2: 24%|██▍ | 2995/12384 [6:21:23<19:54:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 2: 24%|██▍ | 2996/12384 [6:21:23<19:53:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 2: 24%|██▍ | 2996/12384 [6:21:30<19:53:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 24%|██▍ | 2997/12384 [6:21:30<19:53:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 24%|██▍ | 2997/12384 [6:21:38<19:53:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 2: 24%|██▍ | 2998/12384 [6:21:38<19:54:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 2: 24%|██▍ | 2998/12384 [6:21:46<19:54:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.49s]
Epoch 2: 24%|██▍ | 2999/12384 [6:21:46<20:09:14, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=10.49s]
Epoch 2: 24%|██▍ | 2999/12384 [6:21:54<20:09:14, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 24%|██▍ | 3000/12384 [6:21:54<20:03:37, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 24%|██▍ | 3000/12384 [6:22:01<20:03:37, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 24%|██▍ | 3001/12384 [6:22:01<20:00:01, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 24%|██▍ | 3001/12384 [6:22:09<20:00:01, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 24%|██▍ | 3002/12384 [6:22:09<19:57:06, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 24%|██▍ | 3002/12384 [6:22:16<19:57:06, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 2: 24%|██▍ | 3003/12384 [6:22:16<19:55:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 2: 24%|██▍ | 3003/12384 [6:22:24<19:55:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 2: 24%|██▍ | 3004/12384 [6:22:24<19:52:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 2: 24%|██▍ | 3004/12384 [6:22:32<19:52:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 2: 24%|██▍ | 3005/12384 [6:22:32<20:03:09, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 2: 24%|██▍ | 3005/12384 [6:22:40<20:03:09, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 2: 24%|██▍ | 3006/12384 [6:22:40<19:57:31, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 2: 24%|██▍ | 3006/12384 [6:22:47<19:57:31, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.12s]
Epoch 2: 24%|██▍ | 3007/12384 [6:22:47<19:54:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.12s]
Epoch 2: 24%|██▍ | 3007/12384 [6:22:55<19:54:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 24%|██▍ | 3008/12384 [6:22:55<19:54:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 24%|██▍ | 3008/12384 [6:23:02<19:54:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 24%|██▍ | 3009/12384 [6:23:02<19:51:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 24%|██▍ | 3009/12384 [6:23:10<19:51:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 24%|██▍ | 3010/12384 [6:23:10<19:51:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 24%|██▍ | 3010/12384 [6:23:18<19:51:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 2: 24%|██▍ | 3011/12384 [6:23:18<19:50:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 2: 24%|██▍ | 3011/12384 [6:23:25<19:50:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 2: 24%|██▍ | 3012/12384 [6:23:25<19:48:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 2: 24%|██▍ | 3012/12384 [6:23:33<19:48:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 24%|██▍ | 3013/12384 [6:23:33<19:47:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 24%|██▍ | 3013/12384 [6:23:40<19:47:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 24%|██▍ | 3014/12384 [6:23:40<19:48:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 24%|██▍ | 3014/12384 [6:23:48<19:48:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.03s]
Epoch 2: 24%|██▍ | 3015/12384 [6:23:48<19:48:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.03s]
Epoch 2: 24%|██▍ | 3015/12384 [6:23:56<19:48:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.57s]
Epoch 2: 24%|██▍ | 3016/12384 [6:23:56<19:47:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.57s]
Epoch 2: 24%|██▍ | 3016/12384 [6:24:03<19:47:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 24%|██▍ | 3017/12384 [6:24:03<19:48:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 24%|██▍ | 3017/12384 [6:24:11<19:48:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 24%|██▍ | 3018/12384 [6:24:11<19:46:35, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 24%|██▍ | 3018/12384 [6:24:18<19:46:35, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 24%|██▍ | 3019/12384 [6:24:18<19:46:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 24%|██▍ | 3019/12384 [6:24:26<19:46:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 24%|██▍ | 3020/12384 [6:24:26<19:48:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 24%|██▍ | 3020/12384 [6:24:34<19:48:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 24%|██▍ | 3021/12384 [6:24:34<19:49:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 24%|██▍ | 3021/12384 [6:24:41<19:49:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 2: 24%|██▍ | 3022/12384 [6:24:41<19:47:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 2: 24%|██▍ | 3022/12384 [6:24:49<19:47:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 24%|██▍ | 3023/12384 [6:24:49<19:48:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 24%|██▍ | 3023/12384 [6:24:57<19:48:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 24%|██▍ | 3024/12384 [6:24:57<19:48:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 24%|██▍ | 3024/12384 [6:25:04<19:48:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 2: 24%|██▍ | 3025/12384 [6:25:04<20:03:40, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 2: 24%|██▍ | 3025/12384 [6:25:12<20:03:40, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.50s]
Epoch 2: 24%|██▍ | 3026/12384 [6:25:12<19:59:24, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.50s]
Epoch 2: 24%|██▍ | 3026/12384 [6:25:20<19:59:24, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 2: 24%|██▍ | 3027/12384 [6:25:20<19:55:58, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 2: 24%|██▍ | 3027/12384 [6:25:27<19:55:58, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 24%|██▍ | 3028/12384 [6:25:27<19:53:41, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 24%|██▍ | 3028/12384 [6:25:35<19:53:41, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=3.89s]
Epoch 2: 24%|██▍ | 3029/12384 [6:25:35<19:52:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=3.89s]
Epoch 2: 24%|██▍ | 3029/12384 [6:25:43<19:52:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.37s]
Epoch 2: 24%|██▍ | 3030/12384 [6:25:43<19:51:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.37s]
Epoch 2: 24%|██▍ | 3030/12384 [6:25:50<19:51:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.63s]
Epoch 2: 24%|██▍ | 3031/12384 [6:25:50<19:52:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.63s]
Epoch 2: 24%|██▍ | 3031/12384 [6:25:58<19:52:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.07s]
Epoch 2: 24%|██▍ | 3032/12384 [6:25:58<19:50:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.07s]
Epoch 2: 24%|██▍ | 3032/12384 [6:26:05<19:50:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 24%|██▍ | 3033/12384 [6:26:05<19:49:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 24%|██▍ | 3033/12384 [6:26:13<19:49:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 24%|██▍ | 3034/12384 [6:26:13<19:48:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 24%|██▍ | 3034/12384 [6:26:21<19:48:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 2: 25%|██▍ | 3035/12384 [6:26:21<19:48:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 2: 25%|██▍ | 3035/12384 [6:26:28<19:48:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 2: 25%|██▍ | 3036/12384 [6:26:28<19:47:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 2: 25%|██▍ | 3036/12384 [6:26:36<19:47:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 25%|██▍ | 3037/12384 [6:26:36<19:46:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 25%|██▍ | 3037/12384 [6:26:44<19:46:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 25%|██▍ | 3038/12384 [6:26:44<19:46:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 25%|██▍ | 3038/12384 [6:26:51<19:46:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 2: 25%|██▍ | 3039/12384 [6:26:51<19:45:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 2: 25%|██▍ | 3039/12384 [6:26:59<19:45:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 25%|██▍ | 3040/12384 [6:26:59<19:45:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 25%|██▍ | 3040/12384 [6:27:06<19:45:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 25%|██▍ | 3041/12384 [6:27:06<19:45:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 25%|██▍ | 3041/12384 [6:27:14<19:45:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.52s]
Epoch 2: 25%|██▍ | 3042/12384 [6:27:14<19:45:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.52s]
Epoch 2: 25%|██▍ | 3042/12384 [6:27:22<19:45:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 2: 25%|██▍ | 3043/12384 [6:27:22<19:44:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 2: 25%|██▍ | 3043/12384 [6:27:29<19:44:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 2: 25%|██▍ | 3044/12384 [6:27:29<19:42:16, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 2: 25%|██▍ | 3044/12384 [6:27:37<19:42:16, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=9.55s]
Epoch 2: 25%|██▍ | 3045/12384 [6:27:37<19:42:06, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=9.55s]
Epoch 2: 25%|██▍ | 3045/12384 [6:27:44<19:42:06, 7.59s/it, loss=0.0005, acc=0.9995, iter_time=7.61s]
Epoch 2: 25%|██▍ | 3046/12384 [6:27:44<19:42:45, 7.60s/it, loss=0.0005, acc=0.9995, iter_time=7.61s]
Epoch 2: 25%|██▍ | 3046/12384 [6:27:52<19:42:45, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 2: 25%|██▍ | 3047/12384 [6:27:52<19:44:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 2: 25%|██▍ | 3047/12384 [6:28:00<19:44:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 2: 25%|██▍ | 3048/12384 [6:28:00<19:47:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 2: 25%|██▍ | 3048/12384 [6:28:07<19:47:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 25%|██▍ | 3049/12384 [6:28:07<19:46:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 25%|██▍ | 3049/12384 [6:28:15<19:46:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 25%|██▍ | 3050/12384 [6:28:15<19:46:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 25%|██▍ | 3050/12384 [6:28:23<19:46:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 25%|██▍ | 3051/12384 [6:28:23<20:00:16, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 25%|██▍ | 3051/12384 [6:28:30<20:00:16, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 2: 25%|██▍ | 3052/12384 [6:28:30<19:54:42, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 2: 25%|██▍ | 3052/12384 [6:28:38<19:54:42, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 25%|██▍ | 3053/12384 [6:28:38<19:52:21, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 25%|██▍ | 3053/12384 [6:28:46<19:52:21, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.13s]
Epoch 2: 25%|██▍ | 3054/12384 [6:28:46<19:50:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.13s]
Epoch 2: 25%|██▍ | 3054/12384 [6:28:53<19:50:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.96s]
Epoch 2: 25%|██▍ | 3055/12384 [6:28:53<19:47:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.96s]
Epoch 2: 25%|██▍ | 3055/12384 [6:29:01<19:47:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 25%|██▍ | 3056/12384 [6:29:01<19:46:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 25%|██▍ | 3056/12384 [6:29:09<19:46:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.48s]
Epoch 2: 25%|██▍ | 3057/12384 [6:29:09<19:57:06, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.48s]
Epoch 2: 25%|██▍ | 3057/12384 [6:29:16<19:57:06, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 25%|██▍ | 3058/12384 [6:29:16<19:53:47, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 25%|██▍ | 3058/12384 [6:29:24<19:53:47, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 2: 25%|██▍ | 3059/12384 [6:29:24<19:51:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 2: 25%|██▍ | 3059/12384 [6:29:32<19:51:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 2: 25%|██▍ | 3060/12384 [6:29:32<19:48:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 2: 25%|██▍ | 3060/12384 [6:29:39<19:48:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 2: 25%|██▍ | 3061/12384 [6:29:39<19:46:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 2: 25%|██▍ | 3061/12384 [6:29:47<19:46:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.33s]
Epoch 2: 25%|██▍ | 3062/12384 [6:29:47<19:46:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.33s]
Epoch 2: 25%|██▍ | 3062/12384 [6:29:55<19:46:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.35s]
Epoch 2: 25%|██▍ | 3063/12384 [6:29:55<19:45:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.35s]
Epoch 2: 25%|██▍ | 3063/12384 [6:30:02<19:45:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.85s]
Epoch 2: 25%|██▍ | 3064/12384 [6:30:02<19:44:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.85s]
Epoch 2: 25%|██▍ | 3064/12384 [6:30:10<19:44:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 25%|██▍ | 3065/12384 [6:30:10<19:44:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 25%|██▍ | 3065/12384 [6:30:17<19:44:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 25%|██▍ | 3066/12384 [6:30:17<19:43:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 25%|██▍ | 3066/12384 [6:30:25<19:43:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 25%|██▍ | 3067/12384 [6:30:25<19:43:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 25%|██▍ | 3067/12384 [6:30:33<19:43:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 2: 25%|██▍ | 3068/12384 [6:30:33<19:41:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 2: 25%|██▍ | 3068/12384 [6:30:40<19:41:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 2: 25%|██▍ | 3069/12384 [6:30:40<19:40:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 2: 25%|██▍ | 3069/12384 [6:30:48<19:40:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 25%|██▍ | 3070/12384 [6:30:48<19:40:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 25%|██▍ | 3070/12384 [6:30:55<19:40:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 25%|██▍ | 3071/12384 [6:30:55<19:40:04, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 25%|██▍ | 3071/12384 [6:31:03<19:40:04, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 25%|██▍ | 3072/12384 [6:31:03<19:39:54, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 25%|██▍ | 3072/12384 [6:31:11<19:39:54, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.88s]
Epoch 2: 25%|██▍ | 3073/12384 [6:31:11<19:42:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.88s]
Epoch 2: 25%|██▍ | 3073/12384 [6:31:18<19:42:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.99s]
Epoch 2: 25%|██▍ | 3074/12384 [6:31:18<19:41:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.99s]
Epoch 2: 25%|██▍ | 3074/12384 [6:31:26<19:41:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 25%|██▍ | 3075/12384 [6:31:26<19:41:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 25%|██▍ | 3075/12384 [6:31:33<19:41:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 25%|██▍ | 3076/12384 [6:31:33<19:42:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 25%|██▍ | 3076/12384 [6:31:41<19:42:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 25%|██▍ | 3077/12384 [6:31:41<19:58:17, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 25%|██▍ | 3077/12384 [6:31:49<19:58:17, 7.73s/it, loss=0.0001, acc=1.0000, iter_time=7.92s]
Epoch 2: 25%|██▍ | 3078/12384 [6:31:49<19:53:04, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.92s]
Epoch 2: 25%|██▍ | 3078/12384 [6:31:57<19:53:04, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 2: 25%|██▍ | 3079/12384 [6:31:57<19:48:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 2: 25%|██▍ | 3079/12384 [6:32:04<19:48:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 2: 25%|██▍ | 3080/12384 [6:32:04<19:46:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 2: 25%|██▍ | 3080/12384 [6:32:12<19:46:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 25%|██▍ | 3081/12384 [6:32:12<19:46:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 25%|██▍ | 3081/12384 [6:32:20<19:46:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 2: 25%|██▍ | 3082/12384 [6:32:20<19:44:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 2: 25%|██▍ | 3082/12384 [6:32:27<19:44:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.91s]
Epoch 2: 25%|██▍ | 3083/12384 [6:32:27<19:42:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.91s]
Epoch 2: 25%|██▍ | 3083/12384 [6:32:35<19:42:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 2: 25%|██▍ | 3084/12384 [6:32:35<19:41:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 2: 25%|██▍ | 3084/12384 [6:32:42<19:41:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.29s]
Epoch 2: 25%|██▍ | 3085/12384 [6:32:42<19:39:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.29s]
Epoch 2: 25%|██▍ | 3085/12384 [6:32:50<19:39:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.38s]
Epoch 2: 25%|██▍ | 3086/12384 [6:32:50<19:39:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.38s]
Epoch 2: 25%|██▍ | 3086/12384 [6:32:58<19:39:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 25%|██▍ | 3087/12384 [6:32:58<19:38:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 25%|██▍ | 3087/12384 [6:33:05<19:38:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 25%|██▍ | 3088/12384 [6:33:05<19:40:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 25%|██▍ | 3088/12384 [6:33:13<19:40:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.73s]
Epoch 2: 25%|██▍ | 3089/12384 [6:33:13<19:40:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.73s]
Epoch 2: 25%|██▍ | 3089/12384 [6:33:20<19:40:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 2: 25%|██▍ | 3090/12384 [6:33:20<19:39:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 2: 25%|██▍ | 3090/12384 [6:33:28<19:39:29, 7.61s/it, loss=0.0000, acc=0.9998, iter_time=7.60s]
Epoch 2: 25%|██▍ | 3091/12384 [6:33:28<19:39:32, 7.62s/it, loss=0.0000, acc=0.9998, iter_time=7.60s]
Epoch 2: 25%|██▍ | 3091/12384 [6:33:36<19:39:32, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 2: 25%|██▍ | 3092/12384 [6:33:36<19:39:29, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 2: 25%|██▍ | 3092/12384 [6:33:43<19:39:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 25%|██▍ | 3093/12384 [6:33:43<19:38:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 25%|██▍ | 3093/12384 [6:33:51<19:38:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 2: 25%|██▍ | 3094/12384 [6:33:51<19:37:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 2: 25%|██▍ | 3094/12384 [6:33:58<19:37:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.11s]
Epoch 2: 25%|██▍ | 3095/12384 [6:33:58<19:36:52, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.11s]
Epoch 2: 25%|██▍ | 3095/12384 [6:34:06<19:36:52, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 25%|██▌ | 3096/12384 [6:34:06<19:37:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 25%|██▌ | 3096/12384 [6:34:14<19:37:15, 7.60s/it, loss=0.0004, acc=1.0000, iter_time=6.65s]
Epoch 2: 25%|██▌ | 3097/12384 [6:34:14<19:37:15, 7.61s/it, loss=0.0004, acc=1.0000, iter_time=6.65s]
Epoch 2: 25%|██▌ | 3097/12384 [6:34:21<19:37:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 2: 25%|██▌ | 3098/12384 [6:34:21<19:36:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 2: 25%|██▌ | 3098/12384 [6:34:29<19:36:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 25%|██▌ | 3099/12384 [6:34:29<19:37:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 25%|██▌ | 3099/12384 [6:34:36<19:37:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.85s]
Epoch 2: 25%|██▌ | 3100/12384 [6:34:36<19:37:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.85s]
Epoch 2: 25%|██▌ | 3100/12384 [6:34:44<19:37:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.87s]
Epoch 2: 25%|██▌ | 3101/12384 [6:34:44<19:37:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.87s]
Epoch 2: 25%|██▌ | 3101/12384 [6:34:52<19:37:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 25%|██▌ | 3102/12384 [6:34:52<19:36:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 25%|██▌ | 3102/12384 [6:34:59<19:36:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 2: 25%|██▌ | 3103/12384 [6:34:59<19:36:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 2: 25%|██▌ | 3103/12384 [6:35:07<19:36:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.00s]
Epoch 2: 25%|██▌ | 3104/12384 [6:35:07<19:51:31, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.00s]
Epoch 2: 25%|██▌ | 3104/12384 [6:35:15<19:51:31, 7.70s/it, loss=0.0000, acc=0.9999, iter_time=7.48s]
Epoch 2: 25%|██▌ | 3105/12384 [6:35:15<19:47:53, 7.68s/it, loss=0.0000, acc=0.9999, iter_time=7.48s]
Epoch 2: 25%|██▌ | 3105/12384 [6:35:22<19:47:53, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 2: 25%|██▌ | 3106/12384 [6:35:22<19:43:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 2: 25%|██▌ | 3106/12384 [6:35:30<19:43:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 2: 25%|██▌ | 3107/12384 [6:35:30<19:40:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 2: 25%|██▌ | 3107/12384 [6:35:38<19:40:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 2: 25%|██▌ | 3108/12384 [6:35:38<19:38:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 2: 25%|██▌ | 3108/12384 [6:35:45<19:38:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.63s]
Epoch 2: 25%|██▌ | 3109/12384 [6:35:45<19:38:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.63s]
Epoch 2: 25%|██▌ | 3109/12384 [6:35:53<19:38:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.96s]
Epoch 2: 25%|██▌ | 3110/12384 [6:35:53<19:53:45, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=11.96s]
Epoch 2: 25%|██▌ | 3110/12384 [6:36:01<19:53:45, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=4.99s]
Epoch 2: 25%|██▌ | 3111/12384 [6:36:01<19:49:25, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.99s]
Epoch 2: 25%|██▌ | 3111/12384 [6:36:08<19:49:25, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 2: 25%|██▌ | 3112/12384 [6:36:08<19:46:27, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 2: 25%|██▌ | 3112/12384 [6:36:16<19:46:27, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.12s]
Epoch 2: 25%|██▌ | 3113/12384 [6:36:16<19:46:52, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.12s]
Epoch 2: 25%|██▌ | 3113/12384 [6:36:24<19:46:52, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 2: 25%|██▌ | 3114/12384 [6:36:24<19:44:04, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 2: 25%|██▌ | 3114/12384 [6:36:31<19:44:04, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.26s]
Epoch 2: 25%|██▌ | 3115/12384 [6:36:31<19:41:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.26s]
Epoch 2: 25%|██▌ | 3115/12384 [6:36:39<19:41:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.04s]
Epoch 2: 25%|██▌ | 3116/12384 [6:36:39<19:37:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.04s]
Epoch 2: 25%|██▌ | 3116/12384 [6:36:47<19:37:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 2: 25%|██▌ | 3117/12384 [6:36:47<19:40:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 2: 25%|██▌ | 3117/12384 [6:36:54<19:40:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.44s]
Epoch 2: 25%|██▌ | 3118/12384 [6:36:54<19:38:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.44s]
Epoch 2: 25%|██▌ | 3118/12384 [6:37:02<19:38:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.26s]
Epoch 2: 25%|██▌ | 3119/12384 [6:37:02<19:36:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.26s]
Epoch 2: 25%|██▌ | 3119/12384 [6:37:09<19:36:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.57s]
Epoch 2: 25%|██▌ | 3120/12384 [6:37:09<19:36:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.57s]
Epoch 2: 25%|██▌ | 3120/12384 [6:37:17<19:36:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 25%|██▌ | 3121/12384 [6:37:17<19:37:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 25%|██▌ | 3121/12384 [6:37:25<19:37:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 25%|██▌ | 3122/12384 [6:37:25<19:35:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 25%|██▌ | 3122/12384 [6:37:32<19:35:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 25%|██▌ | 3123/12384 [6:37:32<19:36:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 25%|██▌ | 3123/12384 [6:37:40<19:36:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 25%|██▌ | 3124/12384 [6:37:40<19:36:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 25%|██▌ | 3124/12384 [6:37:48<19:36:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.19s]
Epoch 2: 25%|██▌ | 3125/12384 [6:37:48<19:36:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.19s]
Epoch 2: 25%|██▌ | 3125/12384 [6:37:55<19:36:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 2: 25%|██▌ | 3126/12384 [6:37:55<19:36:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 2: 25%|██▌ | 3126/12384 [6:38:03<19:36:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 25%|██▌ | 3127/12384 [6:38:03<19:34:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 25%|██▌ | 3127/12384 [6:38:10<19:34:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 25%|██▌ | 3128/12384 [6:38:10<19:34:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 25%|██▌ | 3128/12384 [6:38:18<19:34:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 25%|██▌ | 3129/12384 [6:38:18<19:35:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 25%|██▌ | 3129/12384 [6:38:26<19:35:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 25%|██▌ | 3130/12384 [6:38:26<19:49:27, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 25%|██▌ | 3130/12384 [6:38:34<19:49:27, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 25%|██▌ | 3131/12384 [6:38:34<19:44:43, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 25%|██▌ | 3131/12384 [6:38:41<19:44:43, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 25%|██▌ | 3132/12384 [6:38:41<19:41:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 25%|██▌ | 3132/12384 [6:38:49<19:41:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 25%|██▌ | 3133/12384 [6:38:49<19:37:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 25%|██▌ | 3133/12384 [6:38:56<19:37:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 25%|██▌ | 3134/12384 [6:38:56<19:36:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 25%|██▌ | 3134/12384 [6:39:04<19:36:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 25%|██▌ | 3135/12384 [6:39:04<19:40:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 25%|██▌ | 3135/12384 [6:39:12<19:40:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 25%|██▌ | 3136/12384 [6:39:12<19:39:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 25%|██▌ | 3136/12384 [6:39:20<19:39:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 2: 25%|██▌ | 3137/12384 [6:39:20<19:49:04, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 2: 25%|██▌ | 3137/12384 [6:39:27<19:49:04, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 2: 25%|██▌ | 3138/12384 [6:39:27<19:43:53, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 2: 25%|██▌ | 3138/12384 [6:39:35<19:43:53, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 2: 25%|██▌ | 3139/12384 [6:39:35<19:40:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 2: 25%|██▌ | 3139/12384 [6:39:42<19:40:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 2: 25%|██▌ | 3140/12384 [6:39:42<19:37:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 2: 25%|██▌ | 3140/12384 [6:39:50<19:37:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 25%|██▌ | 3141/12384 [6:39:50<19:36:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 25%|██▌ | 3141/12384 [6:39:58<19:36:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 2: 25%|██▌ | 3142/12384 [6:39:58<19:36:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 2: 25%|██▌ | 3142/12384 [6:40:05<19:36:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 2: 25%|██▌ | 3143/12384 [6:40:05<19:33:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 2: 25%|██▌ | 3143/12384 [6:40:13<19:33:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 25%|██▌ | 3144/12384 [6:40:13<19:34:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 25%|██▌ | 3144/12384 [6:40:21<19:34:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 2: 25%|██▌ | 3145/12384 [6:40:21<19:34:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 2: 25%|██▌ | 3145/12384 [6:40:28<19:34:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.52s]
Epoch 2: 25%|██▌ | 3146/12384 [6:40:28<19:33:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.52s]
Epoch 2: 25%|██▌ | 3146/12384 [6:40:36<19:33:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 25%|██▌ | 3147/12384 [6:40:36<19:32:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 25%|██▌ | 3147/12384 [6:40:43<19:32:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 25%|██▌ | 3148/12384 [6:40:43<19:32:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 25%|██▌ | 3148/12384 [6:40:51<19:32:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 25%|██▌ | 3149/12384 [6:40:51<19:31:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 25%|██▌ | 3149/12384 [6:40:59<19:31:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 2: 25%|██▌ | 3150/12384 [6:40:59<19:30:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 2: 25%|██▌ | 3150/12384 [6:41:06<19:30:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 2: 25%|██▌ | 3151/12384 [6:41:06<19:29:57, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 2: 25%|██▌ | 3151/12384 [6:41:14<19:29:57, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 25%|██▌ | 3152/12384 [6:41:14<19:29:52, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 25%|██▌ | 3152/12384 [6:41:21<19:29:52, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 25%|██▌ | 3153/12384 [6:41:21<19:30:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 25%|██▌ | 3153/12384 [6:41:29<19:30:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 25%|██▌ | 3154/12384 [6:41:29<19:29:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 25%|██▌ | 3154/12384 [6:41:37<19:29:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 25%|██▌ | 3155/12384 [6:41:37<19:33:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 25%|██▌ | 3155/12384 [6:41:44<19:33:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 25%|██▌ | 3156/12384 [6:41:44<19:32:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 25%|██▌ | 3156/12384 [6:41:52<19:32:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.13s]
Epoch 2: 25%|██▌ | 3157/12384 [6:41:52<19:47:31, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=4.13s]
Epoch 2: 25%|██▌ | 3157/12384 [6:42:00<19:47:31, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=11.41s]
Epoch 2: 26%|██▌ | 3158/12384 [6:42:00<19:40:54, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=11.41s]
Epoch 2: 26%|██▌ | 3158/12384 [6:42:07<19:40:54, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 2: 26%|██▌ | 3159/12384 [6:42:07<19:36:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 2: 26%|██▌ | 3159/12384 [6:42:15<19:36:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 2: 26%|██▌ | 3160/12384 [6:42:15<19:34:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 2: 26%|██▌ | 3160/12384 [6:42:23<19:34:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 26%|██▌ | 3161/12384 [6:42:23<19:32:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 26%|██▌ | 3161/12384 [6:42:30<19:32:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 26%|██▌ | 3162/12384 [6:42:30<19:31:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 26%|██▌ | 3162/12384 [6:42:38<19:31:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 26%|██▌ | 3163/12384 [6:42:38<19:44:21, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 26%|██▌ | 3163/12384 [6:42:46<19:44:21, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 26%|██▌ | 3164/12384 [6:42:46<19:39:58, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 26%|██▌ | 3164/12384 [6:42:53<19:39:58, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 26%|██▌ | 3165/12384 [6:42:53<19:35:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 26%|██▌ | 3165/12384 [6:43:01<19:35:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 26%|██▌ | 3166/12384 [6:43:01<19:33:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 26%|██▌ | 3166/12384 [6:43:09<19:33:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 26%|██▌ | 3167/12384 [6:43:09<19:32:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 26%|██▌ | 3167/12384 [6:43:16<19:32:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 26%|██▌ | 3168/12384 [6:43:16<19:31:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 26%|██▌ | 3168/12384 [6:43:24<19:31:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 26%|██▌ | 3169/12384 [6:43:24<19:29:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 26%|██▌ | 3169/12384 [6:43:31<19:29:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 2: 26%|██▌ | 3170/12384 [6:43:31<19:31:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 2: 26%|██▌ | 3170/12384 [6:43:39<19:31:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 2: 26%|██▌ | 3171/12384 [6:43:39<19:32:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 2: 26%|██▌ | 3171/12384 [6:43:47<19:32:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 26%|██▌ | 3172/12384 [6:43:47<19:33:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 26%|██▌ | 3172/12384 [6:43:54<19:33:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 26%|██▌ | 3173/12384 [6:43:54<19:32:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 26%|██▌ | 3173/12384 [6:44:02<19:32:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 26%|██▌ | 3174/12384 [6:44:02<19:31:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 26%|██▌ | 3174/12384 [6:44:10<19:31:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 26%|██▌ | 3175/12384 [6:44:10<19:31:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 26%|██▌ | 3175/12384 [6:44:17<19:31:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 26%|██▌ | 3176/12384 [6:44:17<19:30:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 26%|██▌ | 3176/12384 [6:44:25<19:30:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 26%|██▌ | 3177/12384 [6:44:25<19:28:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 26%|██▌ | 3177/12384 [6:44:32<19:28:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 2: 26%|██▌ | 3178/12384 [6:44:32<19:28:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 2: 26%|██▌ | 3178/12384 [6:44:40<19:28:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 2: 26%|██▌ | 3179/12384 [6:44:40<19:29:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 2: 26%|██▌ | 3179/12384 [6:44:48<19:29:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.77s]
Epoch 2: 26%|██▌ | 3180/12384 [6:44:48<19:29:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.77s]
Epoch 2: 26%|██▌ | 3180/12384 [6:44:55<19:29:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.95s]
Epoch 2: 26%|██▌ | 3181/12384 [6:44:55<19:29:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.95s]
Epoch 2: 26%|██▌ | 3181/12384 [6:45:03<19:29:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.57s]
Epoch 2: 26%|██▌ | 3182/12384 [6:45:03<19:28:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.57s]
Epoch 2: 26%|██▌ | 3182/12384 [6:45:11<19:28:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 26%|██▌ | 3183/12384 [6:45:11<19:46:53, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 26%|██▌ | 3183/12384 [6:45:19<19:46:53, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.38s]
Epoch 2: 26%|██▌ | 3184/12384 [6:45:19<19:42:07, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.38s]
Epoch 2: 26%|██▌ | 3184/12384 [6:45:26<19:42:07, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 26%|██▌ | 3185/12384 [6:45:26<19:37:01, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 26%|██▌ | 3185/12384 [6:45:34<19:37:01, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 26%|██▌ | 3186/12384 [6:45:34<19:33:49, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 26%|██▌ | 3186/12384 [6:45:41<19:33:49, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 26%|██▌ | 3187/12384 [6:45:41<19:33:41, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 26%|██▌ | 3187/12384 [6:45:49<19:33:41, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 2: 26%|██▌ | 3188/12384 [6:45:49<19:29:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 2: 26%|██▌ | 3188/12384 [6:45:57<19:29:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 2: 26%|██▌ | 3189/12384 [6:45:57<19:39:56, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 2: 26%|██▌ | 3189/12384 [6:46:05<19:39:56, 7.70s/it, loss=0.0004, acc=0.9979, iter_time=7.59s]
Epoch 2: 26%|██▌ | 3190/12384 [6:46:05<19:36:52, 7.68s/it, loss=0.0004, acc=0.9979, iter_time=7.59s]
Epoch 2: 26%|██▌ | 3190/12384 [6:46:12<19:36:52, 7.68s/it, loss=0.0010, acc=1.0000, iter_time=4.82s]
Epoch 2: 26%|██▌ | 3191/12384 [6:46:12<19:34:19, 7.66s/it, loss=0.0010, acc=1.0000, iter_time=4.82s]
Epoch 2: 26%|██▌ | 3191/12384 [6:46:20<19:34:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.82s]
Epoch 2: 26%|██▌ | 3192/12384 [6:46:20<19:31:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.82s]
Epoch 2: 26%|██▌ | 3192/12384 [6:46:27<19:31:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.76s]
Epoch 2: 26%|██▌ | 3193/12384 [6:46:27<19:27:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.76s]
Epoch 2: 26%|██▌ | 3193/12384 [6:46:35<19:27:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 2: 26%|██▌ | 3194/12384 [6:46:35<19:25:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 2: 26%|██▌ | 3194/12384 [6:46:43<19:25:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 2: 26%|██▌ | 3195/12384 [6:46:43<19:25:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 2: 26%|██▌ | 3195/12384 [6:46:50<19:25:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 2: 26%|██▌ | 3196/12384 [6:46:50<19:28:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 2: 26%|██▌ | 3196/12384 [6:46:58<19:28:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.89s]
Epoch 2: 26%|██▌ | 3197/12384 [6:46:58<19:25:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.89s]
Epoch 2: 26%|██▌ | 3197/12384 [6:47:05<19:25:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 2: 26%|██▌ | 3198/12384 [6:47:05<19:26:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 2: 26%|██▌ | 3198/12384 [6:47:13<19:26:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 2: 26%|██▌ | 3199/12384 [6:47:13<19:25:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 2: 26%|██▌ | 3199/12384 [6:47:21<19:25:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 26%|██▌ | 3200/12384 [6:47:21<19:24:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 26%|██▌ | 3200/12384 [6:47:28<19:24:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 26%|██▌ | 3201/12384 [6:47:28<19:24:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 26%|██▌ | 3201/12384 [6:47:36<19:24:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 26%|██▌ | 3202/12384 [6:47:36<19:23:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 26%|██▌ | 3202/12384 [6:47:43<19:23:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 26%|██▌ | 3203/12384 [6:47:43<19:24:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 26%|██▌ | 3203/12384 [6:47:51<19:24:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 26%|██▌ | 3204/12384 [6:47:51<19:23:32, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 26%|██▌ | 3204/12384 [6:47:59<19:23:32, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.97s]
Epoch 2: 26%|██▌ | 3205/12384 [6:47:59<19:23:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.97s]
Epoch 2: 26%|██▌ | 3205/12384 [6:48:06<19:23:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.23s]
Epoch 2: 26%|██▌ | 3206/12384 [6:48:06<19:23:05, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.23s]
Epoch 2: 26%|██▌ | 3206/12384 [6:48:14<19:23:05, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 26%|██▌ | 3207/12384 [6:48:14<19:22:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 26%|██▌ | 3207/12384 [6:48:21<19:22:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 26%|██▌ | 3208/12384 [6:48:21<19:23:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 26%|██▌ | 3208/12384 [6:48:29<19:23:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.89s]
Epoch 2: 26%|██▌ | 3209/12384 [6:48:29<19:38:58, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.89s]
Epoch 2: 26%|██▌ | 3209/12384 [6:48:37<19:38:58, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 2: 26%|██▌ | 3210/12384 [6:48:37<19:33:35, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 2: 26%|██▌ | 3210/12384 [6:48:45<19:33:35, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 26%|██▌ | 3211/12384 [6:48:45<19:31:31, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 26%|██▌ | 3211/12384 [6:48:52<19:31:31, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 2: 26%|██▌ | 3212/12384 [6:48:52<19:29:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 2: 26%|██▌ | 3212/12384 [6:49:00<19:29:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.11s]
Epoch 2: 26%|██▌ | 3213/12384 [6:49:00<19:26:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.11s]
Epoch 2: 26%|██▌ | 3213/12384 [6:49:07<19:26:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.04s]
Epoch 2: 26%|██▌ | 3214/12384 [6:49:07<19:25:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.04s]
Epoch 2: 26%|██▌ | 3214/12384 [6:49:15<19:25:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 26%|██▌ | 3215/12384 [6:49:15<19:37:45, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 26%|██▌ | 3215/12384 [6:49:23<19:37:45, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 26%|██▌ | 3216/12384 [6:49:23<19:33:27, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 26%|██▌ | 3216/12384 [6:49:31<19:33:27, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 26%|██▌ | 3217/12384 [6:49:31<19:30:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 26%|██▌ | 3217/12384 [6:49:38<19:30:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 26%|██▌ | 3218/12384 [6:49:38<19:27:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 26%|██▌ | 3218/12384 [6:49:46<19:27:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 26%|██▌ | 3219/12384 [6:49:46<19:26:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 26%|██▌ | 3219/12384 [6:49:53<19:26:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 2: 26%|██▌ | 3220/12384 [6:49:53<19:24:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 2: 26%|██▌ | 3220/12384 [6:50:01<19:24:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 2: 26%|██▌ | 3221/12384 [6:50:01<19:24:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 2: 26%|██▌ | 3221/12384 [6:50:09<19:24:05, 7.62s/it, loss=0.0008, acc=0.9998, iter_time=5.82s]
Epoch 2: 26%|██▌ | 3222/12384 [6:50:09<19:22:49, 7.62s/it, loss=0.0008, acc=0.9998, iter_time=5.82s]
Epoch 2: 26%|██▌ | 3222/12384 [6:50:16<19:22:49, 7.62s/it, loss=0.0001, acc=0.9995, iter_time=9.40s]
Epoch 2: 26%|██▌ | 3223/12384 [6:50:16<19:22:33, 7.61s/it, loss=0.0001, acc=0.9995, iter_time=9.40s]
Epoch 2: 26%|██▌ | 3223/12384 [6:50:24<19:22:33, 7.61s/it, loss=0.0004, acc=0.9998, iter_time=7.61s]
Epoch 2: 26%|██▌ | 3224/12384 [6:50:24<19:24:21, 7.63s/it, loss=0.0004, acc=0.9998, iter_time=7.61s]
Epoch 2: 26%|██▌ | 3224/12384 [6:50:31<19:24:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 26%|██▌ | 3225/12384 [6:50:31<19:22:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 26%|██▌ | 3225/12384 [6:50:39<19:22:48, 7.62s/it, loss=0.0003, acc=0.9984, iter_time=5.80s]
Epoch 2: 26%|██▌ | 3226/12384 [6:50:39<19:22:18, 7.61s/it, loss=0.0003, acc=0.9984, iter_time=5.80s]
Epoch 2: 26%|██▌ | 3226/12384 [6:50:47<19:22:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 26%|██▌ | 3227/12384 [6:50:47<19:21:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 26%|██▌ | 3227/12384 [6:50:54<19:21:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.79s]
Epoch 2: 26%|██▌ | 3228/12384 [6:50:54<19:22:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.79s]
Epoch 2: 26%|██▌ | 3228/12384 [6:51:02<19:22:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 2: 26%|██▌ | 3229/12384 [6:51:02<19:20:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 2: 26%|██▌ | 3229/12384 [6:51:09<19:20:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.14s]
Epoch 2: 26%|██▌ | 3230/12384 [6:51:09<19:19:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.14s]
Epoch 2: 26%|██▌ | 3230/12384 [6:51:17<19:19:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 2: 26%|██▌ | 3231/12384 [6:51:17<19:20:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 2: 26%|██▌ | 3231/12384 [6:51:25<19:20:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.45s]
Epoch 2: 26%|██▌ | 3232/12384 [6:51:25<19:28:53, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.45s]
Epoch 2: 26%|██▌ | 3232/12384 [6:51:33<19:28:53, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 2: 26%|██▌ | 3233/12384 [6:51:33<19:26:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 2: 26%|██▌ | 3233/12384 [6:51:40<19:26:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 26%|██▌ | 3234/12384 [6:51:40<19:24:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 26%|██▌ | 3234/12384 [6:51:48<19:24:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 26%|██▌ | 3235/12384 [6:51:48<19:38:27, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 26%|██▌ | 3235/12384 [6:51:56<19:38:27, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 26%|██▌ | 3236/12384 [6:51:56<19:32:28, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 26%|██▌ | 3236/12384 [6:52:03<19:32:28, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 26%|██▌ | 3237/12384 [6:52:03<19:29:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 26%|██▌ | 3237/12384 [6:52:11<19:29:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 26%|██▌ | 3238/12384 [6:52:11<19:26:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 26%|██▌ | 3238/12384 [6:52:19<19:26:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 2: 26%|██▌ | 3239/12384 [6:52:19<19:24:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 2: 26%|██▌ | 3239/12384 [6:52:26<19:24:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.67s]
Epoch 2: 26%|██▌ | 3240/12384 [6:52:26<19:22:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.67s]
Epoch 2: 26%|██▌ | 3240/12384 [6:52:34<19:22:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 26%|██▌ | 3241/12384 [6:52:34<19:22:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 26%|██▌ | 3241/12384 [6:52:41<19:22:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.62s]
Epoch 2: 26%|██▌ | 3242/12384 [6:52:41<19:25:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.62s]
Epoch 2: 26%|██▌ | 3242/12384 [6:52:49<19:25:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.71s]
Epoch 2: 26%|██▌ | 3243/12384 [6:52:49<19:23:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.71s]
Epoch 2: 26%|██▌ | 3243/12384 [6:52:57<19:23:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.51s]
Epoch 2: 26%|██▌ | 3244/12384 [6:52:57<19:22:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.51s]
Epoch 2: 26%|██▌ | 3244/12384 [6:53:04<19:22:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 2: 26%|██▌ | 3245/12384 [6:53:04<19:21:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 2: 26%|██▌ | 3245/12384 [6:53:12<19:21:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 26%|██▌ | 3246/12384 [6:53:12<19:20:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 26%|██▌ | 3246/12384 [6:53:20<19:20:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 2: 26%|██▌ | 3247/12384 [6:53:20<19:19:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 2: 26%|██▌ | 3247/12384 [6:53:27<19:19:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 2: 26%|██▌ | 3248/12384 [6:53:27<19:19:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 2: 26%|██▌ | 3248/12384 [6:53:35<19:19:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.12s]
Epoch 2: 26%|██▌ | 3249/12384 [6:53:35<19:19:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.12s]
Epoch 2: 26%|██▌ | 3249/12384 [6:53:42<19:19:06, 7.61s/it, loss=0.0000, acc=0.9999, iter_time=9.71s]
Epoch 2: 26%|██▌ | 3250/12384 [6:53:42<19:17:58, 7.61s/it, loss=0.0000, acc=0.9999, iter_time=9.71s]
Epoch 2: 26%|██▌ | 3250/12384 [6:53:50<19:17:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 26%|██▋ | 3251/12384 [6:53:50<19:18:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 26%|██▋ | 3251/12384 [6:53:58<19:18:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 26%|██▋ | 3252/12384 [6:53:58<19:18:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 26%|██▋ | 3252/12384 [6:54:05<19:18:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 26%|██▋ | 3253/12384 [6:54:05<19:17:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 26%|██▋ | 3253/12384 [6:54:13<19:17:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 26%|██▋ | 3254/12384 [6:54:13<19:17:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 26%|██▋ | 3254/12384 [6:54:20<19:17:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 26%|██▋ | 3255/12384 [6:54:20<19:17:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 26%|██▋ | 3255/12384 [6:54:28<19:17:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.50s]
Epoch 2: 26%|██▋ | 3256/12384 [6:54:28<19:17:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.50s]
Epoch 2: 26%|██▋ | 3256/12384 [6:54:36<19:17:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 26%|██▋ | 3257/12384 [6:54:36<19:18:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 26%|██▋ | 3257/12384 [6:54:43<19:18:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 26%|██▋ | 3258/12384 [6:54:43<19:18:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 26%|██▋ | 3258/12384 [6:54:51<19:18:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.24s]
Epoch 2: 26%|██▋ | 3259/12384 [6:54:51<19:18:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.24s]
Epoch 2: 26%|██▋ | 3259/12384 [6:54:58<19:18:24, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.21s]
Epoch 2: 26%|██▋ | 3260/12384 [6:54:58<19:16:34, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.21s]
Epoch 2: 26%|██▋ | 3260/12384 [6:55:06<19:16:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 2: 26%|██▋ | 3261/12384 [6:55:06<19:30:50, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 2: 26%|██▋ | 3261/12384 [6:55:14<19:30:50, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 26%|██▋ | 3262/12384 [6:55:14<19:26:04, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 26%|██▋ | 3262/12384 [6:55:22<19:26:04, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.01s]
Epoch 2: 26%|██▋ | 3263/12384 [6:55:22<19:23:41, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.01s]
Epoch 2: 26%|██▋ | 3263/12384 [6:55:29<19:23:41, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=11.58s]
Epoch 2: 26%|██▋ | 3264/12384 [6:55:29<19:21:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.58s]
Epoch 2: 26%|██▋ | 3264/12384 [6:55:37<19:21:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.45s]
Epoch 2: 26%|██▋ | 3265/12384 [6:55:37<19:19:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.45s]
Epoch 2: 26%|██▋ | 3265/12384 [6:55:44<19:19:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.37s]
Epoch 2: 26%|██▋ | 3266/12384 [6:55:44<19:19:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.37s]
Epoch 2: 26%|██▋ | 3266/12384 [6:55:52<19:19:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 26%|██▋ | 3267/12384 [6:55:52<19:18:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 26%|██▋ | 3267/12384 [6:56:00<19:18:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 26%|██▋ | 3268/12384 [6:56:00<19:18:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 26%|██▋ | 3268/12384 [6:56:07<19:18:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 26%|██▋ | 3269/12384 [6:56:07<19:20:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 26%|██▋ | 3269/12384 [6:56:15<19:20:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 26%|██▋ | 3270/12384 [6:56:15<19:18:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 26%|██▋ | 3270/12384 [6:56:23<19:18:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 2: 26%|██▋ | 3271/12384 [6:56:23<19:17:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 2: 26%|██▋ | 3271/12384 [6:56:30<19:17:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 2: 26%|██▋ | 3272/12384 [6:56:30<19:17:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 2: 26%|██▋ | 3272/12384 [6:56:38<19:17:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 26%|██▋ | 3273/12384 [6:56:38<19:17:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 26%|██▋ | 3273/12384 [6:56:45<19:17:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 26%|██▋ | 3274/12384 [6:56:45<19:16:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 26%|██▋ | 3274/12384 [6:56:53<19:16:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 26%|██▋ | 3275/12384 [6:56:53<19:16:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 26%|██▋ | 3275/12384 [6:57:01<19:16:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 26%|██▋ | 3276/12384 [6:57:01<19:15:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 26%|██▋ | 3276/12384 [6:57:08<19:15:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 26%|██▋ | 3277/12384 [6:57:08<19:14:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 26%|██▋ | 3277/12384 [6:57:16<19:14:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 26%|██▋ | 3278/12384 [6:57:16<19:14:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 26%|██▋ | 3278/12384 [6:57:23<19:14:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 2: 26%|██▋ | 3279/12384 [6:57:23<19:14:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 2: 26%|██▋ | 3279/12384 [6:57:31<19:14:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 2: 26%|██▋ | 3280/12384 [6:57:31<19:13:52, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 2: 26%|██▋ | 3280/12384 [6:57:39<19:13:52, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 2: 26%|██▋ | 3281/12384 [6:57:39<19:13:32, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 2: 26%|██▋ | 3281/12384 [6:57:46<19:13:32, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 2: 27%|██▋ | 3282/12384 [6:57:46<19:13:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 2: 27%|██▋ | 3282/12384 [6:57:54<19:13:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.00s]
Epoch 2: 27%|██▋ | 3283/12384 [6:57:54<19:14:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.00s]
Epoch 2: 27%|██▋ | 3283/12384 [6:58:01<19:14:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 2: 27%|██▋ | 3284/12384 [6:58:01<19:15:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 2: 27%|██▋ | 3284/12384 [6:58:09<19:15:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 2: 27%|██▋ | 3285/12384 [6:58:09<19:15:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 2: 27%|██▋ | 3285/12384 [6:58:17<19:15:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 2: 27%|██▋ | 3286/12384 [6:58:17<19:14:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 2: 27%|██▋ | 3286/12384 [6:58:24<19:14:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 2: 27%|██▋ | 3287/12384 [6:58:24<19:15:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 2: 27%|██▋ | 3287/12384 [6:58:32<19:15:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.67s]
Epoch 2: 27%|██▋ | 3288/12384 [6:58:32<19:29:44, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.67s]
Epoch 2: 27%|██▋ | 3288/12384 [6:58:40<19:29:44, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.49s]
Epoch 2: 27%|██▋ | 3289/12384 [6:58:40<19:25:05, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.49s]
Epoch 2: 27%|██▋ | 3289/12384 [6:58:47<19:25:05, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 27%|██▋ | 3290/12384 [6:58:47<19:21:58, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 27%|██▋ | 3290/12384 [6:58:55<19:21:58, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 2: 27%|██▋ | 3291/12384 [6:58:55<19:19:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 2: 27%|██▋ | 3291/12384 [6:59:03<19:19:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 2: 27%|██▋ | 3292/12384 [6:59:03<19:16:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 2: 27%|██▋ | 3292/12384 [6:59:10<19:16:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 2: 27%|██▋ | 3293/12384 [6:59:10<19:16:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 2: 27%|██▋ | 3293/12384 [6:59:18<19:16:01, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 2: 27%|██▋ | 3294/12384 [6:59:18<19:14:19, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 2: 27%|██▋ | 3294/12384 [6:59:26<19:14:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 2: 27%|██▋ | 3295/12384 [6:59:26<19:13:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 2: 27%|██▋ | 3295/12384 [6:59:33<19:13:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.61s]
Epoch 2: 27%|██▋ | 3296/12384 [6:59:33<19:29:15, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.61s]
Epoch 2: 27%|██▋ | 3296/12384 [6:59:41<19:29:15, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 27%|██▋ | 3297/12384 [6:59:41<19:23:44, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 27%|██▋ | 3297/12384 [6:59:49<19:23:44, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 27%|██▋ | 3298/12384 [6:59:49<19:20:52, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 27%|██▋ | 3298/12384 [6:59:56<19:20:52, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 27%|██▋ | 3299/12384 [6:59:56<19:17:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 27%|██▋ | 3299/12384 [7:00:04<19:17:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 27%|██▋ | 3300/12384 [7:00:04<19:15:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 27%|██▋ | 3300/12384 [7:00:12<19:15:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 27%|██▋ | 3301/12384 [7:00:12<19:14:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 27%|██▋ | 3301/12384 [7:00:19<19:14:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 2: 27%|██▋ | 3302/12384 [7:00:19<19:13:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 2: 27%|██▋ | 3302/12384 [7:00:27<19:13:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 2: 27%|██▋ | 3303/12384 [7:00:27<19:13:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 2: 27%|██▋ | 3303/12384 [7:00:34<19:13:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 2: 27%|██▋ | 3304/12384 [7:00:34<19:11:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 2: 27%|██▋ | 3304/12384 [7:00:42<19:11:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.20s]
Epoch 2: 27%|██▋ | 3305/12384 [7:00:42<19:14:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.20s]
Epoch 2: 27%|██▋ | 3305/12384 [7:00:50<19:14:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 2: 27%|██▋ | 3306/12384 [7:00:50<19:12:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 2: 27%|██▋ | 3306/12384 [7:00:57<19:12:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 2: 27%|██▋ | 3307/12384 [7:00:57<19:11:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 2: 27%|██▋ | 3307/12384 [7:01:05<19:11:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 27%|██▋ | 3308/12384 [7:01:05<19:12:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 27%|██▋ | 3308/12384 [7:01:13<19:12:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.10s]
Epoch 2: 27%|██▋ | 3309/12384 [7:01:13<19:16:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.10s]
Epoch 2: 27%|██▋ | 3309/12384 [7:01:20<19:16:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.22s]
Epoch 2: 27%|██▋ | 3310/12384 [7:01:20<19:15:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.22s]
Epoch 2: 27%|██▋ | 3310/12384 [7:01:28<19:15:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 2: 27%|██▋ | 3311/12384 [7:01:28<19:14:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 2: 27%|██▋ | 3311/12384 [7:01:35<19:14:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 2: 27%|██▋ | 3312/12384 [7:01:35<19:12:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 2: 27%|██▋ | 3312/12384 [7:01:43<19:12:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.85s]
Epoch 2: 27%|██▋ | 3313/12384 [7:01:43<19:11:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.85s]
Epoch 2: 27%|██▋ | 3313/12384 [7:01:51<19:11:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.01s]
Epoch 2: 27%|██▋ | 3314/12384 [7:01:51<19:25:54, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=11.01s]
Epoch 2: 27%|██▋ | 3314/12384 [7:01:59<19:25:54, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 27%|██▋ | 3315/12384 [7:01:59<19:21:52, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 27%|██▋ | 3315/12384 [7:02:06<19:21:52, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 27%|██▋ | 3316/12384 [7:02:06<19:18:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 27%|██▋ | 3316/12384 [7:02:14<19:18:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 2: 27%|██▋ | 3317/12384 [7:02:14<19:15:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 2: 27%|██▋ | 3317/12384 [7:02:21<19:15:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 2: 27%|██▋ | 3318/12384 [7:02:21<19:13:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 2: 27%|██▋ | 3318/12384 [7:02:29<19:13:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 27%|██▋ | 3319/12384 [7:02:29<19:12:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 27%|██▋ | 3319/12384 [7:02:37<19:12:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 27%|██▋ | 3320/12384 [7:02:37<19:12:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 27%|██▋ | 3320/12384 [7:02:44<19:12:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.91s]
Epoch 2: 27%|██▋ | 3321/12384 [7:02:44<19:11:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.91s]
Epoch 2: 27%|██▋ | 3321/12384 [7:02:52<19:11:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 2: 27%|██▋ | 3322/12384 [7:02:52<19:23:37, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 2: 27%|██▋ | 3322/12384 [7:03:00<19:23:37, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 27%|██▋ | 3323/12384 [7:03:00<19:21:49, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 27%|██▋ | 3323/12384 [7:03:07<19:21:49, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 27%|██▋ | 3324/12384 [7:03:07<19:17:25, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 27%|██▋ | 3324/12384 [7:03:15<19:17:25, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 27%|██▋ | 3325/12384 [7:03:15<19:14:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 27%|██▋ | 3325/12384 [7:03:23<19:14:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 27%|██▋ | 3326/12384 [7:03:23<19:16:59, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 27%|██▋ | 3326/12384 [7:03:30<19:16:59, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 27%|██▋ | 3327/12384 [7:03:30<19:14:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 27%|██▋ | 3327/12384 [7:03:38<19:14:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 27%|██▋ | 3328/12384 [7:03:38<19:12:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 27%|██▋ | 3328/12384 [7:03:46<19:12:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 27%|██▋ | 3329/12384 [7:03:46<19:10:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 27%|██▋ | 3329/12384 [7:03:53<19:10:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 27%|██▋ | 3330/12384 [7:03:53<19:09:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 27%|██▋ | 3330/12384 [7:04:01<19:09:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 27%|██▋ | 3331/12384 [7:04:01<19:08:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 27%|██▋ | 3331/12384 [7:04:08<19:08:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.67s]
Epoch 2: 27%|██▋ | 3332/12384 [7:04:08<19:12:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.67s]
Epoch 2: 27%|██▋ | 3332/12384 [7:04:16<19:12:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 27%|██▋ | 3333/12384 [7:04:16<19:10:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 27%|██▋ | 3333/12384 [7:04:24<19:10:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.56s]
Epoch 2: 27%|██▋ | 3334/12384 [7:04:24<19:08:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.56s]
Epoch 2: 27%|██▋ | 3334/12384 [7:04:31<19:08:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 2: 27%|██▋ | 3335/12384 [7:04:31<19:07:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 2: 27%|██▋ | 3335/12384 [7:04:39<19:07:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 27%|██▋ | 3336/12384 [7:04:39<19:07:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 27%|██▋ | 3336/12384 [7:04:46<19:07:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 27%|██▋ | 3337/12384 [7:04:46<19:09:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 27%|██▋ | 3337/12384 [7:04:54<19:09:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 2: 27%|██▋ | 3338/12384 [7:04:54<19:11:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 2: 27%|██▋ | 3338/12384 [7:05:02<19:11:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 2: 27%|██▋ | 3339/12384 [7:05:02<19:09:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 2: 27%|██▋ | 3339/12384 [7:05:09<19:09:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 2: 27%|██▋ | 3340/12384 [7:05:09<19:08:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 2: 27%|██▋ | 3340/12384 [7:05:17<19:08:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.29s]
Epoch 2: 27%|██▋ | 3341/12384 [7:05:17<19:24:05, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=4.29s]
Epoch 2: 27%|██▋ | 3341/12384 [7:05:25<19:24:05, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.07s]
Epoch 2: 27%|██▋ | 3342/12384 [7:05:25<19:19:43, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.07s]
Epoch 2: 27%|██▋ | 3342/12384 [7:05:33<19:19:43, 7.70s/it, loss=0.0002, acc=0.9978, iter_time=8.82s]
Epoch 2: 27%|██▋ | 3343/12384 [7:05:33<19:15:45, 7.67s/it, loss=0.0002, acc=0.9978, iter_time=8.82s]
Epoch 2: 27%|██▋ | 3343/12384 [7:05:40<19:15:45, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 27%|██▋ | 3344/12384 [7:05:40<19:13:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 27%|██▋ | 3344/12384 [7:05:48<19:13:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 27%|██▋ | 3345/12384 [7:05:48<19:12:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 27%|██▋ | 3345/12384 [7:05:55<19:12:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 27%|██▋ | 3346/12384 [7:05:55<19:10:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 27%|██▋ | 3346/12384 [7:06:03<19:10:18, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 2: 27%|██▋ | 3347/12384 [7:06:03<19:08:19, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 2: 27%|██▋ | 3347/12384 [7:06:11<19:08:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 27%|██▋ | 3348/12384 [7:06:11<19:06:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 27%|██▋ | 3348/12384 [7:06:18<19:06:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 2: 27%|██▋ | 3349/12384 [7:06:18<19:06:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 2: 27%|██▋ | 3349/12384 [7:06:26<19:06:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 2: 27%|██▋ | 3350/12384 [7:06:26<19:06:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 2: 27%|██▋ | 3350/12384 [7:06:34<19:06:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 2: 27%|██▋ | 3351/12384 [7:06:34<19:10:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 2: 27%|██▋ | 3351/12384 [7:06:41<19:10:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.62s]
Epoch 2: 27%|██▋ | 3352/12384 [7:06:41<19:08:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.62s]
Epoch 2: 27%|██▋ | 3352/12384 [7:06:49<19:08:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 27%|██▋ | 3353/12384 [7:06:49<19:06:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 27%|██▋ | 3353/12384 [7:06:56<19:06:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 27%|██▋ | 3354/12384 [7:06:56<19:05:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 27%|██▋ | 3354/12384 [7:07:04<19:05:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.45s]
Epoch 2: 27%|██▋ | 3355/12384 [7:07:04<19:06:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.45s]
Epoch 2: 27%|██▋ | 3355/12384 [7:07:12<19:06:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 2: 27%|██▋ | 3356/12384 [7:07:12<19:09:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 2: 27%|██▋ | 3356/12384 [7:07:19<19:09:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 27%|██▋ | 3357/12384 [7:07:19<19:08:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 27%|██▋ | 3357/12384 [7:07:27<19:08:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 27%|██▋ | 3358/12384 [7:07:27<19:07:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 27%|██▋ | 3358/12384 [7:07:34<19:07:52, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.43s]
Epoch 2: 27%|██▋ | 3359/12384 [7:07:34<19:07:21, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.43s]
Epoch 2: 27%|██▋ | 3359/12384 [7:07:42<19:07:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 2: 27%|██▋ | 3360/12384 [7:07:42<19:06:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 2: 27%|██▋ | 3360/12384 [7:07:50<19:06:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 27%|██▋ | 3361/12384 [7:07:50<19:06:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 27%|██▋ | 3361/12384 [7:07:57<19:06:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 27%|██▋ | 3362/12384 [7:07:57<19:05:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 27%|██▋ | 3362/12384 [7:08:05<19:05:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 27%|██▋ | 3363/12384 [7:08:05<19:04:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 27%|██▋ | 3363/12384 [7:08:13<19:04:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 27%|██▋ | 3364/12384 [7:08:13<19:04:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 27%|██▋ | 3364/12384 [7:08:20<19:04:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 27%|██▋ | 3365/12384 [7:08:20<19:04:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 27%|██▋ | 3365/12384 [7:08:28<19:04:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 27%|██▋ | 3366/12384 [7:08:28<19:04:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 27%|██▋ | 3366/12384 [7:08:36<19:04:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 2: 27%|██▋ | 3367/12384 [7:08:36<19:19:41, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 2: 27%|██▋ | 3367/12384 [7:08:43<19:19:41, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=11.15s]
Epoch 2: 27%|██▋ | 3368/12384 [7:08:43<19:15:42, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=11.15s]
Epoch 2: 27%|██▋ | 3368/12384 [7:08:51<19:15:42, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 27%|██▋ | 3369/12384 [7:08:51<19:13:52, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 27%|██▋ | 3369/12384 [7:08:59<19:13:52, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 2: 27%|██▋ | 3370/12384 [7:08:59<19:10:13, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 2: 27%|██▋ | 3370/12384 [7:09:06<19:10:13, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 27%|██▋ | 3371/12384 [7:09:06<19:07:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 27%|██▋ | 3371/12384 [7:09:14<19:07:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 27%|██▋ | 3372/12384 [7:09:14<19:05:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 27%|██▋ | 3372/12384 [7:09:21<19:05:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 27%|██▋ | 3373/12384 [7:09:21<19:04:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 27%|██▋ | 3373/12384 [7:09:29<19:04:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 27%|██▋ | 3374/12384 [7:09:29<19:05:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 27%|██▋ | 3374/12384 [7:09:37<19:05:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 27%|██▋ | 3375/12384 [7:09:37<19:16:53, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 27%|██▋ | 3375/12384 [7:09:45<19:16:53, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 27%|██▋ | 3376/12384 [7:09:45<19:12:24, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 27%|██▋ | 3376/12384 [7:09:52<19:12:24, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 27%|██▋ | 3377/12384 [7:09:52<19:08:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 27%|██▋ | 3377/12384 [7:10:00<19:08:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 27%|██▋ | 3378/12384 [7:10:00<19:06:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 27%|██▋ | 3378/12384 [7:10:07<19:06:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 2: 27%|██▋ | 3379/12384 [7:10:07<19:03:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 2: 27%|██▋ | 3379/12384 [7:10:15<19:03:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 2: 27%|██▋ | 3380/12384 [7:10:15<19:03:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 2: 27%|██▋ | 3380/12384 [7:10:23<19:03:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 27%|██▋ | 3381/12384 [7:10:23<19:02:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 27%|██▋ | 3381/12384 [7:10:30<19:02:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 27%|██▋ | 3382/12384 [7:10:30<19:02:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 27%|██▋ | 3382/12384 [7:10:38<19:02:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.90s]
Epoch 2: 27%|██▋ | 3383/12384 [7:10:38<19:01:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.90s]
Epoch 2: 27%|██▋ | 3383/12384 [7:10:45<19:01:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.29s]
Epoch 2: 27%|██▋ | 3384/12384 [7:10:45<19:02:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.29s]
Epoch 2: 27%|██▋ | 3384/12384 [7:10:53<19:02:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 27%|██▋ | 3385/12384 [7:10:53<19:01:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 27%|██▋ | 3385/12384 [7:11:01<19:01:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 27%|██▋ | 3386/12384 [7:11:01<19:04:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 27%|██▋ | 3386/12384 [7:11:08<19:04:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 2: 27%|██▋ | 3387/12384 [7:11:08<19:05:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 2: 27%|██▋ | 3387/12384 [7:11:16<19:05:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 2: 27%|██▋ | 3388/12384 [7:11:16<19:04:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 2: 27%|██▋ | 3388/12384 [7:11:24<19:04:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 2: 27%|██▋ | 3389/12384 [7:11:24<19:01:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 2: 27%|██▋ | 3389/12384 [7:11:31<19:01:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.32s]
Epoch 2: 27%|██▋ | 3390/12384 [7:11:31<19:00:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.32s]
Epoch 2: 27%|██▋ | 3390/12384 [7:11:39<19:00:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 2: 27%|██▋ | 3391/12384 [7:11:39<19:01:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 2: 27%|██▋ | 3391/12384 [7:11:46<19:01:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.03s]
Epoch 2: 27%|██▋ | 3392/12384 [7:11:46<19:00:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.03s]
Epoch 2: 27%|██▋ | 3392/12384 [7:11:54<19:00:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 27%|██▋ | 3393/12384 [7:11:54<19:16:09, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 27%|██▋ | 3393/12384 [7:12:02<19:16:09, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 27%|██▋ | 3394/12384 [7:12:02<19:11:35, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 27%|██▋ | 3394/12384 [7:12:10<19:11:35, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 27%|██▋ | 3395/12384 [7:12:10<19:08:30, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 27%|██▋ | 3395/12384 [7:12:17<19:08:30, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.35s]
Epoch 2: 27%|██▋ | 3396/12384 [7:12:17<19:06:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.35s]
Epoch 2: 27%|██▋ | 3396/12384 [7:12:25<19:06:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 2: 27%|██▋ | 3397/12384 [7:12:25<19:04:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 2: 27%|██▋ | 3397/12384 [7:12:32<19:04:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 2: 27%|██▋ | 3398/12384 [7:12:32<19:03:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 2: 27%|██▋ | 3398/12384 [7:12:40<19:03:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 2: 27%|██▋ | 3399/12384 [7:12:40<19:03:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 2: 27%|██▋ | 3399/12384 [7:12:48<19:03:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.52s]
Epoch 2: 27%|██▋ | 3400/12384 [7:12:48<19:03:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.52s]
Epoch 2: 27%|██▋ | 3400/12384 [7:12:56<19:03:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 27%|██▋ | 3401/12384 [7:12:56<19:14:58, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 27%|██▋ | 3401/12384 [7:13:03<19:14:58, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 27%|██▋ | 3402/12384 [7:13:03<19:10:51, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 27%|██▋ | 3402/12384 [7:13:11<19:10:51, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 27%|██▋ | 3403/12384 [7:13:11<19:06:46, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 27%|██▋ | 3403/12384 [7:13:18<19:06:46, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.23s]
Epoch 2: 27%|██▋ | 3404/12384 [7:13:18<19:04:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.23s]
Epoch 2: 27%|██▋ | 3404/12384 [7:13:26<19:04:03, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=10.97s]
Epoch 2: 27%|██▋ | 3405/12384 [7:13:26<19:02:47, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=10.97s]
Epoch 2: 27%|██▋ | 3405/12384 [7:13:34<19:02:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 28%|██▊ | 3406/12384 [7:13:34<19:04:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 28%|██▊ | 3406/12384 [7:13:41<19:04:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 28%|██▊ | 3407/12384 [7:13:41<19:02:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 28%|██▊ | 3407/12384 [7:13:49<19:02:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 28%|██▊ | 3408/12384 [7:13:49<19:00:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 28%|██▊ | 3408/12384 [7:13:57<19:00:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 28%|██▊ | 3409/12384 [7:13:57<18:59:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 28%|██▊ | 3409/12384 [7:14:04<18:59:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 28%|██▊ | 3410/12384 [7:14:04<18:58:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 28%|██▊ | 3410/12384 [7:14:12<18:58:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 2: 28%|██▊ | 3411/12384 [7:14:12<18:57:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 2: 28%|██▊ | 3411/12384 [7:14:19<18:57:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 2: 28%|██▊ | 3412/12384 [7:14:19<18:57:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 2: 28%|██▊ | 3412/12384 [7:14:27<18:57:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.97s]
Epoch 2: 28%|██▊ | 3413/12384 [7:14:27<18:59:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.97s]
Epoch 2: 28%|██▊ | 3413/12384 [7:14:35<18:59:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 2: 28%|██▊ | 3414/12384 [7:14:35<18:59:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 2: 28%|██▊ | 3414/12384 [7:14:42<18:59:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 28%|██▊ | 3415/12384 [7:14:42<18:57:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 28%|██▊ | 3415/12384 [7:14:50<18:57:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 2: 28%|██▊ | 3416/12384 [7:14:50<18:57:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 2: 28%|██▊ | 3416/12384 [7:14:57<18:57:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 28%|██▊ | 3417/12384 [7:14:57<18:57:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 28%|██▊ | 3417/12384 [7:15:05<18:57:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 2: 28%|██▊ | 3418/12384 [7:15:05<18:57:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 2: 28%|██▊ | 3418/12384 [7:15:13<18:57:30, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.97s]
Epoch 2: 28%|██▊ | 3419/12384 [7:15:13<19:12:11, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=10.97s]
Epoch 2: 28%|██▊ | 3419/12384 [7:15:21<19:12:11, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 2: 28%|██▊ | 3420/12384 [7:15:21<19:06:54, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 2: 28%|██▊ | 3420/12384 [7:15:28<19:06:54, 7.68s/it, loss=0.0001, acc=0.9991, iter_time=8.46s]
Epoch 2: 28%|██▊ | 3421/12384 [7:15:28<19:04:15, 7.66s/it, loss=0.0001, acc=0.9991, iter_time=8.46s]
Epoch 2: 28%|██▊ | 3421/12384 [7:15:36<19:04:15, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 28%|██▊ | 3422/12384 [7:15:36<19:01:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 28%|██▊ | 3422/12384 [7:15:43<19:01:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 28%|██▊ | 3423/12384 [7:15:43<19:00:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 28%|██▊ | 3423/12384 [7:15:51<19:00:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 28%|██▊ | 3424/12384 [7:15:51<18:58:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 28%|██▊ | 3424/12384 [7:15:59<18:58:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 28%|██▊ | 3425/12384 [7:15:59<18:58:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 28%|██▊ | 3425/12384 [7:16:06<18:58:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 2: 28%|██▊ | 3426/12384 [7:16:06<18:56:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 2: 28%|██▊ | 3426/12384 [7:16:14<18:56:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.88s]
Epoch 2: 28%|██▊ | 3427/12384 [7:16:14<18:55:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.88s]
Epoch 2: 28%|██▊ | 3427/12384 [7:16:21<18:55:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 2: 28%|██▊ | 3428/12384 [7:16:21<18:54:33, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 2: 28%|██▊ | 3428/12384 [7:16:29<18:54:33, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 2: 28%|██▊ | 3429/12384 [7:16:29<18:54:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 2: 28%|██▊ | 3429/12384 [7:16:37<18:54:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 28%|██▊ | 3430/12384 [7:16:37<18:56:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 28%|██▊ | 3430/12384 [7:16:44<18:56:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 28%|██▊ | 3431/12384 [7:16:44<18:56:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 28%|██▊ | 3431/12384 [7:16:52<18:56:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 28%|██▊ | 3432/12384 [7:16:52<18:56:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 28%|██▊ | 3432/12384 [7:16:59<18:56:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.42s]
Epoch 2: 28%|██▊ | 3433/12384 [7:16:59<18:55:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.42s]
Epoch 2: 28%|██▊ | 3433/12384 [7:17:07<18:55:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 2: 28%|██▊ | 3434/12384 [7:17:07<18:55:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 2: 28%|██▊ | 3434/12384 [7:17:15<18:55:41, 7.61s/it, loss=0.0005, acc=0.9973, iter_time=7.62s]
Epoch 2: 28%|██▊ | 3435/12384 [7:17:15<18:55:38, 7.61s/it, loss=0.0005, acc=0.9973, iter_time=7.62s]
Epoch 2: 28%|██▊ | 3435/12384 [7:17:22<18:55:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 28%|██▊ | 3436/12384 [7:17:22<18:54:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 28%|██▊ | 3436/12384 [7:17:30<18:54:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 2: 28%|██▊ | 3437/12384 [7:17:30<18:54:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 2: 28%|██▊ | 3437/12384 [7:17:38<18:54:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.72s]
Epoch 2: 28%|██▊ | 3438/12384 [7:17:38<18:53:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.72s]
Epoch 2: 28%|██▊ | 3438/12384 [7:17:45<18:53:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 28%|██▊ | 3439/12384 [7:17:45<18:53:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 28%|██▊ | 3439/12384 [7:17:53<18:53:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 28%|██▊ | 3440/12384 [7:17:53<18:54:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 28%|██▊ | 3440/12384 [7:18:00<18:54:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.78s]
Epoch 2: 28%|██▊ | 3441/12384 [7:18:00<18:52:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.78s]
Epoch 2: 28%|██▊ | 3441/12384 [7:18:08<18:52:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 2: 28%|██▊ | 3442/12384 [7:18:08<18:53:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 2: 28%|██▊ | 3442/12384 [7:18:16<18:53:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 28%|██▊ | 3443/12384 [7:18:16<18:53:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 28%|██▊ | 3443/12384 [7:18:23<18:53:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 28%|██▊ | 3444/12384 [7:18:23<18:53:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 28%|██▊ | 3444/12384 [7:18:31<18:53:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 28%|██▊ | 3445/12384 [7:18:31<19:06:18, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 28%|██▊ | 3445/12384 [7:18:39<19:06:18, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 2: 28%|██▊ | 3446/12384 [7:18:39<19:02:26, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 2: 28%|██▊ | 3446/12384 [7:18:46<19:02:26, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 2: 28%|██▊ | 3447/12384 [7:18:46<19:00:31, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 2: 28%|██▊ | 3447/12384 [7:18:54<19:00:31, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 2: 28%|██▊ | 3448/12384 [7:18:54<18:59:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 2: 28%|██▊ | 3448/12384 [7:19:01<18:59:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 28%|██▊ | 3449/12384 [7:19:01<18:56:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 28%|██▊ | 3449/12384 [7:19:09<18:56:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 28%|██▊ | 3450/12384 [7:19:09<18:54:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 28%|██▊ | 3450/12384 [7:19:17<18:54:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.06s]
Epoch 2: 28%|██▊ | 3451/12384 [7:19:17<18:53:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.06s]
Epoch 2: 28%|██▊ | 3451/12384 [7:19:24<18:53:19, 7.61s/it, loss=0.0002, acc=0.9986, iter_time=9.12s]
Epoch 2: 28%|██▊ | 3452/12384 [7:19:24<18:52:18, 7.61s/it, loss=0.0002, acc=0.9986, iter_time=9.12s]
Epoch 2: 28%|██▊ | 3452/12384 [7:19:32<18:52:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.93s]
Epoch 2: 28%|██▊ | 3453/12384 [7:19:32<18:51:35, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.93s]
Epoch 2: 28%|██▊ | 3453/12384 [7:19:39<18:51:35, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 2: 28%|██▊ | 3454/12384 [7:19:39<18:51:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 2: 28%|██▊ | 3454/12384 [7:19:47<18:51:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 28%|██▊ | 3455/12384 [7:19:47<18:51:12, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 28%|██▊ | 3455/12384 [7:19:55<18:51:12, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 28%|██▊ | 3456/12384 [7:19:55<18:51:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 28%|██▊ | 3456/12384 [7:20:02<18:51:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 28%|██▊ | 3457/12384 [7:20:02<18:50:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 28%|██▊ | 3457/12384 [7:20:10<18:50:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 28%|██▊ | 3458/12384 [7:20:10<18:51:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 28%|██▊ | 3458/12384 [7:20:18<18:51:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.61s]
Epoch 2: 28%|██▊ | 3459/12384 [7:20:18<18:52:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.61s]
Epoch 2: 28%|██▊ | 3459/12384 [7:20:25<18:52:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.03s]
Epoch 2: 28%|██▊ | 3460/12384 [7:20:25<18:52:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.03s]
Epoch 2: 28%|██▊ | 3460/12384 [7:20:33<18:52:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 2: 28%|██▊ | 3461/12384 [7:20:33<18:56:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 2: 28%|██▊ | 3461/12384 [7:20:40<18:56:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 28%|██▊ | 3462/12384 [7:20:40<18:54:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 28%|██▊ | 3462/12384 [7:20:48<18:54:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 28%|██▊ | 3463/12384 [7:20:48<18:53:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 28%|██▊ | 3463/12384 [7:20:56<18:53:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 28%|██▊ | 3464/12384 [7:20:56<18:53:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 28%|██▊ | 3464/12384 [7:21:03<18:53:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.05s]
Epoch 2: 28%|██▊ | 3465/12384 [7:21:03<18:52:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.05s]
Epoch 2: 28%|██▊ | 3465/12384 [7:21:11<18:52:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 2: 28%|██▊ | 3466/12384 [7:21:11<18:51:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 2: 28%|██▊ | 3466/12384 [7:21:19<18:51:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 28%|██▊ | 3467/12384 [7:21:19<18:51:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 28%|██▊ | 3467/12384 [7:21:26<18:51:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 28%|██▊ | 3468/12384 [7:21:26<18:52:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 28%|██▊ | 3468/12384 [7:21:34<18:52:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 28%|██▊ | 3469/12384 [7:21:34<18:51:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 28%|██▊ | 3469/12384 [7:21:41<18:51:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.24s]
Epoch 2: 28%|██▊ | 3470/12384 [7:21:41<18:52:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.24s]
Epoch 2: 28%|██▊ | 3470/12384 [7:21:49<18:52:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.06s]
Epoch 2: 28%|██▊ | 3471/12384 [7:21:49<18:52:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.06s]
Epoch 2: 28%|██▊ | 3471/12384 [7:21:57<18:52:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.01s]
Epoch 2: 28%|██▊ | 3472/12384 [7:21:57<19:09:13, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=9.01s]
Epoch 2: 28%|██▊ | 3472/12384 [7:22:05<19:09:13, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 28%|██▊ | 3473/12384 [7:22:05<19:03:32, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 28%|██▊ | 3473/12384 [7:22:12<19:03:32, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 28%|██▊ | 3474/12384 [7:22:12<18:59:53, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 28%|██▊ | 3474/12384 [7:22:20<18:59:53, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 2: 28%|██▊ | 3475/12384 [7:22:20<18:59:39, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 2: 28%|██▊ | 3475/12384 [7:22:28<18:59:39, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.44s]
Epoch 2: 28%|██▊ | 3476/12384 [7:22:28<18:57:17, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.44s]
Epoch 2: 28%|██▊ | 3476/12384 [7:22:35<18:57:17, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 2: 28%|██▊ | 3477/12384 [7:22:35<18:59:57, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 2: 28%|██▊ | 3477/12384 [7:22:43<18:59:57, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.55s]
Epoch 2: 28%|██▊ | 3478/12384 [7:22:43<18:55:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.55s]
Epoch 2: 28%|██▊ | 3478/12384 [7:22:50<18:55:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 2: 28%|██▊ | 3479/12384 [7:22:50<18:54:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 2: 28%|██▊ | 3479/12384 [7:22:58<18:54:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 2: 28%|██▊ | 3480/12384 [7:22:58<19:05:30, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 2: 28%|██▊ | 3480/12384 [7:23:06<19:05:30, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 28%|██▊ | 3481/12384 [7:23:06<18:59:20, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 28%|██▊ | 3481/12384 [7:23:14<18:59:20, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 28%|██▊ | 3482/12384 [7:23:14<18:56:04, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 28%|██▊ | 3482/12384 [7:23:21<18:56:04, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.43s]
Epoch 2: 28%|██▊ | 3483/12384 [7:23:21<18:56:45, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.43s]
Epoch 2: 28%|██▊ | 3483/12384 [7:23:29<18:56:45, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 2: 28%|██▊ | 3484/12384 [7:23:29<18:54:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 2: 28%|██▊ | 3484/12384 [7:23:37<18:54:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 28%|██▊ | 3485/12384 [7:23:37<18:54:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 28%|██▊ | 3485/12384 [7:23:44<18:54:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 2: 28%|██▊ | 3486/12384 [7:23:44<18:52:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 2: 28%|██▊ | 3486/12384 [7:23:52<18:52:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.08s]
Epoch 2: 28%|██▊ | 3487/12384 [7:23:52<18:49:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.08s]
Epoch 2: 28%|██▊ | 3487/12384 [7:23:59<18:49:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 2: 28%|██▊ | 3488/12384 [7:23:59<18:49:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 2: 28%|██▊ | 3488/12384 [7:24:07<18:49:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 28%|██▊ | 3489/12384 [7:24:07<18:51:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 28%|██▊ | 3489/12384 [7:24:15<18:51:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 28%|██▊ | 3490/12384 [7:24:15<18:50:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 28%|██▊ | 3490/12384 [7:24:22<18:50:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.31s]
Epoch 2: 28%|██▊ | 3491/12384 [7:24:22<18:49:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.31s]
Epoch 2: 28%|██▊ | 3491/12384 [7:24:30<18:49:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.61s]
Epoch 2: 28%|██▊ | 3492/12384 [7:24:30<18:50:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.61s]
Epoch 2: 28%|██▊ | 3492/12384 [7:24:37<18:50:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.42s]
Epoch 2: 28%|██▊ | 3493/12384 [7:24:37<18:49:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.42s]
Epoch 2: 28%|██▊ | 3493/12384 [7:24:45<18:49:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 2: 28%|██▊ | 3494/12384 [7:24:45<18:49:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 2: 28%|██▊ | 3494/12384 [7:24:53<18:49:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 2: 28%|██▊ | 3495/12384 [7:24:53<18:49:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 2: 28%|██▊ | 3495/12384 [7:25:00<18:49:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 28%|██▊ | 3496/12384 [7:25:00<18:48:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 28%|██▊ | 3496/12384 [7:25:08<18:48:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 28%|██▊ | 3497/12384 [7:25:08<18:50:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 28%|██▊ | 3497/12384 [7:25:16<18:50:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 28%|██▊ | 3498/12384 [7:25:16<19:04:22, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 28%|██▊ | 3498/12384 [7:25:24<19:04:22, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 28%|██▊ | 3499/12384 [7:25:24<19:00:15, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 28%|██▊ | 3499/12384 [7:25:31<19:00:15, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 2: 28%|██▊ | 3500/12384 [7:25:31<18:55:39, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 2: 28%|██▊ | 3500/12384 [7:25:39<18:55:39, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 28%|██▊ | 3501/12384 [7:25:39<18:55:56, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 28%|██▊ | 3501/12384 [7:25:46<18:55:56, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 28%|██▊ | 3502/12384 [7:25:46<18:53:13, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 28%|██▊ | 3502/12384 [7:25:54<18:53:13, 7.66s/it, loss=0.0001, acc=0.9997, iter_time=7.62s]
Epoch 2: 28%|██▊ | 3503/12384 [7:25:54<18:50:43, 7.64s/it, loss=0.0001, acc=0.9997, iter_time=7.62s]
Epoch 2: 28%|██▊ | 3503/12384 [7:26:02<18:50:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 28%|██▊ | 3504/12384 [7:26:02<18:49:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 28%|██▊ | 3504/12384 [7:26:09<18:49:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 28%|██▊ | 3505/12384 [7:26:09<18:48:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 28%|██▊ | 3505/12384 [7:26:17<18:48:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.18s]
Epoch 2: 28%|██▊ | 3506/12384 [7:26:17<18:47:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.18s]
Epoch 2: 28%|██▊ | 3506/12384 [7:26:24<18:47:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.86s]
Epoch 2: 28%|██▊ | 3507/12384 [7:26:24<18:46:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.86s]
Epoch 2: 28%|██▊ | 3507/12384 [7:26:32<18:46:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 2: 28%|██▊ | 3508/12384 [7:26:32<18:45:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 2: 28%|██▊ | 3508/12384 [7:26:40<18:45:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 28%|██▊ | 3509/12384 [7:26:40<18:45:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 28%|██▊ | 3509/12384 [7:26:47<18:45:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 28%|██▊ | 3510/12384 [7:26:47<18:45:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 28%|██▊ | 3510/12384 [7:26:55<18:45:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 28%|██▊ | 3511/12384 [7:26:55<18:46:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 28%|██▊ | 3511/12384 [7:27:03<18:46:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 28%|██▊ | 3512/12384 [7:27:03<18:46:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 28%|██▊ | 3512/12384 [7:27:10<18:46:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 28%|██▊ | 3513/12384 [7:27:10<18:46:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 28%|██▊ | 3513/12384 [7:27:18<18:46:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 28%|██▊ | 3514/12384 [7:27:18<18:44:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 28%|██▊ | 3514/12384 [7:27:25<18:44:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 28%|██▊ | 3515/12384 [7:27:25<18:43:42, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 28%|██▊ | 3515/12384 [7:27:33<18:43:42, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.18s]
Epoch 2: 28%|██▊ | 3516/12384 [7:27:33<18:44:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.18s]
Epoch 2: 28%|██▊ | 3516/12384 [7:27:41<18:44:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 28%|██▊ | 3517/12384 [7:27:41<18:45:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 28%|██▊ | 3517/12384 [7:27:48<18:45:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 28%|██▊ | 3518/12384 [7:27:48<18:45:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 28%|██▊ | 3518/12384 [7:27:56<18:45:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 2: 28%|██▊ | 3519/12384 [7:27:56<18:44:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 2: 28%|██▊ | 3519/12384 [7:28:03<18:44:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 2: 28%|██▊ | 3520/12384 [7:28:03<18:47:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 2: 28%|██▊ | 3520/12384 [7:28:11<18:47:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.36s]
Epoch 2: 28%|██▊ | 3521/12384 [7:28:11<18:45:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.36s]
Epoch 2: 28%|██▊ | 3521/12384 [7:28:19<18:45:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.01s]
Epoch 2: 28%|██▊ | 3522/12384 [7:28:19<18:49:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.01s]
Epoch 2: 28%|██▊ | 3522/12384 [7:28:26<18:49:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 2: 28%|██▊ | 3523/12384 [7:28:26<18:48:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 2: 28%|██▊ | 3523/12384 [7:28:34<18:48:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 2: 28%|██▊ | 3524/12384 [7:28:34<18:45:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 2: 28%|██▊ | 3524/12384 [7:28:42<18:45:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 2: 28%|██▊ | 3525/12384 [7:28:42<19:00:22, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 2: 28%|██▊ | 3525/12384 [7:28:50<19:00:22, 7.72s/it, loss=0.0032, acc=0.9947, iter_time=6.71s]
Epoch 2: 28%|██▊ | 3526/12384 [7:28:50<18:56:03, 7.70s/it, loss=0.0032, acc=0.9947, iter_time=6.71s]
Epoch 2: 28%|██▊ | 3526/12384 [7:28:57<18:56:03, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 2: 28%|██▊ | 3527/12384 [7:28:57<18:52:32, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 2: 28%|██▊ | 3527/12384 [7:29:05<18:52:32, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 28%|██▊ | 3528/12384 [7:29:05<18:50:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 28%|██▊ | 3528/12384 [7:29:12<18:50:26, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.23s]
Epoch 2: 28%|██▊ | 3529/12384 [7:29:12<18:48:45, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.23s]
Epoch 2: 28%|██▊ | 3529/12384 [7:29:20<18:48:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 29%|██▊ | 3530/12384 [7:29:20<18:46:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 29%|██▊ | 3530/12384 [7:29:28<18:46:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 29%|██▊ | 3531/12384 [7:29:28<18:44:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 29%|██▊ | 3531/12384 [7:29:35<18:44:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 29%|██▊ | 3532/12384 [7:29:35<18:44:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 29%|██▊ | 3532/12384 [7:29:43<18:44:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.54s]
Epoch 2: 29%|██▊ | 3533/12384 [7:29:43<18:43:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.54s]
Epoch 2: 29%|██▊ | 3533/12384 [7:29:50<18:43:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.50s]
Epoch 2: 29%|██▊ | 3534/12384 [7:29:50<18:42:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.50s]
Epoch 2: 29%|██▊ | 3534/12384 [7:29:58<18:42:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.37s]
Epoch 2: 29%|██▊ | 3535/12384 [7:29:58<18:42:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.37s]
Epoch 2: 29%|██▊ | 3535/12384 [7:30:06<18:42:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 29%|██▊ | 3536/12384 [7:30:06<18:41:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 29%|██▊ | 3536/12384 [7:30:13<18:41:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 2: 29%|██▊ | 3537/12384 [7:30:13<18:41:02, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 2: 29%|██▊ | 3537/12384 [7:30:21<18:41:02, 7.60s/it, loss=0.0001, acc=0.9995, iter_time=10.76s]
Epoch 2: 29%|██▊ | 3538/12384 [7:30:21<18:41:06, 7.60s/it, loss=0.0001, acc=0.9995, iter_time=10.76s]
Epoch 2: 29%|██▊ | 3538/12384 [7:30:28<18:41:06, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 2: 29%|██▊ | 3539/12384 [7:30:28<18:40:43, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 2: 29%|██▊ | 3539/12384 [7:30:36<18:40:43, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 2: 29%|██▊ | 3540/12384 [7:30:36<18:40:08, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 2: 29%|██▊ | 3540/12384 [7:30:44<18:40:08, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 2: 29%|██▊ | 3541/12384 [7:30:44<18:41:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 2: 29%|██▊ | 3541/12384 [7:30:51<18:41:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 2: 29%|██▊ | 3542/12384 [7:30:51<18:40:34, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 2: 29%|██▊ | 3542/12384 [7:30:59<18:40:34, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.31s]
Epoch 2: 29%|██▊ | 3543/12384 [7:30:59<18:41:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.31s]
Epoch 2: 29%|██▊ | 3543/12384 [7:31:07<18:41:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 29%|██▊ | 3544/12384 [7:31:07<18:40:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 29%|██▊ | 3544/12384 [7:31:14<18:40:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=3.84s]
Epoch 2: 29%|██▊ | 3545/12384 [7:31:14<18:40:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.84s]
Epoch 2: 29%|██▊ | 3545/12384 [7:31:22<18:40:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.98s]
Epoch 2: 29%|██▊ | 3546/12384 [7:31:22<18:40:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.98s]
Epoch 2: 29%|██▊ | 3546/12384 [7:31:29<18:40:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 29%|██▊ | 3547/12384 [7:31:29<18:40:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 29%|██▊ | 3547/12384 [7:31:37<18:40:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 29%|██▊ | 3548/12384 [7:31:37<18:41:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 29%|██▊ | 3548/12384 [7:31:45<18:41:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 29%|██▊ | 3549/12384 [7:31:45<18:41:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 29%|██▊ | 3549/12384 [7:31:52<18:41:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 29%|██▊ | 3550/12384 [7:31:52<18:42:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 29%|██▊ | 3550/12384 [7:32:00<18:42:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 2: 29%|██▊ | 3551/12384 [7:32:00<18:58:03, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 2: 29%|██▊ | 3551/12384 [7:32:08<18:58:03, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=9.62s]
Epoch 2: 29%|██▊ | 3552/12384 [7:32:08<18:53:03, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.62s]
Epoch 2: 29%|██▊ | 3552/12384 [7:32:16<18:53:03, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 29%|██▊ | 3553/12384 [7:32:16<18:52:11, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 29%|██▊ | 3553/12384 [7:32:23<18:52:11, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 2: 29%|██▊ | 3554/12384 [7:32:23<18:49:17, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 2: 29%|██▊ | 3554/12384 [7:32:31<18:49:17, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.59s]
Epoch 2: 29%|██▊ | 3555/12384 [7:32:31<18:46:41, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.59s]
Epoch 2: 29%|██▊ | 3555/12384 [7:32:38<18:46:41, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 2: 29%|██▊ | 3556/12384 [7:32:38<18:44:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 2: 29%|██▊ | 3556/12384 [7:32:46<18:44:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 29%|██▊ | 3557/12384 [7:32:46<18:43:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 29%|██▊ | 3557/12384 [7:32:54<18:43:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 29%|██▊ | 3558/12384 [7:32:54<18:42:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 29%|██▊ | 3558/12384 [7:33:02<18:42:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 29%|██▊ | 3559/12384 [7:33:02<18:54:52, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 29%|██▊ | 3559/12384 [7:33:09<18:54:52, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 29%|██▊ | 3560/12384 [7:33:09<18:49:27, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 29%|██▊ | 3560/12384 [7:33:17<18:49:27, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 29%|██▉ | 3561/12384 [7:33:17<18:49:05, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 29%|██▉ | 3561/12384 [7:33:24<18:49:05, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 2: 29%|██▉ | 3562/12384 [7:33:24<18:46:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 2: 29%|██▉ | 3562/12384 [7:33:32<18:46:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 2: 29%|██▉ | 3563/12384 [7:33:32<18:47:20, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 2: 29%|██▉ | 3563/12384 [7:33:40<18:47:20, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 29%|██▉ | 3564/12384 [7:33:40<18:46:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 29%|██▉ | 3564/12384 [7:33:47<18:46:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 29%|██▉ | 3565/12384 [7:33:47<18:43:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 29%|██▉ | 3565/12384 [7:33:55<18:43:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 2: 29%|██▉ | 3566/12384 [7:33:55<18:41:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 2: 29%|██▉ | 3566/12384 [7:34:03<18:41:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 2: 29%|██▉ | 3567/12384 [7:34:03<18:41:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 2: 29%|██▉ | 3567/12384 [7:34:10<18:41:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 29%|██▉ | 3568/12384 [7:34:10<18:39:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 29%|██▉ | 3568/12384 [7:34:18<18:39:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 29%|██▉ | 3569/12384 [7:34:18<18:38:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 29%|██▉ | 3569/12384 [7:34:25<18:38:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 2: 29%|██▉ | 3570/12384 [7:34:25<18:37:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 2: 29%|██▉ | 3570/12384 [7:34:33<18:37:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 29%|██▉ | 3571/12384 [7:34:33<18:38:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 29%|██▉ | 3571/12384 [7:34:41<18:38:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 2: 29%|██▉ | 3572/12384 [7:34:41<18:38:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 2: 29%|██▉ | 3572/12384 [7:34:48<18:38:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 2: 29%|██▉ | 3573/12384 [7:34:48<18:37:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 2: 29%|██▉ | 3573/12384 [7:34:56<18:37:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 2: 29%|██▉ | 3574/12384 [7:34:56<18:37:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 2: 29%|██▉ | 3574/12384 [7:35:03<18:37:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 29%|██▉ | 3575/12384 [7:35:03<18:38:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 29%|██▉ | 3575/12384 [7:35:11<18:38:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 29%|██▉ | 3576/12384 [7:35:11<18:39:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 29%|██▉ | 3576/12384 [7:35:19<18:39:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 29%|██▉ | 3577/12384 [7:35:19<18:52:54, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 29%|██▉ | 3577/12384 [7:35:27<18:52:54, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 2: 29%|██▉ | 3578/12384 [7:35:27<18:48:08, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 2: 29%|██▉ | 3578/12384 [7:35:34<18:48:08, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.86s]
Epoch 2: 29%|██▉ | 3579/12384 [7:35:34<18:44:02, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.86s]
Epoch 2: 29%|██▉ | 3579/12384 [7:35:42<18:44:02, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 2: 29%|██▉ | 3580/12384 [7:35:42<18:41:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 2: 29%|██▉ | 3580/12384 [7:35:50<18:41:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 29%|██▉ | 3581/12384 [7:35:50<18:42:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 29%|██▉ | 3581/12384 [7:35:57<18:42:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 29%|██▉ | 3582/12384 [7:35:57<18:40:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 29%|██▉ | 3582/12384 [7:36:05<18:40:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.21s]
Epoch 2: 29%|██▉ | 3583/12384 [7:36:05<18:38:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.21s]
Epoch 2: 29%|██▉ | 3583/12384 [7:36:12<18:38:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.54s]
Epoch 2: 29%|██▉ | 3584/12384 [7:36:12<18:37:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.54s]
Epoch 2: 29%|██▉ | 3584/12384 [7:36:20<18:37:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 2: 29%|██▉ | 3585/12384 [7:36:20<18:55:39, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 2: 29%|██▉ | 3585/12384 [7:36:28<18:55:39, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 29%|██▉ | 3586/12384 [7:36:28<18:54:17, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 29%|██▉ | 3586/12384 [7:36:36<18:54:17, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 2: 29%|██▉ | 3587/12384 [7:36:36<18:49:47, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 2: 29%|██▉ | 3587/12384 [7:36:43<18:49:47, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 2: 29%|██▉ | 3588/12384 [7:36:43<18:46:59, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 2: 29%|██▉ | 3588/12384 [7:36:51<18:46:59, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 2: 29%|██▉ | 3589/12384 [7:36:51<18:43:34, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 2: 29%|██▉ | 3589/12384 [7:36:59<18:43:34, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 29%|██▉ | 3590/12384 [7:36:59<18:40:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 29%|██▉ | 3590/12384 [7:37:06<18:40:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=3.97s]
Epoch 2: 29%|██▉ | 3591/12384 [7:37:06<18:38:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.97s]
Epoch 2: 29%|██▉ | 3591/12384 [7:37:14<18:38:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.17s]
Epoch 2: 29%|██▉ | 3592/12384 [7:37:14<18:37:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.17s]
Epoch 2: 29%|██▉ | 3592/12384 [7:37:21<18:37:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.13s]
Epoch 2: 29%|██▉ | 3593/12384 [7:37:21<18:36:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.13s]
Epoch 2: 29%|██▉ | 3593/12384 [7:37:29<18:36:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 2: 29%|██▉ | 3594/12384 [7:37:29<18:37:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 2: 29%|██▉ | 3594/12384 [7:37:37<18:37:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 29%|██▉ | 3595/12384 [7:37:37<18:36:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 29%|██▉ | 3595/12384 [7:37:44<18:36:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.59s]
Epoch 2: 29%|██▉ | 3596/12384 [7:37:44<18:36:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.59s]
Epoch 2: 29%|██▉ | 3596/12384 [7:37:52<18:36:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 29%|██▉ | 3597/12384 [7:37:52<18:34:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 29%|██▉ | 3597/12384 [7:37:59<18:34:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 2: 29%|██▉ | 3598/12384 [7:37:59<18:33:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 2: 29%|██▉ | 3598/12384 [7:38:07<18:33:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 29%|██▉ | 3599/12384 [7:38:07<18:33:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 29%|██▉ | 3599/12384 [7:38:15<18:33:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 29%|██▉ | 3600/12384 [7:38:15<18:33:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 29%|██▉ | 3600/12384 [7:38:22<18:33:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.91s]
Epoch 2: 29%|██▉ | 3601/12384 [7:38:22<18:32:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.91s]
Epoch 2: 29%|██▉ | 3601/12384 [7:38:30<18:32:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 2: 29%|██▉ | 3602/12384 [7:38:30<18:31:57, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 2: 29%|██▉ | 3602/12384 [7:38:38<18:31:57, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 29%|██▉ | 3603/12384 [7:38:38<18:47:43, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 29%|██▉ | 3603/12384 [7:38:45<18:47:43, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 29%|██▉ | 3604/12384 [7:38:45<18:43:16, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 29%|██▉ | 3604/12384 [7:38:53<18:43:16, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 29%|██▉ | 3605/12384 [7:38:53<18:44:07, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 29%|██▉ | 3605/12384 [7:39:01<18:44:07, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 29%|██▉ | 3606/12384 [7:39:01<18:40:23, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 29%|██▉ | 3606/12384 [7:39:08<18:40:23, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 29%|██▉ | 3607/12384 [7:39:08<18:38:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 29%|██▉ | 3607/12384 [7:39:16<18:38:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.78s]
Epoch 2: 29%|██▉ | 3608/12384 [7:39:16<18:37:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.78s]
Epoch 2: 29%|██▉ | 3608/12384 [7:39:24<18:37:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 29%|██▉ | 3609/12384 [7:39:24<18:35:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 29%|██▉ | 3609/12384 [7:39:31<18:35:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 29%|██▉ | 3610/12384 [7:39:31<18:34:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 29%|██▉ | 3610/12384 [7:39:39<18:34:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 2: 29%|██▉ | 3611/12384 [7:39:39<18:49:22, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 2: 29%|██▉ | 3611/12384 [7:39:47<18:49:22, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 29%|██▉ | 3612/12384 [7:39:47<18:43:01, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 29%|██▉ | 3612/12384 [7:39:54<18:43:01, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 29%|██▉ | 3613/12384 [7:39:54<18:39:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 29%|██▉ | 3613/12384 [7:40:02<18:39:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 29%|██▉ | 3614/12384 [7:40:02<18:37:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 29%|██▉ | 3614/12384 [7:40:10<18:37:52, 7.65s/it, loss=0.0007, acc=0.9971, iter_time=8.54s]
Epoch 2: 29%|██▉ | 3615/12384 [7:40:10<18:39:49, 7.66s/it, loss=0.0007, acc=0.9971, iter_time=8.54s]
Epoch 2: 29%|██▉ | 3615/12384 [7:40:17<18:39:49, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 2: 29%|██▉ | 3616/12384 [7:40:17<18:40:34, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 2: 29%|██▉ | 3616/12384 [7:40:25<18:40:34, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 29%|██▉ | 3617/12384 [7:40:25<18:38:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 29%|██▉ | 3617/12384 [7:40:33<18:38:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 29%|██▉ | 3618/12384 [7:40:33<18:36:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 29%|██▉ | 3618/12384 [7:40:40<18:36:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 2: 29%|██▉ | 3619/12384 [7:40:40<18:35:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 2: 29%|██▉ | 3619/12384 [7:40:48<18:35:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 29%|██▉ | 3620/12384 [7:40:48<18:32:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 29%|██▉ | 3620/12384 [7:40:55<18:32:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 2: 29%|██▉ | 3621/12384 [7:40:55<18:30:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 2: 29%|██▉ | 3621/12384 [7:41:03<18:30:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 29%|██▉ | 3622/12384 [7:41:03<18:30:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 29%|██▉ | 3622/12384 [7:41:11<18:30:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 29%|██▉ | 3623/12384 [7:41:11<18:30:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 29%|██▉ | 3623/12384 [7:41:18<18:30:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 29%|██▉ | 3624/12384 [7:41:18<18:30:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 29%|██▉ | 3624/12384 [7:41:26<18:30:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.97s]
Epoch 2: 29%|██▉ | 3625/12384 [7:41:26<18:30:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.97s]
Epoch 2: 29%|██▉ | 3625/12384 [7:41:33<18:30:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 2: 29%|██▉ | 3626/12384 [7:41:33<18:30:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 2: 29%|██▉ | 3626/12384 [7:41:41<18:30:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 29%|██▉ | 3627/12384 [7:41:41<18:30:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 29%|██▉ | 3627/12384 [7:41:49<18:30:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.57s]
Epoch 2: 29%|██▉ | 3628/12384 [7:41:49<18:31:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.57s]
Epoch 2: 29%|██▉ | 3628/12384 [7:41:57<18:31:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 2: 29%|██▉ | 3629/12384 [7:41:57<18:45:15, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 2: 29%|██▉ | 3629/12384 [7:42:04<18:45:15, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.66s]
Epoch 2: 29%|██▉ | 3630/12384 [7:42:04<18:40:00, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.66s]
Epoch 2: 29%|██▉ | 3630/12384 [7:42:12<18:40:00, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 2: 29%|██▉ | 3631/12384 [7:42:12<18:37:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 2: 29%|██▉ | 3631/12384 [7:42:19<18:37:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 29%|██▉ | 3632/12384 [7:42:19<18:35:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 29%|██▉ | 3632/12384 [7:42:27<18:35:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 29%|██▉ | 3633/12384 [7:42:27<18:32:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 29%|██▉ | 3633/12384 [7:42:35<18:32:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 2: 29%|██▉ | 3634/12384 [7:42:35<18:31:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 2: 29%|██▉ | 3634/12384 [7:42:42<18:31:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 2: 29%|██▉ | 3635/12384 [7:42:42<18:31:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 2: 29%|██▉ | 3635/12384 [7:42:50<18:31:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.86s]
Epoch 2: 29%|██▉ | 3636/12384 [7:42:50<18:30:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.86s]
Epoch 2: 29%|██▉ | 3636/12384 [7:42:58<18:30:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.65s]
Epoch 2: 29%|██▉ | 3637/12384 [7:42:58<18:42:12, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=11.65s]
Epoch 2: 29%|██▉ | 3637/12384 [7:43:05<18:42:12, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 29%|██▉ | 3638/12384 [7:43:05<18:37:47, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 29%|██▉ | 3638/12384 [7:43:13<18:37:47, 7.67s/it, loss=0.0013, acc=0.9971, iter_time=5.82s]
Epoch 2: 29%|██▉ | 3639/12384 [7:43:13<18:35:06, 7.65s/it, loss=0.0013, acc=0.9971, iter_time=5.82s]
Epoch 2: 29%|██▉ | 3639/12384 [7:43:20<18:35:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.47s]
Epoch 2: 29%|██▉ | 3640/12384 [7:43:20<18:33:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.47s]
Epoch 2: 29%|██▉ | 3640/12384 [7:43:28<18:33:14, 7.64s/it, loss=0.0005, acc=0.9993, iter_time=7.51s]
Epoch 2: 29%|██▉ | 3641/12384 [7:43:28<18:31:17, 7.63s/it, loss=0.0005, acc=0.9993, iter_time=7.51s]
Epoch 2: 29%|██▉ | 3641/12384 [7:43:36<18:31:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 29%|██▉ | 3642/12384 [7:43:36<18:30:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 29%|██▉ | 3642/12384 [7:43:43<18:30:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 29%|██▉ | 3643/12384 [7:43:43<18:29:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 29%|██▉ | 3643/12384 [7:43:51<18:29:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 2: 29%|██▉ | 3644/12384 [7:43:51<18:29:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 2: 29%|██▉ | 3644/12384 [7:43:59<18:29:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 2: 29%|██▉ | 3645/12384 [7:43:59<18:31:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 2: 29%|██▉ | 3645/12384 [7:44:06<18:31:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 2: 29%|██▉ | 3646/12384 [7:44:06<18:30:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 2: 29%|██▉ | 3646/12384 [7:44:14<18:30:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 2: 29%|██▉ | 3647/12384 [7:44:14<18:28:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 2: 29%|██▉ | 3647/12384 [7:44:21<18:28:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 29%|██▉ | 3648/12384 [7:44:21<18:28:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 29%|██▉ | 3648/12384 [7:44:29<18:28:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 29%|██▉ | 3649/12384 [7:44:29<18:27:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 29%|██▉ | 3649/12384 [7:44:37<18:27:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 29%|██▉ | 3650/12384 [7:44:37<18:29:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 29%|██▉ | 3650/12384 [7:44:44<18:29:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.46s]
Epoch 2: 29%|██▉ | 3651/12384 [7:44:44<18:28:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.46s]
Epoch 2: 29%|██▉ | 3651/12384 [7:44:52<18:28:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 29%|██▉ | 3652/12384 [7:44:52<18:27:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 29%|██▉ | 3652/12384 [7:44:59<18:27:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 29%|██▉ | 3653/12384 [7:44:59<18:27:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 29%|██▉ | 3653/12384 [7:45:07<18:27:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 30%|██▉ | 3654/12384 [7:45:07<18:26:27, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 30%|██▉ | 3654/12384 [7:45:15<18:26:27, 7.60s/it, loss=0.0001, acc=0.9996, iter_time=7.03s]
Epoch 2: 30%|██▉ | 3655/12384 [7:45:15<18:26:38, 7.61s/it, loss=0.0001, acc=0.9996, iter_time=7.03s]
Epoch 2: 30%|██▉ | 3655/12384 [7:45:23<18:26:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.62s]
Epoch 2: 30%|██▉ | 3656/12384 [7:45:23<18:39:15, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.62s]
Epoch 2: 30%|██▉ | 3656/12384 [7:45:30<18:39:15, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.18s]
Epoch 2: 30%|██▉ | 3657/12384 [7:45:30<18:35:25, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.18s]
Epoch 2: 30%|██▉ | 3657/12384 [7:45:38<18:35:25, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 30%|██▉ | 3658/12384 [7:45:38<18:32:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 30%|██▉ | 3658/12384 [7:45:45<18:32:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 2: 30%|██▉ | 3659/12384 [7:45:45<18:30:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 2: 30%|██▉ | 3659/12384 [7:45:53<18:30:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 30%|██▉ | 3660/12384 [7:45:53<18:29:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 30%|██▉ | 3660/12384 [7:46:01<18:29:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 30%|██▉ | 3661/12384 [7:46:01<18:28:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 30%|██▉ | 3661/12384 [7:46:08<18:28:26, 7.62s/it, loss=0.0004, acc=0.9985, iter_time=7.63s]
Epoch 2: 30%|██▉ | 3662/12384 [7:46:08<18:27:33, 7.62s/it, loss=0.0004, acc=0.9985, iter_time=7.63s]
Epoch 2: 30%|██▉ | 3662/12384 [7:46:16<18:27:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 30%|██▉ | 3663/12384 [7:46:16<18:29:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 30%|██▉ | 3663/12384 [7:46:23<18:29:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 30%|██▉ | 3664/12384 [7:46:23<18:28:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 30%|██▉ | 3664/12384 [7:46:31<18:28:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 2: 30%|██▉ | 3665/12384 [7:46:31<18:27:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 2: 30%|██▉ | 3665/12384 [7:46:39<18:27:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 2: 30%|██▉ | 3666/12384 [7:46:39<18:26:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 2: 30%|██▉ | 3666/12384 [7:46:46<18:26:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 30%|██▉ | 3667/12384 [7:46:46<18:25:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 30%|██▉ | 3667/12384 [7:46:54<18:25:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 30%|██▉ | 3668/12384 [7:46:54<18:25:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 30%|██▉ | 3668/12384 [7:47:02<18:25:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 30%|██▉ | 3669/12384 [7:47:02<18:26:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 30%|██▉ | 3669/12384 [7:47:09<18:26:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 30%|██▉ | 3670/12384 [7:47:09<18:25:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 30%|██▉ | 3670/12384 [7:47:17<18:25:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 30%|██▉ | 3671/12384 [7:47:17<18:25:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 30%|██▉ | 3671/12384 [7:47:24<18:25:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 30%|██▉ | 3672/12384 [7:47:24<18:27:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 30%|██▉ | 3672/12384 [7:47:32<18:27:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 30%|██▉ | 3673/12384 [7:47:32<18:27:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 30%|██▉ | 3673/12384 [7:47:40<18:27:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.13s]
Epoch 2: 30%|██▉ | 3674/12384 [7:47:40<18:26:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.13s]
Epoch 2: 30%|██▉ | 3674/12384 [7:47:47<18:26:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 2: 30%|██▉ | 3675/12384 [7:47:47<18:26:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 2: 30%|██▉ | 3675/12384 [7:47:55<18:26:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 30%|██▉ | 3676/12384 [7:47:55<18:25:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 30%|██▉ | 3676/12384 [7:48:02<18:25:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 30%|██▉ | 3677/12384 [7:48:02<18:24:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 30%|██▉ | 3677/12384 [7:48:10<18:24:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 30%|██▉ | 3678/12384 [7:48:10<18:27:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 30%|██▉ | 3678/12384 [7:48:18<18:27:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 30%|██▉ | 3679/12384 [7:48:18<18:26:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 30%|██▉ | 3679/12384 [7:48:25<18:26:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 30%|██▉ | 3680/12384 [7:48:25<18:26:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 30%|██▉ | 3680/12384 [7:48:33<18:26:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 30%|██▉ | 3681/12384 [7:48:33<18:26:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 30%|██▉ | 3681/12384 [7:48:41<18:26:26, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.35s]
Epoch 2: 30%|██▉ | 3682/12384 [7:48:41<18:39:26, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=8.35s]
Epoch 2: 30%|██▉ | 3682/12384 [7:48:49<18:39:26, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 30%|██▉ | 3683/12384 [7:48:49<18:34:47, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 30%|██▉ | 3683/12384 [7:48:56<18:34:47, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 30%|██▉ | 3684/12384 [7:48:56<18:31:45, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 30%|██▉ | 3684/12384 [7:49:04<18:31:45, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 2: 30%|██▉ | 3685/12384 [7:49:04<18:29:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 2: 30%|██▉ | 3685/12384 [7:49:11<18:29:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 30%|██▉ | 3686/12384 [7:49:11<18:27:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 30%|██▉ | 3686/12384 [7:49:19<18:27:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 30%|██▉ | 3687/12384 [7:49:19<18:26:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 30%|██▉ | 3687/12384 [7:49:27<18:26:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 30%|██▉ | 3688/12384 [7:49:27<18:25:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 30%|██▉ | 3688/12384 [7:49:34<18:25:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 30%|██▉ | 3689/12384 [7:49:34<18:23:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 30%|██▉ | 3689/12384 [7:49:42<18:23:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 2: 30%|██▉ | 3690/12384 [7:49:42<18:35:55, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 2: 30%|██▉ | 3690/12384 [7:49:50<18:35:55, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 2: 30%|██▉ | 3691/12384 [7:49:50<18:31:16, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 2: 30%|██▉ | 3691/12384 [7:49:57<18:31:16, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 2: 30%|██▉ | 3692/12384 [7:49:57<18:30:54, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 2: 30%|██▉ | 3692/12384 [7:50:05<18:30:54, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.52s]
Epoch 2: 30%|██▉ | 3693/12384 [7:50:05<18:27:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.52s]
Epoch 2: 30%|██▉ | 3693/12384 [7:50:13<18:27:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.71s]
Epoch 2: 30%|██▉ | 3694/12384 [7:50:13<18:26:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.71s]
Epoch 2: 30%|██▉ | 3694/12384 [7:50:20<18:26:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 30%|██▉ | 3695/12384 [7:50:20<18:24:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 30%|██▉ | 3695/12384 [7:50:28<18:24:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 30%|██▉ | 3696/12384 [7:50:28<18:23:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 30%|██▉ | 3696/12384 [7:50:35<18:23:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.68s]
Epoch 2: 30%|██▉ | 3697/12384 [7:50:35<18:22:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.68s]
Epoch 2: 30%|██▉ | 3697/12384 [7:50:43<18:22:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 2: 30%|██▉ | 3698/12384 [7:50:43<18:22:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 2: 30%|██▉ | 3698/12384 [7:50:51<18:22:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 30%|██▉ | 3699/12384 [7:50:51<18:22:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 30%|██▉ | 3699/12384 [7:50:58<18:22:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 30%|██▉ | 3700/12384 [7:50:58<18:21:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 30%|██▉ | 3700/12384 [7:51:06<18:21:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.26s]
Epoch 2: 30%|██▉ | 3701/12384 [7:51:06<18:21:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.26s]
Epoch 2: 30%|██▉ | 3701/12384 [7:51:13<18:21:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 2: 30%|██▉ | 3702/12384 [7:51:13<18:21:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 2: 30%|██▉ | 3702/12384 [7:51:21<18:21:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 30%|██▉ | 3703/12384 [7:51:21<18:21:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 30%|██▉ | 3703/12384 [7:51:29<18:21:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 30%|██▉ | 3704/12384 [7:51:29<18:20:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 30%|██▉ | 3704/12384 [7:51:36<18:20:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 30%|██▉ | 3705/12384 [7:51:36<18:19:54, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 30%|██▉ | 3705/12384 [7:51:44<18:19:54, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.06s]
Epoch 2: 30%|██▉ | 3706/12384 [7:51:44<18:19:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.06s]
Epoch 2: 30%|██▉ | 3706/12384 [7:51:51<18:19:57, 7.61s/it, loss=0.0007, acc=0.9973, iter_time=11.14s]
Epoch 2: 30%|██▉ | 3707/12384 [7:51:51<18:19:29, 7.60s/it, loss=0.0007, acc=0.9973, iter_time=11.14s]
Epoch 2: 30%|██▉ | 3707/12384 [7:51:59<18:19:29, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 30%|██▉ | 3708/12384 [7:51:59<18:19:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 30%|██▉ | 3708/12384 [7:52:07<18:19:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 30%|██▉ | 3709/12384 [7:52:07<18:34:10, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 30%|██▉ | 3709/12384 [7:52:15<18:34:10, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 30%|██▉ | 3710/12384 [7:52:15<18:30:26, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 30%|██▉ | 3710/12384 [7:52:22<18:30:26, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 30%|██▉ | 3711/12384 [7:52:22<18:27:08, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 30%|██▉ | 3711/12384 [7:52:30<18:27:08, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.57s]
Epoch 2: 30%|██▉ | 3712/12384 [7:52:30<18:25:55, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.57s]
Epoch 2: 30%|██▉ | 3712/12384 [7:52:38<18:25:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 30%|██▉ | 3713/12384 [7:52:38<18:23:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 30%|██▉ | 3713/12384 [7:52:45<18:23:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 2: 30%|██▉ | 3714/12384 [7:52:45<18:21:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 2: 30%|██▉ | 3714/12384 [7:52:53<18:21:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 2: 30%|██▉ | 3715/12384 [7:52:53<18:21:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 2: 30%|██▉ | 3715/12384 [7:53:00<18:21:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 2: 30%|███ | 3716/12384 [7:53:00<18:21:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 2: 30%|███ | 3716/12384 [7:53:08<18:21:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 2: 30%|███ | 3717/12384 [7:53:08<18:33:55, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 2: 30%|███ | 3717/12384 [7:53:16<18:33:55, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 30%|███ | 3718/12384 [7:53:16<18:32:20, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 30%|███ | 3718/12384 [7:53:24<18:32:20, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 2: 30%|███ | 3719/12384 [7:53:24<18:31:47, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 2: 30%|███ | 3719/12384 [7:53:31<18:31:47, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 30%|███ | 3720/12384 [7:53:31<18:28:48, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 30%|███ | 3720/12384 [7:53:39<18:28:48, 7.68s/it, loss=0.0004, acc=0.9980, iter_time=6.66s]
Epoch 2: 30%|███ | 3721/12384 [7:53:39<18:26:01, 7.66s/it, loss=0.0004, acc=0.9980, iter_time=6.66s]
Epoch 2: 30%|███ | 3721/12384 [7:53:46<18:26:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 2: 30%|███ | 3722/12384 [7:53:46<18:23:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 2: 30%|███ | 3722/12384 [7:53:54<18:23:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 30%|███ | 3723/12384 [7:53:54<18:21:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 30%|███ | 3723/12384 [7:54:02<18:21:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.25s]
Epoch 2: 30%|███ | 3724/12384 [7:54:02<18:20:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.25s]
Epoch 2: 30%|███ | 3724/12384 [7:54:09<18:20:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 2: 30%|███ | 3725/12384 [7:54:09<18:20:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 2: 30%|███ | 3725/12384 [7:54:17<18:20:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 30%|███ | 3726/12384 [7:54:17<18:19:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 30%|███ | 3726/12384 [7:54:25<18:19:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 2: 30%|███ | 3727/12384 [7:54:25<18:19:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 2: 30%|███ | 3727/12384 [7:54:32<18:19:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 2: 30%|███ | 3728/12384 [7:54:32<18:18:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 2: 30%|███ | 3728/12384 [7:54:40<18:18:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 30%|███ | 3729/12384 [7:54:40<18:17:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 30%|███ | 3729/12384 [7:54:47<18:17:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 30%|███ | 3730/12384 [7:54:47<18:18:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 30%|███ | 3730/12384 [7:54:55<18:18:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 30%|███ | 3731/12384 [7:54:55<18:18:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 30%|███ | 3731/12384 [7:55:03<18:18:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 30%|███ | 3732/12384 [7:55:03<18:27:02, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 30%|███ | 3732/12384 [7:55:10<18:27:02, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.25s]
Epoch 2: 30%|███ | 3733/12384 [7:55:10<18:23:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.25s]
Epoch 2: 30%|███ | 3733/12384 [7:55:18<18:23:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.82s]
Epoch 2: 30%|███ | 3734/12384 [7:55:18<18:24:28, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.82s]
Epoch 2: 30%|███ | 3734/12384 [7:55:26<18:24:28, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 2: 30%|███ | 3735/12384 [7:55:26<18:36:31, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 2: 30%|███ | 3735/12384 [7:55:34<18:36:31, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=9.22s]
Epoch 2: 30%|███ | 3736/12384 [7:55:34<18:29:42, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.22s]
Epoch 2: 30%|███ | 3736/12384 [7:55:41<18:29:42, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 30%|███ | 3737/12384 [7:55:41<18:25:10, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 30%|███ | 3737/12384 [7:55:49<18:25:10, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 30%|███ | 3738/12384 [7:55:49<18:23:56, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 30%|███ | 3738/12384 [7:55:56<18:23:56, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 30%|███ | 3739/12384 [7:55:56<18:21:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 30%|███ | 3739/12384 [7:56:04<18:21:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 30%|███ | 3740/12384 [7:56:04<18:20:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 30%|███ | 3740/12384 [7:56:12<18:20:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 30%|███ | 3741/12384 [7:56:12<18:18:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 30%|███ | 3741/12384 [7:56:19<18:18:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 2: 30%|███ | 3742/12384 [7:56:19<18:17:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 2: 30%|███ | 3742/12384 [7:56:27<18:17:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.95s]
Epoch 2: 30%|███ | 3743/12384 [7:56:27<18:17:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.95s]
Epoch 2: 30%|███ | 3743/12384 [7:56:35<18:17:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.58s]
Epoch 2: 30%|███ | 3744/12384 [7:56:35<18:15:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.58s]
Epoch 2: 30%|███ | 3744/12384 [7:56:42<18:15:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 30%|███ | 3745/12384 [7:56:42<18:14:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 30%|███ | 3745/12384 [7:56:50<18:14:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 2: 30%|███ | 3746/12384 [7:56:50<18:15:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 2: 30%|███ | 3746/12384 [7:56:57<18:15:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.60s]
Epoch 2: 30%|███ | 3747/12384 [7:56:57<18:14:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.60s]
Epoch 2: 30%|███ | 3747/12384 [7:57:05<18:14:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 30%|███ | 3748/12384 [7:57:05<18:15:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 30%|███ | 3748/12384 [7:57:13<18:15:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 30%|███ | 3749/12384 [7:57:13<18:19:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 30%|███ | 3749/12384 [7:57:20<18:19:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.11s]
Epoch 2: 30%|███ | 3750/12384 [7:57:20<18:19:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.11s]
Epoch 2: 30%|███ | 3750/12384 [7:57:28<18:19:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.96s]
Epoch 2: 30%|███ | 3751/12384 [7:57:28<18:23:00, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.96s]
Epoch 2: 30%|███ | 3751/12384 [7:57:36<18:23:00, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=9.93s]
Epoch 2: 30%|███ | 3752/12384 [7:57:36<18:20:02, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=9.93s]
Epoch 2: 30%|███ | 3752/12384 [7:57:43<18:20:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 2: 30%|███ | 3753/12384 [7:57:43<18:19:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 2: 30%|███ | 3753/12384 [7:57:51<18:19:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 2: 30%|███ | 3754/12384 [7:57:51<18:17:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 2: 30%|███ | 3754/12384 [7:57:58<18:17:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 2: 30%|███ | 3755/12384 [7:57:58<18:15:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 2: 30%|███ | 3755/12384 [7:58:06<18:15:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 2: 30%|███ | 3756/12384 [7:58:06<18:14:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 2: 30%|███ | 3756/12384 [7:58:14<18:14:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 30%|███ | 3757/12384 [7:58:14<18:15:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 30%|███ | 3757/12384 [7:58:21<18:15:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 30%|███ | 3758/12384 [7:58:21<18:14:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 30%|███ | 3758/12384 [7:58:29<18:14:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 30%|███ | 3759/12384 [7:58:29<18:14:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 30%|███ | 3759/12384 [7:58:36<18:14:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 30%|███ | 3760/12384 [7:58:36<18:13:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 30%|███ | 3760/12384 [7:58:44<18:13:54, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=6.74s]
Epoch 2: 30%|███ | 3761/12384 [7:58:44<18:27:19, 7.70s/it, loss=0.0001, acc=0.9998, iter_time=6.74s]
Epoch 2: 30%|███ | 3761/12384 [7:58:52<18:27:19, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=8.83s]
Epoch 2: 30%|███ | 3762/12384 [7:58:52<18:22:19, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=8.83s]
Epoch 2: 30%|███ | 3762/12384 [7:59:00<18:22:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 30%|███ | 3763/12384 [7:59:00<18:19:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 30%|███ | 3763/12384 [7:59:07<18:19:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 30%|███ | 3764/12384 [7:59:07<18:19:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 30%|███ | 3764/12384 [7:59:15<18:19:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 30%|███ | 3765/12384 [7:59:15<18:17:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 30%|███ | 3765/12384 [7:59:22<18:17:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 2: 30%|███ | 3766/12384 [7:59:22<18:16:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 2: 30%|███ | 3766/12384 [7:59:30<18:16:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.70s]
Epoch 2: 30%|███ | 3767/12384 [7:59:30<18:27:22, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.70s]
Epoch 2: 30%|███ | 3767/12384 [7:59:38<18:27:22, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 30%|███ | 3768/12384 [7:59:38<18:22:07, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 30%|███ | 3768/12384 [7:59:46<18:22:07, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 2: 30%|███ | 3769/12384 [7:59:46<18:19:46, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 2: 30%|███ | 3769/12384 [7:59:53<18:19:46, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 30%|███ | 3770/12384 [7:59:53<18:17:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 30%|███ | 3770/12384 [8:00:01<18:17:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 30%|███ | 3771/12384 [8:00:01<18:15:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 30%|███ | 3771/12384 [8:00:08<18:15:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 30%|███ | 3772/12384 [8:00:08<18:14:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 30%|███ | 3772/12384 [8:00:16<18:14:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.00s]
Epoch 2: 30%|███ | 3773/12384 [8:00:16<18:13:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.00s]
Epoch 2: 30%|███ | 3773/12384 [8:00:24<18:13:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.18s]
Epoch 2: 30%|███ | 3774/12384 [8:00:24<18:13:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.18s]
Epoch 2: 30%|███ | 3774/12384 [8:00:31<18:13:54, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 2: 30%|███ | 3775/12384 [8:00:31<18:14:04, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 2: 30%|███ | 3775/12384 [8:00:39<18:14:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 30%|███ | 3776/12384 [8:00:39<18:16:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 30%|███ | 3776/12384 [8:00:47<18:16:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 2: 30%|███ | 3777/12384 [8:00:47<18:15:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 2: 30%|███ | 3777/12384 [8:00:54<18:15:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.89s]
Epoch 2: 31%|███ | 3778/12384 [8:00:54<18:14:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.89s]
Epoch 2: 31%|███ | 3778/12384 [8:01:02<18:14:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.35s]
Epoch 2: 31%|███ | 3779/12384 [8:01:02<18:13:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.35s]
Epoch 2: 31%|███ | 3779/12384 [8:01:09<18:13:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 31%|███ | 3780/12384 [8:01:09<18:13:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 31%|███ | 3780/12384 [8:01:17<18:13:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 2: 31%|███ | 3781/12384 [8:01:17<18:13:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 2: 31%|███ | 3781/12384 [8:01:25<18:13:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.54s]
Epoch 2: 31%|███ | 3782/12384 [8:01:25<18:11:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.54s]
Epoch 2: 31%|███ | 3782/12384 [8:01:32<18:11:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 31%|███ | 3783/12384 [8:01:32<18:11:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 31%|███ | 3783/12384 [8:01:40<18:11:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 31%|███ | 3784/12384 [8:01:40<18:11:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 31%|███ | 3784/12384 [8:01:47<18:11:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.92s]
Epoch 2: 31%|███ | 3785/12384 [8:01:47<18:09:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.92s]
Epoch 2: 31%|███ | 3785/12384 [8:01:55<18:09:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 31%|███ | 3786/12384 [8:01:55<18:09:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 31%|███ | 3786/12384 [8:02:03<18:09:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 31%|███ | 3787/12384 [8:02:03<18:26:35, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 31%|███ | 3787/12384 [8:02:11<18:26:35, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 31%|███ | 3788/12384 [8:02:11<18:22:04, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 31%|███ | 3788/12384 [8:02:18<18:22:04, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 31%|███ | 3789/12384 [8:02:18<18:18:24, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 31%|███ | 3789/12384 [8:02:26<18:18:24, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 31%|███ | 3790/12384 [8:02:26<18:14:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 31%|███ | 3790/12384 [8:02:33<18:14:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 2: 31%|███ | 3791/12384 [8:02:33<18:13:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 2: 31%|███ | 3791/12384 [8:02:41<18:13:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 2: 31%|███ | 3792/12384 [8:02:41<18:11:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 2: 31%|███ | 3792/12384 [8:02:49<18:11:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 2: 31%|███ | 3793/12384 [8:02:49<18:23:15, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 2: 31%|███ | 3793/12384 [8:02:57<18:23:15, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 31%|███ | 3794/12384 [8:02:57<18:19:38, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 31%|███ | 3794/12384 [8:03:04<18:19:38, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 31%|███ | 3795/12384 [8:03:04<18:16:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 31%|███ | 3795/12384 [8:03:12<18:16:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 31%|███ | 3796/12384 [8:03:12<18:14:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 31%|███ | 3796/12384 [8:03:20<18:14:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 31%|███ | 3797/12384 [8:03:20<18:16:04, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 31%|███ | 3797/12384 [8:03:27<18:16:04, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 31%|███ | 3798/12384 [8:03:27<18:13:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 31%|███ | 3798/12384 [8:03:35<18:13:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 31%|███ | 3799/12384 [8:03:35<18:12:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 31%|███ | 3799/12384 [8:03:42<18:12:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 31%|███ | 3800/12384 [8:03:42<18:11:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 31%|███ | 3800/12384 [8:03:50<18:11:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 2: 31%|███ | 3801/12384 [8:03:50<18:15:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 2: 31%|███ | 3801/12384 [8:03:58<18:15:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 31%|███ | 3802/12384 [8:03:58<18:13:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 31%|███ | 3802/12384 [8:04:05<18:13:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 2: 31%|███ | 3803/12384 [8:04:05<18:12:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 2: 31%|███ | 3803/12384 [8:04:13<18:12:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 2: 31%|███ | 3804/12384 [8:04:13<18:10:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 2: 31%|███ | 3804/12384 [8:04:21<18:10:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.72s]
Epoch 2: 31%|███ | 3805/12384 [8:04:21<18:09:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.72s]
Epoch 2: 31%|███ | 3805/12384 [8:04:28<18:09:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 31%|███ | 3806/12384 [8:04:28<18:09:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 31%|███ | 3806/12384 [8:04:36<18:09:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 31%|███ | 3807/12384 [8:04:36<18:09:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 31%|███ | 3807/12384 [8:04:43<18:09:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 31%|███ | 3808/12384 [8:04:43<18:08:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 31%|███ | 3808/12384 [8:04:51<18:08:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.36s]
Epoch 2: 31%|███ | 3809/12384 [8:04:51<18:06:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.36s]
Epoch 2: 31%|███ | 3809/12384 [8:04:59<18:06:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 31%|███ | 3810/12384 [8:04:59<18:08:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 31%|███ | 3810/12384 [8:05:06<18:08:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 31%|███ | 3811/12384 [8:05:06<18:07:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 31%|███ | 3811/12384 [8:05:14<18:07:30, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.98s]
Epoch 2: 31%|███ | 3812/12384 [8:05:14<18:07:25, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.98s]
Epoch 2: 31%|███ | 3812/12384 [8:05:22<18:07:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 31%|███ | 3813/12384 [8:05:22<18:22:48, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 31%|███ | 3813/12384 [8:05:29<18:22:48, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.86s]
Epoch 2: 31%|███ | 3814/12384 [8:05:29<18:18:09, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.86s]
Epoch 2: 31%|███ | 3814/12384 [8:05:37<18:18:09, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 2: 31%|███ | 3815/12384 [8:05:37<18:13:48, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 2: 31%|███ | 3815/12384 [8:05:45<18:13:48, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 31%|███ | 3816/12384 [8:05:45<18:13:10, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 31%|███ | 3816/12384 [8:05:52<18:13:10, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 31%|███ | 3817/12384 [8:05:52<18:11:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 31%|███ | 3817/12384 [8:06:00<18:11:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 31%|███ | 3818/12384 [8:06:00<18:10:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 31%|███ | 3818/12384 [8:06:08<18:10:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 2: 31%|███ | 3819/12384 [8:06:08<18:10:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 2: 31%|███ | 3819/12384 [8:06:15<18:10:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 2: 31%|███ | 3820/12384 [8:06:15<18:08:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 2: 31%|███ | 3820/12384 [8:06:23<18:08:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 31%|███ | 3821/12384 [8:06:23<18:09:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 31%|███ | 3821/12384 [8:06:30<18:09:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 31%|███ | 3822/12384 [8:06:30<18:08:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 31%|███ | 3822/12384 [8:06:38<18:08:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 31%|███ | 3823/12384 [8:06:38<18:07:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 31%|███ | 3823/12384 [8:06:46<18:07:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 31%|███ | 3824/12384 [8:06:46<18:06:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 31%|███ | 3824/12384 [8:06:53<18:06:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.71s]
Epoch 2: 31%|███ | 3825/12384 [8:06:53<18:06:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.71s]
Epoch 2: 31%|███ | 3825/12384 [8:07:01<18:06:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 2: 31%|███ | 3826/12384 [8:07:01<18:06:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 2: 31%|███ | 3826/12384 [8:07:08<18:06:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 31%|███ | 3827/12384 [8:07:08<18:04:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 31%|███ | 3827/12384 [8:07:16<18:04:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 2: 31%|███ | 3828/12384 [8:07:16<18:04:23, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 2: 31%|███ | 3828/12384 [8:07:24<18:04:23, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 31%|███ | 3829/12384 [8:07:24<18:04:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 31%|███ | 3829/12384 [8:07:31<18:04:34, 7.61s/it, loss=0.0002, acc=0.9990, iter_time=7.60s]
Epoch 2: 31%|███ | 3830/12384 [8:07:31<18:06:23, 7.62s/it, loss=0.0002, acc=0.9990, iter_time=7.60s]
Epoch 2: 31%|███ | 3830/12384 [8:07:39<18:06:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 31%|███ | 3831/12384 [8:07:39<18:06:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 31%|███ | 3831/12384 [8:07:47<18:06:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 31%|███ | 3832/12384 [8:07:47<18:06:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 31%|███ | 3832/12384 [8:07:54<18:06:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.00s]
Epoch 2: 31%|███ | 3833/12384 [8:07:54<18:06:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.00s]
Epoch 2: 31%|███ | 3833/12384 [8:08:02<18:06:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 2: 31%|███ | 3834/12384 [8:08:02<18:05:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 2: 31%|███ | 3834/12384 [8:08:09<18:05:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 2: 31%|███ | 3835/12384 [8:08:09<18:07:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 2: 31%|███ | 3835/12384 [8:08:17<18:07:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 31%|███ | 3836/12384 [8:08:17<18:06:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 31%|███ | 3836/12384 [8:08:25<18:06:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 31%|███ | 3837/12384 [8:08:25<18:04:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 31%|███ | 3837/12384 [8:08:32<18:04:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 31%|███ | 3838/12384 [8:08:32<18:03:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 31%|███ | 3838/12384 [8:08:40<18:03:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 31%|███ | 3839/12384 [8:08:40<18:04:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 31%|███ | 3839/12384 [8:08:48<18:04:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 2: 31%|███ | 3840/12384 [8:08:48<18:17:09, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 2: 31%|███ | 3840/12384 [8:08:55<18:17:09, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.46s]
Epoch 2: 31%|███ | 3841/12384 [8:08:55<18:12:58, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.46s]
Epoch 2: 31%|███ | 3841/12384 [8:09:03<18:12:58, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 31%|███ | 3842/12384 [8:09:03<18:10:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 31%|███ | 3842/12384 [8:09:11<18:10:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 31%|███ | 3843/12384 [8:09:11<18:08:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 31%|███ | 3843/12384 [8:09:18<18:08:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 2: 31%|███ | 3844/12384 [8:09:18<18:06:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 2: 31%|███ | 3844/12384 [8:09:26<18:06:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.71s]
Epoch 2: 31%|███ | 3845/12384 [8:09:26<18:17:30, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.71s]
Epoch 2: 31%|███ | 3845/12384 [8:09:34<18:17:30, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 31%|███ | 3846/12384 [8:09:34<18:13:06, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 31%|███ | 3846/12384 [8:09:41<18:13:06, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 2: 31%|███ | 3847/12384 [8:09:41<18:09:52, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 2: 31%|███ | 3847/12384 [8:09:49<18:09:52, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 2: 31%|███ | 3848/12384 [8:09:49<18:07:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 2: 31%|███ | 3848/12384 [8:09:57<18:07:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 31%|███ | 3849/12384 [8:09:57<18:05:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 31%|███ | 3849/12384 [8:10:04<18:05:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.58s]
Epoch 2: 31%|███ | 3850/12384 [8:10:04<18:03:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.58s]
Epoch 2: 31%|███ | 3850/12384 [8:10:12<18:03:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 2: 31%|███ | 3851/12384 [8:10:12<18:06:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 2: 31%|███ | 3851/12384 [8:10:19<18:06:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 2: 31%|███ | 3852/12384 [8:10:19<18:06:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 2: 31%|███ | 3852/12384 [8:10:27<18:06:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 2: 31%|███ | 3853/12384 [8:10:27<18:04:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 2: 31%|███ | 3853/12384 [8:10:35<18:04:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 31%|███ | 3854/12384 [8:10:35<18:03:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 31%|███ | 3854/12384 [8:10:42<18:03:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.31s]
Epoch 2: 31%|███ | 3855/12384 [8:10:42<18:03:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.31s]
Epoch 2: 31%|███ | 3855/12384 [8:10:50<18:03:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.28s]
Epoch 2: 31%|███ | 3856/12384 [8:10:50<18:03:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.28s]
Epoch 2: 31%|███ | 3856/12384 [8:10:57<18:03:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 31%|███ | 3857/12384 [8:10:57<18:01:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 31%|███ | 3857/12384 [8:11:05<18:01:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 2: 31%|███ | 3858/12384 [8:11:05<18:01:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 2: 31%|███ | 3858/12384 [8:11:13<18:01:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 2: 31%|███ | 3859/12384 [8:11:13<18:00:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 2: 31%|███ | 3859/12384 [8:11:20<18:00:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 2: 31%|███ | 3860/12384 [8:11:20<18:01:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 2: 31%|███ | 3860/12384 [8:11:28<18:01:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 2: 31%|███ | 3861/12384 [8:11:28<18:00:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 2: 31%|███ | 3861/12384 [8:11:35<18:00:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 2: 31%|███ | 3862/12384 [8:11:35<18:00:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 2: 31%|███ | 3862/12384 [8:11:43<18:00:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 2: 31%|███ | 3863/12384 [8:11:43<18:01:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 2: 31%|███ | 3863/12384 [8:11:51<18:01:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 31%|███ | 3864/12384 [8:11:51<18:00:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 31%|███ | 3864/12384 [8:11:58<18:00:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 31%|███ | 3865/12384 [8:11:58<18:00:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 31%|███ | 3865/12384 [8:12:06<18:00:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 2: 31%|███ | 3866/12384 [8:12:06<18:15:11, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 2: 31%|███ | 3866/12384 [8:12:14<18:15:11, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.71s]
Epoch 2: 31%|███ | 3867/12384 [8:12:14<18:10:07, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.71s]
Epoch 2: 31%|███ | 3867/12384 [8:12:21<18:10:07, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 2: 31%|███ | 3868/12384 [8:12:21<18:07:27, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 2: 31%|███ | 3868/12384 [8:12:29<18:07:27, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.12s]
Epoch 2: 31%|███ | 3869/12384 [8:12:29<18:04:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.12s]
Epoch 2: 31%|███ | 3869/12384 [8:12:37<18:04:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 2: 31%|███▏ | 3870/12384 [8:12:37<18:03:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 2: 31%|███▏ | 3870/12384 [8:12:44<18:03:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 31%|███▏ | 3871/12384 [8:12:44<18:02:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 31%|███▏ | 3871/12384 [8:12:52<18:02:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 2: 31%|███▏ | 3872/12384 [8:12:52<18:14:45, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 2: 31%|███▏ | 3872/12384 [8:13:00<18:14:45, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 31%|███▏ | 3873/12384 [8:13:00<18:09:46, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 31%|███▏ | 3873/12384 [8:13:07<18:09:46, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 31%|███▏ | 3874/12384 [8:13:07<18:06:58, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 31%|███▏ | 3874/12384 [8:13:15<18:06:58, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 2: 31%|███▏ | 3875/12384 [8:13:15<18:04:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 2: 31%|███▏ | 3875/12384 [8:13:23<18:04:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 2: 31%|███▏ | 3876/12384 [8:13:23<18:02:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 2: 31%|███▏ | 3876/12384 [8:13:30<18:02:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 2: 31%|███▏ | 3877/12384 [8:13:30<18:02:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 2: 31%|███▏ | 3877/12384 [8:13:38<18:02:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 31%|███▏ | 3878/12384 [8:13:38<18:00:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 31%|███▏ | 3878/12384 [8:13:46<18:00:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 31%|███▏ | 3879/12384 [8:13:46<17:59:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 31%|███▏ | 3879/12384 [8:13:53<17:59:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 31%|███▏ | 3880/12384 [8:13:53<18:00:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 31%|███▏ | 3880/12384 [8:14:01<18:00:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 31%|███▏ | 3881/12384 [8:14:01<18:02:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 31%|███▏ | 3881/12384 [8:14:08<18:02:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 2: 31%|███▏ | 3882/12384 [8:14:08<18:01:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 2: 31%|███▏ | 3882/12384 [8:14:16<18:01:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 31%|███▏ | 3883/12384 [8:14:16<17:59:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 31%|███▏ | 3883/12384 [8:14:24<17:59:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 2: 31%|███▏ | 3884/12384 [8:14:24<17:58:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 2: 31%|███▏ | 3884/12384 [8:14:31<17:58:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 2: 31%|███▏ | 3885/12384 [8:14:31<17:58:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 2: 31%|███▏ | 3885/12384 [8:14:39<17:58:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 2: 31%|███▏ | 3886/12384 [8:14:39<17:57:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 2: 31%|███▏ | 3886/12384 [8:14:46<17:57:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 2: 31%|███▏ | 3887/12384 [8:14:46<17:57:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 2: 31%|███▏ | 3887/12384 [8:14:54<17:57:14, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.56s]
Epoch 2: 31%|███▏ | 3888/12384 [8:14:54<17:57:03, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.56s]
Epoch 2: 31%|███▏ | 3888/12384 [8:15:02<17:57:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 31%|███▏ | 3889/12384 [8:15:02<17:56:31, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 31%|███▏ | 3889/12384 [8:15:09<17:56:31, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 2: 31%|███▏ | 3890/12384 [8:15:09<17:56:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 2: 31%|███▏ | 3890/12384 [8:15:17<17:56:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.25s]
Epoch 2: 31%|███▏ | 3891/12384 [8:15:17<17:57:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.25s]
Epoch 2: 31%|███▏ | 3891/12384 [8:15:25<17:57:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 2: 31%|███▏ | 3892/12384 [8:15:25<17:57:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 2: 31%|███▏ | 3892/12384 [8:15:32<17:57:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 31%|███▏ | 3893/12384 [8:15:32<18:08:55, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 31%|███▏ | 3893/12384 [8:15:40<18:08:55, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 2: 31%|███▏ | 3894/12384 [8:15:40<18:04:51, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 2: 31%|███▏ | 3894/12384 [8:15:48<18:04:51, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 31%|███▏ | 3895/12384 [8:15:48<18:02:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 31%|███▏ | 3895/12384 [8:15:55<18:02:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 31%|███▏ | 3896/12384 [8:15:55<18:01:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 31%|███▏ | 3896/12384 [8:16:03<18:01:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 31%|███▏ | 3897/12384 [8:16:03<18:00:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 31%|███▏ | 3897/12384 [8:16:10<18:00:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.19s]
Epoch 2: 31%|███▏ | 3898/12384 [8:16:10<17:59:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.19s]
Epoch 2: 31%|███▏ | 3898/12384 [8:16:18<17:59:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 2: 31%|███▏ | 3899/12384 [8:16:18<17:56:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 2: 31%|███▏ | 3899/12384 [8:16:26<17:56:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.10s]
Epoch 2: 31%|███▏ | 3900/12384 [8:16:26<17:57:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.10s]
Epoch 2: 31%|███▏ | 3900/12384 [8:16:33<17:57:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 32%|███▏ | 3901/12384 [8:16:33<17:55:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 32%|███▏ | 3901/12384 [8:16:41<17:55:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 32%|███▏ | 3902/12384 [8:16:41<17:54:58, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 32%|███▏ | 3902/12384 [8:16:48<17:54:58, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 32%|███▏ | 3903/12384 [8:16:48<17:55:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 32%|███▏ | 3903/12384 [8:16:56<17:55:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 32%|███▏ | 3904/12384 [8:16:56<17:54:02, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 32%|███▏ | 3904/12384 [8:17:04<17:54:02, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 32%|███▏ | 3905/12384 [8:17:04<17:53:50, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 32%|███▏ | 3905/12384 [8:17:11<17:53:50, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 32%|███▏ | 3906/12384 [8:17:11<17:55:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 32%|███▏ | 3906/12384 [8:17:19<17:55:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 32%|███▏ | 3907/12384 [8:17:19<17:55:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 32%|███▏ | 3907/12384 [8:17:27<17:55:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 32%|███▏ | 3908/12384 [8:17:27<17:55:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 32%|███▏ | 3908/12384 [8:17:34<17:55:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 32%|███▏ | 3909/12384 [8:17:34<17:55:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 32%|███▏ | 3909/12384 [8:17:42<17:55:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 32%|███▏ | 3910/12384 [8:17:42<17:55:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 32%|███▏ | 3910/12384 [8:17:49<17:55:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 32%|███▏ | 3911/12384 [8:17:49<17:54:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 32%|███▏ | 3911/12384 [8:17:57<17:54:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 2: 32%|███▏ | 3912/12384 [8:17:57<17:54:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 2: 32%|███▏ | 3912/12384 [8:18:05<17:54:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.66s]
Epoch 2: 32%|███▏ | 3913/12384 [8:18:05<17:56:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.66s]
Epoch 2: 32%|███▏ | 3913/12384 [8:18:12<17:56:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 2: 32%|███▏ | 3914/12384 [8:18:12<17:54:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 2: 32%|███▏ | 3914/12384 [8:18:20<17:54:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 2: 32%|███▏ | 3915/12384 [8:18:20<17:55:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 2: 32%|███▏ | 3915/12384 [8:18:27<17:55:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 32%|███▏ | 3916/12384 [8:18:27<17:55:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 32%|███▏ | 3916/12384 [8:18:35<17:55:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 2: 32%|███▏ | 3917/12384 [8:18:35<17:53:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 2: 32%|███▏ | 3917/12384 [8:18:43<17:53:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 32%|███▏ | 3918/12384 [8:18:43<17:53:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 32%|███▏ | 3918/12384 [8:18:51<17:53:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 32%|███▏ | 3919/12384 [8:18:51<18:07:22, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 32%|███▏ | 3919/12384 [8:18:58<18:07:22, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 2: 32%|███▏ | 3920/12384 [8:18:58<18:03:04, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 2: 32%|███▏ | 3920/12384 [8:19:06<18:03:04, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.71s]
Epoch 2: 32%|███▏ | 3921/12384 [8:19:06<18:03:30, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.71s]
Epoch 2: 32%|███▏ | 3921/12384 [8:19:14<18:03:30, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.95s]
Epoch 2: 32%|███▏ | 3922/12384 [8:19:14<18:00:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.95s]
Epoch 2: 32%|███▏ | 3922/12384 [8:19:21<18:00:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 2: 32%|███▏ | 3923/12384 [8:19:21<18:02:30, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 2: 32%|███▏ | 3923/12384 [8:19:29<18:02:30, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 2: 32%|███▏ | 3924/12384 [8:19:29<17:59:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 2: 32%|███▏ | 3924/12384 [8:19:37<17:59:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 32%|███▏ | 3925/12384 [8:19:37<18:09:04, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 32%|███▏ | 3925/12384 [8:19:44<18:09:04, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 32%|███▏ | 3926/12384 [8:19:44<18:04:15, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 32%|███▏ | 3926/12384 [8:19:52<18:04:15, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 32%|███▏ | 3927/12384 [8:19:52<17:59:46, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 32%|███▏ | 3927/12384 [8:20:00<17:59:46, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 32%|███▏ | 3928/12384 [8:20:00<17:59:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 32%|███▏ | 3928/12384 [8:20:07<17:59:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.88s]
Epoch 2: 32%|███▏ | 3929/12384 [8:20:07<17:56:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.88s]
Epoch 2: 32%|███▏ | 3929/12384 [8:20:15<17:56:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 2: 32%|███▏ | 3930/12384 [8:20:15<17:56:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 2: 32%|███▏ | 3930/12384 [8:20:22<17:56:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 2: 32%|███▏ | 3931/12384 [8:20:22<17:54:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 2: 32%|███▏ | 3931/12384 [8:20:30<17:54:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.59s]
Epoch 2: 32%|███▏ | 3932/12384 [8:20:30<17:53:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.59s]
Epoch 2: 32%|███▏ | 3932/12384 [8:20:38<17:53:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 2: 32%|███▏ | 3933/12384 [8:20:38<17:53:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 2: 32%|███▏ | 3933/12384 [8:20:45<17:53:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.47s]
Epoch 2: 32%|███▏ | 3934/12384 [8:20:45<17:53:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.47s]
Epoch 2: 32%|███▏ | 3934/12384 [8:20:53<17:53:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.90s]
Epoch 2: 32%|███▏ | 3935/12384 [8:20:53<17:52:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.90s]
Epoch 2: 32%|███▏ | 3935/12384 [8:21:00<17:52:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 32%|███▏ | 3936/12384 [8:21:00<17:51:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 32%|███▏ | 3936/12384 [8:21:08<17:51:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 32%|███▏ | 3937/12384 [8:21:08<17:51:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 32%|███▏ | 3937/12384 [8:21:16<17:51:28, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 2: 32%|███▏ | 3938/12384 [8:21:16<17:52:06, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 2: 32%|███▏ | 3938/12384 [8:21:23<17:52:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 32%|███▏ | 3939/12384 [8:21:23<17:52:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 32%|███▏ | 3939/12384 [8:21:31<17:52:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 2: 32%|███▏ | 3940/12384 [8:21:31<17:51:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 2: 32%|███▏ | 3940/12384 [8:21:39<17:51:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.98s]
Epoch 2: 32%|███▏ | 3941/12384 [8:21:39<17:50:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.98s]
Epoch 2: 32%|███▏ | 3941/12384 [8:21:46<17:50:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 2: 32%|███▏ | 3942/12384 [8:21:46<17:51:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 2: 32%|███▏ | 3942/12384 [8:21:54<17:51:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 2: 32%|███▏ | 3943/12384 [8:21:54<17:50:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 2: 32%|███▏ | 3943/12384 [8:22:01<17:50:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.52s]
Epoch 2: 32%|███▏ | 3944/12384 [8:22:01<17:50:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.52s]
Epoch 2: 32%|███▏ | 3944/12384 [8:22:09<17:50:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 32%|███▏ | 3945/12384 [8:22:09<18:05:47, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 32%|███▏ | 3945/12384 [8:22:17<18:05:47, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 2: 32%|███▏ | 3946/12384 [8:22:17<18:00:39, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 2: 32%|███▏ | 3946/12384 [8:22:25<18:00:39, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 2: 32%|███▏ | 3947/12384 [8:22:25<17:59:22, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 2: 32%|███▏ | 3947/12384 [8:22:32<17:59:22, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 32%|███▏ | 3948/12384 [8:22:32<17:56:01, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 32%|███▏ | 3948/12384 [8:22:40<17:56:01, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 2: 32%|███▏ | 3949/12384 [8:22:40<17:54:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 2: 32%|███▏ | 3949/12384 [8:22:47<17:54:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.15s]
Epoch 2: 32%|███▏ | 3950/12384 [8:22:47<17:52:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.15s]
Epoch 2: 32%|███▏ | 3950/12384 [8:22:55<17:52:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 32%|███▏ | 3951/12384 [8:22:55<18:04:46, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 32%|███▏ | 3951/12384 [8:23:03<18:04:46, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 32%|███▏ | 3952/12384 [8:23:03<18:00:00, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 32%|███▏ | 3952/12384 [8:23:11<18:00:00, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 32%|███▏ | 3953/12384 [8:23:11<17:58:31, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 32%|███▏ | 3953/12384 [8:23:18<17:58:31, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.37s]
Epoch 2: 32%|███▏ | 3954/12384 [8:23:18<17:55:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.37s]
Epoch 2: 32%|███▏ | 3954/12384 [8:23:26<17:55:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 2: 32%|███▏ | 3955/12384 [8:23:26<17:53:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 2: 32%|███▏ | 3955/12384 [8:23:33<17:53:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 2: 32%|███▏ | 3956/12384 [8:23:33<17:51:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 2: 32%|███▏ | 3956/12384 [8:23:41<17:51:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 32%|███▏ | 3957/12384 [8:23:41<17:50:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 32%|███▏ | 3957/12384 [8:23:49<17:50:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 32%|███▏ | 3958/12384 [8:23:49<17:49:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 32%|███▏ | 3958/12384 [8:23:56<17:49:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 32%|███▏ | 3959/12384 [8:23:56<17:48:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 32%|███▏ | 3959/12384 [8:24:04<17:48:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 32%|███▏ | 3960/12384 [8:24:04<17:49:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 32%|███▏ | 3960/12384 [8:24:11<17:49:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 32%|███▏ | 3961/12384 [8:24:11<17:49:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 32%|███▏ | 3961/12384 [8:24:19<17:49:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 32%|███▏ | 3962/12384 [8:24:19<17:49:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 32%|███▏ | 3962/12384 [8:24:27<17:49:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 32%|███▏ | 3963/12384 [8:24:27<17:49:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 32%|███▏ | 3963/12384 [8:24:34<17:49:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 32%|███▏ | 3964/12384 [8:24:34<17:49:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 32%|███▏ | 3964/12384 [8:24:42<17:49:13, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.81s]
Epoch 2: 32%|███▏ | 3965/12384 [8:24:42<17:49:17, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.81s]
Epoch 2: 32%|███▏ | 3965/12384 [8:24:50<17:49:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 2: 32%|███▏ | 3966/12384 [8:24:50<17:48:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 2: 32%|███▏ | 3966/12384 [8:24:57<17:48:57, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 2: 32%|███▏ | 3967/12384 [8:24:57<17:48:33, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 2: 32%|███▏ | 3967/12384 [8:25:05<17:48:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 2: 32%|███▏ | 3968/12384 [8:25:05<17:47:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 2: 32%|███▏ | 3968/12384 [8:25:12<17:47:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 2: 32%|███▏ | 3969/12384 [8:25:12<17:47:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 2: 32%|███▏ | 3969/12384 [8:25:20<17:47:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 32%|███▏ | 3970/12384 [8:25:20<17:49:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 32%|███▏ | 3970/12384 [8:25:28<17:49:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 2: 32%|███▏ | 3971/12384 [8:25:28<17:57:39, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 2: 32%|███▏ | 3971/12384 [8:25:35<17:57:39, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.77s]
Epoch 2: 32%|███▏ | 3972/12384 [8:25:35<17:54:19, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.77s]
Epoch 2: 32%|███▏ | 3972/12384 [8:25:43<17:54:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 32%|███▏ | 3973/12384 [8:25:43<17:51:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 32%|███▏ | 3973/12384 [8:25:51<17:51:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 2: 32%|███▏ | 3974/12384 [8:25:51<17:50:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 2: 32%|███▏ | 3974/12384 [8:25:58<17:50:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 2: 32%|███▏ | 3975/12384 [8:25:58<17:49:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 2: 32%|███▏ | 3975/12384 [8:26:06<17:49:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 32%|███▏ | 3976/12384 [8:26:06<17:47:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 32%|███▏ | 3976/12384 [8:26:13<17:47:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.17s]
Epoch 2: 32%|███▏ | 3977/12384 [8:26:13<17:47:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.17s]
Epoch 2: 32%|███▏ | 3977/12384 [8:26:21<17:47:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 2: 32%|███▏ | 3978/12384 [8:26:21<17:46:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 2: 32%|███▏ | 3978/12384 [8:26:29<17:46:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 2: 32%|███▏ | 3979/12384 [8:26:29<17:47:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 2: 32%|███▏ | 3979/12384 [8:26:36<17:47:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 2: 32%|███▏ | 3980/12384 [8:26:36<17:47:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 2: 32%|███▏ | 3980/12384 [8:26:44<17:47:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 2: 32%|███▏ | 3981/12384 [8:26:44<17:45:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 2: 32%|███▏ | 3981/12384 [8:26:52<17:45:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 32%|███▏ | 3982/12384 [8:26:52<17:46:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 32%|███▏ | 3982/12384 [8:26:59<17:46:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 32%|███▏ | 3983/12384 [8:26:59<17:46:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 32%|███▏ | 3983/12384 [8:27:07<17:46:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 32%|███▏ | 3984/12384 [8:27:07<17:46:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 32%|███▏ | 3984/12384 [8:27:14<17:46:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 32%|███▏ | 3985/12384 [8:27:14<17:45:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 32%|███▏ | 3985/12384 [8:27:22<17:45:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 2: 32%|███▏ | 3986/12384 [8:27:22<17:45:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 2: 32%|███▏ | 3986/12384 [8:27:30<17:45:51, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.51s]
Epoch 2: 32%|███▏ | 3987/12384 [8:27:30<17:49:30, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=9.51s]
Epoch 2: 32%|███▏ | 3987/12384 [8:27:37<17:49:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 32%|███▏ | 3988/12384 [8:27:37<17:48:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 32%|███▏ | 3988/12384 [8:27:45<17:48:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 2: 32%|███▏ | 3989/12384 [8:27:45<17:46:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 2: 32%|███▏ | 3989/12384 [8:27:53<17:46:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 2: 32%|███▏ | 3990/12384 [8:27:53<17:45:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 2: 32%|███▏ | 3990/12384 [8:28:00<17:45:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 32%|███▏ | 3991/12384 [8:28:00<17:45:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 32%|███▏ | 3991/12384 [8:28:08<17:45:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 32%|███▏ | 3992/12384 [8:28:08<17:48:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 32%|███▏ | 3992/12384 [8:28:15<17:48:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 2: 32%|███▏ | 3993/12384 [8:28:15<17:48:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 2: 32%|███▏ | 3993/12384 [8:28:23<17:48:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 2: 32%|███▏ | 3994/12384 [8:28:23<17:46:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 2: 32%|███▏ | 3994/12384 [8:28:31<17:46:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 32%|███▏ | 3995/12384 [8:28:31<17:44:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 32%|███▏ | 3995/12384 [8:28:38<17:44:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 32%|███▏ | 3996/12384 [8:28:38<17:44:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 32%|███▏ | 3996/12384 [8:28:46<17:44:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.80s]
Epoch 2: 32%|███▏ | 3997/12384 [8:28:46<17:58:23, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.80s]
Epoch 2: 32%|███▏ | 3997/12384 [8:28:54<17:58:23, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.83s]
Epoch 2: 32%|███▏ | 3998/12384 [8:28:54<17:52:35, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.83s]
Epoch 2: 32%|███▏ | 3998/12384 [8:29:01<17:52:35, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 2: 32%|███▏ | 3999/12384 [8:29:01<17:49:49, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 2: 32%|███▏ | 3999/12384 [8:29:09<17:49:49, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 32%|███▏ | 4000/12384 [8:29:09<17:47:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 32%|███▏ | 4000/12384 [8:29:17<17:47:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 32%|███▏ | 4001/12384 [8:29:17<17:46:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 32%|███▏ | 4001/12384 [8:29:24<17:46:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 2: 32%|███▏ | 4002/12384 [8:29:24<17:48:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 2: 32%|███▏ | 4002/12384 [8:29:32<17:48:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 2: 32%|███▏ | 4003/12384 [8:29:32<17:58:49, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 2: 32%|███▏ | 4003/12384 [8:29:40<17:58:49, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 32%|███▏ | 4004/12384 [8:29:40<17:56:00, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 32%|███▏ | 4004/12384 [8:29:48<17:56:00, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 2: 32%|███▏ | 4005/12384 [8:29:48<17:51:52, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 2: 32%|███▏ | 4005/12384 [8:29:55<17:51:52, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 2: 32%|███▏ | 4006/12384 [8:29:55<17:49:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 2: 32%|███▏ | 4006/12384 [8:30:03<17:49:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 2: 32%|███▏ | 4007/12384 [8:30:03<17:47:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 2: 32%|███▏ | 4007/12384 [8:30:10<17:47:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.53s]
Epoch 2: 32%|███▏ | 4008/12384 [8:30:10<17:45:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.53s]
Epoch 2: 32%|███▏ | 4008/12384 [8:30:18<17:45:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 32%|███▏ | 4009/12384 [8:30:18<17:44:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 32%|███▏ | 4009/12384 [8:30:26<17:44:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 32%|███▏ | 4010/12384 [8:30:26<17:44:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 32%|███▏ | 4010/12384 [8:30:33<17:44:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 32%|███▏ | 4011/12384 [8:30:33<17:43:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 32%|███▏ | 4011/12384 [8:30:41<17:43:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 32%|███▏ | 4012/12384 [8:30:41<17:44:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 32%|███▏ | 4012/12384 [8:30:48<17:44:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 32%|███▏ | 4013/12384 [8:30:48<17:44:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 32%|███▏ | 4013/12384 [8:30:56<17:44:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 32%|███▏ | 4014/12384 [8:30:56<17:42:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 32%|███▏ | 4014/12384 [8:31:04<17:42:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 32%|███▏ | 4015/12384 [8:31:04<17:42:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 32%|███▏ | 4015/12384 [8:31:11<17:42:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 32%|███▏ | 4016/12384 [8:31:11<17:43:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 32%|███▏ | 4016/12384 [8:31:19<17:43:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 32%|███▏ | 4017/12384 [8:31:19<17:41:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 32%|███▏ | 4017/12384 [8:31:27<17:41:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 32%|███▏ | 4018/12384 [8:31:27<17:41:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 32%|███▏ | 4018/12384 [8:31:34<17:41:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 2: 32%|███▏ | 4019/12384 [8:31:34<17:41:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 2: 32%|███▏ | 4019/12384 [8:31:42<17:41:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.44s]
Epoch 2: 32%|███▏ | 4020/12384 [8:31:42<17:40:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.44s]
Epoch 2: 32%|███▏ | 4020/12384 [8:31:49<17:40:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.56s]
Epoch 2: 32%|███▏ | 4021/12384 [8:31:49<17:44:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.56s]
Epoch 2: 32%|███▏ | 4021/12384 [8:31:57<17:44:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 2: 32%|███▏ | 4022/12384 [8:31:57<17:42:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 2: 32%|███▏ | 4022/12384 [8:32:05<17:42:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 32%|███▏ | 4023/12384 [8:32:05<17:41:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 32%|███▏ | 4023/12384 [8:32:13<17:41:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 2: 32%|███▏ | 4024/12384 [8:32:13<17:55:05, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 2: 32%|███▏ | 4024/12384 [8:32:20<17:55:05, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.47s]
Epoch 2: 33%|███▎ | 4025/12384 [8:32:20<17:49:34, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.47s]
Epoch 2: 33%|███▎ | 4025/12384 [8:32:28<17:49:34, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=6.67s]
Epoch 2: 33%|███▎ | 4026/12384 [8:32:28<17:47:00, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=6.67s]
Epoch 2: 33%|███▎ | 4026/12384 [8:32:35<17:47:00, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 33%|███▎ | 4027/12384 [8:32:35<17:45:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 33%|███▎ | 4027/12384 [8:32:43<17:45:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 2: 33%|███▎ | 4028/12384 [8:32:43<17:42:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 2: 33%|███▎ | 4028/12384 [8:32:51<17:42:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.46s]
Epoch 2: 33%|███▎ | 4029/12384 [8:32:51<17:41:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.46s]
Epoch 2: 33%|███▎ | 4029/12384 [8:32:58<17:41:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 2: 33%|███▎ | 4030/12384 [8:32:58<17:39:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 2: 33%|███▎ | 4030/12384 [8:33:06<17:39:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 2: 33%|███▎ | 4031/12384 [8:33:06<17:40:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 2: 33%|███▎ | 4031/12384 [8:33:13<17:40:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.82s]
Epoch 2: 33%|███▎ | 4032/12384 [8:33:13<17:40:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.82s]
Epoch 2: 33%|███▎ | 4032/12384 [8:33:21<17:40:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 33%|███▎ | 4033/12384 [8:33:21<17:40:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 33%|███▎ | 4033/12384 [8:33:29<17:40:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 33%|███▎ | 4034/12384 [8:33:29<17:39:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 33%|███▎ | 4034/12384 [8:33:36<17:39:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 33%|███▎ | 4035/12384 [8:33:36<17:37:59, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 33%|███▎ | 4035/12384 [8:33:44<17:37:59, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 33%|███▎ | 4036/12384 [8:33:44<17:38:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 33%|███▎ | 4036/12384 [8:33:51<17:38:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 2: 33%|███▎ | 4037/12384 [8:33:51<17:38:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 2: 33%|███▎ | 4037/12384 [8:33:59<17:38:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 2: 33%|███▎ | 4038/12384 [8:33:59<17:38:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 2: 33%|███▎ | 4038/12384 [8:34:07<17:38:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 2: 33%|███▎ | 4039/12384 [8:34:07<17:40:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 2: 33%|███▎ | 4039/12384 [8:34:14<17:40:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.55s]
Epoch 2: 33%|███▎ | 4040/12384 [8:34:14<17:40:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.55s]
Epoch 2: 33%|███▎ | 4040/12384 [8:34:22<17:40:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 33%|███▎ | 4041/12384 [8:34:22<17:38:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 33%|███▎ | 4041/12384 [8:34:30<17:38:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 33%|███▎ | 4042/12384 [8:34:30<17:38:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 33%|███▎ | 4042/12384 [8:34:37<17:38:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 2: 33%|███▎ | 4043/12384 [8:34:37<17:38:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 2: 33%|███▎ | 4043/12384 [8:34:45<17:38:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 2: 33%|███▎ | 4044/12384 [8:34:45<17:38:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 2: 33%|███▎ | 4044/12384 [8:34:52<17:38:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 33%|███▎ | 4045/12384 [8:34:52<17:37:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 33%|███▎ | 4045/12384 [8:35:00<17:37:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 2: 33%|███▎ | 4046/12384 [8:35:00<17:36:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 2: 33%|███▎ | 4046/12384 [8:35:08<17:36:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 2: 33%|███▎ | 4047/12384 [8:35:08<17:36:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 2: 33%|███▎ | 4047/12384 [8:35:15<17:36:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 33%|███▎ | 4048/12384 [8:35:15<17:37:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 33%|███▎ | 4048/12384 [8:35:23<17:37:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 33%|███▎ | 4049/12384 [8:35:23<17:40:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 33%|███▎ | 4049/12384 [8:35:31<17:40:25, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.75s]
Epoch 2: 33%|███▎ | 4050/12384 [8:35:31<17:53:15, 7.73s/it, loss=0.0001, acc=1.0000, iter_time=7.75s]
Epoch 2: 33%|███▎ | 4050/12384 [8:35:38<17:53:15, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 33%|███▎ | 4051/12384 [8:35:38<17:48:03, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 33%|███▎ | 4051/12384 [8:35:46<17:48:03, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 2: 33%|███▎ | 4052/12384 [8:35:46<17:45:52, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 2: 33%|███▎ | 4052/12384 [8:35:54<17:45:52, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 2: 33%|███▎ | 4053/12384 [8:35:54<17:45:42, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 2: 33%|███▎ | 4053/12384 [8:36:01<17:45:42, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 33%|███▎ | 4054/12384 [8:36:01<17:42:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 33%|███▎ | 4054/12384 [8:36:09<17:42:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 33%|███▎ | 4055/12384 [8:36:09<17:40:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 33%|███▎ | 4055/12384 [8:36:17<17:40:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 2: 33%|███▎ | 4056/12384 [8:36:17<17:51:52, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 2: 33%|███▎ | 4056/12384 [8:36:24<17:51:52, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 2: 33%|███▎ | 4057/12384 [8:36:24<17:47:27, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 2: 33%|███▎ | 4057/12384 [8:36:32<17:47:27, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.75s]
Epoch 2: 33%|███▎ | 4058/12384 [8:36:32<17:44:20, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.75s]
Epoch 2: 33%|███▎ | 4058/12384 [8:36:40<17:44:20, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 33%|███▎ | 4059/12384 [8:36:40<17:42:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 33%|███▎ | 4059/12384 [8:36:47<17:42:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 2: 33%|███▎ | 4060/12384 [8:36:47<17:40:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 2: 33%|███▎ | 4060/12384 [8:36:55<17:40:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 2: 33%|███▎ | 4061/12384 [8:36:55<17:38:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 2: 33%|███▎ | 4061/12384 [8:37:03<17:38:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 2: 33%|███▎ | 4062/12384 [8:37:03<17:37:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 2: 33%|███▎ | 4062/12384 [8:37:10<17:37:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 33%|███▎ | 4063/12384 [8:37:10<17:36:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 33%|███▎ | 4063/12384 [8:37:18<17:36:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.52s]
Epoch 2: 33%|███▎ | 4064/12384 [8:37:18<17:35:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.52s]
Epoch 2: 33%|███▎ | 4064/12384 [8:37:25<17:35:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 33%|███▎ | 4065/12384 [8:37:25<17:35:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 33%|███▎ | 4065/12384 [8:37:33<17:35:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 33%|███▎ | 4066/12384 [8:37:33<17:35:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 33%|███▎ | 4066/12384 [8:37:41<17:35:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 33%|███▎ | 4067/12384 [8:37:41<17:35:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 33%|███▎ | 4067/12384 [8:37:48<17:35:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 2: 33%|███▎ | 4068/12384 [8:37:48<17:34:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 2: 33%|███▎ | 4068/12384 [8:37:56<17:34:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.43s]
Epoch 2: 33%|███▎ | 4069/12384 [8:37:56<17:34:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.43s]
Epoch 2: 33%|███▎ | 4069/12384 [8:38:03<17:34:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 33%|███▎ | 4070/12384 [8:38:03<17:34:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 33%|███▎ | 4070/12384 [8:38:11<17:34:45, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.70s]
Epoch 2: 33%|███▎ | 4071/12384 [8:38:11<17:34:58, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.70s]
Epoch 2: 33%|███▎ | 4071/12384 [8:38:19<17:34:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 2: 33%|███▎ | 4072/12384 [8:38:19<17:34:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 2: 33%|███▎ | 4072/12384 [8:38:26<17:34:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.80s]
Epoch 2: 33%|███▎ | 4073/12384 [8:38:26<17:35:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.80s]
Epoch 2: 33%|███▎ | 4073/12384 [8:38:34<17:35:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 2: 33%|███▎ | 4074/12384 [8:38:34<17:35:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 2: 33%|███▎ | 4074/12384 [8:38:42<17:35:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 33%|███▎ | 4075/12384 [8:38:42<17:36:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 33%|███▎ | 4075/12384 [8:38:49<17:36:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 33%|███▎ | 4076/12384 [8:38:49<17:39:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 33%|███▎ | 4076/12384 [8:38:57<17:39:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.77s]
Epoch 2: 33%|███▎ | 4077/12384 [8:38:57<17:51:08, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.77s]
Epoch 2: 33%|███▎ | 4077/12384 [8:39:05<17:51:08, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 2: 33%|███▎ | 4078/12384 [8:39:05<17:44:52, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 2: 33%|███▎ | 4078/12384 [8:39:12<17:44:52, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 2: 33%|███▎ | 4079/12384 [8:39:12<17:41:30, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 2: 33%|███▎ | 4079/12384 [8:39:20<17:41:30, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.87s]
Epoch 2: 33%|███▎ | 4080/12384 [8:39:20<17:37:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.87s]
Epoch 2: 33%|███▎ | 4080/12384 [8:39:28<17:37:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 2: 33%|███▎ | 4081/12384 [8:39:28<17:35:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 2: 33%|███▎ | 4081/12384 [8:39:35<17:35:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 2: 33%|███▎ | 4082/12384 [8:39:35<17:46:50, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 2: 33%|███▎ | 4082/12384 [8:39:43<17:46:50, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 33%|███▎ | 4083/12384 [8:39:43<17:42:11, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 33%|███▎ | 4083/12384 [8:39:51<17:42:11, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 33%|███▎ | 4084/12384 [8:39:51<17:38:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 33%|███▎ | 4084/12384 [8:39:58<17:38:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 2: 33%|███▎ | 4085/12384 [8:39:58<17:37:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 2: 33%|███▎ | 4085/12384 [8:40:06<17:37:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.54s]
Epoch 2: 33%|███▎ | 4086/12384 [8:40:06<17:35:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.54s]
Epoch 2: 33%|███▎ | 4086/12384 [8:40:14<17:35:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.70s]
Epoch 2: 33%|███▎ | 4087/12384 [8:40:14<17:35:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.70s]
Epoch 2: 33%|███▎ | 4087/12384 [8:40:21<17:35:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 33%|███▎ | 4088/12384 [8:40:21<17:34:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 33%|███▎ | 4088/12384 [8:40:29<17:34:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 33%|███▎ | 4089/12384 [8:40:29<17:33:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 33%|███▎ | 4089/12384 [8:40:36<17:33:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 33%|███▎ | 4090/12384 [8:40:36<17:32:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 33%|███▎ | 4090/12384 [8:40:44<17:32:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 33%|███▎ | 4091/12384 [8:40:44<17:31:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 33%|███▎ | 4091/12384 [8:40:52<17:31:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 33%|███▎ | 4092/12384 [8:40:52<17:31:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 33%|███▎ | 4092/12384 [8:40:59<17:31:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 33%|███▎ | 4093/12384 [8:40:59<17:31:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 33%|███▎ | 4093/12384 [8:41:07<17:31:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 33%|███▎ | 4094/12384 [8:41:07<17:31:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 33%|███▎ | 4094/12384 [8:41:14<17:31:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 2: 33%|███▎ | 4095/12384 [8:41:14<17:31:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 2: 33%|███▎ | 4095/12384 [8:41:22<17:31:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.21s]
Epoch 2: 33%|███▎ | 4096/12384 [8:41:22<17:31:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.21s]
Epoch 2: 33%|███▎ | 4096/12384 [8:41:30<17:31:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.94s]
Epoch 2: 33%|███▎ | 4097/12384 [8:41:30<17:32:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.94s]
Epoch 2: 33%|███▎ | 4097/12384 [8:41:37<17:32:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 33%|███▎ | 4098/12384 [8:41:37<17:32:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 33%|███▎ | 4098/12384 [8:41:45<17:32:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 2: 33%|███▎ | 4099/12384 [8:41:45<17:30:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 2: 33%|███▎ | 4099/12384 [8:41:53<17:30:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 2: 33%|███▎ | 4100/12384 [8:41:53<17:31:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 2: 33%|███▎ | 4100/12384 [8:42:00<17:31:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 2: 33%|███▎ | 4101/12384 [8:42:00<17:30:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 2: 33%|███▎ | 4101/12384 [8:42:08<17:30:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 2: 33%|███▎ | 4102/12384 [8:42:08<17:30:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 2: 33%|███▎ | 4102/12384 [8:42:16<17:30:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 2: 33%|███▎ | 4103/12384 [8:42:16<17:42:59, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 2: 33%|███▎ | 4103/12384 [8:42:23<17:42:59, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 2: 33%|███▎ | 4104/12384 [8:42:23<17:39:13, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 2: 33%|███▎ | 4104/12384 [8:42:31<17:39:13, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.78s]
Epoch 2: 33%|███▎ | 4105/12384 [8:42:31<17:35:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.78s]
Epoch 2: 33%|███▎ | 4105/12384 [8:42:38<17:35:03, 7.65s/it, loss=0.0001, acc=0.9998, iter_time=8.67s]
Epoch 2: 33%|███▎ | 4106/12384 [8:42:38<17:32:37, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=8.67s]
Epoch 2: 33%|███▎ | 4106/12384 [8:42:46<17:32:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 2: 33%|███▎ | 4107/12384 [8:42:46<17:31:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 2: 33%|███▎ | 4107/12384 [8:42:54<17:31:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 33%|███▎ | 4108/12384 [8:42:54<17:35:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 33%|███▎ | 4108/12384 [8:43:01<17:35:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 33%|███▎ | 4109/12384 [8:43:01<17:33:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 33%|███▎ | 4109/12384 [8:43:09<17:33:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.25s]
Epoch 2: 33%|███▎ | 4110/12384 [8:43:09<17:33:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.25s]
Epoch 2: 33%|███▎ | 4110/12384 [8:43:17<17:33:07, 7.64s/it, loss=0.0014, acc=0.9964, iter_time=9.97s]
Epoch 2: 33%|███▎ | 4111/12384 [8:43:17<17:32:34, 7.63s/it, loss=0.0014, acc=0.9964, iter_time=9.97s]
Epoch 2: 33%|███▎ | 4111/12384 [8:43:24<17:32:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 33%|███▎ | 4112/12384 [8:43:24<17:30:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 33%|███▎ | 4112/12384 [8:43:32<17:30:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 33%|███▎ | 4113/12384 [8:43:32<17:30:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 33%|███▎ | 4113/12384 [8:43:39<17:30:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 2: 33%|███▎ | 4114/12384 [8:43:39<17:30:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 2: 33%|███▎ | 4114/12384 [8:43:47<17:30:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 2: 33%|███▎ | 4115/12384 [8:43:47<17:30:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 2: 33%|███▎ | 4115/12384 [8:43:55<17:30:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 33%|███▎ | 4116/12384 [8:43:55<17:28:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 33%|███▎ | 4116/12384 [8:44:02<17:28:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 33%|███▎ | 4117/12384 [8:44:02<17:28:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 33%|███▎ | 4117/12384 [8:44:10<17:28:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 33%|███▎ | 4118/12384 [8:44:10<17:28:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 33%|███▎ | 4118/12384 [8:44:18<17:28:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.78s]
Epoch 2: 33%|███▎ | 4119/12384 [8:44:18<17:29:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.78s]
Epoch 2: 33%|███▎ | 4119/12384 [8:44:25<17:29:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.89s]
Epoch 2: 33%|███▎ | 4120/12384 [8:44:25<17:29:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.89s]
Epoch 2: 33%|███▎ | 4120/12384 [8:44:33<17:29:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.18s]
Epoch 2: 33%|███▎ | 4121/12384 [8:44:33<17:30:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.18s]
Epoch 2: 33%|███▎ | 4121/12384 [8:44:40<17:30:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 2: 33%|███▎ | 4122/12384 [8:44:40<17:29:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 2: 33%|███▎ | 4122/12384 [8:44:48<17:29:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.90s]
Epoch 2: 33%|███▎ | 4123/12384 [8:44:48<17:28:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.90s]
Epoch 2: 33%|███▎ | 4123/12384 [8:44:56<17:28:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 33%|███▎ | 4124/12384 [8:44:56<17:27:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 33%|███▎ | 4124/12384 [8:45:03<17:27:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 33%|███▎ | 4125/12384 [8:45:03<17:26:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 33%|███▎ | 4125/12384 [8:45:11<17:26:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 2: 33%|███▎ | 4126/12384 [8:45:11<17:26:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 2: 33%|███▎ | 4126/12384 [8:45:18<17:26:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 2: 33%|███▎ | 4127/12384 [8:45:18<17:26:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 2: 33%|███▎ | 4127/12384 [8:45:26<17:26:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 33%|███▎ | 4128/12384 [8:45:26<17:26:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 33%|███▎ | 4128/12384 [8:45:34<17:26:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.41s]
Epoch 2: 33%|███▎ | 4129/12384 [8:45:34<17:38:41, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.41s]
Epoch 2: 33%|███▎ | 4129/12384 [8:45:41<17:38:41, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 33%|███▎ | 4130/12384 [8:45:41<17:34:54, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 33%|███▎ | 4130/12384 [8:45:49<17:34:54, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 2: 33%|███▎ | 4131/12384 [8:45:49<17:31:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 2: 33%|███▎ | 4131/12384 [8:45:57<17:31:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 33%|███▎ | 4132/12384 [8:45:57<17:30:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 33%|███▎ | 4132/12384 [8:46:04<17:30:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 2: 33%|███▎ | 4133/12384 [8:46:04<17:29:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 2: 33%|███▎ | 4133/12384 [8:46:12<17:29:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 2: 33%|███▎ | 4134/12384 [8:46:12<17:30:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 2: 33%|███▎ | 4134/12384 [8:46:20<17:30:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 33%|███▎ | 4135/12384 [8:46:20<17:29:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 33%|███▎ | 4135/12384 [8:46:27<17:29:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 33%|███▎ | 4136/12384 [8:46:27<17:31:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 33%|███▎ | 4136/12384 [8:46:35<17:31:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 33%|███▎ | 4137/12384 [8:46:35<17:30:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 33%|███▎ | 4137/12384 [8:46:43<17:30:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 2: 33%|███▎ | 4138/12384 [8:46:43<17:28:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 2: 33%|███▎ | 4138/12384 [8:46:50<17:28:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 33%|███▎ | 4139/12384 [8:46:50<17:28:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 33%|███▎ | 4139/12384 [8:46:58<17:28:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 2: 33%|███▎ | 4140/12384 [8:46:58<17:27:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 2: 33%|███▎ | 4140/12384 [8:47:05<17:27:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 2: 33%|███▎ | 4141/12384 [8:47:05<17:26:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 2: 33%|███▎ | 4141/12384 [8:47:13<17:26:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 33%|███▎ | 4142/12384 [8:47:13<17:25:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 33%|███▎ | 4142/12384 [8:47:21<17:25:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 33%|███▎ | 4143/12384 [8:47:21<17:25:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 33%|███▎ | 4143/12384 [8:47:28<17:25:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 33%|███▎ | 4144/12384 [8:47:28<17:25:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 33%|███▎ | 4144/12384 [8:47:36<17:25:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 33%|███▎ | 4145/12384 [8:47:36<17:24:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 33%|███▎ | 4145/12384 [8:47:43<17:24:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 33%|███▎ | 4146/12384 [8:47:43<17:26:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 33%|███▎ | 4146/12384 [8:47:51<17:26:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 33%|███▎ | 4147/12384 [8:47:51<17:26:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 33%|███▎ | 4147/12384 [8:47:59<17:26:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 33%|███▎ | 4148/12384 [8:47:59<17:25:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 33%|███▎ | 4148/12384 [8:48:06<17:25:35, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.81s]
Epoch 2: 34%|███▎ | 4149/12384 [8:48:06<17:25:13, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.81s]
Epoch 2: 34%|███▎ | 4149/12384 [8:48:14<17:25:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.41s]
Epoch 2: 34%|███▎ | 4150/12384 [8:48:14<17:25:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.41s]
Epoch 2: 34%|███▎ | 4150/12384 [8:48:21<17:25:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 2: 34%|███▎ | 4151/12384 [8:48:21<17:24:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 2: 34%|███▎ | 4151/12384 [8:48:29<17:24:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 2: 34%|███▎ | 4152/12384 [8:48:29<17:24:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 2: 34%|███▎ | 4152/12384 [8:48:37<17:24:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 34%|███▎ | 4153/12384 [8:48:37<17:23:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 34%|███▎ | 4153/12384 [8:48:44<17:23:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 34%|███▎ | 4154/12384 [8:48:44<17:23:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 34%|███▎ | 4154/12384 [8:48:52<17:23:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 34%|███▎ | 4155/12384 [8:48:52<17:37:43, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 34%|███▎ | 4155/12384 [8:49:00<17:37:43, 7.71s/it, loss=0.0001, acc=0.9998, iter_time=5.80s]
Epoch 2: 34%|███▎ | 4156/12384 [8:49:00<17:33:21, 7.68s/it, loss=0.0001, acc=0.9998, iter_time=5.80s]
Epoch 2: 34%|███▎ | 4156/12384 [8:49:07<17:33:21, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 2: 34%|███▎ | 4157/12384 [8:49:07<17:30:00, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 2: 34%|███▎ | 4157/12384 [8:49:15<17:30:00, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 34%|███▎ | 4158/12384 [8:49:15<17:27:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 34%|███▎ | 4158/12384 [8:49:23<17:27:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 2: 34%|███▎ | 4159/12384 [8:49:23<17:26:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 2: 34%|███▎ | 4159/12384 [8:49:30<17:26:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.52s]
Epoch 2: 34%|███▎ | 4160/12384 [8:49:30<17:29:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.52s]
Epoch 2: 34%|███▎ | 4160/12384 [8:49:38<17:29:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 34%|███▎ | 4161/12384 [8:49:38<17:38:58, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 34%|███▎ | 4161/12384 [8:49:46<17:38:58, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 2: 34%|███▎ | 4162/12384 [8:49:46<17:34:09, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 2: 34%|███▎ | 4162/12384 [8:49:54<17:34:09, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.87s]
Epoch 2: 34%|███▎ | 4163/12384 [8:49:54<17:30:16, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.87s]
Epoch 2: 34%|███▎ | 4163/12384 [8:50:01<17:30:16, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 34%|███▎ | 4164/12384 [8:50:01<17:27:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 34%|███▎ | 4164/12384 [8:50:09<17:27:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 34%|███▎ | 4165/12384 [8:50:09<17:28:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 34%|███▎ | 4165/12384 [8:50:16<17:28:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 2: 34%|███▎ | 4166/12384 [8:50:16<17:25:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 2: 34%|███▎ | 4166/12384 [8:50:24<17:25:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.80s]
Epoch 2: 34%|███▎ | 4167/12384 [8:50:24<17:24:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.80s]
Epoch 2: 34%|███▎ | 4167/12384 [8:50:32<17:24:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.61s]
Epoch 2: 34%|███▎ | 4168/12384 [8:50:32<17:23:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.61s]
Epoch 2: 34%|███▎ | 4168/12384 [8:50:39<17:23:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 34%|███▎ | 4169/12384 [8:50:39<17:24:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 34%|███▎ | 4169/12384 [8:50:47<17:24:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.12s]
Epoch 2: 34%|███▎ | 4170/12384 [8:50:47<17:22:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.12s]
Epoch 2: 34%|███▎ | 4170/12384 [8:50:55<17:22:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.11s]
Epoch 2: 34%|███▎ | 4171/12384 [8:50:55<17:26:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.11s]
Epoch 2: 34%|███▎ | 4171/12384 [8:51:02<17:26:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 2: 34%|███▎ | 4172/12384 [8:51:02<17:24:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 2: 34%|███▎ | 4172/12384 [8:51:10<17:24:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 2: 34%|███▎ | 4173/12384 [8:51:10<17:23:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 2: 34%|███▎ | 4173/12384 [8:51:17<17:23:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 2: 34%|███▎ | 4174/12384 [8:51:17<17:22:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 2: 34%|███▎ | 4174/12384 [8:51:25<17:22:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 2: 34%|███▎ | 4175/12384 [8:51:25<17:21:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 2: 34%|███▎ | 4175/12384 [8:51:33<17:21:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 34%|███▎ | 4176/12384 [8:51:33<17:21:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 34%|███▎ | 4176/12384 [8:51:40<17:21:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 34%|███▎ | 4177/12384 [8:51:40<17:20:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 34%|███▎ | 4177/12384 [8:51:48<17:20:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 34%|███▎ | 4178/12384 [8:51:48<17:19:24, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 34%|███▎ | 4178/12384 [8:51:55<17:19:24, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 34%|███▎ | 4179/12384 [8:51:55<17:19:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 34%|███▎ | 4179/12384 [8:52:03<17:19:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 2: 34%|███▍ | 4180/12384 [8:52:03<17:19:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 2: 34%|███▍ | 4180/12384 [8:52:11<17:19:57, 7.61s/it, loss=0.0004, acc=0.9977, iter_time=7.33s]
Epoch 2: 34%|███▍ | 4181/12384 [8:52:11<17:34:01, 7.71s/it, loss=0.0004, acc=0.9977, iter_time=7.33s]
Epoch 2: 34%|███▍ | 4181/12384 [8:52:19<17:34:01, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.31s]
Epoch 2: 34%|███▍ | 4182/12384 [8:52:19<17:32:12, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.31s]
Epoch 2: 34%|███▍ | 4182/12384 [8:52:26<17:32:12, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 34%|███▍ | 4183/12384 [8:52:26<17:28:05, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 34%|███▍ | 4183/12384 [8:52:34<17:28:05, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 2: 34%|███▍ | 4184/12384 [8:52:34<17:24:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 2: 34%|███▍ | 4184/12384 [8:52:41<17:24:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 34%|███▍ | 4185/12384 [8:52:41<17:23:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 34%|███▍ | 4185/12384 [8:52:49<17:23:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.78s]
Epoch 2: 34%|███▍ | 4186/12384 [8:52:49<17:21:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.78s]
Epoch 2: 34%|███▍ | 4186/12384 [8:52:57<17:21:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 2: 34%|███▍ | 4187/12384 [8:52:57<17:20:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 2: 34%|███▍ | 4187/12384 [8:53:04<17:20:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 2: 34%|███▍ | 4188/12384 [8:53:04<17:19:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 2: 34%|███▍ | 4188/12384 [8:53:12<17:19:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 34%|███▍ | 4189/12384 [8:53:12<17:20:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 34%|███▍ | 4189/12384 [8:53:19<17:20:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 34%|███▍ | 4190/12384 [8:53:19<17:20:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 34%|███▍ | 4190/12384 [8:53:27<17:20:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 2: 34%|███▍ | 4191/12384 [8:53:27<17:20:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 2: 34%|███▍ | 4191/12384 [8:53:35<17:20:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.54s]
Epoch 2: 34%|███▍ | 4192/12384 [8:53:35<17:20:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.54s]
Epoch 2: 34%|███▍ | 4192/12384 [8:53:42<17:20:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 34%|███▍ | 4193/12384 [8:53:42<17:22:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 34%|███▍ | 4193/12384 [8:53:50<17:22:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 2: 34%|███▍ | 4194/12384 [8:53:50<17:22:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 2: 34%|███▍ | 4194/12384 [8:53:58<17:22:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.71s]
Epoch 2: 34%|███▍ | 4195/12384 [8:53:58<17:21:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.71s]
Epoch 2: 34%|███▍ | 4195/12384 [8:54:05<17:21:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 34%|███▍ | 4196/12384 [8:54:05<17:20:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 34%|███▍ | 4196/12384 [8:54:13<17:20:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 34%|███▍ | 4197/12384 [8:54:13<17:20:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 34%|███▍ | 4197/12384 [8:54:20<17:20:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 34%|███▍ | 4198/12384 [8:54:20<17:19:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 34%|███▍ | 4198/12384 [8:54:28<17:19:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 2: 34%|███▍ | 4199/12384 [8:54:28<17:17:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 2: 34%|███▍ | 4199/12384 [8:54:36<17:17:41, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=9.16s]
Epoch 2: 34%|███▍ | 4200/12384 [8:54:36<17:17:11, 7.60s/it, loss=0.0002, acc=1.0000, iter_time=9.16s]
Epoch 2: 34%|███▍ | 4200/12384 [8:54:43<17:17:11, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.22s]
Epoch 2: 34%|███▍ | 4201/12384 [8:54:43<17:17:35, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.22s]
Epoch 2: 34%|███▍ | 4201/12384 [8:54:51<17:17:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 34%|███▍ | 4202/12384 [8:54:51<17:16:39, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 34%|███▍ | 4202/12384 [8:54:58<17:16:39, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 34%|███▍ | 4203/12384 [8:54:58<17:16:07, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 34%|███▍ | 4203/12384 [8:55:06<17:16:07, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 34%|███▍ | 4204/12384 [8:55:06<17:16:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 34%|███▍ | 4204/12384 [8:55:14<17:16:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.55s]
Epoch 2: 34%|███▍ | 4205/12384 [8:55:14<17:16:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.55s]
Epoch 2: 34%|███▍ | 4205/12384 [8:55:21<17:16:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 2: 34%|███▍ | 4206/12384 [8:55:21<17:17:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 2: 34%|███▍ | 4206/12384 [8:55:29<17:17:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 2: 34%|███▍ | 4207/12384 [8:55:29<17:16:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 2: 34%|███▍ | 4207/12384 [8:55:37<17:16:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 34%|███▍ | 4208/12384 [8:55:37<17:30:44, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 34%|███▍ | 4208/12384 [8:55:44<17:30:44, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.62s]
Epoch 2: 34%|███▍ | 4209/12384 [8:55:44<17:27:09, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.62s]
Epoch 2: 34%|███▍ | 4209/12384 [8:55:52<17:27:09, 7.69s/it, loss=0.0001, acc=0.9990, iter_time=9.22s]
Epoch 2: 34%|███▍ | 4210/12384 [8:55:52<17:24:35, 7.67s/it, loss=0.0001, acc=0.9990, iter_time=9.22s]
Epoch 2: 34%|███▍ | 4210/12384 [8:56:00<17:24:35, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 2: 34%|███▍ | 4211/12384 [8:56:00<17:22:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 2: 34%|███▍ | 4211/12384 [8:56:07<17:22:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 34%|███▍ | 4212/12384 [8:56:07<17:20:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 34%|███▍ | 4212/12384 [8:56:15<17:20:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 34%|███▍ | 4213/12384 [8:56:15<17:31:34, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 34%|███▍ | 4213/12384 [8:56:23<17:31:34, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 2: 34%|███▍ | 4214/12384 [8:56:23<17:26:14, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 2: 34%|███▍ | 4214/12384 [8:56:30<17:26:14, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 2: 34%|███▍ | 4215/12384 [8:56:30<17:23:08, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 2: 34%|███▍ | 4215/12384 [8:56:38<17:23:08, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 34%|███▍ | 4216/12384 [8:56:38<17:20:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 34%|███▍ | 4216/12384 [8:56:46<17:20:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.42s]
Epoch 2: 34%|███▍ | 4217/12384 [8:56:46<17:18:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.42s]
Epoch 2: 34%|███▍ | 4217/12384 [8:56:53<17:18:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.16s]
Epoch 2: 34%|███▍ | 4218/12384 [8:56:53<17:17:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.16s]
Epoch 2: 34%|███▍ | 4218/12384 [8:57:01<17:17:13, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=7.86s]
Epoch 2: 34%|███▍ | 4219/12384 [8:57:01<17:16:28, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=7.86s]
Epoch 2: 34%|███▍ | 4219/12384 [8:57:08<17:16:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 2: 34%|███▍ | 4220/12384 [8:57:08<17:15:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 2: 34%|███▍ | 4220/12384 [8:57:16<17:15:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.85s]
Epoch 2: 34%|███▍ | 4221/12384 [8:57:16<17:15:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.85s]
Epoch 2: 34%|███▍ | 4221/12384 [8:57:24<17:15:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 2: 34%|███▍ | 4222/12384 [8:57:24<17:14:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 2: 34%|███▍ | 4222/12384 [8:57:31<17:14:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 2: 34%|███▍ | 4223/12384 [8:57:31<17:13:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 2: 34%|███▍ | 4223/12384 [8:57:39<17:13:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.87s]
Epoch 2: 34%|███▍ | 4224/12384 [8:57:39<17:14:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.87s]
Epoch 2: 34%|███▍ | 4224/12384 [8:57:46<17:14:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 34%|███▍ | 4225/12384 [8:57:46<17:13:17, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 34%|███▍ | 4225/12384 [8:57:54<17:13:17, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 2: 34%|███▍ | 4226/12384 [8:57:54<17:12:22, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 2: 34%|███▍ | 4226/12384 [8:58:02<17:12:22, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 2: 34%|███▍ | 4227/12384 [8:58:02<17:12:33, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 2: 34%|███▍ | 4227/12384 [8:58:09<17:12:33, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 2: 34%|███▍ | 4228/12384 [8:58:09<17:13:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 2: 34%|███▍ | 4228/12384 [8:58:17<17:13:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 2: 34%|███▍ | 4229/12384 [8:58:17<17:12:03, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 2: 34%|███▍ | 4229/12384 [8:58:24<17:12:03, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 2: 34%|███▍ | 4230/12384 [8:58:24<17:12:06, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 2: 34%|███▍ | 4230/12384 [8:58:32<17:12:06, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 34%|███▍ | 4231/12384 [8:58:32<17:11:57, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 34%|███▍ | 4231/12384 [8:58:40<17:11:57, 7.59s/it, loss=0.0004, acc=1.0000, iter_time=8.01s]
Epoch 2: 34%|███▍ | 4232/12384 [8:58:40<17:20:32, 7.66s/it, loss=0.0004, acc=1.0000, iter_time=8.01s]
Epoch 2: 34%|███▍ | 4232/12384 [8:58:47<17:20:32, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 2: 34%|███▍ | 4233/12384 [8:58:47<17:18:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 2: 34%|███▍ | 4233/12384 [8:58:55<17:18:43, 7.65s/it, loss=0.0001, acc=0.9999, iter_time=7.69s]
Epoch 2: 34%|███▍ | 4234/12384 [8:58:55<17:31:26, 7.74s/it, loss=0.0001, acc=0.9999, iter_time=7.69s]
Epoch 2: 34%|███▍ | 4234/12384 [8:59:03<17:31:26, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 34%|███▍ | 4235/12384 [8:59:03<17:29:20, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 34%|███▍ | 4235/12384 [8:59:11<17:29:20, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 34%|███▍ | 4236/12384 [8:59:11<17:23:32, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 34%|███▍ | 4236/12384 [8:59:18<17:23:32, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 2: 34%|███▍ | 4237/12384 [8:59:18<17:20:55, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 2: 34%|███▍ | 4237/12384 [8:59:26<17:20:55, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 2: 34%|███▍ | 4238/12384 [8:59:26<17:29:40, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 2: 34%|███▍ | 4238/12384 [8:59:34<17:29:40, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 34%|███▍ | 4239/12384 [8:59:34<17:24:48, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 34%|███▍ | 4239/12384 [8:59:41<17:24:48, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 34%|███▍ | 4240/12384 [8:59:41<17:21:35, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 34%|███▍ | 4240/12384 [8:59:49<17:21:35, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 34%|███▍ | 4241/12384 [8:59:49<17:18:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 34%|███▍ | 4241/12384 [8:59:57<17:18:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 34%|███▍ | 4242/12384 [8:59:57<17:16:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 34%|███▍ | 4242/12384 [9:00:04<17:16:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 2: 34%|███▍ | 4243/12384 [9:00:04<17:15:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 2: 34%|███▍ | 4243/12384 [9:00:12<17:15:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.17s]
Epoch 2: 34%|███▍ | 4244/12384 [9:00:12<17:14:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.17s]
Epoch 2: 34%|███▍ | 4244/12384 [9:00:19<17:14:48, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=10.93s]
Epoch 2: 34%|███▍ | 4245/12384 [9:00:19<17:13:24, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.93s]
Epoch 2: 34%|███▍ | 4245/12384 [9:00:27<17:13:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 34%|███▍ | 4246/12384 [9:00:27<17:12:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 34%|███▍ | 4246/12384 [9:00:35<17:12:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.53s]
Epoch 2: 34%|███▍ | 4247/12384 [9:00:35<17:11:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.53s]
Epoch 2: 34%|███▍ | 4247/12384 [9:00:42<17:11:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.05s]
Epoch 2: 34%|███▍ | 4248/12384 [9:00:42<17:12:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.05s]
Epoch 2: 34%|███▍ | 4248/12384 [9:00:50<17:12:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 34%|███▍ | 4249/12384 [9:00:50<17:11:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 34%|███▍ | 4249/12384 [9:00:57<17:11:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 34%|███▍ | 4250/12384 [9:00:57<17:09:58, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 34%|███▍ | 4250/12384 [9:01:05<17:09:58, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 2: 34%|███▍ | 4251/12384 [9:01:05<17:09:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 2: 34%|███▍ | 4251/12384 [9:01:13<17:09:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.69s]
Epoch 2: 34%|███▍ | 4252/12384 [9:01:13<17:09:14, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=8.69s]
Epoch 2: 34%|███▍ | 4252/12384 [9:01:20<17:09:14, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 2: 34%|███▍ | 4253/12384 [9:01:20<17:10:01, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 2: 34%|███▍ | 4253/12384 [9:01:28<17:10:01, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 2: 34%|███▍ | 4254/12384 [9:01:28<17:10:19, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 2: 34%|███▍ | 4254/12384 [9:01:35<17:10:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 2: 34%|███▍ | 4255/12384 [9:01:35<17:11:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 2: 34%|███▍ | 4255/12384 [9:01:43<17:11:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 2: 34%|███▍ | 4256/12384 [9:01:43<17:11:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 2: 34%|███▍ | 4256/12384 [9:01:51<17:11:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.63s]
Epoch 2: 34%|███▍ | 4257/12384 [9:01:51<17:14:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.63s]
Epoch 2: 34%|███▍ | 4257/12384 [9:01:58<17:14:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.45s]
Epoch 2: 34%|███▍ | 4258/12384 [9:01:58<17:13:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.45s]
Epoch 2: 34%|███▍ | 4258/12384 [9:02:06<17:13:21, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.46s]
Epoch 2: 34%|███▍ | 4259/12384 [9:02:06<17:11:39, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.46s]
Epoch 2: 34%|███▍ | 4259/12384 [9:02:14<17:11:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 34%|███▍ | 4260/12384 [9:02:14<17:11:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 34%|███▍ | 4260/12384 [9:02:22<17:11:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 34%|███▍ | 4261/12384 [9:02:22<17:24:42, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 34%|███▍ | 4261/12384 [9:02:29<17:24:42, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 34%|███▍ | 4262/12384 [9:02:29<17:19:32, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 34%|███▍ | 4262/12384 [9:02:37<17:19:32, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.02s]
Epoch 2: 34%|███▍ | 4263/12384 [9:02:37<17:15:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.02s]
Epoch 2: 34%|███▍ | 4263/12384 [9:02:44<17:15:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.24s]
Epoch 2: 34%|███▍ | 4264/12384 [9:02:44<17:14:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.24s]
Epoch 2: 34%|███▍ | 4264/12384 [9:02:52<17:14:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 2: 34%|███▍ | 4265/12384 [9:02:52<17:24:06, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 2: 34%|███▍ | 4265/12384 [9:03:00<17:24:06, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 34%|███▍ | 4266/12384 [9:03:00<17:21:41, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 34%|███▍ | 4266/12384 [9:03:07<17:21:41, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 2: 34%|███▍ | 4267/12384 [9:03:07<17:18:01, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 2: 34%|███▍ | 4267/12384 [9:03:15<17:18:01, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 2: 34%|███▍ | 4268/12384 [9:03:15<17:14:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 2: 34%|███▍ | 4268/12384 [9:03:23<17:14:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 34%|███▍ | 4269/12384 [9:03:23<17:13:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 34%|███▍ | 4269/12384 [9:03:30<17:13:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 2: 34%|███▍ | 4270/12384 [9:03:30<17:12:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 2: 34%|███▍ | 4270/12384 [9:03:38<17:12:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 2: 34%|███▍ | 4271/12384 [9:03:38<17:11:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 2: 34%|███▍ | 4271/12384 [9:03:46<17:11:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.30s]
Epoch 2: 34%|███▍ | 4272/12384 [9:03:46<17:13:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.30s]
Epoch 2: 34%|███▍ | 4272/12384 [9:03:53<17:13:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 35%|███▍ | 4273/12384 [9:03:53<17:13:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 35%|███▍ | 4273/12384 [9:04:01<17:13:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.63s]
Epoch 2: 35%|███▍ | 4274/12384 [9:04:01<17:11:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.63s]
Epoch 2: 35%|███▍ | 4274/12384 [9:04:08<17:11:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.60s]
Epoch 2: 35%|███▍ | 4275/12384 [9:04:08<17:11:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.60s]
Epoch 2: 35%|███▍ | 4275/12384 [9:04:16<17:11:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 35%|███▍ | 4276/12384 [9:04:16<17:09:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 35%|███▍ | 4276/12384 [9:04:24<17:09:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 35%|███▍ | 4277/12384 [9:04:24<17:09:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 35%|███▍ | 4277/12384 [9:04:31<17:09:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 2: 35%|███▍ | 4278/12384 [9:04:31<17:09:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 2: 35%|███▍ | 4278/12384 [9:04:39<17:09:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 2: 35%|███▍ | 4279/12384 [9:04:39<17:08:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 2: 35%|███▍ | 4279/12384 [9:04:47<17:08:35, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.53s]
Epoch 2: 35%|███▍ | 4280/12384 [9:04:47<17:07:46, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.53s]
Epoch 2: 35%|███▍ | 4280/12384 [9:04:54<17:07:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 35%|███▍ | 4281/12384 [9:04:54<17:07:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 35%|███▍ | 4281/12384 [9:05:02<17:07:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 35%|███▍ | 4282/12384 [9:05:02<17:06:36, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 35%|███▍ | 4282/12384 [9:05:09<17:06:36, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 35%|███▍ | 4283/12384 [9:05:09<17:06:05, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 35%|███▍ | 4283/12384 [9:05:17<17:06:05, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=3.86s]
Epoch 2: 35%|███▍ | 4284/12384 [9:05:17<17:06:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.86s]
Epoch 2: 35%|███▍ | 4284/12384 [9:05:25<17:06:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.72s]
Epoch 2: 35%|███▍ | 4285/12384 [9:05:25<17:07:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.72s]
Epoch 2: 35%|███▍ | 4285/12384 [9:05:32<17:07:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 2: 35%|███▍ | 4286/12384 [9:05:32<17:07:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 2: 35%|███▍ | 4286/12384 [9:05:40<17:07:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 35%|███▍ | 4287/12384 [9:05:40<17:20:32, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 35%|███▍ | 4287/12384 [9:05:48<17:20:32, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 2: 35%|███▍ | 4288/12384 [9:05:48<17:21:05, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 2: 35%|███▍ | 4288/12384 [9:05:55<17:21:05, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 35%|███▍ | 4289/12384 [9:05:55<17:16:19, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 35%|███▍ | 4289/12384 [9:06:03<17:16:19, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 35%|███▍ | 4290/12384 [9:06:03<17:13:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 35%|███▍ | 4290/12384 [9:06:11<17:13:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 35%|███▍ | 4291/12384 [9:06:11<17:10:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 35%|███▍ | 4291/12384 [9:06:19<17:10:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 35%|███▍ | 4292/12384 [9:06:19<17:20:13, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 35%|███▍ | 4292/12384 [9:06:26<17:20:13, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 35%|███▍ | 4293/12384 [9:06:26<17:15:54, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 35%|███▍ | 4293/12384 [9:06:34<17:15:54, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 35%|███▍ | 4294/12384 [9:06:34<17:12:58, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 35%|███▍ | 4294/12384 [9:06:41<17:12:58, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 35%|███▍ | 4295/12384 [9:06:41<17:10:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 35%|███▍ | 4295/12384 [9:06:49<17:10:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 35%|███▍ | 4296/12384 [9:06:49<17:09:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 35%|███▍ | 4296/12384 [9:06:57<17:09:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 35%|███▍ | 4297/12384 [9:06:57<17:11:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 35%|███▍ | 4297/12384 [9:07:04<17:11:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.87s]
Epoch 2: 35%|███▍ | 4298/12384 [9:07:04<17:08:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.87s]
Epoch 2: 35%|███▍ | 4298/12384 [9:07:12<17:08:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.08s]
Epoch 2: 35%|███▍ | 4299/12384 [9:07:12<17:06:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.08s]
Epoch 2: 35%|███▍ | 4299/12384 [9:07:19<17:06:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 35%|███▍ | 4300/12384 [9:07:19<17:08:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 35%|███▍ | 4300/12384 [9:07:27<17:08:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 2: 35%|███▍ | 4301/12384 [9:07:27<17:07:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 2: 35%|███▍ | 4301/12384 [9:07:35<17:07:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.82s]
Epoch 2: 35%|███▍ | 4302/12384 [9:07:35<17:09:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.82s]
Epoch 2: 35%|███▍ | 4302/12384 [9:07:42<17:09:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.00s]
Epoch 2: 35%|███▍ | 4303/12384 [9:07:42<17:08:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.00s]
Epoch 2: 35%|███▍ | 4303/12384 [9:07:50<17:08:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 35%|███▍ | 4304/12384 [9:07:50<17:08:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 35%|███▍ | 4304/12384 [9:07:58<17:08:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 2: 35%|███▍ | 4305/12384 [9:07:58<17:08:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 2: 35%|███▍ | 4305/12384 [9:08:05<17:08:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 2: 35%|███▍ | 4306/12384 [9:08:05<17:07:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 2: 35%|███▍ | 4306/12384 [9:08:13<17:07:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.75s]
Epoch 2: 35%|███▍ | 4307/12384 [9:08:13<17:06:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.75s]
Epoch 2: 35%|███▍ | 4307/12384 [9:08:20<17:06:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 35%|███▍ | 4308/12384 [9:08:20<17:05:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 35%|███▍ | 4308/12384 [9:08:28<17:05:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 35%|███▍ | 4309/12384 [9:08:28<17:04:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 35%|███▍ | 4309/12384 [9:08:36<17:04:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 2: 35%|███▍ | 4310/12384 [9:08:36<17:04:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 2: 35%|███▍ | 4310/12384 [9:08:43<17:04:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.14s]
Epoch 2: 35%|███▍ | 4311/12384 [9:08:43<17:03:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.14s]
Epoch 2: 35%|███▍ | 4311/12384 [9:08:51<17:03:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 35%|███▍ | 4312/12384 [9:08:51<17:04:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 35%|███▍ | 4312/12384 [9:08:59<17:04:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 35%|███▍ | 4313/12384 [9:08:59<17:16:25, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 35%|███▍ | 4313/12384 [9:09:06<17:16:25, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 35%|███▍ | 4314/12384 [9:09:06<17:11:56, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 35%|███▍ | 4314/12384 [9:09:14<17:11:56, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.25s]
Epoch 2: 35%|███▍ | 4315/12384 [9:09:14<17:09:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.25s]
Epoch 2: 35%|███▍ | 4315/12384 [9:09:22<17:09:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.41s]
Epoch 2: 35%|███▍ | 4316/12384 [9:09:22<17:07:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.41s]
Epoch 2: 35%|███▍ | 4316/12384 [9:09:29<17:07:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 2: 35%|███▍ | 4317/12384 [9:09:29<17:05:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 2: 35%|███▍ | 4317/12384 [9:09:37<17:05:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.43s]
Epoch 2: 35%|███▍ | 4318/12384 [9:09:37<17:05:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.43s]
Epoch 2: 35%|███▍ | 4318/12384 [9:09:45<17:05:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 2: 35%|███▍ | 4319/12384 [9:09:45<17:13:50, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 2: 35%|███▍ | 4319/12384 [9:09:52<17:13:50, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 35%|███▍ | 4320/12384 [9:09:52<17:13:07, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 35%|███▍ | 4320/12384 [9:10:00<17:13:07, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 35%|███▍ | 4321/12384 [9:10:00<17:10:07, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 35%|███▍ | 4321/12384 [9:10:08<17:10:07, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 2: 35%|███▍ | 4322/12384 [9:10:08<17:06:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 2: 35%|███▍ | 4322/12384 [9:10:15<17:06:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 2: 35%|███▍ | 4323/12384 [9:10:15<17:05:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 2: 35%|███▍ | 4323/12384 [9:10:23<17:05:57, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=3.45s]
Epoch 2: 35%|███▍ | 4324/12384 [9:10:23<17:06:54, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=3.45s]
Epoch 2: 35%|███▍ | 4324/12384 [9:10:31<17:06:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.86s]
Epoch 2: 35%|███▍ | 4325/12384 [9:10:31<17:06:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.86s]
Epoch 2: 35%|███▍ | 4325/12384 [9:10:38<17:06:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 2: 35%|███▍ | 4326/12384 [9:10:38<17:05:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 2: 35%|███▍ | 4326/12384 [9:10:46<17:05:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 2: 35%|███▍ | 4327/12384 [9:10:46<17:04:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 2: 35%|███▍ | 4327/12384 [9:10:53<17:04:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 35%|███▍ | 4328/12384 [9:10:53<17:03:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 35%|███▍ | 4328/12384 [9:11:01<17:03:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 2: 35%|███▍ | 4329/12384 [9:11:01<17:04:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 2: 35%|███▍ | 4329/12384 [9:11:09<17:04:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 2: 35%|███▍ | 4330/12384 [9:11:09<17:02:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 2: 35%|███▍ | 4330/12384 [9:11:16<17:02:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 35%|███▍ | 4331/12384 [9:11:16<17:01:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 35%|███▍ | 4331/12384 [9:11:24<17:01:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 2: 35%|███▍ | 4332/12384 [9:11:24<17:03:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 2: 35%|███▍ | 4332/12384 [9:11:32<17:03:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.65s]
Epoch 2: 35%|███▍ | 4333/12384 [9:11:32<17:03:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.65s]
Epoch 2: 35%|███▍ | 4333/12384 [9:11:39<17:03:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 2: 35%|███▍ | 4334/12384 [9:11:39<17:02:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 2: 35%|███▍ | 4334/12384 [9:11:47<17:02:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 35%|███▌ | 4335/12384 [9:11:47<17:01:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 35%|███▌ | 4335/12384 [9:11:54<17:01:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 35%|███▌ | 4336/12384 [9:11:54<17:01:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 35%|███▌ | 4336/12384 [9:12:02<17:01:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 35%|███▌ | 4337/12384 [9:12:02<17:01:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 35%|███▌ | 4337/12384 [9:12:10<17:01:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 35%|███▌ | 4338/12384 [9:12:10<17:01:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 35%|███▌ | 4338/12384 [9:12:18<17:01:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 2: 35%|███▌ | 4339/12384 [9:12:18<17:15:03, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 2: 35%|███▌ | 4339/12384 [9:12:25<17:15:03, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.63s]
Epoch 2: 35%|███▌ | 4340/12384 [9:12:25<17:11:14, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.63s]
Epoch 2: 35%|███▌ | 4340/12384 [9:12:33<17:11:14, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 2: 35%|███▌ | 4341/12384 [9:12:33<17:08:06, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 2: 35%|███▌ | 4341/12384 [9:12:40<17:08:06, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 35%|███▌ | 4342/12384 [9:12:40<17:05:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 35%|███▌ | 4342/12384 [9:12:48<17:05:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 35%|███▌ | 4343/12384 [9:12:48<17:03:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 35%|███▌ | 4343/12384 [9:12:56<17:03:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 35%|███▌ | 4344/12384 [9:12:56<17:02:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 35%|███▌ | 4344/12384 [9:13:03<17:02:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 35%|███▌ | 4345/12384 [9:13:03<17:01:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 35%|███▌ | 4345/12384 [9:13:11<17:01:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 2: 35%|███▌ | 4346/12384 [9:13:11<17:01:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 2: 35%|███▌ | 4346/12384 [9:13:18<17:01:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 2: 35%|███▌ | 4347/12384 [9:13:18<17:01:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 2: 35%|███▌ | 4347/12384 [9:13:26<17:01:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 35%|███▌ | 4348/12384 [9:13:26<17:00:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 35%|███▌ | 4348/12384 [9:13:34<17:00:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 2: 35%|███▌ | 4349/12384 [9:13:34<16:59:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 2: 35%|███▌ | 4349/12384 [9:13:41<16:59:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 2: 35%|███▌ | 4350/12384 [9:13:41<17:00:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 2: 35%|███▌ | 4350/12384 [9:13:49<17:00:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.02s]
Epoch 2: 35%|███▌ | 4351/12384 [9:13:49<17:00:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.02s]
Epoch 2: 35%|███▌ | 4351/12384 [9:13:57<17:00:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 2: 35%|███▌ | 4352/12384 [9:13:57<17:00:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 2: 35%|███▌ | 4352/12384 [9:14:04<17:00:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 2: 35%|███▌ | 4353/12384 [9:14:04<17:00:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 2: 35%|███▌ | 4353/12384 [9:14:12<17:00:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 2: 35%|███▌ | 4354/12384 [9:14:12<17:03:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 2: 35%|███▌ | 4354/12384 [9:14:19<17:03:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.64s]
Epoch 2: 35%|███▌ | 4355/12384 [9:14:19<17:02:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.64s]
Epoch 2: 35%|███▌ | 4355/12384 [9:14:27<17:02:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 2: 35%|███▌ | 4356/12384 [9:14:27<17:01:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 2: 35%|███▌ | 4356/12384 [9:14:35<17:01:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 35%|███▌ | 4357/12384 [9:14:35<17:00:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 35%|███▌ | 4357/12384 [9:14:42<17:00:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 35%|███▌ | 4358/12384 [9:14:42<17:00:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 35%|███▌ | 4358/12384 [9:14:50<17:00:24, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.30s]
Epoch 2: 35%|███▌ | 4359/12384 [9:14:50<16:59:50, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.30s]
Epoch 2: 35%|███▌ | 4359/12384 [9:14:58<16:59:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.33s]
Epoch 2: 35%|███▌ | 4360/12384 [9:14:58<16:59:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.33s]
Epoch 2: 35%|███▌ | 4360/12384 [9:15:05<16:59:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 35%|███▌ | 4361/12384 [9:15:05<17:01:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 35%|███▌ | 4361/12384 [9:15:13<17:01:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 2: 35%|███▌ | 4362/12384 [9:15:13<17:00:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 2: 35%|███▌ | 4362/12384 [9:15:20<17:00:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 35%|███▌ | 4363/12384 [9:15:20<16:58:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 35%|███▌ | 4363/12384 [9:15:28<16:58:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 2: 35%|███▌ | 4364/12384 [9:15:28<16:57:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 2: 35%|███▌ | 4364/12384 [9:15:36<16:57:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 35%|███▌ | 4365/12384 [9:15:36<17:08:48, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 35%|███▌ | 4365/12384 [9:15:44<17:08:48, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.88s]
Epoch 2: 35%|███▌ | 4366/12384 [9:15:44<17:08:03, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.88s]
Epoch 2: 35%|███▌ | 4366/12384 [9:15:51<17:08:03, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.08s]
Epoch 2: 35%|███▌ | 4367/12384 [9:15:51<17:04:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.08s]
Epoch 2: 35%|███▌ | 4367/12384 [9:15:59<17:04:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 2: 35%|███▌ | 4368/12384 [9:15:59<17:02:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 2: 35%|███▌ | 4368/12384 [9:16:07<17:02:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.12s]
Epoch 2: 35%|███▌ | 4369/12384 [9:16:07<17:01:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.12s]
Epoch 2: 35%|███▌ | 4369/12384 [9:16:14<17:01:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 2: 35%|███▌ | 4370/12384 [9:16:14<17:08:24, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 2: 35%|███▌ | 4370/12384 [9:16:22<17:08:24, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 2: 35%|███▌ | 4371/12384 [9:16:22<17:04:46, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 2: 35%|███▌ | 4371/12384 [9:16:30<17:04:46, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.43s]
Epoch 2: 35%|███▌ | 4372/12384 [9:16:30<17:01:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.43s]
Epoch 2: 35%|███▌ | 4372/12384 [9:16:37<17:01:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 2: 35%|███▌ | 4373/12384 [9:16:37<16:59:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 2: 35%|███▌ | 4373/12384 [9:16:45<16:59:50, 7.64s/it, loss=0.0001, acc=0.9999, iter_time=7.60s]
Epoch 2: 35%|███▌ | 4374/12384 [9:16:45<16:58:24, 7.63s/it, loss=0.0001, acc=0.9999, iter_time=7.60s]
Epoch 2: 35%|███▌ | 4374/12384 [9:16:52<16:58:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 35%|███▌ | 4375/12384 [9:16:52<16:57:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 35%|███▌ | 4375/12384 [9:17:00<16:57:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 35%|███▌ | 4376/12384 [9:17:00<16:57:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 35%|███▌ | 4376/12384 [9:17:08<16:57:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.42s]
Epoch 2: 35%|███▌ | 4377/12384 [9:17:08<16:56:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.42s]
Epoch 2: 35%|███▌ | 4377/12384 [9:17:15<16:56:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.87s]
Epoch 2: 35%|███▌ | 4378/12384 [9:17:15<16:56:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.87s]
Epoch 2: 35%|███▌ | 4378/12384 [9:17:23<16:56:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 2: 35%|███▌ | 4379/12384 [9:17:23<16:56:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 2: 35%|███▌ | 4379/12384 [9:17:30<16:56:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 2: 35%|███▌ | 4380/12384 [9:17:30<16:54:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 2: 35%|███▌ | 4380/12384 [9:17:38<16:54:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 2: 35%|███▌ | 4381/12384 [9:17:38<16:54:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 2: 35%|███▌ | 4381/12384 [9:17:46<16:54:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 35%|███▌ | 4382/12384 [9:17:46<16:54:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 35%|███▌ | 4382/12384 [9:17:53<16:54:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.40s]
Epoch 2: 35%|███▌ | 4383/12384 [9:17:53<16:54:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.40s]
Epoch 2: 35%|███▌ | 4383/12384 [9:18:01<16:54:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.82s]
Epoch 2: 35%|███▌ | 4384/12384 [9:18:01<16:55:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.82s]
Epoch 2: 35%|███▌ | 4384/12384 [9:18:08<16:55:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 2: 35%|███▌ | 4385/12384 [9:18:08<16:54:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 2: 35%|███▌ | 4385/12384 [9:18:16<16:54:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 35%|███▌ | 4386/12384 [9:18:16<16:54:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 35%|███▌ | 4386/12384 [9:18:24<16:54:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 2: 35%|███▌ | 4387/12384 [9:18:24<16:54:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 2: 35%|███▌ | 4387/12384 [9:18:31<16:54:27, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 2: 35%|███▌ | 4388/12384 [9:18:31<16:54:41, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 2: 35%|███▌ | 4388/12384 [9:18:39<16:54:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 2: 35%|███▌ | 4389/12384 [9:18:39<16:53:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 2: 35%|███▌ | 4389/12384 [9:18:47<16:53:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 2: 35%|███▌ | 4390/12384 [9:18:47<16:53:12, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 2: 35%|███▌ | 4390/12384 [9:18:54<16:53:12, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 35%|███▌ | 4391/12384 [9:18:54<16:52:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 35%|███▌ | 4391/12384 [9:19:02<16:52:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 2: 35%|███▌ | 4392/12384 [9:19:02<17:06:00, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 2: 35%|███▌ | 4392/12384 [9:19:10<17:06:00, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=6.81s]
Epoch 2: 35%|███▌ | 4393/12384 [9:19:10<17:00:49, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=6.81s]
Epoch 2: 35%|███▌ | 4393/12384 [9:19:17<17:00:49, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 2: 35%|███▌ | 4394/12384 [9:19:17<16:57:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 2: 35%|███▌ | 4394/12384 [9:19:25<16:57:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 2: 35%|███▌ | 4395/12384 [9:19:25<16:57:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 2: 35%|███▌ | 4395/12384 [9:19:32<16:57:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 2: 35%|███▌ | 4396/12384 [9:19:32<16:56:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 2: 35%|███▌ | 4396/12384 [9:19:40<16:56:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.02s]
Epoch 2: 36%|███▌ | 4397/12384 [9:19:40<17:05:41, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.02s]
Epoch 2: 36%|███▌ | 4397/12384 [9:19:48<17:05:41, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 36%|███▌ | 4398/12384 [9:19:48<17:01:21, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 36%|███▌ | 4398/12384 [9:19:56<17:01:21, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 36%|███▌ | 4399/12384 [9:19:56<16:58:48, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 36%|███▌ | 4399/12384 [9:20:03<16:58:48, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 2: 36%|███▌ | 4400/12384 [9:20:03<17:00:05, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 2: 36%|███▌ | 4400/12384 [9:20:11<17:00:05, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 36%|███▌ | 4401/12384 [9:20:11<16:57:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 36%|███▌ | 4401/12384 [9:20:18<16:57:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 36%|███▌ | 4402/12384 [9:20:18<16:55:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 36%|███▌ | 4402/12384 [9:20:26<16:55:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 36%|███▌ | 4403/12384 [9:20:26<16:54:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 36%|███▌ | 4403/12384 [9:20:34<16:54:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 36%|███▌ | 4404/12384 [9:20:34<16:53:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 36%|███▌ | 4404/12384 [9:20:41<16:53:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 36%|███▌ | 4405/12384 [9:20:41<16:53:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 36%|███▌ | 4405/12384 [9:20:49<16:53:07, 7.62s/it, loss=0.0000, acc=0.9998, iter_time=7.63s]
Epoch 2: 36%|███▌ | 4406/12384 [9:20:49<16:54:45, 7.63s/it, loss=0.0000, acc=0.9998, iter_time=7.63s]
Epoch 2: 36%|███▌ | 4406/12384 [9:20:57<16:54:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 2: 36%|███▌ | 4407/12384 [9:20:57<16:53:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 2: 36%|███▌ | 4407/12384 [9:21:04<16:53:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.32s]
Epoch 2: 36%|███▌ | 4408/12384 [9:21:04<16:53:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.32s]
Epoch 2: 36%|███▌ | 4408/12384 [9:21:12<16:53:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.75s]
Epoch 2: 36%|███▌ | 4409/12384 [9:21:12<16:51:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.75s]
Epoch 2: 36%|███▌ | 4409/12384 [9:21:19<16:51:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 2: 36%|███▌ | 4410/12384 [9:21:19<16:51:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 2: 36%|███▌ | 4410/12384 [9:21:27<16:51:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 36%|███▌ | 4411/12384 [9:21:27<16:50:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 36%|███▌ | 4411/12384 [9:21:35<16:50:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 36%|███▌ | 4412/12384 [9:21:35<16:51:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 36%|███▌ | 4412/12384 [9:21:42<16:51:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.62s]
Epoch 2: 36%|███▌ | 4413/12384 [9:21:42<16:50:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.62s]
Epoch 2: 36%|███▌ | 4413/12384 [9:21:50<16:50:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.61s]
Epoch 2: 36%|███▌ | 4414/12384 [9:21:50<16:50:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.61s]
Epoch 2: 36%|███▌ | 4414/12384 [9:21:57<16:50:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 36%|███▌ | 4415/12384 [9:21:57<16:50:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 36%|███▌ | 4415/12384 [9:22:05<16:50:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 36%|███▌ | 4416/12384 [9:22:05<16:51:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 36%|███▌ | 4416/12384 [9:22:13<16:51:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 36%|███▌ | 4417/12384 [9:22:13<16:50:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 36%|███▌ | 4417/12384 [9:22:21<16:50:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 36%|███▌ | 4418/12384 [9:22:21<17:02:47, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 36%|███▌ | 4418/12384 [9:22:28<17:02:47, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 36%|███▌ | 4419/12384 [9:22:28<16:59:13, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 36%|███▌ | 4419/12384 [9:22:36<16:59:13, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 36%|███▌ | 4420/12384 [9:22:36<16:56:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 36%|███▌ | 4420/12384 [9:22:43<16:56:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 2: 36%|███▌ | 4421/12384 [9:22:43<16:54:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 2: 36%|███▌ | 4421/12384 [9:22:51<16:54:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 2: 36%|███▌ | 4422/12384 [9:22:51<17:02:31, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 2: 36%|███▌ | 4422/12384 [9:22:59<17:02:31, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 36%|███▌ | 4423/12384 [9:22:59<16:59:15, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 36%|███▌ | 4423/12384 [9:23:06<16:59:15, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 36%|███▌ | 4424/12384 [9:23:06<16:56:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 36%|███▌ | 4424/12384 [9:23:14<16:56:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 2: 36%|███▌ | 4425/12384 [9:23:14<16:55:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 2: 36%|███▌ | 4425/12384 [9:23:22<16:55:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 2: 36%|███▌ | 4426/12384 [9:23:22<16:53:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 2: 36%|███▌ | 4426/12384 [9:23:29<16:53:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 36%|███▌ | 4427/12384 [9:23:29<16:53:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 36%|███▌ | 4427/12384 [9:23:37<16:53:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 36%|███▌ | 4428/12384 [9:23:37<16:56:28, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 36%|███▌ | 4428/12384 [9:23:45<16:56:28, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 2: 36%|███▌ | 4429/12384 [9:23:45<16:54:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 2: 36%|███▌ | 4429/12384 [9:23:52<16:54:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 36%|███▌ | 4430/12384 [9:23:52<16:52:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 36%|███▌ | 4430/12384 [9:24:00<16:52:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 36%|███▌ | 4431/12384 [9:24:00<16:52:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 36%|███▌ | 4431/12384 [9:24:08<16:52:09, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.02s]
Epoch 2: 36%|███▌ | 4432/12384 [9:24:08<16:51:14, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.02s]
Epoch 2: 36%|███▌ | 4432/12384 [9:24:15<16:51:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.89s]
Epoch 2: 36%|███▌ | 4433/12384 [9:24:15<16:50:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.89s]
Epoch 2: 36%|███▌ | 4433/12384 [9:24:23<16:50:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.94s]
Epoch 2: 36%|███▌ | 4434/12384 [9:24:23<16:50:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.94s]
Epoch 2: 36%|███▌ | 4434/12384 [9:24:30<16:50:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 2: 36%|███▌ | 4435/12384 [9:24:30<16:49:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 2: 36%|███▌ | 4435/12384 [9:24:38<16:49:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 2: 36%|███▌ | 4436/12384 [9:24:38<16:49:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 2: 36%|███▌ | 4436/12384 [9:24:46<16:49:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 2: 36%|███▌ | 4437/12384 [9:24:46<16:49:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 2: 36%|███▌ | 4437/12384 [9:24:53<16:49:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.91s]
Epoch 2: 36%|███▌ | 4438/12384 [9:24:53<16:47:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.91s]
Epoch 2: 36%|███▌ | 4438/12384 [9:25:01<16:47:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 36%|███▌ | 4439/12384 [9:25:01<16:48:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 36%|███▌ | 4439/12384 [9:25:08<16:48:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 36%|███▌ | 4440/12384 [9:25:08<16:47:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 36%|███▌ | 4440/12384 [9:25:16<16:47:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.15s]
Epoch 2: 36%|███▌ | 4441/12384 [9:25:16<16:46:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.15s]
Epoch 2: 36%|███▌ | 4441/12384 [9:25:24<16:46:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 2: 36%|███▌ | 4442/12384 [9:25:24<16:47:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 2: 36%|███▌ | 4442/12384 [9:25:31<16:47:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 36%|███▌ | 4443/12384 [9:25:31<16:48:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 36%|███▌ | 4443/12384 [9:25:39<16:48:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 2: 36%|███▌ | 4444/12384 [9:25:39<16:47:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 2: 36%|███▌ | 4444/12384 [9:25:47<16:47:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 2: 36%|███▌ | 4445/12384 [9:25:47<17:00:20, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 2: 36%|███▌ | 4445/12384 [9:25:54<17:00:20, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 36%|███▌ | 4446/12384 [9:25:54<16:56:41, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 36%|███▌ | 4446/12384 [9:26:02<16:56:41, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 36%|███▌ | 4447/12384 [9:26:02<16:53:27, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 36%|███▌ | 4447/12384 [9:26:10<16:53:27, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 36%|███▌ | 4448/12384 [9:26:10<16:51:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 36%|███▌ | 4448/12384 [9:26:18<16:51:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 36%|███▌ | 4449/12384 [9:26:18<17:01:46, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 36%|███▌ | 4449/12384 [9:26:25<17:01:46, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 36%|███▌ | 4450/12384 [9:26:25<16:56:24, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 36%|███▌ | 4450/12384 [9:26:33<16:56:24, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 2: 36%|███▌ | 4451/12384 [9:26:33<16:52:52, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 2: 36%|███▌ | 4451/12384 [9:26:40<16:52:52, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 2: 36%|███▌ | 4452/12384 [9:26:40<16:53:25, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 2: 36%|███▌ | 4452/12384 [9:26:48<16:53:25, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=11.19s]
Epoch 2: 36%|███▌ | 4453/12384 [9:26:48<16:50:32, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=11.19s]
Epoch 2: 36%|███▌ | 4453/12384 [9:26:56<16:50:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 36%|███▌ | 4454/12384 [9:26:56<16:48:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 36%|███▌ | 4454/12384 [9:27:03<16:48:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 36%|███▌ | 4455/12384 [9:27:03<16:48:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 36%|███▌ | 4455/12384 [9:27:11<16:48:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 36%|███▌ | 4456/12384 [9:27:11<16:47:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 36%|███▌ | 4456/12384 [9:27:19<16:47:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.78s]
Epoch 2: 36%|███▌ | 4457/12384 [9:27:19<16:48:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.78s]
Epoch 2: 36%|███▌ | 4457/12384 [9:27:26<16:48:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 2: 36%|███▌ | 4458/12384 [9:27:26<16:46:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 2: 36%|███▌ | 4458/12384 [9:27:34<16:46:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 36%|███▌ | 4459/12384 [9:27:34<16:48:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 36%|███▌ | 4459/12384 [9:27:41<16:48:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 2: 36%|███▌ | 4460/12384 [9:27:41<16:47:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 2: 36%|███▌ | 4460/12384 [9:27:49<16:47:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 2: 36%|███▌ | 4461/12384 [9:27:49<16:49:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 2: 36%|███▌ | 4461/12384 [9:27:57<16:49:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.95s]
Epoch 2: 36%|███▌ | 4462/12384 [9:27:57<16:47:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.95s]
Epoch 2: 36%|███▌ | 4462/12384 [9:28:04<16:47:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.53s]
Epoch 2: 36%|███▌ | 4463/12384 [9:28:04<16:46:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.53s]
Epoch 2: 36%|███▌ | 4463/12384 [9:28:12<16:46:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 2: 36%|███▌ | 4464/12384 [9:28:12<16:46:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 2: 36%|███▌ | 4464/12384 [9:28:20<16:46:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 2: 36%|███▌ | 4465/12384 [9:28:20<16:49:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 2: 36%|███▌ | 4465/12384 [9:28:27<16:49:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.04s]
Epoch 2: 36%|███▌ | 4466/12384 [9:28:27<16:51:07, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.04s]
Epoch 2: 36%|███▌ | 4466/12384 [9:28:35<16:51:07, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 2: 36%|███▌ | 4467/12384 [9:28:35<16:48:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 2: 36%|███▌ | 4467/12384 [9:28:43<16:48:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 2: 36%|███▌ | 4468/12384 [9:28:43<16:49:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 2: 36%|███▌ | 4468/12384 [9:28:50<16:49:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 2: 36%|███▌ | 4469/12384 [9:28:50<16:48:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 2: 36%|███▌ | 4469/12384 [9:28:58<16:48:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 36%|███▌ | 4470/12384 [9:28:58<16:47:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 36%|███▌ | 4470/12384 [9:29:06<16:47:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 36%|███▌ | 4471/12384 [9:29:06<16:57:10, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 36%|███▌ | 4471/12384 [9:29:13<16:57:10, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 2: 36%|███▌ | 4472/12384 [9:29:13<16:52:14, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 2: 36%|███▌ | 4472/12384 [9:29:21<16:52:14, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 36%|███▌ | 4473/12384 [9:29:21<16:49:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 36%|███▌ | 4473/12384 [9:29:29<16:49:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 36%|███▌ | 4474/12384 [9:29:29<16:47:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 36%|███▌ | 4474/12384 [9:29:36<16:47:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 36%|███▌ | 4475/12384 [9:29:36<16:45:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 36%|███▌ | 4475/12384 [9:29:44<16:45:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 36%|███▌ | 4476/12384 [9:29:44<16:56:42, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 36%|███▌ | 4476/12384 [9:29:52<16:56:42, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 36%|███▌ | 4477/12384 [9:29:52<16:52:10, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 36%|███▌ | 4477/12384 [9:29:59<16:52:10, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 36%|███▌ | 4478/12384 [9:29:59<16:49:46, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 36%|███▌ | 4478/12384 [9:30:07<16:49:46, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 2: 36%|███▌ | 4479/12384 [9:30:07<16:47:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 2: 36%|███▌ | 4479/12384 [9:30:15<16:47:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.92s]
Epoch 2: 36%|███▌ | 4480/12384 [9:30:15<16:46:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.92s]
Epoch 2: 36%|███▌ | 4480/12384 [9:30:22<16:46:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 36%|███▌ | 4481/12384 [9:30:22<16:48:47, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 36%|███▌ | 4481/12384 [9:30:30<16:48:47, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 2: 36%|███▌ | 4482/12384 [9:30:30<16:46:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 2: 36%|███▌ | 4482/12384 [9:30:37<16:46:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 36%|███▌ | 4483/12384 [9:30:37<16:44:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 36%|███▌ | 4483/12384 [9:30:45<16:44:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 36%|███▌ | 4484/12384 [9:30:45<16:43:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 36%|███▌ | 4484/12384 [9:30:53<16:43:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.66s]
Epoch 2: 36%|███▌ | 4485/12384 [9:30:53<16:42:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.66s]
Epoch 2: 36%|███▌ | 4485/12384 [9:31:00<16:42:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.53s]
Epoch 2: 36%|███▌ | 4486/12384 [9:31:00<16:46:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.53s]
Epoch 2: 36%|███▌ | 4486/12384 [9:31:08<16:46:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.92s]
Epoch 2: 36%|███▌ | 4487/12384 [9:31:08<16:45:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.92s]
Epoch 2: 36%|███▌ | 4487/12384 [9:31:16<16:45:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.80s]
Epoch 2: 36%|███▌ | 4488/12384 [9:31:16<16:43:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.80s]
Epoch 2: 36%|███▌ | 4488/12384 [9:31:23<16:43:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 36%|███▌ | 4489/12384 [9:31:23<16:42:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 36%|███▌ | 4489/12384 [9:31:31<16:42:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 36%|███▋ | 4490/12384 [9:31:31<16:41:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 36%|███▋ | 4490/12384 [9:31:38<16:41:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 2: 36%|███▋ | 4491/12384 [9:31:38<16:41:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 2: 36%|███▋ | 4491/12384 [9:31:46<16:41:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 2: 36%|███▋ | 4492/12384 [9:31:46<16:41:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 2: 36%|███▋ | 4492/12384 [9:31:54<16:41:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 36%|███▋ | 4493/12384 [9:31:54<16:41:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 36%|███▋ | 4493/12384 [9:32:01<16:41:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 36%|███▋ | 4494/12384 [9:32:01<16:40:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 36%|███▋ | 4494/12384 [9:32:09<16:40:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 2: 36%|███▋ | 4495/12384 [9:32:09<16:39:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 2: 36%|███▋ | 4495/12384 [9:32:17<16:39:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 2: 36%|███▋ | 4496/12384 [9:32:17<16:42:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 2: 36%|███▋ | 4496/12384 [9:32:24<16:42:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 2: 36%|███▋ | 4497/12384 [9:32:24<16:56:17, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 2: 36%|███▋ | 4497/12384 [9:32:32<16:56:17, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 36%|███▋ | 4498/12384 [9:32:32<16:50:44, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 36%|███▋ | 4498/12384 [9:32:40<16:50:44, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 2: 36%|███▋ | 4499/12384 [9:32:40<16:47:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 2: 36%|███▋ | 4499/12384 [9:32:47<16:47:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 2: 36%|███▋ | 4500/12384 [9:32:47<16:44:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 2: 36%|███▋ | 4500/12384 [9:32:55<16:44:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 36%|███▋ | 4501/12384 [9:32:55<16:46:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 36%|███▋ | 4501/12384 [9:33:03<16:46:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 36%|███▋ | 4502/12384 [9:33:03<16:44:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 36%|███▋ | 4502/12384 [9:33:10<16:44:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.95s]
Epoch 2: 36%|███▋ | 4503/12384 [9:33:10<16:42:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.95s]
Epoch 2: 36%|███▋ | 4503/12384 [9:33:18<16:42:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.65s]
Epoch 2: 36%|███▋ | 4504/12384 [9:33:18<16:41:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.65s]
Epoch 2: 36%|███▋ | 4504/12384 [9:33:25<16:41:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 36%|███▋ | 4505/12384 [9:33:25<16:43:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 36%|███▋ | 4505/12384 [9:33:33<16:43:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 36%|███▋ | 4506/12384 [9:33:33<16:42:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 36%|███▋ | 4506/12384 [9:33:41<16:42:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 36%|███▋ | 4507/12384 [9:33:41<16:41:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 36%|███▋ | 4507/12384 [9:33:48<16:41:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 2: 36%|███▋ | 4508/12384 [9:33:48<16:39:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 2: 36%|███▋ | 4508/12384 [9:33:56<16:39:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 2: 36%|███▋ | 4509/12384 [9:33:56<16:41:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 2: 36%|███▋ | 4509/12384 [9:34:04<16:41:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 36%|███▋ | 4510/12384 [9:34:04<16:40:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 36%|███▋ | 4510/12384 [9:34:11<16:40:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.00s]
Epoch 2: 36%|███▋ | 4511/12384 [9:34:11<16:39:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.00s]
Epoch 2: 36%|███▋ | 4511/12384 [9:34:19<16:39:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.15s]
Epoch 2: 36%|███▋ | 4512/12384 [9:34:19<16:38:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.15s]
Epoch 2: 36%|███▋ | 4512/12384 [9:34:26<16:38:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 36%|███▋ | 4513/12384 [9:34:26<16:38:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 36%|███▋ | 4513/12384 [9:34:34<16:38:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 36%|███▋ | 4514/12384 [9:34:34<16:38:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 36%|███▋ | 4514/12384 [9:34:42<16:38:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 36%|███▋ | 4515/12384 [9:34:42<16:43:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 36%|███▋ | 4515/12384 [9:34:49<16:43:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.55s]
Epoch 2: 36%|███▋ | 4516/12384 [9:34:49<16:42:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.55s]
Epoch 2: 36%|███▋ | 4516/12384 [9:34:57<16:42:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 2: 36%|███▋ | 4517/12384 [9:34:57<16:41:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 2: 36%|███▋ | 4517/12384 [9:35:05<16:41:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 2: 36%|███▋ | 4518/12384 [9:35:05<16:41:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 2: 36%|███▋ | 4518/12384 [9:35:12<16:41:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 2: 36%|███▋ | 4519/12384 [9:35:12<16:39:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 2: 36%|███▋ | 4519/12384 [9:35:20<16:39:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 36%|███▋ | 4520/12384 [9:35:20<16:38:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 36%|███▋ | 4520/12384 [9:35:27<16:38:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 37%|███▋ | 4521/12384 [9:35:27<16:37:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 37%|███▋ | 4521/12384 [9:35:35<16:37:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 37%|███▋ | 4522/12384 [9:35:35<16:42:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 37%|███▋ | 4522/12384 [9:35:43<16:42:19, 7.65s/it, loss=0.0004, acc=0.9981, iter_time=5.17s]
Epoch 2: 37%|███▋ | 4523/12384 [9:35:43<16:54:06, 7.74s/it, loss=0.0004, acc=0.9981, iter_time=5.17s]
Epoch 2: 37%|███▋ | 4523/12384 [9:35:51<16:54:06, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=10.50s]
Epoch 2: 37%|███▋ | 4524/12384 [9:35:51<16:49:34, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.50s]
Epoch 2: 37%|███▋ | 4524/12384 [9:35:58<16:49:34, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 37%|███▋ | 4525/12384 [9:35:58<16:46:46, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 37%|███▋ | 4525/12384 [9:36:06<16:46:46, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 37%|███▋ | 4526/12384 [9:36:06<16:42:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 37%|███▋ | 4526/12384 [9:36:14<16:42:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 37%|███▋ | 4527/12384 [9:36:14<16:40:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 37%|███▋ | 4527/12384 [9:36:21<16:40:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 37%|███▋ | 4528/12384 [9:36:21<16:39:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 37%|███▋ | 4528/12384 [9:36:29<16:39:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 37%|███▋ | 4529/12384 [9:36:29<16:37:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 37%|███▋ | 4529/12384 [9:36:36<16:37:54, 7.62s/it, loss=0.0001, acc=0.9994, iter_time=7.60s]
Epoch 2: 37%|███▋ | 4530/12384 [9:36:36<16:37:34, 7.62s/it, loss=0.0001, acc=0.9994, iter_time=7.60s]
Epoch 2: 37%|███▋ | 4530/12384 [9:36:44<16:37:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 37%|███▋ | 4531/12384 [9:36:44<16:36:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 37%|███▋ | 4531/12384 [9:36:52<16:36:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 37%|███▋ | 4532/12384 [9:36:52<16:35:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 37%|███▋ | 4532/12384 [9:36:59<16:35:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.60s]
Epoch 2: 37%|███▋ | 4533/12384 [9:36:59<16:35:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.60s]
Epoch 2: 37%|███▋ | 4533/12384 [9:37:07<16:35:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 2: 37%|███▋ | 4534/12384 [9:37:07<16:35:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 2: 37%|███▋ | 4534/12384 [9:37:14<16:35:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 37%|███▋ | 4535/12384 [9:37:14<16:36:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 37%|███▋ | 4535/12384 [9:37:22<16:36:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 37%|███▋ | 4536/12384 [9:37:22<16:35:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 37%|███▋ | 4536/12384 [9:37:30<16:35:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.22s]
Epoch 2: 37%|███▋ | 4537/12384 [9:37:30<16:37:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.22s]
Epoch 2: 37%|███▋ | 4537/12384 [9:37:37<16:37:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 2: 37%|███▋ | 4538/12384 [9:37:37<16:36:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 2: 37%|███▋ | 4538/12384 [9:37:45<16:36:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 37%|███▋ | 4539/12384 [9:37:45<16:35:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 37%|███▋ | 4539/12384 [9:37:53<16:35:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 2: 37%|███▋ | 4540/12384 [9:37:53<16:34:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 2: 37%|███▋ | 4540/12384 [9:38:00<16:34:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 2: 37%|███▋ | 4541/12384 [9:38:00<16:33:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 2: 37%|███▋ | 4541/12384 [9:38:08<16:33:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.58s]
Epoch 2: 37%|███▋ | 4542/12384 [9:38:08<16:34:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.58s]
Epoch 2: 37%|███▋ | 4542/12384 [9:38:15<16:34:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 2: 37%|███▋ | 4543/12384 [9:38:15<16:34:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 2: 37%|███▋ | 4543/12384 [9:38:23<16:34:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.87s]
Epoch 2: 37%|███▋ | 4544/12384 [9:38:23<16:35:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.87s]
Epoch 2: 37%|███▋ | 4544/12384 [9:38:31<16:35:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 37%|███▋ | 4545/12384 [9:38:31<16:35:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 37%|███▋ | 4545/12384 [9:38:38<16:35:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 2: 37%|███▋ | 4546/12384 [9:38:38<16:34:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 2: 37%|███▋ | 4546/12384 [9:38:46<16:34:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 2: 37%|███▋ | 4547/12384 [9:38:46<16:33:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 2: 37%|███▋ | 4547/12384 [9:38:53<16:33:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 37%|███▋ | 4548/12384 [9:38:53<16:33:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 37%|███▋ | 4548/12384 [9:39:01<16:33:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 37%|███▋ | 4549/12384 [9:39:01<16:45:25, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 37%|███▋ | 4549/12384 [9:39:09<16:45:25, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 37%|███▋ | 4550/12384 [9:39:09<16:41:20, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 37%|███▋ | 4550/12384 [9:39:17<16:41:20, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 37%|███▋ | 4551/12384 [9:39:17<16:38:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 37%|███▋ | 4551/12384 [9:39:24<16:38:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 37%|███▋ | 4552/12384 [9:39:24<16:37:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 37%|███▋ | 4552/12384 [9:39:32<16:37:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 37%|███▋ | 4553/12384 [9:39:32<16:35:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 37%|███▋ | 4553/12384 [9:39:40<16:35:58, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.87s]
Epoch 2: 37%|███▋ | 4554/12384 [9:39:40<16:45:03, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.87s]
Epoch 2: 37%|███▋ | 4554/12384 [9:39:47<16:45:03, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 2: 37%|███▋ | 4555/12384 [9:39:47<16:41:47, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 2: 37%|███▋ | 4555/12384 [9:39:55<16:41:47, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 2: 37%|███▋ | 4556/12384 [9:39:55<16:37:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 2: 37%|███▋ | 4556/12384 [9:40:02<16:37:59, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.58s]
Epoch 2: 37%|███▋ | 4557/12384 [9:40:02<16:36:42, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.58s]
Epoch 2: 37%|███▋ | 4557/12384 [9:40:10<16:36:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 37%|███▋ | 4558/12384 [9:40:10<16:34:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 37%|███▋ | 4558/12384 [9:40:18<16:34:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 37%|███▋ | 4559/12384 [9:40:18<16:33:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 37%|███▋ | 4559/12384 [9:40:25<16:33:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 2: 37%|███▋ | 4560/12384 [9:40:25<16:33:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 2: 37%|███▋ | 4560/12384 [9:40:33<16:33:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 37%|███▋ | 4561/12384 [9:40:33<16:33:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 37%|███▋ | 4561/12384 [9:40:40<16:33:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 37%|███▋ | 4562/12384 [9:40:40<16:33:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 37%|███▋ | 4562/12384 [9:40:48<16:33:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 37%|███▋ | 4563/12384 [9:40:48<16:32:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 37%|███▋ | 4563/12384 [9:40:56<16:32:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 37%|███▋ | 4564/12384 [9:40:56<16:31:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 37%|███▋ | 4564/12384 [9:41:03<16:31:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 37%|███▋ | 4565/12384 [9:41:03<16:31:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 37%|███▋ | 4565/12384 [9:41:11<16:31:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 37%|███▋ | 4566/12384 [9:41:11<16:31:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 37%|███▋ | 4566/12384 [9:41:19<16:31:10, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 2: 37%|███▋ | 4567/12384 [9:41:19<16:31:03, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 2: 37%|███▋ | 4567/12384 [9:41:26<16:31:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 37%|███▋ | 4568/12384 [9:41:26<16:30:37, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 37%|███▋ | 4568/12384 [9:41:34<16:30:37, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 2: 37%|███▋ | 4569/12384 [9:41:34<16:31:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 2: 37%|███▋ | 4569/12384 [9:41:41<16:31:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 2: 37%|███▋ | 4570/12384 [9:41:41<16:30:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 2: 37%|███▋ | 4570/12384 [9:41:49<16:30:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 37%|███▋ | 4571/12384 [9:41:49<16:30:01, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 37%|███▋ | 4571/12384 [9:41:57<16:30:01, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 37%|███▋ | 4572/12384 [9:41:57<16:31:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 37%|███▋ | 4572/12384 [9:42:04<16:31:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 37%|███▋ | 4573/12384 [9:42:04<16:30:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 37%|███▋ | 4573/12384 [9:42:12<16:30:57, 7.61s/it, loss=0.0003, acc=0.9992, iter_time=7.92s]
Epoch 2: 37%|███▋ | 4574/12384 [9:42:12<16:30:36, 7.61s/it, loss=0.0003, acc=0.9992, iter_time=7.92s]
Epoch 2: 37%|███▋ | 4574/12384 [9:42:19<16:30:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 37%|███▋ | 4575/12384 [9:42:19<16:30:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 37%|███▋ | 4575/12384 [9:42:27<16:30:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 37%|███▋ | 4576/12384 [9:42:27<16:43:28, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 37%|███▋ | 4576/12384 [9:42:35<16:43:28, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.49s]
Epoch 2: 37%|███▋ | 4577/12384 [9:42:35<16:40:11, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.49s]
Epoch 2: 37%|███▋ | 4577/12384 [9:42:43<16:40:11, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 37%|███▋ | 4578/12384 [9:42:43<16:37:41, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 37%|███▋ | 4578/12384 [9:42:50<16:37:41, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 37%|███▋ | 4579/12384 [9:42:50<16:34:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 37%|███▋ | 4579/12384 [9:42:58<16:34:14, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=5.33s]
Epoch 2: 37%|███▋ | 4580/12384 [9:42:58<16:32:59, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.33s]
Epoch 2: 37%|███▋ | 4580/12384 [9:43:06<16:32:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 2: 37%|███▋ | 4581/12384 [9:43:06<16:41:17, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 2: 37%|███▋ | 4581/12384 [9:43:13<16:41:17, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 37%|███▋ | 4582/12384 [9:43:13<16:37:39, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 37%|███▋ | 4582/12384 [9:43:21<16:37:39, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.33s]
Epoch 2: 37%|███▋ | 4583/12384 [9:43:21<16:35:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.33s]
Epoch 2: 37%|███▋ | 4583/12384 [9:43:28<16:35:02, 7.65s/it, loss=0.0002, acc=0.9989, iter_time=10.88s]
Epoch 2: 37%|███▋ | 4584/12384 [9:43:28<16:33:24, 7.64s/it, loss=0.0002, acc=0.9989, iter_time=10.88s]
Epoch 2: 37%|███▋ | 4584/12384 [9:43:36<16:33:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 37%|███▋ | 4585/12384 [9:43:36<16:31:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 37%|███▋ | 4585/12384 [9:43:44<16:31:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 37%|███▋ | 4586/12384 [9:43:44<16:29:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 37%|███▋ | 4586/12384 [9:43:51<16:29:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 2: 37%|███▋ | 4587/12384 [9:43:51<16:29:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 2: 37%|███▋ | 4587/12384 [9:43:59<16:29:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 37%|███▋ | 4588/12384 [9:43:59<16:28:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 37%|███▋ | 4588/12384 [9:44:06<16:28:10, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 2: 37%|███▋ | 4589/12384 [9:44:06<16:28:05, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 2: 37%|███▋ | 4589/12384 [9:44:14<16:28:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 37%|███▋ | 4590/12384 [9:44:14<16:28:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 37%|███▋ | 4590/12384 [9:44:22<16:28:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 37%|███▋ | 4591/12384 [9:44:22<16:28:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 37%|███▋ | 4591/12384 [9:44:29<16:28:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 37%|███▋ | 4592/12384 [9:44:29<16:28:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 37%|███▋ | 4592/12384 [9:44:37<16:28:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 37%|███▋ | 4593/12384 [9:44:37<16:27:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 37%|███▋ | 4593/12384 [9:44:45<16:27:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 37%|███▋ | 4594/12384 [9:44:45<16:28:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 37%|███▋ | 4594/12384 [9:44:52<16:28:21, 7.61s/it, loss=0.0002, acc=0.9984, iter_time=7.63s]
Epoch 2: 37%|███▋ | 4595/12384 [9:44:52<16:27:42, 7.61s/it, loss=0.0002, acc=0.9984, iter_time=7.63s]
Epoch 2: 37%|███▋ | 4595/12384 [9:45:00<16:27:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 37%|███▋ | 4596/12384 [9:45:00<16:26:43, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 37%|███▋ | 4596/12384 [9:45:07<16:26:43, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 2: 37%|███▋ | 4597/12384 [9:45:07<16:26:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 2: 37%|███▋ | 4597/12384 [9:45:15<16:26:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 2: 37%|███▋ | 4598/12384 [9:45:15<16:27:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 2: 37%|███▋ | 4598/12384 [9:45:23<16:27:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 2: 37%|███▋ | 4599/12384 [9:45:23<16:27:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 2: 37%|███▋ | 4599/12384 [9:45:30<16:27:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.59s]
Epoch 2: 37%|███▋ | 4600/12384 [9:45:30<16:27:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.59s]
Epoch 2: 37%|███▋ | 4600/12384 [9:45:38<16:27:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 2: 37%|███▋ | 4601/12384 [9:45:38<16:27:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 2: 37%|███▋ | 4601/12384 [9:45:46<16:27:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 2: 37%|███▋ | 4602/12384 [9:45:46<16:40:19, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 2: 37%|███▋ | 4602/12384 [9:45:53<16:40:19, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 37%|███▋ | 4603/12384 [9:45:53<16:36:25, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 37%|███▋ | 4603/12384 [9:46:01<16:36:25, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 37%|███▋ | 4604/12384 [9:46:01<16:32:58, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 37%|███▋ | 4604/12384 [9:46:09<16:32:58, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 37%|███▋ | 4605/12384 [9:46:09<16:31:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 37%|███▋ | 4605/12384 [9:46:16<16:31:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 37%|███▋ | 4606/12384 [9:46:16<16:39:39, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 37%|███▋ | 4606/12384 [9:46:24<16:39:39, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 2: 37%|███▋ | 4607/12384 [9:46:24<16:34:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 2: 37%|███▋ | 4607/12384 [9:46:32<16:34:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.90s]
Epoch 2: 37%|███▋ | 4608/12384 [9:46:32<16:34:32, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.90s]
Epoch 2: 37%|███▋ | 4608/12384 [9:46:39<16:34:32, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 37%|███▋ | 4609/12384 [9:46:39<16:31:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 37%|███▋ | 4609/12384 [9:46:47<16:31:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 37%|███▋ | 4610/12384 [9:46:47<16:29:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 37%|███▋ | 4610/12384 [9:46:55<16:29:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.79s]
Epoch 2: 37%|███▋ | 4611/12384 [9:46:55<16:29:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.79s]
Epoch 2: 37%|███▋ | 4611/12384 [9:47:02<16:29:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 2: 37%|███▋ | 4612/12384 [9:47:02<16:29:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 2: 37%|███▋ | 4612/12384 [9:47:10<16:29:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 2: 37%|███▋ | 4613/12384 [9:47:10<16:27:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 2: 37%|███▋ | 4613/12384 [9:47:17<16:27:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 2: 37%|███▋ | 4614/12384 [9:47:17<16:26:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 2: 37%|███▋ | 4614/12384 [9:47:25<16:26:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 2: 37%|███▋ | 4615/12384 [9:47:25<16:26:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 2: 37%|███▋ | 4615/12384 [9:47:33<16:26:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.29s]
Epoch 2: 37%|███▋ | 4616/12384 [9:47:33<16:29:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.29s]
Epoch 2: 37%|███▋ | 4616/12384 [9:47:40<16:29:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 2: 37%|███▋ | 4617/12384 [9:47:40<16:29:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 2: 37%|███▋ | 4617/12384 [9:47:48<16:29:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 2: 37%|███▋ | 4618/12384 [9:47:48<16:28:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 2: 37%|███▋ | 4618/12384 [9:47:56<16:28:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 2: 37%|███▋ | 4619/12384 [9:47:56<16:27:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 2: 37%|███▋ | 4619/12384 [9:48:03<16:27:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.26s]
Epoch 2: 37%|███▋ | 4620/12384 [9:48:03<16:26:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.26s]
Epoch 2: 37%|███▋ | 4620/12384 [9:48:11<16:26:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.97s]
Epoch 2: 37%|███▋ | 4621/12384 [9:48:11<16:24:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.97s]
Epoch 2: 37%|███▋ | 4621/12384 [9:48:18<16:24:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.99s]
Epoch 2: 37%|███▋ | 4622/12384 [9:48:18<16:23:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.99s]
Epoch 2: 37%|███▋ | 4622/12384 [9:48:26<16:23:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 37%|███▋ | 4623/12384 [9:48:26<16:23:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 37%|███▋ | 4623/12384 [9:48:34<16:23:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.30s]
Epoch 2: 37%|███▋ | 4624/12384 [9:48:34<16:23:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.30s]
Epoch 2: 37%|███▋ | 4624/12384 [9:48:41<16:23:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 37%|███▋ | 4625/12384 [9:48:41<16:24:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 37%|███▋ | 4625/12384 [9:48:49<16:24:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 37%|███▋ | 4626/12384 [9:48:49<16:23:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 37%|███▋ | 4626/12384 [9:48:56<16:23:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 2: 37%|███▋ | 4627/12384 [9:48:56<16:24:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 2: 37%|███▋ | 4627/12384 [9:49:04<16:24:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 2: 37%|███▋ | 4628/12384 [9:49:04<16:23:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 2: 37%|███▋ | 4628/12384 [9:49:12<16:23:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 2: 37%|███▋ | 4629/12384 [9:49:12<16:35:02, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 2: 37%|███▋ | 4629/12384 [9:49:20<16:35:02, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 2: 37%|███▋ | 4630/12384 [9:49:20<16:32:20, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 2: 37%|███▋ | 4630/12384 [9:49:27<16:32:20, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.86s]
Epoch 2: 37%|███▋ | 4631/12384 [9:49:27<16:29:43, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.86s]
Epoch 2: 37%|███▋ | 4631/12384 [9:49:35<16:29:43, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.78s]
Epoch 2: 37%|███▋ | 4632/12384 [9:49:35<16:27:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.78s]
Epoch 2: 37%|███▋ | 4632/12384 [9:49:43<16:27:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 2: 37%|███▋ | 4633/12384 [9:49:43<16:36:47, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 2: 37%|███▋ | 4633/12384 [9:49:50<16:36:47, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 37%|███▋ | 4634/12384 [9:49:50<16:31:57, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 37%|███▋ | 4634/12384 [9:49:58<16:31:57, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 2: 37%|███▋ | 4635/12384 [9:49:58<16:29:04, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 2: 37%|███▋ | 4635/12384 [9:50:05<16:29:04, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=6.27s]
Epoch 2: 37%|███▋ | 4636/12384 [9:50:05<16:26:37, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.27s]
Epoch 2: 37%|███▋ | 4636/12384 [9:50:13<16:26:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 37%|███▋ | 4637/12384 [9:50:13<16:24:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 37%|███▋ | 4637/12384 [9:50:21<16:24:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.72s]
Epoch 2: 37%|███▋ | 4638/12384 [9:50:21<16:23:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.72s]
Epoch 2: 37%|███▋ | 4638/12384 [9:50:28<16:23:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 37%|███▋ | 4639/12384 [9:50:28<16:23:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 37%|███▋ | 4639/12384 [9:50:36<16:23:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 37%|███▋ | 4640/12384 [9:50:36<16:22:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 37%|███▋ | 4640/12384 [9:50:43<16:22:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 2: 37%|███▋ | 4641/12384 [9:50:43<16:22:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 2: 37%|███▋ | 4641/12384 [9:50:51<16:22:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.95s]
Epoch 2: 37%|███▋ | 4642/12384 [9:50:51<16:22:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.95s]
Epoch 2: 37%|███▋ | 4642/12384 [9:50:59<16:22:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 37%|███▋ | 4643/12384 [9:50:59<16:21:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 37%|███▋ | 4643/12384 [9:51:06<16:21:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 38%|███▊ | 4644/12384 [9:51:06<16:21:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 38%|███▊ | 4644/12384 [9:51:14<16:21:41, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.26s]
Epoch 2: 38%|███▊ | 4645/12384 [9:51:14<16:21:40, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.26s]
Epoch 2: 38%|███▊ | 4645/12384 [9:51:22<16:21:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 2: 38%|███▊ | 4646/12384 [9:51:22<16:22:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 2: 38%|███▊ | 4646/12384 [9:51:29<16:22:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 2: 38%|███▊ | 4647/12384 [9:51:29<16:20:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 2: 38%|███▊ | 4647/12384 [9:51:37<16:20:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.32s]
Epoch 2: 38%|███▊ | 4648/12384 [9:51:37<16:21:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.32s]
Epoch 2: 38%|███▊ | 4648/12384 [9:51:44<16:21:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 2: 38%|███▊ | 4649/12384 [9:51:44<16:21:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 2: 38%|███▊ | 4649/12384 [9:51:52<16:21:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 38%|███▊ | 4650/12384 [9:51:52<16:20:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 38%|███▊ | 4650/12384 [9:52:00<16:20:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 38%|███▊ | 4651/12384 [9:52:00<16:20:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 38%|███▊ | 4651/12384 [9:52:07<16:20:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.77s]
Epoch 2: 38%|███▊ | 4652/12384 [9:52:07<16:20:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.77s]
Epoch 2: 38%|███▊ | 4652/12384 [9:52:15<16:20:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 2: 38%|███▊ | 4653/12384 [9:52:15<16:20:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 2: 38%|███▊ | 4653/12384 [9:52:22<16:20:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 38%|███▊ | 4654/12384 [9:52:22<16:20:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 38%|███▊ | 4654/12384 [9:52:30<16:20:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 38%|███▊ | 4655/12384 [9:52:30<16:32:36, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 38%|███▊ | 4655/12384 [9:52:38<16:32:36, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=8.27s]
Epoch 2: 38%|███▊ | 4656/12384 [9:52:38<16:29:35, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=8.27s]
Epoch 2: 38%|███▊ | 4656/12384 [9:52:46<16:29:35, 7.68s/it, loss=0.0003, acc=0.9986, iter_time=7.21s]
Epoch 2: 38%|███▊ | 4657/12384 [9:52:46<16:26:26, 7.66s/it, loss=0.0003, acc=0.9986, iter_time=7.21s]
Epoch 2: 38%|███▊ | 4657/12384 [9:52:53<16:26:26, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 2: 38%|███▊ | 4658/12384 [9:52:53<16:23:51, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 2: 38%|███▊ | 4658/12384 [9:53:01<16:23:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 38%|███▊ | 4659/12384 [9:53:01<16:22:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 38%|███▊ | 4659/12384 [9:53:09<16:22:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 38%|███▊ | 4660/12384 [9:53:09<16:32:40, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 38%|███▊ | 4660/12384 [9:53:16<16:32:40, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 38%|███▊ | 4661/12384 [9:53:16<16:30:32, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 38%|███▊ | 4661/12384 [9:53:24<16:30:32, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 2: 38%|███▊ | 4662/12384 [9:53:24<16:27:16, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 2: 38%|███▊ | 4662/12384 [9:53:32<16:27:16, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 2: 38%|███▊ | 4663/12384 [9:53:32<16:24:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 2: 38%|███▊ | 4663/12384 [9:53:39<16:24:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 38%|███▊ | 4664/12384 [9:53:39<16:21:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 38%|███▊ | 4664/12384 [9:53:47<16:21:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 38%|███▊ | 4665/12384 [9:53:47<16:20:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 38%|███▊ | 4665/12384 [9:53:54<16:20:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 38%|███▊ | 4666/12384 [9:53:54<16:19:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 38%|███▊ | 4666/12384 [9:54:02<16:19:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 2: 38%|███▊ | 4667/12384 [9:54:02<16:19:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 2: 38%|███▊ | 4667/12384 [9:54:10<16:19:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 38%|███▊ | 4668/12384 [9:54:10<16:19:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 38%|███▊ | 4668/12384 [9:54:17<16:19:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 2: 38%|███▊ | 4669/12384 [9:54:17<16:19:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 2: 38%|███▊ | 4669/12384 [9:54:25<16:19:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 2: 38%|███▊ | 4670/12384 [9:54:25<16:19:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 2: 38%|███▊ | 4670/12384 [9:54:32<16:19:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 38%|███▊ | 4671/12384 [9:54:32<16:18:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 38%|███▊ | 4671/12384 [9:54:40<16:18:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 38%|███▊ | 4672/12384 [9:54:40<16:18:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 38%|███▊ | 4672/12384 [9:54:48<16:18:19, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.22s]
Epoch 2: 38%|███▊ | 4673/12384 [9:54:48<16:18:21, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.22s]
Epoch 2: 38%|███▊ | 4673/12384 [9:54:55<16:18:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 2: 38%|███▊ | 4674/12384 [9:54:55<16:18:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 2: 38%|███▊ | 4674/12384 [9:55:03<16:18:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 2: 38%|███▊ | 4675/12384 [9:55:03<16:22:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 2: 38%|███▊ | 4675/12384 [9:55:11<16:22:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 2: 38%|███▊ | 4676/12384 [9:55:11<16:20:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 2: 38%|███▊ | 4676/12384 [9:55:18<16:20:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 38%|███▊ | 4677/12384 [9:55:18<16:20:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 38%|███▊ | 4677/12384 [9:55:26<16:20:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 2: 38%|███▊ | 4678/12384 [9:55:26<16:17:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 2: 38%|███▊ | 4678/12384 [9:55:33<16:17:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 38%|███▊ | 4679/12384 [9:55:33<16:18:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 38%|███▊ | 4679/12384 [9:55:41<16:18:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 2: 38%|███▊ | 4680/12384 [9:55:41<16:17:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 2: 38%|███▊ | 4680/12384 [9:55:49<16:17:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.63s]
Epoch 2: 38%|███▊ | 4681/12384 [9:55:49<16:32:54, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=5.63s]
Epoch 2: 38%|███▊ | 4681/12384 [9:55:57<16:32:54, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 2: 38%|███▊ | 4682/12384 [9:55:57<16:28:26, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 2: 38%|███▊ | 4682/12384 [9:56:04<16:28:26, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.28s]
Epoch 2: 38%|███▊ | 4683/12384 [9:56:04<16:26:18, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.28s]
Epoch 2: 38%|███▊ | 4683/12384 [9:56:12<16:26:18, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 2: 38%|███▊ | 4684/12384 [9:56:12<16:23:58, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 2: 38%|███▊ | 4684/12384 [9:56:20<16:23:58, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 2: 38%|███▊ | 4685/12384 [9:56:20<16:22:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 2: 38%|███▊ | 4685/12384 [9:56:27<16:22:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.30s]
Epoch 2: 38%|███▊ | 4686/12384 [9:56:27<16:21:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.30s]
Epoch 2: 38%|███▊ | 4686/12384 [9:56:35<16:21:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 2: 38%|███▊ | 4687/12384 [9:56:35<16:30:46, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 2: 38%|███▊ | 4687/12384 [9:56:43<16:30:46, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 38%|███▊ | 4688/12384 [9:56:43<16:27:15, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 38%|███▊ | 4688/12384 [9:56:50<16:27:15, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 38%|███▊ | 4689/12384 [9:56:50<16:23:58, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 38%|███▊ | 4689/12384 [9:56:58<16:23:58, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 38%|███▊ | 4690/12384 [9:56:58<16:21:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 38%|███▊ | 4690/12384 [9:57:06<16:21:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 38%|███▊ | 4691/12384 [9:57:06<16:19:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 38%|███▊ | 4691/12384 [9:57:13<16:19:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 38%|███▊ | 4692/12384 [9:57:13<16:18:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 38%|███▊ | 4692/12384 [9:57:21<16:18:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 38%|███▊ | 4693/12384 [9:57:21<16:17:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 38%|███▊ | 4693/12384 [9:57:28<16:17:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 2: 38%|███▊ | 4694/12384 [9:57:28<16:15:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 2: 38%|███▊ | 4694/12384 [9:57:36<16:15:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 38%|███▊ | 4695/12384 [9:57:36<16:14:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 38%|███▊ | 4695/12384 [9:57:44<16:14:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.34s]
Epoch 2: 38%|███▊ | 4696/12384 [9:57:44<16:15:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.34s]
Epoch 2: 38%|███▊ | 4696/12384 [9:57:51<16:15:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.63s]
Epoch 2: 38%|███▊ | 4697/12384 [9:57:51<16:14:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.63s]
Epoch 2: 38%|███▊ | 4697/12384 [9:57:59<16:14:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 2: 38%|███▊ | 4698/12384 [9:57:59<16:14:08, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 2: 38%|███▊ | 4698/12384 [9:58:06<16:14:08, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 38%|███▊ | 4699/12384 [9:58:06<16:15:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 38%|███▊ | 4699/12384 [9:58:14<16:15:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 38%|███▊ | 4700/12384 [9:58:14<16:15:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 38%|███▊ | 4700/12384 [9:58:22<16:15:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 2: 38%|███▊ | 4701/12384 [9:58:22<16:15:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 2: 38%|███▊ | 4701/12384 [9:58:29<16:15:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 2: 38%|███▊ | 4702/12384 [9:58:29<16:14:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 2: 38%|███▊ | 4702/12384 [9:58:37<16:14:37, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.64s]
Epoch 2: 38%|███▊ | 4703/12384 [9:58:37<16:14:47, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.64s]
Epoch 2: 38%|███▊ | 4703/12384 [9:58:44<16:14:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 38%|███▊ | 4704/12384 [9:58:44<16:13:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 38%|███▊ | 4704/12384 [9:58:52<16:13:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 38%|███▊ | 4705/12384 [9:58:52<16:14:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 38%|███▊ | 4705/12384 [9:59:00<16:14:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.51s]
Epoch 2: 38%|███▊ | 4706/12384 [9:59:00<16:14:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.51s]
Epoch 2: 38%|███▊ | 4706/12384 [9:59:08<16:14:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 2: 38%|███▊ | 4707/12384 [9:59:08<16:25:36, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 2: 38%|███▊ | 4707/12384 [9:59:15<16:25:36, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 2: 38%|███▊ | 4708/12384 [9:59:15<16:22:52, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 2: 38%|███▊ | 4708/12384 [9:59:23<16:22:52, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 2: 38%|███▊ | 4709/12384 [9:59:23<16:19:51, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 2: 38%|███▊ | 4709/12384 [9:59:30<16:19:51, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=6.67s]
Epoch 2: 38%|███▊ | 4710/12384 [9:59:30<16:17:22, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.67s]
Epoch 2: 38%|███▊ | 4710/12384 [9:59:38<16:17:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 2: 38%|███▊ | 4711/12384 [9:59:38<16:15:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 2: 38%|███▊ | 4711/12384 [9:59:46<16:15:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.82s]
Epoch 2: 38%|███▊ | 4712/12384 [9:59:46<16:13:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.82s]
Epoch 2: 38%|███▊ | 4712/12384 [9:59:53<16:13:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 38%|███▊ | 4713/12384 [9:59:53<16:12:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 38%|███▊ | 4713/12384 [10:00:01<16:12:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 2: 38%|███▊ | 4714/12384 [10:00:01<16:12:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 2: 38%|███▊ | 4714/12384 [10:00:08<16:12:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 2: 38%|███▊ | 4715/12384 [10:00:08<16:12:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 2: 38%|███▊ | 4715/12384 [10:00:16<16:12:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 2: 38%|███▊ | 4716/12384 [10:00:16<16:11:43, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 2: 38%|███▊ | 4716/12384 [10:00:24<16:11:43, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 2: 38%|███▊ | 4717/12384 [10:00:24<16:10:48, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 2: 38%|███▊ | 4717/12384 [10:00:31<16:10:48, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 38%|███▊ | 4718/12384 [10:00:31<16:10:00, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 38%|███▊ | 4718/12384 [10:00:39<16:10:00, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 38%|███▊ | 4719/12384 [10:00:39<16:09:54, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 38%|███▊ | 4719/12384 [10:00:46<16:09:54, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 38%|███▊ | 4720/12384 [10:00:46<16:11:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 38%|███▊ | 4720/12384 [10:00:54<16:11:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 38%|███▊ | 4721/12384 [10:00:54<16:10:33, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 38%|███▊ | 4721/12384 [10:01:02<16:10:33, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 38%|███▊ | 4722/12384 [10:01:02<16:12:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 38%|███▊ | 4722/12384 [10:01:09<16:12:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 38%|███▊ | 4723/12384 [10:01:09<16:12:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 38%|███▊ | 4723/12384 [10:01:17<16:12:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 38%|███▊ | 4724/12384 [10:01:17<16:11:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 38%|███▊ | 4724/12384 [10:01:25<16:11:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 38%|███▊ | 4725/12384 [10:01:25<16:13:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 38%|███▊ | 4725/12384 [10:01:32<16:13:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 38%|███▊ | 4726/12384 [10:01:32<16:13:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 38%|███▊ | 4726/12384 [10:01:40<16:13:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 2: 38%|███▊ | 4727/12384 [10:01:40<16:12:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 2: 38%|███▊ | 4727/12384 [10:01:47<16:12:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.26s]
Epoch 2: 38%|███▊ | 4728/12384 [10:01:47<16:11:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.26s]
Epoch 2: 38%|███▊ | 4728/12384 [10:01:55<16:11:31, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.27s]
Epoch 2: 38%|███▊ | 4729/12384 [10:01:55<16:11:19, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.27s]
Epoch 2: 38%|███▊ | 4729/12384 [10:02:03<16:11:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 2: 38%|███▊ | 4730/12384 [10:02:03<16:10:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 2: 38%|███▊ | 4730/12384 [10:02:10<16:10:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 38%|███▊ | 4731/12384 [10:02:10<16:11:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 38%|███▊ | 4731/12384 [10:02:18<16:11:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 38%|███▊ | 4732/12384 [10:02:18<16:18:32, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 38%|███▊ | 4732/12384 [10:02:26<16:18:32, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.45s]
Epoch 2: 38%|███▊ | 4733/12384 [10:02:26<16:28:07, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.45s]
Epoch 2: 38%|███▊ | 4733/12384 [10:02:34<16:28:07, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 38%|███▊ | 4734/12384 [10:02:34<16:23:21, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 38%|███▊ | 4734/12384 [10:02:41<16:23:21, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 2: 38%|███▊ | 4735/12384 [10:02:41<16:19:16, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 2: 38%|███▊ | 4735/12384 [10:02:49<16:19:16, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.10s]
Epoch 2: 38%|███▊ | 4736/12384 [10:02:49<16:16:45, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.10s]
Epoch 2: 38%|███▊ | 4736/12384 [10:02:56<16:16:45, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 38%|███▊ | 4737/12384 [10:02:56<16:14:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 38%|███▊ | 4737/12384 [10:03:04<16:14:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 2: 38%|███▊ | 4738/12384 [10:03:04<16:12:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 2: 38%|███▊ | 4738/12384 [10:03:12<16:12:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.82s]
Epoch 2: 38%|███▊ | 4739/12384 [10:03:12<16:11:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.82s]
Epoch 2: 38%|███▊ | 4739/12384 [10:03:19<16:11:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 38%|███▊ | 4740/12384 [10:03:19<16:10:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 38%|███▊ | 4740/12384 [10:03:27<16:10:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.10s]
Epoch 2: 38%|███▊ | 4741/12384 [10:03:27<16:10:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.10s]
Epoch 2: 38%|███▊ | 4741/12384 [10:03:34<16:10:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.15s]
Epoch 2: 38%|███▊ | 4742/12384 [10:03:34<16:10:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.15s]
Epoch 2: 38%|███▊ | 4742/12384 [10:03:42<16:10:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 38%|███▊ | 4743/12384 [10:03:42<16:10:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 38%|███▊ | 4743/12384 [10:03:50<16:10:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 38%|███▊ | 4744/12384 [10:03:50<16:10:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 38%|███▊ | 4744/12384 [10:03:57<16:10:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 38%|███▊ | 4745/12384 [10:03:57<16:10:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 38%|███▊ | 4745/12384 [10:04:05<16:10:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 2: 38%|███▊ | 4746/12384 [10:04:05<16:11:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 2: 38%|███▊ | 4746/12384 [10:04:13<16:11:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.93s]
Epoch 2: 38%|███▊ | 4747/12384 [10:04:13<16:09:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.93s]
Epoch 2: 38%|███▊ | 4747/12384 [10:04:20<16:09:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 2: 38%|███▊ | 4748/12384 [10:04:20<16:09:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 2: 38%|███▊ | 4748/12384 [10:04:28<16:09:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 2: 38%|███▊ | 4749/12384 [10:04:28<16:09:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 2: 38%|███▊ | 4749/12384 [10:04:35<16:09:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 2: 38%|███▊ | 4750/12384 [10:04:35<16:09:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 2: 38%|███▊ | 4750/12384 [10:04:43<16:09:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 38%|███▊ | 4751/12384 [10:04:43<16:10:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 38%|███▊ | 4751/12384 [10:04:51<16:10:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 38%|███▊ | 4752/12384 [10:04:51<16:10:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 38%|███▊ | 4752/12384 [10:04:58<16:10:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 38%|███▊ | 4753/12384 [10:04:58<16:08:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 38%|███▊ | 4753/12384 [10:05:06<16:08:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 38%|███▊ | 4754/12384 [10:05:06<16:10:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 38%|███▊ | 4754/12384 [10:05:14<16:10:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 38%|███▊ | 4755/12384 [10:05:14<16:09:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 38%|███▊ | 4755/12384 [10:05:21<16:09:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 38%|███▊ | 4756/12384 [10:05:21<16:09:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 38%|███▊ | 4756/12384 [10:05:29<16:09:07, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.06s]
Epoch 2: 38%|███▊ | 4757/12384 [10:05:29<16:07:27, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=5.06s]
Epoch 2: 38%|███▊ | 4757/12384 [10:05:36<16:07:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.12s]
Epoch 2: 38%|███▊ | 4758/12384 [10:05:36<16:07:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.12s]
Epoch 2: 38%|███▊ | 4758/12384 [10:05:44<16:07:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 38%|███▊ | 4759/12384 [10:05:44<16:07:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 38%|███▊ | 4759/12384 [10:05:52<16:07:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 2: 38%|███▊ | 4760/12384 [10:05:52<16:19:43, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 2: 38%|███▊ | 4760/12384 [10:06:00<16:19:43, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.47s]
Epoch 2: 38%|███▊ | 4761/12384 [10:06:00<16:16:48, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.47s]
Epoch 2: 38%|███▊ | 4761/12384 [10:06:07<16:16:48, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 2: 38%|███▊ | 4762/12384 [10:06:07<16:13:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 2: 38%|███▊ | 4762/12384 [10:06:15<16:13:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 2: 38%|███▊ | 4763/12384 [10:06:15<16:11:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 2: 38%|███▊ | 4763/12384 [10:06:22<16:11:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 2: 38%|███▊ | 4764/12384 [10:06:22<16:09:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 2: 38%|███▊ | 4764/12384 [10:06:30<16:09:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.31s]
Epoch 2: 38%|███▊ | 4765/12384 [10:06:30<16:17:48, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.31s]
Epoch 2: 38%|███▊ | 4765/12384 [10:06:38<16:17:48, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 38%|███▊ | 4766/12384 [10:06:38<16:13:47, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 38%|███▊ | 4766/12384 [10:06:45<16:13:47, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 38%|███▊ | 4767/12384 [10:06:45<16:11:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 38%|███▊ | 4767/12384 [10:06:53<16:11:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 39%|███▊ | 4768/12384 [10:06:53<16:09:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 39%|███▊ | 4768/12384 [10:07:01<16:09:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 39%|███▊ | 4769/12384 [10:07:01<16:08:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 39%|███▊ | 4769/12384 [10:07:08<16:08:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.55s]
Epoch 2: 39%|███▊ | 4770/12384 [10:07:08<16:07:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.55s]
Epoch 2: 39%|███▊ | 4770/12384 [10:07:16<16:07:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.67s]
Epoch 2: 39%|███▊ | 4771/12384 [10:07:16<16:06:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.67s]
Epoch 2: 39%|███▊ | 4771/12384 [10:07:23<16:06:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 39%|███▊ | 4772/12384 [10:07:23<16:05:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 39%|███▊ | 4772/12384 [10:07:31<16:05:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 39%|███▊ | 4773/12384 [10:07:31<16:05:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 39%|███▊ | 4773/12384 [10:07:39<16:05:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 39%|███▊ | 4774/12384 [10:07:39<16:05:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 39%|███▊ | 4774/12384 [10:07:46<16:05:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 39%|███▊ | 4775/12384 [10:07:46<16:07:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 39%|███▊ | 4775/12384 [10:07:54<16:07:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 39%|███▊ | 4776/12384 [10:07:54<16:06:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 39%|███▊ | 4776/12384 [10:08:02<16:06:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 39%|███▊ | 4777/12384 [10:08:02<16:06:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 39%|███▊ | 4777/12384 [10:08:09<16:06:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 39%|███▊ | 4778/12384 [10:08:09<16:06:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 39%|███▊ | 4778/12384 [10:08:17<16:06:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 39%|███▊ | 4779/12384 [10:08:17<16:05:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 39%|███▊ | 4779/12384 [10:08:24<16:05:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 39%|███▊ | 4780/12384 [10:08:24<16:04:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 39%|███▊ | 4780/12384 [10:08:32<16:04:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 39%|███▊ | 4781/12384 [10:08:32<16:03:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 39%|███▊ | 4781/12384 [10:08:40<16:03:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 39%|███▊ | 4782/12384 [10:08:40<16:03:33, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 39%|███▊ | 4782/12384 [10:08:47<16:03:33, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 39%|███▊ | 4783/12384 [10:08:47<16:02:43, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 39%|███▊ | 4783/12384 [10:08:55<16:02:43, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 39%|███▊ | 4784/12384 [10:08:55<16:05:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 39%|███▊ | 4784/12384 [10:09:02<16:05:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 39%|███▊ | 4785/12384 [10:09:02<16:04:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 39%|███▊ | 4785/12384 [10:09:10<16:04:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 39%|███▊ | 4786/12384 [10:09:10<16:18:16, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 39%|███▊ | 4786/12384 [10:09:18<16:18:16, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 39%|███▊ | 4787/12384 [10:09:18<16:12:56, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 39%|███▊ | 4787/12384 [10:09:26<16:12:56, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 39%|███▊ | 4788/12384 [10:09:26<16:10:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 39%|███▊ | 4788/12384 [10:09:33<16:10:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 2: 39%|███▊ | 4789/12384 [10:09:33<16:08:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 2: 39%|███▊ | 4789/12384 [10:09:41<16:08:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 2: 39%|███▊ | 4790/12384 [10:09:41<16:06:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 2: 39%|███▊ | 4790/12384 [10:09:48<16:06:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.21s]
Epoch 2: 39%|███▊ | 4791/12384 [10:09:48<16:05:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.21s]
Epoch 2: 39%|███▊ | 4791/12384 [10:09:56<16:05:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 2: 39%|███▊ | 4792/12384 [10:09:56<16:06:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 2: 39%|███▊ | 4792/12384 [10:10:04<16:06:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 2: 39%|███▊ | 4793/12384 [10:10:04<16:05:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 2: 39%|███▊ | 4793/12384 [10:10:11<16:05:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.88s]
Epoch 2: 39%|███▊ | 4794/12384 [10:10:11<16:04:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.88s]
Epoch 2: 39%|███▊ | 4794/12384 [10:10:19<16:04:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 2: 39%|███▊ | 4795/12384 [10:10:19<16:03:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 2: 39%|███▊ | 4795/12384 [10:10:27<16:03:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 2: 39%|███▊ | 4796/12384 [10:10:27<16:03:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 2: 39%|███▊ | 4796/12384 [10:10:34<16:03:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 2: 39%|███▊ | 4797/12384 [10:10:34<16:03:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 2: 39%|███▊ | 4797/12384 [10:10:42<16:03:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 2: 39%|███▊ | 4798/12384 [10:10:42<16:02:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 2: 39%|███▊ | 4798/12384 [10:10:49<16:02:32, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=8.56s]
Epoch 2: 39%|███▉ | 4799/12384 [10:10:49<16:01:41, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=8.56s]
Epoch 2: 39%|███▉ | 4799/12384 [10:10:57<16:01:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 39%|███▉ | 4800/12384 [10:10:57<16:02:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 39%|███▉ | 4800/12384 [10:11:05<16:02:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 39%|███▉ | 4801/12384 [10:11:05<16:02:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 39%|███▉ | 4801/12384 [10:11:12<16:02:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 39%|███▉ | 4802/12384 [10:11:12<16:01:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 39%|███▉ | 4802/12384 [10:11:20<16:01:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 2: 39%|███▉ | 4803/12384 [10:11:20<16:00:51, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 2: 39%|███▉ | 4803/12384 [10:11:27<16:00:51, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 39%|███▉ | 4804/12384 [10:11:27<16:00:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 39%|███▉ | 4804/12384 [10:11:35<16:00:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 2: 39%|███▉ | 4805/12384 [10:11:35<16:00:10, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 2: 39%|███▉ | 4805/12384 [10:11:43<16:00:10, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 2: 39%|███▉ | 4806/12384 [10:11:43<16:00:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 2: 39%|███▉ | 4806/12384 [10:11:50<16:00:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 2: 39%|███▉ | 4807/12384 [10:11:50<15:59:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 2: 39%|███▉ | 4807/12384 [10:11:58<15:59:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 39%|███▉ | 4808/12384 [10:11:58<15:59:16, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 39%|███▉ | 4808/12384 [10:12:05<15:59:16, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 39%|███▉ | 4809/12384 [10:12:05<16:02:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 39%|███▉ | 4809/12384 [10:12:13<16:02:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 39%|███▉ | 4810/12384 [10:12:13<16:01:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 39%|███▉ | 4810/12384 [10:12:21<16:01:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 39%|███▉ | 4811/12384 [10:12:21<16:01:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 39%|███▉ | 4811/12384 [10:12:28<16:01:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 2: 39%|███▉ | 4812/12384 [10:12:28<16:00:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 2: 39%|███▉ | 4812/12384 [10:12:36<16:00:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.45s]
Epoch 2: 39%|███▉ | 4813/12384 [10:12:36<16:12:47, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.45s]
Epoch 2: 39%|███▉ | 4813/12384 [10:12:44<16:12:47, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 39%|███▉ | 4814/12384 [10:12:44<16:09:05, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 39%|███▉ | 4814/12384 [10:12:51<16:09:05, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 39%|███▉ | 4815/12384 [10:12:51<16:05:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 39%|███▉ | 4815/12384 [10:12:59<16:05:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 39%|███▉ | 4816/12384 [10:12:59<16:04:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 39%|███▉ | 4816/12384 [10:13:07<16:04:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 39%|███▉ | 4817/12384 [10:13:07<16:02:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 39%|███▉ | 4817/12384 [10:13:15<16:02:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 39%|███▉ | 4818/12384 [10:13:15<16:13:27, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 39%|███▉ | 4818/12384 [10:13:22<16:13:27, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 39%|███▉ | 4819/12384 [10:13:22<16:08:39, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 39%|███▉ | 4819/12384 [10:13:30<16:08:39, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 2: 39%|███▉ | 4820/12384 [10:13:30<16:05:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 2: 39%|███▉ | 4820/12384 [10:13:37<16:05:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 2: 39%|███▉ | 4821/12384 [10:13:37<16:03:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 2: 39%|███▉ | 4821/12384 [10:13:45<16:03:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 39%|███▉ | 4822/12384 [10:13:45<16:01:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 39%|███▉ | 4822/12384 [10:13:53<16:01:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 2: 39%|███▉ | 4823/12384 [10:13:53<16:00:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 2: 39%|███▉ | 4823/12384 [10:14:00<16:00:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.24s]
Epoch 2: 39%|███▉ | 4824/12384 [10:14:00<16:00:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.24s]
Epoch 2: 39%|███▉ | 4824/12384 [10:14:08<16:00:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.32s]
Epoch 2: 39%|███▉ | 4825/12384 [10:14:08<15:59:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.32s]
Epoch 2: 39%|███▉ | 4825/12384 [10:14:15<15:59:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.24s]
Epoch 2: 39%|███▉ | 4826/12384 [10:14:15<16:00:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.24s]
Epoch 2: 39%|███▉ | 4826/12384 [10:14:23<16:00:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.44s]
Epoch 2: 39%|███▉ | 4827/12384 [10:14:23<15:59:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.44s]
Epoch 2: 39%|███▉ | 4827/12384 [10:14:31<15:59:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 2: 39%|███▉ | 4828/12384 [10:14:31<15:58:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 2: 39%|███▉ | 4828/12384 [10:14:38<15:58:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 39%|███▉ | 4829/12384 [10:14:38<15:59:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 39%|███▉ | 4829/12384 [10:14:46<15:59:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 2: 39%|███▉ | 4830/12384 [10:14:46<15:58:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 2: 39%|███▉ | 4830/12384 [10:14:53<15:58:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 2: 39%|███▉ | 4831/12384 [10:14:53<15:57:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 2: 39%|███▉ | 4831/12384 [10:15:01<15:57:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.99s]
Epoch 2: 39%|███▉ | 4832/12384 [10:15:01<15:57:08, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.99s]
Epoch 2: 39%|███▉ | 4832/12384 [10:15:09<15:57:08, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 39%|███▉ | 4833/12384 [10:15:09<15:56:45, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 39%|███▉ | 4833/12384 [10:15:16<15:56:45, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 2: 39%|███▉ | 4834/12384 [10:15:16<16:00:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 2: 39%|███▉ | 4834/12384 [10:15:24<16:00:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.27s]
Epoch 2: 39%|███▉ | 4835/12384 [10:15:24<15:58:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.27s]
Epoch 2: 39%|███▉ | 4835/12384 [10:15:32<15:58:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 39%|███▉ | 4836/12384 [10:15:32<15:57:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 39%|███▉ | 4836/12384 [10:15:39<15:57:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.39s]
Epoch 2: 39%|███▉ | 4837/12384 [10:15:39<15:57:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.39s]
Epoch 2: 39%|███▉ | 4837/12384 [10:15:47<15:57:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.83s]
Epoch 2: 39%|███▉ | 4838/12384 [10:15:47<15:57:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.83s]
Epoch 2: 39%|███▉ | 4838/12384 [10:15:55<15:57:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 2: 39%|███▉ | 4839/12384 [10:15:55<16:11:14, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 2: 39%|███▉ | 4839/12384 [10:16:02<16:11:14, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.33s]
Epoch 2: 39%|███▉ | 4840/12384 [10:16:02<16:07:28, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.33s]
Epoch 2: 39%|███▉ | 4840/12384 [10:16:10<16:07:28, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.01s]
Epoch 2: 39%|███▉ | 4841/12384 [10:16:10<16:04:31, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.01s]
Epoch 2: 39%|███▉ | 4841/12384 [10:16:18<16:04:31, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 2: 39%|███▉ | 4842/12384 [10:16:18<16:01:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 2: 39%|███▉ | 4842/12384 [10:16:25<16:01:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 39%|███▉ | 4843/12384 [10:16:25<16:01:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 39%|███▉ | 4843/12384 [10:16:33<16:01:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 39%|███▉ | 4844/12384 [10:16:33<15:59:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 39%|███▉ | 4844/12384 [10:16:40<15:59:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 2: 39%|███▉ | 4845/12384 [10:16:40<15:57:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 2: 39%|███▉ | 4845/12384 [10:16:48<15:57:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 39%|███▉ | 4846/12384 [10:16:48<15:56:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 39%|███▉ | 4846/12384 [10:16:56<15:56:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 2: 39%|███▉ | 4847/12384 [10:16:56<15:56:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 2: 39%|███▉ | 4847/12384 [10:17:03<15:56:38, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.99s]
Epoch 2: 39%|███▉ | 4848/12384 [10:17:03<15:56:08, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.99s]
Epoch 2: 39%|███▉ | 4848/12384 [10:17:11<15:56:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 39%|███▉ | 4849/12384 [10:17:11<15:56:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 39%|███▉ | 4849/12384 [10:17:19<15:56:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.89s]
Epoch 2: 39%|███▉ | 4850/12384 [10:17:19<15:56:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.89s]
Epoch 2: 39%|███▉ | 4850/12384 [10:17:26<15:56:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 2: 39%|███▉ | 4851/12384 [10:17:26<15:56:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 2: 39%|███▉ | 4851/12384 [10:17:34<15:56:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.34s]
Epoch 2: 39%|███▉ | 4852/12384 [10:17:34<15:56:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.34s]
Epoch 2: 39%|███▉ | 4852/12384 [10:17:41<15:56:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 2: 39%|███▉ | 4853/12384 [10:17:41<15:56:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 2: 39%|███▉ | 4853/12384 [10:17:49<15:56:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 2: 39%|███▉ | 4854/12384 [10:17:49<15:56:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 2: 39%|███▉ | 4854/12384 [10:17:57<15:56:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 2: 39%|███▉ | 4855/12384 [10:17:57<15:54:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 2: 39%|███▉ | 4855/12384 [10:18:04<15:54:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 39%|███▉ | 4856/12384 [10:18:04<15:54:05, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 39%|███▉ | 4856/12384 [10:18:12<15:54:05, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 39%|███▉ | 4857/12384 [10:18:12<15:53:45, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 39%|███▉ | 4857/12384 [10:18:19<15:53:45, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 2: 39%|███▉ | 4858/12384 [10:18:19<15:53:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 2: 39%|███▉ | 4858/12384 [10:18:27<15:53:26, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 2: 39%|███▉ | 4859/12384 [10:18:27<15:53:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 2: 39%|███▉ | 4859/12384 [10:18:35<15:53:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 2: 39%|███▉ | 4860/12384 [10:18:35<15:52:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 2: 39%|███▉ | 4860/12384 [10:18:42<15:52:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 2: 39%|███▉ | 4861/12384 [10:18:42<15:54:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 2: 39%|███▉ | 4861/12384 [10:18:50<15:54:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 2: 39%|███▉ | 4862/12384 [10:18:50<15:55:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 2: 39%|███▉ | 4862/12384 [10:18:57<15:55:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 2: 39%|███▉ | 4863/12384 [10:18:57<15:53:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 2: 39%|███▉ | 4863/12384 [10:19:05<15:53:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 39%|███▉ | 4864/12384 [10:19:05<15:54:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 39%|███▉ | 4864/12384 [10:19:13<15:54:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 39%|███▉ | 4865/12384 [10:19:13<16:05:53, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 39%|███▉ | 4865/12384 [10:19:21<16:05:53, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 39%|███▉ | 4866/12384 [10:19:21<16:01:05, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 39%|███▉ | 4866/12384 [10:19:28<16:01:05, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 39%|███▉ | 4867/12384 [10:19:28<15:58:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 39%|███▉ | 4867/12384 [10:19:36<15:58:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 2: 39%|███▉ | 4868/12384 [10:19:36<15:56:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 2: 39%|███▉ | 4868/12384 [10:19:43<15:56:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 2: 39%|███▉ | 4869/12384 [10:19:43<15:56:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 2: 39%|███▉ | 4869/12384 [10:19:51<15:56:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 39%|███▉ | 4870/12384 [10:19:51<15:55:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 39%|███▉ | 4870/12384 [10:19:59<15:55:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 39%|███▉ | 4871/12384 [10:19:59<16:04:52, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 39%|███▉ | 4871/12384 [10:20:07<16:04:52, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 39%|███▉ | 4872/12384 [10:20:07<16:01:21, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 39%|███▉ | 4872/12384 [10:20:14<16:01:21, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 39%|███▉ | 4873/12384 [10:20:14<15:58:28, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 39%|███▉ | 4873/12384 [10:20:22<15:58:28, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 39%|███▉ | 4874/12384 [10:20:22<15:56:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 39%|███▉ | 4874/12384 [10:20:29<15:56:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 39%|███▉ | 4875/12384 [10:20:29<15:55:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 39%|███▉ | 4875/12384 [10:20:37<15:55:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.77s]
Epoch 2: 39%|███▉ | 4876/12384 [10:20:37<15:55:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.77s]
Epoch 2: 39%|███▉ | 4876/12384 [10:20:45<15:55:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 2: 39%|███▉ | 4877/12384 [10:20:45<15:54:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 2: 39%|███▉ | 4877/12384 [10:20:52<15:54:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 39%|███▉ | 4878/12384 [10:20:52<15:56:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 39%|███▉ | 4878/12384 [10:21:00<15:56:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.19s]
Epoch 2: 39%|███▉ | 4879/12384 [10:21:00<15:54:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.19s]
Epoch 2: 39%|███▉ | 4879/12384 [10:21:08<15:54:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 2: 39%|███▉ | 4880/12384 [10:21:08<15:54:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 2: 39%|███▉ | 4880/12384 [10:21:15<15:54:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.37s]
Epoch 2: 39%|███▉ | 4881/12384 [10:21:15<15:52:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.37s]
Epoch 2: 39%|███▉ | 4881/12384 [10:21:23<15:52:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.29s]
Epoch 2: 39%|███▉ | 4882/12384 [10:21:23<15:52:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.29s]
Epoch 2: 39%|███▉ | 4882/12384 [10:21:30<15:52:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 39%|███▉ | 4883/12384 [10:21:30<15:51:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 39%|███▉ | 4883/12384 [10:21:38<15:51:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 39%|███▉ | 4884/12384 [10:21:38<15:51:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 39%|███▉ | 4884/12384 [10:21:46<15:51:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 39%|███▉ | 4885/12384 [10:21:46<15:51:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 39%|███▉ | 4885/12384 [10:21:53<15:51:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 2: 39%|███▉ | 4886/12384 [10:21:53<15:50:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 2: 39%|███▉ | 4886/12384 [10:22:01<15:50:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.14s]
Epoch 2: 39%|███▉ | 4887/12384 [10:22:01<15:50:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.14s]
Epoch 2: 39%|███▉ | 4887/12384 [10:22:08<15:50:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 2: 39%|███▉ | 4888/12384 [10:22:08<15:49:50, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 2: 39%|███▉ | 4888/12384 [10:22:16<15:49:50, 7.60s/it, loss=0.0002, acc=1.0000, iter_time=7.19s]
Epoch 2: 39%|███▉ | 4889/12384 [10:22:16<15:50:39, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.19s]
Epoch 2: 39%|███▉ | 4889/12384 [10:22:24<15:50:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 39%|███▉ | 4890/12384 [10:22:24<15:50:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 39%|███▉ | 4890/12384 [10:22:31<15:50:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 39%|███▉ | 4891/12384 [10:22:31<16:01:11, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 39%|███▉ | 4891/12384 [10:22:39<16:01:11, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 40%|███▉ | 4892/12384 [10:22:39<15:57:14, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 40%|███▉ | 4892/12384 [10:22:47<15:57:14, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 40%|███▉ | 4893/12384 [10:22:47<15:57:48, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 40%|███▉ | 4893/12384 [10:22:54<15:57:48, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 40%|███▉ | 4894/12384 [10:22:54<15:55:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 40%|███▉ | 4894/12384 [10:23:02<15:55:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 2: 40%|███▉ | 4895/12384 [10:23:02<15:52:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 2: 40%|███▉ | 4895/12384 [10:23:10<15:52:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 40%|███▉ | 4896/12384 [10:23:10<15:52:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 40%|███▉ | 4896/12384 [10:23:17<15:52:05, 7.63s/it, loss=0.0005, acc=0.9990, iter_time=6.53s]
Epoch 2: 40%|███▉ | 4897/12384 [10:23:17<15:51:46, 7.63s/it, loss=0.0005, acc=0.9990, iter_time=6.53s]
Epoch 2: 40%|███▉ | 4897/12384 [10:23:25<15:51:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 2: 40%|███▉ | 4898/12384 [10:23:25<15:51:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 2: 40%|███▉ | 4898/12384 [10:23:32<15:51:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 40%|███▉ | 4899/12384 [10:23:32<15:50:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 40%|███▉ | 4899/12384 [10:23:40<15:50:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 40%|███▉ | 4900/12384 [10:23:40<15:50:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 40%|███▉ | 4900/12384 [10:23:48<15:50:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 40%|███▉ | 4901/12384 [10:23:48<15:49:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 40%|███▉ | 4901/12384 [10:23:55<15:49:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 40%|███▉ | 4902/12384 [10:23:55<15:49:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 40%|███▉ | 4902/12384 [10:24:03<15:49:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 2: 40%|███▉ | 4903/12384 [10:24:03<15:48:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 2: 40%|███▉ | 4903/12384 [10:24:10<15:48:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 2: 40%|███▉ | 4904/12384 [10:24:10<15:49:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 2: 40%|███▉ | 4904/12384 [10:24:18<15:49:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 2: 40%|███▉ | 4905/12384 [10:24:18<15:48:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 2: 40%|███▉ | 4905/12384 [10:24:26<15:48:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 40%|███▉ | 4906/12384 [10:24:26<15:48:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 40%|███▉ | 4906/12384 [10:24:33<15:48:00, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 2: 40%|███▉ | 4907/12384 [10:24:33<15:47:21, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 2: 40%|███▉ | 4907/12384 [10:24:41<15:47:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 40%|███▉ | 4908/12384 [10:24:41<15:47:16, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 40%|███▉ | 4908/12384 [10:24:49<15:47:16, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 40%|███▉ | 4909/12384 [10:24:49<15:47:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 40%|███▉ | 4909/12384 [10:24:56<15:47:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 40%|███▉ | 4910/12384 [10:24:56<15:47:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 40%|███▉ | 4910/12384 [10:25:04<15:47:09, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 2: 40%|███▉ | 4911/12384 [10:25:04<15:47:09, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 2: 40%|███▉ | 4911/12384 [10:25:11<15:47:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 40%|███▉ | 4912/12384 [10:25:11<15:47:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 40%|███▉ | 4912/12384 [10:25:19<15:47:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 40%|███▉ | 4913/12384 [10:25:19<15:49:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 40%|███▉ | 4913/12384 [10:25:27<15:49:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 40%|███▉ | 4914/12384 [10:25:27<15:48:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 40%|███▉ | 4914/12384 [10:25:34<15:48:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 40%|███▉ | 4915/12384 [10:25:34<15:48:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 40%|███▉ | 4915/12384 [10:25:42<15:48:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.73s]
Epoch 2: 40%|███▉ | 4916/12384 [10:25:42<15:46:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.73s]
Epoch 2: 40%|███▉ | 4916/12384 [10:25:50<15:46:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 40%|███▉ | 4917/12384 [10:25:50<15:58:57, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 40%|███▉ | 4917/12384 [10:25:57<15:58:57, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=11.20s]
Epoch 2: 40%|███▉ | 4918/12384 [10:25:57<15:54:41, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=11.20s]
Epoch 2: 40%|███▉ | 4918/12384 [10:26:05<15:54:41, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 40%|███▉ | 4919/12384 [10:26:05<15:52:52, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 40%|███▉ | 4919/12384 [10:26:13<15:52:52, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 40%|███▉ | 4920/12384 [10:26:13<15:51:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 40%|███▉ | 4920/12384 [10:26:20<15:51:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 40%|███▉ | 4921/12384 [10:26:20<15:53:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 40%|███▉ | 4921/12384 [10:26:28<15:53:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 40%|███▉ | 4922/12384 [10:26:28<15:50:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 40%|███▉ | 4922/12384 [10:26:36<15:50:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 40%|███▉ | 4923/12384 [10:26:36<15:59:34, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 40%|███▉ | 4923/12384 [10:26:43<15:59:34, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=4.72s]
Epoch 2: 40%|███▉ | 4924/12384 [10:26:43<15:57:24, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.72s]
Epoch 2: 40%|███▉ | 4924/12384 [10:26:51<15:57:24, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.52s]
Epoch 2: 40%|███▉ | 4925/12384 [10:26:51<15:53:22, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.52s]
Epoch 2: 40%|███▉ | 4925/12384 [10:26:59<15:53:22, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 40%|███▉ | 4926/12384 [10:26:59<15:50:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 40%|███▉ | 4926/12384 [10:27:06<15:50:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 40%|███▉ | 4927/12384 [10:27:06<15:48:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 40%|███▉ | 4927/12384 [10:27:14<15:48:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 2: 40%|███▉ | 4928/12384 [10:27:14<15:48:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 2: 40%|███▉ | 4928/12384 [10:27:21<15:48:25, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 2: 40%|███▉ | 4929/12384 [10:27:21<15:46:52, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 2: 40%|███▉ | 4929/12384 [10:27:29<15:46:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 40%|███▉ | 4930/12384 [10:27:29<15:46:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 40%|███▉ | 4930/12384 [10:27:37<15:46:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 40%|███▉ | 4931/12384 [10:27:37<15:47:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 40%|███▉ | 4931/12384 [10:27:44<15:47:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 2: 40%|███▉ | 4932/12384 [10:27:44<15:47:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 2: 40%|███▉ | 4932/12384 [10:27:52<15:47:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 40%|███▉ | 4933/12384 [10:27:52<15:46:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 40%|███▉ | 4933/12384 [10:28:00<15:46:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 2: 40%|███▉ | 4934/12384 [10:28:00<15:45:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 2: 40%|███▉ | 4934/12384 [10:28:07<15:45:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 40%|███▉ | 4935/12384 [10:28:07<15:45:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 40%|███▉ | 4935/12384 [10:28:15<15:45:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.11s]
Epoch 2: 40%|███▉ | 4936/12384 [10:28:15<15:45:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.11s]
Epoch 2: 40%|███▉ | 4936/12384 [10:28:22<15:45:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 40%|███▉ | 4937/12384 [10:28:22<15:45:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 40%|███▉ | 4937/12384 [10:28:30<15:45:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 40%|███▉ | 4938/12384 [10:28:30<15:46:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 40%|███▉ | 4938/12384 [10:28:38<15:46:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 40%|███▉ | 4939/12384 [10:28:38<15:45:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 40%|███▉ | 4939/12384 [10:28:45<15:45:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 2: 40%|███▉ | 4940/12384 [10:28:45<15:44:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 2: 40%|███▉ | 4940/12384 [10:28:53<15:44:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 2: 40%|███▉ | 4941/12384 [10:28:53<15:44:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 2: 40%|███▉ | 4941/12384 [10:29:00<15:44:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 40%|███▉ | 4942/12384 [10:29:00<15:44:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 40%|███▉ | 4942/12384 [10:29:08<15:44:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 40%|███▉ | 4943/12384 [10:29:08<15:43:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 40%|███▉ | 4943/12384 [10:29:16<15:43:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 2: 40%|███▉ | 4944/12384 [10:29:16<15:55:40, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 2: 40%|███▉ | 4944/12384 [10:29:24<15:55:40, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.16s]
Epoch 2: 40%|███▉ | 4945/12384 [10:29:24<15:51:57, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.16s]
Epoch 2: 40%|███▉ | 4945/12384 [10:29:31<15:51:57, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 40%|███▉ | 4946/12384 [10:29:31<15:48:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 40%|███▉ | 4946/12384 [10:29:39<15:48:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 2: 40%|███▉ | 4947/12384 [10:29:39<15:46:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 2: 40%|███▉ | 4947/12384 [10:29:46<15:46:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 2: 40%|███▉ | 4948/12384 [10:29:46<15:46:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 2: 40%|███▉ | 4948/12384 [10:29:54<15:46:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 40%|███▉ | 4949/12384 [10:29:54<15:54:20, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 40%|███▉ | 4949/12384 [10:30:02<15:54:20, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 2: 40%|███▉ | 4950/12384 [10:30:02<15:51:10, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 2: 40%|███▉ | 4950/12384 [10:30:10<15:51:10, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 2: 40%|███▉ | 4951/12384 [10:30:10<15:48:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 2: 40%|███▉ | 4951/12384 [10:30:17<15:48:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 40%|███▉ | 4952/12384 [10:30:17<15:46:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 40%|███▉ | 4952/12384 [10:30:25<15:46:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.70s]
Epoch 2: 40%|███▉ | 4953/12384 [10:30:25<15:45:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.70s]
Epoch 2: 40%|███▉ | 4953/12384 [10:30:32<15:45:52, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.59s]
Epoch 2: 40%|████ | 4954/12384 [10:30:32<15:45:05, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.59s]
Epoch 2: 40%|████ | 4954/12384 [10:30:40<15:45:05, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=10.17s]
Epoch 2: 40%|████ | 4955/12384 [10:30:40<15:44:30, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=10.17s]
Epoch 2: 40%|████ | 4955/12384 [10:30:48<15:44:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 40%|████ | 4956/12384 [10:30:48<15:43:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 40%|████ | 4956/12384 [10:30:55<15:43:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 2: 40%|████ | 4957/12384 [10:30:55<15:44:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 2: 40%|████ | 4957/12384 [10:31:03<15:44:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 2: 40%|████ | 4958/12384 [10:31:03<15:42:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 2: 40%|████ | 4958/12384 [10:31:10<15:42:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 40%|████ | 4959/12384 [10:31:10<15:42:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 40%|████ | 4959/12384 [10:31:18<15:42:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 40%|████ | 4960/12384 [10:31:18<15:42:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 40%|████ | 4960/12384 [10:31:26<15:42:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 40%|████ | 4961/12384 [10:31:26<15:41:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 40%|████ | 4961/12384 [10:31:33<15:41:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 40%|████ | 4962/12384 [10:31:33<15:43:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 40%|████ | 4962/12384 [10:31:41<15:43:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 2: 40%|████ | 4963/12384 [10:31:41<15:42:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 2: 40%|████ | 4963/12384 [10:31:49<15:42:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.64s]
Epoch 2: 40%|████ | 4964/12384 [10:31:49<15:41:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.64s]
Epoch 2: 40%|████ | 4964/12384 [10:31:56<15:41:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 2: 40%|████ | 4965/12384 [10:31:56<15:42:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 2: 40%|████ | 4965/12384 [10:32:04<15:42:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.27s]
Epoch 2: 40%|████ | 4966/12384 [10:32:04<15:41:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.27s]
Epoch 2: 40%|████ | 4966/12384 [10:32:11<15:41:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.62s]
Epoch 2: 40%|████ | 4967/12384 [10:32:11<15:41:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.62s]
Epoch 2: 40%|████ | 4967/12384 [10:32:19<15:41:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.34s]
Epoch 2: 40%|████ | 4968/12384 [10:32:19<15:41:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.34s]
Epoch 2: 40%|████ | 4968/12384 [10:32:27<15:41:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.89s]
Epoch 2: 40%|████ | 4969/12384 [10:32:27<15:40:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.89s]
Epoch 2: 40%|████ | 4969/12384 [10:32:35<15:40:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.99s]
Epoch 2: 40%|████ | 4970/12384 [10:32:35<15:53:19, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.99s]
Epoch 2: 40%|████ | 4970/12384 [10:32:42<15:53:19, 7.72s/it, loss=0.0007, acc=0.9992, iter_time=7.91s]
Epoch 2: 40%|████ | 4971/12384 [10:32:42<15:48:51, 7.68s/it, loss=0.0007, acc=0.9992, iter_time=7.91s]
Epoch 2: 40%|████ | 4971/12384 [10:32:50<15:48:51, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 2: 40%|████ | 4972/12384 [10:32:50<15:46:39, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 2: 40%|████ | 4972/12384 [10:32:57<15:46:39, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 2: 40%|████ | 4973/12384 [10:32:57<15:44:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 2: 40%|████ | 4973/12384 [10:33:05<15:44:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 2: 40%|████ | 4974/12384 [10:33:05<15:43:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 2: 40%|████ | 4974/12384 [10:33:13<15:43:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 40%|████ | 4975/12384 [10:33:13<15:41:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 40%|████ | 4975/12384 [10:33:21<15:41:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 2: 40%|████ | 4976/12384 [10:33:21<15:52:33, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 2: 40%|████ | 4976/12384 [10:33:28<15:52:33, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 40%|████ | 4977/12384 [10:33:28<15:49:08, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 40%|████ | 4977/12384 [10:33:36<15:49:08, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 40%|████ | 4978/12384 [10:33:36<15:46:31, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 40%|████ | 4978/12384 [10:33:43<15:46:31, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.89s]
Epoch 2: 40%|████ | 4979/12384 [10:33:43<15:43:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.89s]
Epoch 2: 40%|████ | 4979/12384 [10:33:51<15:43:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.31s]
Epoch 2: 40%|████ | 4980/12384 [10:33:51<15:42:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.31s]
Epoch 2: 40%|████ | 4980/12384 [10:33:59<15:42:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 40%|████ | 4981/12384 [10:33:59<15:40:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 40%|████ | 4981/12384 [10:34:06<15:40:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 40%|████ | 4982/12384 [10:34:06<15:40:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 40%|████ | 4982/12384 [10:34:14<15:40:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.90s]
Epoch 2: 40%|████ | 4983/12384 [10:34:14<15:39:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.90s]
Epoch 2: 40%|████ | 4983/12384 [10:34:21<15:39:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 2: 40%|████ | 4984/12384 [10:34:21<15:38:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 2: 40%|████ | 4984/12384 [10:34:29<15:38:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.60s]
Epoch 2: 40%|████ | 4985/12384 [10:34:29<15:39:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.60s]
Epoch 2: 40%|████ | 4985/12384 [10:34:37<15:39:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.14s]
Epoch 2: 40%|████ | 4986/12384 [10:34:37<15:38:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.14s]
Epoch 2: 40%|████ | 4986/12384 [10:34:44<15:38:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.70s]
Epoch 2: 40%|████ | 4987/12384 [10:34:44<15:37:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.70s]
Epoch 2: 40%|████ | 4987/12384 [10:34:52<15:37:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 40%|████ | 4988/12384 [10:34:52<15:37:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 40%|████ | 4988/12384 [10:34:59<15:37:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 2: 40%|████ | 4989/12384 [10:34:59<15:38:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 2: 40%|████ | 4989/12384 [10:35:07<15:38:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.25s]
Epoch 2: 40%|████ | 4990/12384 [10:35:07<15:37:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.25s]
Epoch 2: 40%|████ | 4990/12384 [10:35:15<15:37:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 2: 40%|████ | 4991/12384 [10:35:15<15:37:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 2: 40%|████ | 4991/12384 [10:35:22<15:37:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 40%|████ | 4992/12384 [10:35:22<15:40:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 40%|████ | 4992/12384 [10:35:30<15:40:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 2: 40%|████ | 4993/12384 [10:35:30<15:39:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 2: 40%|████ | 4993/12384 [10:35:38<15:39:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.73s]
Epoch 2: 40%|████ | 4994/12384 [10:35:38<15:39:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.73s]
Epoch 2: 40%|████ | 4994/12384 [10:35:45<15:39:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 2: 40%|████ | 4995/12384 [10:35:45<15:38:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 2: 40%|████ | 4995/12384 [10:35:53<15:38:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.17s]
Epoch 2: 40%|████ | 4996/12384 [10:35:53<15:36:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.17s]
Epoch 2: 40%|████ | 4996/12384 [10:36:01<15:36:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=12.03s]
Epoch 2: 40%|████ | 4997/12384 [10:36:01<15:48:12, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=12.03s]
Epoch 2: 40%|████ | 4997/12384 [10:36:08<15:48:12, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 40%|████ | 4998/12384 [10:36:08<15:44:31, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 40%|████ | 4998/12384 [10:36:16<15:44:31, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 2: 40%|████ | 4999/12384 [10:36:16<15:43:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 2: 40%|████ | 4999/12384 [10:36:24<15:43:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 40%|████ | 5000/12384 [10:36:24<15:40:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 40%|████ | 5000/12384 [10:36:31<15:40:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 40%|████ | 5001/12384 [10:36:31<15:39:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 40%|████ | 5001/12384 [10:36:39<15:39:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.39s]
Epoch 2: 40%|████ | 5002/12384 [10:36:39<15:38:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.39s]
Epoch 2: 40%|████ | 5002/12384 [10:36:46<15:38:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.08s]
Epoch 2: 40%|████ | 5003/12384 [10:36:46<15:37:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.08s]
Epoch 2: 40%|████ | 5003/12384 [10:36:54<15:37:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.86s]
Epoch 2: 40%|████ | 5004/12384 [10:36:54<15:37:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.86s]
Epoch 2: 40%|████ | 5004/12384 [10:37:02<15:37:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 2: 40%|████ | 5005/12384 [10:37:02<15:37:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 2: 40%|████ | 5005/12384 [10:37:09<15:37:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.18s]
Epoch 2: 40%|████ | 5006/12384 [10:37:09<15:36:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.18s]
Epoch 2: 40%|████ | 5006/12384 [10:37:17<15:36:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 40%|████ | 5007/12384 [10:37:17<15:37:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 40%|████ | 5007/12384 [10:37:24<15:37:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 2: 40%|████ | 5008/12384 [10:37:24<15:37:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 2: 40%|████ | 5008/12384 [10:37:32<15:37:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 40%|████ | 5009/12384 [10:37:32<15:36:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 40%|████ | 5009/12384 [10:37:40<15:36:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 40%|████ | 5010/12384 [10:37:40<15:34:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 40%|████ | 5010/12384 [10:37:47<15:34:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 40%|████ | 5011/12384 [10:37:47<15:34:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 40%|████ | 5011/12384 [10:37:55<15:34:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 2: 40%|████ | 5012/12384 [10:37:55<15:35:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 2: 40%|████ | 5012/12384 [10:38:03<15:35:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.49s]
Epoch 2: 40%|████ | 5013/12384 [10:38:03<15:34:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.49s]
Epoch 2: 40%|████ | 5013/12384 [10:38:10<15:34:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 40%|████ | 5014/12384 [10:38:10<15:34:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 40%|████ | 5014/12384 [10:38:18<15:34:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 2: 40%|████ | 5015/12384 [10:38:18<15:34:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 2: 40%|████ | 5015/12384 [10:38:25<15:34:35, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=9.22s]
Epoch 2: 41%|████ | 5016/12384 [10:38:25<15:34:08, 7.61s/it, loss=0.0001, acc=0.9998, iter_time=9.22s]
Epoch 2: 41%|████ | 5016/12384 [10:38:33<15:34:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.28s]
Epoch 2: 41%|████ | 5017/12384 [10:38:33<15:34:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.28s]
Epoch 2: 41%|████ | 5017/12384 [10:38:41<15:34:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 2: 41%|████ | 5018/12384 [10:38:41<15:34:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 2: 41%|████ | 5018/12384 [10:38:48<15:34:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 41%|████ | 5019/12384 [10:38:48<15:35:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 41%|████ | 5019/12384 [10:38:56<15:35:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 41%|████ | 5020/12384 [10:38:56<15:34:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 41%|████ | 5020/12384 [10:39:03<15:34:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 2: 41%|████ | 5021/12384 [10:39:03<15:35:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 2: 41%|████ | 5021/12384 [10:39:11<15:35:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.92s]
Epoch 2: 41%|████ | 5022/12384 [10:39:11<15:35:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.92s]
Epoch 2: 41%|████ | 5022/12384 [10:39:19<15:35:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 2: 41%|████ | 5023/12384 [10:39:19<15:47:01, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 2: 41%|████ | 5023/12384 [10:39:27<15:47:01, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=11.14s]
Epoch 2: 41%|████ | 5024/12384 [10:39:27<15:44:20, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=11.14s]
Epoch 2: 41%|████ | 5024/12384 [10:39:34<15:44:20, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 41%|████ | 5025/12384 [10:39:34<15:41:18, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 41%|████ | 5025/12384 [10:39:42<15:41:18, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 2: 41%|████ | 5026/12384 [10:39:42<15:37:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 2: 41%|████ | 5026/12384 [10:39:49<15:37:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.68s]
Epoch 2: 41%|████ | 5027/12384 [10:39:49<15:36:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.68s]
Epoch 2: 41%|████ | 5027/12384 [10:39:57<15:36:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 41%|████ | 5028/12384 [10:39:57<15:34:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 41%|████ | 5028/12384 [10:40:05<15:34:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 41%|████ | 5029/12384 [10:40:05<15:45:17, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 41%|████ | 5029/12384 [10:40:13<15:45:17, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 2: 41%|████ | 5030/12384 [10:40:13<15:41:19, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 2: 41%|████ | 5030/12384 [10:40:20<15:41:19, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.49s]
Epoch 2: 41%|████ | 5031/12384 [10:40:20<15:41:01, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.49s]
Epoch 2: 41%|████ | 5031/12384 [10:40:28<15:41:01, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 41%|████ | 5032/12384 [10:40:28<15:37:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 41%|████ | 5032/12384 [10:40:35<15:37:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 41%|████ | 5033/12384 [10:40:35<15:35:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 41%|████ | 5033/12384 [10:40:43<15:35:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 41%|████ | 5034/12384 [10:40:43<15:35:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 41%|████ | 5034/12384 [10:40:51<15:35:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 41%|████ | 5035/12384 [10:40:51<15:34:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 41%|████ | 5035/12384 [10:40:58<15:34:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 41%|████ | 5036/12384 [10:40:58<15:32:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 41%|████ | 5036/12384 [10:41:06<15:32:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 41%|████ | 5037/12384 [10:41:06<15:32:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 41%|████ | 5037/12384 [10:41:14<15:32:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.05s]
Epoch 2: 41%|████ | 5038/12384 [10:41:14<15:31:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.05s]
Epoch 2: 41%|████ | 5038/12384 [10:41:21<15:31:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.81s]
Epoch 2: 41%|████ | 5039/12384 [10:41:21<15:30:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.81s]
Epoch 2: 41%|████ | 5039/12384 [10:41:29<15:30:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 2: 41%|████ | 5040/12384 [10:41:29<15:30:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 2: 41%|████ | 5040/12384 [10:41:36<15:30:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 2: 41%|████ | 5041/12384 [10:41:36<15:30:08, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 2: 41%|████ | 5041/12384 [10:41:44<15:30:08, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 2: 41%|████ | 5042/12384 [10:41:44<15:30:02, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 2: 41%|████ | 5042/12384 [10:41:52<15:30:02, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 41%|████ | 5043/12384 [10:41:52<15:30:14, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 41%|████ | 5043/12384 [10:41:59<15:30:14, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 2: 41%|████ | 5044/12384 [10:41:59<15:29:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 2: 41%|████ | 5044/12384 [10:42:07<15:29:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.43s]
Epoch 2: 41%|████ | 5045/12384 [10:42:07<15:28:40, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=8.43s]
Epoch 2: 41%|████ | 5045/12384 [10:42:14<15:28:40, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 41%|████ | 5046/12384 [10:42:14<15:30:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 41%|████ | 5046/12384 [10:42:22<15:30:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 41%|████ | 5047/12384 [10:42:22<15:34:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 41%|████ | 5047/12384 [10:42:30<15:34:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 41%|████ | 5048/12384 [10:42:30<15:33:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 41%|████ | 5048/12384 [10:42:38<15:33:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 2: 41%|████ | 5049/12384 [10:42:38<15:44:24, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 2: 41%|████ | 5049/12384 [10:42:45<15:44:24, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=9.79s]
Epoch 2: 41%|████ | 5050/12384 [10:42:45<15:43:23, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.79s]
Epoch 2: 41%|████ | 5050/12384 [10:42:53<15:43:23, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 41%|████ | 5051/12384 [10:42:53<15:39:31, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 41%|████ | 5051/12384 [10:43:01<15:39:31, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.63s]
Epoch 2: 41%|████ | 5052/12384 [10:43:01<15:36:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.63s]
Epoch 2: 41%|████ | 5052/12384 [10:43:08<15:36:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.38s]
Epoch 2: 41%|████ | 5053/12384 [10:43:08<15:34:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.38s]
Epoch 2: 41%|████ | 5053/12384 [10:43:16<15:34:30, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.82s]
Epoch 2: 41%|████ | 5054/12384 [10:43:16<15:32:13, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.82s]
Epoch 2: 41%|████ | 5054/12384 [10:43:23<15:32:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.56s]
Epoch 2: 41%|████ | 5055/12384 [10:43:23<15:31:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.56s]
Epoch 2: 41%|████ | 5055/12384 [10:43:31<15:31:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.60s]
Epoch 2: 41%|████ | 5056/12384 [10:43:31<15:30:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.60s]
Epoch 2: 41%|████ | 5056/12384 [10:43:39<15:30:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 41%|████ | 5057/12384 [10:43:39<15:30:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 41%|████ | 5057/12384 [10:43:46<15:30:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 41%|████ | 5058/12384 [10:43:46<15:30:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 41%|████ | 5058/12384 [10:43:54<15:30:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 2: 41%|████ | 5059/12384 [10:43:54<15:31:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 2: 41%|████ | 5059/12384 [10:44:01<15:31:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.75s]
Epoch 2: 41%|████ | 5060/12384 [10:44:01<15:30:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.75s]
Epoch 2: 41%|████ | 5060/12384 [10:44:09<15:30:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 41%|████ | 5061/12384 [10:44:09<15:30:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 41%|████ | 5061/12384 [10:44:17<15:30:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 41%|████ | 5062/12384 [10:44:17<15:29:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 41%|████ | 5062/12384 [10:44:24<15:29:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 41%|████ | 5063/12384 [10:44:24<15:30:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 41%|████ | 5063/12384 [10:44:32<15:30:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 41%|████ | 5064/12384 [10:44:32<15:32:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 41%|████ | 5064/12384 [10:44:40<15:32:07, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.28s]
Epoch 2: 41%|████ | 5065/12384 [10:44:40<15:30:44, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.28s]
Epoch 2: 41%|████ | 5065/12384 [10:44:47<15:30:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 41%|████ | 5066/12384 [10:44:47<15:32:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 41%|████ | 5066/12384 [10:44:55<15:32:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 41%|████ | 5067/12384 [10:44:55<15:32:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 41%|████ | 5067/12384 [10:45:03<15:32:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 41%|████ | 5068/12384 [10:45:03<15:30:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 41%|████ | 5068/12384 [10:45:10<15:30:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 41%|████ | 5069/12384 [10:45:10<15:29:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 41%|████ | 5069/12384 [10:45:18<15:29:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.50s]
Epoch 2: 41%|████ | 5070/12384 [10:45:18<15:29:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.50s]
Epoch 2: 41%|████ | 5070/12384 [10:45:25<15:29:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 2: 41%|████ | 5071/12384 [10:45:25<15:28:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 2: 41%|████ | 5071/12384 [10:45:33<15:28:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 41%|████ | 5072/12384 [10:45:33<15:27:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 41%|████ | 5072/12384 [10:45:41<15:27:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 41%|████ | 5073/12384 [10:45:41<15:28:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 41%|████ | 5073/12384 [10:45:48<15:28:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 41%|████ | 5074/12384 [10:45:48<15:28:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 41%|████ | 5074/12384 [10:45:56<15:28:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 41%|████ | 5075/12384 [10:45:56<15:40:11, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 41%|████ | 5075/12384 [10:46:04<15:40:11, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 2: 41%|████ | 5076/12384 [10:46:04<15:36:53, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 2: 41%|████ | 5076/12384 [10:46:11<15:36:53, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 2: 41%|████ | 5077/12384 [10:46:11<15:34:02, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 2: 41%|████ | 5077/12384 [10:46:19<15:34:02, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.23s]
Epoch 2: 41%|████ | 5078/12384 [10:46:19<15:32:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.23s]
Epoch 2: 41%|████ | 5078/12384 [10:46:27<15:32:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.52s]
Epoch 2: 41%|████ | 5079/12384 [10:46:27<15:31:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.52s]
Epoch 2: 41%|████ | 5079/12384 [10:46:34<15:31:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.71s]
Epoch 2: 41%|████ | 5080/12384 [10:46:34<15:30:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.71s]
Epoch 2: 41%|████ | 5080/12384 [10:46:42<15:30:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.93s]
Epoch 2: 41%|████ | 5081/12384 [10:46:42<15:29:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.93s]
Epoch 2: 41%|████ | 5081/12384 [10:46:50<15:29:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.76s]
Epoch 2: 41%|████ | 5082/12384 [10:46:50<15:28:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.76s]
Epoch 2: 41%|████ | 5082/12384 [10:46:57<15:28:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 41%|████ | 5083/12384 [10:46:57<15:27:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 41%|████ | 5083/12384 [10:47:05<15:27:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 41%|████ | 5084/12384 [10:47:05<15:26:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 41%|████ | 5084/12384 [10:47:12<15:26:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 41%|████ | 5085/12384 [10:47:12<15:26:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 41%|████ | 5085/12384 [10:47:20<15:26:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 41%|████ | 5086/12384 [10:47:20<15:25:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 41%|████ | 5086/12384 [10:47:28<15:25:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 41%|████ | 5087/12384 [10:47:28<15:24:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 41%|████ | 5087/12384 [10:47:35<15:24:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 2: 41%|████ | 5088/12384 [10:47:35<15:24:23, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 2: 41%|████ | 5088/12384 [10:47:43<15:24:23, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 41%|████ | 5089/12384 [10:47:43<15:26:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 41%|████ | 5089/12384 [10:47:50<15:26:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.55s]
Epoch 2: 41%|████ | 5090/12384 [10:47:50<15:25:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.55s]
Epoch 2: 41%|████ | 5090/12384 [10:47:58<15:25:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 2: 41%|████ | 5091/12384 [10:47:58<15:26:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 2: 41%|████ | 5091/12384 [10:48:06<15:26:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 41%|████ | 5092/12384 [10:48:06<15:26:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 41%|████ | 5092/12384 [10:48:13<15:26:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 41%|████ | 5093/12384 [10:48:13<15:25:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 41%|████ | 5093/12384 [10:48:21<15:25:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 2: 41%|████ | 5094/12384 [10:48:21<15:26:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 2: 41%|████ | 5094/12384 [10:48:29<15:26:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 2: 41%|████ | 5095/12384 [10:48:29<15:25:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 2: 41%|████ | 5095/12384 [10:48:36<15:25:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.28s]
Epoch 2: 41%|████ | 5096/12384 [10:48:36<15:25:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.28s]
Epoch 2: 41%|████ | 5096/12384 [10:48:44<15:25:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 41%|████ | 5097/12384 [10:48:44<15:32:09, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 41%|████ | 5097/12384 [10:48:52<15:32:09, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.79s]
Epoch 2: 41%|████ | 5098/12384 [10:48:52<15:29:40, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.79s]
Epoch 2: 41%|████ | 5098/12384 [10:48:59<15:29:40, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 41%|████ | 5099/12384 [10:48:59<15:28:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 41%|████ | 5099/12384 [10:49:07<15:28:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.90s]
Epoch 2: 41%|████ | 5100/12384 [10:49:07<15:32:43, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.90s]
Epoch 2: 41%|████ | 5100/12384 [10:49:15<15:32:43, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.54s]
Epoch 2: 41%|████ | 5101/12384 [10:49:15<15:42:50, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=10.54s]
Epoch 2: 41%|████ | 5101/12384 [10:49:23<15:42:50, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=5.40s]
Epoch 2: 41%|████ | 5102/12384 [10:49:23<15:42:21, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=5.40s]
Epoch 2: 41%|████ | 5102/12384 [10:49:30<15:42:21, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 2: 41%|████ | 5103/12384 [10:49:30<15:36:25, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 2: 41%|████ | 5103/12384 [10:49:38<15:36:25, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 2: 41%|████ | 5104/12384 [10:49:38<15:33:18, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 2: 41%|████ | 5104/12384 [10:49:46<15:33:18, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 41%|████ | 5105/12384 [10:49:46<15:30:27, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 41%|████ | 5105/12384 [10:49:53<15:30:27, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.50s]
Epoch 2: 41%|████ | 5106/12384 [10:49:53<15:28:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.50s]
Epoch 2: 41%|████ | 5106/12384 [10:50:01<15:28:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.05s]
Epoch 2: 41%|████ | 5107/12384 [10:50:01<15:36:56, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=11.05s]
Epoch 2: 41%|████ | 5107/12384 [10:50:09<15:36:56, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 41%|████ | 5108/12384 [10:50:09<15:33:18, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 41%|████ | 5108/12384 [10:50:16<15:33:18, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 41%|████▏ | 5109/12384 [10:50:16<15:29:43, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 41%|████▏ | 5109/12384 [10:50:24<15:29:43, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 2: 41%|████▏ | 5110/12384 [10:50:24<15:27:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 2: 41%|████▏ | 5110/12384 [10:50:32<15:27:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 2: 41%|████▏ | 5111/12384 [10:50:32<15:26:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 2: 41%|████▏ | 5111/12384 [10:50:39<15:26:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 41%|████▏ | 5112/12384 [10:50:39<15:25:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 41%|████▏ | 5112/12384 [10:50:47<15:25:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 2: 41%|████▏ | 5113/12384 [10:50:47<15:25:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 2: 41%|████▏ | 5113/12384 [10:50:54<15:25:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 2: 41%|████▏ | 5114/12384 [10:50:54<15:25:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 2: 41%|████▏ | 5114/12384 [10:51:02<15:25:04, 7.63s/it, loss=0.0004, acc=0.9982, iter_time=7.64s]
Epoch 2: 41%|████▏ | 5115/12384 [10:51:02<15:24:47, 7.63s/it, loss=0.0004, acc=0.9982, iter_time=7.64s]
Epoch 2: 41%|████▏ | 5115/12384 [10:51:10<15:24:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 41%|████▏ | 5116/12384 [10:51:10<15:23:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 41%|████▏ | 5116/12384 [10:51:17<15:23:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 41%|████▏ | 5117/12384 [10:51:17<15:22:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 41%|████▏ | 5117/12384 [10:51:25<15:22:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 41%|████▏ | 5118/12384 [10:51:25<15:22:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 41%|████▏ | 5118/12384 [10:51:32<15:22:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 41%|████▏ | 5119/12384 [10:51:32<15:22:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 41%|████▏ | 5119/12384 [10:51:40<15:22:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 41%|████▏ | 5120/12384 [10:51:40<15:22:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 41%|████▏ | 5120/12384 [10:51:48<15:22:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 41%|████▏ | 5121/12384 [10:51:48<15:24:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 41%|████▏ | 5121/12384 [10:51:55<15:24:37, 7.64s/it, loss=0.0028, acc=0.9931, iter_time=4.48s]
Epoch 2: 41%|████▏ | 5122/12384 [10:51:55<15:23:31, 7.63s/it, loss=0.0028, acc=0.9931, iter_time=4.48s]
Epoch 2: 41%|████▏ | 5122/12384 [10:52:03<15:23:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.65s]
Epoch 2: 41%|████▏ | 5123/12384 [10:52:03<15:23:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.65s]
Epoch 2: 41%|████▏ | 5123/12384 [10:52:11<15:23:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 2: 41%|████▏ | 5124/12384 [10:52:11<15:22:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 2: 41%|████▏ | 5124/12384 [10:52:18<15:22:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 2: 41%|████▏ | 5125/12384 [10:52:18<15:22:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 2: 41%|████▏ | 5125/12384 [10:52:26<15:22:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.72s]
Epoch 2: 41%|████▏ | 5126/12384 [10:52:26<15:22:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.72s]
Epoch 2: 41%|████▏ | 5126/12384 [10:52:34<15:22:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 2: 41%|████▏ | 5127/12384 [10:52:34<15:21:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 2: 41%|████▏ | 5127/12384 [10:52:42<15:21:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 2: 41%|████▏ | 5128/12384 [10:52:42<15:38:03, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 2: 41%|████▏ | 5128/12384 [10:52:49<15:38:03, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 2: 41%|████▏ | 5129/12384 [10:52:49<15:33:39, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 2: 41%|████▏ | 5129/12384 [10:52:57<15:33:39, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 2: 41%|████▏ | 5130/12384 [10:52:57<15:29:06, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 2: 41%|████▏ | 5130/12384 [10:53:04<15:29:06, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 2: 41%|████▏ | 5131/12384 [10:53:04<15:26:48, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 2: 41%|████▏ | 5131/12384 [10:53:12<15:26:48, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.79s]
Epoch 2: 41%|████▏ | 5132/12384 [10:53:12<15:25:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.79s]
Epoch 2: 41%|████▏ | 5132/12384 [10:53:20<15:25:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 2: 41%|████▏ | 5133/12384 [10:53:20<15:23:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 2: 41%|████▏ | 5133/12384 [10:53:27<15:23:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 2: 41%|████▏ | 5134/12384 [10:53:27<15:21:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 2: 41%|████▏ | 5134/12384 [10:53:35<15:21:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 41%|████▏ | 5135/12384 [10:53:35<15:25:17, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 41%|████▏ | 5135/12384 [10:53:43<15:25:17, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 2: 41%|████▏ | 5136/12384 [10:53:43<15:26:28, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 2: 41%|████▏ | 5136/12384 [10:53:50<15:26:28, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 41%|████▏ | 5137/12384 [10:53:50<15:28:32, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 41%|████▏ | 5137/12384 [10:53:58<15:28:32, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 41%|████▏ | 5138/12384 [10:53:58<15:25:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 41%|████▏ | 5138/12384 [10:54:06<15:25:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 41%|████▏ | 5139/12384 [10:54:06<15:23:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 41%|████▏ | 5139/12384 [10:54:13<15:23:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 2: 42%|████▏ | 5140/12384 [10:54:13<15:21:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 2: 42%|████▏ | 5140/12384 [10:54:21<15:21:25, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.12s]
Epoch 2: 42%|████▏ | 5141/12384 [10:54:21<15:19:22, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.12s]
Epoch 2: 42%|████▏ | 5141/12384 [10:54:28<15:19:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 42%|████▏ | 5142/12384 [10:54:28<15:19:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 42%|████▏ | 5142/12384 [10:54:36<15:19:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 42%|████▏ | 5143/12384 [10:54:36<15:19:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 42%|████▏ | 5143/12384 [10:54:44<15:19:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 42%|████▏ | 5144/12384 [10:54:44<15:23:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 42%|████▏ | 5144/12384 [10:54:51<15:23:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 42%|████▏ | 5145/12384 [10:54:51<15:22:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 42%|████▏ | 5145/12384 [10:54:59<15:22:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 42%|████▏ | 5146/12384 [10:54:59<15:20:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 42%|████▏ | 5146/12384 [10:55:07<15:20:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 42%|████▏ | 5147/12384 [10:55:07<15:19:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 42%|████▏ | 5147/12384 [10:55:14<15:19:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 42%|████▏ | 5148/12384 [10:55:14<15:18:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 42%|████▏ | 5148/12384 [10:55:22<15:18:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 2: 42%|████▏ | 5149/12384 [10:55:22<15:17:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 2: 42%|████▏ | 5149/12384 [10:55:29<15:17:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 2: 42%|████▏ | 5150/12384 [10:55:29<15:16:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 2: 42%|████▏ | 5150/12384 [10:55:37<15:16:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 42%|████▏ | 5151/12384 [10:55:37<15:16:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 42%|████▏ | 5151/12384 [10:55:45<15:16:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 42%|████▏ | 5152/12384 [10:55:45<15:17:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 42%|████▏ | 5152/12384 [10:55:52<15:17:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 42%|████▏ | 5153/12384 [10:55:52<15:16:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 42%|████▏ | 5153/12384 [10:56:00<15:16:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.28s]
Epoch 2: 42%|████▏ | 5154/12384 [10:56:00<15:27:11, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.28s]
Epoch 2: 42%|████▏ | 5154/12384 [10:56:08<15:27:11, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=11.22s]
Epoch 2: 42%|████▏ | 5155/12384 [10:56:08<15:24:23, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=11.22s]
Epoch 2: 42%|████▏ | 5155/12384 [10:56:15<15:24:23, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 42%|████▏ | 5156/12384 [10:56:15<15:22:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 42%|████▏ | 5156/12384 [10:56:23<15:22:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 42%|████▏ | 5157/12384 [10:56:23<15:19:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 42%|████▏ | 5157/12384 [10:56:31<15:19:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 42%|████▏ | 5158/12384 [10:56:31<15:18:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 42%|████▏ | 5158/12384 [10:56:38<15:18:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 42%|████▏ | 5159/12384 [10:56:38<15:18:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 42%|████▏ | 5159/12384 [10:56:46<15:18:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.34s]
Epoch 2: 42%|████▏ | 5160/12384 [10:56:46<15:28:46, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.34s]
Epoch 2: 42%|████▏ | 5160/12384 [10:56:54<15:28:46, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 42%|████▏ | 5161/12384 [10:56:54<15:24:40, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 42%|████▏ | 5161/12384 [10:57:01<15:24:40, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 42%|████▏ | 5162/12384 [10:57:01<15:21:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 42%|████▏ | 5162/12384 [10:57:09<15:21:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 42%|████▏ | 5163/12384 [10:57:09<15:19:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 42%|████▏ | 5163/12384 [10:57:17<15:19:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 42%|████▏ | 5164/12384 [10:57:17<15:18:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 42%|████▏ | 5164/12384 [10:57:24<15:18:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 42%|████▏ | 5165/12384 [10:57:24<15:18:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 42%|████▏ | 5165/12384 [10:57:32<15:18:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 42%|████▏ | 5166/12384 [10:57:32<15:17:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 42%|████▏ | 5166/12384 [10:57:39<15:17:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 42%|████▏ | 5167/12384 [10:57:39<15:17:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 42%|████▏ | 5167/12384 [10:57:47<15:17:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 42%|████▏ | 5168/12384 [10:57:47<15:19:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 42%|████▏ | 5168/12384 [10:57:55<15:19:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 42%|████▏ | 5169/12384 [10:57:55<15:17:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 42%|████▏ | 5169/12384 [10:58:02<15:17:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.87s]
Epoch 2: 42%|████▏ | 5170/12384 [10:58:02<15:19:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=3.87s]
Epoch 2: 42%|████▏ | 5170/12384 [10:58:10<15:19:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.82s]
Epoch 2: 42%|████▏ | 5171/12384 [10:58:10<15:18:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.82s]
Epoch 2: 42%|████▏ | 5171/12384 [10:58:18<15:18:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.20s]
Epoch 2: 42%|████▏ | 5172/12384 [10:58:18<15:16:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.20s]
Epoch 2: 42%|████▏ | 5172/12384 [10:58:25<15:16:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 42%|████▏ | 5173/12384 [10:58:25<15:16:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 42%|████▏ | 5173/12384 [10:58:33<15:16:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 42%|████▏ | 5174/12384 [10:58:33<15:15:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 42%|████▏ | 5174/12384 [10:58:40<15:15:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 2: 42%|████▏ | 5175/12384 [10:58:40<15:15:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 2: 42%|████▏ | 5175/12384 [10:58:48<15:15:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 2: 42%|████▏ | 5176/12384 [10:58:48<15:14:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 2: 42%|████▏ | 5176/12384 [10:58:56<15:14:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.51s]
Epoch 2: 42%|████▏ | 5177/12384 [10:58:56<15:14:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.51s]
Epoch 2: 42%|████▏ | 5177/12384 [10:59:03<15:14:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 2: 42%|████▏ | 5178/12384 [10:59:03<15:13:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 2: 42%|████▏ | 5178/12384 [10:59:11<15:13:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 2: 42%|████▏ | 5179/12384 [10:59:11<15:13:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 2: 42%|████▏ | 5179/12384 [10:59:18<15:13:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 42%|████▏ | 5180/12384 [10:59:18<15:14:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 42%|████▏ | 5180/12384 [10:59:26<15:14:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 42%|████▏ | 5181/12384 [10:59:26<15:26:09, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 42%|████▏ | 5181/12384 [10:59:34<15:26:09, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 2: 42%|████▏ | 5182/12384 [10:59:34<15:22:32, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 2: 42%|████▏ | 5182/12384 [10:59:42<15:22:32, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.62s]
Epoch 2: 42%|████▏ | 5183/12384 [10:59:42<15:19:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.62s]
Epoch 2: 42%|████▏ | 5183/12384 [10:59:49<15:19:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.14s]
Epoch 2: 42%|████▏ | 5184/12384 [10:59:49<15:17:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.14s]
Epoch 2: 42%|████▏ | 5184/12384 [10:59:57<15:17:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 42%|████▏ | 5185/12384 [10:59:57<15:15:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 42%|████▏ | 5185/12384 [11:00:04<15:15:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 2: 42%|████▏ | 5186/12384 [11:00:04<15:13:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 2: 42%|████▏ | 5186/12384 [11:00:12<15:13:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 2: 42%|████▏ | 5187/12384 [11:00:12<15:13:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 2: 42%|████▏ | 5187/12384 [11:00:20<15:13:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 42%|████▏ | 5188/12384 [11:00:20<15:14:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 42%|████▏ | 5188/12384 [11:00:27<15:14:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 42%|████▏ | 5189/12384 [11:00:27<15:15:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 42%|████▏ | 5189/12384 [11:00:35<15:15:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 42%|████▏ | 5190/12384 [11:00:35<15:14:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 42%|████▏ | 5190/12384 [11:00:43<15:14:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 42%|████▏ | 5191/12384 [11:00:43<15:13:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 42%|████▏ | 5191/12384 [11:00:50<15:13:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 42%|████▏ | 5192/12384 [11:00:50<15:13:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 42%|████▏ | 5192/12384 [11:00:58<15:13:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 42%|████▏ | 5193/12384 [11:00:58<15:13:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 42%|████▏ | 5193/12384 [11:01:05<15:13:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.26s]
Epoch 2: 42%|████▏ | 5194/12384 [11:01:05<15:12:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.26s]
Epoch 2: 42%|████▏ | 5194/12384 [11:01:13<15:12:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.98s]
Epoch 2: 42%|████▏ | 5195/12384 [11:01:13<15:12:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.98s]
Epoch 2: 42%|████▏ | 5195/12384 [11:01:21<15:12:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 2: 42%|████▏ | 5196/12384 [11:01:21<15:12:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 2: 42%|████▏ | 5196/12384 [11:01:28<15:12:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 42%|████▏ | 5197/12384 [11:01:28<15:14:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 42%|████▏ | 5197/12384 [11:01:36<15:14:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=12.29s]
Epoch 2: 42%|████▏ | 5198/12384 [11:01:36<15:12:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=12.29s]
Epoch 2: 42%|████▏ | 5198/12384 [11:01:44<15:12:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 42%|████▏ | 5199/12384 [11:01:44<15:11:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 42%|████▏ | 5199/12384 [11:01:51<15:11:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 42%|████▏ | 5200/12384 [11:01:51<15:12:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 42%|████▏ | 5200/12384 [11:01:59<15:12:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 42%|████▏ | 5201/12384 [11:01:59<15:10:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 42%|████▏ | 5201/12384 [11:02:06<15:10:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 42%|████▏ | 5202/12384 [11:02:06<15:10:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 42%|████▏ | 5202/12384 [11:02:14<15:10:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 42%|████▏ | 5203/12384 [11:02:14<15:10:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 42%|████▏ | 5203/12384 [11:02:22<15:10:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 2: 42%|████▏ | 5204/12384 [11:02:22<15:10:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 2: 42%|████▏ | 5204/12384 [11:02:29<15:10:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 2: 42%|████▏ | 5205/12384 [11:02:29<15:12:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 2: 42%|████▏ | 5205/12384 [11:02:37<15:12:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.64s]
Epoch 2: 42%|████▏ | 5206/12384 [11:02:37<15:11:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.64s]
Epoch 2: 42%|████▏ | 5206/12384 [11:02:45<15:11:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 2: 42%|████▏ | 5207/12384 [11:02:45<15:22:09, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 2: 42%|████▏ | 5207/12384 [11:02:52<15:22:09, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 2: 42%|████▏ | 5208/12384 [11:02:52<15:19:14, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 2: 42%|████▏ | 5208/12384 [11:03:00<15:19:14, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 42%|████▏ | 5209/12384 [11:03:00<15:16:28, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 42%|████▏ | 5209/12384 [11:03:08<15:16:28, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 42%|████▏ | 5210/12384 [11:03:08<15:14:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 42%|████▏ | 5210/12384 [11:03:15<15:14:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 2: 42%|████▏ | 5211/12384 [11:03:15<15:16:00, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 2: 42%|████▏ | 5211/12384 [11:03:23<15:16:00, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 2: 42%|████▏ | 5212/12384 [11:03:23<15:13:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 2: 42%|████▏ | 5212/12384 [11:03:31<15:13:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.48s]
Epoch 2: 42%|████▏ | 5213/12384 [11:03:31<15:22:09, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.48s]
Epoch 2: 42%|████▏ | 5213/12384 [11:03:38<15:22:09, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.06s]
Epoch 2: 42%|████▏ | 5214/12384 [11:03:38<15:17:53, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.06s]
Epoch 2: 42%|████▏ | 5214/12384 [11:03:46<15:17:53, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 2: 42%|████▏ | 5215/12384 [11:03:46<15:14:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 2: 42%|████▏ | 5215/12384 [11:03:54<15:14:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 42%|████▏ | 5216/12384 [11:03:54<15:13:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 42%|████▏ | 5216/12384 [11:04:01<15:13:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 2: 42%|████▏ | 5217/12384 [11:04:01<15:12:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 2: 42%|████▏ | 5217/12384 [11:04:09<15:12:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 2: 42%|████▏ | 5218/12384 [11:04:09<15:11:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 2: 42%|████▏ | 5218/12384 [11:04:16<15:11:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 42%|████▏ | 5219/12384 [11:04:16<15:10:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 42%|████▏ | 5219/12384 [11:04:24<15:10:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 42%|████▏ | 5220/12384 [11:04:24<15:10:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 42%|████▏ | 5220/12384 [11:04:32<15:10:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 2: 42%|████▏ | 5221/12384 [11:04:32<15:09:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 2: 42%|████▏ | 5221/12384 [11:04:39<15:09:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 2: 42%|████▏ | 5222/12384 [11:04:39<15:08:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 2: 42%|████▏ | 5222/12384 [11:04:47<15:08:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.45s]
Epoch 2: 42%|████▏ | 5223/12384 [11:04:47<15:08:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.45s]
Epoch 2: 42%|████▏ | 5223/12384 [11:04:55<15:08:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.38s]
Epoch 2: 42%|████▏ | 5224/12384 [11:04:55<15:09:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.38s]
Epoch 2: 42%|████▏ | 5224/12384 [11:05:02<15:09:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 42%|████▏ | 5225/12384 [11:05:02<15:08:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 42%|████▏ | 5225/12384 [11:05:10<15:08:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.63s]
Epoch 2: 42%|████▏ | 5226/12384 [11:05:10<15:07:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.63s]
Epoch 2: 42%|████▏ | 5226/12384 [11:05:17<15:07:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.58s]
Epoch 2: 42%|████▏ | 5227/12384 [11:05:17<15:08:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.58s]
Epoch 2: 42%|████▏ | 5227/12384 [11:05:25<15:08:16, 7.61s/it, loss=0.0005, acc=0.9978, iter_time=4.78s]
Epoch 2: 42%|████▏ | 5228/12384 [11:05:25<15:06:46, 7.60s/it, loss=0.0005, acc=0.9978, iter_time=4.78s]
Epoch 2: 42%|████▏ | 5228/12384 [11:05:33<15:06:46, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 2: 42%|████▏ | 5229/12384 [11:05:33<15:06:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 2: 42%|████▏ | 5229/12384 [11:05:40<15:06:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 2: 42%|████▏ | 5230/12384 [11:05:40<15:06:35, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 2: 42%|████▏ | 5230/12384 [11:05:48<15:06:35, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 2: 42%|████▏ | 5231/12384 [11:05:48<15:06:14, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 2: 42%|████▏ | 5231/12384 [11:05:55<15:06:14, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 42%|████▏ | 5232/12384 [11:05:56<15:13:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 42%|████▏ | 5232/12384 [11:06:03<15:13:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.43s]
Epoch 2: 42%|████▏ | 5233/12384 [11:06:03<15:22:40, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.43s]
Epoch 2: 42%|████▏ | 5233/12384 [11:06:11<15:22:40, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 2: 42%|████▏ | 5234/12384 [11:06:11<15:17:11, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 2: 42%|████▏ | 5234/12384 [11:06:19<15:17:11, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 2: 42%|████▏ | 5235/12384 [11:06:19<15:13:43, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 2: 42%|████▏ | 5235/12384 [11:06:26<15:13:43, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 2: 42%|████▏ | 5236/12384 [11:06:26<15:12:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 2: 42%|████▏ | 5236/12384 [11:06:34<15:12:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 2: 42%|████▏ | 5237/12384 [11:06:34<15:09:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 2: 42%|████▏ | 5237/12384 [11:06:41<15:09:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 2: 42%|████▏ | 5238/12384 [11:06:41<15:07:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 2: 42%|████▏ | 5238/12384 [11:06:49<15:07:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 2: 42%|████▏ | 5239/12384 [11:06:49<15:07:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 2: 42%|████▏ | 5239/12384 [11:06:57<15:07:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.77s]
Epoch 2: 42%|████▏ | 5240/12384 [11:06:57<15:06:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.77s]
Epoch 2: 42%|████▏ | 5240/12384 [11:07:04<15:06:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.45s]
Epoch 2: 42%|████▏ | 5241/12384 [11:07:04<15:06:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.45s]
Epoch 2: 42%|████▏ | 5241/12384 [11:07:12<15:06:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 42%|████▏ | 5242/12384 [11:07:12<15:06:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 42%|████▏ | 5242/12384 [11:07:20<15:06:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 2: 42%|████▏ | 5243/12384 [11:07:20<15:06:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 2: 42%|████▏ | 5243/12384 [11:07:27<15:06:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 2: 42%|████▏ | 5244/12384 [11:07:27<15:06:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 2: 42%|████▏ | 5244/12384 [11:07:35<15:06:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 42%|████▏ | 5245/12384 [11:07:35<15:06:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 42%|████▏ | 5245/12384 [11:07:42<15:06:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 42%|████▏ | 5246/12384 [11:07:42<15:05:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 42%|████▏ | 5246/12384 [11:07:50<15:05:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 42%|████▏ | 5247/12384 [11:07:50<15:05:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 42%|████▏ | 5247/12384 [11:07:58<15:05:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 42%|████▏ | 5248/12384 [11:07:58<15:04:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 42%|████▏ | 5248/12384 [11:08:05<15:04:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 42%|████▏ | 5249/12384 [11:08:05<15:04:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 42%|████▏ | 5249/12384 [11:08:13<15:04:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 42%|████▏ | 5250/12384 [11:08:13<15:05:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 42%|████▏ | 5250/12384 [11:08:20<15:05:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 42%|████▏ | 5251/12384 [11:08:20<15:05:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 42%|████▏ | 5251/12384 [11:08:28<15:05:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 42%|████▏ | 5252/12384 [11:08:28<15:04:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 42%|████▏ | 5252/12384 [11:08:36<15:04:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 2: 42%|████▏ | 5253/12384 [11:08:36<15:05:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 2: 42%|████▏ | 5253/12384 [11:08:43<15:05:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 2: 42%|████▏ | 5254/12384 [11:08:43<15:05:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 2: 42%|████▏ | 5254/12384 [11:08:51<15:05:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 42%|████▏ | 5255/12384 [11:08:51<15:04:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 42%|████▏ | 5255/12384 [11:08:58<15:04:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.92s]
Epoch 2: 42%|████▏ | 5256/12384 [11:08:58<15:03:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.92s]
Epoch 2: 42%|████▏ | 5256/12384 [11:09:06<15:03:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 42%|████▏ | 5257/12384 [11:09:06<15:03:12, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 42%|████▏ | 5257/12384 [11:09:14<15:03:12, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 42%|████▏ | 5258/12384 [11:09:14<15:02:35, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 42%|████▏ | 5258/12384 [11:09:22<15:02:35, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=6.41s]
Epoch 2: 42%|████▏ | 5259/12384 [11:09:22<15:14:47, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=6.41s]
Epoch 2: 42%|████▏ | 5259/12384 [11:09:29<15:14:47, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 42%|████▏ | 5260/12384 [11:09:29<15:10:46, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 42%|████▏ | 5260/12384 [11:09:37<15:10:46, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 2: 42%|████▏ | 5261/12384 [11:09:37<15:07:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 2: 42%|████▏ | 5261/12384 [11:09:44<15:07:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 2: 42%|████▏ | 5262/12384 [11:09:44<15:06:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 2: 42%|████▏ | 5262/12384 [11:09:52<15:06:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 2: 42%|████▏ | 5263/12384 [11:09:52<15:04:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 2: 42%|████▏ | 5263/12384 [11:10:00<15:04:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 43%|████▎ | 5264/12384 [11:10:00<15:06:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 43%|████▎ | 5264/12384 [11:10:07<15:06:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 43%|████▎ | 5265/12384 [11:10:07<15:06:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 43%|████▎ | 5265/12384 [11:10:15<15:06:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 43%|████▎ | 5266/12384 [11:10:15<15:05:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 43%|████▎ | 5266/12384 [11:10:23<15:05:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 2: 43%|████▎ | 5267/12384 [11:10:23<15:04:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 2: 43%|████▎ | 5267/12384 [11:10:30<15:04:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 2: 43%|████▎ | 5268/12384 [11:10:30<15:03:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 2: 43%|████▎ | 5268/12384 [11:10:38<15:03:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 43%|████▎ | 5269/12384 [11:10:38<15:03:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 43%|████▎ | 5269/12384 [11:10:45<15:03:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 43%|████▎ | 5270/12384 [11:10:45<15:04:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 43%|████▎ | 5270/12384 [11:10:53<15:04:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 2: 43%|████▎ | 5271/12384 [11:10:53<15:02:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 2: 43%|████▎ | 5271/12384 [11:11:01<15:02:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 2: 43%|████▎ | 5272/12384 [11:11:01<15:02:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 2: 43%|████▎ | 5272/12384 [11:11:08<15:02:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 43%|████▎ | 5273/12384 [11:11:08<15:01:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 43%|████▎ | 5273/12384 [11:11:16<15:01:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 43%|████▎ | 5274/12384 [11:11:16<15:01:02, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 43%|████▎ | 5274/12384 [11:11:23<15:01:02, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 43%|████▎ | 5275/12384 [11:11:23<15:00:52, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 43%|████▎ | 5275/12384 [11:11:31<15:00:52, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 43%|████▎ | 5276/12384 [11:11:31<15:00:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 43%|████▎ | 5276/12384 [11:11:39<15:00:09, 7.60s/it, loss=0.0000, acc=0.9999, iter_time=8.52s]
Epoch 2: 43%|████▎ | 5277/12384 [11:11:39<15:03:01, 7.62s/it, loss=0.0000, acc=0.9999, iter_time=8.52s]
Epoch 2: 43%|████▎ | 5277/12384 [11:11:46<15:03:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 2: 43%|████▎ | 5278/12384 [11:11:46<15:02:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 2: 43%|████▎ | 5278/12384 [11:11:54<15:02:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.40s]
Epoch 2: 43%|████▎ | 5279/12384 [11:11:54<15:02:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.40s]
Epoch 2: 43%|████▎ | 5279/12384 [11:12:02<15:02:12, 7.62s/it, loss=0.0001, acc=0.9984, iter_time=9.65s]
Epoch 2: 43%|████▎ | 5280/12384 [11:12:02<15:01:57, 7.62s/it, loss=0.0001, acc=0.9984, iter_time=9.65s]
Epoch 2: 43%|████▎ | 5280/12384 [11:12:09<15:01:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 43%|████▎ | 5281/12384 [11:12:09<15:02:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 43%|████▎ | 5281/12384 [11:12:17<15:02:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.14s]
Epoch 2: 43%|████▎ | 5282/12384 [11:12:17<15:04:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.14s]
Epoch 2: 43%|████▎ | 5282/12384 [11:12:24<15:04:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 2: 43%|████▎ | 5283/12384 [11:12:24<15:03:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 2: 43%|████▎ | 5283/12384 [11:12:32<15:03:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 2: 43%|████▎ | 5284/12384 [11:12:32<15:02:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 2: 43%|████▎ | 5284/12384 [11:12:40<15:02:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.12s]
Epoch 2: 43%|████▎ | 5285/12384 [11:12:40<15:14:21, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.12s]
Epoch 2: 43%|████▎ | 5285/12384 [11:12:48<15:14:21, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 2: 43%|████▎ | 5286/12384 [11:12:48<15:10:19, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 2: 43%|████▎ | 5286/12384 [11:12:55<15:10:19, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=6.13s]
Epoch 2: 43%|████▎ | 5287/12384 [11:12:55<15:07:35, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=6.13s]
Epoch 2: 43%|████▎ | 5287/12384 [11:13:03<15:07:35, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 2: 43%|████▎ | 5288/12384 [11:13:03<15:05:40, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 2: 43%|████▎ | 5288/12384 [11:13:11<15:05:40, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 43%|████▎ | 5289/12384 [11:13:11<15:03:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 43%|████▎ | 5289/12384 [11:13:18<15:03:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 43%|████▎ | 5290/12384 [11:13:18<15:01:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 43%|████▎ | 5290/12384 [11:13:26<15:01:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 43%|████▎ | 5291/12384 [11:13:26<15:11:46, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 43%|████▎ | 5291/12384 [11:13:34<15:11:46, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 2: 43%|████▎ | 5292/12384 [11:13:34<15:08:27, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 2: 43%|████▎ | 5292/12384 [11:13:41<15:08:27, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.75s]
Epoch 2: 43%|████▎ | 5293/12384 [11:13:41<15:04:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.75s]
Epoch 2: 43%|████▎ | 5293/12384 [11:13:49<15:04:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 43%|████▎ | 5294/12384 [11:13:49<15:03:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 43%|████▎ | 5294/12384 [11:13:56<15:03:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 2: 43%|████▎ | 5295/12384 [11:13:56<15:02:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 2: 43%|████▎ | 5295/12384 [11:14:04<15:02:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.44s]
Epoch 2: 43%|████▎ | 5296/12384 [11:14:04<15:01:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.44s]
Epoch 2: 43%|████▎ | 5296/12384 [11:14:12<15:01:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 43%|████▎ | 5297/12384 [11:14:12<15:01:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 43%|████▎ | 5297/12384 [11:14:19<15:01:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.22s]
Epoch 2: 43%|████▎ | 5298/12384 [11:14:19<15:01:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.22s]
Epoch 2: 43%|████▎ | 5298/12384 [11:14:27<15:01:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 2: 43%|████▎ | 5299/12384 [11:14:27<15:02:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 2: 43%|████▎ | 5299/12384 [11:14:35<15:02:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 43%|████▎ | 5300/12384 [11:14:35<15:00:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 43%|████▎ | 5300/12384 [11:14:42<15:00:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 43%|████▎ | 5301/12384 [11:14:42<15:00:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 43%|████▎ | 5301/12384 [11:14:50<15:00:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 2: 43%|████▎ | 5302/12384 [11:14:50<14:59:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 2: 43%|████▎ | 5302/12384 [11:14:57<14:59:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 43%|████▎ | 5303/12384 [11:14:57<15:00:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 43%|████▎ | 5303/12384 [11:15:05<15:00:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.69s]
Epoch 2: 43%|████▎ | 5304/12384 [11:15:05<15:00:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.69s]
Epoch 2: 43%|████▎ | 5304/12384 [11:15:13<15:00:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 43%|████▎ | 5305/12384 [11:15:13<14:59:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 43%|████▎ | 5305/12384 [11:15:20<14:59:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 2: 43%|████▎ | 5306/12384 [11:15:20<14:59:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 2: 43%|████▎ | 5306/12384 [11:15:28<14:59:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.77s]
Epoch 2: 43%|████▎ | 5307/12384 [11:15:28<14:59:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.77s]
Epoch 2: 43%|████▎ | 5307/12384 [11:15:36<14:59:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 43%|████▎ | 5308/12384 [11:15:36<14:58:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 43%|████▎ | 5308/12384 [11:15:43<14:58:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 43%|████▎ | 5309/12384 [11:15:43<15:00:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 43%|████▎ | 5309/12384 [11:15:51<15:00:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 43%|████▎ | 5310/12384 [11:15:51<14:59:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 43%|████▎ | 5310/12384 [11:15:59<14:59:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 43%|████▎ | 5311/12384 [11:15:59<14:59:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 43%|████▎ | 5311/12384 [11:16:06<14:59:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 43%|████▎ | 5312/12384 [11:16:06<15:09:48, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 43%|████▎ | 5312/12384 [11:16:14<15:09:48, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.13s]
Epoch 2: 43%|████▎ | 5313/12384 [11:16:14<15:06:00, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.13s]
Epoch 2: 43%|████▎ | 5313/12384 [11:16:22<15:06:00, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.83s]
Epoch 2: 43%|████▎ | 5314/12384 [11:16:22<15:02:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.83s]
Epoch 2: 43%|████▎ | 5314/12384 [11:16:29<15:02:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.58s]
Epoch 2: 43%|████▎ | 5315/12384 [11:16:29<15:01:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.58s]
Epoch 2: 43%|████▎ | 5315/12384 [11:16:37<15:01:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 43%|████▎ | 5316/12384 [11:16:37<14:59:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 43%|████▎ | 5316/12384 [11:16:45<14:59:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 43%|████▎ | 5317/12384 [11:16:45<15:08:28, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 43%|████▎ | 5317/12384 [11:16:52<15:08:28, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 43%|████▎ | 5318/12384 [11:16:52<15:03:58, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 43%|████▎ | 5318/12384 [11:17:00<15:03:58, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 43%|████▎ | 5319/12384 [11:17:00<15:00:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 43%|████▎ | 5319/12384 [11:17:08<15:00:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 43%|████▎ | 5320/12384 [11:17:08<15:00:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 43%|████▎ | 5320/12384 [11:17:15<15:00:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 43%|████▎ | 5321/12384 [11:17:15<14:58:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 43%|████▎ | 5321/12384 [11:17:23<14:58:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 43%|████▎ | 5322/12384 [11:17:23<14:57:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 43%|████▎ | 5322/12384 [11:17:30<14:57:59, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.93s]
Epoch 2: 43%|████▎ | 5323/12384 [11:17:30<14:57:12, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.93s]
Epoch 2: 43%|████▎ | 5323/12384 [11:17:38<14:57:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 43%|████▎ | 5324/12384 [11:17:38<14:56:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 43%|████▎ | 5324/12384 [11:17:46<14:56:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 43%|████▎ | 5325/12384 [11:17:46<14:56:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 43%|████▎ | 5325/12384 [11:17:53<14:56:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 43%|████▎ | 5326/12384 [11:17:53<14:58:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 43%|████▎ | 5326/12384 [11:18:01<14:58:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.55s]
Epoch 2: 43%|████▎ | 5327/12384 [11:18:01<14:57:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.55s]
Epoch 2: 43%|████▎ | 5327/12384 [11:18:09<14:57:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 2: 43%|████▎ | 5328/12384 [11:18:09<14:56:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 2: 43%|████▎ | 5328/12384 [11:18:16<14:56:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 43%|████▎ | 5329/12384 [11:18:16<14:56:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 43%|████▎ | 5329/12384 [11:18:24<14:56:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 2: 43%|████▎ | 5330/12384 [11:18:24<14:56:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 2: 43%|████▎ | 5330/12384 [11:18:31<14:56:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 2: 43%|████▎ | 5331/12384 [11:18:31<14:56:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 2: 43%|████▎ | 5331/12384 [11:18:39<14:56:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 43%|████▎ | 5332/12384 [11:18:39<14:54:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 43%|████▎ | 5332/12384 [11:18:47<14:54:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.18s]
Epoch 2: 43%|████▎ | 5333/12384 [11:18:47<14:53:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.18s]
Epoch 2: 43%|████▎ | 5333/12384 [11:18:54<14:53:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 43%|████▎ | 5334/12384 [11:18:54<14:53:23, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 43%|████▎ | 5334/12384 [11:19:02<14:53:23, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.20s]
Epoch 2: 43%|████▎ | 5335/12384 [11:19:02<14:53:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.20s]
Epoch 2: 43%|████▎ | 5335/12384 [11:19:09<14:53:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.34s]
Epoch 2: 43%|████▎ | 5336/12384 [11:19:09<14:53:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.34s]
Epoch 2: 43%|████▎ | 5336/12384 [11:19:17<14:53:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=3.48s]
Epoch 2: 43%|████▎ | 5337/12384 [11:19:17<14:53:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.48s]
Epoch 2: 43%|████▎ | 5337/12384 [11:19:25<14:53:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.10s]
Epoch 2: 43%|████▎ | 5338/12384 [11:19:25<15:05:05, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=11.10s]
Epoch 2: 43%|████▎ | 5338/12384 [11:19:33<15:05:05, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 2: 43%|████▎ | 5339/12384 [11:19:33<15:00:51, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 2: 43%|████▎ | 5339/12384 [11:19:40<15:00:51, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 43%|████▎ | 5340/12384 [11:19:40<14:57:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 43%|████▎ | 5340/12384 [11:19:48<14:57:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 43%|████▎ | 5341/12384 [11:19:48<14:56:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 43%|████▎ | 5341/12384 [11:19:55<14:56:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 43%|████▎ | 5342/12384 [11:19:55<14:55:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 43%|████▎ | 5342/12384 [11:20:03<14:55:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.94s]
Epoch 2: 43%|████▎ | 5343/12384 [11:20:03<14:55:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.94s]
Epoch 2: 43%|████▎ | 5343/12384 [11:20:11<14:55:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 2: 43%|████▎ | 5344/12384 [11:20:11<14:54:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 2: 43%|████▎ | 5344/12384 [11:20:18<14:54:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 43%|████▎ | 5345/12384 [11:20:18<14:53:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 43%|████▎ | 5345/12384 [11:20:26<14:53:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 43%|████▎ | 5346/12384 [11:20:26<14:53:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 43%|████▎ | 5346/12384 [11:20:33<14:53:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 43%|████▎ | 5347/12384 [11:20:33<14:52:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 43%|████▎ | 5347/12384 [11:20:41<14:52:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 43%|████▎ | 5348/12384 [11:20:41<14:52:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 43%|████▎ | 5348/12384 [11:20:49<14:52:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 43%|████▎ | 5349/12384 [11:20:49<14:52:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 43%|████▎ | 5349/12384 [11:20:56<14:52:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 2: 43%|████▎ | 5350/12384 [11:20:56<14:52:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 2: 43%|████▎ | 5350/12384 [11:21:04<14:52:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 43%|████▎ | 5351/12384 [11:21:04<14:54:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 43%|████▎ | 5351/12384 [11:21:12<14:54:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.62s]
Epoch 2: 43%|████▎ | 5352/12384 [11:21:12<14:53:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.62s]
Epoch 2: 43%|████▎ | 5352/12384 [11:21:19<14:53:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 43%|████▎ | 5353/12384 [11:21:19<14:53:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 43%|████▎ | 5353/12384 [11:21:27<14:53:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 2: 43%|████▎ | 5354/12384 [11:21:27<14:52:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 2: 43%|████▎ | 5354/12384 [11:21:34<14:52:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 2: 43%|████▎ | 5355/12384 [11:21:34<14:51:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 2: 43%|████▎ | 5355/12384 [11:21:42<14:51:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 43%|████▎ | 5356/12384 [11:21:42<14:51:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 43%|████▎ | 5356/12384 [11:21:50<14:51:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 43%|████▎ | 5357/12384 [11:21:50<14:50:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 43%|████▎ | 5357/12384 [11:21:57<14:50:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 2: 43%|████▎ | 5358/12384 [11:21:57<14:51:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 2: 43%|████▎ | 5358/12384 [11:22:05<14:51:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 2: 43%|████▎ | 5359/12384 [11:22:05<14:52:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 2: 43%|████▎ | 5359/12384 [11:22:12<14:52:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 43%|████▎ | 5360/12384 [11:22:12<14:52:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 43%|████▎ | 5360/12384 [11:22:20<14:52:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 43%|████▎ | 5361/12384 [11:22:20<14:51:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 43%|████▎ | 5361/12384 [11:22:28<14:51:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 43%|████▎ | 5362/12384 [11:22:28<14:50:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 43%|████▎ | 5362/12384 [11:22:35<14:50:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.65s]
Epoch 2: 43%|████▎ | 5363/12384 [11:22:35<14:51:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.65s]
Epoch 2: 43%|████▎ | 5363/12384 [11:22:43<14:51:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 43%|████▎ | 5364/12384 [11:22:43<14:51:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 43%|████▎ | 5364/12384 [11:22:51<14:51:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.99s]
Epoch 2: 43%|████▎ | 5365/12384 [11:22:51<15:02:56, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.99s]
Epoch 2: 43%|████▎ | 5365/12384 [11:22:59<15:02:56, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.93s]
Epoch 2: 43%|████▎ | 5366/12384 [11:22:59<15:02:09, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.93s]
Epoch 2: 43%|████▎ | 5366/12384 [11:23:07<15:02:09, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 2: 43%|████▎ | 5367/12384 [11:23:07<15:19:29, 7.86s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 2: 43%|████▎ | 5367/12384 [11:23:15<15:19:29, 7.86s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 43%|████▎ | 5368/12384 [11:23:15<15:24:39, 7.91s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 43%|████▎ | 5368/12384 [11:23:23<15:24:39, 7.91s/it, loss=0.0000, acc=1.0000, iter_time=8.40s]
Epoch 2: 43%|████▎ | 5369/12384 [11:23:23<15:46:24, 8.09s/it, loss=0.0000, acc=1.0000, iter_time=8.40s]
Epoch 2: 43%|████▎ | 5369/12384 [11:23:32<15:46:24, 8.09s/it, loss=0.0000, acc=1.0000, iter_time=8.37s]
Epoch 2: 43%|████▎ | 5370/12384 [11:23:32<15:49:47, 8.12s/it, loss=0.0000, acc=1.0000, iter_time=8.37s]
Epoch 2: 43%|████▎ | 5370/12384 [11:23:39<15:49:47, 8.12s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 43%|████▎ | 5371/12384 [11:23:39<15:34:31, 8.00s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 43%|████▎ | 5371/12384 [11:23:47<15:34:31, 8.00s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 2: 43%|████▎ | 5372/12384 [11:23:47<15:25:37, 7.92s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 2: 43%|████▎ | 5372/12384 [11:23:55<15:25:37, 7.92s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 43%|████▎ | 5373/12384 [11:23:55<15:24:10, 7.91s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 43%|████▎ | 5373/12384 [11:24:03<15:24:10, 7.91s/it, loss=0.0000, acc=1.0000, iter_time=7.80s]
Epoch 2: 43%|████▎ | 5374/12384 [11:24:03<15:16:41, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=7.80s]
Epoch 2: 43%|████▎ | 5374/12384 [11:24:10<15:16:41, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 43%|████▎ | 5375/12384 [11:24:10<15:09:58, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 43%|████▎ | 5375/12384 [11:24:18<15:09:58, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 43%|████▎ | 5376/12384 [11:24:18<15:05:41, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 43%|████▎ | 5376/12384 [11:24:26<15:05:41, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 43%|████▎ | 5377/12384 [11:24:26<15:01:07, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 43%|████▎ | 5377/12384 [11:24:33<15:01:07, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 43%|████▎ | 5378/12384 [11:24:33<14:58:17, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 43%|████▎ | 5378/12384 [11:24:41<14:58:17, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 2: 43%|████▎ | 5379/12384 [11:24:41<14:55:27, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 2: 43%|████▎ | 5379/12384 [11:24:48<14:55:27, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 2: 43%|████▎ | 5380/12384 [11:24:48<14:55:10, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 2: 43%|████▎ | 5380/12384 [11:24:56<14:55:10, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 43%|████▎ | 5381/12384 [11:24:56<14:52:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 43%|████▎ | 5381/12384 [11:25:04<14:52:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 43%|████▎ | 5382/12384 [11:25:04<14:51:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 43%|████▎ | 5382/12384 [11:25:11<14:51:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.35s]
Epoch 2: 43%|████▎ | 5383/12384 [11:25:11<14:49:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.35s]
Epoch 2: 43%|████▎ | 5383/12384 [11:25:19<14:49:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.86s]
Epoch 2: 43%|████▎ | 5384/12384 [11:25:19<14:49:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.86s]
Epoch 2: 43%|████▎ | 5384/12384 [11:25:26<14:49:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 43%|████▎ | 5385/12384 [11:25:26<14:48:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 43%|████▎ | 5385/12384 [11:25:34<14:48:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.89s]
Epoch 2: 43%|████▎ | 5386/12384 [11:25:34<14:49:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.89s]
Epoch 2: 43%|████▎ | 5386/12384 [11:25:42<14:49:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.37s]
Epoch 2: 43%|████▎ | 5387/12384 [11:25:42<14:49:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.37s]
Epoch 2: 43%|████▎ | 5387/12384 [11:25:49<14:49:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 44%|████▎ | 5388/12384 [11:25:49<14:48:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 44%|████▎ | 5388/12384 [11:25:57<14:48:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 44%|████▎ | 5389/12384 [11:25:57<14:49:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 44%|████▎ | 5389/12384 [11:26:05<14:49:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 2: 44%|████▎ | 5390/12384 [11:26:05<14:48:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 2: 44%|████▎ | 5390/12384 [11:26:13<14:48:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.78s]
Epoch 2: 44%|████▎ | 5391/12384 [11:26:13<14:59:25, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.78s]
Epoch 2: 44%|████▎ | 5391/12384 [11:26:20<14:59:25, 7.72s/it, loss=0.0003, acc=0.9983, iter_time=8.29s]
Epoch 2: 44%|████▎ | 5392/12384 [11:26:20<14:55:31, 7.68s/it, loss=0.0003, acc=0.9983, iter_time=8.29s]
Epoch 2: 44%|████▎ | 5392/12384 [11:26:28<14:55:31, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=3.93s]
Epoch 2: 44%|████▎ | 5393/12384 [11:26:28<14:54:02, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=3.93s]
Epoch 2: 44%|████▎ | 5393/12384 [11:26:35<14:54:02, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.94s]
Epoch 2: 44%|████▎ | 5394/12384 [11:26:35<14:51:56, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.94s]
Epoch 2: 44%|████▎ | 5394/12384 [11:26:43<14:51:56, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 2: 44%|████▎ | 5395/12384 [11:26:43<14:52:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 2: 44%|████▎ | 5395/12384 [11:26:51<14:52:19, 7.66s/it, loss=0.0001, acc=0.9998, iter_time=6.37s]
Epoch 2: 44%|████▎ | 5396/12384 [11:26:51<14:51:33, 7.66s/it, loss=0.0001, acc=0.9998, iter_time=6.37s]
Epoch 2: 44%|████▎ | 5396/12384 [11:26:58<14:51:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 2: 44%|████▎ | 5397/12384 [11:26:58<14:51:43, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 2: 44%|████▎ | 5397/12384 [11:27:06<14:51:43, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 44%|████▎ | 5398/12384 [11:27:06<14:49:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 44%|████▎ | 5398/12384 [11:27:14<14:49:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 44%|████▎ | 5399/12384 [11:27:14<14:51:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 44%|████▎ | 5399/12384 [11:27:21<14:51:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 44%|████▎ | 5400/12384 [11:27:21<14:50:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 44%|████▎ | 5400/12384 [11:27:29<14:50:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 44%|████▎ | 5401/12384 [11:27:29<14:49:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 44%|████▎ | 5401/12384 [11:27:37<14:49:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 44%|████▎ | 5402/12384 [11:27:37<14:50:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 44%|████▎ | 5402/12384 [11:27:44<14:50:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 2: 44%|████▎ | 5403/12384 [11:27:44<14:50:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 2: 44%|████▎ | 5403/12384 [11:27:52<14:50:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.86s]
Epoch 2: 44%|████▎ | 5404/12384 [11:27:52<14:50:32, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.86s]
Epoch 2: 44%|████▎ | 5404/12384 [11:28:00<14:50:32, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.05s]
Epoch 2: 44%|████▎ | 5405/12384 [11:28:00<14:52:17, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.05s]
Epoch 2: 44%|████▎ | 5405/12384 [11:28:07<14:52:17, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=10.30s]
Epoch 2: 44%|████▎ | 5406/12384 [11:28:07<14:51:24, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=10.30s]
Epoch 2: 44%|████▎ | 5406/12384 [11:28:15<14:51:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 44%|████▎ | 5407/12384 [11:28:15<14:49:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 44%|████▎ | 5407/12384 [11:28:22<14:49:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 2: 44%|████▎ | 5408/12384 [11:28:22<14:46:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 2: 44%|████▎ | 5408/12384 [11:28:30<14:46:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 44%|████▎ | 5409/12384 [11:28:30<14:45:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 44%|████▎ | 5409/12384 [11:28:38<14:45:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 2: 44%|████▎ | 5410/12384 [11:28:38<14:47:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 2: 44%|████▎ | 5410/12384 [11:28:45<14:47:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 2: 44%|████▎ | 5411/12384 [11:28:45<14:46:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 2: 44%|████▎ | 5411/12384 [11:28:53<14:46:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 2: 44%|████▎ | 5412/12384 [11:28:53<14:45:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 2: 44%|████▎ | 5412/12384 [11:29:01<14:45:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 2: 44%|████▎ | 5413/12384 [11:29:01<14:45:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 2: 44%|████▎ | 5413/12384 [11:29:08<14:45:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 2: 44%|████▎ | 5414/12384 [11:29:08<14:46:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 2: 44%|████▎ | 5414/12384 [11:29:16<14:46:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 2: 44%|████▎ | 5415/12384 [11:29:16<14:47:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 2: 44%|████▎ | 5415/12384 [11:29:24<14:47:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 44%|████▎ | 5416/12384 [11:29:24<14:46:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 44%|████▎ | 5416/12384 [11:29:31<14:46:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 44%|████▎ | 5417/12384 [11:29:31<14:54:43, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 44%|████▎ | 5417/12384 [11:29:39<14:54:43, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 44%|████▍ | 5418/12384 [11:29:39<14:54:04, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 44%|████▍ | 5418/12384 [11:29:47<14:54:04, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 2: 44%|████▍ | 5419/12384 [11:29:47<14:51:27, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 2: 44%|████▍ | 5419/12384 [11:29:54<14:51:27, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.98s]
Epoch 2: 44%|████▍ | 5420/12384 [11:29:54<14:51:18, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.98s]
Epoch 2: 44%|████▍ | 5420/12384 [11:30:02<14:51:18, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 44%|████▍ | 5421/12384 [11:30:02<14:48:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 44%|████▍ | 5421/12384 [11:30:10<14:48:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 2: 44%|████▍ | 5422/12384 [11:30:10<14:47:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 2: 44%|████▍ | 5422/12384 [11:30:17<14:47:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.46s]
Epoch 2: 44%|████▍ | 5423/12384 [11:30:17<14:45:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.46s]
Epoch 2: 44%|████▍ | 5423/12384 [11:30:25<14:45:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 44%|████▍ | 5424/12384 [11:30:25<14:45:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 44%|████▍ | 5424/12384 [11:30:32<14:45:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.24s]
Epoch 2: 44%|████▍ | 5425/12384 [11:30:32<14:44:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.24s]
Epoch 2: 44%|████▍ | 5425/12384 [11:30:40<14:44:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=12.04s]
Epoch 2: 44%|████▍ | 5426/12384 [11:30:40<14:43:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=12.04s]
Epoch 2: 44%|████▍ | 5426/12384 [11:30:48<14:43:31, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 2: 44%|████▍ | 5427/12384 [11:30:48<14:43:32, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 2: 44%|████▍ | 5427/12384 [11:30:55<14:43:32, 7.62s/it, loss=0.0002, acc=0.9982, iter_time=7.64s]
Epoch 2: 44%|████▍ | 5428/12384 [11:30:55<14:42:47, 7.61s/it, loss=0.0002, acc=0.9982, iter_time=7.64s]
Epoch 2: 44%|████▍ | 5428/12384 [11:31:03<14:42:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 44%|████▍ | 5429/12384 [11:31:03<14:42:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 44%|████▍ | 5429/12384 [11:31:11<14:42:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 44%|████▍ | 5430/12384 [11:31:11<14:43:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 44%|████▍ | 5430/12384 [11:31:18<14:43:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 2: 44%|████▍ | 5431/12384 [11:31:18<14:44:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 2: 44%|████▍ | 5431/12384 [11:31:26<14:44:57, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.05s]
Epoch 2: 44%|████▍ | 5432/12384 [11:31:26<14:43:56, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.05s]
Epoch 2: 44%|████▍ | 5432/12384 [11:31:33<14:43:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 44%|████▍ | 5433/12384 [11:31:33<14:43:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 44%|████▍ | 5433/12384 [11:31:41<14:43:16, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=6.42s]
Epoch 2: 44%|████▍ | 5434/12384 [11:31:41<14:42:01, 7.61s/it, loss=0.0003, acc=1.0000, iter_time=6.42s]
Epoch 2: 44%|████▍ | 5434/12384 [11:31:49<14:42:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 2: 44%|████▍ | 5435/12384 [11:31:49<14:42:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 2: 44%|████▍ | 5435/12384 [11:31:56<14:42:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 2: 44%|████▍ | 5436/12384 [11:31:56<14:42:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 2: 44%|████▍ | 5436/12384 [11:32:04<14:42:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 2: 44%|████▍ | 5437/12384 [11:32:04<14:42:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 2: 44%|████▍ | 5437/12384 [11:32:12<14:42:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 44%|████▍ | 5438/12384 [11:32:12<14:42:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 44%|████▍ | 5438/12384 [11:32:19<14:42:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 2: 44%|████▍ | 5439/12384 [11:32:19<14:42:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 2: 44%|████▍ | 5439/12384 [11:32:27<14:42:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.08s]
Epoch 2: 44%|████▍ | 5440/12384 [11:32:27<14:45:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.08s]
Epoch 2: 44%|████▍ | 5440/12384 [11:32:34<14:45:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 2: 44%|████▍ | 5441/12384 [11:32:34<14:43:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 2: 44%|████▍ | 5441/12384 [11:32:42<14:43:19, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.48s]
Epoch 2: 44%|████▍ | 5442/12384 [11:32:42<14:42:24, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.48s]
Epoch 2: 44%|████▍ | 5442/12384 [11:32:50<14:42:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 2: 44%|████▍ | 5443/12384 [11:32:50<14:53:16, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 2: 44%|████▍ | 5443/12384 [11:32:58<14:53:16, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.77s]
Epoch 2: 44%|████▍ | 5444/12384 [11:32:58<14:49:19, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.77s]
Epoch 2: 44%|████▍ | 5444/12384 [11:33:05<14:49:19, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 2: 44%|████▍ | 5445/12384 [11:33:05<14:52:31, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 2: 44%|████▍ | 5445/12384 [11:33:13<14:52:31, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.24s]
Epoch 2: 44%|████▍ | 5446/12384 [11:33:13<14:48:38, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.24s]
Epoch 2: 44%|████▍ | 5446/12384 [11:33:21<14:48:38, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 2: 44%|████▍ | 5447/12384 [11:33:21<14:46:06, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 2: 44%|████▍ | 5447/12384 [11:33:28<14:46:06, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 2: 44%|████▍ | 5448/12384 [11:33:28<14:47:41, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 2: 44%|████▍ | 5448/12384 [11:33:36<14:47:41, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 44%|████▍ | 5449/12384 [11:33:36<14:45:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 44%|████▍ | 5449/12384 [11:33:44<14:45:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 44%|████▍ | 5450/12384 [11:33:44<14:43:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 44%|████▍ | 5450/12384 [11:33:51<14:43:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 2: 44%|████▍ | 5451/12384 [11:33:51<14:43:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 2: 44%|████▍ | 5451/12384 [11:33:59<14:43:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 2: 44%|████▍ | 5452/12384 [11:33:59<14:42:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 2: 44%|████▍ | 5452/12384 [11:34:06<14:42:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.17s]
Epoch 2: 44%|████▍ | 5453/12384 [11:34:06<14:41:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.17s]
Epoch 2: 44%|████▍ | 5453/12384 [11:34:14<14:41:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 2: 44%|████▍ | 5454/12384 [11:34:14<14:44:37, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 2: 44%|████▍ | 5454/12384 [11:34:22<14:44:37, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.66s]
Epoch 2: 44%|████▍ | 5455/12384 [11:34:22<14:42:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.66s]
Epoch 2: 44%|████▍ | 5455/12384 [11:34:29<14:42:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 44%|████▍ | 5456/12384 [11:34:29<14:40:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 44%|████▍ | 5456/12384 [11:34:37<14:40:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 2: 44%|████▍ | 5457/12384 [11:34:37<14:40:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 2: 44%|████▍ | 5457/12384 [11:34:45<14:40:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 2: 44%|████▍ | 5458/12384 [11:34:45<14:39:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 2: 44%|████▍ | 5458/12384 [11:34:52<14:39:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.33s]
Epoch 2: 44%|████▍ | 5459/12384 [11:34:52<14:38:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.33s]
Epoch 2: 44%|████▍ | 5459/12384 [11:35:00<14:38:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 44%|████▍ | 5460/12384 [11:35:00<14:39:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 44%|████▍ | 5460/12384 [11:35:07<14:39:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 2: 44%|████▍ | 5461/12384 [11:35:07<14:40:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 2: 44%|████▍ | 5461/12384 [11:35:15<14:40:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 2: 44%|████▍ | 5462/12384 [11:35:15<14:41:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 2: 44%|████▍ | 5462/12384 [11:35:23<14:41:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 44%|████▍ | 5463/12384 [11:35:23<14:41:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 44%|████▍ | 5463/12384 [11:35:30<14:41:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 44%|████▍ | 5464/12384 [11:35:30<14:42:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 44%|████▍ | 5464/12384 [11:35:38<14:42:26, 7.65s/it, loss=0.0001, acc=0.9999, iter_time=7.65s]
Epoch 2: 44%|████▍ | 5465/12384 [11:35:38<14:40:44, 7.64s/it, loss=0.0001, acc=0.9999, iter_time=7.65s]
Epoch 2: 44%|████▍ | 5465/12384 [11:35:46<14:40:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 44%|████▍ | 5466/12384 [11:35:46<14:39:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 44%|████▍ | 5466/12384 [11:35:53<14:39:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 44%|████▍ | 5467/12384 [11:35:53<14:38:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 44%|████▍ | 5467/12384 [11:36:01<14:38:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 44%|████▍ | 5468/12384 [11:36:01<14:38:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 44%|████▍ | 5468/12384 [11:36:09<14:38:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 44%|████▍ | 5469/12384 [11:36:09<14:49:57, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 44%|████▍ | 5469/12384 [11:36:17<14:49:57, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=3.70s]
Epoch 2: 44%|████▍ | 5470/12384 [11:36:17<14:47:09, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=3.70s]
Epoch 2: 44%|████▍ | 5470/12384 [11:36:24<14:47:09, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.62s]
Epoch 2: 44%|████▍ | 5471/12384 [11:36:24<14:43:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.62s]
Epoch 2: 44%|████▍ | 5471/12384 [11:36:32<14:43:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.20s]
Epoch 2: 44%|████▍ | 5472/12384 [11:36:32<14:41:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.20s]
Epoch 2: 44%|████▍ | 5472/12384 [11:36:39<14:41:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.16s]
Epoch 2: 44%|████▍ | 5473/12384 [11:36:39<14:41:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.16s]
Epoch 2: 44%|████▍ | 5473/12384 [11:36:47<14:41:24, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.74s]
Epoch 2: 44%|████▍ | 5474/12384 [11:36:47<14:39:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.74s]
Epoch 2: 44%|████▍ | 5474/12384 [11:36:55<14:39:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.60s]
Epoch 2: 44%|████▍ | 5475/12384 [11:36:55<14:40:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.60s]
Epoch 2: 44%|████▍ | 5475/12384 [11:37:02<14:40:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 44%|████▍ | 5476/12384 [11:37:02<14:40:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 44%|████▍ | 5476/12384 [11:37:10<14:40:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 44%|████▍ | 5477/12384 [11:37:10<14:39:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 44%|████▍ | 5477/12384 [11:37:18<14:39:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.57s]
Epoch 2: 44%|████▍ | 5478/12384 [11:37:18<14:38:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.57s]
Epoch 2: 44%|████▍ | 5478/12384 [11:37:25<14:38:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 2: 44%|████▍ | 5479/12384 [11:37:25<14:37:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 2: 44%|████▍ | 5479/12384 [11:37:33<14:37:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 2: 44%|████▍ | 5480/12384 [11:37:33<14:38:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 2: 44%|████▍ | 5480/12384 [11:37:41<14:38:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 44%|████▍ | 5481/12384 [11:37:41<14:41:04, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 44%|████▍ | 5481/12384 [11:37:48<14:41:04, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 2: 44%|████▍ | 5482/12384 [11:37:48<14:43:27, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 2: 44%|████▍ | 5482/12384 [11:37:56<14:43:27, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 44%|████▍ | 5483/12384 [11:37:56<14:41:57, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 44%|████▍ | 5483/12384 [11:38:03<14:41:57, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 44%|████▍ | 5484/12384 [11:38:03<14:39:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 44%|████▍ | 5484/12384 [11:38:11<14:39:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 44%|████▍ | 5485/12384 [11:38:11<14:37:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 44%|████▍ | 5485/12384 [11:38:19<14:37:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 44%|████▍ | 5486/12384 [11:38:19<14:36:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 44%|████▍ | 5486/12384 [11:38:26<14:36:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 2: 44%|████▍ | 5487/12384 [11:38:26<14:36:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 2: 44%|████▍ | 5487/12384 [11:38:34<14:36:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 44%|████▍ | 5488/12384 [11:38:34<14:35:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 44%|████▍ | 5488/12384 [11:38:42<14:35:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 44%|████▍ | 5489/12384 [11:38:42<14:35:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 44%|████▍ | 5489/12384 [11:38:49<14:35:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 44%|████▍ | 5490/12384 [11:38:49<14:35:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 44%|████▍ | 5490/12384 [11:38:57<14:35:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 44%|████▍ | 5491/12384 [11:38:57<14:34:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 44%|████▍ | 5491/12384 [11:39:04<14:34:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 44%|████▍ | 5492/12384 [11:39:04<14:34:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 44%|████▍ | 5492/12384 [11:39:12<14:34:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 44%|████▍ | 5493/12384 [11:39:12<14:36:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 44%|████▍ | 5493/12384 [11:39:20<14:36:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 2: 44%|████▍ | 5494/12384 [11:39:20<14:35:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 2: 44%|████▍ | 5494/12384 [11:39:27<14:35:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 2: 44%|████▍ | 5495/12384 [11:39:27<14:35:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 2: 44%|████▍ | 5495/12384 [11:39:35<14:35:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 2: 44%|████▍ | 5496/12384 [11:39:35<14:45:42, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 2: 44%|████▍ | 5496/12384 [11:39:43<14:45:42, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.46s]
Epoch 2: 44%|████▍ | 5497/12384 [11:39:43<14:42:30, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.46s]
Epoch 2: 44%|████▍ | 5497/12384 [11:39:50<14:42:30, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 44%|████▍ | 5498/12384 [11:39:50<14:39:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 44%|████▍ | 5498/12384 [11:39:58<14:39:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 44%|████▍ | 5499/12384 [11:39:58<14:39:48, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 44%|████▍ | 5499/12384 [11:40:06<14:39:48, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.58s]
Epoch 2: 44%|████▍ | 5500/12384 [11:40:06<14:37:25, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.58s]
Epoch 2: 44%|████▍ | 5500/12384 [11:40:13<14:37:25, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 2: 44%|████▍ | 5501/12384 [11:40:13<14:36:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.73s]
Epoch 2: 44%|████▍ | 5501/12384 [11:40:21<14:36:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.25s]
Epoch 2: 44%|████▍ | 5502/12384 [11:40:21<14:35:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.25s]
Epoch 2: 44%|████▍ | 5502/12384 [11:40:29<14:35:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 2: 44%|████▍ | 5503/12384 [11:40:29<14:34:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 2: 44%|████▍ | 5503/12384 [11:40:36<14:34:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 44%|████▍ | 5504/12384 [11:40:36<14:33:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 44%|████▍ | 5504/12384 [11:40:44<14:33:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.63s]
Epoch 2: 44%|████▍ | 5505/12384 [11:40:44<14:32:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.63s]
Epoch 2: 44%|████▍ | 5505/12384 [11:40:51<14:32:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.61s]
Epoch 2: 44%|████▍ | 5506/12384 [11:40:51<14:32:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.61s]
Epoch 2: 44%|████▍ | 5506/12384 [11:40:59<14:32:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 2: 44%|████▍ | 5507/12384 [11:40:59<14:32:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 2: 44%|████▍ | 5507/12384 [11:41:07<14:32:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 2: 44%|████▍ | 5508/12384 [11:41:07<14:32:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 2: 44%|████▍ | 5508/12384 [11:41:14<14:32:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 2: 44%|████▍ | 5509/12384 [11:41:14<14:32:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 2: 44%|████▍ | 5509/12384 [11:41:22<14:32:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.64s]
Epoch 2: 44%|████▍ | 5510/12384 [11:41:22<14:32:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.64s]
Epoch 2: 44%|████▍ | 5510/12384 [11:41:29<14:32:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.61s]
Epoch 2: 45%|████▍ | 5511/12384 [11:41:29<14:32:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.61s]
Epoch 2: 45%|████▍ | 5511/12384 [11:41:37<14:32:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 45%|████▍ | 5512/12384 [11:41:37<14:32:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 45%|████▍ | 5512/12384 [11:41:45<14:32:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 2: 45%|████▍ | 5513/12384 [11:41:45<14:33:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 2: 45%|████▍ | 5513/12384 [11:41:52<14:33:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.45s]
Epoch 2: 45%|████▍ | 5514/12384 [11:41:52<14:32:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.45s]
Epoch 2: 45%|████▍ | 5514/12384 [11:42:00<14:32:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 45%|████▍ | 5515/12384 [11:42:00<14:31:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 45%|████▍ | 5515/12384 [11:42:08<14:31:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 45%|████▍ | 5516/12384 [11:42:08<14:31:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 45%|████▍ | 5516/12384 [11:42:15<14:31:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 45%|████▍ | 5517/12384 [11:42:15<14:31:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 45%|████▍ | 5517/12384 [11:42:23<14:31:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 45%|████▍ | 5518/12384 [11:42:23<14:31:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 45%|████▍ | 5518/12384 [11:42:30<14:31:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 45%|████▍ | 5519/12384 [11:42:30<14:32:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 45%|████▍ | 5519/12384 [11:42:39<14:32:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.00s]
Epoch 2: 45%|████▍ | 5520/12384 [11:42:39<15:05:34, 7.92s/it, loss=0.0000, acc=1.0000, iter_time=9.00s]
Epoch 2: 45%|████▍ | 5520/12384 [11:42:47<15:05:34, 7.92s/it, loss=0.0000, acc=1.0000, iter_time=6.92s]
Epoch 2: 45%|████▍ | 5521/12384 [11:42:47<14:55:53, 7.83s/it, loss=0.0000, acc=1.0000, iter_time=6.92s]
Epoch 2: 45%|████▍ | 5521/12384 [11:42:55<14:55:53, 7.83s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 45%|████▍ | 5522/12384 [11:42:55<15:03:32, 7.90s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 45%|████▍ | 5522/12384 [11:43:02<15:03:32, 7.90s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 45%|████▍ | 5523/12384 [11:43:02<14:53:26, 7.81s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 45%|████▍ | 5523/12384 [11:43:10<14:53:26, 7.81s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 2: 45%|████▍ | 5524/12384 [11:43:10<14:48:00, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 2: 45%|████▍ | 5524/12384 [11:43:18<14:48:00, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 2: 45%|████▍ | 5525/12384 [11:43:18<14:45:17, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 2: 45%|████▍ | 5525/12384 [11:43:25<14:45:17, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 2: 45%|████▍ | 5526/12384 [11:43:25<14:40:52, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 2: 45%|████▍ | 5526/12384 [11:43:33<14:40:52, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 45%|████▍ | 5527/12384 [11:43:33<14:38:30, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 45%|████▍ | 5527/12384 [11:43:41<14:38:30, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 45%|████▍ | 5528/12384 [11:43:41<14:37:59, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 45%|████▍ | 5528/12384 [11:43:48<14:37:59, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 45%|████▍ | 5529/12384 [11:43:48<14:36:30, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 45%|████▍ | 5529/12384 [11:43:56<14:36:30, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.12s]
Epoch 2: 45%|████▍ | 5530/12384 [11:43:56<14:36:47, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.12s]
Epoch 2: 45%|████▍ | 5530/12384 [11:44:04<14:36:47, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=8.97s]
Epoch 2: 45%|████▍ | 5531/12384 [11:44:04<14:35:23, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=8.97s]
Epoch 2: 45%|████▍ | 5531/12384 [11:44:11<14:35:23, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.28s]
Epoch 2: 45%|████▍ | 5532/12384 [11:44:11<14:33:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.28s]
Epoch 2: 45%|████▍ | 5532/12384 [11:44:19<14:33:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.76s]
Epoch 2: 45%|████▍ | 5533/12384 [11:44:19<14:31:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.76s]
Epoch 2: 45%|████▍ | 5533/12384 [11:44:26<14:31:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 45%|████▍ | 5534/12384 [11:44:26<14:31:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 45%|████▍ | 5534/12384 [11:44:34<14:31:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 2: 45%|████▍ | 5535/12384 [11:44:34<14:30:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 2: 45%|████▍ | 5535/12384 [11:44:42<14:30:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 45%|████▍ | 5536/12384 [11:44:42<14:29:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 45%|████▍ | 5536/12384 [11:44:49<14:29:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.85s]
Epoch 2: 45%|████▍ | 5537/12384 [11:44:49<14:28:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.85s]
Epoch 2: 45%|████▍ | 5537/12384 [11:44:57<14:28:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.41s]
Epoch 2: 45%|████▍ | 5538/12384 [11:44:57<14:28:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.41s]
Epoch 2: 45%|████▍ | 5538/12384 [11:45:04<14:28:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 2: 45%|████▍ | 5539/12384 [11:45:04<14:29:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 2: 45%|████▍ | 5539/12384 [11:45:12<14:29:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.40s]
Epoch 2: 45%|████▍ | 5540/12384 [11:45:12<14:28:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.40s]
Epoch 2: 45%|████▍ | 5540/12384 [11:45:20<14:28:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.11s]
Epoch 2: 45%|████▍ | 5541/12384 [11:45:20<14:28:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.11s]
Epoch 2: 45%|████▍ | 5541/12384 [11:45:27<14:28:15, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 2: 45%|████▍ | 5542/12384 [11:45:27<14:31:58, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 2: 45%|████▍ | 5542/12384 [11:45:35<14:31:58, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.38s]
Epoch 2: 45%|████▍ | 5543/12384 [11:45:35<14:29:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.38s]
Epoch 2: 45%|████▍ | 5543/12384 [11:45:43<14:29:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.30s]
Epoch 2: 45%|████▍ | 5544/12384 [11:45:43<14:28:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.30s]
Epoch 2: 45%|████▍ | 5544/12384 [11:45:50<14:28:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 45%|████▍ | 5545/12384 [11:45:50<14:28:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 45%|████▍ | 5545/12384 [11:45:58<14:28:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 45%|████▍ | 5546/12384 [11:45:58<14:27:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 45%|████▍ | 5546/12384 [11:46:05<14:27:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 45%|████▍ | 5547/12384 [11:46:05<14:28:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 45%|████▍ | 5547/12384 [11:46:13<14:28:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 45%|████▍ | 5548/12384 [11:46:13<14:29:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 45%|████▍ | 5548/12384 [11:46:21<14:29:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 45%|████▍ | 5549/12384 [11:46:21<14:39:23, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 45%|████▍ | 5549/12384 [11:46:29<14:39:23, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 45%|████▍ | 5550/12384 [11:46:29<14:35:21, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 45%|████▍ | 5550/12384 [11:46:36<14:35:21, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 2: 45%|████▍ | 5551/12384 [11:46:36<14:35:23, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 2: 45%|████▍ | 5551/12384 [11:46:44<14:35:23, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.67s]
Epoch 2: 45%|████▍ | 5552/12384 [11:46:44<14:43:37, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=8.67s]
Epoch 2: 45%|████▍ | 5552/12384 [11:46:52<14:43:37, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 45%|████▍ | 5553/12384 [11:46:52<14:37:59, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 45%|████▍ | 5553/12384 [11:46:59<14:37:59, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 45%|████▍ | 5554/12384 [11:46:59<14:34:30, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 45%|████▍ | 5554/12384 [11:47:07<14:34:30, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.50s]
Epoch 2: 45%|████▍ | 5555/12384 [11:47:07<14:31:47, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.50s]
Epoch 2: 45%|████▍ | 5555/12384 [11:47:15<14:31:47, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 2: 45%|████▍ | 5556/12384 [11:47:15<14:29:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 2: 45%|████▍ | 5556/12384 [11:47:22<14:29:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.66s]
Epoch 2: 45%|████▍ | 5557/12384 [11:47:22<14:29:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.66s]
Epoch 2: 45%|████▍ | 5557/12384 [11:47:30<14:29:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.60s]
Epoch 2: 45%|████▍ | 5558/12384 [11:47:30<14:30:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.60s]
Epoch 2: 45%|████▍ | 5558/12384 [11:47:38<14:30:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 2: 45%|████▍ | 5559/12384 [11:47:38<14:29:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 2: 45%|████▍ | 5559/12384 [11:47:45<14:29:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.53s]
Epoch 2: 45%|████▍ | 5560/12384 [11:47:45<14:28:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.53s]
Epoch 2: 45%|████▍ | 5560/12384 [11:47:53<14:28:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.92s]
Epoch 2: 45%|████▍ | 5561/12384 [11:47:53<14:26:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.92s]
Epoch 2: 45%|████▍ | 5561/12384 [11:48:00<14:26:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 2: 45%|████▍ | 5562/12384 [11:48:00<14:25:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 2: 45%|████▍ | 5562/12384 [11:48:08<14:25:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 2: 45%|████▍ | 5563/12384 [11:48:08<14:25:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 2: 45%|████▍ | 5563/12384 [11:48:16<14:25:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 2: 45%|████▍ | 5564/12384 [11:48:16<14:25:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 2: 45%|████▍ | 5564/12384 [11:48:23<14:25:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 2: 45%|████▍ | 5565/12384 [11:48:23<14:25:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 2: 45%|████▍ | 5565/12384 [11:48:31<14:25:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.58s]
Epoch 2: 45%|████▍ | 5566/12384 [11:48:31<14:25:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.58s]
Epoch 2: 45%|████▍ | 5566/12384 [11:48:38<14:25:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.43s]
Epoch 2: 45%|████▍ | 5567/12384 [11:48:38<14:25:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.43s]
Epoch 2: 45%|████▍ | 5567/12384 [11:48:46<14:25:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 45%|████▍ | 5568/12384 [11:48:46<14:26:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 45%|████▍ | 5568/12384 [11:48:54<14:26:17, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.96s]
Epoch 2: 45%|████▍ | 5569/12384 [11:48:54<14:25:49, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.96s]
Epoch 2: 45%|████▍ | 5569/12384 [11:49:01<14:25:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 45%|████▍ | 5570/12384 [11:49:01<14:25:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 45%|████▍ | 5570/12384 [11:49:09<14:25:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 2: 45%|████▍ | 5571/12384 [11:49:09<14:24:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 2: 45%|████▍ | 5571/12384 [11:49:17<14:24:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 2: 45%|████▍ | 5572/12384 [11:49:17<14:25:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 2: 45%|████▍ | 5572/12384 [11:49:24<14:25:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 45%|████▌ | 5573/12384 [11:49:24<14:27:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 45%|████▌ | 5573/12384 [11:49:33<14:27:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.68s]
Epoch 2: 45%|████▌ | 5574/12384 [11:49:33<15:03:06, 7.96s/it, loss=0.0000, acc=1.0000, iter_time=8.68s]
Epoch 2: 45%|████▌ | 5574/12384 [11:49:41<15:03:06, 7.96s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 2: 45%|████▌ | 5575/12384 [11:49:41<15:06:24, 7.99s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 2: 45%|████▌ | 5575/12384 [11:49:49<15:06:24, 7.99s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 45%|████▌ | 5576/12384 [11:49:49<14:56:11, 7.90s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 45%|████▌ | 5576/12384 [11:49:56<14:56:11, 7.90s/it, loss=0.0000, acc=1.0000, iter_time=7.77s]
Epoch 2: 45%|████▌ | 5577/12384 [11:49:56<14:50:13, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=7.77s]
Epoch 2: 45%|████▌ | 5577/12384 [11:50:04<14:50:13, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 2: 45%|████▌ | 5578/12384 [11:50:04<14:44:44, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 2: 45%|████▌ | 5578/12384 [11:50:12<14:44:44, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 2: 45%|████▌ | 5579/12384 [11:50:12<14:40:33, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 2: 45%|████▌ | 5579/12384 [11:50:20<14:40:33, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=6.46s]
Epoch 2: 45%|████▌ | 5580/12384 [11:50:20<14:38:40, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=6.46s]
Epoch 2: 45%|████▌ | 5580/12384 [11:50:27<14:38:40, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 45%|████▌ | 5581/12384 [11:50:27<14:36:15, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 45%|████▌ | 5581/12384 [11:50:35<14:36:15, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=10.91s]
Epoch 2: 45%|████▌ | 5582/12384 [11:50:35<14:34:24, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.91s]
Epoch 2: 45%|████▌ | 5582/12384 [11:50:43<14:34:24, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 2: 45%|████▌ | 5583/12384 [11:50:43<14:33:53, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 2: 45%|████▌ | 5583/12384 [11:50:50<14:33:53, 7.71s/it, loss=0.0002, acc=0.9987, iter_time=9.09s]
Epoch 2: 45%|████▌ | 5584/12384 [11:50:50<14:32:08, 7.70s/it, loss=0.0002, acc=0.9987, iter_time=9.09s]
Epoch 2: 45%|████▌ | 5584/12384 [11:50:58<14:32:08, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 45%|████▌ | 5585/12384 [11:50:58<14:31:24, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 45%|████▌ | 5585/12384 [11:51:06<14:31:24, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 45%|████▌ | 5586/12384 [11:51:06<14:30:49, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 45%|████▌ | 5586/12384 [11:51:13<14:30:49, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 45%|████▌ | 5587/12384 [11:51:13<14:30:34, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 45%|████▌ | 5587/12384 [11:51:21<14:30:34, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 45%|████▌ | 5588/12384 [11:51:21<14:30:40, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 45%|████▌ | 5588/12384 [11:51:30<14:30:40, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.87s]
Epoch 2: 45%|████▌ | 5589/12384 [11:51:30<15:11:30, 8.05s/it, loss=0.0000, acc=1.0000, iter_time=8.87s]
Epoch 2: 45%|████▌ | 5589/12384 [11:51:38<15:11:30, 8.05s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 2: 45%|████▌ | 5590/12384 [11:51:38<14:58:35, 7.94s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 2: 45%|████▌ | 5590/12384 [11:51:45<14:58:35, 7.94s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 2: 45%|████▌ | 5591/12384 [11:51:45<14:50:22, 7.86s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 2: 45%|████▌ | 5591/12384 [11:51:53<14:50:22, 7.86s/it, loss=0.0001, acc=0.9986, iter_time=10.95s]
Epoch 2: 45%|████▌ | 5592/12384 [11:51:53<14:43:44, 7.81s/it, loss=0.0001, acc=0.9986, iter_time=10.95s]
Epoch 2: 45%|████▌ | 5592/12384 [11:52:01<14:43:44, 7.81s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 2: 45%|████▌ | 5593/12384 [11:52:01<14:37:42, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 2: 45%|████▌ | 5593/12384 [11:52:08<14:37:42, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 2: 45%|████▌ | 5594/12384 [11:52:08<14:37:30, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 2: 45%|████▌ | 5594/12384 [11:52:16<14:37:30, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=5.74s]
Epoch 2: 45%|████▌ | 5595/12384 [11:52:16<14:33:47, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.74s]
Epoch 2: 45%|████▌ | 5595/12384 [11:52:24<14:33:47, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 2: 45%|████▌ | 5596/12384 [11:52:24<14:32:05, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.66s]
Epoch 2: 45%|████▌ | 5596/12384 [11:52:31<14:32:05, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.67s]
Epoch 2: 45%|████▌ | 5597/12384 [11:52:31<14:30:10, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.67s]
Epoch 2: 45%|████▌ | 5597/12384 [11:52:39<14:30:10, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.36s]
Epoch 2: 45%|████▌ | 5598/12384 [11:52:39<14:29:33, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.36s]
Epoch 2: 45%|████▌ | 5598/12384 [11:52:47<14:29:33, 7.69s/it, loss=0.0003, acc=0.9978, iter_time=7.34s]
Epoch 2: 45%|████▌ | 5599/12384 [11:52:47<14:30:11, 7.70s/it, loss=0.0003, acc=0.9978, iter_time=7.34s]
Epoch 2: 45%|████▌ | 5599/12384 [11:52:54<14:30:11, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.75s]
Epoch 2: 45%|████▌ | 5600/12384 [11:52:54<14:30:54, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.75s]
Epoch 2: 45%|████▌ | 5600/12384 [11:53:02<14:30:54, 7.70s/it, loss=0.0001, acc=0.9997, iter_time=6.78s]
Epoch 2: 45%|████▌ | 5601/12384 [11:53:02<14:42:19, 7.80s/it, loss=0.0001, acc=0.9997, iter_time=6.78s]
Epoch 2: 45%|████▌ | 5601/12384 [11:53:10<14:42:19, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 2: 45%|████▌ | 5602/12384 [11:53:10<14:37:21, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 2: 45%|████▌ | 5602/12384 [11:53:18<14:37:21, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 45%|████▌ | 5603/12384 [11:53:18<14:34:30, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 45%|████▌ | 5603/12384 [11:53:26<14:34:30, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 2: 45%|████▌ | 5604/12384 [11:53:26<14:50:22, 7.88s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 2: 45%|████▌ | 5604/12384 [11:53:34<14:50:22, 7.88s/it, loss=0.0000, acc=1.0000, iter_time=4.65s]
Epoch 2: 45%|████▌ | 5605/12384 [11:53:34<14:47:20, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=4.65s]
Epoch 2: 45%|████▌ | 5605/12384 [11:53:41<14:47:20, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=10.80s]
Epoch 2: 45%|████▌ | 5606/12384 [11:53:41<14:40:32, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=10.80s]
Epoch 2: 45%|████▌ | 5606/12384 [11:53:49<14:40:32, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 45%|████▌ | 5607/12384 [11:53:49<14:36:32, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 45%|████▌ | 5607/12384 [11:53:57<14:36:32, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 2: 45%|████▌ | 5608/12384 [11:53:57<14:33:32, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 2: 45%|████▌ | 5608/12384 [11:54:05<14:33:32, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 2: 45%|████▌ | 5609/12384 [11:54:05<14:32:28, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 2: 45%|████▌ | 5609/12384 [11:54:12<14:32:28, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=5.59s]
Epoch 2: 45%|████▌ | 5610/12384 [11:54:12<14:30:49, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.59s]
Epoch 2: 45%|████▌ | 5610/12384 [11:54:20<14:30:49, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.33s]
Epoch 2: 45%|████▌ | 5611/12384 [11:54:20<14:30:02, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.33s]
Epoch 2: 45%|████▌ | 5611/12384 [11:54:28<14:30:02, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 45%|████▌ | 5612/12384 [11:54:28<14:29:26, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 45%|████▌ | 5612/12384 [11:54:35<14:29:26, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 45%|████▌ | 5613/12384 [11:54:35<14:29:52, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 45%|████▌ | 5613/12384 [11:54:43<14:29:52, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 2: 45%|████▌ | 5614/12384 [11:54:43<14:29:01, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 2: 45%|████▌ | 5614/12384 [11:54:51<14:29:01, 7.70s/it, loss=0.0001, acc=0.9998, iter_time=6.74s]
Epoch 2: 45%|████▌ | 5615/12384 [11:54:51<14:28:36, 7.70s/it, loss=0.0001, acc=0.9998, iter_time=6.74s]
Epoch 2: 45%|████▌ | 5615/12384 [11:54:58<14:28:36, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 2: 45%|████▌ | 5616/12384 [11:54:58<14:28:31, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 2: 45%|████▌ | 5616/12384 [11:55:06<14:28:31, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 45%|████▌ | 5617/12384 [11:55:06<14:27:40, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 45%|████▌ | 5617/12384 [11:55:14<14:27:40, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 45%|████▌ | 5618/12384 [11:55:14<14:26:52, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 45%|████▌ | 5618/12384 [11:55:21<14:26:52, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 2: 45%|████▌ | 5619/12384 [11:55:21<14:26:03, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 2: 45%|████▌ | 5619/12384 [11:55:29<14:26:03, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 2: 45%|████▌ | 5620/12384 [11:55:29<14:24:57, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 2: 45%|████▌ | 5620/12384 [11:55:37<14:24:57, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 45%|████▌ | 5621/12384 [11:55:37<14:24:00, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 45%|████▌ | 5621/12384 [11:55:44<14:24:00, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 2: 45%|████▌ | 5622/12384 [11:55:44<14:25:00, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 2: 45%|████▌ | 5622/12384 [11:55:52<14:25:00, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.89s]
Epoch 2: 45%|████▌ | 5623/12384 [11:55:52<14:24:21, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.89s]
Epoch 2: 45%|████▌ | 5623/12384 [11:56:00<14:24:21, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.58s]
Epoch 2: 45%|████▌ | 5624/12384 [11:56:00<14:27:04, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.58s]
Epoch 2: 45%|████▌ | 5624/12384 [11:56:08<14:27:04, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 2: 45%|████▌ | 5625/12384 [11:56:08<14:26:34, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 2: 45%|████▌ | 5625/12384 [11:56:15<14:26:34, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 2: 45%|████▌ | 5626/12384 [11:56:15<14:25:05, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 2: 45%|████▌ | 5626/12384 [11:56:23<14:25:05, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.03s]
Epoch 2: 45%|████▌ | 5627/12384 [11:56:23<14:38:44, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=10.03s]
Epoch 2: 45%|████▌ | 5627/12384 [11:56:31<14:38:44, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 45%|████▌ | 5628/12384 [11:56:31<14:35:23, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 45%|████▌ | 5628/12384 [11:56:39<14:35:23, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 2: 45%|████▌ | 5629/12384 [11:56:39<14:31:59, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 2: 45%|████▌ | 5629/12384 [11:56:46<14:31:59, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=6.01s]
Epoch 2: 45%|████▌ | 5630/12384 [11:56:46<14:29:36, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.01s]
Epoch 2: 45%|████▌ | 5630/12384 [11:56:54<14:29:36, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=9.77s]
Epoch 2: 45%|████▌ | 5631/12384 [11:56:54<14:41:42, 7.83s/it, loss=0.0000, acc=1.0000, iter_time=9.77s]
Epoch 2: 45%|████▌ | 5631/12384 [11:57:02<14:41:42, 7.83s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 2: 45%|████▌ | 5632/12384 [11:57:02<14:35:45, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 2: 45%|████▌ | 5632/12384 [11:57:10<14:35:45, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 45%|████▌ | 5633/12384 [11:57:10<14:32:16, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 45%|████▌ | 5633/12384 [11:57:17<14:32:16, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 45%|████▌ | 5634/12384 [11:57:17<14:29:04, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 45%|████▌ | 5634/12384 [11:57:25<14:29:04, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 46%|████▌ | 5635/12384 [11:57:25<14:28:21, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 46%|████▌ | 5635/12384 [11:57:33<14:28:21, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 46%|████▌ | 5636/12384 [11:57:33<14:24:53, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 46%|████▌ | 5636/12384 [11:57:40<14:24:53, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 46%|████▌ | 5637/12384 [11:57:40<14:22:11, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 46%|████▌ | 5637/12384 [11:57:48<14:22:11, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 46%|████▌ | 5638/12384 [11:57:48<14:20:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 46%|████▌ | 5638/12384 [11:57:56<14:20:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 2: 46%|████▌ | 5639/12384 [11:57:56<14:18:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 2: 46%|████▌ | 5639/12384 [11:58:03<14:18:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 2: 46%|████▌ | 5640/12384 [11:58:03<14:18:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 2: 46%|████▌ | 5640/12384 [11:58:11<14:18:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 46%|████▌ | 5641/12384 [11:58:11<14:16:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 46%|████▌ | 5641/12384 [11:58:18<14:16:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 46%|████▌ | 5642/12384 [11:58:18<14:16:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 46%|████▌ | 5642/12384 [11:58:26<14:16:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 2: 46%|████▌ | 5643/12384 [11:58:26<14:16:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 2: 46%|████▌ | 5643/12384 [11:58:34<14:16:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.48s]
Epoch 2: 46%|████▌ | 5644/12384 [11:58:34<14:15:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.48s]
Epoch 2: 46%|████▌ | 5644/12384 [11:58:41<14:15:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 46%|████▌ | 5645/12384 [11:58:41<14:15:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 46%|████▌ | 5645/12384 [11:58:49<14:15:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 46%|████▌ | 5646/12384 [11:58:49<14:14:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 46%|████▌ | 5646/12384 [11:58:56<14:14:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 46%|████▌ | 5647/12384 [11:58:56<14:13:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 46%|████▌ | 5647/12384 [11:59:04<14:13:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 46%|████▌ | 5648/12384 [11:59:04<14:14:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 46%|████▌ | 5648/12384 [11:59:12<14:14:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.26s]
Epoch 2: 46%|████▌ | 5649/12384 [11:59:12<14:13:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.26s]
Epoch 2: 46%|████▌ | 5649/12384 [11:59:19<14:13:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 2: 46%|████▌ | 5650/12384 [11:59:19<14:13:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 2: 46%|████▌ | 5650/12384 [11:59:27<14:13:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 46%|████▌ | 5651/12384 [11:59:27<14:13:17, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 46%|████▌ | 5651/12384 [11:59:34<14:13:17, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 2: 46%|████▌ | 5652/12384 [11:59:34<14:13:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 2: 46%|████▌ | 5652/12384 [11:59:42<14:13:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.90s]
Epoch 2: 46%|████▌ | 5653/12384 [11:59:42<14:22:33, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.90s]
Epoch 2: 46%|████▌ | 5653/12384 [11:59:50<14:22:33, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=11.20s]
Epoch 2: 46%|████▌ | 5654/12384 [11:59:50<14:19:55, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=11.20s]
Epoch 2: 46%|████▌ | 5654/12384 [11:59:58<14:19:55, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 2: 46%|████▌ | 5655/12384 [11:59:58<14:17:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 2: 46%|████▌ | 5655/12384 [12:00:05<14:17:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.20s]
Epoch 2: 46%|████▌ | 5656/12384 [12:00:05<14:17:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.20s]
Epoch 2: 46%|████▌ | 5656/12384 [12:00:13<14:17:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 46%|████▌ | 5657/12384 [12:00:13<14:25:33, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 46%|████▌ | 5657/12384 [12:00:21<14:25:33, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 46%|████▌ | 5658/12384 [12:00:21<14:21:19, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 46%|████▌ | 5658/12384 [12:00:28<14:21:19, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 46%|████▌ | 5659/12384 [12:00:28<14:18:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 46%|████▌ | 5659/12384 [12:00:36<14:18:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 46%|████▌ | 5660/12384 [12:00:36<14:16:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 46%|████▌ | 5660/12384 [12:00:44<14:16:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 46%|████▌ | 5661/12384 [12:00:44<14:15:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 46%|████▌ | 5661/12384 [12:00:51<14:15:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 46%|████▌ | 5662/12384 [12:00:51<14:14:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 46%|████▌ | 5662/12384 [12:00:59<14:14:07, 7.62s/it, loss=0.0002, acc=0.9988, iter_time=7.61s]
Epoch 2: 46%|████▌ | 5663/12384 [12:00:59<14:13:27, 7.62s/it, loss=0.0002, acc=0.9988, iter_time=7.61s]
Epoch 2: 46%|████▌ | 5663/12384 [12:01:06<14:13:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 2: 46%|████▌ | 5664/12384 [12:01:06<14:14:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 2: 46%|████▌ | 5664/12384 [12:01:14<14:14:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 46%|████▌ | 5665/12384 [12:01:14<14:17:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 46%|████▌ | 5665/12384 [12:01:22<14:17:05, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=6.26s]
Epoch 2: 46%|████▌ | 5666/12384 [12:01:22<14:15:35, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=6.26s]
Epoch 2: 46%|████▌ | 5666/12384 [12:01:29<14:15:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.04s]
Epoch 2: 46%|████▌ | 5667/12384 [12:01:29<14:13:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.04s]
Epoch 2: 46%|████▌ | 5667/12384 [12:01:37<14:13:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 46%|████▌ | 5668/12384 [12:01:37<14:12:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 46%|████▌ | 5668/12384 [12:01:45<14:12:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 46%|████▌ | 5669/12384 [12:01:45<14:12:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 46%|████▌ | 5669/12384 [12:01:52<14:12:18, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.36s]
Epoch 2: 46%|████▌ | 5670/12384 [12:01:52<14:12:22, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.36s]
Epoch 2: 46%|████▌ | 5670/12384 [12:02:00<14:12:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 2: 46%|████▌ | 5671/12384 [12:02:00<14:11:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 2: 46%|████▌ | 5671/12384 [12:02:07<14:11:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 46%|████▌ | 5672/12384 [12:02:07<14:10:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 46%|████▌ | 5672/12384 [12:02:15<14:10:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 46%|████▌ | 5673/12384 [12:02:15<14:11:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 46%|████▌ | 5673/12384 [12:02:23<14:11:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 46%|████▌ | 5674/12384 [12:02:23<14:11:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 46%|████▌ | 5674/12384 [12:02:30<14:11:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.85s]
Epoch 2: 46%|████▌ | 5675/12384 [12:02:30<14:11:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.85s]
Epoch 2: 46%|████▌ | 5675/12384 [12:02:38<14:11:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.01s]
Epoch 2: 46%|████▌ | 5676/12384 [12:02:38<14:11:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.01s]
Epoch 2: 46%|████▌ | 5676/12384 [12:02:45<14:11:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 46%|████▌ | 5677/12384 [12:02:45<14:12:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 46%|████▌ | 5677/12384 [12:02:53<14:12:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 46%|████▌ | 5678/12384 [12:02:53<14:10:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 46%|████▌ | 5678/12384 [12:03:01<14:10:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 46%|████▌ | 5679/12384 [12:03:01<14:11:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 46%|████▌ | 5679/12384 [12:03:09<14:11:21, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.06s]
Epoch 2: 46%|████▌ | 5680/12384 [12:03:09<14:21:33, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=8.06s]
Epoch 2: 46%|████▌ | 5680/12384 [12:03:16<14:21:33, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.16s]
Epoch 2: 46%|████▌ | 5681/12384 [12:03:16<14:17:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.16s]
Epoch 2: 46%|████▌ | 5681/12384 [12:03:24<14:17:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 2: 46%|████▌ | 5682/12384 [12:03:24<14:14:57, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 2: 46%|████▌ | 5682/12384 [12:03:32<14:14:57, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 2: 46%|████▌ | 5683/12384 [12:03:32<14:23:20, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 2: 46%|████▌ | 5683/12384 [12:03:39<14:23:20, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 2: 46%|████▌ | 5684/12384 [12:03:39<14:19:50, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 2: 46%|████▌ | 5684/12384 [12:03:47<14:19:50, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 2: 46%|████▌ | 5685/12384 [12:03:47<14:18:46, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 2: 46%|████▌ | 5685/12384 [12:03:55<14:18:46, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 46%|████▌ | 5686/12384 [12:03:55<14:15:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 46%|████▌ | 5686/12384 [12:04:02<14:15:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 2: 46%|████▌ | 5687/12384 [12:04:02<14:14:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 2: 46%|████▌ | 5687/12384 [12:04:10<14:14:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 2: 46%|████▌ | 5688/12384 [12:04:10<14:13:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 2: 46%|████▌ | 5688/12384 [12:04:17<14:13:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 46%|████▌ | 5689/12384 [12:04:17<14:10:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 46%|████▌ | 5689/12384 [12:04:25<14:10:55, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.68s]
Epoch 2: 46%|████▌ | 5690/12384 [12:04:25<14:10:06, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.68s]
Epoch 2: 46%|████▌ | 5690/12384 [12:04:33<14:10:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 2: 46%|████▌ | 5691/12384 [12:04:33<14:10:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 2: 46%|████▌ | 5691/12384 [12:04:40<14:10:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 2: 46%|████▌ | 5692/12384 [12:04:40<14:09:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 2: 46%|████▌ | 5692/12384 [12:04:48<14:09:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 2: 46%|████▌ | 5693/12384 [12:04:48<14:09:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 2: 46%|████▌ | 5693/12384 [12:04:56<14:09:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 2: 46%|████▌ | 5694/12384 [12:04:56<14:09:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 2: 46%|████▌ | 5694/12384 [12:05:03<14:09:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 2: 46%|████▌ | 5695/12384 [12:05:03<14:09:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 2: 46%|████▌ | 5695/12384 [12:05:11<14:09:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 46%|████▌ | 5696/12384 [12:05:11<14:08:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 46%|████▌ | 5696/12384 [12:05:18<14:08:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 46%|████▌ | 5697/12384 [12:05:18<14:07:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 46%|████▌ | 5697/12384 [12:05:26<14:07:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 46%|████▌ | 5698/12384 [12:05:26<14:11:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 46%|████▌ | 5698/12384 [12:05:34<14:11:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 46%|████▌ | 5699/12384 [12:05:34<14:10:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 46%|████▌ | 5699/12384 [12:05:41<14:10:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 46%|████▌ | 5700/12384 [12:05:41<14:09:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 46%|████▌ | 5700/12384 [12:05:49<14:09:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 2: 46%|████▌ | 5701/12384 [12:05:49<14:08:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 2: 46%|████▌ | 5701/12384 [12:05:56<14:08:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 2: 46%|████▌ | 5702/12384 [12:05:56<14:06:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 2: 46%|████▌ | 5702/12384 [12:06:04<14:06:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 46%|████▌ | 5703/12384 [12:06:04<14:09:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 46%|████▌ | 5703/12384 [12:06:12<14:09:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 2: 46%|████▌ | 5704/12384 [12:06:12<14:08:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 2: 46%|████▌ | 5704/12384 [12:06:19<14:08:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.13s]
Epoch 2: 46%|████▌ | 5705/12384 [12:06:19<14:08:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.13s]
Epoch 2: 46%|████▌ | 5705/12384 [12:06:27<14:08:11, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.76s]
Epoch 2: 46%|████▌ | 5706/12384 [12:06:27<14:19:07, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=9.76s]
Epoch 2: 46%|████▌ | 5706/12384 [12:06:35<14:19:07, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 46%|████▌ | 5707/12384 [12:06:35<14:18:18, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 46%|████▌ | 5707/12384 [12:06:43<14:18:18, 7.71s/it, loss=0.0004, acc=0.9991, iter_time=7.62s]
Epoch 2: 46%|████▌ | 5708/12384 [12:06:43<14:14:34, 7.68s/it, loss=0.0004, acc=0.9991, iter_time=7.62s]
Epoch 2: 46%|████▌ | 5708/12384 [12:06:50<14:14:34, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 46%|████▌ | 5709/12384 [12:06:50<14:20:20, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 46%|████▌ | 5709/12384 [12:06:58<14:20:20, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 46%|████▌ | 5710/12384 [12:06:58<14:16:19, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 46%|████▌ | 5710/12384 [12:07:06<14:16:19, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 2: 46%|████▌ | 5711/12384 [12:07:06<14:12:33, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 2: 46%|████▌ | 5711/12384 [12:07:13<14:12:33, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 2: 46%|████▌ | 5712/12384 [12:07:13<14:11:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 2: 46%|████▌ | 5712/12384 [12:07:21<14:11:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 2: 46%|████▌ | 5713/12384 [12:07:21<14:09:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 2: 46%|████▌ | 5713/12384 [12:07:29<14:09:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 2: 46%|████▌ | 5714/12384 [12:07:29<14:09:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 2: 46%|████▌ | 5714/12384 [12:07:36<14:09:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 2: 46%|████▌ | 5715/12384 [12:07:36<14:08:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 2: 46%|████▌ | 5715/12384 [12:07:44<14:08:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.77s]
Epoch 2: 46%|████▌ | 5716/12384 [12:07:44<14:08:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.77s]
Epoch 2: 46%|████▌ | 5716/12384 [12:07:51<14:08:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.68s]
Epoch 2: 46%|████▌ | 5717/12384 [12:07:51<14:07:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.68s]
Epoch 2: 46%|████▌ | 5717/12384 [12:07:59<14:07:43, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 2: 46%|████▌ | 5718/12384 [12:07:59<14:07:15, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 2: 46%|████▌ | 5718/12384 [12:08:07<14:07:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 2: 46%|████▌ | 5719/12384 [12:08:07<14:06:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 2: 46%|████▌ | 5719/12384 [12:08:14<14:06:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.79s]
Epoch 2: 46%|████▌ | 5720/12384 [12:08:14<14:06:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.79s]
Epoch 2: 46%|████▌ | 5720/12384 [12:08:22<14:06:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 2: 46%|████▌ | 5721/12384 [12:08:22<14:06:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 2: 46%|████▌ | 5721/12384 [12:08:29<14:06:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 2: 46%|████▌ | 5722/12384 [12:08:29<14:05:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 2: 46%|████▌ | 5722/12384 [12:08:37<14:05:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 46%|████▌ | 5723/12384 [12:08:37<14:05:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 46%|████▌ | 5723/12384 [12:08:45<14:05:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 46%|████▌ | 5724/12384 [12:08:45<14:05:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 46%|████▌ | 5724/12384 [12:08:52<14:05:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 2: 46%|████▌ | 5725/12384 [12:08:52<14:05:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 2: 46%|████▌ | 5725/12384 [12:09:00<14:05:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.94s]
Epoch 2: 46%|████▌ | 5726/12384 [12:09:00<14:05:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.94s]
Epoch 2: 46%|████▌ | 5726/12384 [12:09:08<14:05:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.95s]
Epoch 2: 46%|████▌ | 5727/12384 [12:09:08<14:04:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.95s]
Epoch 2: 46%|████▌ | 5727/12384 [12:09:15<14:04:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.85s]
Epoch 2: 46%|████▋ | 5728/12384 [12:09:15<14:04:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.85s]
Epoch 2: 46%|████▋ | 5728/12384 [12:09:23<14:04:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 46%|████▋ | 5729/12384 [12:09:23<14:06:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 46%|████▋ | 5729/12384 [12:09:30<14:06:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 46%|████▋ | 5730/12384 [12:09:30<14:06:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 46%|████▋ | 5730/12384 [12:09:38<14:06:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 46%|████▋ | 5731/12384 [12:09:38<14:05:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 46%|████▋ | 5731/12384 [12:09:46<14:05:41, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.04s]
Epoch 2: 46%|████▋ | 5732/12384 [12:09:46<14:11:49, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=8.04s]
Epoch 2: 46%|████▋ | 5732/12384 [12:09:54<14:11:49, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.46s]
Epoch 2: 46%|████▋ | 5733/12384 [12:09:54<14:20:03, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.46s]
Epoch 2: 46%|████▋ | 5733/12384 [12:10:01<14:20:03, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 46%|████▋ | 5734/12384 [12:10:01<14:14:33, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 46%|████▋ | 5734/12384 [12:10:09<14:14:33, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 46%|████▋ | 5735/12384 [12:10:09<14:11:07, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 46%|████▋ | 5735/12384 [12:10:17<14:11:07, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 46%|████▋ | 5736/12384 [12:10:17<14:08:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 46%|████▋ | 5736/12384 [12:10:24<14:08:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 2: 46%|████▋ | 5737/12384 [12:10:24<14:06:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 2: 46%|████▋ | 5737/12384 [12:10:32<14:06:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.88s]
Epoch 2: 46%|████▋ | 5738/12384 [12:10:32<14:04:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.88s]
Epoch 2: 46%|████▋ | 5738/12384 [12:10:39<14:04:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 2: 46%|████▋ | 5739/12384 [12:10:39<14:04:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 2: 46%|████▋ | 5739/12384 [12:10:47<14:04:26, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=6.14s]
Epoch 2: 46%|████▋ | 5740/12384 [12:10:47<14:04:05, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=6.14s]
Epoch 2: 46%|████▋ | 5740/12384 [12:10:55<14:04:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 46%|████▋ | 5741/12384 [12:10:55<14:03:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 46%|████▋ | 5741/12384 [12:11:02<14:03:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 2: 46%|████▋ | 5742/12384 [12:11:02<14:02:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 2: 46%|████▋ | 5742/12384 [12:11:10<14:02:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 46%|████▋ | 5743/12384 [12:11:10<14:02:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 46%|████▋ | 5743/12384 [12:11:18<14:02:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 46%|████▋ | 5744/12384 [12:11:18<14:02:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 46%|████▋ | 5744/12384 [12:11:25<14:02:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.21s]
Epoch 2: 46%|████▋ | 5745/12384 [12:11:25<14:02:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.21s]
Epoch 2: 46%|████▋ | 5745/12384 [12:11:33<14:02:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 2: 46%|████▋ | 5746/12384 [12:11:33<14:02:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 2: 46%|████▋ | 5746/12384 [12:11:40<14:02:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 2: 46%|████▋ | 5747/12384 [12:11:40<14:04:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 2: 46%|████▋ | 5747/12384 [12:11:48<14:04:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 46%|████▋ | 5748/12384 [12:11:48<14:02:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 46%|████▋ | 5748/12384 [12:11:56<14:02:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 2: 46%|████▋ | 5749/12384 [12:11:56<14:01:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 2: 46%|████▋ | 5749/12384 [12:12:03<14:01:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 2: 46%|████▋ | 5750/12384 [12:12:03<14:01:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 2: 46%|████▋ | 5750/12384 [12:12:11<14:01:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 2: 46%|████▋ | 5751/12384 [12:12:11<14:01:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 2: 46%|████▋ | 5751/12384 [12:12:18<14:01:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 2: 46%|████▋ | 5752/12384 [12:12:18<14:00:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 2: 46%|████▋ | 5752/12384 [12:12:26<14:00:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 46%|████▋ | 5753/12384 [12:12:26<13:59:51, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 46%|████▋ | 5753/12384 [12:12:34<13:59:51, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 46%|████▋ | 5754/12384 [12:12:34<14:02:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 46%|████▋ | 5754/12384 [12:12:41<14:02:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 2: 46%|████▋ | 5755/12384 [12:12:41<14:02:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 2: 46%|████▋ | 5755/12384 [12:12:49<14:02:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.21s]
Epoch 2: 46%|████▋ | 5756/12384 [12:12:49<14:01:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.21s]
Epoch 2: 46%|████▋ | 5756/12384 [12:12:57<14:01:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.62s]
Epoch 2: 46%|████▋ | 5757/12384 [12:12:57<14:01:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.62s]
Epoch 2: 46%|████▋ | 5757/12384 [12:13:04<14:01:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 46%|████▋ | 5758/12384 [12:13:04<14:01:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 46%|████▋ | 5758/12384 [12:13:12<14:01:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 47%|████▋ | 5759/12384 [12:13:12<14:09:55, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 47%|████▋ | 5759/12384 [12:13:20<14:09:55, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 2: 47%|████▋ | 5760/12384 [12:13:20<14:08:02, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 2: 47%|████▋ | 5760/12384 [12:13:27<14:08:02, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 47%|████▋ | 5761/12384 [12:13:27<14:04:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 47%|████▋ | 5761/12384 [12:13:35<14:04:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 47%|████▋ | 5762/12384 [12:13:35<14:12:08, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 47%|████▋ | 5762/12384 [12:13:43<14:12:08, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 2: 47%|████▋ | 5763/12384 [12:13:43<14:08:29, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 2: 47%|████▋ | 5763/12384 [12:13:50<14:08:29, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 2: 47%|████▋ | 5764/12384 [12:13:50<14:04:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 2: 47%|████▋ | 5764/12384 [12:13:58<14:04:54, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 2: 47%|████▋ | 5765/12384 [12:13:58<14:04:57, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 2: 47%|████▋ | 5765/12384 [12:14:06<14:04:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 2: 47%|████▋ | 5766/12384 [12:14:06<14:02:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 2: 47%|████▋ | 5766/12384 [12:14:13<14:02:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 2: 47%|████▋ | 5767/12384 [12:14:13<14:01:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 2: 47%|████▋ | 5767/12384 [12:14:21<14:01:18, 7.63s/it, loss=0.0002, acc=0.9977, iter_time=9.28s]
Epoch 2: 47%|████▋ | 5768/12384 [12:14:21<14:00:35, 7.62s/it, loss=0.0002, acc=0.9977, iter_time=9.28s]
Epoch 2: 47%|████▋ | 5768/12384 [12:14:28<14:00:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 47%|████▋ | 5769/12384 [12:14:28<13:59:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 47%|████▋ | 5769/12384 [12:14:36<13:59:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 2: 47%|████▋ | 5770/12384 [12:14:36<13:59:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 2: 47%|████▋ | 5770/12384 [12:14:44<13:59:04, 7.61s/it, loss=0.0002, acc=0.9978, iter_time=8.78s]
Epoch 2: 47%|████▋ | 5771/12384 [12:14:44<13:58:33, 7.61s/it, loss=0.0002, acc=0.9978, iter_time=8.78s]
Epoch 2: 47%|████▋ | 5771/12384 [12:14:51<13:58:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 2: 47%|████▋ | 5772/12384 [12:14:51<13:58:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 2: 47%|████▋ | 5772/12384 [12:14:59<13:58:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 47%|████▋ | 5773/12384 [12:14:59<13:58:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 47%|████▋ | 5773/12384 [12:15:06<13:58:08, 7.61s/it, loss=0.0003, acc=0.9991, iter_time=7.60s]
Epoch 2: 47%|████▋ | 5774/12384 [12:15:06<13:58:18, 7.61s/it, loss=0.0003, acc=0.9991, iter_time=7.60s]
Epoch 2: 47%|████▋ | 5774/12384 [12:15:14<13:58:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 2: 47%|████▋ | 5775/12384 [12:15:14<13:57:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 2: 47%|████▋ | 5775/12384 [12:15:22<13:57:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.56s]
Epoch 2: 47%|████▋ | 5776/12384 [12:15:22<14:00:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.56s]
Epoch 2: 47%|████▋ | 5776/12384 [12:15:29<14:00:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 2: 47%|████▋ | 5777/12384 [12:15:29<13:59:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 2: 47%|████▋ | 5777/12384 [12:15:37<13:59:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 2: 47%|████▋ | 5778/12384 [12:15:37<13:59:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 2: 47%|████▋ | 5778/12384 [12:15:45<13:59:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 47%|████▋ | 5779/12384 [12:15:45<13:58:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 47%|████▋ | 5779/12384 [12:15:52<13:58:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 47%|████▋ | 5780/12384 [12:15:52<13:58:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 47%|████▋ | 5780/12384 [12:16:00<13:58:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 47%|████▋ | 5781/12384 [12:16:00<13:57:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 47%|████▋ | 5781/12384 [12:16:07<13:57:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 47%|████▋ | 5782/12384 [12:16:07<13:57:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 47%|████▋ | 5782/12384 [12:16:15<13:57:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 2: 47%|████▋ | 5783/12384 [12:16:15<13:57:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 2: 47%|████▋ | 5783/12384 [12:16:23<13:57:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 2: 47%|████▋ | 5784/12384 [12:16:23<13:57:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 2: 47%|████▋ | 5784/12384 [12:16:31<13:57:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 47%|████▋ | 5785/12384 [12:16:31<14:07:40, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 47%|████▋ | 5785/12384 [12:16:38<14:07:40, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 47%|████▋ | 5786/12384 [12:16:38<14:04:13, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 47%|████▋ | 5786/12384 [12:16:46<14:04:13, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 47%|████▋ | 5787/12384 [12:16:46<14:02:02, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 47%|████▋ | 5787/12384 [12:16:54<14:02:02, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 2: 47%|████▋ | 5788/12384 [12:16:54<14:10:26, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 2: 47%|████▋ | 5788/12384 [12:17:01<14:10:26, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 47%|████▋ | 5789/12384 [12:17:01<14:06:36, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 47%|████▋ | 5789/12384 [12:17:09<14:06:36, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 47%|████▋ | 5790/12384 [12:17:09<14:02:42, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 47%|████▋ | 5790/12384 [12:17:17<14:02:42, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 47%|████▋ | 5791/12384 [12:17:17<14:00:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 47%|████▋ | 5791/12384 [12:17:24<14:00:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.46s]
Epoch 2: 47%|████▋ | 5792/12384 [12:17:24<13:58:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.46s]
Epoch 2: 47%|████▋ | 5792/12384 [12:17:32<13:58:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.01s]
Epoch 2: 47%|████▋ | 5793/12384 [12:17:32<13:57:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.01s]
Epoch 2: 47%|████▋ | 5793/12384 [12:17:39<13:57:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 2: 47%|████▋ | 5794/12384 [12:17:39<13:57:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 2: 47%|████▋ | 5794/12384 [12:17:47<13:57:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 47%|████▋ | 5795/12384 [12:17:47<13:56:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 47%|████▋ | 5795/12384 [12:17:55<13:56:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 47%|████▋ | 5796/12384 [12:17:55<13:55:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 47%|████▋ | 5796/12384 [12:18:02<13:55:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 47%|████▋ | 5797/12384 [12:18:02<13:55:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 47%|████▋ | 5797/12384 [12:18:10<13:55:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 2: 47%|████▋ | 5798/12384 [12:18:10<13:54:24, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 2: 47%|████▋ | 5798/12384 [12:18:17<13:54:24, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.58s]
Epoch 2: 47%|████▋ | 5799/12384 [12:18:17<13:57:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.58s]
Epoch 2: 47%|████▋ | 5799/12384 [12:18:25<13:57:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 2: 47%|████▋ | 5800/12384 [12:18:25<13:56:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 2: 47%|████▋ | 5800/12384 [12:18:33<13:56:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.62s]
Epoch 2: 47%|████▋ | 5801/12384 [12:18:33<13:55:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.62s]
Epoch 2: 47%|████▋ | 5801/12384 [12:18:40<13:55:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 47%|████▋ | 5802/12384 [12:18:40<13:54:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 47%|████▋ | 5802/12384 [12:18:48<13:54:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 2: 47%|████▋ | 5803/12384 [12:18:48<13:52:41, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 2: 47%|████▋ | 5803/12384 [12:18:55<13:52:41, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=9.29s]
Epoch 2: 47%|████▋ | 5804/12384 [12:18:55<13:53:31, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.29s]
Epoch 2: 47%|████▋ | 5804/12384 [12:19:03<13:53:31, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 47%|████▋ | 5805/12384 [12:19:03<13:52:58, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 47%|████▋ | 5805/12384 [12:19:11<13:52:58, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 47%|████▋ | 5806/12384 [12:19:11<13:52:57, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 47%|████▋ | 5806/12384 [12:19:18<13:52:57, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 47%|████▋ | 5807/12384 [12:19:18<13:52:59, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 47%|████▋ | 5807/12384 [12:19:26<13:52:59, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 2: 47%|████▋ | 5808/12384 [12:19:26<13:53:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 2: 47%|████▋ | 5808/12384 [12:19:33<13:53:21, 7.60s/it, loss=0.0014, acc=0.9973, iter_time=5.76s]
Epoch 2: 47%|████▋ | 5809/12384 [12:19:33<13:53:22, 7.60s/it, loss=0.0014, acc=0.9973, iter_time=5.76s]
Epoch 2: 47%|████▋ | 5809/12384 [12:19:41<13:53:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 2: 47%|████▋ | 5810/12384 [12:19:41<13:56:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 2: 47%|████▋ | 5810/12384 [12:19:49<13:56:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 2: 47%|████▋ | 5811/12384 [12:19:49<14:06:23, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 2: 47%|████▋ | 5811/12384 [12:19:57<14:06:23, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 47%|████▋ | 5812/12384 [12:19:57<14:02:22, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 47%|████▋ | 5812/12384 [12:20:04<14:02:22, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 2: 47%|████▋ | 5813/12384 [12:20:04<13:58:59, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 2: 47%|████▋ | 5813/12384 [12:20:12<13:58:59, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 2: 47%|████▋ | 5814/12384 [12:20:12<13:56:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 2: 47%|████▋ | 5814/12384 [12:20:20<13:56:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 47%|████▋ | 5815/12384 [12:20:20<14:06:09, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 47%|████▋ | 5815/12384 [12:20:27<14:06:09, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 47%|████▋ | 5816/12384 [12:20:27<14:01:30, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 47%|████▋ | 5816/12384 [12:20:35<14:01:30, 7.69s/it, loss=0.0002, acc=1.0000, iter_time=4.18s]
Epoch 2: 47%|████▋ | 5817/12384 [12:20:35<13:58:50, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=4.18s]
Epoch 2: 47%|████▋ | 5817/12384 [12:20:43<13:58:50, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.67s]
Epoch 2: 47%|████▋ | 5818/12384 [12:20:43<14:00:17, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.67s]
Epoch 2: 47%|████▋ | 5818/12384 [12:20:50<14:00:17, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 47%|████▋ | 5819/12384 [12:20:50<13:57:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 47%|████▋ | 5819/12384 [12:20:58<13:57:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 47%|████▋ | 5820/12384 [12:20:58<13:56:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 47%|████▋ | 5820/12384 [12:21:06<13:56:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 2: 47%|████▋ | 5821/12384 [12:21:06<13:55:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 2: 47%|████▋ | 5821/12384 [12:21:13<13:55:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 2: 47%|████▋ | 5822/12384 [12:21:13<13:54:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 2: 47%|████▋ | 5822/12384 [12:21:21<13:54:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 47%|████▋ | 5823/12384 [12:21:21<13:53:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 47%|████▋ | 5823/12384 [12:21:28<13:53:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 47%|████▋ | 5824/12384 [12:21:28<13:56:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 47%|████▋ | 5824/12384 [12:21:36<13:56:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 47%|████▋ | 5825/12384 [12:21:36<13:55:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 47%|████▋ | 5825/12384 [12:21:44<13:55:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 47%|████▋ | 5826/12384 [12:21:44<13:53:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 47%|████▋ | 5826/12384 [12:21:51<13:53:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 2: 47%|████▋ | 5827/12384 [12:21:51<13:52:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 2: 47%|████▋ | 5827/12384 [12:21:59<13:52:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.49s]
Epoch 2: 47%|████▋ | 5828/12384 [12:21:59<13:52:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.49s]
Epoch 2: 47%|████▋ | 5828/12384 [12:22:06<13:52:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.94s]
Epoch 2: 47%|████▋ | 5829/12384 [12:22:06<13:51:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.94s]
Epoch 2: 47%|████▋ | 5829/12384 [12:22:14<13:51:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.22s]
Epoch 2: 47%|████▋ | 5830/12384 [12:22:14<13:51:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.22s]
Epoch 2: 47%|████▋ | 5830/12384 [12:22:22<13:51:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.96s]
Epoch 2: 47%|████▋ | 5831/12384 [12:22:22<13:50:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.96s]
Epoch 2: 47%|████▋ | 5831/12384 [12:22:29<13:50:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 47%|████▋ | 5832/12384 [12:22:29<13:50:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 47%|████▋ | 5832/12384 [12:22:37<13:50:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 47%|████▋ | 5833/12384 [12:22:37<13:50:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 47%|████▋ | 5833/12384 [12:22:45<13:50:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 47%|████▋ | 5834/12384 [12:22:45<13:52:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 47%|████▋ | 5834/12384 [12:22:52<13:52:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.44s]
Epoch 2: 47%|████▋ | 5835/12384 [12:22:52<13:51:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.44s]
Epoch 2: 47%|████▋ | 5835/12384 [12:23:00<13:51:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.63s]
Epoch 2: 47%|████▋ | 5836/12384 [12:23:00<13:50:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.63s]
Epoch 2: 47%|████▋ | 5836/12384 [12:23:08<13:50:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 2: 47%|████▋ | 5837/12384 [12:23:08<14:01:01, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 2: 47%|████▋ | 5837/12384 [12:23:15<14:01:01, 7.71s/it, loss=0.0000, acc=0.9997, iter_time=8.22s]
Epoch 2: 47%|████▋ | 5838/12384 [12:23:15<13:57:58, 7.68s/it, loss=0.0000, acc=0.9997, iter_time=8.22s]
Epoch 2: 47%|████▋ | 5838/12384 [12:23:23<13:57:58, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 2: 47%|████▋ | 5839/12384 [12:23:23<13:55:40, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 2: 47%|████▋ | 5839/12384 [12:23:31<13:55:40, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.14s]
Epoch 2: 47%|████▋ | 5840/12384 [12:23:31<13:54:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.14s]
Epoch 2: 47%|████▋ | 5840/12384 [12:23:38<13:54:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.40s]
Epoch 2: 47%|████▋ | 5841/12384 [12:23:38<13:53:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.40s]
Epoch 2: 47%|████▋ | 5841/12384 [12:23:46<13:53:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 2: 47%|████▋ | 5842/12384 [12:23:46<13:51:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 2: 47%|████▋ | 5842/12384 [12:23:53<13:51:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 2: 47%|████▋ | 5843/12384 [12:23:53<13:49:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 2: 47%|████▋ | 5843/12384 [12:24:01<13:49:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.12s]
Epoch 2: 47%|████▋ | 5844/12384 [12:24:01<13:49:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.12s]
Epoch 2: 47%|████▋ | 5844/12384 [12:24:09<13:49:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 47%|████▋ | 5845/12384 [12:24:09<13:48:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 47%|████▋ | 5845/12384 [12:24:16<13:48:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 47%|████▋ | 5846/12384 [12:24:16<13:49:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 47%|████▋ | 5846/12384 [12:24:24<13:49:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 47%|████▋ | 5847/12384 [12:24:24<13:49:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 47%|████▋ | 5847/12384 [12:24:31<13:49:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 47%|████▋ | 5848/12384 [12:24:31<13:48:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 47%|████▋ | 5848/12384 [12:24:39<13:48:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.28s]
Epoch 2: 47%|████▋ | 5849/12384 [12:24:39<13:48:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.28s]
Epoch 2: 47%|████▋ | 5849/12384 [12:24:47<13:48:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 2: 47%|████▋ | 5850/12384 [12:24:47<13:48:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 2: 47%|████▋ | 5850/12384 [12:24:54<13:48:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 47%|████▋ | 5851/12384 [12:24:54<13:48:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 47%|████▋ | 5851/12384 [12:25:02<13:48:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 47%|████▋ | 5852/12384 [12:25:02<13:48:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 47%|████▋ | 5852/12384 [12:25:09<13:48:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 2: 47%|████▋ | 5853/12384 [12:25:09<13:48:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 2: 47%|████▋ | 5853/12384 [12:25:17<13:48:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 2: 47%|████▋ | 5854/12384 [12:25:17<13:47:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 2: 47%|████▋ | 5854/12384 [12:25:25<13:47:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 2: 47%|████▋ | 5855/12384 [12:25:25<13:47:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 2: 47%|████▋ | 5855/12384 [12:25:32<13:47:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 47%|████▋ | 5856/12384 [12:25:32<13:48:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 47%|████▋ | 5856/12384 [12:25:40<13:48:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 2: 47%|████▋ | 5857/12384 [12:25:40<13:49:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 2: 47%|████▋ | 5857/12384 [12:25:48<13:49:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.17s]
Epoch 2: 47%|████▋ | 5858/12384 [12:25:48<13:54:54, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.17s]
Epoch 2: 47%|████▋ | 5858/12384 [12:25:55<13:54:54, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.68s]
Epoch 2: 47%|████▋ | 5859/12384 [12:25:55<13:56:26, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.68s]
Epoch 2: 47%|████▋ | 5859/12384 [12:26:03<13:56:26, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 2: 47%|████▋ | 5860/12384 [12:26:03<13:54:51, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 2: 47%|████▋ | 5860/12384 [12:26:11<13:54:51, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.67s]
Epoch 2: 47%|████▋ | 5861/12384 [12:26:11<13:54:38, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.67s]
Epoch 2: 47%|████▋ | 5861/12384 [12:26:18<13:54:38, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.03s]
Epoch 2: 47%|████▋ | 5862/12384 [12:26:18<13:54:12, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.03s]
Epoch 2: 47%|████▋ | 5862/12384 [12:26:26<13:54:12, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 2: 47%|████▋ | 5863/12384 [12:26:26<13:52:20, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 2: 47%|████▋ | 5863/12384 [12:26:34<13:52:20, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.67s]
Epoch 2: 47%|████▋ | 5864/12384 [12:26:34<14:00:01, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.67s]
Epoch 2: 47%|████▋ | 5864/12384 [12:26:42<14:00:01, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.45s]
Epoch 2: 47%|████▋ | 5865/12384 [12:26:42<13:55:47, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.45s]
Epoch 2: 47%|████▋ | 5865/12384 [12:26:49<13:55:47, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 47%|████▋ | 5866/12384 [12:26:49<13:54:54, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 47%|████▋ | 5866/12384 [12:26:57<13:54:54, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 47%|████▋ | 5867/12384 [12:26:57<13:51:47, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 47%|████▋ | 5867/12384 [12:27:05<13:51:47, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 47%|████▋ | 5868/12384 [12:27:05<13:59:08, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 47%|████▋ | 5868/12384 [12:27:12<13:59:08, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 47%|████▋ | 5869/12384 [12:27:12<13:55:12, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 47%|████▋ | 5869/12384 [12:27:20<13:55:12, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 47%|████▋ | 5870/12384 [12:27:20<13:51:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 47%|████▋ | 5870/12384 [12:27:28<13:51:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 47%|████▋ | 5871/12384 [12:27:28<13:49:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 47%|████▋ | 5871/12384 [12:27:35<13:49:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 47%|████▋ | 5872/12384 [12:27:35<13:48:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 47%|████▋ | 5872/12384 [12:27:43<13:48:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 47%|████▋ | 5873/12384 [12:27:43<13:47:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 47%|████▋ | 5873/12384 [12:27:50<13:47:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.25s]
Epoch 2: 47%|████▋ | 5874/12384 [12:27:50<13:47:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.25s]
Epoch 2: 47%|████▋ | 5874/12384 [12:27:58<13:47:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.98s]
Epoch 2: 47%|████▋ | 5875/12384 [12:27:58<13:46:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.98s]
Epoch 2: 47%|████▋ | 5875/12384 [12:28:06<13:46:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.33s]
Epoch 2: 47%|████▋ | 5876/12384 [12:28:06<13:45:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.33s]
Epoch 2: 47%|████▋ | 5876/12384 [12:28:13<13:45:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.88s]
Epoch 2: 47%|████▋ | 5877/12384 [12:28:13<13:44:45, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.88s]
Epoch 2: 47%|████▋ | 5877/12384 [12:28:21<13:44:45, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 47%|████▋ | 5878/12384 [12:28:21<13:47:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 47%|████▋ | 5878/12384 [12:28:28<13:47:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 47%|████▋ | 5879/12384 [12:28:28<13:46:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 47%|████▋ | 5879/12384 [12:28:36<13:46:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 2: 47%|████▋ | 5880/12384 [12:28:36<13:46:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 2: 47%|████▋ | 5880/12384 [12:28:44<13:46:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 47%|████▋ | 5881/12384 [12:28:44<13:45:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 47%|████▋ | 5881/12384 [12:28:51<13:45:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 47%|████▋ | 5882/12384 [12:28:51<13:45:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 47%|████▋ | 5882/12384 [12:28:59<13:45:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 48%|████▊ | 5883/12384 [12:28:59<13:45:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 48%|████▊ | 5883/12384 [12:29:07<13:45:28, 7.62s/it, loss=0.0001, acc=0.9995, iter_time=7.61s]
Epoch 2: 48%|████▊ | 5884/12384 [12:29:07<13:45:43, 7.62s/it, loss=0.0001, acc=0.9995, iter_time=7.61s]
Epoch 2: 48%|████▊ | 5884/12384 [12:29:14<13:45:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 48%|████▊ | 5885/12384 [12:29:14<13:45:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 48%|████▊ | 5885/12384 [12:29:22<13:45:03, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.58s]
Epoch 2: 48%|████▊ | 5886/12384 [12:29:22<13:44:50, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.58s]
Epoch 2: 48%|████▊ | 5886/12384 [12:29:29<13:44:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 48%|████▊ | 5887/12384 [12:29:29<13:44:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 48%|████▊ | 5887/12384 [12:29:37<13:44:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 48%|████▊ | 5888/12384 [12:29:37<13:44:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 48%|████▊ | 5888/12384 [12:29:45<13:44:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 48%|████▊ | 5889/12384 [12:29:45<13:47:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 48%|████▊ | 5889/12384 [12:29:53<13:47:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.77s]
Epoch 2: 48%|████▊ | 5890/12384 [12:29:53<13:57:07, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.77s]
Epoch 2: 48%|████▊ | 5890/12384 [12:30:00<13:57:07, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=5.37s]
Epoch 2: 48%|████▊ | 5891/12384 [12:30:00<13:52:01, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.37s]
Epoch 2: 48%|████▊ | 5891/12384 [12:30:08<13:52:01, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.10s]
Epoch 2: 48%|████▊ | 5892/12384 [12:30:08<13:49:30, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.10s]
Epoch 2: 48%|████▊ | 5892/12384 [12:30:15<13:49:30, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.27s]
Epoch 2: 48%|████▊ | 5893/12384 [12:30:15<13:47:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.27s]
Epoch 2: 48%|████▊ | 5893/12384 [12:30:23<13:47:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.25s]
Epoch 2: 48%|████▊ | 5894/12384 [12:30:23<13:54:57, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=11.25s]
Epoch 2: 48%|████▊ | 5894/12384 [12:30:31<13:54:57, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 2: 48%|████▊ | 5895/12384 [12:30:31<13:50:59, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 2: 48%|████▊ | 5895/12384 [12:30:39<13:50:59, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=11.49s]
Epoch 2: 48%|████▊ | 5896/12384 [12:30:39<13:48:48, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=11.49s]
Epoch 2: 48%|████▊ | 5896/12384 [12:30:46<13:48:48, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.18s]
Epoch 2: 48%|████▊ | 5897/12384 [12:30:46<13:47:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.18s]
Epoch 2: 48%|████▊ | 5897/12384 [12:30:54<13:47:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 2: 48%|████▊ | 5898/12384 [12:30:54<13:45:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 2: 48%|████▊ | 5898/12384 [12:31:01<13:45:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 2: 48%|████▊ | 5899/12384 [12:31:01<13:45:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 2: 48%|████▊ | 5899/12384 [12:31:09<13:45:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 48%|████▊ | 5900/12384 [12:31:09<13:44:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 48%|████▊ | 5900/12384 [12:31:17<13:44:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 2: 48%|████▊ | 5901/12384 [12:31:17<13:43:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 2: 48%|████▊ | 5901/12384 [12:31:24<13:43:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 2: 48%|████▊ | 5902/12384 [12:31:24<13:42:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 2: 48%|████▊ | 5902/12384 [12:31:32<13:42:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 2: 48%|████▊ | 5903/12384 [12:31:32<13:42:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 2: 48%|████▊ | 5903/12384 [12:31:39<13:42:43, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.56s]
Epoch 2: 48%|████▊ | 5904/12384 [12:31:39<13:42:31, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.56s]
Epoch 2: 48%|████▊ | 5904/12384 [12:31:47<13:42:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 2: 48%|████▊ | 5905/12384 [12:31:47<13:42:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 2: 48%|████▊ | 5905/12384 [12:31:55<13:42:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 2: 48%|████▊ | 5906/12384 [12:31:55<13:41:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 2: 48%|████▊ | 5906/12384 [12:32:02<13:41:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 2: 48%|████▊ | 5907/12384 [12:32:02<13:41:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 2: 48%|████▊ | 5907/12384 [12:32:10<13:41:56, 7.61s/it, loss=0.0001, acc=0.9996, iter_time=10.40s]
Epoch 2: 48%|████▊ | 5908/12384 [12:32:10<13:41:12, 7.61s/it, loss=0.0001, acc=0.9996, iter_time=10.40s]
Epoch 2: 48%|████▊ | 5908/12384 [12:32:18<13:41:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 48%|████▊ | 5909/12384 [12:32:18<13:42:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 48%|████▊ | 5909/12384 [12:32:25<13:42:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 48%|████▊ | 5910/12384 [12:32:25<13:40:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 48%|████▊ | 5910/12384 [12:32:33<13:40:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 48%|████▊ | 5911/12384 [12:32:33<13:40:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 48%|████▊ | 5911/12384 [12:32:40<13:40:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 48%|████▊ | 5912/12384 [12:32:40<13:40:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 48%|████▊ | 5912/12384 [12:32:48<13:40:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 48%|████▊ | 5913/12384 [12:32:48<13:40:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 48%|████▊ | 5913/12384 [12:32:56<13:40:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 48%|████▊ | 5914/12384 [12:32:56<13:40:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 48%|████▊ | 5914/12384 [12:33:03<13:40:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 2: 48%|████▊ | 5915/12384 [12:33:03<13:40:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 2: 48%|████▊ | 5915/12384 [12:33:11<13:40:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.12s]
Epoch 2: 48%|████▊ | 5916/12384 [12:33:11<13:52:56, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=5.12s]
Epoch 2: 48%|████▊ | 5916/12384 [12:33:19<13:52:56, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=11.75s]
Epoch 2: 48%|████▊ | 5917/12384 [12:33:19<14:01:53, 7.81s/it, loss=0.0000, acc=1.0000, iter_time=11.75s]
Epoch 2: 48%|████▊ | 5917/12384 [12:33:27<14:01:53, 7.81s/it, loss=0.0000, acc=1.0000, iter_time=5.38s]
Epoch 2: 48%|████▊ | 5918/12384 [12:33:27<13:54:39, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=5.38s]
Epoch 2: 48%|████▊ | 5918/12384 [12:33:34<13:54:39, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 2: 48%|████▊ | 5919/12384 [12:33:34<13:49:34, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 2: 48%|████▊ | 5919/12384 [12:33:42<13:49:34, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.24s]
Epoch 2: 48%|████▊ | 5920/12384 [12:33:42<13:46:31, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.24s]
Epoch 2: 48%|████▊ | 5920/12384 [12:33:50<13:46:31, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 48%|████▊ | 5921/12384 [12:33:50<13:44:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 48%|████▊ | 5921/12384 [12:33:57<13:44:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 2: 48%|████▊ | 5922/12384 [12:33:57<13:42:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 2: 48%|████▊ | 5922/12384 [12:34:05<13:42:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 2: 48%|████▊ | 5923/12384 [12:34:05<13:42:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 2: 48%|████▊ | 5923/12384 [12:34:12<13:42:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 48%|████▊ | 5924/12384 [12:34:12<13:41:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 48%|████▊ | 5924/12384 [12:34:20<13:41:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 48%|████▊ | 5925/12384 [12:34:20<13:42:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 48%|████▊ | 5925/12384 [12:34:28<13:42:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.13s]
Epoch 2: 48%|████▊ | 5926/12384 [12:34:28<13:41:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.13s]
Epoch 2: 48%|████▊ | 5926/12384 [12:34:35<13:41:40, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=10.13s]
Epoch 2: 48%|████▊ | 5927/12384 [12:34:35<13:40:02, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=10.13s]
Epoch 2: 48%|████▊ | 5927/12384 [12:34:43<13:40:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 48%|████▊ | 5928/12384 [12:34:43<13:40:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 48%|████▊ | 5928/12384 [12:34:51<13:40:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.63s]
Epoch 2: 48%|████▊ | 5929/12384 [12:34:51<13:42:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.63s]
Epoch 2: 48%|████▊ | 5929/12384 [12:34:58<13:42:24, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=10.28s]
Epoch 2: 48%|████▊ | 5930/12384 [12:34:58<13:41:54, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=10.28s]
Epoch 2: 48%|████▊ | 5930/12384 [12:35:06<13:41:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 48%|████▊ | 5931/12384 [12:35:06<13:41:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 48%|████▊ | 5931/12384 [12:35:13<13:41:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 48%|████▊ | 5932/12384 [12:35:13<13:39:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 48%|████▊ | 5932/12384 [12:35:21<13:39:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.23s]
Epoch 2: 48%|████▊ | 5933/12384 [12:35:21<13:39:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.23s]
Epoch 2: 48%|████▊ | 5933/12384 [12:35:29<13:39:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.26s]
Epoch 2: 48%|████▊ | 5934/12384 [12:35:29<13:39:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.26s]
Epoch 2: 48%|████▊ | 5934/12384 [12:35:36<13:39:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 2: 48%|████▊ | 5935/12384 [12:35:36<13:38:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 2: 48%|████▊ | 5935/12384 [12:35:44<13:38:53, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 2: 48%|████▊ | 5936/12384 [12:35:44<13:38:30, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 2: 48%|████▊ | 5936/12384 [12:35:52<13:38:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.45s]
Epoch 2: 48%|████▊ | 5937/12384 [12:35:52<13:37:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.45s]
Epoch 2: 48%|████▊ | 5937/12384 [12:35:59<13:37:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.78s]
Epoch 2: 48%|████▊ | 5938/12384 [12:35:59<13:37:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.78s]
Epoch 2: 48%|████▊ | 5938/12384 [12:36:07<13:37:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.91s]
Epoch 2: 48%|████▊ | 5939/12384 [12:36:07<13:38:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.91s]
Epoch 2: 48%|████▊ | 5939/12384 [12:36:14<13:38:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 48%|████▊ | 5940/12384 [12:36:14<13:36:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 48%|████▊ | 5940/12384 [12:36:22<13:36:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 48%|████▊ | 5941/12384 [12:36:22<13:36:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 48%|████▊ | 5941/12384 [12:36:30<13:36:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 48%|████▊ | 5942/12384 [12:36:30<13:36:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 48%|████▊ | 5942/12384 [12:36:38<13:36:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.56s]
Epoch 2: 48%|████▊ | 5943/12384 [12:36:38<13:52:04, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=6.56s]
Epoch 2: 48%|████▊ | 5943/12384 [12:36:45<13:52:04, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 2: 48%|████▊ | 5944/12384 [12:36:45<13:47:03, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 2: 48%|████▊ | 5944/12384 [12:36:53<13:47:03, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 48%|████▊ | 5945/12384 [12:36:53<13:44:01, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 48%|████▊ | 5945/12384 [12:37:01<13:44:01, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 48%|████▊ | 5946/12384 [12:37:01<13:50:18, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 48%|████▊ | 5946/12384 [12:37:08<13:50:18, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 2: 48%|████▊ | 5947/12384 [12:37:08<13:46:02, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 2: 48%|████▊ | 5947/12384 [12:37:16<13:46:02, 7.70s/it, loss=0.0007, acc=0.9978, iter_time=7.93s]
Epoch 2: 48%|████▊ | 5948/12384 [12:37:16<13:43:02, 7.67s/it, loss=0.0007, acc=0.9978, iter_time=7.93s]
Epoch 2: 48%|████▊ | 5948/12384 [12:37:24<13:43:02, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 2: 48%|████▊ | 5949/12384 [12:37:24<13:40:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 2: 48%|████▊ | 5949/12384 [12:37:31<13:40:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 48%|████▊ | 5950/12384 [12:37:31<13:39:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 48%|████▊ | 5950/12384 [12:37:39<13:39:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 48%|████▊ | 5951/12384 [12:37:39<13:37:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 48%|████▊ | 5951/12384 [12:37:46<13:37:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 48%|████▊ | 5952/12384 [12:37:46<13:37:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 48%|████▊ | 5952/12384 [12:37:54<13:37:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 48%|████▊ | 5953/12384 [12:37:54<13:36:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 48%|████▊ | 5953/12384 [12:38:02<13:36:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 48%|████▊ | 5954/12384 [12:38:02<13:36:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 48%|████▊ | 5954/12384 [12:38:09<13:36:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 48%|████▊ | 5955/12384 [12:38:09<13:35:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 48%|████▊ | 5955/12384 [12:38:17<13:35:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 2: 48%|████▊ | 5956/12384 [12:38:17<13:34:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 2: 48%|████▊ | 5956/12384 [12:38:24<13:34:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.80s]
Epoch 2: 48%|████▊ | 5957/12384 [12:38:24<13:34:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.80s]
Epoch 2: 48%|████▊ | 5957/12384 [12:38:32<13:34:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 48%|████▊ | 5958/12384 [12:38:32<13:34:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 48%|████▊ | 5958/12384 [12:38:40<13:34:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 48%|████▊ | 5959/12384 [12:38:40<13:33:50, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 48%|████▊ | 5959/12384 [12:38:47<13:33:50, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 48%|████▊ | 5960/12384 [12:38:47<13:34:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 48%|████▊ | 5960/12384 [12:38:55<13:34:13, 7.60s/it, loss=0.0001, acc=0.9992, iter_time=7.23s]
Epoch 2: 48%|████▊ | 5961/12384 [12:38:55<13:34:12, 7.61s/it, loss=0.0001, acc=0.9992, iter_time=7.23s]
Epoch 2: 48%|████▊ | 5961/12384 [12:39:02<13:34:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 48%|████▊ | 5962/12384 [12:39:02<13:33:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 48%|████▊ | 5962/12384 [12:39:10<13:33:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 48%|████▊ | 5963/12384 [12:39:10<13:33:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 48%|████▊ | 5963/12384 [12:39:18<13:33:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 48%|████▊ | 5964/12384 [12:39:18<13:33:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 48%|████▊ | 5964/12384 [12:39:25<13:33:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 48%|████▊ | 5965/12384 [12:39:25<13:33:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 48%|████▊ | 5965/12384 [12:39:33<13:33:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 48%|████▊ | 5966/12384 [12:39:33<13:33:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 48%|████▊ | 5966/12384 [12:39:40<13:33:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 48%|████▊ | 5967/12384 [12:39:40<13:33:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 48%|████▊ | 5967/12384 [12:39:48<13:33:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 48%|████▊ | 5968/12384 [12:39:48<13:34:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 48%|████▊ | 5968/12384 [12:39:56<13:34:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 2: 48%|████▊ | 5969/12384 [12:39:56<13:44:19, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 2: 48%|████▊ | 5969/12384 [12:40:04<13:44:19, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 2: 48%|████▊ | 5970/12384 [12:40:04<13:41:18, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 2: 48%|████▊ | 5970/12384 [12:40:11<13:41:18, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 48%|████▊ | 5971/12384 [12:40:11<13:39:18, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 48%|████▊ | 5971/12384 [12:40:19<13:39:18, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 48%|████▊ | 5972/12384 [12:40:19<13:50:29, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 48%|████▊ | 5972/12384 [12:40:27<13:50:29, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 2: 48%|████▊ | 5973/12384 [12:40:27<13:45:33, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 2: 48%|████▊ | 5973/12384 [12:40:35<13:45:33, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 2: 48%|████▊ | 5974/12384 [12:40:35<13:41:25, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 2: 48%|████▊ | 5974/12384 [12:40:42<13:41:25, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 48%|████▊ | 5975/12384 [12:40:42<13:38:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 48%|████▊ | 5975/12384 [12:40:50<13:38:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 48%|████▊ | 5976/12384 [12:40:50<13:37:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 48%|████▊ | 5976/12384 [12:40:57<13:37:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 48%|████▊ | 5977/12384 [12:40:57<13:35:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 48%|████▊ | 5977/12384 [12:41:05<13:35:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 48%|████▊ | 5978/12384 [12:41:05<13:34:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 48%|████▊ | 5978/12384 [12:41:13<13:34:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 48%|████▊ | 5979/12384 [12:41:13<13:33:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 48%|████▊ | 5979/12384 [12:41:20<13:33:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 48%|████▊ | 5980/12384 [12:41:20<13:35:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 48%|████▊ | 5980/12384 [12:41:28<13:35:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 2: 48%|████▊ | 5981/12384 [12:41:28<13:37:32, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 2: 48%|████▊ | 5981/12384 [12:41:36<13:37:32, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.40s]
Epoch 2: 48%|████▊ | 5982/12384 [12:41:36<13:35:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.40s]
Epoch 2: 48%|████▊ | 5982/12384 [12:41:43<13:35:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.99s]
Epoch 2: 48%|████▊ | 5983/12384 [12:41:43<13:35:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.99s]
Epoch 2: 48%|████▊ | 5983/12384 [12:41:51<13:35:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.22s]
Epoch 2: 48%|████▊ | 5984/12384 [12:41:51<13:34:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.22s]
Epoch 2: 48%|████▊ | 5984/12384 [12:41:58<13:34:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 48%|████▊ | 5985/12384 [12:41:58<13:33:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 48%|████▊ | 5985/12384 [12:42:06<13:33:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 48%|████▊ | 5986/12384 [12:42:06<13:32:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 48%|████▊ | 5986/12384 [12:42:14<13:32:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.45s]
Epoch 2: 48%|████▊ | 5987/12384 [12:42:14<13:32:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.45s]
Epoch 2: 48%|████▊ | 5987/12384 [12:42:21<13:32:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.75s]
Epoch 2: 48%|████▊ | 5988/12384 [12:42:21<13:31:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.75s]
Epoch 2: 48%|████▊ | 5988/12384 [12:42:29<13:31:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 48%|████▊ | 5989/12384 [12:42:29<13:30:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 48%|████▊ | 5989/12384 [12:42:37<13:30:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 48%|████▊ | 5990/12384 [12:42:37<13:32:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 48%|████▊ | 5990/12384 [12:42:44<13:32:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 48%|████▊ | 5991/12384 [12:42:44<13:32:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 48%|████▊ | 5991/12384 [12:42:52<13:32:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 48%|████▊ | 5992/12384 [12:42:52<13:31:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 48%|████▊ | 5992/12384 [12:42:59<13:31:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 2: 48%|████▊ | 5993/12384 [12:42:59<13:31:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 2: 48%|████▊ | 5993/12384 [12:43:07<13:31:25, 7.62s/it, loss=0.0001, acc=0.9999, iter_time=10.44s]
Epoch 2: 48%|████▊ | 5994/12384 [12:43:07<13:32:13, 7.63s/it, loss=0.0001, acc=0.9999, iter_time=10.44s]
Epoch 2: 48%|████▊ | 5994/12384 [12:43:15<13:32:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 48%|████▊ | 5995/12384 [12:43:15<13:42:06, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 48%|████▊ | 5995/12384 [12:43:23<13:42:06, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 48%|████▊ | 5996/12384 [12:43:23<13:37:45, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 48%|████▊ | 5996/12384 [12:43:30<13:37:45, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 48%|████▊ | 5997/12384 [12:43:30<13:34:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 48%|████▊ | 5997/12384 [12:43:38<13:34:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 48%|████▊ | 5998/12384 [12:43:38<13:36:22, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 48%|████▊ | 5998/12384 [12:43:46<13:36:22, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 48%|████▊ | 5999/12384 [12:43:46<13:44:38, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 48%|████▊ | 5999/12384 [12:43:53<13:44:38, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 2: 48%|████▊ | 6000/12384 [12:43:53<13:39:11, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 2: 48%|████▊ | 6000/12384 [12:44:01<13:39:11, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 2: 48%|████▊ | 6001/12384 [12:44:01<13:35:12, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 2: 48%|████▊ | 6001/12384 [12:44:09<13:35:12, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 2: 48%|████▊ | 6002/12384 [12:44:09<13:33:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 2: 48%|████▊ | 6002/12384 [12:44:16<13:33:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 2: 48%|████▊ | 6003/12384 [12:44:16<13:33:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 2: 48%|████▊ | 6003/12384 [12:44:24<13:33:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.81s]
Epoch 2: 48%|████▊ | 6004/12384 [12:44:24<13:33:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.81s]
Epoch 2: 48%|████▊ | 6004/12384 [12:44:32<13:33:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 48%|████▊ | 6005/12384 [12:44:32<13:33:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 48%|████▊ | 6005/12384 [12:44:39<13:33:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 48%|████▊ | 6006/12384 [12:44:39<13:33:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 48%|████▊ | 6006/12384 [12:44:47<13:33:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 2: 49%|████▊ | 6007/12384 [12:44:47<13:32:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 2: 49%|████▊ | 6007/12384 [12:44:54<13:32:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.86s]
Epoch 2: 49%|████▊ | 6008/12384 [12:44:54<13:32:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.86s]
Epoch 2: 49%|████▊ | 6008/12384 [12:45:02<13:32:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 49%|████▊ | 6009/12384 [12:45:02<13:30:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 49%|████▊ | 6009/12384 [12:45:10<13:30:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 49%|████▊ | 6010/12384 [12:45:10<13:29:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 49%|████▊ | 6010/12384 [12:45:17<13:29:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 49%|████▊ | 6011/12384 [12:45:17<13:29:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 49%|████▊ | 6011/12384 [12:45:25<13:29:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 49%|████▊ | 6012/12384 [12:45:25<13:28:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 49%|████▊ | 6012/12384 [12:45:32<13:28:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 49%|████▊ | 6013/12384 [12:45:32<13:28:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 49%|████▊ | 6013/12384 [12:45:40<13:28:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.40s]
Epoch 2: 49%|████▊ | 6014/12384 [12:45:40<13:29:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.40s]
Epoch 2: 49%|████▊ | 6014/12384 [12:45:48<13:29:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.98s]
Epoch 2: 49%|████▊ | 6015/12384 [12:45:48<13:28:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.98s]
Epoch 2: 49%|████▊ | 6015/12384 [12:45:55<13:28:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.80s]
Epoch 2: 49%|████▊ | 6016/12384 [12:45:55<13:27:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.80s]
Epoch 2: 49%|████▊ | 6016/12384 [12:46:03<13:27:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 49%|████▊ | 6017/12384 [12:46:03<13:31:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 49%|████▊ | 6017/12384 [12:46:11<13:31:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.41s]
Epoch 2: 49%|████▊ | 6018/12384 [12:46:11<13:30:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.41s]
Epoch 2: 49%|████▊ | 6018/12384 [12:46:18<13:30:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 2: 49%|████▊ | 6019/12384 [12:46:18<13:29:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 2: 49%|████▊ | 6019/12384 [12:46:26<13:29:04, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.32s]
Epoch 2: 49%|████▊ | 6020/12384 [12:46:26<13:27:43, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.32s]
Epoch 2: 49%|████▊ | 6020/12384 [12:46:34<13:27:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.94s]
Epoch 2: 49%|████▊ | 6021/12384 [12:46:34<13:39:06, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.94s]
Epoch 2: 49%|████▊ | 6021/12384 [12:46:41<13:39:06, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 49%|████▊ | 6022/12384 [12:46:41<13:35:02, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 49%|████▊ | 6022/12384 [12:46:49<13:35:02, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 49%|████▊ | 6023/12384 [12:46:49<13:31:49, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 49%|████▊ | 6023/12384 [12:46:57<13:31:49, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 49%|████▊ | 6024/12384 [12:46:57<13:29:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 49%|████▊ | 6024/12384 [12:47:04<13:29:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.74s]
Epoch 2: 49%|████▊ | 6025/12384 [12:47:04<13:28:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.74s]
Epoch 2: 49%|████▊ | 6025/12384 [12:47:12<13:28:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.37s]
Epoch 2: 49%|████▊ | 6026/12384 [12:47:12<13:27:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.37s]
Epoch 2: 49%|████▊ | 6026/12384 [12:47:19<13:27:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 2: 49%|████▊ | 6027/12384 [12:47:19<13:27:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 2: 49%|████▊ | 6027/12384 [12:47:27<13:27:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 2: 49%|████▊ | 6028/12384 [12:47:27<13:27:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 2: 49%|████▊ | 6028/12384 [12:47:35<13:27:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 2: 49%|████▊ | 6029/12384 [12:47:35<13:26:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 2: 49%|████▊ | 6029/12384 [12:47:42<13:26:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 2: 49%|████▊ | 6030/12384 [12:47:42<13:27:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 2: 49%|████▊ | 6030/12384 [12:47:50<13:27:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.34s]
Epoch 2: 49%|████▊ | 6031/12384 [12:47:50<13:26:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.34s]
Epoch 2: 49%|████▊ | 6031/12384 [12:47:58<13:26:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 49%|████▊ | 6032/12384 [12:47:58<13:26:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 49%|████▊ | 6032/12384 [12:48:05<13:26:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 49%|████▊ | 6033/12384 [12:48:05<13:25:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 49%|████▊ | 6033/12384 [12:48:13<13:25:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 49%|████▊ | 6034/12384 [12:48:13<13:25:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 49%|████▊ | 6034/12384 [12:48:20<13:25:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 49%|████▊ | 6035/12384 [12:48:20<13:27:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 49%|████▊ | 6035/12384 [12:48:28<13:27:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 49%|████▊ | 6036/12384 [12:48:28<13:26:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 49%|████▊ | 6036/12384 [12:48:36<13:26:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 49%|████▊ | 6037/12384 [12:48:36<13:27:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 49%|████▊ | 6037/12384 [12:48:43<13:27:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 2: 49%|████▉ | 6038/12384 [12:48:43<13:28:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 2: 49%|████▉ | 6038/12384 [12:48:51<13:28:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 2: 49%|████▉ | 6039/12384 [12:48:51<13:27:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 2: 49%|████▉ | 6039/12384 [12:48:59<13:27:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 49%|████▉ | 6040/12384 [12:48:59<13:26:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 49%|████▉ | 6040/12384 [12:49:06<13:26:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 2: 49%|████▉ | 6041/12384 [12:49:06<13:25:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.10s]
Epoch 2: 49%|████▉ | 6041/12384 [12:49:14<13:25:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 2: 49%|████▉ | 6042/12384 [12:49:14<13:24:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 2: 49%|████▉ | 6042/12384 [12:49:21<13:24:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 49%|████▉ | 6043/12384 [12:49:21<13:24:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 49%|████▉ | 6043/12384 [12:49:29<13:24:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 49%|████▉ | 6044/12384 [12:49:29<13:24:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 49%|████▉ | 6044/12384 [12:49:37<13:24:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 49%|████▉ | 6045/12384 [12:49:37<13:24:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 49%|████▉ | 6045/12384 [12:49:44<13:24:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 2: 49%|████▉ | 6046/12384 [12:49:44<13:23:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 2: 49%|████▉ | 6046/12384 [12:49:52<13:23:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 2: 49%|████▉ | 6047/12384 [12:49:52<13:23:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 2: 49%|████▉ | 6047/12384 [12:50:00<13:23:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 2: 49%|████▉ | 6048/12384 [12:50:00<13:37:00, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 2: 49%|████▉ | 6048/12384 [12:50:07<13:37:00, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 49%|████▉ | 6049/12384 [12:50:07<13:32:29, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 49%|████▉ | 6049/12384 [12:50:15<13:32:29, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 2: 49%|████▉ | 6050/12384 [12:50:15<13:28:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 2: 49%|████▉ | 6050/12384 [12:50:23<13:28:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.70s]
Epoch 2: 49%|████▉ | 6051/12384 [12:50:23<13:27:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.70s]
Epoch 2: 49%|████▉ | 6051/12384 [12:50:31<13:27:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 2: 49%|████▉ | 6052/12384 [12:50:31<13:35:35, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 2: 49%|████▉ | 6052/12384 [12:50:38<13:35:35, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 2: 49%|████▉ | 6053/12384 [12:50:38<13:33:30, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 2: 49%|████▉ | 6053/12384 [12:50:46<13:33:30, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.59s]
Epoch 2: 49%|████▉ | 6054/12384 [12:50:46<13:29:24, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.59s]
Epoch 2: 49%|████▉ | 6054/12384 [12:50:53<13:29:24, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 2: 49%|████▉ | 6055/12384 [12:50:53<13:27:47, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 2: 49%|████▉ | 6055/12384 [12:51:01<13:27:47, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.32s]
Epoch 2: 49%|████▉ | 6056/12384 [12:51:01<13:26:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.32s]
Epoch 2: 49%|████▉ | 6056/12384 [12:51:09<13:26:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.93s]
Epoch 2: 49%|████▉ | 6057/12384 [12:51:09<13:25:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.93s]
Epoch 2: 49%|████▉ | 6057/12384 [12:51:16<13:25:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 2: 49%|████▉ | 6058/12384 [12:51:16<13:24:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 2: 49%|████▉ | 6058/12384 [12:51:24<13:24:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.32s]
Epoch 2: 49%|████▉ | 6059/12384 [12:51:24<13:24:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.32s]
Epoch 2: 49%|████▉ | 6059/12384 [12:51:32<13:24:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 2: 49%|████▉ | 6060/12384 [12:51:32<13:23:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 2: 49%|████▉ | 6060/12384 [12:51:39<13:23:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 49%|████▉ | 6061/12384 [12:51:39<13:25:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 49%|████▉ | 6061/12384 [12:51:47<13:25:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 2: 49%|████▉ | 6062/12384 [12:51:47<13:23:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 2: 49%|████▉ | 6062/12384 [12:51:54<13:23:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 2: 49%|████▉ | 6063/12384 [12:51:54<13:22:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 2: 49%|████▉ | 6063/12384 [12:52:02<13:22:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 49%|████▉ | 6064/12384 [12:52:02<13:22:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 49%|████▉ | 6064/12384 [12:52:10<13:22:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 49%|████▉ | 6065/12384 [12:52:10<13:21:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 49%|████▉ | 6065/12384 [12:52:17<13:21:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 49%|████▉ | 6066/12384 [12:52:17<13:21:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 49%|████▉ | 6066/12384 [12:52:25<13:21:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 49%|████▉ | 6067/12384 [12:52:25<13:20:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 49%|████▉ | 6067/12384 [12:52:32<13:20:55, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 2: 49%|████▉ | 6068/12384 [12:52:32<13:20:10, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 2: 49%|████▉ | 6068/12384 [12:52:40<13:20:10, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.97s]
Epoch 2: 49%|████▉ | 6069/12384 [12:52:40<13:20:02, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.97s]
Epoch 2: 49%|████▉ | 6069/12384 [12:52:48<13:20:02, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 2: 49%|████▉ | 6070/12384 [12:52:48<13:19:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 2: 49%|████▉ | 6070/12384 [12:52:55<13:19:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 49%|████▉ | 6071/12384 [12:52:55<13:19:23, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 49%|████▉ | 6071/12384 [12:53:03<13:19:23, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 49%|████▉ | 6072/12384 [12:53:03<13:20:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 49%|████▉ | 6072/12384 [12:53:10<13:20:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.22s]
Epoch 2: 49%|████▉ | 6073/12384 [12:53:10<13:20:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.22s]
Epoch 2: 49%|████▉ | 6073/12384 [12:53:19<13:20:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 2: 49%|████▉ | 6074/12384 [12:53:19<13:34:06, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 2: 49%|████▉ | 6074/12384 [12:53:26<13:34:06, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=9.49s]
Epoch 2: 49%|████▉ | 6075/12384 [12:53:26<13:29:49, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.49s]
Epoch 2: 49%|████▉ | 6075/12384 [12:53:34<13:29:49, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 2: 49%|████▉ | 6076/12384 [12:53:34<13:26:12, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 2: 49%|████▉ | 6076/12384 [12:53:41<13:26:12, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 2: 49%|████▉ | 6077/12384 [12:53:41<13:24:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 2: 49%|████▉ | 6077/12384 [12:53:49<13:24:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.92s]
Epoch 2: 49%|████▉ | 6078/12384 [12:53:49<13:23:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.92s]
Epoch 2: 49%|████▉ | 6078/12384 [12:53:57<13:23:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 2: 49%|████▉ | 6079/12384 [12:53:57<13:21:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 2: 49%|████▉ | 6079/12384 [12:54:04<13:21:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 49%|████▉ | 6080/12384 [12:54:04<13:20:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 49%|████▉ | 6080/12384 [12:54:12<13:20:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 49%|████▉ | 6081/12384 [12:54:12<13:20:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 49%|████▉ | 6081/12384 [12:54:19<13:20:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 49%|████▉ | 6082/12384 [12:54:19<13:20:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 49%|████▉ | 6082/12384 [12:54:27<13:20:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 49%|████▉ | 6083/12384 [12:54:27<13:19:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 49%|████▉ | 6083/12384 [12:54:35<13:19:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 49%|████▉ | 6084/12384 [12:54:35<13:19:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 49%|████▉ | 6084/12384 [12:54:42<13:19:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 2: 49%|████▉ | 6085/12384 [12:54:42<13:22:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 2: 49%|████▉ | 6085/12384 [12:54:50<13:22:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.92s]
Epoch 2: 49%|████▉ | 6086/12384 [12:54:50<13:20:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.92s]
Epoch 2: 49%|████▉ | 6086/12384 [12:54:58<13:20:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 49%|████▉ | 6087/12384 [12:54:58<13:21:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 49%|████▉ | 6087/12384 [12:55:05<13:21:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 49%|████▉ | 6088/12384 [12:55:05<13:20:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 49%|████▉ | 6088/12384 [12:55:13<13:20:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 49%|████▉ | 6089/12384 [12:55:13<13:19:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 49%|████▉ | 6089/12384 [12:55:20<13:19:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 49%|████▉ | 6090/12384 [12:55:20<13:19:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 49%|████▉ | 6090/12384 [12:55:28<13:19:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 49%|████▉ | 6091/12384 [12:55:28<13:18:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 49%|████▉ | 6091/12384 [12:55:36<13:18:31, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.61s]
Epoch 2: 49%|████▉ | 6092/12384 [12:55:36<13:18:24, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.61s]
Epoch 2: 49%|████▉ | 6092/12384 [12:55:43<13:18:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 49%|████▉ | 6093/12384 [12:55:43<13:18:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 49%|████▉ | 6093/12384 [12:55:51<13:18:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 2: 49%|████▉ | 6094/12384 [12:55:51<13:18:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 2: 49%|████▉ | 6094/12384 [12:55:59<13:18:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 2: 49%|████▉ | 6095/12384 [12:55:59<13:18:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 2: 49%|████▉ | 6095/12384 [12:56:06<13:18:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 49%|████▉ | 6096/12384 [12:56:06<13:18:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 49%|████▉ | 6096/12384 [12:56:14<13:18:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 49%|████▉ | 6097/12384 [12:56:14<13:18:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 49%|████▉ | 6097/12384 [12:56:21<13:18:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.78s]
Epoch 2: 49%|████▉ | 6098/12384 [12:56:21<13:17:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.78s]
Epoch 2: 49%|████▉ | 6098/12384 [12:56:29<13:17:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.43s]
Epoch 2: 49%|████▉ | 6099/12384 [12:56:29<13:16:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.43s]
Epoch 2: 49%|████▉ | 6099/12384 [12:56:37<13:16:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 49%|████▉ | 6100/12384 [12:56:37<13:16:10, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 49%|████▉ | 6100/12384 [12:56:44<13:16:10, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 49%|████▉ | 6101/12384 [12:56:44<13:26:29, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 49%|████▉ | 6101/12384 [12:56:52<13:26:29, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 49%|████▉ | 6102/12384 [12:56:52<13:24:36, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 49%|████▉ | 6102/12384 [12:57:00<13:24:36, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=7.66s]
Epoch 2: 49%|████▉ | 6103/12384 [12:57:00<13:22:32, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=7.66s]
Epoch 2: 49%|████▉ | 6103/12384 [12:57:08<13:22:32, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 2: 49%|████▉ | 6104/12384 [12:57:08<13:30:14, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 2: 49%|████▉ | 6104/12384 [12:57:15<13:30:14, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 49%|████▉ | 6105/12384 [12:57:15<13:26:29, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 49%|████▉ | 6105/12384 [12:57:23<13:26:29, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 49%|████▉ | 6106/12384 [12:57:23<13:22:41, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 49%|████▉ | 6106/12384 [12:57:30<13:22:41, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 49%|████▉ | 6107/12384 [12:57:30<13:20:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 49%|████▉ | 6107/12384 [12:57:38<13:20:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 49%|████▉ | 6108/12384 [12:57:38<13:19:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 49%|████▉ | 6108/12384 [12:57:46<13:19:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 2: 49%|████▉ | 6109/12384 [12:57:46<13:17:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 2: 49%|████▉ | 6109/12384 [12:57:53<13:17:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 2: 49%|████▉ | 6110/12384 [12:57:53<13:16:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 2: 49%|████▉ | 6110/12384 [12:58:01<13:16:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 49%|████▉ | 6111/12384 [12:58:01<13:15:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 49%|████▉ | 6111/12384 [12:58:08<13:15:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 49%|████▉ | 6112/12384 [12:58:08<13:15:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 49%|████▉ | 6112/12384 [12:58:16<13:15:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.69s]
Epoch 2: 49%|████▉ | 6113/12384 [12:58:16<13:14:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.69s]
Epoch 2: 49%|████▉ | 6113/12384 [12:58:24<13:14:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.36s]
Epoch 2: 49%|████▉ | 6114/12384 [12:58:24<13:14:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.36s]
Epoch 2: 49%|████▉ | 6114/12384 [12:58:31<13:14:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 2: 49%|████▉ | 6115/12384 [12:58:31<13:15:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 2: 49%|████▉ | 6115/12384 [12:58:39<13:15:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 49%|████▉ | 6116/12384 [12:58:39<13:14:27, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 49%|████▉ | 6116/12384 [12:58:46<13:14:27, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 49%|████▉ | 6117/12384 [12:58:46<13:14:04, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 49%|████▉ | 6117/12384 [12:58:54<13:14:04, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 49%|████▉ | 6118/12384 [12:58:54<13:14:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 49%|████▉ | 6118/12384 [12:59:02<13:14:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 49%|████▉ | 6119/12384 [12:59:02<13:14:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 49%|████▉ | 6119/12384 [12:59:09<13:14:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 49%|████▉ | 6120/12384 [12:59:09<13:14:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 49%|████▉ | 6120/12384 [12:59:17<13:14:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.64s]
Epoch 2: 49%|████▉ | 6121/12384 [12:59:17<13:13:48, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=3.64s]
Epoch 2: 49%|████▉ | 6121/12384 [12:59:24<13:13:48, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 2: 49%|████▉ | 6122/12384 [12:59:24<13:13:04, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 2: 49%|████▉ | 6122/12384 [12:59:32<13:13:04, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.32s]
Epoch 2: 49%|████▉ | 6123/12384 [12:59:32<13:12:54, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.32s]
Epoch 2: 49%|████▉ | 6123/12384 [12:59:40<13:12:54, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 2: 49%|████▉ | 6124/12384 [12:59:40<13:13:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 2: 49%|████▉ | 6124/12384 [12:59:47<13:13:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 2: 49%|████▉ | 6125/12384 [12:59:47<13:13:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 2: 49%|████▉ | 6125/12384 [12:59:55<13:13:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 49%|████▉ | 6126/12384 [12:59:55<13:13:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 49%|████▉ | 6126/12384 [13:00:03<13:13:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 49%|████▉ | 6127/12384 [13:00:03<13:23:16, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 49%|████▉ | 6127/12384 [13:00:11<13:23:16, 7.70s/it, loss=0.0003, acc=0.9995, iter_time=8.30s]
Epoch 2: 49%|████▉ | 6128/12384 [13:00:11<13:23:00, 7.70s/it, loss=0.0003, acc=0.9995, iter_time=8.30s]
Epoch 2: 49%|████▉ | 6128/12384 [13:00:18<13:23:00, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.71s]
Epoch 2: 49%|████▉ | 6129/12384 [13:00:18<13:19:16, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.71s]
Epoch 2: 49%|████▉ | 6129/12384 [13:00:26<13:19:16, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.48s]
Epoch 2: 49%|████▉ | 6130/12384 [13:00:26<13:26:49, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=10.48s]
Epoch 2: 49%|████▉ | 6130/12384 [13:00:34<13:26:49, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 2: 50%|████▉ | 6131/12384 [13:00:34<13:22:24, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 2: 50%|████▉ | 6131/12384 [13:00:41<13:22:24, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.16s]
Epoch 2: 50%|████▉ | 6132/12384 [13:00:41<13:20:31, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.16s]
Epoch 2: 50%|████▉ | 6132/12384 [13:00:49<13:20:31, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.61s]
Epoch 2: 50%|████▉ | 6133/12384 [13:00:49<13:18:36, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.61s]
Epoch 2: 50%|████▉ | 6133/12384 [13:00:57<13:18:36, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 2: 50%|████▉ | 6134/12384 [13:00:57<13:16:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 2: 50%|████▉ | 6134/12384 [13:01:04<13:16:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 50%|████▉ | 6135/12384 [13:01:04<13:14:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 50%|████▉ | 6135/12384 [13:01:12<13:14:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 50%|████▉ | 6136/12384 [13:01:12<13:14:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 50%|████▉ | 6136/12384 [13:01:19<13:14:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 2: 50%|████▉ | 6137/12384 [13:01:19<13:14:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 2: 50%|████▉ | 6137/12384 [13:01:27<13:14:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.95s]
Epoch 2: 50%|████▉ | 6138/12384 [13:01:27<13:13:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.95s]
Epoch 2: 50%|████▉ | 6138/12384 [13:01:35<13:13:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 2: 50%|████▉ | 6139/12384 [13:01:35<13:13:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 2: 50%|████▉ | 6139/12384 [13:01:42<13:13:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 2: 50%|████▉ | 6140/12384 [13:01:42<13:13:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 2: 50%|████▉ | 6140/12384 [13:01:50<13:13:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 2: 50%|████▉ | 6141/12384 [13:01:50<13:12:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 2: 50%|████▉ | 6141/12384 [13:01:57<13:12:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.86s]
Epoch 2: 50%|████▉ | 6142/12384 [13:01:57<13:12:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.86s]
Epoch 2: 50%|████▉ | 6142/12384 [13:02:05<13:12:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 50%|████▉ | 6143/12384 [13:02:05<13:12:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 50%|████▉ | 6143/12384 [13:02:13<13:12:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 50%|████▉ | 6144/12384 [13:02:13<13:13:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 50%|████▉ | 6144/12384 [13:02:20<13:13:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.27s]
Epoch 2: 50%|████▉ | 6145/12384 [13:02:20<13:12:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.27s]
Epoch 2: 50%|████▉ | 6145/12384 [13:02:28<13:12:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.01s]
Epoch 2: 50%|████▉ | 6146/12384 [13:02:28<13:12:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.01s]
Epoch 2: 50%|████▉ | 6146/12384 [13:02:36<13:12:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 50%|████▉ | 6147/12384 [13:02:36<13:11:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 50%|████▉ | 6147/12384 [13:02:43<13:11:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 50%|████▉ | 6148/12384 [13:02:43<13:10:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 50%|████▉ | 6148/12384 [13:02:51<13:10:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 50%|████▉ | 6149/12384 [13:02:51<13:10:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 50%|████▉ | 6149/12384 [13:02:58<13:10:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 50%|████▉ | 6150/12384 [13:02:58<13:10:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 50%|████▉ | 6150/12384 [13:03:06<13:10:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 2: 50%|████▉ | 6151/12384 [13:03:06<13:09:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 2: 50%|████▉ | 6151/12384 [13:03:14<13:09:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.19s]
Epoch 2: 50%|████▉ | 6152/12384 [13:03:14<13:10:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.19s]
Epoch 2: 50%|████▉ | 6152/12384 [13:03:22<13:10:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 2: 50%|████▉ | 6153/12384 [13:03:22<13:23:20, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 2: 50%|████▉ | 6153/12384 [13:03:29<13:23:20, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 50%|████▉ | 6154/12384 [13:03:29<13:18:45, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 50%|████▉ | 6154/12384 [13:03:37<13:18:45, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 2: 50%|████▉ | 6155/12384 [13:03:37<13:15:34, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 2: 50%|████▉ | 6155/12384 [13:03:45<13:15:34, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 50%|████▉ | 6156/12384 [13:03:45<13:23:43, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 50%|████▉ | 6156/12384 [13:03:52<13:23:43, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 50%|████▉ | 6157/12384 [13:03:52<13:19:26, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 50%|████▉ | 6157/12384 [13:04:00<13:19:26, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 2: 50%|████▉ | 6158/12384 [13:04:00<13:16:56, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 2: 50%|████▉ | 6158/12384 [13:04:08<13:16:56, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 2: 50%|████▉ | 6159/12384 [13:04:08<13:14:38, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 2: 50%|████▉ | 6159/12384 [13:04:15<13:14:38, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 50%|████▉ | 6160/12384 [13:04:15<13:13:57, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 50%|████▉ | 6160/12384 [13:04:23<13:13:57, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=3.66s]
Epoch 2: 50%|████▉ | 6161/12384 [13:04:23<13:12:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.66s]
Epoch 2: 50%|████▉ | 6161/12384 [13:04:30<13:12:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.93s]
Epoch 2: 50%|████▉ | 6162/12384 [13:04:30<13:11:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.93s]
Epoch 2: 50%|████▉ | 6162/12384 [13:04:38<13:11:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 2: 50%|████▉ | 6163/12384 [13:04:38<13:11:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 2: 50%|████▉ | 6163/12384 [13:04:46<13:11:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.50s]
Epoch 2: 50%|████▉ | 6164/12384 [13:04:46<13:10:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.50s]
Epoch 2: 50%|████▉ | 6164/12384 [13:04:53<13:10:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 2: 50%|████▉ | 6165/12384 [13:04:53<13:10:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 2: 50%|████▉ | 6165/12384 [13:05:01<13:10:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 2: 50%|████▉ | 6166/12384 [13:05:01<13:10:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 2: 50%|████▉ | 6166/12384 [13:05:09<13:10:23, 7.63s/it, loss=0.0004, acc=1.0000, iter_time=10.48s]
Epoch 2: 50%|████▉ | 6167/12384 [13:05:09<13:10:03, 7.62s/it, loss=0.0004, acc=1.0000, iter_time=10.48s]
Epoch 2: 50%|████▉ | 6167/12384 [13:05:16<13:10:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 50%|████▉ | 6168/12384 [13:05:16<13:10:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 50%|████▉ | 6168/12384 [13:05:24<13:10:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 50%|████▉ | 6169/12384 [13:05:24<13:10:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 50%|████▉ | 6169/12384 [13:05:31<13:10:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 50%|████▉ | 6170/12384 [13:05:31<13:09:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 50%|████▉ | 6170/12384 [13:05:39<13:09:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.73s]
Epoch 2: 50%|████▉ | 6171/12384 [13:05:39<13:09:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.73s]
Epoch 2: 50%|████▉ | 6171/12384 [13:05:47<13:09:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 2: 50%|████▉ | 6172/12384 [13:05:47<13:08:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 2: 50%|████▉ | 6172/12384 [13:05:54<13:08:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.30s]
Epoch 2: 50%|████▉ | 6173/12384 [13:05:54<13:08:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.30s]
Epoch 2: 50%|████▉ | 6173/12384 [13:06:02<13:08:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 2: 50%|████▉ | 6174/12384 [13:06:02<13:07:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 2: 50%|████▉ | 6174/12384 [13:06:09<13:07:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 2: 50%|████▉ | 6175/12384 [13:06:09<13:07:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 2: 50%|████▉ | 6175/12384 [13:06:17<13:07:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 50%|████▉ | 6176/12384 [13:06:17<13:07:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 50%|████▉ | 6176/12384 [13:06:25<13:07:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.23s]
Epoch 2: 50%|████▉ | 6177/12384 [13:06:25<13:06:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.23s]
Epoch 2: 50%|████▉ | 6177/12384 [13:06:32<13:06:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.57s]
Epoch 2: 50%|████▉ | 6178/12384 [13:06:32<13:06:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.57s]
Epoch 2: 50%|████▉ | 6178/12384 [13:06:40<13:06:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 2: 50%|████▉ | 6179/12384 [13:06:40<13:17:21, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 2: 50%|████▉ | 6179/12384 [13:06:48<13:17:21, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 2: 50%|████▉ | 6180/12384 [13:06:48<13:14:41, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 2: 50%|████▉ | 6180/12384 [13:06:55<13:14:41, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.70s]
Epoch 2: 50%|████▉ | 6181/12384 [13:06:55<13:12:33, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.70s]
Epoch 2: 50%|████▉ | 6181/12384 [13:07:03<13:12:33, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=11.09s]
Epoch 2: 50%|████▉ | 6182/12384 [13:07:03<13:10:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.09s]
Epoch 2: 50%|████▉ | 6182/12384 [13:07:11<13:10:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.67s]
Epoch 2: 50%|████▉ | 6183/12384 [13:07:11<13:08:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.67s]
Epoch 2: 50%|████▉ | 6183/12384 [13:07:18<13:08:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.49s]
Epoch 2: 50%|████▉ | 6184/12384 [13:07:18<13:07:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.49s]
Epoch 2: 50%|████▉ | 6184/12384 [13:07:26<13:07:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 50%|████▉ | 6185/12384 [13:07:26<13:09:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 50%|████▉ | 6185/12384 [13:07:34<13:09:07, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.71s]
Epoch 2: 50%|████▉ | 6186/12384 [13:07:34<13:08:34, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.71s]
Epoch 2: 50%|████▉ | 6186/12384 [13:07:41<13:08:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 2: 50%|████▉ | 6187/12384 [13:07:41<13:07:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 2: 50%|████▉ | 6187/12384 [13:07:49<13:07:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 2: 50%|████▉ | 6188/12384 [13:07:49<13:06:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 2: 50%|████▉ | 6188/12384 [13:07:56<13:06:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 2: 50%|████▉ | 6189/12384 [13:07:56<13:06:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 2: 50%|████▉ | 6189/12384 [13:08:04<13:06:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.94s]
Epoch 2: 50%|████▉ | 6190/12384 [13:08:04<13:06:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.94s]
Epoch 2: 50%|████▉ | 6190/12384 [13:08:12<13:06:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 50%|████▉ | 6191/12384 [13:08:12<13:05:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 50%|████▉ | 6191/12384 [13:08:19<13:05:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 2: 50%|█████ | 6192/12384 [13:08:19<13:07:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 2: 50%|█████ | 6192/12384 [13:08:27<13:07:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 50%|█████ | 6193/12384 [13:08:27<13:07:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 50%|█████ | 6193/12384 [13:08:35<13:07:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 50%|█████ | 6194/12384 [13:08:35<13:06:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 50%|█████ | 6194/12384 [13:08:42<13:06:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 2: 50%|█████ | 6195/12384 [13:08:42<13:06:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 2: 50%|█████ | 6195/12384 [13:08:50<13:06:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 2: 50%|█████ | 6196/12384 [13:08:50<13:05:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 2: 50%|█████ | 6196/12384 [13:08:57<13:05:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 50%|█████ | 6197/12384 [13:08:57<13:04:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 50%|█████ | 6197/12384 [13:09:05<13:04:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 50%|█████ | 6198/12384 [13:09:05<13:06:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 50%|█████ | 6198/12384 [13:09:13<13:06:28, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 2: 50%|█████ | 6199/12384 [13:09:13<13:07:12, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 2: 50%|█████ | 6199/12384 [13:09:20<13:07:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 50%|█████ | 6200/12384 [13:09:20<13:07:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 50%|█████ | 6200/12384 [13:09:28<13:07:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 50%|█████ | 6201/12384 [13:09:28<13:07:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 50%|█████ | 6201/12384 [13:09:36<13:07:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 50%|█████ | 6202/12384 [13:09:36<13:05:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 50%|█████ | 6202/12384 [13:09:43<13:05:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 50%|█████ | 6203/12384 [13:09:43<13:04:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 50%|█████ | 6203/12384 [13:09:51<13:04:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 2: 50%|█████ | 6204/12384 [13:09:51<13:04:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 2: 50%|█████ | 6204/12384 [13:09:59<13:04:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 2: 50%|█████ | 6205/12384 [13:09:59<13:14:09, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 2: 50%|█████ | 6205/12384 [13:10:06<13:14:09, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 2: 50%|█████ | 6206/12384 [13:10:06<13:11:37, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 2: 50%|█████ | 6206/12384 [13:10:14<13:11:37, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 2: 50%|█████ | 6207/12384 [13:10:14<13:09:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 2: 50%|█████ | 6207/12384 [13:10:22<13:09:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 2: 50%|█████ | 6208/12384 [13:10:22<13:07:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 2: 50%|█████ | 6208/12384 [13:10:29<13:07:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 50%|█████ | 6209/12384 [13:10:29<13:05:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 50%|█████ | 6209/12384 [13:10:37<13:05:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 50%|█████ | 6210/12384 [13:10:37<13:04:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 50%|█████ | 6210/12384 [13:10:44<13:04:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 2: 50%|█████ | 6211/12384 [13:10:44<13:04:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 2: 50%|█████ | 6211/12384 [13:10:52<13:04:10, 7.62s/it, loss=0.0001, acc=0.9995, iter_time=9.62s]
Epoch 2: 50%|█████ | 6212/12384 [13:10:52<13:03:41, 7.62s/it, loss=0.0001, acc=0.9995, iter_time=9.62s]
Epoch 2: 50%|█████ | 6212/12384 [13:11:00<13:03:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 50%|█████ | 6213/12384 [13:11:00<13:03:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 50%|█████ | 6213/12384 [13:11:07<13:03:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 50%|█████ | 6214/12384 [13:11:07<13:02:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 50%|█████ | 6214/12384 [13:11:15<13:02:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 50%|█████ | 6215/12384 [13:11:15<13:02:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 50%|█████ | 6215/12384 [13:11:23<13:02:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 50%|█████ | 6216/12384 [13:11:23<13:03:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 50%|█████ | 6216/12384 [13:11:30<13:03:42, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 2: 50%|█████ | 6217/12384 [13:11:30<13:02:26, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 2: 50%|█████ | 6217/12384 [13:11:38<13:02:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 50%|█████ | 6218/12384 [13:11:38<13:02:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 50%|█████ | 6218/12384 [13:11:45<13:02:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 50%|█████ | 6219/12384 [13:11:45<13:06:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 50%|█████ | 6219/12384 [13:11:53<13:06:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 2: 50%|█████ | 6220/12384 [13:11:53<13:05:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 2: 50%|█████ | 6220/12384 [13:12:01<13:05:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 2: 50%|█████ | 6221/12384 [13:12:01<13:03:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 2: 50%|█████ | 6221/12384 [13:12:08<13:03:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 2: 50%|█████ | 6222/12384 [13:12:08<13:02:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 2: 50%|█████ | 6222/12384 [13:12:16<13:02:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 2: 50%|█████ | 6223/12384 [13:12:16<13:02:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 2: 50%|█████ | 6223/12384 [13:12:24<13:02:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 50%|█████ | 6224/12384 [13:12:24<13:02:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 50%|█████ | 6224/12384 [13:12:31<13:02:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 50%|█████ | 6225/12384 [13:12:31<13:01:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 50%|█████ | 6225/12384 [13:12:39<13:01:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 2: 50%|█████ | 6226/12384 [13:12:39<13:01:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 2: 50%|█████ | 6226/12384 [13:12:46<13:01:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 2: 50%|█████ | 6227/12384 [13:12:46<13:00:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 2: 50%|█████ | 6227/12384 [13:12:54<13:00:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 2: 50%|█████ | 6228/12384 [13:12:54<13:05:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 2: 50%|█████ | 6228/12384 [13:13:02<13:05:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.65s]
Epoch 2: 50%|█████ | 6229/12384 [13:13:02<13:04:25, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.65s]
Epoch 2: 50%|█████ | 6229/12384 [13:13:09<13:04:25, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 2: 50%|█████ | 6230/12384 [13:13:09<13:02:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 2: 50%|█████ | 6230/12384 [13:13:17<13:02:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 50%|█████ | 6231/12384 [13:13:17<13:02:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 50%|█████ | 6231/12384 [13:13:25<13:02:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.10s]
Epoch 2: 50%|█████ | 6232/12384 [13:13:25<13:17:44, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=10.10s]
Epoch 2: 50%|█████ | 6232/12384 [13:13:33<13:17:44, 7.78s/it, loss=0.0001, acc=1.0000, iter_time=7.40s]
Epoch 2: 50%|█████ | 6233/12384 [13:13:33<13:12:54, 7.73s/it, loss=0.0001, acc=1.0000, iter_time=7.40s]
Epoch 2: 50%|█████ | 6233/12384 [13:13:40<13:12:54, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 2: 50%|█████ | 6234/12384 [13:13:40<13:11:01, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 2: 50%|█████ | 6234/12384 [13:13:48<13:11:01, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 2: 50%|█████ | 6235/12384 [13:13:48<13:07:05, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 2: 50%|█████ | 6235/12384 [13:13:56<13:07:05, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 50%|█████ | 6236/12384 [13:13:56<13:13:40, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 50%|█████ | 6236/12384 [13:14:03<13:13:40, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 2: 50%|█████ | 6237/12384 [13:14:03<13:09:24, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 2: 50%|█████ | 6237/12384 [13:14:11<13:09:24, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 2: 50%|█████ | 6238/12384 [13:14:11<13:06:38, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 2: 50%|█████ | 6238/12384 [13:14:19<13:06:38, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 50%|█████ | 6239/12384 [13:14:19<13:04:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 50%|█████ | 6239/12384 [13:14:26<13:04:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 50%|█████ | 6240/12384 [13:14:26<13:02:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 50%|█████ | 6240/12384 [13:14:34<13:02:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.59s]
Epoch 2: 50%|█████ | 6241/12384 [13:14:34<13:01:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.59s]
Epoch 2: 50%|█████ | 6241/12384 [13:14:42<13:01:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 2: 50%|█████ | 6242/12384 [13:14:42<13:03:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 2: 50%|█████ | 6242/12384 [13:14:49<13:03:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.77s]
Epoch 2: 50%|█████ | 6243/12384 [13:14:49<13:05:06, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.77s]
Epoch 2: 50%|█████ | 6243/12384 [13:14:57<13:05:06, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 2: 50%|█████ | 6244/12384 [13:14:57<13:03:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 2: 50%|█████ | 6244/12384 [13:15:05<13:03:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 2: 50%|█████ | 6245/12384 [13:15:05<13:02:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 2: 50%|█████ | 6245/12384 [13:15:12<13:02:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 2: 50%|█████ | 6246/12384 [13:15:12<13:01:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 2: 50%|█████ | 6246/12384 [13:15:20<13:01:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 2: 50%|█████ | 6247/12384 [13:15:20<13:01:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 2: 50%|█████ | 6247/12384 [13:15:27<13:01:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 50%|█████ | 6248/12384 [13:15:27<13:00:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 50%|█████ | 6248/12384 [13:15:35<13:00:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 50%|█████ | 6249/12384 [13:15:35<12:59:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 50%|█████ | 6249/12384 [13:15:43<12:59:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 50%|█████ | 6250/12384 [13:15:43<13:00:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 50%|█████ | 6250/12384 [13:15:50<13:00:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 2: 50%|█████ | 6251/12384 [13:15:50<12:59:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 2: 50%|█████ | 6251/12384 [13:15:58<12:59:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 2: 50%|█████ | 6252/12384 [13:15:58<12:59:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 2: 50%|█████ | 6252/12384 [13:16:06<12:59:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 2: 50%|█████ | 6253/12384 [13:16:06<12:58:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 2: 50%|█████ | 6253/12384 [13:16:13<12:58:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 2: 51%|█████ | 6254/12384 [13:16:13<12:58:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 2: 51%|█████ | 6254/12384 [13:16:21<12:58:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 51%|█████ | 6255/12384 [13:16:21<12:58:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 51%|█████ | 6255/12384 [13:16:28<12:58:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 2: 51%|█████ | 6256/12384 [13:16:28<12:57:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 2: 51%|█████ | 6256/12384 [13:16:36<12:57:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 51%|█████ | 6257/12384 [13:16:36<12:58:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 51%|█████ | 6257/12384 [13:16:44<12:58:29, 7.62s/it, loss=0.0001, acc=0.9998, iter_time=7.71s]
Epoch 2: 51%|█████ | 6258/12384 [13:16:44<13:10:05, 7.74s/it, loss=0.0001, acc=0.9998, iter_time=7.71s]
Epoch 2: 51%|█████ | 6258/12384 [13:16:52<13:10:05, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 2: 51%|█████ | 6259/12384 [13:16:52<13:06:43, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 2: 51%|█████ | 6259/12384 [13:16:59<13:06:43, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 2: 51%|█████ | 6260/12384 [13:16:59<13:05:08, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 2: 51%|█████ | 6260/12384 [13:17:07<13:05:08, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 2: 51%|█████ | 6261/12384 [13:17:07<13:02:46, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 2: 51%|█████ | 6261/12384 [13:17:15<13:02:46, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 51%|█████ | 6262/12384 [13:17:15<13:09:37, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 51%|█████ | 6262/12384 [13:17:23<13:09:37, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 51%|█████ | 6263/12384 [13:17:23<13:06:27, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 51%|█████ | 6263/12384 [13:17:30<13:06:27, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 2: 51%|█████ | 6264/12384 [13:17:30<13:05:06, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 2: 51%|█████ | 6264/12384 [13:17:38<13:05:06, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 2: 51%|█████ | 6265/12384 [13:17:38<13:01:53, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 2: 51%|█████ | 6265/12384 [13:17:45<13:01:53, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.38s]
Epoch 2: 51%|█████ | 6266/12384 [13:17:45<13:00:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.38s]
Epoch 2: 51%|█████ | 6266/12384 [13:17:53<13:00:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 51%|█████ | 6267/12384 [13:17:53<12:58:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 51%|█████ | 6267/12384 [13:18:01<12:58:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 51%|█████ | 6268/12384 [13:18:01<12:57:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 51%|█████ | 6268/12384 [13:18:08<12:57:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 51%|█████ | 6269/12384 [13:18:08<12:57:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 51%|█████ | 6269/12384 [13:18:16<12:57:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 51%|█████ | 6270/12384 [13:18:16<12:56:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 51%|█████ | 6270/12384 [13:18:23<12:56:21, 7.62s/it, loss=0.0002, acc=0.9986, iter_time=7.62s]
Epoch 2: 51%|█████ | 6271/12384 [13:18:23<12:55:53, 7.62s/it, loss=0.0002, acc=0.9986, iter_time=7.62s]
Epoch 2: 51%|█████ | 6271/12384 [13:18:31<12:55:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 51%|█████ | 6272/12384 [13:18:31<12:55:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 51%|█████ | 6272/12384 [13:18:39<12:55:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 51%|█████ | 6273/12384 [13:18:39<12:55:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 51%|█████ | 6273/12384 [13:18:46<12:55:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 51%|█████ | 6274/12384 [13:18:46<12:55:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 51%|█████ | 6274/12384 [13:18:54<12:55:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.01s]
Epoch 2: 51%|█████ | 6275/12384 [13:18:54<12:55:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.01s]
Epoch 2: 51%|█████ | 6275/12384 [13:19:02<12:55:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.21s]
Epoch 2: 51%|█████ | 6276/12384 [13:19:02<12:55:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.21s]
Epoch 2: 51%|█████ | 6276/12384 [13:19:09<12:55:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 51%|█████ | 6277/12384 [13:19:09<12:55:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 51%|█████ | 6277/12384 [13:19:17<12:55:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.27s]
Epoch 2: 51%|█████ | 6278/12384 [13:19:17<12:54:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.27s]
Epoch 2: 51%|█████ | 6278/12384 [13:19:24<12:54:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.96s]
Epoch 2: 51%|█████ | 6279/12384 [13:19:24<12:54:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.96s]
Epoch 2: 51%|█████ | 6279/12384 [13:19:32<12:54:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 51%|█████ | 6280/12384 [13:19:32<12:54:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 51%|█████ | 6280/12384 [13:19:40<12:54:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 51%|█████ | 6281/12384 [13:19:40<12:54:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 51%|█████ | 6281/12384 [13:19:47<12:54:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 51%|█████ | 6282/12384 [13:19:47<12:55:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 51%|█████ | 6282/12384 [13:19:55<12:55:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 51%|█████ | 6283/12384 [13:19:55<12:56:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 51%|█████ | 6283/12384 [13:20:02<12:56:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 51%|█████ | 6284/12384 [13:20:02<12:55:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 51%|█████ | 6284/12384 [13:20:10<12:55:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 51%|█████ | 6285/12384 [13:20:10<13:04:28, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 51%|█████ | 6285/12384 [13:20:18<13:04:28, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 51%|█████ | 6286/12384 [13:20:18<13:01:09, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 51%|█████ | 6286/12384 [13:20:26<13:01:09, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 2: 51%|█████ | 6287/12384 [13:20:26<13:00:43, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 2: 51%|█████ | 6287/12384 [13:20:33<13:00:43, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 51%|█████ | 6288/12384 [13:20:33<12:57:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 51%|█████ | 6288/12384 [13:20:41<12:57:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 51%|█████ | 6289/12384 [13:20:41<13:03:47, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 51%|█████ | 6289/12384 [13:20:49<13:03:47, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 51%|█████ | 6290/12384 [13:20:49<13:00:04, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 51%|█████ | 6290/12384 [13:20:56<13:00:04, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=3.65s]
Epoch 2: 51%|█████ | 6291/12384 [13:20:56<12:57:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=3.65s]
Epoch 2: 51%|█████ | 6291/12384 [13:21:04<12:57:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.54s]
Epoch 2: 51%|█████ | 6292/12384 [13:21:04<12:55:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.54s]
Epoch 2: 51%|█████ | 6292/12384 [13:21:12<12:55:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.49s]
Epoch 2: 51%|█████ | 6293/12384 [13:21:12<12:54:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.49s]
Epoch 2: 51%|█████ | 6293/12384 [13:21:19<12:54:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 2: 51%|█████ | 6294/12384 [13:21:19<12:53:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 2: 51%|█████ | 6294/12384 [13:21:27<12:53:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 51%|█████ | 6295/12384 [13:21:27<12:52:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 51%|█████ | 6295/12384 [13:21:34<12:52:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 51%|█████ | 6296/12384 [13:21:34<12:55:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 51%|█████ | 6296/12384 [13:21:42<12:55:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 2: 51%|█████ | 6297/12384 [13:21:42<12:54:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 2: 51%|█████ | 6297/12384 [13:21:50<12:54:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 2: 51%|█████ | 6298/12384 [13:21:50<13:03:23, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 2: 51%|█████ | 6298/12384 [13:21:58<13:03:23, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 51%|█████ | 6299/12384 [13:21:58<12:59:27, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 51%|█████ | 6299/12384 [13:22:05<12:59:27, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 2: 51%|█████ | 6300/12384 [13:22:05<12:57:47, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 2: 51%|█████ | 6300/12384 [13:22:13<12:57:47, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 2: 51%|█████ | 6301/12384 [13:22:13<12:55:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 2: 51%|█████ | 6301/12384 [13:22:20<12:55:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 2: 51%|█████ | 6302/12384 [13:22:20<12:54:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 2: 51%|█████ | 6302/12384 [13:22:28<12:54:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 2: 51%|█████ | 6303/12384 [13:22:28<12:53:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 2: 51%|█████ | 6303/12384 [13:22:36<12:53:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 51%|█████ | 6304/12384 [13:22:36<12:52:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 51%|█████ | 6304/12384 [13:22:43<12:52:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.37s]
Epoch 2: 51%|█████ | 6305/12384 [13:22:43<12:52:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.37s]
Epoch 2: 51%|█████ | 6305/12384 [13:22:51<12:52:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 2: 51%|█████ | 6306/12384 [13:22:51<12:52:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 2: 51%|█████ | 6306/12384 [13:22:59<12:52:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 2: 51%|█████ | 6307/12384 [13:22:59<12:51:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 2: 51%|█████ | 6307/12384 [13:23:06<12:51:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 51%|█████ | 6308/12384 [13:23:06<12:51:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 51%|█████ | 6308/12384 [13:23:14<12:51:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 51%|█████ | 6309/12384 [13:23:14<12:51:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 51%|█████ | 6309/12384 [13:23:21<12:51:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 51%|█████ | 6310/12384 [13:23:21<12:51:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 51%|█████ | 6310/12384 [13:23:29<12:51:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 51%|█████ | 6311/12384 [13:23:29<13:03:52, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 51%|█████ | 6311/12384 [13:23:37<13:03:52, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.38s]
Epoch 2: 51%|█████ | 6312/12384 [13:23:37<13:03:50, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=8.38s]
Epoch 2: 51%|█████ | 6312/12384 [13:23:45<13:03:50, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.44s]
Epoch 2: 51%|█████ | 6313/12384 [13:23:45<13:02:13, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.44s]
Epoch 2: 51%|█████ | 6313/12384 [13:23:52<13:02:13, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 51%|█████ | 6314/12384 [13:23:52<12:58:43, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 51%|█████ | 6314/12384 [13:24:00<12:58:43, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 2: 51%|█████ | 6315/12384 [13:24:00<12:55:43, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 2: 51%|█████ | 6315/12384 [13:24:08<12:55:43, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 2: 51%|█████ | 6316/12384 [13:24:08<12:54:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 2: 51%|█████ | 6316/12384 [13:24:15<12:54:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 2: 51%|█████ | 6317/12384 [13:24:15<12:52:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 2: 51%|█████ | 6317/12384 [13:24:23<12:52:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 2: 51%|█████ | 6318/12384 [13:24:23<12:51:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 2: 51%|█████ | 6318/12384 [13:24:31<12:51:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 2: 51%|█████ | 6319/12384 [13:24:31<12:50:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 2: 51%|█████ | 6319/12384 [13:24:38<12:50:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 51%|█████ | 6320/12384 [13:24:38<12:50:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 51%|█████ | 6320/12384 [13:24:46<12:50:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.90s]
Epoch 2: 51%|█████ | 6321/12384 [13:24:46<12:49:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.90s]
Epoch 2: 51%|█████ | 6321/12384 [13:24:53<12:49:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 51%|█████ | 6322/12384 [13:24:53<12:49:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 51%|█████ | 6322/12384 [13:25:01<12:49:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 51%|█████ | 6323/12384 [13:25:01<12:48:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 51%|█████ | 6323/12384 [13:25:09<12:48:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 51%|█████ | 6324/12384 [13:25:09<12:49:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 51%|█████ | 6324/12384 [13:25:16<12:49:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 51%|█████ | 6325/12384 [13:25:16<12:49:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 51%|█████ | 6325/12384 [13:25:24<12:49:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 51%|█████ | 6326/12384 [13:25:24<12:48:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 51%|█████ | 6326/12384 [13:25:31<12:48:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 51%|█████ | 6327/12384 [13:25:31<12:48:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 51%|█████ | 6327/12384 [13:25:39<12:48:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 51%|█████ | 6328/12384 [13:25:39<12:48:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 51%|█████ | 6328/12384 [13:25:47<12:48:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 51%|█████ | 6329/12384 [13:25:47<12:48:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 51%|█████ | 6329/12384 [13:25:54<12:48:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 51%|█████ | 6330/12384 [13:25:54<12:48:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 51%|█████ | 6330/12384 [13:26:02<12:48:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 2: 51%|█████ | 6331/12384 [13:26:02<12:48:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.57s]
Epoch 2: 51%|█████ | 6331/12384 [13:26:10<12:48:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.08s]
Epoch 2: 51%|█████ | 6332/12384 [13:26:10<12:48:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.08s]
Epoch 2: 51%|█████ | 6332/12384 [13:26:17<12:48:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 51%|█████ | 6333/12384 [13:26:17<12:47:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 51%|█████ | 6333/12384 [13:26:25<12:47:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 2: 51%|█████ | 6334/12384 [13:26:25<12:50:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 2: 51%|█████ | 6334/12384 [13:26:32<12:50:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.22s]
Epoch 2: 51%|█████ | 6335/12384 [13:26:32<12:49:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.22s]
Epoch 2: 51%|█████ | 6335/12384 [13:26:40<12:49:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 51%|█████ | 6336/12384 [13:26:40<12:49:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 51%|█████ | 6336/12384 [13:26:48<12:49:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 51%|█████ | 6337/12384 [13:26:48<12:58:57, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 51%|█████ | 6337/12384 [13:26:56<12:58:57, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 51%|█████ | 6338/12384 [13:26:56<12:54:57, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 51%|█████ | 6338/12384 [13:27:03<12:54:57, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 2: 51%|█████ | 6339/12384 [13:27:03<12:52:24, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 2: 51%|█████ | 6339/12384 [13:27:11<12:52:24, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 2: 51%|█████ | 6340/12384 [13:27:11<12:50:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 2: 51%|█████ | 6340/12384 [13:27:18<12:50:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.41s]
Epoch 2: 51%|█████ | 6341/12384 [13:27:18<12:49:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.41s]
Epoch 2: 51%|█████ | 6341/12384 [13:27:26<12:49:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 2: 51%|█████ | 6342/12384 [13:27:26<12:47:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 2: 51%|█████ | 6342/12384 [13:27:34<12:47:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 2: 51%|█████ | 6343/12384 [13:27:34<12:47:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 2: 51%|█████ | 6343/12384 [13:27:41<12:47:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.64s]
Epoch 2: 51%|█████ | 6344/12384 [13:27:41<12:47:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.64s]
Epoch 2: 51%|█████ | 6344/12384 [13:27:49<12:47:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.71s]
Epoch 2: 51%|█████ | 6345/12384 [13:27:49<12:46:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.71s]
Epoch 2: 51%|█████ | 6345/12384 [13:27:56<12:46:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.82s]
Epoch 2: 51%|█████ | 6346/12384 [13:27:56<12:46:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.82s]
Epoch 2: 51%|█████ | 6346/12384 [13:28:04<12:46:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.86s]
Epoch 2: 51%|█████▏ | 6347/12384 [13:28:04<12:46:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.86s]
Epoch 2: 51%|█████▏ | 6347/12384 [13:28:12<12:46:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.66s]
Epoch 2: 51%|█████▏ | 6348/12384 [13:28:12<12:46:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.66s]
Epoch 2: 51%|█████▏ | 6348/12384 [13:28:19<12:46:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 51%|█████▏ | 6349/12384 [13:28:19<12:45:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 51%|█████▏ | 6349/12384 [13:28:27<12:45:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 51%|█████▏ | 6350/12384 [13:28:27<12:45:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 51%|█████▏ | 6350/12384 [13:28:35<12:45:03, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.37s]
Epoch 2: 51%|█████▏ | 6351/12384 [13:28:35<12:44:09, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.37s]
Epoch 2: 51%|█████▏ | 6351/12384 [13:28:42<12:44:09, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 2: 51%|█████▏ | 6352/12384 [13:28:42<12:44:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 2: 51%|█████▏ | 6352/12384 [13:28:50<12:44:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 51%|█████▏ | 6353/12384 [13:28:50<12:45:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 51%|█████▏ | 6353/12384 [13:28:57<12:45:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 51%|█████▏ | 6354/12384 [13:28:57<12:44:08, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 51%|█████▏ | 6354/12384 [13:29:05<12:44:08, 7.60s/it, loss=0.0002, acc=0.9993, iter_time=7.60s]
Epoch 2: 51%|█████▏ | 6355/12384 [13:29:05<12:43:33, 7.60s/it, loss=0.0002, acc=0.9993, iter_time=7.60s]
Epoch 2: 51%|█████▏ | 6355/12384 [13:29:13<12:43:33, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 51%|█████▏ | 6356/12384 [13:29:13<12:45:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 51%|█████▏ | 6356/12384 [13:29:20<12:45:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 51%|█████▏ | 6357/12384 [13:29:20<12:45:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 51%|█████▏ | 6357/12384 [13:29:28<12:45:48, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 2: 51%|█████▏ | 6358/12384 [13:29:28<12:44:31, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 2: 51%|█████▏ | 6358/12384 [13:29:35<12:44:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 51%|█████▏ | 6359/12384 [13:29:35<12:44:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 51%|█████▏ | 6359/12384 [13:29:43<12:44:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 51%|█████▏ | 6360/12384 [13:29:43<12:43:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 51%|█████▏ | 6360/12384 [13:29:51<12:43:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.72s]
Epoch 2: 51%|█████▏ | 6361/12384 [13:29:51<12:44:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.72s]
Epoch 2: 51%|█████▏ | 6361/12384 [13:29:58<12:44:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.55s]
Epoch 2: 51%|█████▏ | 6362/12384 [13:29:58<12:44:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.55s]
Epoch 2: 51%|█████▏ | 6362/12384 [13:30:06<12:44:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.24s]
Epoch 2: 51%|█████▏ | 6363/12384 [13:30:06<12:54:05, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.24s]
Epoch 2: 51%|█████▏ | 6363/12384 [13:30:14<12:54:05, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 51%|█████▏ | 6364/12384 [13:30:14<12:50:11, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 51%|█████▏ | 6364/12384 [13:30:21<12:50:11, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 51%|█████▏ | 6365/12384 [13:30:21<12:48:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 51%|█████▏ | 6365/12384 [13:30:29<12:48:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 2: 51%|█████▏ | 6366/12384 [13:30:29<12:49:35, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 2: 51%|█████▏ | 6366/12384 [13:30:37<12:49:35, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 51%|█████▏ | 6367/12384 [13:30:37<12:56:06, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 51%|█████▏ | 6367/12384 [13:30:45<12:56:06, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 51%|█████▏ | 6368/12384 [13:30:45<12:51:48, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 51%|█████▏ | 6368/12384 [13:30:52<12:51:48, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 51%|█████▏ | 6369/12384 [13:30:52<12:48:36, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 51%|█████▏ | 6369/12384 [13:31:00<12:48:36, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 2: 51%|█████▏ | 6370/12384 [13:31:00<12:46:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 2: 51%|█████▏ | 6370/12384 [13:31:07<12:46:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 2: 51%|█████▏ | 6371/12384 [13:31:07<12:45:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 2: 51%|█████▏ | 6371/12384 [13:31:15<12:45:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 2: 51%|█████▏ | 6372/12384 [13:31:15<12:44:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 2: 51%|█████▏ | 6372/12384 [13:31:23<12:44:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 2: 51%|█████▏ | 6373/12384 [13:31:23<12:43:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 2: 51%|█████▏ | 6373/12384 [13:31:30<12:43:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 2: 51%|█████▏ | 6374/12384 [13:31:30<12:42:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 2: 51%|█████▏ | 6374/12384 [13:31:38<12:42:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 51%|█████▏ | 6375/12384 [13:31:38<12:42:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 51%|█████▏ | 6375/12384 [13:31:46<12:42:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 2: 51%|█████▏ | 6376/12384 [13:31:46<12:44:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 2: 51%|█████▏ | 6376/12384 [13:31:53<12:44:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.75s]
Epoch 2: 51%|█████▏ | 6377/12384 [13:31:53<12:43:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.75s]
Epoch 2: 51%|█████▏ | 6377/12384 [13:32:01<12:43:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 2: 52%|█████▏ | 6378/12384 [13:32:01<12:42:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 2: 52%|█████▏ | 6378/12384 [13:32:08<12:42:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 52%|█████▏ | 6379/12384 [13:32:08<12:42:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 52%|█████▏ | 6379/12384 [13:32:16<12:42:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 52%|█████▏ | 6380/12384 [13:32:16<12:42:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 52%|█████▏ | 6380/12384 [13:32:24<12:42:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 52%|█████▏ | 6381/12384 [13:32:24<12:42:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 52%|█████▏ | 6381/12384 [13:32:31<12:42:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 52%|█████▏ | 6382/12384 [13:32:31<12:42:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 52%|█████▏ | 6382/12384 [13:32:39<12:42:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.25s]
Epoch 2: 52%|█████▏ | 6383/12384 [13:32:39<12:42:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.25s]
Epoch 2: 52%|█████▏ | 6383/12384 [13:32:46<12:42:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.96s]
Epoch 2: 52%|█████▏ | 6384/12384 [13:32:46<12:41:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.96s]
Epoch 2: 52%|█████▏ | 6384/12384 [13:32:54<12:41:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 52%|█████▏ | 6385/12384 [13:32:54<12:41:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 52%|█████▏ | 6385/12384 [13:33:02<12:41:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 52%|█████▏ | 6386/12384 [13:33:02<12:41:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 52%|█████▏ | 6386/12384 [13:33:09<12:41:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 52%|█████▏ | 6387/12384 [13:33:09<12:40:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 52%|█████▏ | 6387/12384 [13:33:17<12:40:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 2: 52%|█████▏ | 6388/12384 [13:33:17<12:41:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 2: 52%|█████▏ | 6388/12384 [13:33:25<12:41:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.59s]
Epoch 2: 52%|█████▏ | 6389/12384 [13:33:25<12:51:10, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.59s]
Epoch 2: 52%|█████▏ | 6389/12384 [13:33:33<12:51:10, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 52%|█████▏ | 6390/12384 [13:33:33<12:48:21, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 52%|█████▏ | 6390/12384 [13:33:40<12:48:21, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 2: 52%|█████▏ | 6391/12384 [13:33:40<12:45:47, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 2: 52%|█████▏ | 6391/12384 [13:33:48<12:45:47, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 52%|█████▏ | 6392/12384 [13:33:48<12:44:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 52%|█████▏ | 6392/12384 [13:33:56<12:44:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 52%|█████▏ | 6393/12384 [13:33:56<12:50:12, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 52%|█████▏ | 6393/12384 [13:34:03<12:50:12, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 52%|█████▏ | 6394/12384 [13:34:03<12:46:49, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 52%|█████▏ | 6394/12384 [13:34:11<12:46:49, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 2: 52%|█████▏ | 6395/12384 [13:34:11<12:44:23, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 2: 52%|█████▏ | 6395/12384 [13:34:18<12:44:23, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 2: 52%|█████▏ | 6396/12384 [13:34:18<12:42:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 2: 52%|█████▏ | 6396/12384 [13:34:26<12:42:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 52%|█████▏ | 6397/12384 [13:34:26<12:40:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 52%|█████▏ | 6397/12384 [13:34:34<12:40:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 52%|█████▏ | 6398/12384 [13:34:34<12:39:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 52%|█████▏ | 6398/12384 [13:34:41<12:39:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 2: 52%|█████▏ | 6399/12384 [13:34:41<12:40:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 2: 52%|█████▏ | 6399/12384 [13:34:49<12:40:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 2: 52%|█████▏ | 6400/12384 [13:34:49<12:39:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 2: 52%|█████▏ | 6400/12384 [13:34:56<12:39:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.27s]
Epoch 2: 52%|█████▏ | 6401/12384 [13:34:56<12:39:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.27s]
Epoch 2: 52%|█████▏ | 6401/12384 [13:35:04<12:39:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.38s]
Epoch 2: 52%|█████▏ | 6402/12384 [13:35:04<12:39:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.38s]
Epoch 2: 52%|█████▏ | 6402/12384 [13:35:12<12:39:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 2: 52%|█████▏ | 6403/12384 [13:35:12<12:38:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 2: 52%|█████▏ | 6403/12384 [13:35:19<12:38:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 2: 52%|█████▏ | 6404/12384 [13:35:19<12:38:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 2: 52%|█████▏ | 6404/12384 [13:35:27<12:38:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 2: 52%|█████▏ | 6405/12384 [13:35:27<12:38:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 2: 52%|█████▏ | 6405/12384 [13:35:34<12:38:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.48s]
Epoch 2: 52%|█████▏ | 6406/12384 [13:35:34<12:38:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.48s]
Epoch 2: 52%|█████▏ | 6406/12384 [13:35:42<12:38:05, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=5.08s]
Epoch 2: 52%|█████▏ | 6407/12384 [13:35:42<12:37:14, 7.60s/it, loss=0.0002, acc=1.0000, iter_time=5.08s]
Epoch 2: 52%|█████▏ | 6407/12384 [13:35:50<12:37:14, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.08s]
Epoch 2: 52%|█████▏ | 6408/12384 [13:35:50<12:37:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.08s]
Epoch 2: 52%|█████▏ | 6408/12384 [13:35:57<12:37:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.41s]
Epoch 2: 52%|█████▏ | 6409/12384 [13:35:57<12:37:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.41s]
Epoch 2: 52%|█████▏ | 6409/12384 [13:36:05<12:37:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 2: 52%|█████▏ | 6410/12384 [13:36:05<12:37:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 2: 52%|█████▏ | 6410/12384 [13:36:13<12:37:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 2: 52%|█████▏ | 6411/12384 [13:36:13<12:37:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 2: 52%|█████▏ | 6411/12384 [13:36:20<12:37:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 2: 52%|█████▏ | 6412/12384 [13:36:20<12:37:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 2: 52%|█████▏ | 6412/12384 [13:36:28<12:37:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 2: 52%|█████▏ | 6413/12384 [13:36:28<12:36:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 2: 52%|█████▏ | 6413/12384 [13:36:35<12:36:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 2: 52%|█████▏ | 6414/12384 [13:36:35<12:38:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 2: 52%|█████▏ | 6414/12384 [13:36:43<12:38:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 52%|█████▏ | 6415/12384 [13:36:43<12:37:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 52%|█████▏ | 6415/12384 [13:36:51<12:37:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 2: 52%|█████▏ | 6416/12384 [13:36:51<12:46:05, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 2: 52%|█████▏ | 6416/12384 [13:36:58<12:46:05, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.44s]
Epoch 2: 52%|█████▏ | 6417/12384 [13:36:58<12:42:59, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.44s]
Epoch 2: 52%|█████▏ | 6417/12384 [13:37:06<12:42:59, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 52%|█████▏ | 6418/12384 [13:37:06<12:40:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 52%|█████▏ | 6418/12384 [13:37:14<12:40:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 52%|█████▏ | 6419/12384 [13:37:14<12:48:19, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 52%|█████▏ | 6419/12384 [13:37:22<12:48:19, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 52%|█████▏ | 6420/12384 [13:37:22<12:44:34, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 52%|█████▏ | 6420/12384 [13:37:29<12:44:34, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 52%|█████▏ | 6421/12384 [13:37:29<12:42:04, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 52%|█████▏ | 6421/12384 [13:37:37<12:42:04, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 2: 52%|█████▏ | 6422/12384 [13:37:37<12:40:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 2: 52%|█████▏ | 6422/12384 [13:37:44<12:40:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 2: 52%|█████▏ | 6423/12384 [13:37:44<12:39:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 2: 52%|█████▏ | 6423/12384 [13:37:52<12:39:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.15s]
Epoch 2: 52%|█████▏ | 6424/12384 [13:37:52<12:38:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.15s]
Epoch 2: 52%|█████▏ | 6424/12384 [13:38:00<12:38:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 52%|█████▏ | 6425/12384 [13:38:00<12:38:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 52%|█████▏ | 6425/12384 [13:38:07<12:38:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 52%|█████▏ | 6426/12384 [13:38:07<12:37:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 52%|█████▏ | 6426/12384 [13:38:15<12:37:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 52%|█████▏ | 6427/12384 [13:38:15<12:36:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 52%|█████▏ | 6427/12384 [13:38:23<12:36:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 2: 52%|█████▏ | 6428/12384 [13:38:23<12:35:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 2: 52%|█████▏ | 6428/12384 [13:38:30<12:35:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 2: 52%|█████▏ | 6429/12384 [13:38:30<12:34:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 2: 52%|█████▏ | 6429/12384 [13:38:38<12:34:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 2: 52%|█████▏ | 6430/12384 [13:38:38<12:34:29, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 2: 52%|█████▏ | 6430/12384 [13:38:45<12:34:29, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 52%|█████▏ | 6431/12384 [13:38:45<12:34:01, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 52%|█████▏ | 6431/12384 [13:38:53<12:34:01, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.81s]
Epoch 2: 52%|█████▏ | 6432/12384 [13:38:53<12:34:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.81s]
Epoch 2: 52%|█████▏ | 6432/12384 [13:39:01<12:34:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.18s]
Epoch 2: 52%|█████▏ | 6433/12384 [13:39:01<12:34:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.18s]
Epoch 2: 52%|█████▏ | 6433/12384 [13:39:08<12:34:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 52%|█████▏ | 6434/12384 [13:39:08<12:34:05, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 52%|█████▏ | 6434/12384 [13:39:16<12:34:05, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 52%|█████▏ | 6435/12384 [13:39:16<12:35:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 52%|█████▏ | 6435/12384 [13:39:23<12:35:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 52%|█████▏ | 6436/12384 [13:39:23<12:35:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 52%|█████▏ | 6436/12384 [13:39:31<12:35:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 52%|█████▏ | 6437/12384 [13:39:31<12:36:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 52%|█████▏ | 6437/12384 [13:39:39<12:36:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 52%|█████▏ | 6438/12384 [13:39:39<12:35:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 52%|█████▏ | 6438/12384 [13:39:46<12:35:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 2: 52%|█████▏ | 6439/12384 [13:39:46<12:35:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 2: 52%|█████▏ | 6439/12384 [13:39:54<12:35:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.31s]
Epoch 2: 52%|█████▏ | 6440/12384 [13:39:54<12:34:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.31s]
Epoch 2: 52%|█████▏ | 6440/12384 [13:40:02<12:34:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 52%|█████▏ | 6441/12384 [13:40:02<12:34:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 52%|█████▏ | 6441/12384 [13:40:09<12:34:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.13s]
Epoch 2: 52%|█████▏ | 6442/12384 [13:40:09<12:43:43, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.13s]
Epoch 2: 52%|█████▏ | 6442/12384 [13:40:17<12:43:43, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 2: 52%|█████▏ | 6443/12384 [13:40:17<12:40:50, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 2: 52%|█████▏ | 6443/12384 [13:40:25<12:40:50, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 52%|█████▏ | 6444/12384 [13:40:25<12:37:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 52%|█████▏ | 6444/12384 [13:40:32<12:37:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 52%|█████▏ | 6445/12384 [13:40:32<12:36:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 52%|█████▏ | 6445/12384 [13:40:40<12:36:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 2: 52%|█████▏ | 6446/12384 [13:40:40<12:35:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 2: 52%|█████▏ | 6446/12384 [13:40:47<12:35:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 2: 52%|█████▏ | 6447/12384 [13:40:47<12:34:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 2: 52%|█████▏ | 6447/12384 [13:40:55<12:34:24, 7.62s/it, loss=0.0002, acc=0.9997, iter_time=7.56s]
Epoch 2: 52%|█████▏ | 6448/12384 [13:40:55<12:33:49, 7.62s/it, loss=0.0002, acc=0.9997, iter_time=7.56s]
Epoch 2: 52%|█████▏ | 6448/12384 [13:41:03<12:33:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 52%|█████▏ | 6449/12384 [13:41:03<12:33:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 52%|█████▏ | 6449/12384 [13:41:10<12:33:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 52%|█████▏ | 6450/12384 [13:41:10<12:32:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 52%|█████▏ | 6450/12384 [13:41:18<12:32:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 52%|█████▏ | 6451/12384 [13:41:18<12:32:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 52%|█████▏ | 6451/12384 [13:41:25<12:32:02, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 2: 52%|█████▏ | 6452/12384 [13:41:25<12:32:11, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 2: 52%|█████▏ | 6452/12384 [13:41:33<12:32:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 52%|█████▏ | 6453/12384 [13:41:33<12:33:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 52%|█████▏ | 6453/12384 [13:41:41<12:33:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 2: 52%|█████▏ | 6454/12384 [13:41:41<12:32:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 2: 52%|█████▏ | 6454/12384 [13:41:48<12:32:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 52%|█████▏ | 6455/12384 [13:41:48<12:32:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 52%|█████▏ | 6455/12384 [13:41:56<12:32:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 52%|█████▏ | 6456/12384 [13:41:56<12:32:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 52%|█████▏ | 6456/12384 [13:42:04<12:32:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.44s]
Epoch 2: 52%|█████▏ | 6457/12384 [13:42:04<12:32:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.44s]
Epoch 2: 52%|█████▏ | 6457/12384 [13:42:11<12:32:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 2: 52%|█████▏ | 6458/12384 [13:42:11<12:31:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 2: 52%|█████▏ | 6458/12384 [13:42:19<12:31:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.49s]
Epoch 2: 52%|█████▏ | 6459/12384 [13:42:19<12:31:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.49s]
Epoch 2: 52%|█████▏ | 6459/12384 [13:42:26<12:31:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 2: 52%|█████▏ | 6460/12384 [13:42:26<12:31:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 2: 52%|█████▏ | 6460/12384 [13:42:34<12:31:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 2: 52%|█████▏ | 6461/12384 [13:42:34<12:31:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 2: 52%|█████▏ | 6461/12384 [13:42:42<12:31:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 52%|█████▏ | 6462/12384 [13:42:42<12:31:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 52%|█████▏ | 6462/12384 [13:42:49<12:31:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 2: 52%|█████▏ | 6463/12384 [13:42:49<12:32:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 2: 52%|█████▏ | 6463/12384 [13:42:57<12:32:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 52%|█████▏ | 6464/12384 [13:42:57<12:32:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 52%|█████▏ | 6464/12384 [13:43:05<12:32:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.93s]
Epoch 2: 52%|█████▏ | 6465/12384 [13:43:05<12:31:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.93s]
Epoch 2: 52%|█████▏ | 6465/12384 [13:43:12<12:31:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 2: 52%|█████▏ | 6466/12384 [13:43:12<12:31:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 2: 52%|█████▏ | 6466/12384 [13:43:20<12:31:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 52%|█████▏ | 6467/12384 [13:43:20<12:30:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 52%|█████▏ | 6467/12384 [13:43:27<12:30:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 2: 52%|█████▏ | 6468/12384 [13:43:27<12:30:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 2: 52%|█████▏ | 6468/12384 [13:43:35<12:30:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.87s]
Epoch 2: 52%|█████▏ | 6469/12384 [13:43:35<12:39:35, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.87s]
Epoch 2: 52%|█████▏ | 6469/12384 [13:43:43<12:39:35, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 52%|█████▏ | 6470/12384 [13:43:43<12:36:53, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 52%|█████▏ | 6470/12384 [13:43:51<12:36:53, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.61s]
Epoch 2: 52%|█████▏ | 6471/12384 [13:43:51<12:35:33, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.61s]
Epoch 2: 52%|█████▏ | 6471/12384 [13:43:58<12:35:33, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=11.16s]
Epoch 2: 52%|█████▏ | 6472/12384 [13:43:58<12:36:37, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=11.16s]
Epoch 2: 52%|█████▏ | 6472/12384 [13:44:06<12:36:37, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.49s]
Epoch 2: 52%|█████▏ | 6473/12384 [13:44:06<12:42:17, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.49s]
Epoch 2: 52%|█████▏ | 6473/12384 [13:44:14<12:42:17, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 2: 52%|█████▏ | 6474/12384 [13:44:14<12:39:54, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 2: 52%|█████▏ | 6474/12384 [13:44:21<12:39:54, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.99s]
Epoch 2: 52%|█████▏ | 6475/12384 [13:44:21<12:36:27, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.99s]
Epoch 2: 52%|█████▏ | 6475/12384 [13:44:29<12:36:27, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 52%|█████▏ | 6476/12384 [13:44:29<12:34:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 52%|█████▏ | 6476/12384 [13:44:37<12:34:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 2: 52%|█████▏ | 6477/12384 [13:44:37<12:32:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 2: 52%|█████▏ | 6477/12384 [13:44:44<12:32:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 52%|█████▏ | 6478/12384 [13:44:44<12:31:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 52%|█████▏ | 6478/12384 [13:44:52<12:31:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 2: 52%|█████▏ | 6479/12384 [13:44:52<12:29:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 2: 52%|█████▏ | 6479/12384 [13:44:59<12:29:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 52%|█████▏ | 6480/12384 [13:44:59<12:29:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 52%|█████▏ | 6480/12384 [13:45:07<12:29:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 52%|█████▏ | 6481/12384 [13:45:07<12:29:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 52%|█████▏ | 6481/12384 [13:45:15<12:29:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 52%|█████▏ | 6482/12384 [13:45:15<12:28:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 52%|█████▏ | 6482/12384 [13:45:22<12:28:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 52%|█████▏ | 6483/12384 [13:45:22<12:28:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 52%|█████▏ | 6483/12384 [13:45:30<12:28:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 52%|█████▏ | 6484/12384 [13:45:30<12:28:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 52%|█████▏ | 6484/12384 [13:45:37<12:28:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 2: 52%|█████▏ | 6485/12384 [13:45:37<12:27:37, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 2: 52%|█████▏ | 6485/12384 [13:45:45<12:27:37, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.62s]
Epoch 2: 52%|█████▏ | 6486/12384 [13:45:45<12:27:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.62s]
Epoch 2: 52%|█████▏ | 6486/12384 [13:45:53<12:27:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 2: 52%|█████▏ | 6487/12384 [13:45:53<12:28:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 2: 52%|█████▏ | 6487/12384 [13:46:00<12:28:45, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.04s]
Epoch 2: 52%|█████▏ | 6488/12384 [13:46:00<12:28:21, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.04s]
Epoch 2: 52%|█████▏ | 6488/12384 [13:46:08<12:28:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 52%|█████▏ | 6489/12384 [13:46:08<12:28:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 52%|█████▏ | 6489/12384 [13:46:16<12:28:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 52%|█████▏ | 6490/12384 [13:46:16<12:28:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 52%|█████▏ | 6490/12384 [13:46:23<12:28:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 52%|█████▏ | 6491/12384 [13:46:23<12:27:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 52%|█████▏ | 6491/12384 [13:46:31<12:27:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 52%|█████▏ | 6492/12384 [13:46:31<12:27:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 52%|█████▏ | 6492/12384 [13:46:38<12:27:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.25s]
Epoch 2: 52%|█████▏ | 6493/12384 [13:46:38<12:28:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.25s]
Epoch 2: 52%|█████▏ | 6493/12384 [13:46:46<12:28:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 2: 52%|█████▏ | 6494/12384 [13:46:46<12:27:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.99s]
Epoch 2: 52%|█████▏ | 6494/12384 [13:46:54<12:27:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 52%|█████▏ | 6495/12384 [13:46:54<12:37:00, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 52%|█████▏ | 6495/12384 [13:47:02<12:37:00, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 2: 52%|█████▏ | 6496/12384 [13:47:02<12:33:59, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 2: 52%|█████▏ | 6496/12384 [13:47:09<12:33:59, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 52%|█████▏ | 6497/12384 [13:47:09<12:31:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 52%|█████▏ | 6497/12384 [13:47:17<12:31:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 2: 52%|█████▏ | 6498/12384 [13:47:17<12:30:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 2: 52%|█████▏ | 6498/12384 [13:47:25<12:30:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 2: 52%|█████▏ | 6499/12384 [13:47:25<12:36:19, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 2: 52%|█████▏ | 6499/12384 [13:47:32<12:36:19, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 52%|█████▏ | 6500/12384 [13:47:32<12:33:25, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 52%|█████▏ | 6500/12384 [13:47:40<12:33:25, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 52%|█████▏ | 6501/12384 [13:47:40<12:31:13, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 52%|█████▏ | 6501/12384 [13:47:47<12:31:13, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 53%|█████▎ | 6502/12384 [13:47:47<12:29:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 53%|█████▎ | 6502/12384 [13:47:55<12:29:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.94s]
Epoch 2: 53%|█████▎ | 6503/12384 [13:47:55<12:29:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.94s]
Epoch 2: 53%|█████▎ | 6503/12384 [13:48:03<12:29:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.02s]
Epoch 2: 53%|█████▎ | 6504/12384 [13:48:03<12:29:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.02s]
Epoch 2: 53%|█████▎ | 6504/12384 [13:48:10<12:29:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 53%|█████▎ | 6505/12384 [13:48:10<12:28:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 53%|█████▎ | 6505/12384 [13:48:18<12:28:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 53%|█████▎ | 6506/12384 [13:48:18<12:26:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 53%|█████▎ | 6506/12384 [13:48:26<12:26:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 53%|█████▎ | 6507/12384 [13:48:26<12:25:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 53%|█████▎ | 6507/12384 [13:48:33<12:25:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 2: 53%|█████▎ | 6508/12384 [13:48:33<12:25:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 2: 53%|█████▎ | 6508/12384 [13:48:41<12:25:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 2: 53%|█████▎ | 6509/12384 [13:48:41<12:24:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.07s]
Epoch 2: 53%|█████▎ | 6509/12384 [13:48:48<12:24:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.61s]
Epoch 2: 53%|█████▎ | 6510/12384 [13:48:48<12:25:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.61s]
Epoch 2: 53%|█████▎ | 6510/12384 [13:48:56<12:25:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 53%|█████▎ | 6511/12384 [13:48:56<12:24:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 53%|█████▎ | 6511/12384 [13:49:04<12:24:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 53%|█████▎ | 6512/12384 [13:49:04<12:24:12, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 53%|█████▎ | 6512/12384 [13:49:11<12:24:12, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 2: 53%|█████▎ | 6513/12384 [13:49:11<12:25:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 2: 53%|█████▎ | 6513/12384 [13:49:19<12:25:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 2: 53%|█████▎ | 6514/12384 [13:49:19<12:24:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 2: 53%|█████▎ | 6514/12384 [13:49:26<12:24:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 53%|█████▎ | 6515/12384 [13:49:26<12:24:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 53%|█████▎ | 6515/12384 [13:49:34<12:24:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 2: 53%|█████▎ | 6516/12384 [13:49:34<12:24:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 2: 53%|█████▎ | 6516/12384 [13:49:42<12:24:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.48s]
Epoch 2: 53%|█████▎ | 6517/12384 [13:49:42<12:24:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.48s]
Epoch 2: 53%|█████▎ | 6517/12384 [13:49:49<12:24:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 2: 53%|█████▎ | 6518/12384 [13:49:49<12:23:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 2: 53%|█████▎ | 6518/12384 [13:49:57<12:23:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.55s]
Epoch 2: 53%|█████▎ | 6519/12384 [13:49:57<12:24:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.55s]
Epoch 2: 53%|█████▎ | 6519/12384 [13:50:04<12:24:33, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.01s]
Epoch 2: 53%|█████▎ | 6520/12384 [13:50:04<12:23:39, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.01s]
Epoch 2: 53%|█████▎ | 6520/12384 [13:50:12<12:23:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 53%|█████▎ | 6521/12384 [13:50:12<12:33:09, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 53%|█████▎ | 6521/12384 [13:50:20<12:33:09, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 53%|█████▎ | 6522/12384 [13:50:20<12:30:10, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 53%|█████▎ | 6522/12384 [13:50:28<12:30:10, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 2: 53%|█████▎ | 6523/12384 [13:50:28<12:28:34, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 2: 53%|█████▎ | 6523/12384 [13:50:35<12:28:34, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 2: 53%|█████▎ | 6524/12384 [13:50:35<12:26:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 2: 53%|█████▎ | 6524/12384 [13:50:43<12:26:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 53%|█████▎ | 6525/12384 [13:50:43<12:33:07, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 53%|█████▎ | 6525/12384 [13:50:51<12:33:07, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 53%|█████▎ | 6526/12384 [13:50:51<12:29:54, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 53%|█████▎ | 6526/12384 [13:50:58<12:29:54, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 2: 53%|█████▎ | 6527/12384 [13:50:58<12:27:39, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 2: 53%|█████▎ | 6527/12384 [13:51:06<12:27:39, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.65s]
Epoch 2: 53%|█████▎ | 6528/12384 [13:51:06<12:25:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.65s]
Epoch 2: 53%|█████▎ | 6528/12384 [13:51:14<12:25:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 53%|█████▎ | 6529/12384 [13:51:14<12:25:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 53%|█████▎ | 6529/12384 [13:51:21<12:25:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 2: 53%|█████▎ | 6530/12384 [13:51:21<12:24:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 2: 53%|█████▎ | 6530/12384 [13:51:29<12:24:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 2: 53%|█████▎ | 6531/12384 [13:51:29<12:23:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 2: 53%|█████▎ | 6531/12384 [13:51:36<12:23:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 2: 53%|█████▎ | 6532/12384 [13:51:36<12:23:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 2: 53%|█████▎ | 6532/12384 [13:51:44<12:23:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.35s]
Epoch 2: 53%|█████▎ | 6533/12384 [13:51:44<12:25:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.35s]
Epoch 2: 53%|█████▎ | 6533/12384 [13:51:52<12:25:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 2: 53%|█████▎ | 6534/12384 [13:51:52<12:24:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 2: 53%|█████▎ | 6534/12384 [13:51:59<12:24:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 53%|█████▎ | 6535/12384 [13:51:59<12:23:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 53%|█████▎ | 6535/12384 [13:52:07<12:23:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 53%|█████▎ | 6536/12384 [13:52:07<12:22:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 53%|█████▎ | 6536/12384 [13:52:15<12:22:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.47s]
Epoch 2: 53%|█████▎ | 6537/12384 [13:52:15<12:22:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.47s]
Epoch 2: 53%|█████▎ | 6537/12384 [13:52:22<12:22:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.37s]
Epoch 2: 53%|█████▎ | 6538/12384 [13:52:22<12:21:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.37s]
Epoch 2: 53%|█████▎ | 6538/12384 [13:52:30<12:21:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 53%|█████▎ | 6539/12384 [13:52:30<12:22:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 53%|█████▎ | 6539/12384 [13:52:37<12:22:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 2: 53%|█████▎ | 6540/12384 [13:52:37<12:21:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 2: 53%|█████▎ | 6540/12384 [13:52:45<12:21:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 53%|█████▎ | 6541/12384 [13:52:45<12:21:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 53%|█████▎ | 6541/12384 [13:52:53<12:21:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 53%|█████▎ | 6542/12384 [13:52:53<12:21:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 53%|█████▎ | 6542/12384 [13:53:00<12:21:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 53%|█████▎ | 6543/12384 [13:53:00<12:20:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 53%|█████▎ | 6543/12384 [13:53:08<12:20:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 53%|█████▎ | 6544/12384 [13:53:08<12:20:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 53%|█████▎ | 6544/12384 [13:53:15<12:20:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 53%|█████▎ | 6545/12384 [13:53:15<12:21:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 53%|█████▎ | 6545/12384 [13:53:23<12:21:11, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=6.69s]
Epoch 2: 53%|█████▎ | 6546/12384 [13:53:23<12:21:16, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=6.69s]
Epoch 2: 53%|█████▎ | 6546/12384 [13:53:31<12:21:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.62s]
Epoch 2: 53%|█████▎ | 6547/12384 [13:53:31<12:31:03, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.62s]
Epoch 2: 53%|█████▎ | 6547/12384 [13:53:39<12:31:03, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=7.91s]
Epoch 2: 53%|█████▎ | 6548/12384 [13:53:39<12:27:43, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.91s]
Epoch 2: 53%|█████▎ | 6548/12384 [13:53:46<12:27:43, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 53%|█████▎ | 6549/12384 [13:53:46<12:25:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 53%|█████▎ | 6549/12384 [13:53:54<12:25:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 2: 53%|█████▎ | 6550/12384 [13:53:54<12:23:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 2: 53%|█████▎ | 6550/12384 [13:54:01<12:23:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 2: 53%|█████▎ | 6551/12384 [13:54:01<12:22:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 2: 53%|█████▎ | 6551/12384 [13:54:09<12:22:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 53%|█████▎ | 6552/12384 [13:54:09<12:21:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 53%|█████▎ | 6552/12384 [13:54:17<12:21:49, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.26s]
Epoch 2: 53%|█████▎ | 6553/12384 [13:54:17<12:20:09, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.26s]
Epoch 2: 53%|█████▎ | 6553/12384 [13:54:24<12:20:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 2: 53%|█████▎ | 6554/12384 [13:54:24<12:19:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 2: 53%|█████▎ | 6554/12384 [13:54:32<12:19:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 53%|█████▎ | 6555/12384 [13:54:32<12:19:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 53%|█████▎ | 6555/12384 [13:54:40<12:19:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 53%|█████▎ | 6556/12384 [13:54:40<12:19:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 53%|█████▎ | 6556/12384 [13:54:47<12:19:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 2: 53%|█████▎ | 6557/12384 [13:54:47<12:18:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 2: 53%|█████▎ | 6557/12384 [13:54:55<12:18:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.70s]
Epoch 2: 53%|█████▎ | 6558/12384 [13:54:55<12:18:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.70s]
Epoch 2: 53%|█████▎ | 6558/12384 [13:55:02<12:18:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 53%|█████▎ | 6559/12384 [13:55:02<12:19:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 53%|█████▎ | 6559/12384 [13:55:10<12:19:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 53%|█████▎ | 6560/12384 [13:55:10<12:18:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 53%|█████▎ | 6560/12384 [13:55:18<12:18:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 53%|█████▎ | 6561/12384 [13:55:18<12:18:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 53%|█████▎ | 6561/12384 [13:55:25<12:18:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 2: 53%|█████▎ | 6562/12384 [13:55:25<12:17:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 2: 53%|█████▎ | 6562/12384 [13:55:33<12:17:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.99s]
Epoch 2: 53%|█████▎ | 6563/12384 [13:55:33<12:20:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.99s]
Epoch 2: 53%|█████▎ | 6563/12384 [13:55:40<12:20:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 53%|█████▎ | 6564/12384 [13:55:40<12:18:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 53%|█████▎ | 6564/12384 [13:55:48<12:18:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.06s]
Epoch 2: 53%|█████▎ | 6565/12384 [13:55:48<12:18:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.06s]
Epoch 2: 53%|█████▎ | 6565/12384 [13:55:56<12:18:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 2: 53%|█████▎ | 6566/12384 [13:55:56<12:19:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 2: 53%|█████▎ | 6566/12384 [13:56:03<12:19:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 2: 53%|█████▎ | 6567/12384 [13:56:03<12:19:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 2: 53%|█████▎ | 6567/12384 [13:56:11<12:19:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 53%|█████▎ | 6568/12384 [13:56:11<12:19:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 53%|█████▎ | 6568/12384 [13:56:19<12:19:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 53%|█████▎ | 6569/12384 [13:56:19<12:18:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 53%|█████▎ | 6569/12384 [13:56:26<12:18:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 53%|█████▎ | 6570/12384 [13:56:26<12:18:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 53%|█████▎ | 6570/12384 [13:56:34<12:18:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 2: 53%|█████▎ | 6571/12384 [13:56:34<12:17:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 2: 53%|█████▎ | 6571/12384 [13:56:41<12:17:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 53%|█████▎ | 6572/12384 [13:56:41<12:17:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 53%|█████▎ | 6572/12384 [13:56:49<12:17:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 2: 53%|█████▎ | 6573/12384 [13:56:49<12:27:26, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 2: 53%|█████▎ | 6573/12384 [13:56:57<12:27:26, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=11.28s]
Epoch 2: 53%|█████▎ | 6574/12384 [13:56:57<12:23:50, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=11.28s]
Epoch 2: 53%|█████▎ | 6574/12384 [13:57:05<12:23:50, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 53%|█████▎ | 6575/12384 [13:57:05<12:22:18, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 53%|█████▎ | 6575/12384 [13:57:12<12:22:18, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 53%|█████▎ | 6576/12384 [13:57:12<12:20:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 53%|█████▎ | 6576/12384 [13:57:20<12:20:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 2: 53%|█████▎ | 6577/12384 [13:57:20<12:19:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 2: 53%|█████▎ | 6577/12384 [13:57:27<12:19:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 2: 53%|█████▎ | 6578/12384 [13:57:27<12:17:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 2: 53%|█████▎ | 6578/12384 [13:57:35<12:17:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 53%|█████▎ | 6579/12384 [13:57:35<12:17:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 53%|█████▎ | 6579/12384 [13:57:43<12:17:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 53%|█████▎ | 6580/12384 [13:57:43<12:16:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 53%|█████▎ | 6580/12384 [13:57:50<12:16:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 53%|█████▎ | 6581/12384 [13:57:50<12:15:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 53%|█████▎ | 6581/12384 [13:57:58<12:15:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 53%|█████▎ | 6582/12384 [13:57:58<12:15:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 53%|█████▎ | 6582/12384 [13:58:05<12:15:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 53%|█████▎ | 6583/12384 [13:58:05<12:17:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 53%|█████▎ | 6583/12384 [13:58:13<12:17:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 53%|█████▎ | 6584/12384 [13:58:13<12:17:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 53%|█████▎ | 6584/12384 [13:58:21<12:17:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 53%|█████▎ | 6585/12384 [13:58:21<12:17:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 53%|█████▎ | 6585/12384 [13:58:28<12:17:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 53%|█████▎ | 6586/12384 [13:58:28<12:16:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 53%|█████▎ | 6586/12384 [13:58:36<12:16:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 53%|█████▎ | 6587/12384 [13:58:36<12:16:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 53%|█████▎ | 6587/12384 [13:58:44<12:16:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 53%|█████▎ | 6588/12384 [13:58:44<12:15:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 53%|█████▎ | 6588/12384 [13:58:51<12:15:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 2: 53%|█████▎ | 6589/12384 [13:58:51<12:15:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 2: 53%|█████▎ | 6589/12384 [13:58:59<12:15:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 2: 53%|█████▎ | 6590/12384 [13:58:59<12:15:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 2: 53%|█████▎ | 6590/12384 [13:59:06<12:15:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 53%|█████▎ | 6591/12384 [13:59:06<12:15:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 53%|█████▎ | 6591/12384 [13:59:14<12:15:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 53%|█████▎ | 6592/12384 [13:59:14<12:14:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 53%|█████▎ | 6592/12384 [13:59:22<12:14:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.12s]
Epoch 2: 53%|█████▎ | 6593/12384 [13:59:22<12:13:59, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.12s]
Epoch 2: 53%|█████▎ | 6593/12384 [13:59:29<12:13:59, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 2: 53%|█████▎ | 6594/12384 [13:59:29<12:14:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 2: 53%|█████▎ | 6594/12384 [13:59:37<12:14:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 53%|█████▎ | 6595/12384 [13:59:37<12:13:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 53%|█████▎ | 6595/12384 [13:59:44<12:13:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 53%|█████▎ | 6596/12384 [13:59:44<12:13:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 53%|█████▎ | 6596/12384 [13:59:52<12:13:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 53%|█████▎ | 6597/12384 [13:59:52<12:14:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 53%|█████▎ | 6597/12384 [14:00:00<12:14:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 53%|█████▎ | 6598/12384 [14:00:00<12:13:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 53%|█████▎ | 6598/12384 [14:00:07<12:13:49, 7.61s/it, loss=0.0002, acc=0.9988, iter_time=7.66s]
Epoch 2: 53%|█████▎ | 6599/12384 [14:00:07<12:15:06, 7.62s/it, loss=0.0002, acc=0.9988, iter_time=7.66s]
Epoch 2: 53%|█████▎ | 6599/12384 [14:00:15<12:15:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 53%|█████▎ | 6600/12384 [14:00:15<12:23:31, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 53%|█████▎ | 6600/12384 [14:00:23<12:23:31, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 53%|█████▎ | 6601/12384 [14:00:23<12:19:51, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 53%|█████▎ | 6601/12384 [14:00:30<12:19:51, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 53%|█████▎ | 6602/12384 [14:00:30<12:17:52, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 53%|█████▎ | 6602/12384 [14:00:38<12:17:52, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 53%|█████▎ | 6603/12384 [14:00:38<12:24:51, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 53%|█████▎ | 6603/12384 [14:00:46<12:24:51, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 2: 53%|█████▎ | 6604/12384 [14:00:46<12:20:13, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 2: 53%|█████▎ | 6604/12384 [14:00:53<12:20:13, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.06s]
Epoch 2: 53%|█████▎ | 6605/12384 [14:00:53<12:17:44, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.06s]
Epoch 2: 53%|█████▎ | 6605/12384 [14:01:01<12:17:44, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.33s]
Epoch 2: 53%|█████▎ | 6606/12384 [14:01:01<12:16:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.33s]
Epoch 2: 53%|█████▎ | 6606/12384 [14:01:09<12:16:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 2: 53%|█████▎ | 6607/12384 [14:01:09<12:15:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 2: 53%|█████▎ | 6607/12384 [14:01:16<12:15:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 2: 53%|█████▎ | 6608/12384 [14:01:16<12:14:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 2: 53%|█████▎ | 6608/12384 [14:01:24<12:14:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 53%|█████▎ | 6609/12384 [14:01:24<12:13:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 53%|█████▎ | 6609/12384 [14:01:32<12:13:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 53%|█████▎ | 6610/12384 [14:01:32<12:13:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 53%|█████▎ | 6610/12384 [14:01:39<12:13:30, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 2: 53%|█████▎ | 6611/12384 [14:01:39<12:12:47, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 2: 53%|█████▎ | 6611/12384 [14:01:47<12:12:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 53%|█████▎ | 6612/12384 [14:01:47<12:12:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 53%|█████▎ | 6612/12384 [14:01:54<12:12:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 53%|█████▎ | 6613/12384 [14:01:54<12:12:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 53%|█████▎ | 6613/12384 [14:02:02<12:12:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 2: 53%|█████▎ | 6614/12384 [14:02:02<12:11:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 2: 53%|█████▎ | 6614/12384 [14:02:10<12:11:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 2: 53%|█████▎ | 6615/12384 [14:02:10<12:11:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 2: 53%|█████▎ | 6615/12384 [14:02:17<12:11:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 53%|█████▎ | 6616/12384 [14:02:17<12:11:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 53%|█████▎ | 6616/12384 [14:02:25<12:11:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 2: 53%|█████▎ | 6617/12384 [14:02:25<12:11:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 2: 53%|█████▎ | 6617/12384 [14:02:32<12:11:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 2: 53%|█████▎ | 6618/12384 [14:02:32<12:11:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 2: 53%|█████▎ | 6618/12384 [14:02:40<12:11:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 53%|█████▎ | 6619/12384 [14:02:40<12:11:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 53%|█████▎ | 6619/12384 [14:02:48<12:11:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 2: 53%|█████▎ | 6620/12384 [14:02:48<12:12:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 2: 53%|█████▎ | 6620/12384 [14:02:55<12:12:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 53%|█████▎ | 6621/12384 [14:02:55<12:12:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 53%|█████▎ | 6621/12384 [14:03:03<12:12:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 53%|█████▎ | 6622/12384 [14:03:03<12:11:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 53%|█████▎ | 6622/12384 [14:03:11<12:11:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 2: 53%|█████▎ | 6623/12384 [14:03:11<12:10:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 2: 53%|█████▎ | 6623/12384 [14:03:18<12:10:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 2: 53%|█████▎ | 6624/12384 [14:03:18<12:10:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 2: 53%|█████▎ | 6624/12384 [14:03:26<12:10:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 53%|█████▎ | 6625/12384 [14:03:26<12:10:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 53%|█████▎ | 6625/12384 [14:03:34<12:10:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.20s]
Epoch 2: 54%|█████▎ | 6626/12384 [14:03:34<12:20:02, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.20s]
Epoch 2: 54%|█████▎ | 6626/12384 [14:03:41<12:20:02, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 2: 54%|█████▎ | 6627/12384 [14:03:41<12:18:06, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 2: 54%|█████▎ | 6627/12384 [14:03:49<12:18:06, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 54%|█████▎ | 6628/12384 [14:03:49<12:15:24, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 54%|█████▎ | 6628/12384 [14:03:57<12:15:24, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 2: 54%|█████▎ | 6629/12384 [14:03:57<12:13:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 2: 54%|█████▎ | 6629/12384 [14:04:04<12:13:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 2: 54%|█████▎ | 6630/12384 [14:04:04<12:12:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 2: 54%|█████▎ | 6630/12384 [14:04:12<12:12:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 2: 54%|█████▎ | 6631/12384 [14:04:12<12:11:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 2: 54%|█████▎ | 6631/12384 [14:04:19<12:11:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.11s]
Epoch 2: 54%|█████▎ | 6632/12384 [14:04:19<12:10:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.11s]
Epoch 2: 54%|█████▎ | 6632/12384 [14:04:27<12:10:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 54%|█████▎ | 6633/12384 [14:04:27<12:10:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 54%|█████▎ | 6633/12384 [14:04:35<12:10:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 2: 54%|█████▎ | 6634/12384 [14:04:35<12:09:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 2: 54%|█████▎ | 6634/12384 [14:04:42<12:09:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 2: 54%|█████▎ | 6635/12384 [14:04:42<12:09:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 2: 54%|█████▎ | 6635/12384 [14:04:50<12:09:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 2: 54%|█████▎ | 6636/12384 [14:04:50<12:09:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 2: 54%|█████▎ | 6636/12384 [14:04:57<12:09:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 54%|█████▎ | 6637/12384 [14:04:57<12:09:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 54%|█████▎ | 6637/12384 [14:05:05<12:09:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 54%|█████▎ | 6638/12384 [14:05:05<12:09:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 54%|█████▎ | 6638/12384 [14:05:13<12:09:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 54%|█████▎ | 6639/12384 [14:05:13<12:08:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 54%|█████▎ | 6639/12384 [14:05:20<12:08:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 54%|█████▎ | 6640/12384 [14:05:20<12:08:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 54%|█████▎ | 6640/12384 [14:05:28<12:08:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 54%|█████▎ | 6641/12384 [14:05:28<12:08:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 54%|█████▎ | 6641/12384 [14:05:35<12:08:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 54%|█████▎ | 6642/12384 [14:05:35<12:08:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 54%|█████▎ | 6642/12384 [14:05:43<12:08:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 54%|█████▎ | 6643/12384 [14:05:43<12:08:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 54%|█████▎ | 6643/12384 [14:05:51<12:08:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 54%|█████▎ | 6644/12384 [14:05:51<12:08:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 54%|█████▎ | 6644/12384 [14:05:58<12:08:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 54%|█████▎ | 6645/12384 [14:05:58<12:08:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 54%|█████▎ | 6645/12384 [14:06:06<12:08:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 54%|█████▎ | 6646/12384 [14:06:06<12:07:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 54%|█████▎ | 6646/12384 [14:06:14<12:07:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 2: 54%|█████▎ | 6647/12384 [14:06:14<12:07:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 2: 54%|█████▎ | 6647/12384 [14:06:21<12:07:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 2: 54%|█████▎ | 6648/12384 [14:06:21<12:07:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 2: 54%|█████▎ | 6648/12384 [14:06:29<12:07:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 54%|█████▎ | 6649/12384 [14:06:29<12:06:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 54%|█████▎ | 6649/12384 [14:06:36<12:06:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 54%|█████▎ | 6650/12384 [14:06:36<12:09:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 54%|█████▎ | 6650/12384 [14:06:44<12:09:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 54%|█████▎ | 6651/12384 [14:06:44<12:08:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 54%|█████▎ | 6651/12384 [14:06:52<12:08:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 2: 54%|█████▎ | 6652/12384 [14:06:52<12:07:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 2: 54%|█████▎ | 6652/12384 [14:07:00<12:07:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 2: 54%|█████▎ | 6653/12384 [14:07:00<12:18:12, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 2: 54%|█████▎ | 6653/12384 [14:07:07<12:18:12, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 2: 54%|█████▎ | 6654/12384 [14:07:07<12:15:02, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 2: 54%|█████▎ | 6654/12384 [14:07:15<12:15:02, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 54%|█████▎ | 6655/12384 [14:07:15<12:14:01, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 54%|█████▎ | 6655/12384 [14:07:23<12:14:01, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 2: 54%|█████▎ | 6656/12384 [14:07:23<12:11:51, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 2: 54%|█████▎ | 6656/12384 [14:07:30<12:11:51, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 54%|█████▍ | 6657/12384 [14:07:30<12:20:04, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 54%|█████▍ | 6657/12384 [14:07:38<12:20:04, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 2: 54%|█████▍ | 6658/12384 [14:07:38<12:15:36, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 2: 54%|█████▍ | 6658/12384 [14:07:46<12:15:36, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.62s]
Epoch 2: 54%|█████▍ | 6659/12384 [14:07:46<12:15:36, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.62s]
Epoch 2: 54%|█████▍ | 6659/12384 [14:07:53<12:15:36, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.30s]
Epoch 2: 54%|█████▍ | 6660/12384 [14:07:53<12:13:09, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.30s]
Epoch 2: 54%|█████▍ | 6660/12384 [14:08:01<12:13:09, 7.69s/it, loss=0.0003, acc=0.9983, iter_time=7.04s]
Epoch 2: 54%|█████▍ | 6661/12384 [14:08:01<12:11:11, 7.67s/it, loss=0.0003, acc=0.9983, iter_time=7.04s]
Epoch 2: 54%|█████▍ | 6661/12384 [14:08:09<12:11:11, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 2: 54%|█████▍ | 6662/12384 [14:08:09<12:09:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 2: 54%|█████▍ | 6662/12384 [14:08:16<12:09:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 54%|█████▍ | 6663/12384 [14:08:16<12:08:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 54%|█████▍ | 6663/12384 [14:08:24<12:08:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.92s]
Epoch 2: 54%|█████▍ | 6664/12384 [14:08:24<12:07:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.92s]
Epoch 2: 54%|█████▍ | 6664/12384 [14:08:31<12:07:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 54%|█████▍ | 6665/12384 [14:08:31<12:06:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 54%|█████▍ | 6665/12384 [14:08:39<12:06:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 54%|█████▍ | 6666/12384 [14:08:39<12:05:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 54%|█████▍ | 6666/12384 [14:08:47<12:05:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 54%|█████▍ | 6667/12384 [14:08:47<12:05:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 54%|█████▍ | 6667/12384 [14:08:54<12:05:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 54%|█████▍ | 6668/12384 [14:08:54<12:05:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 54%|█████▍ | 6668/12384 [14:09:02<12:05:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 2: 54%|█████▍ | 6669/12384 [14:09:02<12:05:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 2: 54%|█████▍ | 6669/12384 [14:09:10<12:05:19, 7.61s/it, loss=0.0002, acc=0.9998, iter_time=7.08s]
Epoch 2: 54%|█████▍ | 6670/12384 [14:09:10<12:04:39, 7.61s/it, loss=0.0002, acc=0.9998, iter_time=7.08s]
Epoch 2: 54%|█████▍ | 6670/12384 [14:09:17<12:04:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 2: 54%|█████▍ | 6671/12384 [14:09:17<12:04:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 2: 54%|█████▍ | 6671/12384 [14:09:25<12:04:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 54%|█████▍ | 6672/12384 [14:09:25<12:04:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 54%|█████▍ | 6672/12384 [14:09:32<12:04:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 54%|█████▍ | 6673/12384 [14:09:32<12:04:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 54%|█████▍ | 6673/12384 [14:09:40<12:04:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 2: 54%|█████▍ | 6674/12384 [14:09:40<12:04:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 2: 54%|█████▍ | 6674/12384 [14:09:48<12:04:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 2: 54%|█████▍ | 6675/12384 [14:09:48<12:04:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 2: 54%|█████▍ | 6675/12384 [14:09:55<12:04:28, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 2: 54%|█████▍ | 6676/12384 [14:09:55<12:03:55, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 2: 54%|█████▍ | 6676/12384 [14:10:03<12:03:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.99s]
Epoch 2: 54%|█████▍ | 6677/12384 [14:10:03<12:04:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.99s]
Epoch 2: 54%|█████▍ | 6677/12384 [14:10:10<12:04:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.23s]
Epoch 2: 54%|█████▍ | 6678/12384 [14:10:10<12:03:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.23s]
Epoch 2: 54%|█████▍ | 6678/12384 [14:10:18<12:03:50, 7.61s/it, loss=0.0001, acc=0.9996, iter_time=7.66s]
Epoch 2: 54%|█████▍ | 6679/12384 [14:10:18<12:13:59, 7.72s/it, loss=0.0001, acc=0.9996, iter_time=7.66s]
Epoch 2: 54%|█████▍ | 6679/12384 [14:10:26<12:13:59, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 54%|█████▍ | 6680/12384 [14:10:26<12:11:57, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 54%|█████▍ | 6680/12384 [14:10:34<12:11:57, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 2: 54%|█████▍ | 6681/12384 [14:10:34<12:08:54, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 2: 54%|█████▍ | 6681/12384 [14:10:41<12:08:54, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 54%|█████▍ | 6682/12384 [14:10:41<12:07:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 54%|█████▍ | 6682/12384 [14:10:49<12:07:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 2: 54%|█████▍ | 6683/12384 [14:10:49<12:14:01, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 2: 54%|█████▍ | 6683/12384 [14:10:57<12:14:01, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 54%|█████▍ | 6684/12384 [14:10:57<12:10:09, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 54%|█████▍ | 6684/12384 [14:11:04<12:10:09, 7.69s/it, loss=0.0003, acc=1.0000, iter_time=7.61s]
Epoch 2: 54%|█████▍ | 6685/12384 [14:11:04<12:07:36, 7.66s/it, loss=0.0003, acc=1.0000, iter_time=7.61s]
Epoch 2: 54%|█████▍ | 6685/12384 [14:11:12<12:07:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 2: 54%|█████▍ | 6686/12384 [14:11:12<12:06:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 2: 54%|█████▍ | 6686/12384 [14:11:20<12:06:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 2: 54%|█████▍ | 6687/12384 [14:11:20<12:04:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 2: 54%|█████▍ | 6687/12384 [14:11:27<12:04:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.11s]
Epoch 2: 54%|█████▍ | 6688/12384 [14:11:27<12:05:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.11s]
Epoch 2: 54%|█████▍ | 6688/12384 [14:11:35<12:05:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 2: 54%|█████▍ | 6689/12384 [14:11:35<12:04:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 2: 54%|█████▍ | 6689/12384 [14:11:42<12:04:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 2: 54%|█████▍ | 6690/12384 [14:11:42<12:04:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 2: 54%|█████▍ | 6690/12384 [14:11:50<12:04:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 54%|█████▍ | 6691/12384 [14:11:50<12:06:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 54%|█████▍ | 6691/12384 [14:11:58<12:06:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 54%|█████▍ | 6692/12384 [14:11:58<12:05:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 54%|█████▍ | 6692/12384 [14:12:05<12:05:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 54%|█████▍ | 6693/12384 [14:12:05<12:04:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 54%|█████▍ | 6693/12384 [14:12:13<12:04:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 54%|█████▍ | 6694/12384 [14:12:13<12:04:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 54%|█████▍ | 6694/12384 [14:12:21<12:04:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 2: 54%|█████▍ | 6695/12384 [14:12:21<12:03:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 2: 54%|█████▍ | 6695/12384 [14:12:28<12:03:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 2: 54%|█████▍ | 6696/12384 [14:12:28<12:04:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 2: 54%|█████▍ | 6696/12384 [14:12:36<12:04:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 54%|█████▍ | 6697/12384 [14:12:36<12:03:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 54%|█████▍ | 6697/12384 [14:12:44<12:03:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 2: 54%|█████▍ | 6698/12384 [14:12:44<12:02:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 2: 54%|█████▍ | 6698/12384 [14:12:51<12:02:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 2: 54%|█████▍ | 6699/12384 [14:12:51<12:01:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 2: 54%|█████▍ | 6699/12384 [14:12:59<12:01:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 54%|█████▍ | 6700/12384 [14:12:59<12:02:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 54%|█████▍ | 6700/12384 [14:13:06<12:02:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 2: 54%|█████▍ | 6701/12384 [14:13:06<12:02:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 2: 54%|█████▍ | 6701/12384 [14:13:14<12:02:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 54%|█████▍ | 6702/12384 [14:13:14<12:01:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 54%|█████▍ | 6702/12384 [14:13:22<12:01:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 54%|█████▍ | 6703/12384 [14:13:22<12:01:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 54%|█████▍ | 6703/12384 [14:13:29<12:01:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 54%|█████▍ | 6704/12384 [14:13:29<12:00:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 54%|█████▍ | 6704/12384 [14:13:37<12:00:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 54%|█████▍ | 6705/12384 [14:13:37<12:08:12, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 54%|█████▍ | 6705/12384 [14:13:45<12:08:12, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 2: 54%|█████▍ | 6706/12384 [14:13:45<12:04:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 2: 54%|█████▍ | 6706/12384 [14:13:52<12:04:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.54s]
Epoch 2: 54%|█████▍ | 6707/12384 [14:13:52<12:02:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.54s]
Epoch 2: 54%|█████▍ | 6707/12384 [14:14:00<12:02:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 2: 54%|█████▍ | 6708/12384 [14:14:00<12:02:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 2: 54%|█████▍ | 6708/12384 [14:14:08<12:02:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 54%|█████▍ | 6709/12384 [14:14:08<12:08:54, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 54%|█████▍ | 6709/12384 [14:14:15<12:08:54, 7.71s/it, loss=0.0002, acc=1.0000, iter_time=7.58s]
Epoch 2: 54%|█████▍ | 6710/12384 [14:14:15<12:05:31, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=7.58s]
Epoch 2: 54%|█████▍ | 6710/12384 [14:14:23<12:05:31, 7.67s/it, loss=0.0013, acc=0.9961, iter_time=7.61s]
Epoch 2: 54%|█████▍ | 6711/12384 [14:14:23<12:03:26, 7.65s/it, loss=0.0013, acc=0.9961, iter_time=7.61s]
Epoch 2: 54%|█████▍ | 6711/12384 [14:14:31<12:03:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 54%|█████▍ | 6712/12384 [14:14:31<12:01:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 54%|█████▍ | 6712/12384 [14:14:38<12:01:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.47s]
Epoch 2: 54%|█████▍ | 6713/12384 [14:14:38<12:01:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.47s]
Epoch 2: 54%|█████▍ | 6713/12384 [14:14:46<12:01:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.35s]
Epoch 2: 54%|█████▍ | 6714/12384 [14:14:46<12:00:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.35s]
Epoch 2: 54%|█████▍ | 6714/12384 [14:14:53<12:00:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 2: 54%|█████▍ | 6715/12384 [14:14:53<12:00:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 2: 54%|█████▍ | 6715/12384 [14:15:01<12:00:04, 7.62s/it, loss=0.0002, acc=0.9991, iter_time=7.87s]
Epoch 2: 54%|█████▍ | 6716/12384 [14:15:01<11:59:30, 7.62s/it, loss=0.0002, acc=0.9991, iter_time=7.87s]
Epoch 2: 54%|█████▍ | 6716/12384 [14:15:09<11:59:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 2: 54%|█████▍ | 6717/12384 [14:15:09<11:58:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 2: 54%|█████▍ | 6717/12384 [14:15:16<11:58:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 2: 54%|█████▍ | 6718/12384 [14:15:16<11:58:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 2: 54%|█████▍ | 6718/12384 [14:15:24<11:58:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 2: 54%|█████▍ | 6719/12384 [14:15:24<11:58:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 2: 54%|█████▍ | 6719/12384 [14:15:32<11:58:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.44s]
Epoch 2: 54%|█████▍ | 6720/12384 [14:15:32<12:00:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.44s]
Epoch 2: 54%|█████▍ | 6720/12384 [14:15:39<12:00:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 54%|█████▍ | 6721/12384 [14:15:39<11:59:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 54%|█████▍ | 6721/12384 [14:15:47<11:59:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 54%|█████▍ | 6722/12384 [14:15:47<11:59:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 54%|█████▍ | 6722/12384 [14:15:54<11:59:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 54%|█████▍ | 6723/12384 [14:15:54<11:58:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 54%|█████▍ | 6723/12384 [14:16:02<11:58:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 54%|█████▍ | 6724/12384 [14:16:02<11:57:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 54%|█████▍ | 6724/12384 [14:16:10<11:57:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 54%|█████▍ | 6725/12384 [14:16:10<11:57:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 54%|█████▍ | 6725/12384 [14:16:17<11:57:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.57s]
Epoch 2: 54%|█████▍ | 6726/12384 [14:16:17<11:57:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.57s]
Epoch 2: 54%|█████▍ | 6726/12384 [14:16:25<11:57:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.62s]
Epoch 2: 54%|█████▍ | 6727/12384 [14:16:25<11:56:46, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.62s]
Epoch 2: 54%|█████▍ | 6727/12384 [14:16:32<11:56:46, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 54%|█████▍ | 6728/12384 [14:16:32<11:57:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 54%|█████▍ | 6728/12384 [14:16:40<11:57:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 54%|█████▍ | 6729/12384 [14:16:40<11:56:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 54%|█████▍ | 6729/12384 [14:16:48<11:56:30, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 2: 54%|█████▍ | 6730/12384 [14:16:48<11:56:35, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 2: 54%|█████▍ | 6730/12384 [14:16:56<11:56:35, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 54%|█████▍ | 6731/12384 [14:16:56<12:06:28, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 54%|█████▍ | 6731/12384 [14:17:03<12:06:28, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 2: 54%|█████▍ | 6732/12384 [14:17:03<12:08:40, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 2: 54%|█████▍ | 6732/12384 [14:17:11<12:08:40, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 2: 54%|█████▍ | 6733/12384 [14:17:11<12:05:29, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 2: 54%|█████▍ | 6733/12384 [14:17:19<12:05:29, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 2: 54%|█████▍ | 6734/12384 [14:17:19<12:03:37, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 2: 54%|█████▍ | 6734/12384 [14:17:26<12:03:37, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 2: 54%|█████▍ | 6735/12384 [14:17:26<12:01:25, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 2: 54%|█████▍ | 6735/12384 [14:17:34<12:01:25, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 2: 54%|█████▍ | 6736/12384 [14:17:34<12:00:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 2: 54%|█████▍ | 6736/12384 [14:17:41<12:00:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.47s]
Epoch 2: 54%|█████▍ | 6737/12384 [14:17:41<11:59:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.47s]
Epoch 2: 54%|█████▍ | 6737/12384 [14:17:49<11:59:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 2: 54%|█████▍ | 6738/12384 [14:17:49<11:58:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 2: 54%|█████▍ | 6738/12384 [14:17:57<11:58:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 2: 54%|█████▍ | 6739/12384 [14:17:57<11:57:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 2: 54%|█████▍ | 6739/12384 [14:18:04<11:57:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.72s]
Epoch 2: 54%|█████▍ | 6740/12384 [14:18:04<11:57:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.72s]
Epoch 2: 54%|█████▍ | 6740/12384 [14:18:12<11:57:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 54%|█████▍ | 6741/12384 [14:18:12<11:57:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 54%|█████▍ | 6741/12384 [14:18:20<11:57:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 54%|█████▍ | 6742/12384 [14:18:20<11:56:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 54%|█████▍ | 6742/12384 [14:18:27<11:56:55, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.50s]
Epoch 2: 54%|█████▍ | 6743/12384 [14:18:27<11:55:44, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.50s]
Epoch 2: 54%|█████▍ | 6743/12384 [14:18:35<11:55:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 2: 54%|█████▍ | 6744/12384 [14:18:35<11:55:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 2: 54%|█████▍ | 6744/12384 [14:18:42<11:55:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 54%|█████▍ | 6745/12384 [14:18:42<11:56:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 54%|█████▍ | 6745/12384 [14:18:50<11:56:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.55s]
Epoch 2: 54%|█████▍ | 6746/12384 [14:18:50<11:55:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.55s]
Epoch 2: 54%|█████▍ | 6746/12384 [14:18:58<11:55:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.70s]
Epoch 2: 54%|█████▍ | 6747/12384 [14:18:58<11:54:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.70s]
Epoch 2: 54%|█████▍ | 6747/12384 [14:19:05<11:54:28, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 2: 54%|█████▍ | 6748/12384 [14:19:05<11:53:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 2: 54%|█████▍ | 6748/12384 [14:19:13<11:53:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 2: 54%|█████▍ | 6749/12384 [14:19:13<11:55:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 2: 54%|█████▍ | 6749/12384 [14:19:20<11:55:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 55%|█████▍ | 6750/12384 [14:19:20<11:55:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 55%|█████▍ | 6750/12384 [14:19:28<11:55:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.78s]
Epoch 2: 55%|█████▍ | 6751/12384 [14:19:28<11:54:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.78s]
Epoch 2: 55%|█████▍ | 6751/12384 [14:19:36<11:54:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.38s]
Epoch 2: 55%|█████▍ | 6752/12384 [14:19:36<11:53:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.38s]
Epoch 2: 55%|█████▍ | 6752/12384 [14:19:43<11:53:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 55%|█████▍ | 6753/12384 [14:19:43<11:53:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 55%|█████▍ | 6753/12384 [14:19:51<11:53:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 55%|█████▍ | 6754/12384 [14:19:51<11:53:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 55%|█████▍ | 6754/12384 [14:19:58<11:53:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 55%|█████▍ | 6755/12384 [14:19:58<11:53:24, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 55%|█████▍ | 6755/12384 [14:20:06<11:53:24, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 55%|█████▍ | 6756/12384 [14:20:06<11:53:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 55%|█████▍ | 6756/12384 [14:20:14<11:53:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 2: 55%|█████▍ | 6757/12384 [14:20:14<12:02:12, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 2: 55%|█████▍ | 6757/12384 [14:20:22<12:02:12, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.00s]
Epoch 2: 55%|█████▍ | 6758/12384 [14:20:22<11:59:31, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.00s]
Epoch 2: 55%|█████▍ | 6758/12384 [14:20:29<11:59:31, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 55%|█████▍ | 6759/12384 [14:20:29<11:57:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 55%|█████▍ | 6759/12384 [14:20:37<11:57:00, 7.65s/it, loss=0.0002, acc=0.9979, iter_time=7.58s]
Epoch 2: 55%|█████▍ | 6760/12384 [14:20:37<11:56:50, 7.65s/it, loss=0.0002, acc=0.9979, iter_time=7.58s]
Epoch 2: 55%|█████▍ | 6760/12384 [14:20:44<11:56:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 55%|█████▍ | 6761/12384 [14:20:44<11:55:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 55%|█████▍ | 6761/12384 [14:20:52<11:55:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 2: 55%|█████▍ | 6762/12384 [14:20:52<11:55:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 2: 55%|█████▍ | 6762/12384 [14:21:00<11:55:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 2: 55%|█████▍ | 6763/12384 [14:21:00<11:55:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 2: 55%|█████▍ | 6763/12384 [14:21:07<11:55:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 55%|█████▍ | 6764/12384 [14:21:07<11:54:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 55%|█████▍ | 6764/12384 [14:21:15<11:54:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.78s]
Epoch 2: 55%|█████▍ | 6765/12384 [14:21:15<11:55:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.78s]
Epoch 2: 55%|█████▍ | 6765/12384 [14:21:23<11:55:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 2: 55%|█████▍ | 6766/12384 [14:21:23<11:55:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 2: 55%|█████▍ | 6766/12384 [14:21:30<11:55:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 2: 55%|█████▍ | 6767/12384 [14:21:30<11:54:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 2: 55%|█████▍ | 6767/12384 [14:21:38<11:54:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.12s]
Epoch 2: 55%|█████▍ | 6768/12384 [14:21:38<11:53:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.12s]
Epoch 2: 55%|█████▍ | 6768/12384 [14:21:45<11:53:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.18s]
Epoch 2: 55%|█████▍ | 6769/12384 [14:21:45<11:53:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.18s]
Epoch 2: 55%|█████▍ | 6769/12384 [14:21:53<11:53:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 55%|█████▍ | 6770/12384 [14:21:53<11:52:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 55%|█████▍ | 6770/12384 [14:22:01<11:52:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 55%|█████▍ | 6771/12384 [14:22:01<11:52:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 55%|█████▍ | 6771/12384 [14:22:08<11:52:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 55%|█████▍ | 6772/12384 [14:22:08<11:51:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 55%|█████▍ | 6772/12384 [14:22:16<11:51:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 55%|█████▍ | 6773/12384 [14:22:16<11:51:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 55%|█████▍ | 6773/12384 [14:22:23<11:51:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 55%|█████▍ | 6774/12384 [14:22:23<11:51:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 55%|█████▍ | 6774/12384 [14:22:31<11:51:46, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.44s]
Epoch 2: 55%|█████▍ | 6775/12384 [14:22:31<11:51:11, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.44s]
Epoch 2: 55%|█████▍ | 6775/12384 [14:22:39<11:51:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 2: 55%|█████▍ | 6776/12384 [14:22:39<11:52:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 2: 55%|█████▍ | 6776/12384 [14:22:46<11:52:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 55%|█████▍ | 6777/12384 [14:22:46<11:51:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 55%|█████▍ | 6777/12384 [14:22:54<11:51:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 55%|█████▍ | 6778/12384 [14:22:54<11:51:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 55%|█████▍ | 6778/12384 [14:23:02<11:51:05, 7.61s/it, loss=0.0005, acc=0.9979, iter_time=6.38s]
Epoch 2: 55%|█████▍ | 6779/12384 [14:23:02<11:51:49, 7.62s/it, loss=0.0005, acc=0.9979, iter_time=6.38s]
Epoch 2: 55%|█████▍ | 6779/12384 [14:23:09<11:51:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.86s]
Epoch 2: 55%|█████▍ | 6780/12384 [14:23:09<11:51:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.86s]
Epoch 2: 55%|█████▍ | 6780/12384 [14:23:17<11:51:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 55%|█████▍ | 6781/12384 [14:23:17<11:50:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 55%|█████▍ | 6781/12384 [14:23:24<11:50:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.50s]
Epoch 2: 55%|█████▍ | 6782/12384 [14:23:24<11:50:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.50s]
Epoch 2: 55%|█████▍ | 6782/12384 [14:23:32<11:50:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 55%|█████▍ | 6783/12384 [14:23:32<11:50:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 55%|█████▍ | 6783/12384 [14:23:40<11:50:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 2: 55%|█████▍ | 6784/12384 [14:23:40<12:00:29, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 2: 55%|█████▍ | 6784/12384 [14:23:48<12:00:29, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 2: 55%|█████▍ | 6785/12384 [14:23:48<11:57:07, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 2: 55%|█████▍ | 6785/12384 [14:23:55<11:57:07, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 2: 55%|█████▍ | 6786/12384 [14:23:55<11:55:10, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 2: 55%|█████▍ | 6786/12384 [14:24:03<11:55:10, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 55%|█████▍ | 6787/12384 [14:24:03<11:54:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 55%|█████▍ | 6787/12384 [14:24:10<11:54:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 55%|█████▍ | 6788/12384 [14:24:10<11:52:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 55%|█████▍ | 6788/12384 [14:24:18<11:52:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 55%|█████▍ | 6789/12384 [14:24:18<11:51:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 55%|█████▍ | 6789/12384 [14:24:26<11:51:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 55%|█████▍ | 6790/12384 [14:24:26<11:51:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 55%|█████▍ | 6790/12384 [14:24:33<11:51:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 2: 55%|█████▍ | 6791/12384 [14:24:33<11:51:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 2: 55%|█████▍ | 6791/12384 [14:24:41<11:51:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 2: 55%|█████▍ | 6792/12384 [14:24:41<11:50:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 2: 55%|█████▍ | 6792/12384 [14:24:49<11:50:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 55%|█████▍ | 6793/12384 [14:24:49<11:50:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 55%|█████▍ | 6793/12384 [14:24:56<11:50:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 55%|█████▍ | 6794/12384 [14:24:56<11:49:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 55%|█████▍ | 6794/12384 [14:25:04<11:49:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 2: 55%|█████▍ | 6795/12384 [14:25:04<11:49:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 2: 55%|█████▍ | 6795/12384 [14:25:11<11:49:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 2: 55%|█████▍ | 6796/12384 [14:25:11<11:49:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 2: 55%|█████▍ | 6796/12384 [14:25:19<11:49:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 55%|█████▍ | 6797/12384 [14:25:19<11:49:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 55%|█████▍ | 6797/12384 [14:25:27<11:49:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 55%|█████▍ | 6798/12384 [14:25:27<11:52:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 55%|█████▍ | 6798/12384 [14:25:34<11:52:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 2: 55%|█████▍ | 6799/12384 [14:25:34<11:49:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 2: 55%|█████▍ | 6799/12384 [14:25:42<11:49:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.90s]
Epoch 2: 55%|█████▍ | 6800/12384 [14:25:42<11:49:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.90s]
Epoch 2: 55%|█████▍ | 6800/12384 [14:25:50<11:49:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.71s]
Epoch 2: 55%|█████▍ | 6801/12384 [14:25:50<11:48:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.71s]
Epoch 2: 55%|█████▍ | 6801/12384 [14:25:57<11:48:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 2: 55%|█████▍ | 6802/12384 [14:25:57<11:48:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 2: 55%|█████▍ | 6802/12384 [14:26:05<11:48:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 2: 55%|█████▍ | 6803/12384 [14:26:05<11:48:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 2: 55%|█████▍ | 6803/12384 [14:26:12<11:48:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 2: 55%|█████▍ | 6804/12384 [14:26:12<11:48:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 2: 55%|█████▍ | 6804/12384 [14:26:20<11:48:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 2: 55%|█████▍ | 6805/12384 [14:26:20<11:48:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 2: 55%|█████▍ | 6805/12384 [14:26:28<11:48:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 55%|█████▍ | 6806/12384 [14:26:28<11:48:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 55%|█████▍ | 6806/12384 [14:26:35<11:48:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 55%|█████▍ | 6807/12384 [14:26:35<11:47:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 55%|█████▍ | 6807/12384 [14:26:43<11:47:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.46s]
Epoch 2: 55%|█████▍ | 6808/12384 [14:26:43<11:46:35, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.46s]
Epoch 2: 55%|█████▍ | 6808/12384 [14:26:50<11:46:35, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.78s]
Epoch 2: 55%|█████▍ | 6809/12384 [14:26:50<11:46:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.78s]
Epoch 2: 55%|█████▍ | 6809/12384 [14:26:58<11:46:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 55%|█████▍ | 6810/12384 [14:26:58<11:55:24, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 55%|█████▍ | 6810/12384 [14:27:06<11:55:24, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=11.18s]
Epoch 2: 55%|█████▍ | 6811/12384 [14:27:06<11:52:10, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=11.18s]
Epoch 2: 55%|█████▍ | 6811/12384 [14:27:14<11:52:10, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 55%|█████▌ | 6812/12384 [14:27:14<11:58:26, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 55%|█████▌ | 6812/12384 [14:27:21<11:58:26, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 55%|█████▌ | 6813/12384 [14:27:21<11:54:43, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 55%|█████▌ | 6813/12384 [14:27:29<11:54:43, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 2: 55%|█████▌ | 6814/12384 [14:27:29<11:52:06, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 2: 55%|█████▌ | 6814/12384 [14:27:37<11:52:06, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 2: 55%|█████▌ | 6815/12384 [14:27:37<11:50:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 2: 55%|█████▌ | 6815/12384 [14:27:44<11:50:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 2: 55%|█████▌ | 6816/12384 [14:27:44<11:52:04, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 2: 55%|█████▌ | 6816/12384 [14:27:52<11:52:04, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 55%|█████▌ | 6817/12384 [14:27:52<11:50:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 55%|█████▌ | 6817/12384 [14:28:00<11:50:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 2: 55%|█████▌ | 6818/12384 [14:28:00<11:48:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 2: 55%|█████▌ | 6818/12384 [14:28:07<11:48:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 2: 55%|█████▌ | 6819/12384 [14:28:07<11:47:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 2: 55%|█████▌ | 6819/12384 [14:28:15<11:47:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 2: 55%|█████▌ | 6820/12384 [14:28:15<11:49:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 2: 55%|█████▌ | 6820/12384 [14:28:22<11:49:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.68s]
Epoch 2: 55%|█████▌ | 6821/12384 [14:28:23<11:48:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.68s]
Epoch 2: 55%|█████▌ | 6821/12384 [14:28:30<11:48:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.41s]
Epoch 2: 55%|█████▌ | 6822/12384 [14:28:30<11:47:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.41s]
Epoch 2: 55%|█████▌ | 6822/12384 [14:28:38<11:47:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 2: 55%|█████▌ | 6823/12384 [14:28:38<11:47:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 2: 55%|█████▌ | 6823/12384 [14:28:45<11:47:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 55%|█████▌ | 6824/12384 [14:28:45<11:46:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 55%|█████▌ | 6824/12384 [14:28:53<11:46:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 55%|█████▌ | 6825/12384 [14:28:53<11:46:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 55%|█████▌ | 6825/12384 [14:29:01<11:46:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 55%|█████▌ | 6826/12384 [14:29:01<11:45:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 55%|█████▌ | 6826/12384 [14:29:08<11:45:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 55%|█████▌ | 6827/12384 [14:29:08<11:44:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 55%|█████▌ | 6827/12384 [14:29:16<11:44:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 55%|█████▌ | 6828/12384 [14:29:16<11:46:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 55%|█████▌ | 6828/12384 [14:29:23<11:46:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.47s]
Epoch 2: 55%|█████▌ | 6829/12384 [14:29:23<11:46:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.47s]
Epoch 2: 55%|█████▌ | 6829/12384 [14:29:31<11:46:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 2: 55%|█████▌ | 6830/12384 [14:29:31<11:45:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 2: 55%|█████▌ | 6830/12384 [14:29:39<11:45:02, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.66s]
Epoch 2: 55%|█████▌ | 6831/12384 [14:29:39<11:44:03, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.66s]
Epoch 2: 55%|█████▌ | 6831/12384 [14:29:46<11:44:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 55%|█████▌ | 6832/12384 [14:29:46<11:44:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 55%|█████▌ | 6832/12384 [14:29:54<11:44:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 55%|█████▌ | 6833/12384 [14:29:54<11:45:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 55%|█████▌ | 6833/12384 [14:30:02<11:45:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 55%|█████▌ | 6834/12384 [14:30:02<11:44:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 55%|█████▌ | 6834/12384 [14:30:09<11:44:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 55%|█████▌ | 6835/12384 [14:30:09<11:44:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 55%|█████▌ | 6835/12384 [14:30:17<11:44:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 55%|█████▌ | 6836/12384 [14:30:17<11:44:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 55%|█████▌ | 6836/12384 [14:30:25<11:44:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 55%|█████▌ | 6837/12384 [14:30:25<11:53:23, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 55%|█████▌ | 6837/12384 [14:30:33<11:53:23, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 2: 55%|█████▌ | 6838/12384 [14:30:33<11:58:59, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 2: 55%|█████▌ | 6838/12384 [14:30:40<11:58:59, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 55%|█████▌ | 6839/12384 [14:30:40<11:53:56, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 55%|█████▌ | 6839/12384 [14:30:48<11:53:56, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 55%|█████▌ | 6840/12384 [14:30:48<11:50:25, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 55%|█████▌ | 6840/12384 [14:30:56<11:50:25, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.57s]
Epoch 2: 55%|█████▌ | 6841/12384 [14:30:56<11:50:25, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.57s]
Epoch 2: 55%|█████▌ | 6841/12384 [14:31:03<11:50:25, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.41s]
Epoch 2: 55%|█████▌ | 6842/12384 [14:31:03<11:48:22, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.41s]
Epoch 2: 55%|█████▌ | 6842/12384 [14:31:11<11:48:22, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.23s]
Epoch 2: 55%|█████▌ | 6843/12384 [14:31:11<11:49:14, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.23s]
Epoch 2: 55%|█████▌ | 6843/12384 [14:31:18<11:49:14, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.00s]
Epoch 2: 55%|█████▌ | 6844/12384 [14:31:18<11:46:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.00s]
Epoch 2: 55%|█████▌ | 6844/12384 [14:31:26<11:46:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 55%|█████▌ | 6845/12384 [14:31:26<11:46:45, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 55%|█████▌ | 6845/12384 [14:31:34<11:46:45, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.37s]
Epoch 2: 55%|█████▌ | 6846/12384 [14:31:34<11:45:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.37s]
Epoch 2: 55%|█████▌ | 6846/12384 [14:31:41<11:45:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.29s]
Epoch 2: 55%|█████▌ | 6847/12384 [14:31:41<11:44:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.29s]
Epoch 2: 55%|█████▌ | 6847/12384 [14:31:49<11:44:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 2: 55%|█████▌ | 6848/12384 [14:31:49<11:44:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 2: 55%|█████▌ | 6848/12384 [14:31:57<11:44:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 55%|█████▌ | 6849/12384 [14:31:57<11:44:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 55%|█████▌ | 6849/12384 [14:32:04<11:44:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 55%|█████▌ | 6850/12384 [14:32:04<11:44:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 55%|█████▌ | 6850/12384 [14:32:12<11:44:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 55%|█████▌ | 6851/12384 [14:32:12<11:43:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 55%|█████▌ | 6851/12384 [14:32:19<11:43:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 2: 55%|█████▌ | 6852/12384 [14:32:19<11:42:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 2: 55%|█████▌ | 6852/12384 [14:32:27<11:42:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.11s]
Epoch 2: 55%|█████▌ | 6853/12384 [14:32:27<11:41:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.11s]
Epoch 2: 55%|█████▌ | 6853/12384 [14:32:35<11:41:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 55%|█████▌ | 6854/12384 [14:32:35<11:41:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 55%|█████▌ | 6854/12384 [14:32:42<11:41:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 2: 55%|█████▌ | 6855/12384 [14:32:42<11:41:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 2: 55%|█████▌ | 6855/12384 [14:32:50<11:41:55, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.79s]
Epoch 2: 55%|█████▌ | 6856/12384 [14:32:50<11:42:32, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.79s]
Epoch 2: 55%|█████▌ | 6856/12384 [14:32:58<11:42:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.67s]
Epoch 2: 55%|█████▌ | 6857/12384 [14:32:58<11:43:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.67s]
Epoch 2: 55%|█████▌ | 6857/12384 [14:33:05<11:43:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.28s]
Epoch 2: 55%|█████▌ | 6858/12384 [14:33:05<11:43:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.28s]
Epoch 2: 55%|█████▌ | 6858/12384 [14:33:13<11:43:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 55%|█████▌ | 6859/12384 [14:33:13<11:43:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 55%|█████▌ | 6859/12384 [14:33:21<11:43:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 55%|█████▌ | 6860/12384 [14:33:21<11:42:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 55%|█████▌ | 6860/12384 [14:33:28<11:42:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 55%|█████▌ | 6861/12384 [14:33:28<11:42:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 55%|█████▌ | 6861/12384 [14:33:36<11:42:09, 7.63s/it, loss=0.0015, acc=0.9980, iter_time=6.15s]
Epoch 2: 55%|█████▌ | 6862/12384 [14:33:36<11:40:56, 7.62s/it, loss=0.0015, acc=0.9980, iter_time=6.15s]
Epoch 2: 55%|█████▌ | 6862/12384 [14:33:44<11:40:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 2: 55%|█████▌ | 6863/12384 [14:33:44<11:51:07, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 2: 55%|█████▌ | 6863/12384 [14:33:51<11:51:07, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 2: 55%|█████▌ | 6864/12384 [14:33:51<11:48:02, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 2: 55%|█████▌ | 6864/12384 [14:33:59<11:48:02, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 2: 55%|█████▌ | 6865/12384 [14:33:59<11:53:03, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 2: 55%|█████▌ | 6865/12384 [14:34:07<11:53:03, 7.75s/it, loss=0.0001, acc=1.0000, iter_time=5.29s]
Epoch 2: 55%|█████▌ | 6866/12384 [14:34:07<11:48:43, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=5.29s]
Epoch 2: 55%|█████▌ | 6866/12384 [14:34:14<11:48:43, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 2: 55%|█████▌ | 6867/12384 [14:34:14<11:46:15, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 2: 55%|█████▌ | 6867/12384 [14:34:22<11:46:15, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 2: 55%|█████▌ | 6868/12384 [14:34:22<11:44:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 2: 55%|█████▌ | 6868/12384 [14:34:30<11:44:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 2: 55%|█████▌ | 6869/12384 [14:34:30<11:42:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 2: 55%|█████▌ | 6869/12384 [14:34:37<11:42:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 2: 55%|█████▌ | 6870/12384 [14:34:37<11:43:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 2: 55%|█████▌ | 6870/12384 [14:34:45<11:43:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 55%|█████▌ | 6871/12384 [14:34:45<11:41:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 55%|█████▌ | 6871/12384 [14:34:53<11:41:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 55%|█████▌ | 6872/12384 [14:34:53<11:41:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 55%|█████▌ | 6872/12384 [14:35:00<11:41:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 2: 55%|█████▌ | 6873/12384 [14:35:00<11:40:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 2: 55%|█████▌ | 6873/12384 [14:35:08<11:40:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.39s]
Epoch 2: 56%|█████▌ | 6874/12384 [14:35:08<11:40:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.39s]
Epoch 2: 56%|█████▌ | 6874/12384 [14:35:15<11:40:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 56%|█████▌ | 6875/12384 [14:35:15<11:40:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 56%|█████▌ | 6875/12384 [14:35:23<11:40:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 56%|█████▌ | 6876/12384 [14:35:23<11:39:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 56%|█████▌ | 6876/12384 [14:35:31<11:39:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 2: 56%|█████▌ | 6877/12384 [14:35:31<11:38:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 2: 56%|█████▌ | 6877/12384 [14:35:38<11:38:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 56%|█████▌ | 6878/12384 [14:35:38<11:38:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 56%|█████▌ | 6878/12384 [14:35:46<11:38:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 56%|█████▌ | 6879/12384 [14:35:46<11:38:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 56%|█████▌ | 6879/12384 [14:35:53<11:38:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 56%|█████▌ | 6880/12384 [14:35:53<11:38:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 56%|█████▌ | 6880/12384 [14:36:01<11:38:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 56%|█████▌ | 6881/12384 [14:36:01<11:38:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 56%|█████▌ | 6881/12384 [14:36:09<11:38:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.70s]
Epoch 2: 56%|█████▌ | 6882/12384 [14:36:09<11:39:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.70s]
Epoch 2: 56%|█████▌ | 6882/12384 [14:36:16<11:39:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 56%|█████▌ | 6883/12384 [14:36:16<11:38:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 56%|█████▌ | 6883/12384 [14:36:24<11:38:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 56%|█████▌ | 6884/12384 [14:36:24<11:38:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 56%|█████▌ | 6884/12384 [14:36:32<11:38:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 56%|█████▌ | 6885/12384 [14:36:32<11:37:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 56%|█████▌ | 6885/12384 [14:36:39<11:37:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 56%|█████▌ | 6886/12384 [14:36:39<11:37:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 56%|█████▌ | 6886/12384 [14:36:47<11:37:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 2: 56%|█████▌ | 6887/12384 [14:36:47<11:37:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 2: 56%|█████▌ | 6887/12384 [14:36:54<11:37:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.70s]
Epoch 2: 56%|█████▌ | 6888/12384 [14:36:54<11:37:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.70s]
Epoch 2: 56%|█████▌ | 6888/12384 [14:37:02<11:37:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 2: 56%|█████▌ | 6889/12384 [14:37:02<11:45:54, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 2: 56%|█████▌ | 6889/12384 [14:37:10<11:45:54, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 2: 56%|█████▌ | 6890/12384 [14:37:10<11:43:01, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 2: 56%|█████▌ | 6890/12384 [14:37:18<11:43:01, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=3.04s]
Epoch 2: 56%|█████▌ | 6891/12384 [14:37:18<11:41:07, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=3.04s]
Epoch 2: 56%|█████▌ | 6891/12384 [14:37:25<11:41:07, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=12.17s]
Epoch 2: 56%|█████▌ | 6892/12384 [14:37:25<11:39:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=12.17s]
Epoch 2: 56%|█████▌ | 6892/12384 [14:37:33<11:39:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.54s]
Epoch 2: 56%|█████▌ | 6893/12384 [14:37:33<11:38:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.54s]
Epoch 2: 56%|█████▌ | 6893/12384 [14:37:40<11:38:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.22s]
Epoch 2: 56%|█████▌ | 6894/12384 [14:37:40<11:37:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.22s]
Epoch 2: 56%|█████▌ | 6894/12384 [14:37:48<11:37:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 2: 56%|█████▌ | 6895/12384 [14:37:48<11:36:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 2: 56%|█████▌ | 6895/12384 [14:37:56<11:36:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.33s]
Epoch 2: 56%|█████▌ | 6896/12384 [14:37:56<11:36:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.33s]
Epoch 2: 56%|█████▌ | 6896/12384 [14:38:03<11:36:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 56%|█████▌ | 6897/12384 [14:38:03<11:36:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 56%|█████▌ | 6897/12384 [14:38:11<11:36:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.23s]
Epoch 2: 56%|█████▌ | 6898/12384 [14:38:11<11:36:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.23s]
Epoch 2: 56%|█████▌ | 6898/12384 [14:38:18<11:36:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.00s]
Epoch 2: 56%|█████▌ | 6899/12384 [14:38:18<11:35:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.00s]
Epoch 2: 56%|█████▌ | 6899/12384 [14:38:26<11:35:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 56%|█████▌ | 6900/12384 [14:38:26<11:36:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 56%|█████▌ | 6900/12384 [14:38:34<11:36:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 56%|█████▌ | 6901/12384 [14:38:34<11:35:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 56%|█████▌ | 6901/12384 [14:38:41<11:35:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 2: 56%|█████▌ | 6902/12384 [14:38:41<11:36:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 2: 56%|█████▌ | 6902/12384 [14:38:49<11:36:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 56%|█████▌ | 6903/12384 [14:38:49<11:35:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 56%|█████▌ | 6903/12384 [14:38:56<11:35:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 2: 56%|█████▌ | 6904/12384 [14:38:56<11:35:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 2: 56%|█████▌ | 6904/12384 [14:39:04<11:35:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 2: 56%|█████▌ | 6905/12384 [14:39:04<11:34:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 2: 56%|█████▌ | 6905/12384 [14:39:12<11:34:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 2: 56%|█████▌ | 6906/12384 [14:39:12<11:35:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 2: 56%|█████▌ | 6906/12384 [14:39:19<11:35:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 56%|█████▌ | 6907/12384 [14:39:19<11:35:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 56%|█████▌ | 6907/12384 [14:39:27<11:35:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 56%|█████▌ | 6908/12384 [14:39:27<11:35:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 56%|█████▌ | 6908/12384 [14:39:35<11:35:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 2: 56%|█████▌ | 6909/12384 [14:39:35<11:34:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 2: 56%|█████▌ | 6909/12384 [14:39:42<11:34:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 2: 56%|█████▌ | 6910/12384 [14:39:42<11:34:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 2: 56%|█████▌ | 6910/12384 [14:39:50<11:34:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 2: 56%|█████▌ | 6911/12384 [14:39:50<11:34:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 2: 56%|█████▌ | 6911/12384 [14:39:57<11:34:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 56%|█████▌ | 6912/12384 [14:39:57<11:34:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 56%|█████▌ | 6912/12384 [14:40:05<11:34:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 56%|█████▌ | 6913/12384 [14:40:05<11:34:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 56%|█████▌ | 6913/12384 [14:40:13<11:34:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 2: 56%|█████▌ | 6914/12384 [14:40:13<11:34:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 2: 56%|█████▌ | 6914/12384 [14:40:21<11:34:57, 7.62s/it, loss=0.0012, acc=0.9977, iter_time=9.79s]
Epoch 2: 56%|█████▌ | 6915/12384 [14:40:21<11:43:32, 7.72s/it, loss=0.0012, acc=0.9977, iter_time=9.79s]
Epoch 2: 56%|█████▌ | 6915/12384 [14:40:28<11:43:32, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 56%|█████▌ | 6916/12384 [14:40:28<11:40:41, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 56%|█████▌ | 6916/12384 [14:40:36<11:40:41, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 56%|█████▌ | 6917/12384 [14:40:36<11:45:50, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 56%|█████▌ | 6917/12384 [14:40:44<11:45:50, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 2: 56%|█████▌ | 6918/12384 [14:40:44<11:41:32, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 2: 56%|█████▌ | 6918/12384 [14:40:51<11:41:32, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 56%|█████▌ | 6919/12384 [14:40:51<11:38:45, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 56%|█████▌ | 6919/12384 [14:40:59<11:38:45, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 2: 56%|█████▌ | 6920/12384 [14:40:59<11:36:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 2: 56%|█████▌ | 6920/12384 [14:41:06<11:36:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 56%|█████▌ | 6921/12384 [14:41:06<11:35:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 56%|█████▌ | 6921/12384 [14:41:14<11:35:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 56%|█████▌ | 6922/12384 [14:41:14<11:36:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 56%|█████▌ | 6922/12384 [14:41:22<11:36:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 56%|█████▌ | 6923/12384 [14:41:22<11:34:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 56%|█████▌ | 6923/12384 [14:41:29<11:34:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 56%|█████▌ | 6924/12384 [14:41:29<11:35:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 56%|█████▌ | 6924/12384 [14:41:37<11:35:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 2: 56%|█████▌ | 6925/12384 [14:41:37<11:35:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 2: 56%|█████▌ | 6925/12384 [14:41:45<11:35:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 2: 56%|█████▌ | 6926/12384 [14:41:45<11:34:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 2: 56%|█████▌ | 6926/12384 [14:41:52<11:34:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 2: 56%|█████▌ | 6927/12384 [14:41:52<11:34:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 2: 56%|█████▌ | 6927/12384 [14:42:00<11:34:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 56%|█████▌ | 6928/12384 [14:42:00<11:33:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 56%|█████▌ | 6928/12384 [14:42:08<11:33:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.31s]
Epoch 2: 56%|█████▌ | 6929/12384 [14:42:08<11:33:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.31s]
Epoch 2: 56%|█████▌ | 6929/12384 [14:42:15<11:33:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 2: 56%|█████▌ | 6930/12384 [14:42:15<11:32:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 2: 56%|█████▌ | 6930/12384 [14:42:23<11:32:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 56%|█████▌ | 6931/12384 [14:42:23<11:32:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 56%|█████▌ | 6931/12384 [14:42:30<11:32:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 56%|█████▌ | 6932/12384 [14:42:30<11:31:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 56%|█████▌ | 6932/12384 [14:42:38<11:31:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 2: 56%|█████▌ | 6933/12384 [14:42:38<11:34:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 2: 56%|█████▌ | 6933/12384 [14:42:46<11:34:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.59s]
Epoch 2: 56%|█████▌ | 6934/12384 [14:42:46<11:33:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.59s]
Epoch 2: 56%|█████▌ | 6934/12384 [14:42:53<11:33:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 2: 56%|█████▌ | 6935/12384 [14:42:53<11:32:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 2: 56%|█████▌ | 6935/12384 [14:43:01<11:32:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.30s]
Epoch 2: 56%|█████▌ | 6936/12384 [14:43:01<11:31:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.30s]
Epoch 2: 56%|█████▌ | 6936/12384 [14:43:08<11:31:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 56%|█████▌ | 6937/12384 [14:43:08<11:30:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 56%|█████▌ | 6937/12384 [14:43:16<11:30:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 56%|█████▌ | 6938/12384 [14:43:16<11:30:12, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 56%|█████▌ | 6938/12384 [14:43:24<11:30:12, 7.60s/it, loss=0.0001, acc=0.9999, iter_time=7.61s]
Epoch 2: 56%|█████▌ | 6939/12384 [14:43:24<11:30:16, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=7.61s]
Epoch 2: 56%|█████▌ | 6939/12384 [14:43:31<11:30:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 2: 56%|█████▌ | 6940/12384 [14:43:31<11:30:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 2: 56%|█████▌ | 6940/12384 [14:43:39<11:30:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.53s]
Epoch 2: 56%|█████▌ | 6941/12384 [14:43:39<11:39:21, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.53s]
Epoch 2: 56%|█████▌ | 6941/12384 [14:43:47<11:39:21, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.29s]
Epoch 2: 56%|█████▌ | 6942/12384 [14:43:47<11:36:27, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.29s]
Epoch 2: 56%|█████▌ | 6942/12384 [14:43:55<11:36:27, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=11.50s]
Epoch 2: 56%|█████▌ | 6943/12384 [14:43:55<11:42:03, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=11.50s]
Epoch 2: 56%|█████▌ | 6943/12384 [14:44:02<11:42:03, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 56%|█████▌ | 6944/12384 [14:44:02<11:38:54, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 56%|█████▌ | 6944/12384 [14:44:10<11:38:54, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 56%|█████▌ | 6945/12384 [14:44:10<11:36:09, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 56%|█████▌ | 6945/12384 [14:44:18<11:36:09, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 2: 56%|█████▌ | 6946/12384 [14:44:18<11:34:34, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 2: 56%|█████▌ | 6946/12384 [14:44:25<11:34:34, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.97s]
Epoch 2: 56%|█████▌ | 6947/12384 [14:44:25<11:32:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.97s]
Epoch 2: 56%|█████▌ | 6947/12384 [14:44:33<11:32:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 2: 56%|█████▌ | 6948/12384 [14:44:33<11:31:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 2: 56%|█████▌ | 6948/12384 [14:44:40<11:31:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 56%|█████▌ | 6949/12384 [14:44:40<11:31:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 56%|█████▌ | 6949/12384 [14:44:48<11:31:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 56%|█████▌ | 6950/12384 [14:44:48<11:30:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 56%|█████▌ | 6950/12384 [14:44:56<11:30:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 56%|█████▌ | 6951/12384 [14:44:56<11:30:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 56%|█████▌ | 6951/12384 [14:45:03<11:30:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 56%|█████▌ | 6952/12384 [14:45:03<11:29:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 56%|█████▌ | 6952/12384 [14:45:11<11:29:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 2: 56%|█████▌ | 6953/12384 [14:45:11<11:32:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 2: 56%|█████▌ | 6953/12384 [14:45:19<11:32:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 2: 56%|█████▌ | 6954/12384 [14:45:19<11:31:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 2: 56%|█████▌ | 6954/12384 [14:45:26<11:31:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.24s]
Epoch 2: 56%|█████▌ | 6955/12384 [14:45:26<11:30:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.24s]
Epoch 2: 56%|█████▌ | 6955/12384 [14:45:34<11:30:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 56%|█████▌ | 6956/12384 [14:45:34<11:30:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 56%|█████▌ | 6956/12384 [14:45:41<11:30:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 56%|█████▌ | 6957/12384 [14:45:41<11:29:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 56%|█████▌ | 6957/12384 [14:45:49<11:29:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 56%|█████▌ | 6958/12384 [14:45:49<11:28:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 56%|█████▌ | 6958/12384 [14:45:57<11:28:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 56%|█████▌ | 6959/12384 [14:45:57<11:30:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 56%|█████▌ | 6959/12384 [14:46:04<11:30:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 56%|█████▌ | 6960/12384 [14:46:04<11:29:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 56%|█████▌ | 6960/12384 [14:46:12<11:29:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 56%|█████▌ | 6961/12384 [14:46:12<11:29:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 56%|█████▌ | 6961/12384 [14:46:20<11:29:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 2: 56%|█████▌ | 6962/12384 [14:46:20<11:28:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 2: 56%|█████▌ | 6962/12384 [14:46:27<11:28:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.04s]
Epoch 2: 56%|█████▌ | 6963/12384 [14:46:27<11:29:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.04s]
Epoch 2: 56%|█████▌ | 6963/12384 [14:46:35<11:29:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 2: 56%|█████▌ | 6964/12384 [14:46:35<11:28:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 2: 56%|█████▌ | 6964/12384 [14:46:42<11:28:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 2: 56%|█████▌ | 6965/12384 [14:46:42<11:27:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 2: 56%|█████▌ | 6965/12384 [14:46:50<11:27:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 56%|█████▋ | 6966/12384 [14:46:50<11:27:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 56%|█████▋ | 6966/12384 [14:46:58<11:27:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.21s]
Epoch 2: 56%|█████▋ | 6967/12384 [14:46:58<11:27:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.21s]
Epoch 2: 56%|█████▋ | 6967/12384 [14:47:06<11:27:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.46s]
Epoch 2: 56%|█████▋ | 6968/12384 [14:47:06<11:35:54, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=11.46s]
Epoch 2: 56%|█████▋ | 6968/12384 [14:47:13<11:35:54, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.22s]
Epoch 2: 56%|█████▋ | 6969/12384 [14:47:13<11:33:13, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.22s]
Epoch 2: 56%|█████▋ | 6969/12384 [14:47:21<11:33:13, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.64s]
Epoch 2: 56%|█████▋ | 6970/12384 [14:47:21<11:31:54, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.64s]
Epoch 2: 56%|█████▋ | 6970/12384 [14:47:29<11:31:54, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.92s]
Epoch 2: 56%|█████▋ | 6971/12384 [14:47:29<11:31:25, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.92s]
Epoch 2: 56%|█████▋ | 6971/12384 [14:47:36<11:31:25, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 56%|█████▋ | 6972/12384 [14:47:36<11:29:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 56%|█████▋ | 6972/12384 [14:47:44<11:29:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.60s]
Epoch 2: 56%|█████▋ | 6973/12384 [14:47:44<11:29:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.60s]
Epoch 2: 56%|█████▋ | 6973/12384 [14:47:51<11:29:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.94s]
Epoch 2: 56%|█████▋ | 6974/12384 [14:47:51<11:28:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.94s]
Epoch 2: 56%|█████▋ | 6974/12384 [14:47:59<11:28:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 2: 56%|█████▋ | 6975/12384 [14:47:59<11:28:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 2: 56%|█████▋ | 6975/12384 [14:48:07<11:28:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.51s]
Epoch 2: 56%|█████▋ | 6976/12384 [14:48:07<11:27:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.51s]
Epoch 2: 56%|█████▋ | 6976/12384 [14:48:14<11:27:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 56%|█████▋ | 6977/12384 [14:48:14<11:26:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 56%|█████▋ | 6977/12384 [14:48:22<11:26:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.26s]
Epoch 2: 56%|█████▋ | 6978/12384 [14:48:22<11:26:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.26s]
Epoch 2: 56%|█████▋ | 6978/12384 [14:48:29<11:26:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.00s]
Epoch 2: 56%|█████▋ | 6979/12384 [14:48:29<11:26:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.00s]
Epoch 2: 56%|█████▋ | 6979/12384 [14:48:37<11:26:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 2: 56%|█████▋ | 6980/12384 [14:48:37<11:25:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 2: 56%|█████▋ | 6980/12384 [14:48:45<11:25:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 56%|█████▋ | 6981/12384 [14:48:45<11:25:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 56%|█████▋ | 6981/12384 [14:48:52<11:25:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 2: 56%|█████▋ | 6982/12384 [14:48:52<11:27:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 2: 56%|█████▋ | 6982/12384 [14:49:00<11:27:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 56%|█████▋ | 6983/12384 [14:49:00<11:26:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 56%|█████▋ | 6983/12384 [14:49:08<11:26:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 56%|█████▋ | 6984/12384 [14:49:08<11:25:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 56%|█████▋ | 6984/12384 [14:49:15<11:25:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 56%|█████▋ | 6985/12384 [14:49:15<11:25:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 56%|█████▋ | 6985/12384 [14:49:23<11:25:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 56%|█████▋ | 6986/12384 [14:49:23<11:25:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 56%|█████▋ | 6986/12384 [14:49:30<11:25:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 56%|█████▋ | 6987/12384 [14:49:30<11:25:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 56%|█████▋ | 6987/12384 [14:49:38<11:25:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 56%|█████▋ | 6988/12384 [14:49:38<11:25:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 56%|█████▋ | 6988/12384 [14:49:46<11:25:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 2: 56%|█████▋ | 6989/12384 [14:49:46<11:25:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 2: 56%|█████▋ | 6989/12384 [14:49:53<11:25:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.41s]
Epoch 2: 56%|█████▋ | 6990/12384 [14:49:53<11:24:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.41s]
Epoch 2: 56%|█████▋ | 6990/12384 [14:50:01<11:24:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 56%|█████▋ | 6991/12384 [14:50:01<11:24:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 56%|█████▋ | 6991/12384 [14:50:09<11:24:15, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.90s]
Epoch 2: 56%|█████▋ | 6992/12384 [14:50:09<11:25:43, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.90s]
Epoch 2: 56%|█████▋ | 6992/12384 [14:50:16<11:25:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.62s]
Epoch 2: 56%|█████▋ | 6993/12384 [14:50:16<11:25:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.62s]
Epoch 2: 56%|█████▋ | 6993/12384 [14:50:24<11:25:10, 7.63s/it, loss=0.0001, acc=0.9987, iter_time=10.27s]
Epoch 2: 56%|█████▋ | 6994/12384 [14:50:24<11:34:07, 7.73s/it, loss=0.0001, acc=0.9987, iter_time=10.27s]
Epoch 2: 56%|█████▋ | 6994/12384 [14:50:32<11:34:07, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 2: 56%|█████▋ | 6995/12384 [14:50:32<11:38:43, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 2: 56%|█████▋ | 6995/12384 [14:50:40<11:38:43, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 56%|█████▋ | 6996/12384 [14:50:40<11:33:48, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 56%|█████▋ | 6996/12384 [14:50:47<11:33:48, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 2: 57%|█████▋ | 6997/12384 [14:50:47<11:29:52, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 2: 57%|█████▋ | 6997/12384 [14:50:55<11:29:52, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=9.60s]
Epoch 2: 57%|█████▋ | 6998/12384 [14:50:55<11:27:52, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=9.60s]
Epoch 2: 57%|█████▋ | 6998/12384 [14:51:02<11:27:52, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 57%|█████▋ | 6999/12384 [14:51:02<11:27:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 57%|█████▋ | 6999/12384 [14:51:10<11:27:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 2: 57%|█████▋ | 7000/12384 [14:51:10<11:28:54, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 2: 57%|█████▋ | 7000/12384 [14:51:18<11:28:54, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 57%|█████▋ | 7001/12384 [14:51:18<11:27:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 57%|█████▋ | 7001/12384 [14:51:25<11:27:03, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 2: 57%|█████▋ | 7002/12384 [14:51:25<11:25:38, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 2: 57%|█████▋ | 7002/12384 [14:51:33<11:25:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 57%|█████▋ | 7003/12384 [14:51:33<11:24:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 57%|█████▋ | 7003/12384 [14:51:41<11:24:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.06s]
Epoch 2: 57%|█████▋ | 7004/12384 [14:51:41<11:22:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.06s]
Epoch 2: 57%|█████▋ | 7004/12384 [14:51:48<11:22:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 2: 57%|█████▋ | 7005/12384 [14:51:48<11:22:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 2: 57%|█████▋ | 7005/12384 [14:51:56<11:22:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.45s]
Epoch 2: 57%|█████▋ | 7006/12384 [14:51:56<11:22:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.45s]
Epoch 2: 57%|█████▋ | 7006/12384 [14:52:03<11:22:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.75s]
Epoch 2: 57%|█████▋ | 7007/12384 [14:52:03<11:21:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.75s]
Epoch 2: 57%|█████▋ | 7007/12384 [14:52:11<11:21:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 57%|█████▋ | 7008/12384 [14:52:11<11:22:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 57%|█████▋ | 7008/12384 [14:52:19<11:22:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 57%|█████▋ | 7009/12384 [14:52:19<11:22:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 57%|█████▋ | 7009/12384 [14:52:26<11:22:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.89s]
Epoch 2: 57%|█████▋ | 7010/12384 [14:52:26<11:23:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.89s]
Epoch 2: 57%|█████▋ | 7010/12384 [14:52:34<11:23:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 2: 57%|█████▋ | 7011/12384 [14:52:34<11:23:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 2: 57%|█████▋ | 7011/12384 [14:52:42<11:23:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 2: 57%|█████▋ | 7012/12384 [14:52:42<11:23:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 2: 57%|█████▋ | 7012/12384 [14:52:49<11:23:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 2: 57%|█████▋ | 7013/12384 [14:52:49<11:22:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 2: 57%|█████▋ | 7013/12384 [14:52:57<11:22:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 57%|█████▋ | 7014/12384 [14:52:57<11:22:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 57%|█████▋ | 7014/12384 [14:53:04<11:22:28, 7.63s/it, loss=0.0002, acc=0.9998, iter_time=7.63s]
Epoch 2: 57%|█████▋ | 7015/12384 [14:53:04<11:21:47, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=7.63s]
Epoch 2: 57%|█████▋ | 7015/12384 [14:53:12<11:21:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 57%|█████▋ | 7016/12384 [14:53:12<11:21:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 57%|█████▋ | 7016/12384 [14:53:20<11:21:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 57%|█████▋ | 7017/12384 [14:53:20<11:21:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 57%|█████▋ | 7017/12384 [14:53:27<11:21:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 57%|█████▋ | 7018/12384 [14:53:27<11:21:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 57%|█████▋ | 7018/12384 [14:53:35<11:21:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 57%|█████▋ | 7019/12384 [14:53:35<11:20:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 57%|█████▋ | 7019/12384 [14:53:43<11:20:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 57%|█████▋ | 7020/12384 [14:53:43<11:20:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 57%|█████▋ | 7020/12384 [14:53:50<11:20:33, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.35s]
Epoch 2: 57%|█████▋ | 7021/12384 [14:53:50<11:30:13, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=8.35s]
Epoch 2: 57%|█████▋ | 7021/12384 [14:53:58<11:30:13, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 2: 57%|█████▋ | 7022/12384 [14:53:58<11:34:54, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 2: 57%|█████▋ | 7022/12384 [14:54:06<11:34:54, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 2: 57%|█████▋ | 7023/12384 [14:54:06<11:30:24, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 2: 57%|█████▋ | 7023/12384 [14:54:14<11:30:24, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.12s]
Epoch 2: 57%|█████▋ | 7024/12384 [14:54:14<11:27:33, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.12s]
Epoch 2: 57%|█████▋ | 7024/12384 [14:54:21<11:27:33, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 57%|█████▋ | 7025/12384 [14:54:21<11:25:11, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 57%|█████▋ | 7025/12384 [14:54:29<11:25:11, 7.67s/it, loss=0.0002, acc=0.9997, iter_time=7.62s]
Epoch 2: 57%|█████▋ | 7026/12384 [14:54:29<11:23:01, 7.65s/it, loss=0.0002, acc=0.9997, iter_time=7.62s]
Epoch 2: 57%|█████▋ | 7026/12384 [14:54:36<11:23:01, 7.65s/it, loss=0.0006, acc=0.9977, iter_time=7.31s]
Epoch 2: 57%|█████▋ | 7027/12384 [14:54:36<11:21:32, 7.63s/it, loss=0.0006, acc=0.9977, iter_time=7.31s]
Epoch 2: 57%|█████▋ | 7027/12384 [14:54:44<11:21:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 57%|█████▋ | 7028/12384 [14:54:44<11:20:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 57%|█████▋ | 7028/12384 [14:54:52<11:20:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 2: 57%|█████▋ | 7029/12384 [14:54:52<11:19:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 2: 57%|█████▋ | 7029/12384 [14:54:59<11:19:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 57%|█████▋ | 7030/12384 [14:54:59<11:19:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 57%|█████▋ | 7030/12384 [14:55:07<11:19:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 57%|█████▋ | 7031/12384 [14:55:07<11:20:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 57%|█████▋ | 7031/12384 [14:55:14<11:20:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 2: 57%|█████▋ | 7032/12384 [14:55:14<11:19:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 2: 57%|█████▋ | 7032/12384 [14:55:22<11:19:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.26s]
Epoch 2: 57%|█████▋ | 7033/12384 [14:55:22<11:18:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.26s]
Epoch 2: 57%|█████▋ | 7033/12384 [14:55:30<11:18:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 2: 57%|█████▋ | 7034/12384 [14:55:30<11:18:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 2: 57%|█████▋ | 7034/12384 [14:55:37<11:18:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.62s]
Epoch 2: 57%|█████▋ | 7035/12384 [14:55:37<11:18:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.62s]
Epoch 2: 57%|█████▋ | 7035/12384 [14:55:45<11:18:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 2: 57%|█████▋ | 7036/12384 [14:55:45<11:20:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 2: 57%|█████▋ | 7036/12384 [14:55:53<11:20:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 2: 57%|█████▋ | 7037/12384 [14:55:53<11:20:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 2: 57%|█████▋ | 7037/12384 [14:56:00<11:20:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.57s]
Epoch 2: 57%|█████▋ | 7038/12384 [14:56:00<11:22:01, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.57s]
Epoch 2: 57%|█████▋ | 7038/12384 [14:56:08<11:22:01, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 2: 57%|█████▋ | 7039/12384 [14:56:08<11:21:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 2: 57%|█████▋ | 7039/12384 [14:56:16<11:21:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 57%|█████▋ | 7040/12384 [14:56:16<11:19:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 57%|█████▋ | 7040/12384 [14:56:23<11:19:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.62s]
Epoch 2: 57%|█████▋ | 7041/12384 [14:56:23<11:18:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.62s]
Epoch 2: 57%|█████▋ | 7041/12384 [14:56:31<11:18:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 2: 57%|█████▋ | 7042/12384 [14:56:31<11:17:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 2: 57%|█████▋ | 7042/12384 [14:56:38<11:17:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.67s]
Epoch 2: 57%|█████▋ | 7043/12384 [14:56:38<11:17:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.67s]
Epoch 2: 57%|█████▋ | 7043/12384 [14:56:46<11:17:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.68s]
Epoch 2: 57%|█████▋ | 7044/12384 [14:56:46<11:19:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.68s]
Epoch 2: 57%|█████▋ | 7044/12384 [14:56:54<11:19:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 57%|█████▋ | 7045/12384 [14:56:54<11:18:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 57%|█████▋ | 7045/12384 [14:57:01<11:18:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 57%|█████▋ | 7046/12384 [14:57:01<11:17:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 57%|█████▋ | 7046/12384 [14:57:09<11:17:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 2: 57%|█████▋ | 7047/12384 [14:57:09<11:26:33, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 2: 57%|█████▋ | 7047/12384 [14:57:17<11:26:33, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 2: 57%|█████▋ | 7048/12384 [14:57:17<11:24:02, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 2: 57%|█████▋ | 7048/12384 [14:57:25<11:24:02, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 57%|█████▋ | 7049/12384 [14:57:25<11:28:59, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 57%|█████▋ | 7049/12384 [14:57:32<11:28:59, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 2: 57%|█████▋ | 7050/12384 [14:57:32<11:25:00, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 2: 57%|█████▋ | 7050/12384 [14:57:40<11:25:00, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 2: 57%|█████▋ | 7051/12384 [14:57:40<11:24:34, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 2: 57%|█████▋ | 7051/12384 [14:57:48<11:24:34, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.42s]
Epoch 2: 57%|█████▋ | 7052/12384 [14:57:48<11:21:14, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.42s]
Epoch 2: 57%|█████▋ | 7052/12384 [14:57:55<11:21:14, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.68s]
Epoch 2: 57%|█████▋ | 7053/12384 [14:57:55<11:19:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.68s]
Epoch 2: 57%|█████▋ | 7053/12384 [14:58:03<11:19:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 57%|█████▋ | 7054/12384 [14:58:03<11:18:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 57%|█████▋ | 7054/12384 [14:58:10<11:18:50, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=5.32s]
Epoch 2: 57%|█████▋ | 7055/12384 [14:58:10<11:18:03, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.32s]
Epoch 2: 57%|█████▋ | 7055/12384 [14:58:18<11:18:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.87s]
Epoch 2: 57%|█████▋ | 7056/12384 [14:58:18<11:17:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.87s]
Epoch 2: 57%|█████▋ | 7056/12384 [14:58:26<11:17:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 2: 57%|█████▋ | 7057/12384 [14:58:26<11:17:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 2: 57%|█████▋ | 7057/12384 [14:58:33<11:17:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.26s]
Epoch 2: 57%|█████▋ | 7058/12384 [14:58:33<11:17:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.26s]
Epoch 2: 57%|█████▋ | 7058/12384 [14:58:41<11:17:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 2: 57%|█████▋ | 7059/12384 [14:58:41<11:15:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 2: 57%|█████▋ | 7059/12384 [14:58:49<11:15:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 2: 57%|█████▋ | 7060/12384 [14:58:49<11:15:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 2: 57%|█████▋ | 7060/12384 [14:58:56<11:15:03, 7.61s/it, loss=0.0009, acc=0.9976, iter_time=7.59s]
Epoch 2: 57%|█████▋ | 7061/12384 [14:58:56<11:15:09, 7.61s/it, loss=0.0009, acc=0.9976, iter_time=7.59s]
Epoch 2: 57%|█████▋ | 7061/12384 [14:59:04<11:15:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 57%|█████▋ | 7062/12384 [14:59:04<11:16:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 57%|█████▋ | 7062/12384 [14:59:11<11:16:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 2: 57%|█████▋ | 7063/12384 [14:59:11<11:15:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 2: 57%|█████▋ | 7063/12384 [14:59:19<11:15:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 2: 57%|█████▋ | 7064/12384 [14:59:19<11:15:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 2: 57%|█████▋ | 7064/12384 [14:59:27<11:15:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 2: 57%|█████▋ | 7065/12384 [14:59:27<11:13:57, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 2: 57%|█████▋ | 7065/12384 [14:59:34<11:13:57, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 57%|█████▋ | 7066/12384 [14:59:34<11:13:54, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 57%|█████▋ | 7066/12384 [14:59:42<11:13:54, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 2: 57%|█████▋ | 7067/12384 [14:59:42<11:14:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 2: 57%|█████▋ | 7067/12384 [14:59:49<11:14:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 57%|█████▋ | 7068/12384 [14:59:49<11:14:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 57%|█████▋ | 7068/12384 [14:59:57<11:14:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 57%|█████▋ | 7069/12384 [14:59:57<11:14:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 57%|█████▋ | 7069/12384 [15:00:05<11:14:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 2: 57%|█████▋ | 7070/12384 [15:00:05<11:14:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 2: 57%|█████▋ | 7070/12384 [15:00:12<11:14:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 57%|█████▋ | 7071/12384 [15:00:12<11:14:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 57%|█████▋ | 7071/12384 [15:00:20<11:14:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 2: 57%|█████▋ | 7072/12384 [15:00:20<11:15:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 2: 57%|█████▋ | 7072/12384 [15:00:28<11:15:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 2: 57%|█████▋ | 7073/12384 [15:00:28<11:23:36, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 2: 57%|█████▋ | 7073/12384 [15:00:35<11:23:36, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=8.75s]
Epoch 2: 57%|█████▋ | 7074/12384 [15:00:35<11:20:57, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=8.75s]
Epoch 2: 57%|█████▋ | 7074/12384 [15:00:43<11:20:57, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 57%|█████▋ | 7075/12384 [15:00:43<11:26:18, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 57%|█████▋ | 7075/12384 [15:00:51<11:26:18, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 57%|█████▋ | 7076/12384 [15:00:51<11:22:46, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 57%|█████▋ | 7076/12384 [15:00:59<11:22:46, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 57%|█████▋ | 7077/12384 [15:00:59<11:19:31, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 57%|█████▋ | 7077/12384 [15:01:06<11:19:31, 7.68s/it, loss=0.0003, acc=0.9997, iter_time=7.61s]
Epoch 2: 57%|█████▋ | 7078/12384 [15:01:06<11:17:34, 7.66s/it, loss=0.0003, acc=0.9997, iter_time=7.61s]
Epoch 2: 57%|█████▋ | 7078/12384 [15:01:14<11:17:34, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 57%|█████▋ | 7079/12384 [15:01:14<11:16:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 57%|█████▋ | 7079/12384 [15:01:21<11:16:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 57%|█████▋ | 7080/12384 [15:01:21<11:14:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 57%|█████▋ | 7080/12384 [15:01:29<11:14:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.62s]
Epoch 2: 57%|█████▋ | 7081/12384 [15:01:29<11:14:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.62s]
Epoch 2: 57%|█████▋ | 7081/12384 [15:01:37<11:14:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.61s]
Epoch 2: 57%|█████▋ | 7082/12384 [15:01:37<11:13:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.61s]
Epoch 2: 57%|█████▋ | 7082/12384 [15:01:44<11:13:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.69s]
Epoch 2: 57%|█████▋ | 7083/12384 [15:01:44<11:13:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.69s]
Epoch 2: 57%|█████▋ | 7083/12384 [15:01:52<11:13:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.11s]
Epoch 2: 57%|█████▋ | 7084/12384 [15:01:52<11:12:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.11s]
Epoch 2: 57%|█████▋ | 7084/12384 [15:01:59<11:12:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 57%|█████▋ | 7085/12384 [15:01:59<11:12:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 57%|█████▋ | 7085/12384 [15:02:07<11:12:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 2: 57%|█████▋ | 7086/12384 [15:02:07<11:12:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 2: 57%|█████▋ | 7086/12384 [15:02:15<11:12:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 2: 57%|█████▋ | 7087/12384 [15:02:15<11:12:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 2: 57%|█████▋ | 7087/12384 [15:02:22<11:12:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 57%|█████▋ | 7088/12384 [15:02:22<11:11:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 57%|█████▋ | 7088/12384 [15:02:30<11:11:59, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.22s]
Epoch 2: 57%|█████▋ | 7089/12384 [15:02:30<11:11:33, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.22s]
Epoch 2: 57%|█████▋ | 7089/12384 [15:02:38<11:11:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 57%|█████▋ | 7090/12384 [15:02:38<11:11:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 57%|█████▋ | 7090/12384 [15:02:45<11:11:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 2: 57%|█████▋ | 7091/12384 [15:02:45<11:11:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 2: 57%|█████▋ | 7091/12384 [15:02:53<11:11:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 2: 57%|█████▋ | 7092/12384 [15:02:53<11:11:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 2: 57%|█████▋ | 7092/12384 [15:03:00<11:11:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 2: 57%|█████▋ | 7093/12384 [15:03:00<11:10:34, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 2: 57%|█████▋ | 7093/12384 [15:03:08<11:10:34, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 2: 57%|█████▋ | 7094/12384 [15:03:08<11:09:50, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 2: 57%|█████▋ | 7094/12384 [15:03:16<11:09:50, 7.60s/it, loss=0.0000, acc=0.9998, iter_time=10.01s]
Epoch 2: 57%|█████▋ | 7095/12384 [15:03:16<11:09:03, 7.59s/it, loss=0.0000, acc=0.9998, iter_time=10.01s]
Epoch 2: 57%|█████▋ | 7095/12384 [15:03:23<11:09:03, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 2: 57%|█████▋ | 7096/12384 [15:03:23<11:11:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 2: 57%|█████▋ | 7096/12384 [15:03:31<11:11:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 57%|█████▋ | 7097/12384 [15:03:31<11:13:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 57%|█████▋ | 7097/12384 [15:03:39<11:13:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 2: 57%|█████▋ | 7098/12384 [15:03:39<11:12:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 2: 57%|█████▋ | 7098/12384 [15:03:46<11:12:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 57%|█████▋ | 7099/12384 [15:03:46<11:20:07, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 57%|█████▋ | 7099/12384 [15:03:54<11:20:07, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 2: 57%|█████▋ | 7100/12384 [15:03:54<11:16:39, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 2: 57%|█████▋ | 7100/12384 [15:04:02<11:16:39, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 2: 57%|█████▋ | 7101/12384 [15:04:02<11:21:08, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 2: 57%|█████▋ | 7101/12384 [15:04:10<11:21:08, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 2: 57%|█████▋ | 7102/12384 [15:04:10<11:17:46, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 2: 57%|█████▋ | 7102/12384 [15:04:17<11:17:46, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 2: 57%|█████▋ | 7103/12384 [15:04:17<11:15:12, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 2: 57%|█████▋ | 7103/12384 [15:04:25<11:15:12, 7.67s/it, loss=0.0008, acc=0.9975, iter_time=7.98s]
Epoch 2: 57%|█████▋ | 7104/12384 [15:04:25<11:13:06, 7.65s/it, loss=0.0008, acc=0.9975, iter_time=7.98s]
Epoch 2: 57%|█████▋ | 7104/12384 [15:04:32<11:13:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 57%|█████▋ | 7105/12384 [15:04:32<11:11:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 57%|█████▋ | 7105/12384 [15:04:40<11:11:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 57%|█████▋ | 7106/12384 [15:04:40<11:11:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 57%|█████▋ | 7106/12384 [15:04:48<11:11:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 57%|█████▋ | 7107/12384 [15:04:48<11:10:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 57%|█████▋ | 7107/12384 [15:04:55<11:10:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 2: 57%|█████▋ | 7108/12384 [15:04:55<11:10:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 2: 57%|█████▋ | 7108/12384 [15:05:03<11:10:00, 7.62s/it, loss=0.0003, acc=0.9982, iter_time=8.73s]
Epoch 2: 57%|█████▋ | 7109/12384 [15:05:03<11:09:38, 7.62s/it, loss=0.0003, acc=0.9982, iter_time=8.73s]
Epoch 2: 57%|█████▋ | 7109/12384 [15:05:10<11:09:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 2: 57%|█████▋ | 7110/12384 [15:05:10<11:09:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 2: 57%|█████▋ | 7110/12384 [15:05:18<11:09:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 57%|█████▋ | 7111/12384 [15:05:18<11:09:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 57%|█████▋ | 7111/12384 [15:05:26<11:09:34, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=11.20s]
Epoch 2: 57%|█████▋ | 7112/12384 [15:05:26<11:10:34, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=11.20s]
Epoch 2: 57%|█████▋ | 7112/12384 [15:05:33<11:10:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.13s]
Epoch 2: 57%|█████▋ | 7113/12384 [15:05:33<11:10:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.13s]
Epoch 2: 57%|█████▋ | 7113/12384 [15:05:41<11:10:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.93s]
Epoch 2: 57%|█████▋ | 7114/12384 [15:05:41<11:09:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.93s]
Epoch 2: 57%|█████▋ | 7114/12384 [15:05:49<11:09:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.87s]
Epoch 2: 57%|█████▋ | 7115/12384 [15:05:49<11:09:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.87s]
Epoch 2: 57%|█████▋ | 7115/12384 [15:05:56<11:09:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 57%|█████▋ | 7116/12384 [15:05:56<11:08:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 57%|█████▋ | 7116/12384 [15:06:04<11:08:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.64s]
Epoch 2: 57%|█████▋ | 7117/12384 [15:06:04<11:08:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.64s]
Epoch 2: 57%|█████▋ | 7117/12384 [15:06:11<11:08:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.86s]
Epoch 2: 57%|█████▋ | 7118/12384 [15:06:11<11:08:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.86s]
Epoch 2: 57%|█████▋ | 7118/12384 [15:06:19<11:08:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 2: 57%|█████▋ | 7119/12384 [15:06:19<11:08:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 2: 57%|█████▋ | 7119/12384 [15:06:27<11:08:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.50s]
Epoch 2: 57%|█████▋ | 7120/12384 [15:06:27<11:07:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.50s]
Epoch 2: 57%|█████▋ | 7120/12384 [15:06:34<11:07:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.60s]
Epoch 2: 58%|█████▊ | 7121/12384 [15:06:34<11:07:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.60s]
Epoch 2: 58%|█████▊ | 7121/12384 [15:06:42<11:07:56, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.37s]
Epoch 2: 58%|█████▊ | 7122/12384 [15:06:42<11:07:08, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.37s]
Epoch 2: 58%|█████▊ | 7122/12384 [15:06:49<11:07:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.43s]
Epoch 2: 58%|█████▊ | 7123/12384 [15:06:49<11:06:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.43s]
Epoch 2: 58%|█████▊ | 7123/12384 [15:06:57<11:06:47, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 2: 58%|█████▊ | 7124/12384 [15:06:57<11:07:59, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 2: 58%|█████▊ | 7124/12384 [15:07:05<11:07:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 2: 58%|█████▊ | 7125/12384 [15:07:05<11:16:48, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 2: 58%|█████▊ | 7125/12384 [15:07:13<11:16:48, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 58%|█████▊ | 7126/12384 [15:07:13<11:13:43, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 58%|█████▊ | 7126/12384 [15:07:20<11:13:43, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 58%|█████▊ | 7127/12384 [15:07:20<11:18:54, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 58%|█████▊ | 7127/12384 [15:07:28<11:18:54, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 58%|█████▊ | 7128/12384 [15:07:28<11:15:49, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 58%|█████▊ | 7128/12384 [15:07:36<11:15:49, 7.71s/it, loss=0.0001, acc=0.9993, iter_time=7.24s]
Epoch 2: 58%|█████▊ | 7129/12384 [15:07:36<11:13:14, 7.69s/it, loss=0.0001, acc=0.9993, iter_time=7.24s]
Epoch 2: 58%|█████▊ | 7129/12384 [15:07:43<11:13:14, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 58%|█████▊ | 7130/12384 [15:07:43<11:10:23, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 58%|█████▊ | 7130/12384 [15:07:51<11:10:23, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 58%|█████▊ | 7131/12384 [15:07:51<11:09:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 58%|█████▊ | 7131/12384 [15:07:59<11:09:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 2: 58%|█████▊ | 7132/12384 [15:07:59<11:08:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 2: 58%|█████▊ | 7132/12384 [15:08:06<11:08:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 2: 58%|█████▊ | 7133/12384 [15:08:06<11:07:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 2: 58%|█████▊ | 7133/12384 [15:08:14<11:07:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 2: 58%|█████▊ | 7134/12384 [15:08:14<11:07:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 2: 58%|█████▊ | 7134/12384 [15:08:21<11:07:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 58%|█████▊ | 7135/12384 [15:08:21<11:06:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 58%|█████▊ | 7135/12384 [15:08:29<11:06:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 58%|█████▊ | 7136/12384 [15:08:29<11:06:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 58%|█████▊ | 7136/12384 [15:08:37<11:06:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 2: 58%|█████▊ | 7137/12384 [15:08:37<11:07:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 2: 58%|█████▊ | 7137/12384 [15:08:44<11:07:50, 7.64s/it, loss=0.0001, acc=0.9999, iter_time=9.17s]
Epoch 2: 58%|█████▊ | 7138/12384 [15:08:44<11:07:39, 7.64s/it, loss=0.0001, acc=0.9999, iter_time=9.17s]
Epoch 2: 58%|█████▊ | 7138/12384 [15:08:52<11:07:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 58%|█████▊ | 7139/12384 [15:08:52<11:06:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 58%|█████▊ | 7139/12384 [15:09:00<11:06:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 58%|█████▊ | 7140/12384 [15:09:00<11:05:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 58%|█████▊ | 7140/12384 [15:09:07<11:05:39, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 2: 58%|█████▊ | 7141/12384 [15:09:07<11:05:25, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 2: 58%|█████▊ | 7141/12384 [15:09:15<11:05:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 58%|█████▊ | 7142/12384 [15:09:15<11:05:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 58%|█████▊ | 7142/12384 [15:09:22<11:05:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 2: 58%|█████▊ | 7143/12384 [15:09:22<11:04:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 2: 58%|█████▊ | 7143/12384 [15:09:30<11:04:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 2: 58%|█████▊ | 7144/12384 [15:09:30<11:03:48, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 2: 58%|█████▊ | 7144/12384 [15:09:38<11:03:48, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 58%|█████▊ | 7145/12384 [15:09:38<11:04:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 58%|█████▊ | 7145/12384 [15:09:45<11:04:04, 7.61s/it, loss=0.0003, acc=0.9990, iter_time=7.63s]
Epoch 2: 58%|█████▊ | 7146/12384 [15:09:45<11:04:14, 7.61s/it, loss=0.0003, acc=0.9990, iter_time=7.63s]
Epoch 2: 58%|█████▊ | 7146/12384 [15:09:53<11:04:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 58%|█████▊ | 7147/12384 [15:09:53<11:06:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 58%|█████▊ | 7147/12384 [15:10:00<11:06:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 58%|█████▊ | 7148/12384 [15:10:00<11:04:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 58%|█████▊ | 7148/12384 [15:10:08<11:04:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 58%|█████▊ | 7149/12384 [15:10:08<11:04:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 58%|█████▊ | 7149/12384 [15:10:16<11:04:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 58%|█████▊ | 7150/12384 [15:10:16<11:05:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 58%|█████▊ | 7150/12384 [15:10:23<11:05:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.31s]
Epoch 2: 58%|█████▊ | 7151/12384 [15:10:23<11:04:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.31s]
Epoch 2: 58%|█████▊ | 7151/12384 [15:10:31<11:04:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.34s]
Epoch 2: 58%|█████▊ | 7152/12384 [15:10:31<11:11:49, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=11.34s]
Epoch 2: 58%|█████▊ | 7152/12384 [15:10:39<11:11:49, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=5.94s]
Epoch 2: 58%|█████▊ | 7153/12384 [15:10:39<11:10:20, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=5.94s]
Epoch 2: 58%|█████▊ | 7153/12384 [15:10:46<11:10:20, 7.69s/it, loss=0.0002, acc=1.0000, iter_time=9.18s]
Epoch 2: 58%|█████▊ | 7154/12384 [15:10:46<11:07:43, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=9.18s]
Epoch 2: 58%|█████▊ | 7154/12384 [15:10:54<11:07:43, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 2: 58%|█████▊ | 7155/12384 [15:10:54<11:05:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 2: 58%|█████▊ | 7155/12384 [15:11:02<11:05:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 2: 58%|█████▊ | 7156/12384 [15:11:02<11:05:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 2: 58%|█████▊ | 7156/12384 [15:11:09<11:05:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 58%|█████▊ | 7157/12384 [15:11:09<11:06:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 58%|█████▊ | 7157/12384 [15:11:17<11:06:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.37s]
Epoch 2: 58%|█████▊ | 7158/12384 [15:11:17<11:05:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.37s]
Epoch 2: 58%|█████▊ | 7158/12384 [15:11:25<11:05:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 2: 58%|█████▊ | 7159/12384 [15:11:25<11:04:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 2: 58%|█████▊ | 7159/12384 [15:11:32<11:04:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 58%|█████▊ | 7160/12384 [15:11:32<11:04:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 58%|█████▊ | 7160/12384 [15:11:40<11:04:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 58%|█████▊ | 7161/12384 [15:11:40<11:03:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 58%|█████▊ | 7161/12384 [15:11:47<11:03:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 2: 58%|█████▊ | 7162/12384 [15:11:47<11:03:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 2: 58%|█████▊ | 7162/12384 [15:11:55<11:03:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 58%|█████▊ | 7163/12384 [15:11:55<11:02:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 58%|█████▊ | 7163/12384 [15:12:03<11:02:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 58%|█████▊ | 7164/12384 [15:12:03<11:01:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 58%|█████▊ | 7164/12384 [15:12:10<11:01:59, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.71s]
Epoch 2: 58%|█████▊ | 7165/12384 [15:12:10<11:02:11, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=8.71s]
Epoch 2: 58%|█████▊ | 7165/12384 [15:12:18<11:02:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 58%|█████▊ | 7166/12384 [15:12:18<11:02:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 58%|█████▊ | 7166/12384 [15:12:25<11:02:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 58%|█████▊ | 7167/12384 [15:12:25<11:01:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 58%|█████▊ | 7167/12384 [15:12:33<11:01:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 58%|█████▊ | 7168/12384 [15:12:33<11:01:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 58%|█████▊ | 7168/12384 [15:12:41<11:01:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.28s]
Epoch 2: 58%|█████▊ | 7169/12384 [15:12:41<11:01:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.28s]
Epoch 2: 58%|█████▊ | 7169/12384 [15:12:48<11:01:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 2: 58%|█████▊ | 7170/12384 [15:12:48<11:01:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 2: 58%|█████▊ | 7170/12384 [15:12:56<11:01:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 2: 58%|█████▊ | 7171/12384 [15:12:56<11:01:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 2: 58%|█████▊ | 7171/12384 [15:13:03<11:01:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.21s]
Epoch 2: 58%|█████▊ | 7172/12384 [15:13:03<11:00:16, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.21s]
Epoch 2: 58%|█████▊ | 7172/12384 [15:13:11<11:00:16, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.33s]
Epoch 2: 58%|█████▊ | 7173/12384 [15:13:11<11:00:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.33s]
Epoch 2: 58%|█████▊ | 7173/12384 [15:13:19<11:00:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 2: 58%|█████▊ | 7174/12384 [15:13:19<11:00:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 2: 58%|█████▊ | 7174/12384 [15:13:26<11:00:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 58%|█████▊ | 7175/12384 [15:13:26<11:00:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 58%|█████▊ | 7175/12384 [15:13:34<11:00:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 2: 58%|█████▊ | 7176/12384 [15:13:34<11:00:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 2: 58%|█████▊ | 7176/12384 [15:13:42<11:00:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 2: 58%|█████▊ | 7177/12384 [15:13:42<11:01:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 2: 58%|█████▊ | 7177/12384 [15:13:50<11:01:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.45s]
Epoch 2: 58%|█████▊ | 7178/12384 [15:13:50<11:10:07, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.45s]
Epoch 2: 58%|█████▊ | 7178/12384 [15:13:57<11:10:07, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 58%|█████▊ | 7179/12384 [15:13:57<11:06:44, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 58%|█████▊ | 7179/12384 [15:14:05<11:06:44, 7.69s/it, loss=0.0002, acc=1.0000, iter_time=7.65s]
Epoch 2: 58%|█████▊ | 7180/12384 [15:14:05<11:04:35, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.65s]
Epoch 2: 58%|█████▊ | 7180/12384 [15:14:12<11:04:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 2: 58%|█████▊ | 7181/12384 [15:14:12<11:02:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 2: 58%|█████▊ | 7181/12384 [15:14:20<11:02:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 58%|█████▊ | 7182/12384 [15:14:20<11:02:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 58%|█████▊ | 7182/12384 [15:14:28<11:02:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.98s]
Epoch 2: 58%|█████▊ | 7183/12384 [15:14:28<11:01:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.98s]
Epoch 2: 58%|█████▊ | 7183/12384 [15:14:35<11:01:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 2: 58%|█████▊ | 7184/12384 [15:14:35<11:02:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 2: 58%|█████▊ | 7184/12384 [15:14:43<11:02:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 58%|█████▊ | 7185/12384 [15:14:43<11:01:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 58%|█████▊ | 7185/12384 [15:14:50<11:01:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 58%|█████▊ | 7186/12384 [15:14:50<11:00:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 58%|█████▊ | 7186/12384 [15:14:58<11:00:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 58%|█████▊ | 7187/12384 [15:14:58<10:59:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 58%|█████▊ | 7187/12384 [15:15:06<10:59:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 2: 58%|█████▊ | 7188/12384 [15:15:06<10:59:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 2: 58%|█████▊ | 7188/12384 [15:15:13<10:59:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.91s]
Epoch 2: 58%|█████▊ | 7189/12384 [15:15:13<10:58:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.91s]
Epoch 2: 58%|█████▊ | 7189/12384 [15:15:21<10:58:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 58%|█████▊ | 7190/12384 [15:15:21<10:59:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 58%|█████▊ | 7190/12384 [15:15:29<10:59:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 58%|█████▊ | 7191/12384 [15:15:29<10:59:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 58%|█████▊ | 7191/12384 [15:15:36<10:59:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 58%|█████▊ | 7192/12384 [15:15:36<10:59:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 58%|█████▊ | 7192/12384 [15:15:44<10:59:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 58%|█████▊ | 7193/12384 [15:15:44<10:59:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 58%|█████▊ | 7193/12384 [15:15:51<10:59:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 58%|█████▊ | 7194/12384 [15:15:51<11:00:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 58%|█████▊ | 7194/12384 [15:15:59<11:00:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 58%|█████▊ | 7195/12384 [15:15:59<10:59:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 58%|█████▊ | 7195/12384 [15:16:07<10:59:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 58%|█████▊ | 7196/12384 [15:16:07<10:58:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 58%|█████▊ | 7196/12384 [15:16:14<10:58:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 58%|█████▊ | 7197/12384 [15:16:14<10:57:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 58%|█████▊ | 7197/12384 [15:16:22<10:57:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 58%|█████▊ | 7198/12384 [15:16:22<10:57:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 58%|█████▊ | 7198/12384 [15:16:29<10:57:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 58%|█████▊ | 7199/12384 [15:16:29<10:57:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 58%|█████▊ | 7199/12384 [15:16:37<10:57:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 58%|█████▊ | 7200/12384 [15:16:37<10:58:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 58%|█████▊ | 7200/12384 [15:16:45<10:58:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 58%|█████▊ | 7201/12384 [15:16:45<10:57:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 58%|█████▊ | 7201/12384 [15:16:52<10:57:20, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.68s]
Epoch 2: 58%|█████▊ | 7202/12384 [15:16:52<10:59:13, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.68s]
Epoch 2: 58%|█████▊ | 7202/12384 [15:17:00<10:59:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 58%|█████▊ | 7203/12384 [15:17:00<10:58:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 58%|█████▊ | 7203/12384 [15:17:08<10:58:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 58%|█████▊ | 7204/12384 [15:17:08<10:57:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 58%|█████▊ | 7204/12384 [15:17:16<10:57:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 58%|█████▊ | 7205/12384 [15:17:16<11:05:33, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 58%|█████▊ | 7205/12384 [15:17:23<11:05:33, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 2: 58%|█████▊ | 7206/12384 [15:17:23<11:11:50, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 2: 58%|█████▊ | 7206/12384 [15:17:31<11:11:50, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 2: 58%|█████▊ | 7207/12384 [15:17:31<11:06:51, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 2: 58%|█████▊ | 7207/12384 [15:17:39<11:06:51, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=9.54s]
Epoch 2: 58%|█████▊ | 7208/12384 [15:17:39<11:03:29, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.54s]
Epoch 2: 58%|█████▊ | 7208/12384 [15:17:46<11:03:29, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 2: 58%|█████▊ | 7209/12384 [15:17:46<11:01:22, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 2: 58%|█████▊ | 7209/12384 [15:17:54<11:01:22, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 58%|█████▊ | 7210/12384 [15:17:54<11:00:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 58%|█████▊ | 7210/12384 [15:18:02<11:00:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 58%|█████▊ | 7211/12384 [15:18:02<10:59:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 58%|█████▊ | 7211/12384 [15:18:09<10:59:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 58%|█████▊ | 7212/12384 [15:18:09<10:58:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 58%|█████▊ | 7212/12384 [15:18:17<10:58:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 58%|█████▊ | 7213/12384 [15:18:17<10:56:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 58%|█████▊ | 7213/12384 [15:18:24<10:56:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 2: 58%|█████▊ | 7214/12384 [15:18:24<10:55:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 2: 58%|█████▊ | 7214/12384 [15:18:32<10:55:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.02s]
Epoch 2: 58%|█████▊ | 7215/12384 [15:18:32<10:55:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.02s]
Epoch 2: 58%|█████▊ | 7215/12384 [15:18:40<10:55:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 58%|█████▊ | 7216/12384 [15:18:40<10:55:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 58%|█████▊ | 7216/12384 [15:18:47<10:55:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 58%|█████▊ | 7217/12384 [15:18:47<10:54:53, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 58%|█████▊ | 7217/12384 [15:18:55<10:54:53, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 58%|█████▊ | 7218/12384 [15:18:55<10:54:32, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 58%|█████▊ | 7218/12384 [15:19:02<10:54:32, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 2: 58%|█████▊ | 7219/12384 [15:19:02<10:53:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 2: 58%|█████▊ | 7219/12384 [15:19:10<10:53:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 58%|█████▊ | 7220/12384 [15:19:10<10:54:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 58%|█████▊ | 7220/12384 [15:19:18<10:54:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.52s]
Epoch 2: 58%|█████▊ | 7221/12384 [15:19:18<10:54:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.52s]
Epoch 2: 58%|█████▊ | 7221/12384 [15:19:25<10:54:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.97s]
Epoch 2: 58%|█████▊ | 7222/12384 [15:19:25<10:54:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.97s]
Epoch 2: 58%|█████▊ | 7222/12384 [15:19:33<10:54:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.73s]
Epoch 2: 58%|█████▊ | 7223/12384 [15:19:33<10:54:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.73s]
Epoch 2: 58%|█████▊ | 7223/12384 [15:19:40<10:54:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.82s]
Epoch 2: 58%|█████▊ | 7224/12384 [15:19:40<10:54:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.82s]
Epoch 2: 58%|█████▊ | 7224/12384 [15:19:48<10:54:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.69s]
Epoch 2: 58%|█████▊ | 7225/12384 [15:19:48<10:53:48, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.69s]
Epoch 2: 58%|█████▊ | 7225/12384 [15:19:56<10:53:48, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 58%|█████▊ | 7226/12384 [15:19:56<10:53:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 58%|█████▊ | 7226/12384 [15:20:03<10:53:11, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.10s]
Epoch 2: 58%|█████▊ | 7227/12384 [15:20:03<10:52:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.10s]
Epoch 2: 58%|█████▊ | 7227/12384 [15:20:11<10:52:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 58%|█████▊ | 7228/12384 [15:20:11<10:53:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 58%|█████▊ | 7228/12384 [15:20:18<10:53:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 2: 58%|█████▊ | 7229/12384 [15:20:18<10:53:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 2: 58%|█████▊ | 7229/12384 [15:20:26<10:53:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 2: 58%|█████▊ | 7230/12384 [15:20:26<10:53:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 2: 58%|█████▊ | 7230/12384 [15:20:34<10:53:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 58%|█████▊ | 7231/12384 [15:20:34<11:01:52, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 58%|█████▊ | 7231/12384 [15:20:42<11:01:52, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 2: 58%|█████▊ | 7232/12384 [15:20:42<11:04:04, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 2: 58%|█████▊ | 7232/12384 [15:20:50<11:04:04, 7.73s/it, loss=0.0001, acc=0.9990, iter_time=7.69s]
Epoch 2: 58%|█████▊ | 7233/12384 [15:20:50<11:08:12, 7.78s/it, loss=0.0001, acc=0.9990, iter_time=7.69s]
Epoch 2: 58%|█████▊ | 7233/12384 [15:20:57<11:08:12, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 58%|█████▊ | 7234/12384 [15:20:57<11:04:38, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 58%|█████▊ | 7234/12384 [15:21:05<11:04:38, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 58%|█████▊ | 7235/12384 [15:21:05<11:01:06, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 58%|█████▊ | 7235/12384 [15:21:13<11:01:06, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 2: 58%|█████▊ | 7236/12384 [15:21:13<10:59:09, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 2: 58%|█████▊ | 7236/12384 [15:21:20<10:59:09, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 2: 58%|█████▊ | 7237/12384 [15:21:20<10:57:42, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 2: 58%|█████▊ | 7237/12384 [15:21:28<10:57:42, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 2: 58%|█████▊ | 7238/12384 [15:21:28<10:55:18, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 2: 58%|█████▊ | 7238/12384 [15:21:35<10:55:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 2: 58%|█████▊ | 7239/12384 [15:21:35<10:54:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 2: 58%|█████▊ | 7239/12384 [15:21:43<10:54:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.32s]
Epoch 2: 58%|█████▊ | 7240/12384 [15:21:43<10:54:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.32s]
Epoch 2: 58%|█████▊ | 7240/12384 [15:21:51<10:54:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 58%|█████▊ | 7241/12384 [15:21:51<10:53:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 58%|█████▊ | 7241/12384 [15:21:58<10:53:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 58%|█████▊ | 7242/12384 [15:21:58<10:53:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 58%|█████▊ | 7242/12384 [15:22:06<10:53:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 2: 58%|█████▊ | 7243/12384 [15:22:06<10:52:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 2: 58%|█████▊ | 7243/12384 [15:22:13<10:52:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 2: 58%|█████▊ | 7244/12384 [15:22:13<10:52:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 2: 58%|█████▊ | 7244/12384 [15:22:21<10:52:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 2: 59%|█████▊ | 7245/12384 [15:22:21<10:52:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 2: 59%|█████▊ | 7245/12384 [15:22:29<10:52:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 2: 59%|█████▊ | 7246/12384 [15:22:29<10:52:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 2: 59%|█████▊ | 7246/12384 [15:22:36<10:52:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 59%|█████▊ | 7247/12384 [15:22:36<10:52:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 59%|█████▊ | 7247/12384 [15:22:44<10:52:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.10s]
Epoch 2: 59%|█████▊ | 7248/12384 [15:22:44<10:53:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.10s]
Epoch 2: 59%|█████▊ | 7248/12384 [15:22:52<10:53:57, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.28s]
Epoch 2: 59%|█████▊ | 7249/12384 [15:22:52<10:52:48, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.28s]
Epoch 2: 59%|█████▊ | 7249/12384 [15:22:59<10:52:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 59%|█████▊ | 7250/12384 [15:22:59<10:52:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 59%|█████▊ | 7250/12384 [15:23:07<10:52:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 59%|█████▊ | 7251/12384 [15:23:07<10:51:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 59%|█████▊ | 7251/12384 [15:23:14<10:51:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 59%|█████▊ | 7252/12384 [15:23:14<10:50:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 59%|█████▊ | 7252/12384 [15:23:22<10:50:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 2: 59%|█████▊ | 7253/12384 [15:23:22<10:50:07, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 2: 59%|█████▊ | 7253/12384 [15:23:30<10:50:07, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 2: 59%|█████▊ | 7254/12384 [15:23:30<10:49:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 2: 59%|█████▊ | 7254/12384 [15:23:37<10:49:49, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 2: 59%|█████▊ | 7255/12384 [15:23:37<10:50:04, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 2: 59%|█████▊ | 7255/12384 [15:23:45<10:50:04, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 59%|█████▊ | 7256/12384 [15:23:45<10:49:34, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 59%|█████▊ | 7256/12384 [15:23:53<10:49:34, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 59%|█████▊ | 7257/12384 [15:23:53<10:56:09, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 59%|█████▊ | 7257/12384 [15:24:00<10:56:09, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 2: 59%|█████▊ | 7258/12384 [15:24:00<10:54:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 2: 59%|█████▊ | 7258/12384 [15:24:08<10:54:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 2: 59%|█████▊ | 7259/12384 [15:24:08<10:55:35, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 2: 59%|█████▊ | 7259/12384 [15:24:16<10:55:35, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 59%|█████▊ | 7260/12384 [15:24:16<11:00:56, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 59%|█████▊ | 7260/12384 [15:24:23<11:00:56, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=4.57s]
Epoch 2: 59%|█████▊ | 7261/12384 [15:24:23<10:57:45, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.57s]
Epoch 2: 59%|█████▊ | 7261/12384 [15:24:31<10:57:45, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 2: 59%|█████▊ | 7262/12384 [15:24:31<10:55:41, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 2: 59%|█████▊ | 7262/12384 [15:24:39<10:55:41, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 2: 59%|█████▊ | 7263/12384 [15:24:39<10:53:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 2: 59%|█████▊ | 7263/12384 [15:24:46<10:53:21, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=10.26s]
Epoch 2: 59%|█████▊ | 7264/12384 [15:24:46<10:51:52, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=10.26s]
Epoch 2: 59%|█████▊ | 7264/12384 [15:24:54<10:51:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 59%|█████▊ | 7265/12384 [15:24:54<10:51:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 59%|█████▊ | 7265/12384 [15:25:02<10:51:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 59%|█████▊ | 7266/12384 [15:25:02<10:50:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 59%|█████▊ | 7266/12384 [15:25:09<10:50:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 59%|█████▊ | 7267/12384 [15:25:09<10:49:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 59%|█████▊ | 7267/12384 [15:25:17<10:49:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 59%|█████▊ | 7268/12384 [15:25:17<10:49:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 59%|█████▊ | 7268/12384 [15:25:24<10:49:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 2: 59%|█████▊ | 7269/12384 [15:25:24<10:48:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 2: 59%|█████▊ | 7269/12384 [15:25:32<10:48:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.77s]
Epoch 2: 59%|█████▊ | 7270/12384 [15:25:32<10:50:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.77s]
Epoch 2: 59%|█████▊ | 7270/12384 [15:25:40<10:50:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.80s]
Epoch 2: 59%|█████▊ | 7271/12384 [15:25:40<10:50:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.80s]
Epoch 2: 59%|█████▊ | 7271/12384 [15:25:47<10:50:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 59%|█████▊ | 7272/12384 [15:25:47<10:51:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 59%|█████▊ | 7272/12384 [15:25:55<10:51:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 59%|█████▊ | 7273/12384 [15:25:55<10:50:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 59%|█████▊ | 7273/12384 [15:26:03<10:50:21, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 2: 59%|█████▊ | 7274/12384 [15:26:03<10:49:23, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 2: 59%|█████▊ | 7274/12384 [15:26:10<10:49:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 59%|█████▊ | 7275/12384 [15:26:10<10:49:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 59%|█████▊ | 7275/12384 [15:26:18<10:49:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 2: 59%|█████▉ | 7276/12384 [15:26:18<10:48:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 2: 59%|█████▉ | 7276/12384 [15:26:25<10:48:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.96s]
Epoch 2: 59%|█████▉ | 7277/12384 [15:26:25<10:48:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.96s]
Epoch 2: 59%|█████▉ | 7277/12384 [15:26:33<10:48:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 2: 59%|█████▉ | 7278/12384 [15:26:33<10:47:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 2: 59%|█████▉ | 7278/12384 [15:26:41<10:47:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 2: 59%|█████▉ | 7279/12384 [15:26:41<10:46:45, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 2: 59%|█████▉ | 7279/12384 [15:26:48<10:46:45, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 2: 59%|█████▉ | 7280/12384 [15:26:48<10:47:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 2: 59%|█████▉ | 7280/12384 [15:26:56<10:47:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.52s]
Epoch 2: 59%|█████▉ | 7281/12384 [15:26:56<10:46:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.52s]
Epoch 2: 59%|█████▉ | 7281/12384 [15:27:03<10:46:19, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.11s]
Epoch 2: 59%|█████▉ | 7282/12384 [15:27:03<10:46:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.11s]
Epoch 2: 59%|█████▉ | 7282/12384 [15:27:11<10:46:20, 7.60s/it, loss=0.0001, acc=0.9998, iter_time=7.25s]
Epoch 2: 59%|█████▉ | 7283/12384 [15:27:11<10:56:20, 7.72s/it, loss=0.0001, acc=0.9998, iter_time=7.25s]
Epoch 2: 59%|█████▉ | 7283/12384 [15:27:19<10:56:20, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 2: 59%|█████▉ | 7284/12384 [15:27:19<10:53:11, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 2: 59%|█████▉ | 7284/12384 [15:27:27<10:53:11, 7.68s/it, loss=0.0001, acc=0.9993, iter_time=9.11s]
Epoch 2: 59%|█████▉ | 7285/12384 [15:27:27<10:51:24, 7.67s/it, loss=0.0001, acc=0.9993, iter_time=9.11s]
Epoch 2: 59%|█████▉ | 7285/12384 [15:27:34<10:51:24, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 2: 59%|█████▉ | 7286/12384 [15:27:34<10:49:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 2: 59%|█████▉ | 7286/12384 [15:27:42<10:49:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 2: 59%|█████▉ | 7287/12384 [15:27:42<10:49:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 2: 59%|█████▉ | 7287/12384 [15:27:49<10:49:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.16s]
Epoch 2: 59%|█████▉ | 7288/12384 [15:27:49<10:49:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.16s]
Epoch 2: 59%|█████▉ | 7288/12384 [15:27:57<10:49:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 59%|█████▉ | 7289/12384 [15:27:57<10:49:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 59%|█████▉ | 7289/12384 [15:28:05<10:49:02, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.45s]
Epoch 2: 59%|█████▉ | 7290/12384 [15:28:05<10:47:38, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.45s]
Epoch 2: 59%|█████▉ | 7290/12384 [15:28:12<10:47:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 2: 59%|█████▉ | 7291/12384 [15:28:12<10:46:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.79s]
Epoch 2: 59%|█████▉ | 7291/12384 [15:28:20<10:46:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 2: 59%|█████▉ | 7292/12384 [15:28:20<10:46:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 2: 59%|█████▉ | 7292/12384 [15:28:28<10:46:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 2: 59%|█████▉ | 7293/12384 [15:28:28<10:48:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 2: 59%|█████▉ | 7293/12384 [15:28:35<10:48:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 2: 59%|█████▉ | 7294/12384 [15:28:35<10:47:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 2: 59%|█████▉ | 7294/12384 [15:28:43<10:47:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 2: 59%|█████▉ | 7295/12384 [15:28:43<10:47:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 2: 59%|█████▉ | 7295/12384 [15:28:50<10:47:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.86s]
Epoch 2: 59%|█████▉ | 7296/12384 [15:28:50<10:46:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.86s]
Epoch 2: 59%|█████▉ | 7296/12384 [15:28:58<10:46:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 59%|█████▉ | 7297/12384 [15:28:58<10:46:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 59%|█████▉ | 7297/12384 [15:29:06<10:46:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 59%|█████▉ | 7298/12384 [15:29:06<10:46:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 59%|█████▉ | 7298/12384 [15:29:13<10:46:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 59%|█████▉ | 7299/12384 [15:29:13<10:45:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 59%|█████▉ | 7299/12384 [15:29:21<10:45:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 59%|█████▉ | 7300/12384 [15:29:21<10:45:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 59%|█████▉ | 7300/12384 [15:29:29<10:45:18, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 2: 59%|█████▉ | 7301/12384 [15:29:29<10:44:58, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 2: 59%|█████▉ | 7301/12384 [15:29:36<10:44:58, 7.61s/it, loss=0.0014, acc=0.9973, iter_time=7.61s]
Epoch 2: 59%|█████▉ | 7302/12384 [15:29:36<10:45:00, 7.62s/it, loss=0.0014, acc=0.9973, iter_time=7.61s]
Epoch 2: 59%|█████▉ | 7302/12384 [15:29:44<10:45:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 59%|█████▉ | 7303/12384 [15:29:44<10:45:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 59%|█████▉ | 7303/12384 [15:29:51<10:45:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 59%|█████▉ | 7304/12384 [15:29:51<10:44:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 59%|█████▉ | 7304/12384 [15:29:59<10:44:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.75s]
Epoch 2: 59%|█████▉ | 7305/12384 [15:29:59<10:44:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.75s]
Epoch 2: 59%|█████▉ | 7305/12384 [15:30:07<10:44:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 2: 59%|█████▉ | 7306/12384 [15:30:07<10:43:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 2: 59%|█████▉ | 7306/12384 [15:30:14<10:43:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 59%|█████▉ | 7307/12384 [15:30:14<10:43:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 59%|█████▉ | 7307/12384 [15:30:22<10:43:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 2: 59%|█████▉ | 7308/12384 [15:30:22<10:44:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.79s]
Epoch 2: 59%|█████▉ | 7308/12384 [15:30:30<10:44:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.50s]
Epoch 2: 59%|█████▉ | 7309/12384 [15:30:30<10:51:44, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.50s]
Epoch 2: 59%|█████▉ | 7309/12384 [15:30:37<10:51:44, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 2: 59%|█████▉ | 7310/12384 [15:30:37<10:49:02, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 2: 59%|█████▉ | 7310/12384 [15:30:45<10:49:02, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 2: 59%|█████▉ | 7311/12384 [15:30:45<10:46:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 2: 59%|█████▉ | 7311/12384 [15:30:53<10:46:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 59%|█████▉ | 7312/12384 [15:30:53<10:45:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 59%|█████▉ | 7312/12384 [15:31:00<10:45:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 59%|█████▉ | 7313/12384 [15:31:00<10:44:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 59%|█████▉ | 7313/12384 [15:31:08<10:44:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 59%|█████▉ | 7314/12384 [15:31:08<10:43:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 59%|█████▉ | 7314/12384 [15:31:15<10:43:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 59%|█████▉ | 7315/12384 [15:31:15<10:43:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 59%|█████▉ | 7315/12384 [15:31:23<10:43:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 59%|█████▉ | 7316/12384 [15:31:23<10:43:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 59%|█████▉ | 7316/12384 [15:31:31<10:43:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 59%|█████▉ | 7317/12384 [15:31:31<10:43:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 59%|█████▉ | 7317/12384 [15:31:38<10:43:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 2: 59%|█████▉ | 7318/12384 [15:31:38<10:42:02, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 2: 59%|█████▉ | 7318/12384 [15:31:46<10:42:02, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 2: 59%|█████▉ | 7319/12384 [15:31:46<10:41:36, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.52s]
Epoch 2: 59%|█████▉ | 7319/12384 [15:31:53<10:41:36, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 59%|█████▉ | 7320/12384 [15:31:53<10:42:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 59%|█████▉ | 7320/12384 [15:32:01<10:42:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.91s]
Epoch 2: 59%|█████▉ | 7321/12384 [15:32:01<10:41:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.91s]
Epoch 2: 59%|█████▉ | 7321/12384 [15:32:09<10:41:38, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 59%|█████▉ | 7322/12384 [15:32:09<10:41:23, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 59%|█████▉ | 7322/12384 [15:32:16<10:41:23, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 59%|█████▉ | 7323/12384 [15:32:16<10:43:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 59%|█████▉ | 7323/12384 [15:32:24<10:43:35, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.68s]
Epoch 2: 59%|█████▉ | 7324/12384 [15:32:24<10:42:49, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.68s]
Epoch 2: 59%|█████▉ | 7324/12384 [15:32:31<10:42:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 59%|█████▉ | 7325/12384 [15:32:31<10:42:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 59%|█████▉ | 7325/12384 [15:32:39<10:42:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 2: 59%|█████▉ | 7326/12384 [15:32:39<10:40:51, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 2: 59%|█████▉ | 7326/12384 [15:32:47<10:40:51, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 2: 59%|█████▉ | 7327/12384 [15:32:47<10:40:32, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 2: 59%|█████▉ | 7327/12384 [15:32:54<10:40:32, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 2: 59%|█████▉ | 7328/12384 [15:32:54<10:40:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.43s]
Epoch 2: 59%|█████▉ | 7328/12384 [15:33:02<10:40:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 59%|█████▉ | 7329/12384 [15:33:02<10:39:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 59%|█████▉ | 7329/12384 [15:33:09<10:39:56, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 2: 59%|█████▉ | 7330/12384 [15:33:09<10:39:37, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 2: 59%|█████▉ | 7330/12384 [15:33:17<10:39:37, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 2: 59%|█████▉ | 7331/12384 [15:33:17<10:39:25, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 2: 59%|█████▉ | 7331/12384 [15:33:25<10:39:25, 7.59s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 59%|█████▉ | 7332/12384 [15:33:25<10:40:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 59%|█████▉ | 7332/12384 [15:33:32<10:40:26, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.20s]
Epoch 2: 59%|█████▉ | 7333/12384 [15:33:32<10:40:21, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.20s]
Epoch 2: 59%|█████▉ | 7333/12384 [15:33:40<10:40:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 59%|█████▉ | 7334/12384 [15:33:40<10:41:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 59%|█████▉ | 7334/12384 [15:33:48<10:41:41, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 2: 59%|█████▉ | 7335/12384 [15:33:48<10:41:25, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 2: 59%|█████▉ | 7335/12384 [15:33:55<10:41:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 2: 59%|█████▉ | 7336/12384 [15:33:55<10:49:14, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 2: 59%|█████▉ | 7336/12384 [15:34:03<10:49:14, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 2: 59%|█████▉ | 7337/12384 [15:34:03<10:53:37, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 2: 59%|█████▉ | 7337/12384 [15:34:11<10:53:37, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 59%|█████▉ | 7338/12384 [15:34:11<10:49:11, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 59%|█████▉ | 7338/12384 [15:34:19<10:49:11, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 59%|█████▉ | 7339/12384 [15:34:19<10:46:12, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 59%|█████▉ | 7339/12384 [15:34:26<10:46:12, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 59%|█████▉ | 7340/12384 [15:34:26<10:44:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 59%|█████▉ | 7340/12384 [15:34:34<10:44:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 59%|█████▉ | 7341/12384 [15:34:34<10:43:42, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 59%|█████▉ | 7341/12384 [15:34:41<10:43:42, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.94s]
Epoch 2: 59%|█████▉ | 7342/12384 [15:34:41<10:42:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.94s]
Epoch 2: 59%|█████▉ | 7342/12384 [15:34:49<10:42:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 2: 59%|█████▉ | 7343/12384 [15:34:49<10:41:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 2: 59%|█████▉ | 7343/12384 [15:34:57<10:41:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.79s]
Epoch 2: 59%|█████▉ | 7344/12384 [15:34:57<10:40:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.79s]
Epoch 2: 59%|█████▉ | 7344/12384 [15:35:04<10:40:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.35s]
Epoch 2: 59%|█████▉ | 7345/12384 [15:35:04<10:39:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.35s]
Epoch 2: 59%|█████▉ | 7345/12384 [15:35:12<10:39:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.26s]
Epoch 2: 59%|█████▉ | 7346/12384 [15:35:12<10:39:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.26s]
Epoch 2: 59%|█████▉ | 7346/12384 [15:35:19<10:39:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 2: 59%|█████▉ | 7347/12384 [15:35:19<10:39:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 2: 59%|█████▉ | 7347/12384 [15:35:27<10:39:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 59%|█████▉ | 7348/12384 [15:35:27<10:38:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 59%|█████▉ | 7348/12384 [15:35:35<10:38:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 2: 59%|█████▉ | 7349/12384 [15:35:35<10:38:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 2: 59%|█████▉ | 7349/12384 [15:35:42<10:38:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.63s]
Epoch 2: 59%|█████▉ | 7350/12384 [15:35:42<10:40:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.63s]
Epoch 2: 59%|█████▉ | 7350/12384 [15:35:50<10:40:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.23s]
Epoch 2: 59%|█████▉ | 7351/12384 [15:35:50<10:39:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.23s]
Epoch 2: 59%|█████▉ | 7351/12384 [15:35:58<10:39:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 59%|█████▉ | 7352/12384 [15:35:58<10:38:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 59%|█████▉ | 7352/12384 [15:36:05<10:38:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 59%|█████▉ | 7353/12384 [15:36:05<10:39:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 59%|█████▉ | 7353/12384 [15:36:13<10:39:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 2: 59%|█████▉ | 7354/12384 [15:36:13<10:39:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 2: 59%|█████▉ | 7354/12384 [15:36:20<10:39:03, 7.62s/it, loss=0.0002, acc=0.9983, iter_time=8.57s]
Epoch 2: 59%|█████▉ | 7355/12384 [15:36:20<10:38:28, 7.62s/it, loss=0.0002, acc=0.9983, iter_time=8.57s]
Epoch 2: 59%|█████▉ | 7355/12384 [15:36:28<10:38:28, 7.62s/it, loss=0.0004, acc=0.9984, iter_time=7.60s]
Epoch 2: 59%|█████▉ | 7356/12384 [15:36:28<10:37:47, 7.61s/it, loss=0.0004, acc=0.9984, iter_time=7.60s]
Epoch 2: 59%|█████▉ | 7356/12384 [15:36:36<10:37:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 2: 59%|█████▉ | 7357/12384 [15:36:36<10:37:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 2: 59%|█████▉ | 7357/12384 [15:36:43<10:37:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 2: 59%|█████▉ | 7358/12384 [15:36:43<10:37:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 2: 59%|█████▉ | 7358/12384 [15:36:51<10:37:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 59%|█████▉ | 7359/12384 [15:36:51<10:38:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 59%|█████▉ | 7359/12384 [15:36:59<10:38:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 59%|█████▉ | 7360/12384 [15:36:59<10:37:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 59%|█████▉ | 7360/12384 [15:37:06<10:37:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 59%|█████▉ | 7361/12384 [15:37:06<10:37:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 59%|█████▉ | 7361/12384 [15:37:14<10:37:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.64s]
Epoch 2: 59%|█████▉ | 7362/12384 [15:37:14<10:45:49, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.64s]
Epoch 2: 59%|█████▉ | 7362/12384 [15:37:22<10:45:49, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 2: 59%|█████▉ | 7363/12384 [15:37:22<10:43:14, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 2: 59%|█████▉ | 7363/12384 [15:37:29<10:43:14, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 59%|█████▉ | 7364/12384 [15:37:29<10:41:29, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 59%|█████▉ | 7364/12384 [15:37:37<10:41:29, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 59%|█████▉ | 7365/12384 [15:37:37<10:39:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 59%|█████▉ | 7365/12384 [15:37:45<10:39:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 59%|█████▉ | 7366/12384 [15:37:45<10:38:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 59%|█████▉ | 7366/12384 [15:37:52<10:38:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 2: 59%|█████▉ | 7367/12384 [15:37:52<10:37:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 2: 59%|█████▉ | 7367/12384 [15:38:00<10:37:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.22s]
Epoch 2: 59%|█████▉ | 7368/12384 [15:38:00<10:37:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.22s]
Epoch 2: 59%|█████▉ | 7368/12384 [15:38:07<10:37:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 60%|█████▉ | 7369/12384 [15:38:07<10:36:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 60%|█████▉ | 7369/12384 [15:38:15<10:36:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 60%|█████▉ | 7370/12384 [15:38:15<10:36:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 60%|█████▉ | 7370/12384 [15:38:23<10:36:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 60%|█████▉ | 7371/12384 [15:38:23<10:35:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 60%|█████▉ | 7371/12384 [15:38:30<10:35:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 60%|█████▉ | 7372/12384 [15:38:30<10:36:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 60%|█████▉ | 7372/12384 [15:38:38<10:36:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 60%|█████▉ | 7373/12384 [15:38:38<10:36:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 60%|█████▉ | 7373/12384 [15:38:45<10:36:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 60%|█████▉ | 7374/12384 [15:38:45<10:35:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 60%|█████▉ | 7374/12384 [15:38:53<10:35:22, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 2: 60%|█████▉ | 7375/12384 [15:38:53<10:35:28, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 2: 60%|█████▉ | 7375/12384 [15:39:01<10:35:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 60%|█████▉ | 7376/12384 [15:39:01<10:35:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 60%|█████▉ | 7376/12384 [15:39:08<10:35:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 60%|█████▉ | 7377/12384 [15:39:08<10:35:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 60%|█████▉ | 7377/12384 [15:39:16<10:35:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 60%|█████▉ | 7378/12384 [15:39:16<10:35:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 60%|█████▉ | 7378/12384 [15:39:23<10:35:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 2: 60%|█████▉ | 7379/12384 [15:39:23<10:34:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 2: 60%|█████▉ | 7379/12384 [15:39:31<10:34:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 2: 60%|█████▉ | 7380/12384 [15:39:31<10:34:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 2: 60%|█████▉ | 7380/12384 [15:39:39<10:34:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 60%|█████▉ | 7381/12384 [15:39:39<10:35:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 60%|█████▉ | 7381/12384 [15:39:46<10:35:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 60%|█████▉ | 7382/12384 [15:39:46<10:34:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 60%|█████▉ | 7382/12384 [15:39:54<10:34:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 60%|█████▉ | 7383/12384 [15:39:54<10:35:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 60%|█████▉ | 7383/12384 [15:40:02<10:35:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 60%|█████▉ | 7384/12384 [15:40:02<10:34:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 60%|█████▉ | 7384/12384 [15:40:09<10:34:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.46s]
Epoch 2: 60%|█████▉ | 7385/12384 [15:40:09<10:36:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.46s]
Epoch 2: 60%|█████▉ | 7385/12384 [15:40:17<10:36:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.87s]
Epoch 2: 60%|█████▉ | 7386/12384 [15:40:17<10:35:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.87s]
Epoch 2: 60%|█████▉ | 7386/12384 [15:40:24<10:35:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 2: 60%|█████▉ | 7387/12384 [15:40:24<10:34:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 2: 60%|█████▉ | 7387/12384 [15:40:32<10:34:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.34s]
Epoch 2: 60%|█████▉ | 7388/12384 [15:40:32<10:34:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.34s]
Epoch 2: 60%|█████▉ | 7388/12384 [15:40:40<10:34:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.51s]
Epoch 2: 60%|█████▉ | 7389/12384 [15:40:40<10:42:06, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.51s]
Epoch 2: 60%|█████▉ | 7389/12384 [15:40:48<10:42:06, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 60%|█████▉ | 7390/12384 [15:40:48<10:39:31, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 60%|█████▉ | 7390/12384 [15:40:55<10:39:31, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 2: 60%|█████▉ | 7391/12384 [15:40:55<10:39:04, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 2: 60%|█████▉ | 7391/12384 [15:41:03<10:39:04, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 2: 60%|█████▉ | 7392/12384 [15:41:03<10:37:28, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 2: 60%|█████▉ | 7392/12384 [15:41:11<10:37:28, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 60%|█████▉ | 7393/12384 [15:41:11<10:36:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 60%|█████▉ | 7393/12384 [15:41:18<10:36:14, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 2: 60%|█████▉ | 7394/12384 [15:41:18<10:35:57, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 2: 60%|█████▉ | 7394/12384 [15:41:26<10:35:57, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.78s]
Epoch 2: 60%|█████▉ | 7395/12384 [15:41:26<10:35:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.78s]
Epoch 2: 60%|█████▉ | 7395/12384 [15:41:33<10:35:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 2: 60%|█████▉ | 7396/12384 [15:41:33<10:34:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 2: 60%|█████▉ | 7396/12384 [15:41:41<10:34:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 2: 60%|█████▉ | 7397/12384 [15:41:41<10:34:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 2: 60%|█████▉ | 7397/12384 [15:41:49<10:34:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 2: 60%|█████▉ | 7398/12384 [15:41:49<10:34:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 2: 60%|█████▉ | 7398/12384 [15:41:56<10:34:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 60%|█████▉ | 7399/12384 [15:41:56<10:34:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 60%|█████▉ | 7399/12384 [15:42:04<10:34:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 60%|█████▉ | 7400/12384 [15:42:04<10:33:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 60%|█████▉ | 7400/12384 [15:42:11<10:33:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 60%|█████▉ | 7401/12384 [15:42:11<10:32:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 60%|█████▉ | 7401/12384 [15:42:19<10:32:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 2: 60%|█████▉ | 7402/12384 [15:42:19<10:31:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 2: 60%|█████▉ | 7402/12384 [15:42:27<10:31:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 2: 60%|█████▉ | 7403/12384 [15:42:27<10:31:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 2: 60%|█████▉ | 7403/12384 [15:42:34<10:31:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.70s]
Epoch 2: 60%|█████▉ | 7404/12384 [15:42:34<10:30:58, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.70s]
Epoch 2: 60%|█████▉ | 7404/12384 [15:42:42<10:30:58, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 60%|█████▉ | 7405/12384 [15:42:42<10:30:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 60%|█████▉ | 7405/12384 [15:42:50<10:30:20, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 60%|█████▉ | 7406/12384 [15:42:50<10:32:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 60%|█████▉ | 7406/12384 [15:42:57<10:32:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 2: 60%|█████▉ | 7407/12384 [15:42:57<10:32:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 2: 60%|█████▉ | 7407/12384 [15:43:05<10:32:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.33s]
Epoch 2: 60%|█████▉ | 7408/12384 [15:43:05<10:31:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.33s]
Epoch 2: 60%|█████▉ | 7408/12384 [15:43:12<10:31:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 60%|█████▉ | 7409/12384 [15:43:12<10:31:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 60%|█████▉ | 7409/12384 [15:43:20<10:31:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 60%|█████▉ | 7410/12384 [15:43:20<10:30:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 60%|█████▉ | 7410/12384 [15:43:28<10:30:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 60%|█████▉ | 7411/12384 [15:43:28<10:30:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 60%|█████▉ | 7411/12384 [15:43:35<10:30:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 2: 60%|█████▉ | 7412/12384 [15:43:35<10:30:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 2: 60%|█████▉ | 7412/12384 [15:43:43<10:30:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 2: 60%|█████▉ | 7413/12384 [15:43:43<10:30:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 2: 60%|█████▉ | 7413/12384 [15:43:50<10:30:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 60%|█████▉ | 7414/12384 [15:43:50<10:30:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 60%|█████▉ | 7414/12384 [15:43:58<10:30:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 60%|█████▉ | 7415/12384 [15:43:58<10:38:58, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 60%|█████▉ | 7415/12384 [15:44:06<10:38:58, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 2: 60%|█████▉ | 7416/12384 [15:44:06<10:36:32, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 2: 60%|█████▉ | 7416/12384 [15:44:14<10:36:32, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 60%|█████▉ | 7417/12384 [15:44:14<10:34:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 60%|█████▉ | 7417/12384 [15:44:21<10:34:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 60%|█████▉ | 7418/12384 [15:44:21<10:32:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 60%|█████▉ | 7418/12384 [15:44:29<10:32:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 60%|█████▉ | 7419/12384 [15:44:29<10:31:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 60%|█████▉ | 7419/12384 [15:44:36<10:31:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 60%|█████▉ | 7420/12384 [15:44:36<10:31:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 60%|█████▉ | 7420/12384 [15:44:44<10:31:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 60%|█████▉ | 7421/12384 [15:44:44<10:30:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 60%|█████▉ | 7421/12384 [15:44:52<10:30:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 60%|█████▉ | 7422/12384 [15:44:52<10:30:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 60%|█████▉ | 7422/12384 [15:44:59<10:30:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 60%|█████▉ | 7423/12384 [15:44:59<10:30:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 60%|█████▉ | 7423/12384 [15:45:07<10:30:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 60%|█████▉ | 7424/12384 [15:45:07<10:29:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 60%|█████▉ | 7424/12384 [15:45:15<10:29:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 60%|█████▉ | 7425/12384 [15:45:15<10:29:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 60%|█████▉ | 7425/12384 [15:45:22<10:29:37, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 2: 60%|█████▉ | 7426/12384 [15:45:22<10:30:37, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 2: 60%|█████▉ | 7426/12384 [15:45:30<10:30:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 60%|█████▉ | 7427/12384 [15:45:30<10:32:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 60%|█████▉ | 7427/12384 [15:45:37<10:32:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 60%|█████▉ | 7428/12384 [15:45:37<10:31:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 60%|█████▉ | 7428/12384 [15:45:45<10:31:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 60%|█████▉ | 7429/12384 [15:45:45<10:31:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 60%|█████▉ | 7429/12384 [15:45:53<10:31:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 2: 60%|█████▉ | 7430/12384 [15:45:53<10:30:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 2: 60%|█████▉ | 7430/12384 [15:46:00<10:30:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 2: 60%|██████ | 7431/12384 [15:46:00<10:29:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 2: 60%|██████ | 7431/12384 [15:46:08<10:29:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 60%|██████ | 7432/12384 [15:46:08<10:29:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 60%|██████ | 7432/12384 [15:46:16<10:29:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 60%|██████ | 7433/12384 [15:46:16<10:29:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 60%|██████ | 7433/12384 [15:46:23<10:29:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 60%|██████ | 7434/12384 [15:46:23<10:28:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 60%|██████ | 7434/12384 [15:46:31<10:28:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 60%|██████ | 7435/12384 [15:46:31<10:28:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 60%|██████ | 7435/12384 [15:46:39<10:28:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.95s]
Epoch 2: 60%|██████ | 7436/12384 [15:46:39<10:30:58, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.95s]
Epoch 2: 60%|██████ | 7436/12384 [15:46:46<10:30:58, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.33s]
Epoch 2: 60%|██████ | 7437/12384 [15:46:46<10:29:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.33s]
Epoch 2: 60%|██████ | 7437/12384 [15:46:54<10:29:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 60%|██████ | 7438/12384 [15:46:54<10:28:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 60%|██████ | 7438/12384 [15:47:01<10:28:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.65s]
Epoch 2: 60%|██████ | 7439/12384 [15:47:01<10:27:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.65s]
Epoch 2: 60%|██████ | 7439/12384 [15:47:09<10:27:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.93s]
Epoch 2: 60%|██████ | 7440/12384 [15:47:09<10:27:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.93s]
Epoch 2: 60%|██████ | 7440/12384 [15:47:17<10:27:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.49s]
Epoch 2: 60%|██████ | 7441/12384 [15:47:17<10:35:31, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.49s]
Epoch 2: 60%|██████ | 7441/12384 [15:47:25<10:35:31, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=6.22s]
Epoch 2: 60%|██████ | 7442/12384 [15:47:25<10:33:10, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=6.22s]
Epoch 2: 60%|██████ | 7442/12384 [15:47:32<10:33:10, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.48s]
Epoch 2: 60%|██████ | 7443/12384 [15:47:32<10:30:50, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.48s]
Epoch 2: 60%|██████ | 7443/12384 [15:47:40<10:30:50, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 2: 60%|██████ | 7444/12384 [15:47:40<10:29:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 2: 60%|██████ | 7444/12384 [15:47:47<10:29:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 2: 60%|██████ | 7445/12384 [15:47:47<10:28:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 2: 60%|██████ | 7445/12384 [15:47:55<10:28:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.19s]
Epoch 2: 60%|██████ | 7446/12384 [15:47:55<10:26:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.19s]
Epoch 2: 60%|██████ | 7446/12384 [15:48:03<10:26:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.59s]
Epoch 2: 60%|██████ | 7447/12384 [15:48:03<10:27:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.59s]
Epoch 2: 60%|██████ | 7447/12384 [15:48:10<10:27:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 60%|██████ | 7448/12384 [15:48:10<10:26:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 60%|██████ | 7448/12384 [15:48:18<10:26:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.86s]
Epoch 2: 60%|██████ | 7449/12384 [15:48:18<10:26:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.86s]
Epoch 2: 60%|██████ | 7449/12384 [15:48:25<10:26:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 2: 60%|██████ | 7450/12384 [15:48:25<10:25:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.94s]
Epoch 2: 60%|██████ | 7450/12384 [15:48:33<10:25:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 60%|██████ | 7451/12384 [15:48:33<10:25:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 60%|██████ | 7451/12384 [15:48:41<10:25:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 60%|██████ | 7452/12384 [15:48:41<10:25:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 60%|██████ | 7452/12384 [15:48:48<10:25:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.01s]
Epoch 2: 60%|██████ | 7453/12384 [15:48:48<10:26:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.01s]
Epoch 2: 60%|██████ | 7453/12384 [15:48:56<10:26:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.21s]
Epoch 2: 60%|██████ | 7454/12384 [15:48:56<10:25:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.21s]
Epoch 2: 60%|██████ | 7454/12384 [15:49:03<10:25:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 2: 60%|██████ | 7455/12384 [15:49:03<10:25:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 2: 60%|██████ | 7455/12384 [15:49:11<10:25:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.87s]
Epoch 2: 60%|██████ | 7456/12384 [15:49:11<10:25:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.87s]
Epoch 2: 60%|██████ | 7456/12384 [15:49:19<10:25:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 60%|██████ | 7457/12384 [15:49:19<10:25:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 60%|██████ | 7457/12384 [15:49:26<10:25:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 60%|██████ | 7458/12384 [15:49:26<10:25:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 60%|██████ | 7458/12384 [15:49:34<10:25:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 2: 60%|██████ | 7459/12384 [15:49:34<10:25:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 2: 60%|██████ | 7459/12384 [15:49:42<10:25:06, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=9.37s]
Epoch 2: 60%|██████ | 7460/12384 [15:49:42<10:24:37, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=9.37s]
Epoch 2: 60%|██████ | 7460/12384 [15:49:49<10:24:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 60%|██████ | 7461/12384 [15:49:49<10:24:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 60%|██████ | 7461/12384 [15:49:57<10:24:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 60%|██████ | 7462/12384 [15:49:57<10:24:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 60%|██████ | 7462/12384 [15:50:04<10:24:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 60%|██████ | 7463/12384 [15:50:04<10:23:42, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 60%|██████ | 7463/12384 [15:50:12<10:23:42, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 60%|██████ | 7464/12384 [15:50:12<10:23:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 60%|██████ | 7464/12384 [15:50:20<10:23:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.78s]
Epoch 2: 60%|██████ | 7465/12384 [15:50:20<10:23:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.78s]
Epoch 2: 60%|██████ | 7465/12384 [15:50:27<10:23:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.87s]
Epoch 2: 60%|██████ | 7466/12384 [15:50:27<10:23:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.87s]
Epoch 2: 60%|██████ | 7466/12384 [15:50:35<10:23:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.72s]
Epoch 2: 60%|██████ | 7467/12384 [15:50:35<10:31:45, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.72s]
Epoch 2: 60%|██████ | 7467/12384 [15:50:43<10:31:45, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 2: 60%|██████ | 7468/12384 [15:50:43<10:29:10, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 2: 60%|██████ | 7468/12384 [15:50:50<10:29:10, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 60%|██████ | 7469/12384 [15:50:50<10:27:38, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 60%|██████ | 7469/12384 [15:50:58<10:27:38, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 60%|██████ | 7470/12384 [15:50:58<10:25:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 60%|██████ | 7470/12384 [15:51:06<10:25:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 60%|██████ | 7471/12384 [15:51:06<10:24:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 60%|██████ | 7471/12384 [15:51:13<10:24:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 60%|██████ | 7472/12384 [15:51:13<10:24:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 60%|██████ | 7472/12384 [15:51:21<10:24:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 60%|██████ | 7473/12384 [15:51:21<10:23:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 60%|██████ | 7473/12384 [15:51:28<10:23:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 60%|██████ | 7474/12384 [15:51:28<10:23:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 60%|██████ | 7474/12384 [15:51:36<10:23:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 60%|██████ | 7475/12384 [15:51:36<10:22:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 60%|██████ | 7475/12384 [15:51:44<10:22:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 60%|██████ | 7476/12384 [15:51:44<10:22:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 60%|██████ | 7476/12384 [15:51:51<10:22:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 2: 60%|██████ | 7477/12384 [15:51:51<10:22:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 2: 60%|██████ | 7477/12384 [15:51:59<10:22:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 60%|██████ | 7478/12384 [15:51:59<10:21:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 60%|██████ | 7478/12384 [15:52:06<10:21:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.26s]
Epoch 2: 60%|██████ | 7479/12384 [15:52:06<10:22:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.26s]
Epoch 2: 60%|██████ | 7479/12384 [15:52:14<10:22:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 2: 60%|██████ | 7480/12384 [15:52:14<10:22:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 2: 60%|██████ | 7480/12384 [15:52:22<10:22:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 2: 60%|██████ | 7481/12384 [15:52:22<10:22:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 2: 60%|██████ | 7481/12384 [15:52:29<10:22:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.66s]
Epoch 2: 60%|██████ | 7482/12384 [15:52:29<10:21:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.66s]
Epoch 2: 60%|██████ | 7482/12384 [15:52:37<10:21:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 60%|██████ | 7483/12384 [15:52:37<10:21:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 60%|██████ | 7483/12384 [15:52:44<10:21:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 60%|██████ | 7484/12384 [15:52:44<10:21:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 60%|██████ | 7484/12384 [15:52:52<10:21:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 60%|██████ | 7485/12384 [15:52:52<10:23:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 60%|██████ | 7485/12384 [15:53:00<10:23:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 2: 60%|██████ | 7486/12384 [15:53:00<10:22:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 2: 60%|██████ | 7486/12384 [15:53:07<10:22:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 2: 60%|██████ | 7487/12384 [15:53:07<10:22:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 2: 60%|██████ | 7487/12384 [15:53:15<10:22:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 60%|██████ | 7488/12384 [15:53:15<10:21:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 60%|██████ | 7488/12384 [15:53:23<10:21:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 2: 60%|██████ | 7489/12384 [15:53:23<10:22:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 2: 60%|██████ | 7489/12384 [15:53:30<10:22:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 2: 60%|██████ | 7490/12384 [15:53:30<10:22:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 2: 60%|██████ | 7490/12384 [15:53:38<10:22:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 60%|██████ | 7491/12384 [15:53:38<10:21:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 60%|██████ | 7491/12384 [15:53:45<10:21:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 60%|██████ | 7492/12384 [15:53:45<10:20:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 60%|██████ | 7492/12384 [15:53:53<10:20:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 2: 61%|██████ | 7493/12384 [15:53:53<10:28:41, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 2: 61%|██████ | 7493/12384 [15:54:01<10:28:41, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=11.32s]
Epoch 2: 61%|██████ | 7494/12384 [15:54:01<10:28:47, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=11.32s]
Epoch 2: 61%|██████ | 7494/12384 [15:54:09<10:28:47, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 61%|██████ | 7495/12384 [15:54:09<10:25:59, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 61%|██████ | 7495/12384 [15:54:16<10:25:59, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 61%|██████ | 7496/12384 [15:54:16<10:23:59, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 61%|██████ | 7496/12384 [15:54:24<10:23:59, 7.66s/it, loss=0.0003, acc=1.0000, iter_time=4.67s]
Epoch 2: 61%|██████ | 7497/12384 [15:54:24<10:22:34, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=4.67s]
Epoch 2: 61%|██████ | 7497/12384 [15:54:32<10:22:34, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.64s]
Epoch 2: 61%|██████ | 7498/12384 [15:54:32<10:20:54, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.64s]
Epoch 2: 61%|██████ | 7498/12384 [15:54:39<10:20:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 2: 61%|██████ | 7499/12384 [15:54:39<10:22:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 2: 61%|██████ | 7499/12384 [15:54:47<10:22:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.13s]
Epoch 2: 61%|██████ | 7500/12384 [15:54:47<10:21:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.13s]
Epoch 2: 61%|██████ | 7500/12384 [15:54:54<10:21:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 2: 61%|██████ | 7501/12384 [15:54:54<10:20:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 2: 61%|██████ | 7501/12384 [15:55:02<10:20:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 61%|██████ | 7502/12384 [15:55:02<10:19:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 61%|██████ | 7502/12384 [15:55:10<10:19:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.49s]
Epoch 2: 61%|██████ | 7503/12384 [15:55:10<10:21:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.49s]
Epoch 2: 61%|██████ | 7503/12384 [15:55:17<10:21:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.75s]
Epoch 2: 61%|██████ | 7504/12384 [15:55:17<10:20:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.75s]
Epoch 2: 61%|██████ | 7504/12384 [15:55:25<10:20:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 2: 61%|██████ | 7505/12384 [15:55:25<10:20:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 2: 61%|██████ | 7505/12384 [15:55:33<10:20:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 2: 61%|██████ | 7506/12384 [15:55:33<10:19:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 2: 61%|██████ | 7506/12384 [15:55:40<10:19:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 61%|██████ | 7507/12384 [15:55:40<10:18:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 61%|██████ | 7507/12384 [15:55:48<10:18:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 61%|██████ | 7508/12384 [15:55:48<10:18:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 61%|██████ | 7508/12384 [15:55:55<10:18:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 61%|██████ | 7509/12384 [15:55:55<10:19:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 61%|██████ | 7509/12384 [15:56:03<10:19:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.28s]
Epoch 2: 61%|██████ | 7510/12384 [15:56:03<10:18:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.28s]
Epoch 2: 61%|██████ | 7510/12384 [15:56:11<10:18:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.92s]
Epoch 2: 61%|██████ | 7511/12384 [15:56:11<10:18:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.92s]
Epoch 2: 61%|██████ | 7511/12384 [15:56:18<10:18:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 61%|██████ | 7512/12384 [15:56:18<10:17:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 61%|██████ | 7512/12384 [15:56:26<10:17:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 2: 61%|██████ | 7513/12384 [15:56:26<10:17:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 2: 61%|██████ | 7513/12384 [15:56:33<10:17:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 61%|██████ | 7514/12384 [15:56:33<10:18:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 61%|██████ | 7514/12384 [15:56:41<10:18:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 2: 61%|██████ | 7515/12384 [15:56:41<10:17:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 2: 61%|██████ | 7515/12384 [15:56:49<10:17:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 2: 61%|██████ | 7516/12384 [15:56:49<10:17:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 2: 61%|██████ | 7516/12384 [15:56:56<10:17:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 2: 61%|██████ | 7517/12384 [15:56:56<10:18:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 2: 61%|██████ | 7517/12384 [15:57:04<10:18:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 61%|██████ | 7518/12384 [15:57:04<10:18:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 61%|██████ | 7518/12384 [15:57:12<10:18:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 61%|██████ | 7519/12384 [15:57:12<10:24:54, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 61%|██████ | 7519/12384 [15:57:20<10:24:54, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 2: 61%|██████ | 7520/12384 [15:57:20<10:30:27, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 2: 61%|██████ | 7520/12384 [15:57:27<10:30:27, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=7.47s]
Epoch 2: 61%|██████ | 7521/12384 [15:57:27<10:25:37, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.47s]
Epoch 2: 61%|██████ | 7521/12384 [15:57:35<10:25:37, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 61%|██████ | 7522/12384 [15:57:35<10:22:38, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 61%|██████ | 7522/12384 [15:57:43<10:22:38, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 2: 61%|██████ | 7523/12384 [15:57:43<10:20:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 2: 61%|██████ | 7523/12384 [15:57:50<10:20:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 2: 61%|██████ | 7524/12384 [15:57:50<10:19:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 2: 61%|██████ | 7524/12384 [15:57:58<10:19:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 2: 61%|██████ | 7525/12384 [15:57:58<10:18:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 2: 61%|██████ | 7525/12384 [15:58:05<10:18:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 61%|██████ | 7526/12384 [15:58:05<10:18:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 61%|██████ | 7526/12384 [15:58:13<10:18:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 61%|██████ | 7527/12384 [15:58:13<10:17:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 61%|██████ | 7527/12384 [15:58:21<10:17:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 61%|██████ | 7528/12384 [15:58:21<10:16:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 61%|██████ | 7528/12384 [15:58:28<10:16:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.67s]
Epoch 2: 61%|██████ | 7529/12384 [15:58:28<10:16:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.67s]
Epoch 2: 61%|██████ | 7529/12384 [15:58:36<10:16:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 61%|██████ | 7530/12384 [15:58:36<10:16:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 61%|██████ | 7530/12384 [15:58:43<10:16:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 2: 61%|██████ | 7531/12384 [15:58:43<10:15:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 2: 61%|██████ | 7531/12384 [15:58:51<10:15:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 61%|██████ | 7532/12384 [15:58:51<10:15:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 61%|██████ | 7532/12384 [15:58:59<10:15:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 61%|██████ | 7533/12384 [15:58:59<10:15:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 61%|██████ | 7533/12384 [15:59:06<10:15:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 2: 61%|██████ | 7534/12384 [15:59:06<10:16:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 2: 61%|██████ | 7534/12384 [15:59:14<10:16:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.46s]
Epoch 2: 61%|██████ | 7535/12384 [15:59:14<10:15:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.46s]
Epoch 2: 61%|██████ | 7535/12384 [15:59:22<10:15:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 61%|██████ | 7536/12384 [15:59:22<10:15:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 61%|██████ | 7536/12384 [15:59:29<10:15:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 61%|██████ | 7537/12384 [15:59:29<10:15:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 61%|██████ | 7537/12384 [15:59:37<10:15:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 61%|██████ | 7538/12384 [15:59:37<10:21:27, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 61%|██████ | 7538/12384 [15:59:46<10:21:27, 7.69s/it, loss=0.0002, acc=1.0000, iter_time=9.21s]
Epoch 2: 61%|██████ | 7539/12384 [15:59:46<10:51:04, 8.06s/it, loss=0.0002, acc=1.0000, iter_time=9.21s]
Epoch 2: 61%|██████ | 7539/12384 [15:59:55<10:51:04, 8.06s/it, loss=0.0003, acc=0.9988, iter_time=7.13s]
Epoch 2: 61%|██████ | 7540/12384 [15:59:55<11:08:45, 8.28s/it, loss=0.0003, acc=0.9988, iter_time=7.13s]
Epoch 2: 61%|██████ | 7540/12384 [16:00:03<11:08:45, 8.28s/it, loss=0.0000, acc=1.0000, iter_time=10.07s]
Epoch 2: 61%|██████ | 7541/12384 [16:00:03<11:11:29, 8.32s/it, loss=0.0000, acc=1.0000, iter_time=10.07s]
Epoch 2: 61%|██████ | 7541/12384 [16:00:12<11:11:29, 8.32s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 2: 61%|██████ | 7542/12384 [16:00:12<11:12:48, 8.34s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 2: 61%|██████ | 7542/12384 [16:00:19<11:12:48, 8.34s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 2: 61%|██████ | 7543/12384 [16:00:19<10:58:43, 8.16s/it, loss=0.0000, acc=1.0000, iter_time=9.17s]
Epoch 2: 61%|██████ | 7543/12384 [16:00:27<10:58:43, 8.16s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 2: 61%|██████ | 7544/12384 [16:00:27<10:46:48, 8.02s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 2: 61%|██████ | 7544/12384 [16:00:35<10:46:48, 8.02s/it, loss=0.0000, acc=1.0000, iter_time=7.12s]
Epoch 2: 61%|██████ | 7545/12384 [16:00:35<10:37:11, 7.90s/it, loss=0.0000, acc=1.0000, iter_time=7.12s]
Epoch 2: 61%|██████ | 7545/12384 [16:00:43<10:37:11, 7.90s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 2: 61%|██████ | 7546/12384 [16:00:43<10:48:02, 8.04s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 2: 61%|██████ | 7546/12384 [16:00:51<10:48:02, 8.04s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 61%|██████ | 7547/12384 [16:00:51<10:39:31, 7.93s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 61%|██████ | 7547/12384 [16:00:58<10:39:31, 7.93s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 61%|██████ | 7548/12384 [16:00:58<10:31:39, 7.84s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 61%|██████ | 7548/12384 [16:01:06<10:31:39, 7.84s/it, loss=0.0000, acc=1.0000, iter_time=3.79s]
Epoch 2: 61%|██████ | 7549/12384 [16:01:06<10:25:45, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=3.79s]
Epoch 2: 61%|██████ | 7549/12384 [16:01:14<10:25:45, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=11.40s]
Epoch 2: 61%|██████ | 7550/12384 [16:01:14<10:22:06, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=11.40s]
Epoch 2: 61%|██████ | 7550/12384 [16:01:21<10:22:06, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 61%|██████ | 7551/12384 [16:01:21<10:20:41, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 61%|██████ | 7551/12384 [16:01:29<10:20:41, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=8.67s]
Epoch 2: 61%|██████ | 7552/12384 [16:01:29<10:18:48, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=8.67s]
Epoch 2: 61%|██████ | 7552/12384 [16:01:36<10:18:48, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 61%|██████ | 7553/12384 [16:01:36<10:17:10, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 61%|██████ | 7553/12384 [16:01:44<10:17:10, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 61%|██████ | 7554/12384 [16:01:44<10:17:07, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 61%|██████ | 7554/12384 [16:01:52<10:17:07, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 61%|██████ | 7555/12384 [16:01:52<10:15:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 61%|██████ | 7555/12384 [16:01:59<10:15:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 2: 61%|██████ | 7556/12384 [16:01:59<10:14:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 2: 61%|██████ | 7556/12384 [16:02:07<10:14:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 2: 61%|██████ | 7557/12384 [16:02:07<10:14:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 2: 61%|██████ | 7557/12384 [16:02:15<10:14:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 61%|██████ | 7558/12384 [16:02:15<10:13:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 61%|██████ | 7558/12384 [16:02:22<10:13:14, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=6.71s]
Epoch 2: 61%|██████ | 7559/12384 [16:02:22<10:13:41, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=6.71s]
Epoch 2: 61%|██████ | 7559/12384 [16:02:30<10:13:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.93s]
Epoch 2: 61%|██████ | 7560/12384 [16:02:30<10:12:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.93s]
Epoch 2: 61%|██████ | 7560/12384 [16:02:37<10:12:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.91s]
Epoch 2: 61%|██████ | 7561/12384 [16:02:37<10:12:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.91s]
Epoch 2: 61%|██████ | 7561/12384 [16:02:45<10:12:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 61%|██████ | 7562/12384 [16:02:45<10:11:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 61%|██████ | 7562/12384 [16:02:53<10:11:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 2: 61%|██████ | 7563/12384 [16:02:53<10:11:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 2: 61%|██████ | 7563/12384 [16:03:00<10:11:03, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 2: 61%|██████ | 7564/12384 [16:03:00<10:11:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 2: 61%|██████ | 7564/12384 [16:03:08<10:11:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 2: 61%|██████ | 7565/12384 [16:03:08<10:11:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 2: 61%|██████ | 7565/12384 [16:03:15<10:11:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 2: 61%|██████ | 7566/12384 [16:03:15<10:10:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 2: 61%|██████ | 7566/12384 [16:03:23<10:10:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 61%|██████ | 7567/12384 [16:03:23<10:11:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 61%|██████ | 7567/12384 [16:03:31<10:11:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 61%|██████ | 7568/12384 [16:03:31<10:11:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 61%|██████ | 7568/12384 [16:03:38<10:11:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.71s]
Epoch 2: 61%|██████ | 7569/12384 [16:03:38<10:11:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.71s]
Epoch 2: 61%|██████ | 7569/12384 [16:03:46<10:11:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 2: 61%|██████ | 7570/12384 [16:03:46<10:11:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 2: 61%|██████ | 7570/12384 [16:03:54<10:11:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.64s]
Epoch 2: 61%|██████ | 7571/12384 [16:03:54<10:11:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.64s]
Epoch 2: 61%|██████ | 7571/12384 [16:04:01<10:11:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.29s]
Epoch 2: 61%|██████ | 7572/12384 [16:04:01<10:12:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.29s]
Epoch 2: 61%|██████ | 7572/12384 [16:04:09<10:12:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 2: 61%|██████ | 7573/12384 [16:04:09<10:20:22, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 2: 61%|██████ | 7573/12384 [16:04:17<10:20:22, 7.74s/it, loss=0.0002, acc=0.9977, iter_time=6.87s]
Epoch 2: 61%|██████ | 7574/12384 [16:04:17<10:16:53, 7.70s/it, loss=0.0002, acc=0.9977, iter_time=6.87s]
Epoch 2: 61%|██████ | 7574/12384 [16:04:24<10:16:53, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 2: 61%|██████ | 7575/12384 [16:04:24<10:14:30, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 2: 61%|██████ | 7575/12384 [16:04:32<10:14:30, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 61%|██████ | 7576/12384 [16:04:32<10:12:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 61%|██████ | 7576/12384 [16:04:40<10:12:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.36s]
Epoch 2: 61%|██████ | 7577/12384 [16:04:40<10:12:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.36s]
Epoch 2: 61%|██████ | 7577/12384 [16:04:47<10:12:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.62s]
Epoch 2: 61%|██████ | 7578/12384 [16:04:47<10:11:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.62s]
Epoch 2: 61%|██████ | 7578/12384 [16:04:55<10:11:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 2: 61%|██████ | 7579/12384 [16:04:55<10:10:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 2: 61%|██████ | 7579/12384 [16:05:03<10:10:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 2: 61%|██████ | 7580/12384 [16:05:03<10:10:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 2: 61%|██████ | 7580/12384 [16:05:10<10:10:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 2: 61%|██████ | 7581/12384 [16:05:10<10:10:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 2: 61%|██████ | 7581/12384 [16:05:18<10:10:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 61%|██████ | 7582/12384 [16:05:18<10:10:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 61%|██████ | 7582/12384 [16:05:25<10:10:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 2: 61%|██████ | 7583/12384 [16:05:25<10:09:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 2: 61%|██████ | 7583/12384 [16:05:33<10:09:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.93s]
Epoch 2: 61%|██████ | 7584/12384 [16:05:33<10:09:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.93s]
Epoch 2: 61%|██████ | 7584/12384 [16:05:41<10:09:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.63s]
Epoch 2: 61%|██████ | 7585/12384 [16:05:41<10:09:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.63s]
Epoch 2: 61%|██████ | 7585/12384 [16:05:48<10:09:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.27s]
Epoch 2: 61%|██████▏ | 7586/12384 [16:05:48<10:08:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.27s]
Epoch 2: 61%|██████▏ | 7586/12384 [16:05:56<10:08:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 2: 61%|██████▏ | 7587/12384 [16:05:56<10:08:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 2: 61%|██████▏ | 7587/12384 [16:06:03<10:08:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 61%|██████▏ | 7588/12384 [16:06:03<10:09:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 61%|██████▏ | 7588/12384 [16:06:11<10:09:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 2: 61%|██████▏ | 7589/12384 [16:06:11<10:09:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 2: 61%|██████▏ | 7589/12384 [16:06:19<10:09:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 2: 61%|██████▏ | 7590/12384 [16:06:19<10:08:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 2: 61%|██████▏ | 7590/12384 [16:06:26<10:08:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 61%|██████▏ | 7591/12384 [16:06:26<10:08:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 61%|██████▏ | 7591/12384 [16:06:34<10:08:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 61%|██████▏ | 7592/12384 [16:06:34<10:08:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 61%|██████▏ | 7592/12384 [16:06:41<10:08:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 2: 61%|██████▏ | 7593/12384 [16:06:42<10:07:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 2: 61%|██████▏ | 7593/12384 [16:06:49<10:07:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 2: 61%|██████▏ | 7594/12384 [16:06:49<10:07:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 2: 61%|██████▏ | 7594/12384 [16:06:57<10:07:31, 7.61s/it, loss=0.0007, acc=0.9981, iter_time=4.82s]
Epoch 2: 61%|██████▏ | 7595/12384 [16:06:57<10:08:24, 7.62s/it, loss=0.0007, acc=0.9981, iter_time=4.82s]
Epoch 2: 61%|██████▏ | 7595/12384 [16:07:04<10:08:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.43s]
Epoch 2: 61%|██████▏ | 7596/12384 [16:07:04<10:08:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.43s]
Epoch 2: 61%|██████▏ | 7596/12384 [16:07:12<10:08:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 61%|██████▏ | 7597/12384 [16:07:12<10:07:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 61%|██████▏ | 7597/12384 [16:07:20<10:07:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 61%|██████▏ | 7598/12384 [16:07:20<10:14:22, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 61%|██████▏ | 7598/12384 [16:07:28<10:14:22, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 61%|██████▏ | 7599/12384 [16:07:28<10:20:18, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 61%|██████▏ | 7599/12384 [16:07:35<10:20:18, 7.78s/it, loss=0.0003, acc=0.9998, iter_time=8.31s]
Epoch 2: 61%|██████▏ | 7600/12384 [16:07:35<10:16:07, 7.73s/it, loss=0.0003, acc=0.9998, iter_time=8.31s]
Epoch 2: 61%|██████▏ | 7600/12384 [16:07:43<10:16:07, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=4.19s]
Epoch 2: 61%|██████▏ | 7601/12384 [16:07:43<10:13:18, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.19s]
Epoch 2: 61%|██████▏ | 7601/12384 [16:07:51<10:13:18, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 2: 61%|██████▏ | 7602/12384 [16:07:51<10:12:27, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 2: 61%|██████▏ | 7602/12384 [16:07:58<10:12:27, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.78s]
Epoch 2: 61%|██████▏ | 7603/12384 [16:07:58<10:10:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.78s]
Epoch 2: 61%|██████▏ | 7603/12384 [16:08:06<10:10:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 2: 61%|██████▏ | 7604/12384 [16:08:06<10:08:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 2: 61%|██████▏ | 7604/12384 [16:08:14<10:08:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 61%|██████▏ | 7605/12384 [16:08:14<10:10:34, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 61%|██████▏ | 7605/12384 [16:08:21<10:10:34, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 2: 61%|██████▏ | 7606/12384 [16:08:21<10:09:01, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 2: 61%|██████▏ | 7606/12384 [16:08:29<10:09:01, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 61%|██████▏ | 7607/12384 [16:08:29<10:07:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 61%|██████▏ | 7607/12384 [16:08:36<10:07:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.45s]
Epoch 2: 61%|██████▏ | 7608/12384 [16:08:36<10:07:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.45s]
Epoch 2: 61%|██████▏ | 7608/12384 [16:08:44<10:07:18, 7.63s/it, loss=0.0001, acc=0.9995, iter_time=4.13s]
Epoch 2: 61%|██████▏ | 7609/12384 [16:08:44<10:06:03, 7.62s/it, loss=0.0001, acc=0.9995, iter_time=4.13s]
Epoch 2: 61%|██████▏ | 7609/12384 [16:08:52<10:06:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 2: 61%|██████▏ | 7610/12384 [16:08:52<10:05:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 2: 61%|██████▏ | 7610/12384 [16:08:59<10:05:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 61%|██████▏ | 7611/12384 [16:08:59<10:05:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 61%|██████▏ | 7611/12384 [16:09:07<10:05:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 61%|██████▏ | 7612/12384 [16:09:07<10:04:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 61%|██████▏ | 7612/12384 [16:09:14<10:04:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 61%|██████▏ | 7613/12384 [16:09:14<10:04:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 61%|██████▏ | 7613/12384 [16:09:22<10:04:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 61%|██████▏ | 7614/12384 [16:09:22<10:04:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 61%|██████▏ | 7614/12384 [16:09:30<10:04:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 2: 61%|██████▏ | 7615/12384 [16:09:30<10:04:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 2: 61%|██████▏ | 7615/12384 [16:09:37<10:04:39, 7.61s/it, loss=0.0001, acc=0.9992, iter_time=8.97s]
Epoch 2: 61%|██████▏ | 7616/12384 [16:09:37<10:04:48, 7.61s/it, loss=0.0001, acc=0.9992, iter_time=8.97s]
Epoch 2: 61%|██████▏ | 7616/12384 [16:09:45<10:04:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 62%|██████▏ | 7617/12384 [16:09:45<10:03:52, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 62%|██████▏ | 7617/12384 [16:09:53<10:03:52, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 62%|██████▏ | 7618/12384 [16:09:53<10:04:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 62%|██████▏ | 7618/12384 [16:10:00<10:04:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.04s]
Epoch 2: 62%|██████▏ | 7619/12384 [16:10:00<10:05:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.04s]
Epoch 2: 62%|██████▏ | 7619/12384 [16:10:08<10:05:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.19s]
Epoch 2: 62%|██████▏ | 7620/12384 [16:10:08<10:04:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.19s]
Epoch 2: 62%|██████▏ | 7620/12384 [16:10:15<10:04:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 62%|██████▏ | 7621/12384 [16:10:15<10:05:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 62%|██████▏ | 7621/12384 [16:10:23<10:05:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 62%|██████▏ | 7622/12384 [16:10:23<10:05:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 62%|██████▏ | 7622/12384 [16:10:31<10:05:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 62%|██████▏ | 7623/12384 [16:10:31<10:04:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 62%|██████▏ | 7623/12384 [16:10:38<10:04:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 62%|██████▏ | 7624/12384 [16:10:38<10:04:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 62%|██████▏ | 7624/12384 [16:10:46<10:04:22, 7.62s/it, loss=0.0002, acc=0.9986, iter_time=7.50s]
Epoch 2: 62%|██████▏ | 7625/12384 [16:10:46<10:13:41, 7.74s/it, loss=0.0002, acc=0.9986, iter_time=7.50s]
Epoch 2: 62%|██████▏ | 7625/12384 [16:10:54<10:13:41, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 2: 62%|██████▏ | 7626/12384 [16:10:54<10:10:49, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 2: 62%|██████▏ | 7626/12384 [16:11:02<10:10:49, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 2: 62%|██████▏ | 7627/12384 [16:11:02<10:09:10, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 2: 62%|██████▏ | 7627/12384 [16:11:09<10:09:10, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 62%|██████▏ | 7628/12384 [16:11:09<10:07:00, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 62%|██████▏ | 7628/12384 [16:11:17<10:07:00, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 62%|██████▏ | 7629/12384 [16:11:17<10:07:47, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 62%|██████▏ | 7629/12384 [16:11:24<10:07:47, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 2: 62%|██████▏ | 7630/12384 [16:11:24<10:06:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 2: 62%|██████▏ | 7630/12384 [16:11:32<10:06:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 62%|██████▏ | 7631/12384 [16:11:32<10:05:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 62%|██████▏ | 7631/12384 [16:11:40<10:05:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 62%|██████▏ | 7632/12384 [16:11:40<10:04:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 62%|██████▏ | 7632/12384 [16:11:47<10:04:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 62%|██████▏ | 7633/12384 [16:11:47<10:03:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 62%|██████▏ | 7633/12384 [16:11:55<10:03:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 62%|██████▏ | 7634/12384 [16:11:55<10:03:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 62%|██████▏ | 7634/12384 [16:12:02<10:03:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 2: 62%|██████▏ | 7635/12384 [16:12:02<10:02:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 2: 62%|██████▏ | 7635/12384 [16:12:10<10:02:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 2: 62%|██████▏ | 7636/12384 [16:12:10<10:02:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 2: 62%|██████▏ | 7636/12384 [16:12:18<10:02:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 62%|██████▏ | 7637/12384 [16:12:18<10:01:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 62%|██████▏ | 7637/12384 [16:12:25<10:01:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.55s]
Epoch 2: 62%|██████▏ | 7638/12384 [16:12:25<10:01:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.55s]
Epoch 2: 62%|██████▏ | 7638/12384 [16:12:33<10:01:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.66s]
Epoch 2: 62%|██████▏ | 7639/12384 [16:12:33<10:04:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.66s]
Epoch 2: 62%|██████▏ | 7639/12384 [16:12:41<10:04:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 2: 62%|██████▏ | 7640/12384 [16:12:41<10:03:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 2: 62%|██████▏ | 7640/12384 [16:12:48<10:03:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 62%|██████▏ | 7641/12384 [16:12:48<10:02:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 62%|██████▏ | 7641/12384 [16:12:56<10:02:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 62%|██████▏ | 7642/12384 [16:12:56<10:02:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 62%|██████▏ | 7642/12384 [16:13:03<10:02:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 62%|██████▏ | 7643/12384 [16:13:03<10:02:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 62%|██████▏ | 7643/12384 [16:13:11<10:02:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 62%|██████▏ | 7644/12384 [16:13:11<10:01:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 62%|██████▏ | 7644/12384 [16:13:19<10:01:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 2: 62%|██████▏ | 7645/12384 [16:13:19<10:01:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 2: 62%|██████▏ | 7645/12384 [16:13:26<10:01:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 2: 62%|██████▏ | 7646/12384 [16:13:26<10:01:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 2: 62%|██████▏ | 7646/12384 [16:13:34<10:01:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 62%|██████▏ | 7647/12384 [16:13:34<10:02:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 62%|██████▏ | 7647/12384 [16:13:42<10:02:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 2: 62%|██████▏ | 7648/12384 [16:13:42<10:02:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 2: 62%|██████▏ | 7648/12384 [16:13:49<10:02:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.58s]
Epoch 2: 62%|██████▏ | 7649/12384 [16:13:49<10:02:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.58s]
Epoch 2: 62%|██████▏ | 7649/12384 [16:13:57<10:02:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 2: 62%|██████▏ | 7650/12384 [16:13:57<10:01:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 2: 62%|██████▏ | 7650/12384 [16:14:05<10:01:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 62%|██████▏ | 7651/12384 [16:14:05<10:08:50, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 62%|██████▏ | 7651/12384 [16:14:12<10:08:50, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 62%|██████▏ | 7652/12384 [16:14:12<10:06:40, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 62%|██████▏ | 7652/12384 [16:14:20<10:06:40, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=4.51s]
Epoch 2: 62%|██████▏ | 7653/12384 [16:14:20<10:04:19, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=4.51s]
Epoch 2: 62%|██████▏ | 7653/12384 [16:14:28<10:04:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 62%|██████▏ | 7654/12384 [16:14:28<10:02:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 62%|██████▏ | 7654/12384 [16:14:35<10:02:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 2: 62%|██████▏ | 7655/12384 [16:14:35<10:02:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 2: 62%|██████▏ | 7655/12384 [16:14:43<10:02:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 62%|██████▏ | 7656/12384 [16:14:43<10:01:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 62%|██████▏ | 7656/12384 [16:14:50<10:01:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 62%|██████▏ | 7657/12384 [16:14:50<10:01:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 62%|██████▏ | 7657/12384 [16:14:58<10:01:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 62%|██████▏ | 7658/12384 [16:14:58<10:00:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 62%|██████▏ | 7658/12384 [16:15:06<10:00:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 62%|██████▏ | 7659/12384 [16:15:06<9:59:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 62%|██████▏ | 7659/12384 [16:15:13<9:59:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.06s]
Epoch 2: 62%|██████▏ | 7660/12384 [16:15:13<10:01:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.06s]
Epoch 2: 62%|██████▏ | 7660/12384 [16:15:21<10:01:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.26s]
Epoch 2: 62%|██████▏ | 7661/12384 [16:15:21<10:00:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.26s]
Epoch 2: 62%|██████▏ | 7661/12384 [16:15:29<10:00:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 62%|██████▏ | 7662/12384 [16:15:29<10:01:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 62%|██████▏ | 7662/12384 [16:15:36<10:01:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 2: 62%|██████▏ | 7663/12384 [16:15:36<10:02:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 2: 62%|██████▏ | 7663/12384 [16:15:44<10:02:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.12s]
Epoch 2: 62%|██████▏ | 7664/12384 [16:15:44<10:03:55, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.12s]
Epoch 2: 62%|██████▏ | 7664/12384 [16:15:52<10:03:55, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 62%|██████▏ | 7665/12384 [16:15:52<10:01:57, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 62%|██████▏ | 7665/12384 [16:15:59<10:01:57, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 62%|██████▏ | 7666/12384 [16:15:59<10:00:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 62%|██████▏ | 7666/12384 [16:16:07<10:00:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.27s]
Epoch 2: 62%|██████▏ | 7667/12384 [16:16:07<9:59:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.27s]
Epoch 2: 62%|██████▏ | 7667/12384 [16:16:14<9:59:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.95s]
Epoch 2: 62%|██████▏ | 7668/12384 [16:16:14<9:59:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.95s]
Epoch 2: 62%|██████▏ | 7668/12384 [16:16:22<9:59:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 62%|██████▏ | 7669/12384 [16:16:22<9:59:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 62%|██████▏ | 7669/12384 [16:16:30<9:59:02, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.31s]
Epoch 2: 62%|██████▏ | 7670/12384 [16:16:30<10:00:43, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=5.31s]
Epoch 2: 62%|██████▏ | 7670/12384 [16:16:37<10:00:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 2: 62%|██████▏ | 7671/12384 [16:16:37<9:59:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 2: 62%|██████▏ | 7671/12384 [16:16:45<9:59:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 2: 62%|██████▏ | 7672/12384 [16:16:45<9:58:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 2: 62%|██████▏ | 7672/12384 [16:16:53<9:58:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 62%|██████▏ | 7673/12384 [16:16:53<9:58:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 62%|██████▏ | 7673/12384 [16:17:00<9:58:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 62%|██████▏ | 7674/12384 [16:17:00<9:58:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 62%|██████▏ | 7674/12384 [16:17:08<9:58:10, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.92s]
Epoch 2: 62%|██████▏ | 7675/12384 [16:17:08<9:57:34, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.92s]
Epoch 2: 62%|██████▏ | 7675/12384 [16:17:15<9:57:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 62%|██████▏ | 7676/12384 [16:17:15<9:56:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 62%|██████▏ | 7676/12384 [16:17:23<9:56:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 62%|██████▏ | 7677/12384 [16:17:23<10:04:33, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 62%|██████▏ | 7677/12384 [16:17:31<10:04:33, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 62%|██████▏ | 7678/12384 [16:17:31<10:02:00, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 62%|██████▏ | 7678/12384 [16:17:39<10:02:00, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 62%|██████▏ | 7679/12384 [16:17:39<10:01:24, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 62%|██████▏ | 7679/12384 [16:17:46<10:01:24, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.35s]
Epoch 2: 62%|██████▏ | 7680/12384 [16:17:46<9:59:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.35s]
Epoch 2: 62%|██████▏ | 7680/12384 [16:17:54<9:59:31, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=3.83s]
Epoch 2: 62%|██████▏ | 7681/12384 [16:17:54<9:57:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.83s]
Epoch 2: 62%|██████▏ | 7681/12384 [16:18:01<9:57:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.35s]
Epoch 2: 62%|██████▏ | 7682/12384 [16:18:01<9:56:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.35s]
Epoch 2: 62%|██████▏ | 7682/12384 [16:18:09<9:56:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 62%|██████▏ | 7683/12384 [16:18:09<9:56:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 62%|██████▏ | 7683/12384 [16:18:17<9:56:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 62%|██████▏ | 7684/12384 [16:18:17<9:56:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 62%|██████▏ | 7684/12384 [16:18:24<9:56:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 62%|██████▏ | 7685/12384 [16:18:24<9:57:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 62%|██████▏ | 7685/12384 [16:18:32<9:57:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 2: 62%|██████▏ | 7686/12384 [16:18:32<9:57:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 2: 62%|██████▏ | 7686/12384 [16:18:40<9:57:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 62%|██████▏ | 7687/12384 [16:18:40<9:56:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 62%|██████▏ | 7687/12384 [16:18:47<9:56:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 62%|██████▏ | 7688/12384 [16:18:47<9:55:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 62%|██████▏ | 7688/12384 [16:18:55<9:55:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 2: 62%|██████▏ | 7689/12384 [16:18:55<9:58:25, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 2: 62%|██████▏ | 7689/12384 [16:19:02<9:58:25, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 62%|██████▏ | 7690/12384 [16:19:02<9:57:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 62%|██████▏ | 7690/12384 [16:19:10<9:57:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 62%|██████▏ | 7691/12384 [16:19:10<9:56:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 62%|██████▏ | 7691/12384 [16:19:18<9:56:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 62%|██████▏ | 7692/12384 [16:19:18<9:56:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 62%|██████▏ | 7692/12384 [16:19:25<9:56:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 62%|██████▏ | 7693/12384 [16:19:25<9:55:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 62%|██████▏ | 7693/12384 [16:19:33<9:55:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 2: 62%|██████▏ | 7694/12384 [16:19:33<9:55:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 2: 62%|██████▏ | 7694/12384 [16:19:40<9:55:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 2: 62%|██████▏ | 7695/12384 [16:19:40<9:54:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 2: 62%|██████▏ | 7695/12384 [16:19:48<9:54:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 62%|██████▏ | 7696/12384 [16:19:48<9:54:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 62%|██████▏ | 7696/12384 [16:19:56<9:54:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 2: 62%|██████▏ | 7697/12384 [16:19:56<9:54:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 2: 62%|██████▏ | 7697/12384 [16:20:03<9:54:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 2: 62%|██████▏ | 7698/12384 [16:20:03<9:55:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.76s]
Epoch 2: 62%|██████▏ | 7698/12384 [16:20:11<9:55:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 62%|██████▏ | 7699/12384 [16:20:11<9:55:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 62%|██████▏ | 7699/12384 [16:20:19<9:55:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 2: 62%|██████▏ | 7700/12384 [16:20:19<9:55:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 2: 62%|██████▏ | 7700/12384 [16:20:26<9:55:09, 7.62s/it, loss=0.0004, acc=1.0000, iter_time=10.74s]
Epoch 2: 62%|██████▏ | 7701/12384 [16:20:26<9:54:28, 7.62s/it, loss=0.0004, acc=1.0000, iter_time=10.74s]
Epoch 2: 62%|██████▏ | 7701/12384 [16:20:34<9:54:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 2: 62%|██████▏ | 7702/12384 [16:20:34<9:54:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 2: 62%|██████▏ | 7702/12384 [16:20:41<9:54:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 2: 62%|██████▏ | 7703/12384 [16:20:41<9:53:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 2: 62%|██████▏ | 7703/12384 [16:20:49<9:53:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.10s]
Epoch 2: 62%|██████▏ | 7704/12384 [16:20:49<10:02:12, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=11.10s]
Epoch 2: 62%|██████▏ | 7704/12384 [16:20:57<10:02:12, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=4.39s]
Epoch 2: 62%|██████▏ | 7705/12384 [16:20:57<9:58:57, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.39s]
Epoch 2: 62%|██████▏ | 7705/12384 [16:21:05<9:58:57, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 2: 62%|██████▏ | 7706/12384 [16:21:05<9:57:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 2: 62%|██████▏ | 7706/12384 [16:21:12<9:57:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 62%|██████▏ | 7707/12384 [16:21:12<9:56:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 62%|██████▏ | 7707/12384 [16:21:20<9:56:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 2: 62%|██████▏ | 7708/12384 [16:21:20<9:55:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 2: 62%|██████▏ | 7708/12384 [16:21:27<9:55:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 62%|██████▏ | 7709/12384 [16:21:28<9:56:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 62%|██████▏ | 7709/12384 [16:21:35<9:56:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.16s]
Epoch 2: 62%|██████▏ | 7710/12384 [16:21:35<9:54:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.16s]
Epoch 2: 62%|██████▏ | 7710/12384 [16:21:43<9:54:53, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=5.26s]
Epoch 2: 62%|██████▏ | 7711/12384 [16:21:43<9:54:12, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.26s]
Epoch 2: 62%|██████▏ | 7711/12384 [16:21:50<9:54:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.35s]
Epoch 2: 62%|██████▏ | 7712/12384 [16:21:50<9:53:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.35s]
Epoch 2: 62%|██████▏ | 7712/12384 [16:21:58<9:53:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.60s]
Epoch 2: 62%|██████▏ | 7713/12384 [16:21:58<9:55:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.60s]
Epoch 2: 62%|██████▏ | 7713/12384 [16:22:06<9:55:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.32s]
Epoch 2: 62%|██████▏ | 7714/12384 [16:22:06<9:54:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.32s]
Epoch 2: 62%|██████▏ | 7714/12384 [16:22:13<9:54:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 62%|██████▏ | 7715/12384 [16:22:13<9:53:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 62%|██████▏ | 7715/12384 [16:22:21<9:53:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 2: 62%|██████▏ | 7716/12384 [16:22:21<9:53:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 2: 62%|██████▏ | 7716/12384 [16:22:29<9:53:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.12s]
Epoch 2: 62%|██████▏ | 7717/12384 [16:22:29<9:53:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.12s]
Epoch 2: 62%|██████▏ | 7717/12384 [16:22:36<9:53:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.73s]
Epoch 2: 62%|██████▏ | 7718/12384 [16:22:36<9:54:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.73s]
Epoch 2: 62%|██████▏ | 7718/12384 [16:22:44<9:54:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 62%|██████▏ | 7719/12384 [16:22:44<9:53:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 62%|██████▏ | 7719/12384 [16:22:51<9:53:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 62%|██████▏ | 7720/12384 [16:22:51<9:52:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 62%|██████▏ | 7720/12384 [16:22:59<9:52:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 62%|██████▏ | 7721/12384 [16:22:59<9:52:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 62%|██████▏ | 7721/12384 [16:23:07<9:52:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 62%|██████▏ | 7722/12384 [16:23:07<9:52:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 62%|██████▏ | 7722/12384 [16:23:14<9:52:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.64s]
Epoch 2: 62%|██████▏ | 7723/12384 [16:23:14<9:51:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.64s]
Epoch 2: 62%|██████▏ | 7723/12384 [16:23:22<9:51:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.14s]
Epoch 2: 62%|██████▏ | 7724/12384 [16:23:22<9:51:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.14s]
Epoch 2: 62%|██████▏ | 7724/12384 [16:23:29<9:51:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 2: 62%|██████▏ | 7725/12384 [16:23:29<9:51:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 2: 62%|██████▏ | 7725/12384 [16:23:37<9:51:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.26s]
Epoch 2: 62%|██████▏ | 7726/12384 [16:23:37<9:52:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.26s]
Epoch 2: 62%|██████▏ | 7726/12384 [16:23:45<9:52:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 2: 62%|██████▏ | 7727/12384 [16:23:45<9:51:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 2: 62%|██████▏ | 7727/12384 [16:23:52<9:51:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 2: 62%|██████▏ | 7728/12384 [16:23:52<9:51:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 2: 62%|██████▏ | 7728/12384 [16:24:00<9:51:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.89s]
Epoch 2: 62%|██████▏ | 7729/12384 [16:24:00<9:50:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.89s]
Epoch 2: 62%|██████▏ | 7729/12384 [16:24:08<9:50:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 62%|██████▏ | 7730/12384 [16:24:08<9:58:25, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 62%|██████▏ | 7730/12384 [16:24:16<9:58:25, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 62%|██████▏ | 7731/12384 [16:24:16<9:55:57, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 62%|██████▏ | 7731/12384 [16:24:23<9:55:57, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 62%|██████▏ | 7732/12384 [16:24:23<9:58:46, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 62%|██████▏ | 7732/12384 [16:24:31<9:58:46, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 2: 62%|██████▏ | 7733/12384 [16:24:31<9:56:16, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 2: 62%|██████▏ | 7733/12384 [16:24:39<9:56:16, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 2: 62%|██████▏ | 7734/12384 [16:24:39<9:54:07, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 2: 62%|██████▏ | 7734/12384 [16:24:46<9:54:07, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 2: 62%|██████▏ | 7735/12384 [16:24:46<9:52:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 2: 62%|██████▏ | 7735/12384 [16:24:54<9:52:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.54s]
Epoch 2: 62%|██████▏ | 7736/12384 [16:24:54<9:51:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.54s]
Epoch 2: 62%|██████▏ | 7736/12384 [16:25:01<9:51:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 2: 62%|██████▏ | 7737/12384 [16:25:01<9:51:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 2: 62%|██████▏ | 7737/12384 [16:25:09<9:51:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.99s]
Epoch 2: 62%|██████▏ | 7738/12384 [16:25:09<9:51:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.99s]
Epoch 2: 62%|██████▏ | 7738/12384 [16:25:17<9:51:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.42s]
Epoch 2: 62%|██████▏ | 7739/12384 [16:25:17<9:50:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.42s]
Epoch 2: 62%|██████▏ | 7739/12384 [16:25:24<9:50:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 2: 62%|██████▎ | 7740/12384 [16:25:24<9:49:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 2: 62%|██████▎ | 7740/12384 [16:25:32<9:49:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 2: 63%|██████▎ | 7741/12384 [16:25:32<9:50:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 2: 63%|██████▎ | 7741/12384 [16:25:40<9:50:50, 7.64s/it, loss=0.0004, acc=0.9979, iter_time=7.68s]
Epoch 2: 63%|██████▎ | 7742/12384 [16:25:40<9:50:12, 7.63s/it, loss=0.0004, acc=0.9979, iter_time=7.68s]
Epoch 2: 63%|██████▎ | 7742/12384 [16:25:47<9:50:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 2: 63%|██████▎ | 7743/12384 [16:25:47<9:49:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 2: 63%|██████▎ | 7743/12384 [16:25:55<9:49:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.47s]
Epoch 2: 63%|██████▎ | 7744/12384 [16:25:55<9:49:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.47s]
Epoch 2: 63%|██████▎ | 7744/12384 [16:26:02<9:49:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 63%|██████▎ | 7745/12384 [16:26:02<9:48:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 63%|██████▎ | 7745/12384 [16:26:10<9:48:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.24s]
Epoch 2: 63%|██████▎ | 7746/12384 [16:26:10<9:48:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.24s]
Epoch 2: 63%|██████▎ | 7746/12384 [16:26:18<9:48:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.98s]
Epoch 2: 63%|██████▎ | 7747/12384 [16:26:18<9:48:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.98s]
Epoch 2: 63%|██████▎ | 7747/12384 [16:26:25<9:48:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 63%|██████▎ | 7748/12384 [16:26:25<9:48:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 63%|██████▎ | 7748/12384 [16:26:33<9:48:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 63%|██████▎ | 7749/12384 [16:26:33<9:48:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 63%|██████▎ | 7749/12384 [16:26:40<9:48:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 63%|██████▎ | 7750/12384 [16:26:40<9:48:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 63%|██████▎ | 7750/12384 [16:26:48<9:48:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 63%|██████▎ | 7751/12384 [16:26:48<9:48:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 63%|██████▎ | 7751/12384 [16:26:56<9:48:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 63%|██████▎ | 7752/12384 [16:26:56<9:48:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 63%|██████▎ | 7752/12384 [16:27:03<9:48:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 63%|██████▎ | 7753/12384 [16:27:03<9:49:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 63%|██████▎ | 7753/12384 [16:27:11<9:49:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 63%|██████▎ | 7754/12384 [16:27:11<9:49:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 63%|██████▎ | 7754/12384 [16:27:19<9:49:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 2: 63%|██████▎ | 7755/12384 [16:27:19<9:49:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 2: 63%|██████▎ | 7755/12384 [16:27:26<9:49:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.98s]
Epoch 2: 63%|██████▎ | 7756/12384 [16:27:26<9:49:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.98s]
Epoch 2: 63%|██████▎ | 7756/12384 [16:27:34<9:49:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 2: 63%|██████▎ | 7757/12384 [16:27:34<9:56:31, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 2: 63%|██████▎ | 7757/12384 [16:27:42<9:56:31, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 63%|██████▎ | 7758/12384 [16:27:42<9:53:42, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 63%|██████▎ | 7758/12384 [16:27:50<9:53:42, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 2: 63%|██████▎ | 7759/12384 [16:27:50<9:52:23, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 2: 63%|██████▎ | 7759/12384 [16:27:57<9:52:23, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.51s]
Epoch 2: 63%|██████▎ | 7760/12384 [16:27:57<9:51:32, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.51s]
Epoch 2: 63%|██████▎ | 7760/12384 [16:28:05<9:51:32, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.78s]
Epoch 2: 63%|██████▎ | 7761/12384 [16:28:05<9:50:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.78s]
Epoch 2: 63%|██████▎ | 7761/12384 [16:28:12<9:50:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 2: 63%|██████▎ | 7762/12384 [16:28:12<9:49:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 2: 63%|██████▎ | 7762/12384 [16:28:20<9:49:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 63%|██████▎ | 7763/12384 [16:28:20<9:48:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 63%|██████▎ | 7763/12384 [16:28:28<9:48:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 63%|██████▎ | 7764/12384 [16:28:28<9:47:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 63%|██████▎ | 7764/12384 [16:28:35<9:47:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 63%|██████▎ | 7765/12384 [16:28:35<9:46:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 63%|██████▎ | 7765/12384 [16:28:43<9:46:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 2: 63%|██████▎ | 7766/12384 [16:28:43<9:46:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 2: 63%|██████▎ | 7766/12384 [16:28:51<9:46:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 2: 63%|██████▎ | 7767/12384 [16:28:51<9:46:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 2: 63%|██████▎ | 7767/12384 [16:28:58<9:46:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 63%|██████▎ | 7768/12384 [16:28:58<9:46:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 63%|██████▎ | 7768/12384 [16:29:06<9:46:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 63%|██████▎ | 7769/12384 [16:29:06<9:47:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 63%|██████▎ | 7769/12384 [16:29:13<9:47:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 2: 63%|██████▎ | 7770/12384 [16:29:13<9:47:57, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 2: 63%|██████▎ | 7770/12384 [16:29:21<9:47:57, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 2: 63%|██████▎ | 7771/12384 [16:29:21<9:47:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 2: 63%|██████▎ | 7771/12384 [16:29:29<9:47:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 2: 63%|██████▎ | 7772/12384 [16:29:29<9:47:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 2: 63%|██████▎ | 7772/12384 [16:29:36<9:47:04, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 2: 63%|██████▎ | 7773/12384 [16:29:36<9:46:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.46s]
Epoch 2: 63%|██████▎ | 7773/12384 [16:29:44<9:46:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 63%|██████▎ | 7774/12384 [16:29:44<9:45:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 63%|██████▎ | 7774/12384 [16:29:52<9:45:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 2: 63%|██████▎ | 7775/12384 [16:29:52<9:45:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 2: 63%|██████▎ | 7775/12384 [16:29:59<9:45:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.28s]
Epoch 2: 63%|██████▎ | 7776/12384 [16:29:59<9:45:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.28s]
Epoch 2: 63%|██████▎ | 7776/12384 [16:30:07<9:45:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 63%|██████▎ | 7777/12384 [16:30:07<9:45:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 63%|██████▎ | 7777/12384 [16:30:14<9:45:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 2: 63%|██████▎ | 7778/12384 [16:30:14<9:45:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 2: 63%|██████▎ | 7778/12384 [16:30:22<9:45:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 2: 63%|██████▎ | 7779/12384 [16:30:22<9:44:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 2: 63%|██████▎ | 7779/12384 [16:30:30<9:44:40, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.53s]
Epoch 2: 63%|██████▎ | 7780/12384 [16:30:30<9:44:03, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=6.53s]
Epoch 2: 63%|██████▎ | 7780/12384 [16:30:38<9:44:03, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=10.42s]
Epoch 2: 63%|██████▎ | 7781/12384 [16:30:38<9:50:22, 7.70s/it, loss=0.0002, acc=1.0000, iter_time=10.42s]
Epoch 2: 63%|██████▎ | 7781/12384 [16:30:45<9:50:22, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 63%|██████▎ | 7782/12384 [16:30:45<9:48:53, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 63%|██████▎ | 7782/12384 [16:30:53<9:48:53, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 63%|██████▎ | 7783/12384 [16:30:53<9:54:54, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 63%|██████▎ | 7783/12384 [16:31:01<9:54:54, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=8.38s]
Epoch 2: 63%|██████▎ | 7784/12384 [16:31:01<9:53:15, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.38s]
Epoch 2: 63%|██████▎ | 7784/12384 [16:31:08<9:53:15, 7.74s/it, loss=0.0012, acc=0.9998, iter_time=6.97s]
Epoch 2: 63%|██████▎ | 7785/12384 [16:31:08<9:50:36, 7.71s/it, loss=0.0012, acc=0.9998, iter_time=6.97s]
Epoch 2: 63%|██████▎ | 7785/12384 [16:31:16<9:50:36, 7.71s/it, loss=0.0006, acc=0.9979, iter_time=7.57s]
Epoch 2: 63%|██████▎ | 7786/12384 [16:31:16<9:47:57, 7.67s/it, loss=0.0006, acc=0.9979, iter_time=7.57s]
Epoch 2: 63%|██████▎ | 7786/12384 [16:31:24<9:47:57, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 63%|██████▎ | 7787/12384 [16:31:24<9:46:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 63%|██████▎ | 7787/12384 [16:31:31<9:46:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.25s]
Epoch 2: 63%|██████▎ | 7788/12384 [16:31:31<9:44:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.25s]
Epoch 2: 63%|██████▎ | 7788/12384 [16:31:39<9:44:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.95s]
Epoch 2: 63%|██████▎ | 7789/12384 [16:31:39<9:43:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.95s]
Epoch 2: 63%|██████▎ | 7789/12384 [16:31:46<9:43:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 63%|██████▎ | 7790/12384 [16:31:46<9:43:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 63%|██████▎ | 7790/12384 [16:31:54<9:43:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.19s]
Epoch 2: 63%|██████▎ | 7791/12384 [16:31:54<9:43:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.19s]
Epoch 2: 63%|██████▎ | 7791/12384 [16:32:02<9:43:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 2: 63%|██████▎ | 7792/12384 [16:32:02<9:43:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 2: 63%|██████▎ | 7792/12384 [16:32:09<9:43:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 2: 63%|██████▎ | 7793/12384 [16:32:09<9:42:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 2: 63%|██████▎ | 7793/12384 [16:32:17<9:42:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.42s]
Epoch 2: 63%|██████▎ | 7794/12384 [16:32:17<9:42:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.42s]
Epoch 2: 63%|██████▎ | 7794/12384 [16:32:25<9:42:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 2: 63%|██████▎ | 7795/12384 [16:32:25<9:42:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 2: 63%|██████▎ | 7795/12384 [16:32:32<9:42:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 63%|██████▎ | 7796/12384 [16:32:32<9:42:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 63%|██████▎ | 7796/12384 [16:32:40<9:42:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 2: 63%|██████▎ | 7797/12384 [16:32:40<9:42:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 2: 63%|██████▎ | 7797/12384 [16:32:47<9:42:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 63%|██████▎ | 7798/12384 [16:32:47<9:42:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 63%|██████▎ | 7798/12384 [16:32:55<9:42:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 2: 63%|██████▎ | 7799/12384 [16:32:55<9:42:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 2: 63%|██████▎ | 7799/12384 [16:33:03<9:42:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 2: 63%|██████▎ | 7800/12384 [16:33:03<9:41:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 2: 63%|██████▎ | 7800/12384 [16:33:10<9:41:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 63%|██████▎ | 7801/12384 [16:33:10<9:44:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 63%|██████▎ | 7801/12384 [16:33:18<9:44:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 63%|██████▎ | 7802/12384 [16:33:18<9:43:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 63%|██████▎ | 7802/12384 [16:33:26<9:43:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 2: 63%|██████▎ | 7803/12384 [16:33:26<9:42:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 2: 63%|██████▎ | 7803/12384 [16:33:33<9:42:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 2: 63%|██████▎ | 7804/12384 [16:33:33<9:41:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 2: 63%|██████▎ | 7804/12384 [16:33:41<9:41:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 63%|██████▎ | 7805/12384 [16:33:41<9:41:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 63%|██████▎ | 7805/12384 [16:33:48<9:41:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 63%|██████▎ | 7806/12384 [16:33:48<9:41:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 63%|██████▎ | 7806/12384 [16:33:56<9:41:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 63%|██████▎ | 7807/12384 [16:33:56<9:47:10, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 63%|██████▎ | 7807/12384 [16:34:04<9:47:10, 7.70s/it, loss=0.0001, acc=0.9998, iter_time=7.53s]
Epoch 2: 63%|██████▎ | 7808/12384 [16:34:04<9:44:30, 7.66s/it, loss=0.0001, acc=0.9998, iter_time=7.53s]
Epoch 2: 63%|██████▎ | 7808/12384 [16:34:12<9:44:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 2: 63%|██████▎ | 7809/12384 [16:34:12<9:51:18, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 2: 63%|██████▎ | 7809/12384 [16:34:19<9:51:18, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 2: 63%|██████▎ | 7810/12384 [16:34:19<9:47:19, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 2: 63%|██████▎ | 7810/12384 [16:34:27<9:47:19, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.20s]
Epoch 2: 63%|██████▎ | 7811/12384 [16:34:27<9:44:33, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.20s]
Epoch 2: 63%|██████▎ | 7811/12384 [16:34:35<9:44:33, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.34s]
Epoch 2: 63%|██████▎ | 7812/12384 [16:34:35<9:42:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.34s]
Epoch 2: 63%|██████▎ | 7812/12384 [16:34:42<9:42:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 2: 63%|██████▎ | 7813/12384 [16:34:42<9:41:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 2: 63%|██████▎ | 7813/12384 [16:34:50<9:41:45, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=4.25s]
Epoch 2: 63%|██████▎ | 7814/12384 [16:34:50<9:40:48, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=4.25s]
Epoch 2: 63%|██████▎ | 7814/12384 [16:34:57<9:40:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.57s]
Epoch 2: 63%|██████▎ | 7815/12384 [16:34:57<9:40:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.57s]
Epoch 2: 63%|██████▎ | 7815/12384 [16:35:05<9:40:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 63%|██████▎ | 7816/12384 [16:35:05<9:42:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 63%|██████▎ | 7816/12384 [16:35:13<9:42:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.90s]
Epoch 2: 63%|██████▎ | 7817/12384 [16:35:13<9:42:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.90s]
Epoch 2: 63%|██████▎ | 7817/12384 [16:35:21<9:42:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 2: 63%|██████▎ | 7818/12384 [16:35:21<9:43:45, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 2: 63%|██████▎ | 7818/12384 [16:35:28<9:43:45, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.67s]
Epoch 2: 63%|██████▎ | 7819/12384 [16:35:28<9:44:16, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.67s]
Epoch 2: 63%|██████▎ | 7819/12384 [16:35:36<9:44:16, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.62s]
Epoch 2: 63%|██████▎ | 7820/12384 [16:35:36<9:44:55, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.62s]
Epoch 2: 63%|██████▎ | 7820/12384 [16:35:44<9:44:55, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 2: 63%|██████▎ | 7821/12384 [16:35:44<9:44:59, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 2: 63%|██████▎ | 7821/12384 [16:35:51<9:44:59, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.83s]
Epoch 2: 63%|██████▎ | 7822/12384 [16:35:51<9:44:45, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.83s]
Epoch 2: 63%|██████▎ | 7822/12384 [16:35:59<9:44:45, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 63%|██████▎ | 7823/12384 [16:35:59<9:44:39, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 63%|██████▎ | 7823/12384 [16:36:07<9:44:39, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 2: 63%|██████▎ | 7824/12384 [16:36:07<9:45:06, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 2: 63%|██████▎ | 7824/12384 [16:36:14<9:45:06, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 2: 63%|██████▎ | 7825/12384 [16:36:14<9:44:23, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 2: 63%|██████▎ | 7825/12384 [16:36:22<9:44:23, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 63%|██████▎ | 7826/12384 [16:36:22<9:44:10, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 63%|██████▎ | 7826/12384 [16:36:30<9:44:10, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 63%|██████▎ | 7827/12384 [16:36:30<9:43:49, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 63%|██████▎ | 7827/12384 [16:36:37<9:43:49, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 2: 63%|██████▎ | 7828/12384 [16:36:37<9:44:11, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 2: 63%|██████▎ | 7828/12384 [16:36:45<9:44:11, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 63%|██████▎ | 7829/12384 [16:36:45<9:44:46, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 63%|██████▎ | 7829/12384 [16:36:53<9:44:46, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 63%|██████▎ | 7830/12384 [16:36:53<9:44:38, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 63%|██████▎ | 7830/12384 [16:37:01<9:44:38, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.55s]
Epoch 2: 63%|██████▎ | 7831/12384 [16:37:01<9:44:23, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.55s]
Epoch 2: 63%|██████▎ | 7831/12384 [16:37:08<9:44:23, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.25s]
Epoch 2: 63%|██████▎ | 7832/12384 [16:37:08<9:44:17, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.25s]
Epoch 2: 63%|██████▎ | 7832/12384 [16:37:16<9:44:17, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 63%|██████▎ | 7833/12384 [16:37:16<9:44:03, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 63%|██████▎ | 7833/12384 [16:37:24<9:44:03, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.64s]
Epoch 2: 63%|██████▎ | 7834/12384 [16:37:24<9:44:24, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.64s]
Epoch 2: 63%|██████▎ | 7834/12384 [16:37:32<9:44:24, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.83s]
Epoch 2: 63%|██████▎ | 7835/12384 [16:37:32<9:53:02, 7.82s/it, loss=0.0000, acc=1.0000, iter_time=10.83s]
Epoch 2: 63%|██████▎ | 7835/12384 [16:37:40<9:53:02, 7.82s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 63%|██████▎ | 7836/12384 [16:37:40<9:50:20, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 63%|██████▎ | 7836/12384 [16:37:47<9:50:20, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 63%|██████▎ | 7837/12384 [16:37:47<9:47:53, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 63%|██████▎ | 7837/12384 [16:37:55<9:47:53, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=4.78s]
Epoch 2: 63%|██████▎ | 7838/12384 [16:37:55<9:46:48, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=4.78s]
Epoch 2: 63%|██████▎ | 7838/12384 [16:38:03<9:46:48, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 2: 63%|██████▎ | 7839/12384 [16:38:03<9:45:35, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=10.63s]
Epoch 2: 63%|██████▎ | 7839/12384 [16:38:10<9:45:35, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 2: 63%|██████▎ | 7840/12384 [16:38:10<9:44:23, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 2: 63%|██████▎ | 7840/12384 [16:38:18<9:44:23, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 63%|██████▎ | 7841/12384 [16:38:18<9:44:30, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 63%|██████▎ | 7841/12384 [16:38:26<9:44:30, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.22s]
Epoch 2: 63%|██████▎ | 7842/12384 [16:38:26<9:43:46, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.22s]
Epoch 2: 63%|██████▎ | 7842/12384 [16:38:33<9:43:46, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 2: 63%|██████▎ | 7843/12384 [16:38:33<9:43:21, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 2: 63%|██████▎ | 7843/12384 [16:38:41<9:43:21, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.20s]
Epoch 2: 63%|██████▎ | 7844/12384 [16:38:41<9:43:13, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.20s]
Epoch 2: 63%|██████▎ | 7844/12384 [16:38:49<9:43:13, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 2: 63%|██████▎ | 7845/12384 [16:38:49<9:42:32, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 2: 63%|██████▎ | 7845/12384 [16:38:56<9:42:32, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 63%|██████▎ | 7846/12384 [16:38:56<9:41:35, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 63%|██████▎ | 7846/12384 [16:39:04<9:41:35, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 63%|██████▎ | 7847/12384 [16:39:04<9:42:35, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 63%|██████▎ | 7847/12384 [16:39:12<9:42:35, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=8.10s]
Epoch 2: 63%|██████▎ | 7848/12384 [16:39:12<9:42:13, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=8.10s]
Epoch 2: 63%|██████▎ | 7848/12384 [16:39:20<9:42:13, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.95s]
Epoch 2: 63%|██████▎ | 7849/12384 [16:39:20<9:40:56, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.95s]
Epoch 2: 63%|██████▎ | 7849/12384 [16:39:27<9:40:56, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 63%|██████▎ | 7850/12384 [16:39:27<9:38:50, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 63%|██████▎ | 7850/12384 [16:39:35<9:38:50, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 2: 63%|██████▎ | 7851/12384 [16:39:35<9:38:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 2: 63%|██████▎ | 7851/12384 [16:39:42<9:38:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 2: 63%|██████▎ | 7852/12384 [16:39:42<9:36:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 2: 63%|██████▎ | 7852/12384 [16:39:50<9:36:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 2: 63%|██████▎ | 7853/12384 [16:39:50<9:36:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.06s]
Epoch 2: 63%|██████▎ | 7853/12384 [16:39:58<9:36:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 2: 63%|██████▎ | 7854/12384 [16:39:58<9:35:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 2: 63%|██████▎ | 7854/12384 [16:40:05<9:35:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 63%|██████▎ | 7855/12384 [16:40:05<9:35:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 63%|██████▎ | 7855/12384 [16:40:13<9:35:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 63%|██████▎ | 7856/12384 [16:40:13<9:35:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 63%|██████▎ | 7856/12384 [16:40:20<9:35:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.92s]
Epoch 2: 63%|██████▎ | 7857/12384 [16:40:20<9:34:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.92s]
Epoch 2: 63%|██████▎ | 7857/12384 [16:40:28<9:34:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 2: 63%|██████▎ | 7858/12384 [16:40:28<9:33:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 2: 63%|██████▎ | 7858/12384 [16:40:36<9:33:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 2: 63%|██████▎ | 7859/12384 [16:40:36<9:33:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 2: 63%|██████▎ | 7859/12384 [16:40:44<9:33:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 2: 63%|██████▎ | 7860/12384 [16:40:44<9:39:47, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 2: 63%|██████▎ | 7860/12384 [16:40:52<9:39:47, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 63%|██████▎ | 7861/12384 [16:40:52<9:46:17, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 63%|██████▎ | 7861/12384 [16:40:59<9:46:17, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 2: 63%|██████▎ | 7862/12384 [16:40:59<9:41:48, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 2: 63%|██████▎ | 7862/12384 [16:41:07<9:41:48, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 2: 63%|██████▎ | 7863/12384 [16:41:07<9:39:16, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 2: 63%|██████▎ | 7863/12384 [16:41:14<9:39:16, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.55s]
Epoch 2: 64%|██████▎ | 7864/12384 [16:41:14<9:39:36, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.55s]
Epoch 2: 64%|██████▎ | 7864/12384 [16:41:22<9:39:36, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 2: 64%|██████▎ | 7865/12384 [16:41:22<9:39:21, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 2: 64%|██████▎ | 7865/12384 [16:41:30<9:39:21, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 64%|██████▎ | 7866/12384 [16:41:30<9:39:04, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 64%|██████▎ | 7866/12384 [16:41:37<9:39:04, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 64%|██████▎ | 7867/12384 [16:41:37<9:37:30, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 64%|██████▎ | 7867/12384 [16:41:45<9:37:30, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 64%|██████▎ | 7868/12384 [16:41:45<9:35:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 64%|██████▎ | 7868/12384 [16:41:53<9:35:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 64%|██████▎ | 7869/12384 [16:41:53<9:34:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 64%|██████▎ | 7869/12384 [16:42:00<9:34:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.06s]
Epoch 2: 64%|██████▎ | 7870/12384 [16:42:00<9:34:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.06s]
Epoch 2: 64%|██████▎ | 7870/12384 [16:42:08<9:34:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.15s]
Epoch 2: 64%|██████▎ | 7871/12384 [16:42:08<9:33:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.15s]
Epoch 2: 64%|██████▎ | 7871/12384 [16:42:16<9:33:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 64%|██████▎ | 7872/12384 [16:42:16<9:34:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 64%|██████▎ | 7872/12384 [16:42:23<9:34:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 64%|██████▎ | 7873/12384 [16:42:23<9:33:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 64%|██████▎ | 7873/12384 [16:42:31<9:33:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 64%|██████▎ | 7874/12384 [16:42:31<9:32:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 64%|██████▎ | 7874/12384 [16:42:38<9:32:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 2: 64%|██████▎ | 7875/12384 [16:42:38<9:32:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 2: 64%|██████▎ | 7875/12384 [16:42:46<9:32:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 2: 64%|██████▎ | 7876/12384 [16:42:46<9:32:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 2: 64%|██████▎ | 7876/12384 [16:42:54<9:32:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 64%|██████▎ | 7877/12384 [16:42:54<9:31:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 64%|██████▎ | 7877/12384 [16:43:01<9:31:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 64%|██████▎ | 7878/12384 [16:43:01<9:31:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 64%|██████▎ | 7878/12384 [16:43:09<9:31:49, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 2: 64%|██████▎ | 7879/12384 [16:43:09<9:31:54, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 2: 64%|██████▎ | 7879/12384 [16:43:16<9:31:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 64%|██████▎ | 7880/12384 [16:43:16<9:32:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 64%|██████▎ | 7880/12384 [16:43:24<9:32:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 2: 64%|██████▎ | 7881/12384 [16:43:24<9:32:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 2: 64%|██████▎ | 7881/12384 [16:43:32<9:32:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.16s]
Epoch 2: 64%|██████▎ | 7882/12384 [16:43:32<9:32:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.16s]
Epoch 2: 64%|██████▎ | 7882/12384 [16:43:39<9:32:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 64%|██████▎ | 7883/12384 [16:43:39<9:33:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 64%|██████▎ | 7883/12384 [16:43:47<9:33:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 64%|██████▎ | 7884/12384 [16:43:47<9:32:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 64%|██████▎ | 7884/12384 [16:43:55<9:32:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 64%|██████▎ | 7885/12384 [16:43:55<9:31:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 64%|██████▎ | 7885/12384 [16:44:03<9:31:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 64%|██████▎ | 7886/12384 [16:44:03<9:38:07, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 64%|██████▎ | 7886/12384 [16:44:10<9:38:07, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 64%|██████▎ | 7887/12384 [16:44:10<9:36:09, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 64%|██████▎ | 7887/12384 [16:44:18<9:36:09, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 2: 64%|██████▎ | 7888/12384 [16:44:18<9:42:23, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 2: 64%|██████▎ | 7888/12384 [16:44:26<9:42:23, 7.77s/it, loss=0.0003, acc=0.9979, iter_time=5.43s]
Epoch 2: 64%|██████▎ | 7889/12384 [16:44:26<9:38:31, 7.72s/it, loss=0.0003, acc=0.9979, iter_time=5.43s]
Epoch 2: 64%|██████▎ | 7889/12384 [16:44:33<9:38:31, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 2: 64%|██████▎ | 7890/12384 [16:44:33<9:35:29, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 2: 64%|██████▎ | 7890/12384 [16:44:41<9:35:29, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=7.35s]
Epoch 2: 64%|██████▎ | 7891/12384 [16:44:41<9:33:24, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.35s]
Epoch 2: 64%|██████▎ | 7891/12384 [16:44:49<9:33:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 2: 64%|██████▎ | 7892/12384 [16:44:49<9:31:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 2: 64%|██████▎ | 7892/12384 [16:44:56<9:31:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 2: 64%|██████▎ | 7893/12384 [16:44:56<9:31:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 2: 64%|██████▎ | 7893/12384 [16:45:04<9:31:14, 7.63s/it, loss=0.0005, acc=1.0000, iter_time=7.61s]
Epoch 2: 64%|██████▎ | 7894/12384 [16:45:04<9:30:50, 7.63s/it, loss=0.0005, acc=1.0000, iter_time=7.61s]
Epoch 2: 64%|██████▎ | 7894/12384 [16:45:11<9:30:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 64%|██████▍ | 7895/12384 [16:45:11<9:30:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 64%|██████▍ | 7895/12384 [16:45:19<9:30:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 64%|██████▍ | 7896/12384 [16:45:19<9:30:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 64%|██████▍ | 7896/12384 [16:45:27<9:30:40, 7.63s/it, loss=0.0004, acc=0.9983, iter_time=7.22s]
Epoch 2: 64%|██████▍ | 7897/12384 [16:45:27<9:30:17, 7.63s/it, loss=0.0004, acc=0.9983, iter_time=7.22s]
Epoch 2: 64%|██████▍ | 7897/12384 [16:45:34<9:30:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 2: 64%|██████▍ | 7898/12384 [16:45:34<9:29:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 2: 64%|██████▍ | 7898/12384 [16:45:42<9:29:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 2: 64%|██████▍ | 7899/12384 [16:45:42<9:30:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 2: 64%|██████▍ | 7899/12384 [16:45:50<9:30:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 64%|██████▍ | 7900/12384 [16:45:50<9:30:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 64%|██████▍ | 7900/12384 [16:45:57<9:30:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 64%|██████▍ | 7901/12384 [16:45:57<9:30:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 64%|██████▍ | 7901/12384 [16:46:05<9:30:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 2: 64%|██████▍ | 7902/12384 [16:46:05<9:30:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 2: 64%|██████▍ | 7902/12384 [16:46:12<9:30:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.86s]
Epoch 2: 64%|██████▍ | 7903/12384 [16:46:12<9:29:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.86s]
Epoch 2: 64%|██████▍ | 7903/12384 [16:46:20<9:29:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 2: 64%|██████▍ | 7904/12384 [16:46:20<9:30:57, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 2: 64%|██████▍ | 7904/12384 [16:46:28<9:30:57, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 64%|██████▍ | 7905/12384 [16:46:28<9:30:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 64%|██████▍ | 7905/12384 [16:46:35<9:30:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 2: 64%|██████▍ | 7906/12384 [16:46:35<9:29:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 2: 64%|██████▍ | 7906/12384 [16:46:43<9:29:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 64%|██████▍ | 7907/12384 [16:46:43<9:29:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 64%|██████▍ | 7907/12384 [16:46:51<9:29:12, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.88s]
Epoch 2: 64%|██████▍ | 7908/12384 [16:46:51<9:29:54, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=9.88s]
Epoch 2: 64%|██████▍ | 7908/12384 [16:46:58<9:29:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 64%|██████▍ | 7909/12384 [16:46:58<9:29:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 64%|██████▍ | 7909/12384 [16:47:06<9:29:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 64%|██████▍ | 7910/12384 [16:47:06<9:28:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 64%|██████▍ | 7910/12384 [16:47:13<9:28:26, 7.62s/it, loss=0.0002, acc=0.9991, iter_time=7.61s]
Epoch 2: 64%|██████▍ | 7911/12384 [16:47:13<9:28:06, 7.62s/it, loss=0.0002, acc=0.9991, iter_time=7.61s]
Epoch 2: 64%|██████▍ | 7911/12384 [16:47:21<9:28:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 2: 64%|██████▍ | 7912/12384 [16:47:21<9:34:35, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 2: 64%|██████▍ | 7912/12384 [16:47:29<9:34:35, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 2: 64%|██████▍ | 7913/12384 [16:47:29<9:32:27, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 2: 64%|██████▍ | 7913/12384 [16:47:37<9:32:27, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 64%|██████▍ | 7914/12384 [16:47:37<9:38:13, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 64%|██████▍ | 7914/12384 [16:47:45<9:38:13, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 64%|██████▍ | 7915/12384 [16:47:45<9:35:12, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 64%|██████▍ | 7915/12384 [16:47:52<9:35:12, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 64%|██████▍ | 7916/12384 [16:47:52<9:32:51, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 64%|██████▍ | 7916/12384 [16:48:00<9:32:51, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 2: 64%|██████▍ | 7917/12384 [16:48:00<9:30:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 2: 64%|██████▍ | 7917/12384 [16:48:07<9:30:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 64%|██████▍ | 7918/12384 [16:48:07<9:28:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 64%|██████▍ | 7918/12384 [16:48:15<9:28:59, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 2: 64%|██████▍ | 7919/12384 [16:48:15<9:29:42, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 2: 64%|██████▍ | 7919/12384 [16:48:23<9:29:42, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 64%|██████▍ | 7920/12384 [16:48:23<9:29:43, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 64%|██████▍ | 7920/12384 [16:48:30<9:29:43, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 2: 64%|██████▍ | 7921/12384 [16:48:30<9:27:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 2: 64%|██████▍ | 7921/12384 [16:48:38<9:27:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 2: 64%|██████▍ | 7922/12384 [16:48:38<9:27:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 2: 64%|██████▍ | 7922/12384 [16:48:46<9:27:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 2: 64%|██████▍ | 7923/12384 [16:48:46<9:27:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 2: 64%|██████▍ | 7923/12384 [16:48:53<9:27:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 2: 64%|██████▍ | 7924/12384 [16:48:53<9:26:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 2: 64%|██████▍ | 7924/12384 [16:49:01<9:26:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 64%|██████▍ | 7925/12384 [16:49:01<9:26:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 64%|██████▍ | 7925/12384 [16:49:08<9:26:24, 7.62s/it, loss=0.0005, acc=0.9994, iter_time=7.63s]
Epoch 2: 64%|██████▍ | 7926/12384 [16:49:08<9:27:14, 7.63s/it, loss=0.0005, acc=0.9994, iter_time=7.63s]
Epoch 2: 64%|██████▍ | 7926/12384 [16:49:16<9:27:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.63s]
Epoch 2: 64%|██████▍ | 7927/12384 [16:49:16<9:26:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.63s]
Epoch 2: 64%|██████▍ | 7927/12384 [16:49:24<9:26:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.00s]
Epoch 2: 64%|██████▍ | 7928/12384 [16:49:24<9:26:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.00s]
Epoch 2: 64%|██████▍ | 7928/12384 [16:49:31<9:26:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 64%|██████▍ | 7929/12384 [16:49:31<9:25:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 64%|██████▍ | 7929/12384 [16:49:39<9:25:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 2: 64%|██████▍ | 7930/12384 [16:49:39<9:25:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 2: 64%|██████▍ | 7930/12384 [16:49:46<9:25:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 2: 64%|██████▍ | 7931/12384 [16:49:46<9:24:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 2: 64%|██████▍ | 7931/12384 [16:49:54<9:24:38, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 64%|██████▍ | 7932/12384 [16:49:54<9:24:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 64%|██████▍ | 7932/12384 [16:50:02<9:24:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 64%|██████▍ | 7933/12384 [16:50:02<9:24:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 64%|██████▍ | 7933/12384 [16:50:09<9:24:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 64%|██████▍ | 7934/12384 [16:50:09<9:24:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 64%|██████▍ | 7934/12384 [16:50:17<9:24:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 64%|██████▍ | 7935/12384 [16:50:17<9:24:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 64%|██████▍ | 7935/12384 [16:50:25<9:24:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 64%|██████▍ | 7936/12384 [16:50:25<9:25:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 64%|██████▍ | 7936/12384 [16:50:32<9:25:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.86s]
Epoch 2: 64%|██████▍ | 7937/12384 [16:50:32<9:24:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.86s]
Epoch 2: 64%|██████▍ | 7937/12384 [16:50:40<9:24:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 64%|██████▍ | 7938/12384 [16:50:40<9:24:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 64%|██████▍ | 7938/12384 [16:50:47<9:24:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.12s]
Epoch 2: 64%|██████▍ | 7939/12384 [16:50:47<9:23:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.12s]
Epoch 2: 64%|██████▍ | 7939/12384 [16:50:55<9:23:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 64%|██████▍ | 7940/12384 [16:50:55<9:23:01, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 64%|██████▍ | 7940/12384 [16:51:03<9:23:01, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 64%|██████▍ | 7941/12384 [16:51:03<9:30:43, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 64%|██████▍ | 7941/12384 [16:51:11<9:30:43, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 2: 64%|██████▍ | 7942/12384 [16:51:11<9:28:29, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 2: 64%|██████▍ | 7942/12384 [16:51:18<9:28:29, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 2: 64%|██████▍ | 7943/12384 [16:51:18<9:27:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 2: 64%|██████▍ | 7943/12384 [16:51:26<9:27:01, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.26s]
Epoch 2: 64%|██████▍ | 7944/12384 [16:51:26<9:25:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.26s]
Epoch 2: 64%|██████▍ | 7944/12384 [16:51:33<9:25:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.12s]
Epoch 2: 64%|██████▍ | 7945/12384 [16:51:33<9:24:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.12s]
Epoch 2: 64%|██████▍ | 7945/12384 [16:51:41<9:24:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 2: 64%|██████▍ | 7946/12384 [16:51:41<9:24:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 2: 64%|██████▍ | 7946/12384 [16:51:49<9:24:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 64%|██████▍ | 7947/12384 [16:51:49<9:23:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 64%|██████▍ | 7947/12384 [16:51:56<9:23:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 64%|██████▍ | 7948/12384 [16:51:56<9:22:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 64%|██████▍ | 7948/12384 [16:52:04<9:22:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 64%|██████▍ | 7949/12384 [16:52:04<9:22:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 64%|██████▍ | 7949/12384 [16:52:11<9:22:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 64%|██████▍ | 7950/12384 [16:52:11<9:22:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 64%|██████▍ | 7950/12384 [16:52:19<9:22:00, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 2: 64%|██████▍ | 7951/12384 [16:52:19<9:22:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 2: 64%|██████▍ | 7951/12384 [16:52:27<9:22:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 2: 64%|██████▍ | 7952/12384 [16:52:27<9:22:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 2: 64%|██████▍ | 7952/12384 [16:52:34<9:22:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 64%|██████▍ | 7953/12384 [16:52:34<9:22:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 64%|██████▍ | 7953/12384 [16:52:42<9:22:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 64%|██████▍ | 7954/12384 [16:52:42<9:21:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 64%|██████▍ | 7954/12384 [16:52:49<9:21:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 2: 64%|██████▍ | 7955/12384 [16:52:49<9:22:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.01s]
Epoch 2: 64%|██████▍ | 7955/12384 [16:52:57<9:22:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 2: 64%|██████▍ | 7956/12384 [16:52:57<9:21:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 2: 64%|██████▍ | 7956/12384 [16:53:05<9:21:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 2: 64%|██████▍ | 7957/12384 [16:53:05<9:21:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 2: 64%|██████▍ | 7957/12384 [16:53:12<9:21:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 2: 64%|██████▍ | 7958/12384 [16:53:12<9:25:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 2: 64%|██████▍ | 7958/12384 [16:53:20<9:25:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 64%|██████▍ | 7959/12384 [16:53:20<9:24:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 64%|██████▍ | 7959/12384 [16:53:28<9:24:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 64%|██████▍ | 7960/12384 [16:53:28<9:24:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 64%|██████▍ | 7960/12384 [16:53:35<9:24:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 64%|██████▍ | 7961/12384 [16:53:35<9:24:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 64%|██████▍ | 7961/12384 [16:53:43<9:24:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 64%|██████▍ | 7962/12384 [16:53:43<9:23:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 64%|██████▍ | 7962/12384 [16:53:51<9:23:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 2: 64%|██████▍ | 7963/12384 [16:53:51<9:22:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 2: 64%|██████▍ | 7963/12384 [16:53:58<9:22:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 64%|██████▍ | 7964/12384 [16:53:58<9:21:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 64%|██████▍ | 7964/12384 [16:54:06<9:21:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.59s]
Epoch 2: 64%|██████▍ | 7965/12384 [16:54:06<9:22:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.59s]
Epoch 2: 64%|██████▍ | 7965/12384 [16:54:14<9:22:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 2: 64%|██████▍ | 7966/12384 [16:54:14<9:22:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 2: 64%|██████▍ | 7966/12384 [16:54:22<9:22:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.89s]
Epoch 2: 64%|██████▍ | 7967/12384 [16:54:22<9:29:14, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.89s]
Epoch 2: 64%|██████▍ | 7967/12384 [16:54:29<9:29:14, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 2: 64%|██████▍ | 7968/12384 [16:54:29<9:26:15, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 2: 64%|██████▍ | 7968/12384 [16:54:37<9:26:15, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 64%|██████▍ | 7969/12384 [16:54:37<9:24:01, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 64%|██████▍ | 7969/12384 [16:54:44<9:24:01, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 64%|██████▍ | 7970/12384 [16:54:44<9:22:58, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 64%|██████▍ | 7970/12384 [16:54:52<9:22:58, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 64%|██████▍ | 7971/12384 [16:54:52<9:21:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 64%|██████▍ | 7971/12384 [16:55:00<9:21:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 64%|██████▍ | 7972/12384 [16:55:00<9:22:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 64%|██████▍ | 7972/12384 [16:55:07<9:22:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 2: 64%|██████▍ | 7973/12384 [16:55:07<9:20:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 2: 64%|██████▍ | 7973/12384 [16:55:15<9:20:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.80s]
Epoch 2: 64%|██████▍ | 7974/12384 [16:55:15<9:20:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.80s]
Epoch 2: 64%|██████▍ | 7974/12384 [16:55:22<9:20:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 2: 64%|██████▍ | 7975/12384 [16:55:22<9:19:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 2: 64%|██████▍ | 7975/12384 [16:55:30<9:19:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 64%|██████▍ | 7976/12384 [16:55:30<9:19:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 64%|██████▍ | 7976/12384 [16:55:38<9:19:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 64%|██████▍ | 7977/12384 [16:55:38<9:18:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 64%|██████▍ | 7977/12384 [16:55:45<9:18:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 64%|██████▍ | 7978/12384 [16:55:45<9:20:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 64%|██████▍ | 7978/12384 [16:55:53<9:20:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 64%|██████▍ | 7979/12384 [16:55:53<9:21:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 64%|██████▍ | 7979/12384 [16:56:01<9:21:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 64%|██████▍ | 7980/12384 [16:56:01<9:20:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 64%|██████▍ | 7980/12384 [16:56:08<9:20:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 64%|██████▍ | 7981/12384 [16:56:08<9:20:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 64%|██████▍ | 7981/12384 [16:56:16<9:20:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 64%|██████▍ | 7982/12384 [16:56:16<9:19:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 64%|██████▍ | 7982/12384 [16:56:23<9:19:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.93s]
Epoch 2: 64%|██████▍ | 7983/12384 [16:56:23<9:19:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.93s]
Epoch 2: 64%|██████▍ | 7983/12384 [16:56:31<9:19:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 64%|██████▍ | 7984/12384 [16:56:31<9:19:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 64%|██████▍ | 7984/12384 [16:56:39<9:19:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.52s]
Epoch 2: 64%|██████▍ | 7985/12384 [16:56:39<9:18:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.52s]
Epoch 2: 64%|██████▍ | 7985/12384 [16:56:46<9:18:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 2: 64%|██████▍ | 7986/12384 [16:56:46<9:18:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 2: 64%|██████▍ | 7986/12384 [16:56:54<9:18:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 64%|██████▍ | 7987/12384 [16:56:54<9:17:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 64%|██████▍ | 7987/12384 [16:57:01<9:17:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 2: 65%|██████▍ | 7988/12384 [16:57:01<9:16:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 2: 65%|██████▍ | 7988/12384 [16:57:09<9:16:47, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 2: 65%|██████▍ | 7989/12384 [16:57:09<9:18:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 2: 65%|██████▍ | 7989/12384 [16:57:17<9:18:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 65%|██████▍ | 7990/12384 [16:57:17<9:18:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 65%|██████▍ | 7990/12384 [16:57:24<9:18:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 2: 65%|██████▍ | 7991/12384 [16:57:24<9:17:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 2: 65%|██████▍ | 7991/12384 [16:57:32<9:17:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 65%|██████▍ | 7992/12384 [16:57:32<9:17:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 65%|██████▍ | 7992/12384 [16:57:40<9:17:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 2: 65%|██████▍ | 7993/12384 [16:57:40<9:24:22, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 2: 65%|██████▍ | 7993/12384 [16:57:48<9:24:22, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 2: 65%|██████▍ | 7994/12384 [16:57:48<9:21:56, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 2: 65%|██████▍ | 7994/12384 [16:57:55<9:21:56, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 2: 65%|██████▍ | 7995/12384 [16:57:55<9:20:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 2: 65%|██████▍ | 7995/12384 [16:58:03<9:20:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 2: 65%|██████▍ | 7996/12384 [16:58:03<9:18:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 2: 65%|██████▍ | 7996/12384 [16:58:10<9:18:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 65%|██████▍ | 7997/12384 [16:58:10<9:18:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 65%|██████▍ | 7997/12384 [16:58:18<9:18:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 2: 65%|██████▍ | 7998/12384 [16:58:18<9:18:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 2: 65%|██████▍ | 7998/12384 [16:58:26<9:18:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 2: 65%|██████▍ | 7999/12384 [16:58:26<9:17:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 2: 65%|██████▍ | 7999/12384 [16:58:33<9:17:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 65%|██████▍ | 8000/12384 [16:58:33<9:16:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 65%|██████▍ | 8000/12384 [16:58:41<9:16:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 65%|██████▍ | 8001/12384 [16:58:41<9:16:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 65%|██████▍ | 8001/12384 [16:58:48<9:16:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 65%|██████▍ | 8002/12384 [16:58:48<9:16:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 65%|██████▍ | 8002/12384 [16:58:56<9:16:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 65%|██████▍ | 8003/12384 [16:58:56<9:16:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 65%|██████▍ | 8003/12384 [16:59:04<9:16:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 65%|██████▍ | 8004/12384 [16:59:04<9:15:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 65%|██████▍ | 8004/12384 [16:59:11<9:15:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 2: 65%|██████▍ | 8005/12384 [16:59:11<9:17:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 2: 65%|██████▍ | 8005/12384 [16:59:19<9:17:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.20s]
Epoch 2: 65%|██████▍ | 8006/12384 [16:59:19<9:18:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.20s]
Epoch 2: 65%|██████▍ | 8006/12384 [16:59:27<9:18:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 65%|██████▍ | 8007/12384 [16:59:27<9:17:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 65%|██████▍ | 8007/12384 [16:59:34<9:17:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 65%|██████▍ | 8008/12384 [16:59:34<9:16:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 65%|██████▍ | 8008/12384 [16:59:42<9:16:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 2: 65%|██████▍ | 8009/12384 [16:59:42<9:15:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 2: 65%|██████▍ | 8009/12384 [16:59:49<9:15:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 2: 65%|██████▍ | 8010/12384 [16:59:49<9:15:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 2: 65%|██████▍ | 8010/12384 [16:59:57<9:15:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 65%|██████▍ | 8011/12384 [16:59:57<9:15:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 65%|██████▍ | 8011/12384 [17:00:05<9:15:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 65%|██████▍ | 8012/12384 [17:00:05<9:15:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 65%|██████▍ | 8012/12384 [17:00:12<9:15:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 65%|██████▍ | 8013/12384 [17:00:12<9:15:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 65%|██████▍ | 8013/12384 [17:00:20<9:15:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 2: 65%|██████▍ | 8014/12384 [17:00:20<9:14:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 2: 65%|██████▍ | 8014/12384 [17:00:28<9:14:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 2: 65%|██████▍ | 8015/12384 [17:00:28<9:14:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 2: 65%|██████▍ | 8015/12384 [17:00:35<9:14:23, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 65%|██████▍ | 8016/12384 [17:00:35<9:15:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 65%|██████▍ | 8016/12384 [17:00:43<9:15:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 2: 65%|██████▍ | 8017/12384 [17:00:43<9:26:12, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 2: 65%|██████▍ | 8017/12384 [17:00:51<9:26:12, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=7.80s]
Epoch 2: 65%|██████▍ | 8018/12384 [17:00:51<9:27:13, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=7.80s]
Epoch 2: 65%|██████▍ | 8018/12384 [17:00:59<9:27:13, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=5.94s]
Epoch 2: 65%|██████▍ | 8019/12384 [17:00:59<9:36:39, 7.93s/it, loss=0.0000, acc=1.0000, iter_time=5.94s]
Epoch 2: 65%|██████▍ | 8019/12384 [17:01:07<9:36:39, 7.93s/it, loss=0.0000, acc=1.0000, iter_time=10.10s]
Epoch 2: 65%|██████▍ | 8020/12384 [17:01:07<9:33:31, 7.89s/it, loss=0.0000, acc=1.0000, iter_time=10.10s]
Epoch 2: 65%|██████▍ | 8020/12384 [17:01:15<9:33:31, 7.89s/it, loss=0.0000, acc=1.0000, iter_time=7.11s]
Epoch 2: 65%|██████▍ | 8021/12384 [17:01:15<9:30:55, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=7.11s]
Epoch 2: 65%|██████▍ | 8021/12384 [17:01:23<9:30:55, 7.85s/it, loss=0.0001, acc=1.0000, iter_time=8.03s]
Epoch 2: 65%|██████▍ | 8022/12384 [17:01:23<9:28:06, 7.81s/it, loss=0.0001, acc=1.0000, iter_time=8.03s]
Epoch 2: 65%|██████▍ | 8022/12384 [17:01:30<9:28:06, 7.81s/it, loss=0.0000, acc=1.0000, iter_time=6.80s]
Epoch 2: 65%|██████▍ | 8023/12384 [17:01:30<9:25:30, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=6.80s]
Epoch 2: 65%|██████▍ | 8023/12384 [17:01:38<9:25:30, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=8.88s]
Epoch 2: 65%|██████▍ | 8024/12384 [17:01:38<9:23:19, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=8.88s]
Epoch 2: 65%|██████▍ | 8024/12384 [17:01:46<9:23:19, 7.75s/it, loss=0.0001, acc=1.0000, iter_time=7.09s]
Epoch 2: 65%|██████▍ | 8025/12384 [17:01:46<9:21:43, 7.73s/it, loss=0.0001, acc=1.0000, iter_time=7.09s]
Epoch 2: 65%|██████▍ | 8025/12384 [17:01:53<9:21:43, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 2: 65%|██████▍ | 8026/12384 [17:01:53<9:20:01, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 2: 65%|██████▍ | 8026/12384 [17:02:01<9:20:01, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.66s]
Epoch 2: 65%|██████▍ | 8027/12384 [17:02:01<9:19:42, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.66s]
Epoch 2: 65%|██████▍ | 8027/12384 [17:02:09<9:19:42, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=11.36s]
Epoch 2: 65%|██████▍ | 8028/12384 [17:02:09<9:20:21, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=11.36s]
Epoch 2: 65%|██████▍ | 8028/12384 [17:02:17<9:20:21, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 2: 65%|██████▍ | 8029/12384 [17:02:17<9:22:20, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 2: 65%|██████▍ | 8029/12384 [17:02:24<9:22:20, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.80s]
Epoch 2: 65%|██████▍ | 8030/12384 [17:02:24<9:21:51, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.80s]
Epoch 2: 65%|██████▍ | 8030/12384 [17:02:32<9:21:51, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 2: 65%|██████▍ | 8031/12384 [17:02:32<9:22:11, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 2: 65%|██████▍ | 8031/12384 [17:02:40<9:22:11, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 2: 65%|██████▍ | 8032/12384 [17:02:40<9:21:59, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 2: 65%|██████▍ | 8032/12384 [17:02:48<9:21:59, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=6.34s]
Epoch 2: 65%|██████▍ | 8033/12384 [17:02:48<9:22:22, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=6.34s]
Epoch 2: 65%|██████▍ | 8033/12384 [17:02:55<9:22:22, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 65%|██████▍ | 8034/12384 [17:02:55<9:22:45, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 65%|██████▍ | 8034/12384 [17:03:03<9:22:45, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=9.26s]
Epoch 2: 65%|██████▍ | 8035/12384 [17:03:03<9:22:35, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=9.26s]
Epoch 2: 65%|██████▍ | 8035/12384 [17:03:11<9:22:35, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.43s]
Epoch 2: 65%|██████▍ | 8036/12384 [17:03:11<9:24:14, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=7.43s]
Epoch 2: 65%|██████▍ | 8036/12384 [17:03:19<9:24:14, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 65%|██████▍ | 8037/12384 [17:03:19<9:20:22, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 65%|██████▍ | 8037/12384 [17:03:26<9:20:22, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 2: 65%|██████▍ | 8038/12384 [17:03:26<9:17:39, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 2: 65%|██████▍ | 8038/12384 [17:03:34<9:17:39, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 65%|██████▍ | 8039/12384 [17:03:34<9:16:39, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 65%|██████▍ | 8039/12384 [17:03:42<9:16:39, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.69s]
Epoch 2: 65%|██████▍ | 8040/12384 [17:03:42<9:16:43, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.69s]
Epoch 2: 65%|██████▍ | 8040/12384 [17:03:50<9:16:43, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 65%|██████▍ | 8041/12384 [17:03:50<9:22:10, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 65%|██████▍ | 8041/12384 [17:03:57<9:22:10, 7.77s/it, loss=0.0002, acc=0.9998, iter_time=5.50s]
Epoch 2: 65%|██████▍ | 8042/12384 [17:03:57<9:18:37, 7.72s/it, loss=0.0002, acc=0.9998, iter_time=5.50s]
Epoch 2: 65%|██████▍ | 8042/12384 [17:04:05<9:18:37, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 2: 65%|██████▍ | 8043/12384 [17:04:05<9:26:44, 7.83s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 2: 65%|██████▍ | 8043/12384 [17:04:13<9:26:44, 7.83s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 2: 65%|██████▍ | 8044/12384 [17:04:13<9:24:01, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 2: 65%|██████▍ | 8044/12384 [17:04:21<9:24:01, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 2: 65%|██████▍ | 8045/12384 [17:04:21<9:27:24, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 2: 65%|██████▍ | 8045/12384 [17:04:29<9:27:24, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 65%|██████▍ | 8046/12384 [17:04:29<9:23:34, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 65%|██████▍ | 8046/12384 [17:04:36<9:23:34, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 2: 65%|██████▍ | 8047/12384 [17:04:36<9:19:57, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 2: 65%|██████▍ | 8047/12384 [17:04:44<9:19:57, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=8.70s]
Epoch 2: 65%|██████▍ | 8048/12384 [17:04:44<9:17:19, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.70s]
Epoch 2: 65%|██████▍ | 8048/12384 [17:04:52<9:17:19, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 65%|██████▍ | 8049/12384 [17:04:52<9:14:28, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 65%|██████▍ | 8049/12384 [17:04:59<9:14:28, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 65%|██████▌ | 8050/12384 [17:04:59<9:12:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 65%|██████▌ | 8050/12384 [17:05:07<9:12:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 65%|██████▌ | 8051/12384 [17:05:07<9:13:17, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 65%|██████▌ | 8051/12384 [17:05:14<9:13:17, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 2: 65%|██████▌ | 8052/12384 [17:05:14<9:12:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 2: 65%|██████▌ | 8052/12384 [17:05:22<9:12:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 2: 65%|██████▌ | 8053/12384 [17:05:22<9:11:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 2: 65%|██████▌ | 8053/12384 [17:05:30<9:11:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 2: 65%|██████▌ | 8054/12384 [17:05:30<9:10:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 2: 65%|██████▌ | 8054/12384 [17:05:37<9:10:53, 7.63s/it, loss=0.0003, acc=0.9988, iter_time=6.11s]
Epoch 2: 65%|██████▌ | 8055/12384 [17:05:37<9:10:42, 7.63s/it, loss=0.0003, acc=0.9988, iter_time=6.11s]
Epoch 2: 65%|██████▌ | 8055/12384 [17:05:45<9:10:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.87s]
Epoch 2: 65%|██████▌ | 8056/12384 [17:05:45<9:09:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.87s]
Epoch 2: 65%|██████▌ | 8056/12384 [17:05:53<9:09:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.12s]
Epoch 2: 65%|██████▌ | 8057/12384 [17:05:53<9:09:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.12s]
Epoch 2: 65%|██████▌ | 8057/12384 [17:06:00<9:09:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 65%|██████▌ | 8058/12384 [17:06:00<9:09:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 65%|██████▌ | 8058/12384 [17:06:08<9:09:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 2: 65%|██████▌ | 8059/12384 [17:06:08<9:09:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.17s]
Epoch 2: 65%|██████▌ | 8059/12384 [17:06:15<9:09:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 65%|██████▌ | 8060/12384 [17:06:15<9:09:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 65%|██████▌ | 8060/12384 [17:06:23<9:09:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 65%|██████▌ | 8061/12384 [17:06:23<9:09:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 65%|██████▌ | 8061/12384 [17:06:31<9:09:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 65%|██████▌ | 8062/12384 [17:06:31<9:10:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 65%|██████▌ | 8062/12384 [17:06:38<9:10:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 65%|██████▌ | 8063/12384 [17:06:38<9:10:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 65%|██████▌ | 8063/12384 [17:06:46<9:10:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 65%|██████▌ | 8064/12384 [17:06:46<9:09:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 65%|██████▌ | 8064/12384 [17:06:54<9:09:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 65%|██████▌ | 8065/12384 [17:06:54<9:08:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 65%|██████▌ | 8065/12384 [17:07:01<9:08:41, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 2: 65%|██████▌ | 8066/12384 [17:07:01<9:08:32, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 2: 65%|██████▌ | 8066/12384 [17:07:09<9:08:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 65%|██████▌ | 8067/12384 [17:07:09<9:08:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 65%|██████▌ | 8067/12384 [17:07:16<9:08:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 2: 65%|██████▌ | 8068/12384 [17:07:16<9:07:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 2: 65%|██████▌ | 8068/12384 [17:07:24<9:07:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 2: 65%|██████▌ | 8069/12384 [17:07:24<9:07:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 2: 65%|██████▌ | 8069/12384 [17:07:32<9:07:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 2: 65%|██████▌ | 8070/12384 [17:07:32<9:07:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 2: 65%|██████▌ | 8070/12384 [17:07:39<9:07:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 2: 65%|██████▌ | 8071/12384 [17:07:39<9:08:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 2: 65%|██████▌ | 8071/12384 [17:07:47<9:08:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 2: 65%|██████▌ | 8072/12384 [17:07:47<9:13:55, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 2: 65%|██████▌ | 8072/12384 [17:07:55<9:13:55, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 65%|██████▌ | 8073/12384 [17:07:55<9:11:49, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 65%|██████▌ | 8073/12384 [17:08:02<9:11:49, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 65%|██████▌ | 8074/12384 [17:08:02<9:10:07, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 65%|██████▌ | 8074/12384 [17:08:10<9:10:07, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 65%|██████▌ | 8075/12384 [17:08:10<9:09:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 65%|██████▌ | 8075/12384 [17:08:18<9:09:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.25s]
Epoch 2: 65%|██████▌ | 8076/12384 [17:08:18<9:07:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.25s]
Epoch 2: 65%|██████▌ | 8076/12384 [17:08:25<9:07:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 2: 65%|██████▌ | 8077/12384 [17:08:25<9:06:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 2: 65%|██████▌ | 8077/12384 [17:08:33<9:06:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 2: 65%|██████▌ | 8078/12384 [17:08:33<9:06:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 2: 65%|██████▌ | 8078/12384 [17:08:40<9:06:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 2: 65%|██████▌ | 8079/12384 [17:08:40<9:06:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 2: 65%|██████▌ | 8079/12384 [17:08:48<9:06:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 2: 65%|██████▌ | 8080/12384 [17:08:48<9:06:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 2: 65%|██████▌ | 8080/12384 [17:08:56<9:06:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 65%|██████▌ | 8081/12384 [17:08:56<9:06:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 65%|██████▌ | 8081/12384 [17:09:03<9:06:09, 7.62s/it, loss=0.0002, acc=0.9993, iter_time=8.01s]
Epoch 2: 65%|██████▌ | 8082/12384 [17:09:03<9:05:56, 7.61s/it, loss=0.0002, acc=0.9993, iter_time=8.01s]
Epoch 2: 65%|██████▌ | 8082/12384 [17:09:11<9:05:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 65%|██████▌ | 8083/12384 [17:09:11<9:06:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 65%|██████▌ | 8083/12384 [17:09:19<9:06:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 65%|██████▌ | 8084/12384 [17:09:19<9:06:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 65%|██████▌ | 8084/12384 [17:09:26<9:06:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 2: 65%|██████▌ | 8085/12384 [17:09:26<9:06:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 2: 65%|██████▌ | 8085/12384 [17:09:34<9:06:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 2: 65%|██████▌ | 8086/12384 [17:09:34<9:06:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 2: 65%|██████▌ | 8086/12384 [17:09:41<9:06:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 2: 65%|██████▌ | 8087/12384 [17:09:41<9:05:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 2: 65%|██████▌ | 8087/12384 [17:09:49<9:05:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 65%|██████▌ | 8088/12384 [17:09:49<9:07:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 65%|██████▌ | 8088/12384 [17:09:57<9:07:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 2: 65%|██████▌ | 8089/12384 [17:09:57<9:06:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 2: 65%|██████▌ | 8089/12384 [17:10:04<9:06:06, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.63s]
Epoch 2: 65%|██████▌ | 8090/12384 [17:10:04<9:05:59, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.63s]
Epoch 2: 65%|██████▌ | 8090/12384 [17:10:12<9:05:59, 7.63s/it, loss=0.0002, acc=0.9999, iter_time=7.64s]
Epoch 2: 65%|██████▌ | 8091/12384 [17:10:12<9:05:47, 7.63s/it, loss=0.0002, acc=0.9999, iter_time=7.64s]
Epoch 2: 65%|██████▌ | 8091/12384 [17:10:20<9:05:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 65%|██████▌ | 8092/12384 [17:10:20<9:05:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 65%|██████▌ | 8092/12384 [17:10:27<9:05:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 65%|██████▌ | 8093/12384 [17:10:27<9:04:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 65%|██████▌ | 8093/12384 [17:10:35<9:04:50, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.31s]
Epoch 2: 65%|██████▌ | 8094/12384 [17:10:35<9:04:34, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.31s]
Epoch 2: 65%|██████▌ | 8094/12384 [17:10:43<9:04:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 2: 65%|██████▌ | 8095/12384 [17:10:43<9:10:27, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 2: 65%|██████▌ | 8095/12384 [17:10:50<9:10:27, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 65%|██████▌ | 8096/12384 [17:10:50<9:08:48, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 65%|██████▌ | 8096/12384 [17:10:58<9:08:48, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 65%|██████▌ | 8097/12384 [17:10:58<9:07:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 65%|██████▌ | 8097/12384 [17:11:06<9:07:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 65%|██████▌ | 8098/12384 [17:11:06<9:12:41, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 65%|██████▌ | 8098/12384 [17:11:14<9:12:41, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.88s]
Epoch 2: 65%|██████▌ | 8099/12384 [17:11:14<9:32:00, 8.01s/it, loss=0.0000, acc=1.0000, iter_time=8.88s]
Epoch 2: 65%|██████▌ | 8099/12384 [17:11:22<9:32:00, 8.01s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 65%|██████▌ | 8100/12384 [17:11:22<9:31:41, 8.01s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 65%|██████▌ | 8100/12384 [17:11:31<9:31:41, 8.01s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 2: 65%|██████▌ | 8101/12384 [17:11:31<9:37:35, 8.09s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 2: 65%|██████▌ | 8101/12384 [17:11:38<9:37:35, 8.09s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 65%|██████▌ | 8102/12384 [17:11:38<9:27:33, 7.95s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 65%|██████▌ | 8102/12384 [17:11:46<9:27:33, 7.95s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 65%|██████▌ | 8103/12384 [17:11:46<9:20:13, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 65%|██████▌ | 8103/12384 [17:11:54<9:20:13, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 65%|██████▌ | 8104/12384 [17:11:54<9:14:46, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 65%|██████▌ | 8104/12384 [17:12:01<9:14:46, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 65%|██████▌ | 8105/12384 [17:12:01<9:13:17, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 65%|██████▌ | 8105/12384 [17:12:09<9:13:17, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 2: 65%|██████▌ | 8106/12384 [17:12:09<9:09:43, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.59s]
Epoch 2: 65%|██████▌ | 8106/12384 [17:12:17<9:09:43, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.71s]
Epoch 2: 65%|██████▌ | 8107/12384 [17:12:17<9:06:57, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.71s]
Epoch 2: 65%|██████▌ | 8107/12384 [17:12:24<9:06:57, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 65%|██████▌ | 8108/12384 [17:12:24<9:05:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 65%|██████▌ | 8108/12384 [17:12:32<9:05:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 2: 65%|██████▌ | 8109/12384 [17:12:32<9:04:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 2: 65%|██████▌ | 8109/12384 [17:12:39<9:04:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 2: 65%|██████▌ | 8110/12384 [17:12:39<9:03:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 2: 65%|██████▌ | 8110/12384 [17:12:47<9:03:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 2: 65%|██████▌ | 8111/12384 [17:12:47<9:03:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 2: 65%|██████▌ | 8111/12384 [17:12:55<9:03:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 66%|██████▌ | 8112/12384 [17:12:55<9:03:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 66%|██████▌ | 8112/12384 [17:13:02<9:03:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 66%|██████▌ | 8113/12384 [17:13:02<9:03:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 66%|██████▌ | 8113/12384 [17:13:10<9:03:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 66%|██████▌ | 8114/12384 [17:13:10<9:02:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 66%|██████▌ | 8114/12384 [17:13:17<9:02:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 66%|██████▌ | 8115/12384 [17:13:17<9:02:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 66%|██████▌ | 8115/12384 [17:13:25<9:02:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 66%|██████▌ | 8116/12384 [17:13:25<9:01:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 66%|██████▌ | 8116/12384 [17:13:33<9:01:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 66%|██████▌ | 8117/12384 [17:13:33<9:01:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 66%|██████▌ | 8117/12384 [17:13:40<9:01:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 2: 66%|██████▌ | 8118/12384 [17:13:40<9:01:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 2: 66%|██████▌ | 8118/12384 [17:13:48<9:01:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.33s]
Epoch 2: 66%|██████▌ | 8119/12384 [17:13:48<9:00:31, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.33s]
Epoch 2: 66%|██████▌ | 8119/12384 [17:13:55<9:00:31, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 66%|██████▌ | 8120/12384 [17:13:55<9:00:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 66%|██████▌ | 8120/12384 [17:14:03<9:00:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 66%|██████▌ | 8121/12384 [17:14:03<9:00:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 66%|██████▌ | 8121/12384 [17:14:11<9:00:47, 7.61s/it, loss=0.0001, acc=0.9982, iter_time=7.66s]
Epoch 2: 66%|██████▌ | 8122/12384 [17:14:11<9:00:51, 7.61s/it, loss=0.0001, acc=0.9982, iter_time=7.66s]
Epoch 2: 66%|██████▌ | 8122/12384 [17:14:18<9:00:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 66%|██████▌ | 8123/12384 [17:14:18<9:00:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 66%|██████▌ | 8123/12384 [17:14:26<9:00:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 66%|██████▌ | 8124/12384 [17:14:26<9:02:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 66%|██████▌ | 8124/12384 [17:14:34<9:02:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 2: 66%|██████▌ | 8125/12384 [17:14:34<9:08:24, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 2: 66%|██████▌ | 8125/12384 [17:14:42<9:08:24, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 66%|██████▌ | 8126/12384 [17:14:42<9:06:06, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 66%|██████▌ | 8126/12384 [17:14:50<9:06:06, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 2: 66%|██████▌ | 8127/12384 [17:14:50<9:19:15, 7.88s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 2: 66%|██████▌ | 8127/12384 [17:14:58<9:19:15, 7.88s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 66%|██████▌ | 8128/12384 [17:14:58<9:13:32, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 66%|██████▌ | 8128/12384 [17:15:05<9:13:32, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=4.91s]
Epoch 2: 66%|██████▌ | 8129/12384 [17:15:05<9:09:19, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=4.91s]
Epoch 2: 66%|██████▌ | 8129/12384 [17:15:13<9:09:19, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=10.05s]
Epoch 2: 66%|██████▌ | 8130/12384 [17:15:13<9:08:42, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=10.05s]
Epoch 2: 66%|██████▌ | 8130/12384 [17:15:20<9:08:42, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 2: 66%|██████▌ | 8131/12384 [17:15:20<9:05:55, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 2: 66%|██████▌ | 8131/12384 [17:15:28<9:05:55, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.65s]
Epoch 2: 66%|██████▌ | 8132/12384 [17:15:28<9:04:03, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.65s]
Epoch 2: 66%|██████▌ | 8132/12384 [17:15:36<9:04:03, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 66%|██████▌ | 8133/12384 [17:15:36<9:02:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 66%|██████▌ | 8133/12384 [17:15:43<9:02:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 66%|██████▌ | 8134/12384 [17:15:43<9:01:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 66%|██████▌ | 8134/12384 [17:15:51<9:01:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 2: 66%|██████▌ | 8135/12384 [17:15:51<9:00:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 2: 66%|██████▌ | 8135/12384 [17:15:59<9:00:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.98s]
Epoch 2: 66%|██████▌ | 8136/12384 [17:15:59<9:00:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.98s]
Epoch 2: 66%|██████▌ | 8136/12384 [17:16:06<9:00:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 66%|██████▌ | 8137/12384 [17:16:06<8:59:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 66%|██████▌ | 8137/12384 [17:16:14<8:59:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 66%|██████▌ | 8138/12384 [17:16:14<8:59:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 66%|██████▌ | 8138/12384 [17:16:21<8:59:30, 7.62s/it, loss=0.0019, acc=0.9970, iter_time=6.14s]
Epoch 2: 66%|██████▌ | 8139/12384 [17:16:21<8:58:37, 7.61s/it, loss=0.0019, acc=0.9970, iter_time=6.14s]
Epoch 2: 66%|██████▌ | 8139/12384 [17:16:29<8:58:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 66%|██████▌ | 8140/12384 [17:16:29<8:57:46, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 66%|██████▌ | 8140/12384 [17:16:37<8:57:46, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 2: 66%|██████▌ | 8141/12384 [17:16:37<8:57:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 2: 66%|██████▌ | 8141/12384 [17:16:44<8:57:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.18s]
Epoch 2: 66%|██████▌ | 8142/12384 [17:16:44<8:59:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.18s]
Epoch 2: 66%|██████▌ | 8142/12384 [17:16:52<8:59:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.14s]
Epoch 2: 66%|██████▌ | 8143/12384 [17:16:52<8:59:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.14s]
Epoch 2: 66%|██████▌ | 8143/12384 [17:17:00<8:59:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 66%|██████▌ | 8144/12384 [17:17:00<8:59:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 66%|██████▌ | 8144/12384 [17:17:07<8:59:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 66%|██████▌ | 8145/12384 [17:17:07<8:58:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 66%|██████▌ | 8145/12384 [17:17:15<8:58:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 66%|██████▌ | 8146/12384 [17:17:15<8:58:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 66%|██████▌ | 8146/12384 [17:17:22<8:58:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 66%|██████▌ | 8147/12384 [17:17:22<8:57:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 66%|██████▌ | 8147/12384 [17:17:30<8:57:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 66%|██████▌ | 8148/12384 [17:17:30<8:57:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 66%|██████▌ | 8148/12384 [17:17:38<8:57:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 66%|██████▌ | 8149/12384 [17:17:38<8:57:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 66%|██████▌ | 8149/12384 [17:17:45<8:57:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 66%|██████▌ | 8150/12384 [17:17:45<8:56:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 66%|██████▌ | 8150/12384 [17:17:53<8:56:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 66%|██████▌ | 8151/12384 [17:17:53<9:03:37, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 66%|██████▌ | 8151/12384 [17:18:01<9:03:37, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 2: 66%|██████▌ | 8152/12384 [17:18:01<9:01:07, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 2: 66%|██████▌ | 8152/12384 [17:18:08<9:01:07, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 2: 66%|██████▌ | 8153/12384 [17:18:08<8:59:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 2: 66%|██████▌ | 8153/12384 [17:18:16<8:59:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 2: 66%|██████▌ | 8154/12384 [17:18:16<8:59:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 2: 66%|██████▌ | 8154/12384 [17:18:24<8:59:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 2: 66%|██████▌ | 8155/12384 [17:18:24<8:58:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.42s]
Epoch 2: 66%|██████▌ | 8155/12384 [17:18:31<8:58:02, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 2: 66%|██████▌ | 8156/12384 [17:18:31<8:57:14, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 2: 66%|██████▌ | 8156/12384 [17:18:39<8:57:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 2: 66%|██████▌ | 8157/12384 [17:18:39<9:00:00, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.91s]
Epoch 2: 66%|██████▌ | 8157/12384 [17:18:47<9:00:00, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 2: 66%|██████▌ | 8158/12384 [17:18:47<8:58:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 2: 66%|██████▌ | 8158/12384 [17:18:54<8:58:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 66%|██████▌ | 8159/12384 [17:18:54<8:58:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 66%|██████▌ | 8159/12384 [17:19:02<8:58:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 66%|██████▌ | 8160/12384 [17:19:02<8:58:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 66%|██████▌ | 8160/12384 [17:19:09<8:58:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 66%|██████▌ | 8161/12384 [17:19:09<8:57:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 66%|██████▌ | 8161/12384 [17:19:17<8:57:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 66%|██████▌ | 8162/12384 [17:19:17<8:57:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 66%|██████▌ | 8162/12384 [17:19:25<8:57:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 66%|██████▌ | 8163/12384 [17:19:25<8:57:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 66%|██████▌ | 8163/12384 [17:19:32<8:57:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 66%|██████▌ | 8164/12384 [17:19:32<8:56:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 66%|██████▌ | 8164/12384 [17:19:40<8:56:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 2: 66%|██████▌ | 8165/12384 [17:19:40<8:55:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 2: 66%|██████▌ | 8165/12384 [17:19:48<8:55:16, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.03s]
Epoch 2: 66%|██████▌ | 8166/12384 [17:19:48<8:55:24, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.03s]
Epoch 2: 66%|██████▌ | 8166/12384 [17:19:55<8:55:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 66%|██████▌ | 8167/12384 [17:19:55<8:55:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 66%|██████▌ | 8167/12384 [17:20:03<8:55:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.83s]
Epoch 2: 66%|██████▌ | 8168/12384 [17:20:03<8:54:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.83s]
Epoch 2: 66%|██████▌ | 8168/12384 [17:20:10<8:54:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 2: 66%|██████▌ | 8169/12384 [17:20:10<8:55:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 2: 66%|██████▌ | 8169/12384 [17:20:18<8:55:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.74s]
Epoch 2: 66%|██████▌ | 8170/12384 [17:20:18<8:54:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.74s]
Epoch 2: 66%|██████▌ | 8170/12384 [17:20:26<8:54:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 2: 66%|██████▌ | 8171/12384 [17:20:26<8:54:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 2: 66%|██████▌ | 8171/12384 [17:20:33<8:54:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 2: 66%|██████▌ | 8172/12384 [17:20:33<8:54:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 2: 66%|██████▌ | 8172/12384 [17:20:41<8:54:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 66%|██████▌ | 8173/12384 [17:20:41<8:54:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 66%|██████▌ | 8173/12384 [17:20:49<8:54:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 66%|██████▌ | 8174/12384 [17:20:49<9:00:40, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 66%|██████▌ | 8174/12384 [17:20:56<9:00:40, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 66%|██████▌ | 8175/12384 [17:20:56<8:58:24, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 66%|██████▌ | 8175/12384 [17:21:04<8:58:24, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 66%|██████▌ | 8176/12384 [17:21:04<8:57:07, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 66%|██████▌ | 8176/12384 [17:21:12<8:57:07, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 66%|██████▌ | 8177/12384 [17:21:12<9:03:28, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 66%|██████▌ | 8177/12384 [17:21:20<9:03:28, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 66%|██████▌ | 8178/12384 [17:21:20<9:00:20, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 66%|██████▌ | 8178/12384 [17:21:27<9:00:20, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 66%|██████▌ | 8179/12384 [17:21:27<8:59:02, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 66%|██████▌ | 8179/12384 [17:21:35<8:59:02, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 66%|██████▌ | 8180/12384 [17:21:35<8:57:08, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 66%|██████▌ | 8180/12384 [17:21:42<8:57:08, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 66%|██████▌ | 8181/12384 [17:21:42<8:55:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 66%|██████▌ | 8181/12384 [17:21:50<8:55:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.95s]
Epoch 2: 66%|██████▌ | 8182/12384 [17:21:50<8:55:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.95s]
Epoch 2: 66%|██████▌ | 8182/12384 [17:21:58<8:55:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 66%|██████▌ | 8183/12384 [17:21:58<8:56:02, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 66%|██████▌ | 8183/12384 [17:22:05<8:56:02, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 66%|██████▌ | 8184/12384 [17:22:05<8:55:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 66%|██████▌ | 8184/12384 [17:22:13<8:55:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=3.97s]
Epoch 2: 66%|██████▌ | 8185/12384 [17:22:13<8:55:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=3.97s]
Epoch 2: 66%|██████▌ | 8185/12384 [17:22:21<8:55:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.02s]
Epoch 2: 66%|██████▌ | 8186/12384 [17:22:21<8:54:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.02s]
Epoch 2: 66%|██████▌ | 8186/12384 [17:22:28<8:54:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 2: 66%|██████▌ | 8187/12384 [17:22:28<8:53:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 2: 66%|██████▌ | 8187/12384 [17:22:36<8:53:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 66%|██████▌ | 8188/12384 [17:22:36<8:52:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 66%|██████▌ | 8188/12384 [17:22:43<8:52:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 66%|██████▌ | 8189/12384 [17:22:43<8:52:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 66%|██████▌ | 8189/12384 [17:22:51<8:52:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 66%|██████▌ | 8190/12384 [17:22:51<8:52:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 66%|██████▌ | 8190/12384 [17:22:59<8:52:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 66%|██████▌ | 8191/12384 [17:22:59<8:52:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 66%|██████▌ | 8191/12384 [17:23:06<8:52:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 66%|██████▌ | 8192/12384 [17:23:06<8:52:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 66%|██████▌ | 8192/12384 [17:23:14<8:52:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.50s]
Epoch 2: 66%|██████▌ | 8193/12384 [17:23:14<8:52:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.50s]
Epoch 2: 66%|██████▌ | 8193/12384 [17:23:22<8:52:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 66%|██████▌ | 8194/12384 [17:23:22<8:51:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 66%|██████▌ | 8194/12384 [17:23:29<8:51:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 2: 66%|██████▌ | 8195/12384 [17:23:29<8:51:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 2: 66%|██████▌ | 8195/12384 [17:23:37<8:51:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 66%|██████▌ | 8196/12384 [17:23:37<8:52:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 66%|██████▌ | 8196/12384 [17:23:44<8:52:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 66%|██████▌ | 8197/12384 [17:23:44<8:51:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 66%|██████▌ | 8197/12384 [17:23:52<8:51:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 66%|██████▌ | 8198/12384 [17:23:52<8:51:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 66%|██████▌ | 8198/12384 [17:24:00<8:51:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 66%|██████▌ | 8199/12384 [17:24:00<8:50:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 66%|██████▌ | 8199/12384 [17:24:07<8:50:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 66%|██████▌ | 8200/12384 [17:24:07<8:51:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 66%|██████▌ | 8200/12384 [17:24:15<8:51:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 2: 66%|██████▌ | 8201/12384 [17:24:15<8:56:42, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 2: 66%|██████▌ | 8201/12384 [17:24:23<8:56:42, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 66%|██████▌ | 8202/12384 [17:24:23<8:54:53, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 66%|██████▌ | 8202/12384 [17:24:31<8:54:53, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 66%|██████▌ | 8203/12384 [17:24:31<9:00:55, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 66%|██████▌ | 8203/12384 [17:24:38<9:00:55, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 66%|██████▌ | 8204/12384 [17:24:38<8:58:46, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 66%|██████▌ | 8204/12384 [17:24:46<8:58:46, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 66%|██████▋ | 8205/12384 [17:24:46<8:56:03, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 66%|██████▋ | 8205/12384 [17:24:54<8:56:03, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.77s]
Epoch 2: 66%|██████▋ | 8206/12384 [17:24:54<8:54:22, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.77s]
Epoch 2: 66%|██████▋ | 8206/12384 [17:25:01<8:54:22, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 2: 66%|██████▋ | 8207/12384 [17:25:01<8:52:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.17s]
Epoch 2: 66%|██████▋ | 8207/12384 [17:25:09<8:52:35, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 2: 66%|██████▋ | 8208/12384 [17:25:09<8:51:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 2: 66%|██████▋ | 8208/12384 [17:25:16<8:51:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 66%|██████▋ | 8209/12384 [17:25:16<8:51:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 66%|██████▋ | 8209/12384 [17:25:24<8:51:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 2: 66%|██████▋ | 8210/12384 [17:25:24<8:50:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 2: 66%|██████▋ | 8210/12384 [17:25:32<8:50:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 2: 66%|██████▋ | 8211/12384 [17:25:32<8:50:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 2: 66%|██████▋ | 8211/12384 [17:25:39<8:50:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 2: 66%|██████▋ | 8212/12384 [17:25:39<8:49:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 2: 66%|██████▋ | 8212/12384 [17:25:47<8:49:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 2: 66%|██████▋ | 8213/12384 [17:25:47<8:50:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 2: 66%|██████▋ | 8213/12384 [17:25:55<8:50:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 66%|██████▋ | 8214/12384 [17:25:55<8:49:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 66%|██████▋ | 8214/12384 [17:26:02<8:49:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.89s]
Epoch 2: 66%|██████▋ | 8215/12384 [17:26:02<8:49:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.89s]
Epoch 2: 66%|██████▋ | 8215/12384 [17:26:10<8:49:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.76s]
Epoch 2: 66%|██████▋ | 8216/12384 [17:26:10<8:49:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.76s]
Epoch 2: 66%|██████▋ | 8216/12384 [17:26:17<8:49:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 66%|██████▋ | 8217/12384 [17:26:17<8:50:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 66%|██████▋ | 8217/12384 [17:26:25<8:50:49, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.72s]
Epoch 2: 66%|██████▋ | 8218/12384 [17:26:25<8:49:52, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.72s]
Epoch 2: 66%|██████▋ | 8218/12384 [17:26:33<8:49:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 66%|██████▋ | 8219/12384 [17:26:33<8:50:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 66%|██████▋ | 8219/12384 [17:26:40<8:50:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 2: 66%|██████▋ | 8220/12384 [17:26:40<8:51:28, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 2: 66%|██████▋ | 8220/12384 [17:26:48<8:51:28, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 66%|██████▋ | 8221/12384 [17:26:48<8:49:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 66%|██████▋ | 8221/12384 [17:26:56<8:49:49, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=5.99s]
Epoch 2: 66%|██████▋ | 8222/12384 [17:26:56<8:49:07, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.99s]
Epoch 2: 66%|██████▋ | 8222/12384 [17:27:03<8:49:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 2: 66%|██████▋ | 8223/12384 [17:27:03<8:48:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 2: 66%|██████▋ | 8223/12384 [17:27:11<8:48:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 66%|██████▋ | 8224/12384 [17:27:11<8:48:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 66%|██████▋ | 8224/12384 [17:27:18<8:48:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 66%|██████▋ | 8225/12384 [17:27:18<8:48:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 66%|██████▋ | 8225/12384 [17:27:26<8:48:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 66%|██████▋ | 8226/12384 [17:27:26<8:48:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 66%|██████▋ | 8226/12384 [17:27:34<8:48:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 2: 66%|██████▋ | 8227/12384 [17:27:34<8:57:49, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 2: 66%|██████▋ | 8227/12384 [17:27:42<8:57:49, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 66%|██████▋ | 8228/12384 [17:27:42<8:54:48, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 66%|██████▋ | 8228/12384 [17:27:50<8:54:48, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 66%|██████▋ | 8229/12384 [17:27:50<8:59:42, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 66%|██████▋ | 8229/12384 [17:27:57<8:59:42, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 66%|██████▋ | 8230/12384 [17:27:57<8:55:28, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 66%|██████▋ | 8230/12384 [17:28:05<8:55:28, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 66%|██████▋ | 8231/12384 [17:28:05<8:54:00, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 66%|██████▋ | 8231/12384 [17:28:13<8:54:00, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 2: 66%|██████▋ | 8232/12384 [17:28:13<8:58:18, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 2: 66%|██████▋ | 8232/12384 [17:28:21<8:58:18, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 2: 66%|██████▋ | 8233/12384 [17:28:21<8:54:42, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.51s]
Epoch 2: 66%|██████▋ | 8233/12384 [17:28:28<8:54:42, 7.73s/it, loss=0.0004, acc=0.9986, iter_time=7.61s]
Epoch 2: 66%|██████▋ | 8234/12384 [17:28:28<8:51:57, 7.69s/it, loss=0.0004, acc=0.9986, iter_time=7.61s]
Epoch 2: 66%|██████▋ | 8234/12384 [17:28:36<8:51:57, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.05s]
Epoch 2: 66%|██████▋ | 8235/12384 [17:28:36<8:50:20, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.05s]
Epoch 2: 66%|██████▋ | 8235/12384 [17:28:43<8:50:20, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 2: 67%|██████▋ | 8236/12384 [17:28:43<8:49:22, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.16s]
Epoch 2: 67%|██████▋ | 8236/12384 [17:28:51<8:49:22, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=5.91s]
Epoch 2: 67%|██████▋ | 8237/12384 [17:28:51<8:47:49, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=5.91s]
Epoch 2: 67%|██████▋ | 8237/12384 [17:28:59<8:47:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.46s]
Epoch 2: 67%|██████▋ | 8238/12384 [17:28:59<8:46:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.46s]
Epoch 2: 67%|██████▋ | 8238/12384 [17:29:06<8:46:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 2: 67%|██████▋ | 8239/12384 [17:29:06<8:46:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 2: 67%|██████▋ | 8239/12384 [17:29:14<8:46:22, 7.62s/it, loss=0.0003, acc=0.9990, iter_time=8.00s]
Epoch 2: 67%|██████▋ | 8240/12384 [17:29:14<8:46:13, 7.62s/it, loss=0.0003, acc=0.9990, iter_time=8.00s]
Epoch 2: 67%|██████▋ | 8240/12384 [17:29:21<8:46:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 67%|██████▋ | 8241/12384 [17:29:21<8:46:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 67%|██████▋ | 8241/12384 [17:29:29<8:46:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 67%|██████▋ | 8242/12384 [17:29:29<8:46:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 67%|██████▋ | 8242/12384 [17:29:37<8:46:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 67%|██████▋ | 8243/12384 [17:29:37<8:45:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 67%|██████▋ | 8243/12384 [17:29:44<8:45:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 67%|██████▋ | 8244/12384 [17:29:44<8:46:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 67%|██████▋ | 8244/12384 [17:29:52<8:46:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 2: 67%|██████▋ | 8245/12384 [17:29:52<8:45:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 2: 67%|██████▋ | 8245/12384 [17:30:00<8:45:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 2: 67%|██████▋ | 8246/12384 [17:30:00<8:46:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 2: 67%|██████▋ | 8246/12384 [17:30:07<8:46:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 2: 67%|██████▋ | 8247/12384 [17:30:07<8:46:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 2: 67%|██████▋ | 8247/12384 [17:30:15<8:46:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 67%|██████▋ | 8248/12384 [17:30:15<8:45:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 67%|██████▋ | 8248/12384 [17:30:22<8:45:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 67%|██████▋ | 8249/12384 [17:30:22<8:45:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 67%|██████▋ | 8249/12384 [17:30:30<8:45:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.80s]
Epoch 2: 67%|██████▋ | 8250/12384 [17:30:30<8:45:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.80s]
Epoch 2: 67%|██████▋ | 8250/12384 [17:30:38<8:45:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 2: 67%|██████▋ | 8251/12384 [17:30:38<8:51:00, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 2: 67%|██████▋ | 8251/12384 [17:30:46<8:51:00, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 67%|██████▋ | 8252/12384 [17:30:46<8:48:39, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 67%|██████▋ | 8252/12384 [17:30:53<8:48:39, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 67%|██████▋ | 8253/12384 [17:30:53<8:49:21, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 67%|██████▋ | 8253/12384 [17:31:02<8:49:21, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 2: 67%|██████▋ | 8254/12384 [17:31:02<8:59:43, 7.84s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 2: 67%|██████▋ | 8254/12384 [17:31:09<8:59:43, 7.84s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 67%|██████▋ | 8255/12384 [17:31:09<9:01:21, 7.87s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 67%|██████▋ | 8255/12384 [17:31:18<9:01:21, 7.87s/it, loss=0.0000, acc=1.0000, iter_time=8.37s]
Epoch 2: 67%|██████▋ | 8256/12384 [17:31:18<9:09:59, 7.99s/it, loss=0.0000, acc=1.0000, iter_time=8.37s]
Epoch 2: 67%|██████▋ | 8256/12384 [17:31:26<9:09:59, 7.99s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 2: 67%|██████▋ | 8257/12384 [17:31:26<9:07:26, 7.96s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 2: 67%|██████▋ | 8257/12384 [17:31:33<9:07:26, 7.96s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 2: 67%|██████▋ | 8258/12384 [17:31:33<9:05:57, 7.94s/it, loss=0.0000, acc=1.0000, iter_time=6.37s]
Epoch 2: 67%|██████▋ | 8258/12384 [17:31:41<9:05:57, 7.94s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 2: 67%|██████▋ | 8259/12384 [17:31:41<9:04:06, 7.91s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 2: 67%|██████▋ | 8259/12384 [17:31:50<9:04:06, 7.91s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 2: 67%|██████▋ | 8260/12384 [17:31:50<9:27:25, 8.26s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 2: 67%|██████▋ | 8260/12384 [17:31:58<9:27:25, 8.26s/it, loss=0.0000, acc=1.0000, iter_time=11.16s]
Epoch 2: 67%|██████▋ | 8261/12384 [17:31:58<9:19:41, 8.14s/it, loss=0.0000, acc=1.0000, iter_time=11.16s]
Epoch 2: 67%|██████▋ | 8261/12384 [17:32:06<9:19:41, 8.14s/it, loss=0.0001, acc=1.0000, iter_time=6.81s]
Epoch 2: 67%|██████▋ | 8262/12384 [17:32:06<9:12:46, 8.05s/it, loss=0.0001, acc=1.0000, iter_time=6.81s]
Epoch 2: 67%|██████▋ | 8262/12384 [17:32:14<9:12:46, 8.05s/it, loss=0.0000, acc=1.0000, iter_time=5.43s]
Epoch 2: 67%|██████▋ | 8263/12384 [17:32:14<9:08:33, 7.99s/it, loss=0.0000, acc=1.0000, iter_time=5.43s]
Epoch 2: 67%|██████▋ | 8263/12384 [17:32:22<9:08:33, 7.99s/it, loss=0.0000, acc=1.0000, iter_time=11.70s]
Epoch 2: 67%|██████▋ | 8264/12384 [17:32:22<9:05:23, 7.94s/it, loss=0.0000, acc=1.0000, iter_time=11.70s]
Epoch 2: 67%|██████▋ | 8264/12384 [17:32:30<9:05:23, 7.94s/it, loss=0.0000, acc=1.0000, iter_time=7.42s]
Epoch 2: 67%|██████▋ | 8265/12384 [17:32:30<9:02:23, 7.90s/it, loss=0.0000, acc=1.0000, iter_time=7.42s]
Epoch 2: 67%|██████▋ | 8265/12384 [17:32:37<9:02:23, 7.90s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 2: 67%|██████▋ | 8266/12384 [17:32:37<9:01:07, 7.88s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 2: 67%|██████▋ | 8266/12384 [17:32:45<9:01:07, 7.88s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 2: 67%|██████▋ | 8267/12384 [17:32:45<9:01:25, 7.89s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 2: 67%|██████▋ | 8267/12384 [17:32:53<9:01:25, 7.89s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 67%|██████▋ | 8268/12384 [17:32:53<9:01:24, 7.89s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 67%|██████▋ | 8268/12384 [17:33:01<9:01:24, 7.89s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 2: 67%|██████▋ | 8269/12384 [17:33:01<9:00:19, 7.88s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 2: 67%|██████▋ | 8269/12384 [17:33:09<9:00:19, 7.88s/it, loss=0.0000, acc=1.0000, iter_time=8.96s]
Epoch 2: 67%|██████▋ | 8270/12384 [17:33:09<8:59:54, 7.87s/it, loss=0.0000, acc=1.0000, iter_time=8.96s]
Epoch 2: 67%|██████▋ | 8270/12384 [17:33:17<8:59:54, 7.87s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 67%|██████▋ | 8271/12384 [17:33:17<9:00:06, 7.88s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 67%|██████▋ | 8271/12384 [17:33:25<9:00:06, 7.88s/it, loss=0.0001, acc=1.0000, iter_time=7.77s]
Epoch 2: 67%|██████▋ | 8272/12384 [17:33:25<8:57:48, 7.85s/it, loss=0.0001, acc=1.0000, iter_time=7.77s]
Epoch 2: 67%|██████▋ | 8272/12384 [17:33:32<8:57:48, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 67%|██████▋ | 8273/12384 [17:33:32<8:58:10, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 67%|██████▋ | 8273/12384 [17:33:40<8:58:10, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=6.83s]
Epoch 2: 67%|██████▋ | 8274/12384 [17:33:40<8:57:20, 7.84s/it, loss=0.0000, acc=1.0000, iter_time=6.83s]
Epoch 2: 67%|██████▋ | 8274/12384 [17:33:48<8:57:20, 7.84s/it, loss=0.0000, acc=1.0000, iter_time=8.93s]
Epoch 2: 67%|██████▋ | 8275/12384 [17:33:48<8:58:10, 7.86s/it, loss=0.0000, acc=1.0000, iter_time=8.93s]
Epoch 2: 67%|██████▋ | 8275/12384 [17:33:56<8:58:10, 7.86s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 2: 67%|██████▋ | 8276/12384 [17:33:56<8:57:40, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 2: 67%|██████▋ | 8276/12384 [17:34:04<8:57:40, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 67%|██████▋ | 8277/12384 [17:34:04<8:57:30, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 67%|██████▋ | 8277/12384 [17:34:12<8:57:30, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 2: 67%|██████▋ | 8278/12384 [17:34:12<9:05:34, 7.97s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 2: 67%|██████▋ | 8278/12384 [17:34:20<9:05:34, 7.97s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 2: 67%|██████▋ | 8279/12384 [17:34:20<9:02:53, 7.93s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 2: 67%|██████▋ | 8279/12384 [17:34:28<9:02:53, 7.93s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 67%|██████▋ | 8280/12384 [17:34:28<9:02:52, 7.94s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 67%|██████▋ | 8280/12384 [17:34:36<9:02:52, 7.94s/it, loss=0.0004, acc=0.9982, iter_time=6.58s]
Epoch 2: 67%|██████▋ | 8281/12384 [17:34:36<9:01:55, 7.92s/it, loss=0.0004, acc=0.9982, iter_time=6.58s]
Epoch 2: 67%|██████▋ | 8281/12384 [17:34:44<9:01:55, 7.92s/it, loss=0.0000, acc=1.0000, iter_time=10.04s]
Epoch 2: 67%|██████▋ | 8282/12384 [17:34:44<9:08:55, 8.03s/it, loss=0.0000, acc=1.0000, iter_time=10.04s]
Epoch 2: 67%|██████▋ | 8282/12384 [17:34:52<9:08:55, 8.03s/it, loss=0.0000, acc=1.0000, iter_time=6.78s]
Epoch 2: 67%|██████▋ | 8283/12384 [17:34:52<9:05:47, 7.99s/it, loss=0.0000, acc=1.0000, iter_time=6.78s]
Epoch 2: 67%|██████▋ | 8283/12384 [17:35:00<9:05:47, 7.99s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 2: 67%|██████▋ | 8284/12384 [17:35:00<9:05:14, 7.98s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 2: 67%|██████▋ | 8284/12384 [17:35:08<9:05:14, 7.98s/it, loss=0.0000, acc=1.0000, iter_time=9.52s]
Epoch 2: 67%|██████▋ | 8285/12384 [17:35:08<9:02:26, 7.94s/it, loss=0.0000, acc=1.0000, iter_time=9.52s]
Epoch 2: 67%|██████▋ | 8285/12384 [17:35:16<9:02:26, 7.94s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 2: 67%|██████▋ | 8286/12384 [17:35:16<9:01:31, 7.93s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 2: 67%|██████▋ | 8286/12384 [17:35:24<9:01:31, 7.93s/it, loss=0.0000, acc=1.0000, iter_time=8.93s]
Epoch 2: 67%|██████▋ | 8287/12384 [17:35:24<9:00:52, 7.92s/it, loss=0.0000, acc=1.0000, iter_time=8.93s]
Epoch 2: 67%|██████▋ | 8287/12384 [17:35:31<9:00:52, 7.92s/it, loss=0.0000, acc=1.0000, iter_time=9.78s]
Epoch 2: 67%|██████▋ | 8288/12384 [17:35:31<8:55:00, 7.84s/it, loss=0.0000, acc=1.0000, iter_time=9.78s]
Epoch 2: 67%|██████▋ | 8288/12384 [17:35:39<8:55:00, 7.84s/it, loss=0.0003, acc=0.9976, iter_time=4.93s]
Epoch 2: 67%|██████▋ | 8289/12384 [17:35:39<8:52:10, 7.80s/it, loss=0.0003, acc=0.9976, iter_time=4.93s]
Epoch 2: 67%|██████▋ | 8289/12384 [17:35:47<8:52:10, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=10.00s]
Epoch 2: 67%|██████▋ | 8290/12384 [17:35:47<8:47:44, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=10.00s]
Epoch 2: 67%|██████▋ | 8290/12384 [17:35:54<8:47:44, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 67%|██████▋ | 8291/12384 [17:35:54<8:46:39, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 67%|██████▋ | 8291/12384 [17:36:02<8:46:39, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 2: 67%|██████▋ | 8292/12384 [17:36:02<8:44:22, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 2: 67%|██████▋ | 8292/12384 [17:36:09<8:44:22, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.23s]
Epoch 2: 67%|██████▋ | 8293/12384 [17:36:09<8:42:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.23s]
Epoch 2: 67%|██████▋ | 8293/12384 [17:36:17<8:42:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 67%|██████▋ | 8294/12384 [17:36:17<8:41:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 67%|██████▋ | 8294/12384 [17:36:25<8:41:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 67%|██████▋ | 8295/12384 [17:36:25<8:41:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 67%|██████▋ | 8295/12384 [17:36:32<8:41:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 67%|██████▋ | 8296/12384 [17:36:32<8:40:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 67%|██████▋ | 8296/12384 [17:36:40<8:40:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.88s]
Epoch 2: 67%|██████▋ | 8297/12384 [17:36:40<8:39:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.88s]
Epoch 2: 67%|██████▋ | 8297/12384 [17:36:48<8:39:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 2: 67%|██████▋ | 8298/12384 [17:36:48<8:39:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 2: 67%|██████▋ | 8298/12384 [17:36:55<8:39:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.76s]
Epoch 2: 67%|██████▋ | 8299/12384 [17:36:55<8:41:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.76s]
Epoch 2: 67%|██████▋ | 8299/12384 [17:37:03<8:41:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 2: 67%|██████▋ | 8300/12384 [17:37:03<8:43:15, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 2: 67%|██████▋ | 8300/12384 [17:37:11<8:43:15, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 2: 67%|██████▋ | 8301/12384 [17:37:11<8:41:13, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 2: 67%|██████▋ | 8301/12384 [17:37:18<8:41:13, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 2: 67%|██████▋ | 8302/12384 [17:37:18<8:40:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 2: 67%|██████▋ | 8302/12384 [17:37:26<8:40:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 67%|██████▋ | 8303/12384 [17:37:26<8:39:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 67%|██████▋ | 8303/12384 [17:37:34<8:39:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 2: 67%|██████▋ | 8304/12384 [17:37:34<8:44:37, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 2: 67%|██████▋ | 8304/12384 [17:37:41<8:44:37, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 67%|██████▋ | 8305/12384 [17:37:41<8:42:05, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 67%|██████▋ | 8305/12384 [17:37:49<8:42:05, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 67%|██████▋ | 8306/12384 [17:37:49<8:40:56, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 67%|██████▋ | 8306/12384 [17:37:57<8:40:56, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.63s]
Epoch 2: 67%|██████▋ | 8307/12384 [17:37:57<8:39:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.63s]
Epoch 2: 67%|██████▋ | 8307/12384 [17:38:04<8:39:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 2: 67%|██████▋ | 8308/12384 [17:38:04<8:38:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 2: 67%|██████▋ | 8308/12384 [17:38:12<8:38:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 67%|██████▋ | 8309/12384 [17:38:12<8:44:02, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 67%|██████▋ | 8309/12384 [17:38:20<8:44:02, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 2: 67%|██████▋ | 8310/12384 [17:38:20<8:42:03, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 2: 67%|██████▋ | 8310/12384 [17:38:27<8:42:03, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.88s]
Epoch 2: 67%|██████▋ | 8311/12384 [17:38:27<8:40:36, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.88s]
Epoch 2: 67%|██████▋ | 8311/12384 [17:38:35<8:40:36, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 2: 67%|██████▋ | 8312/12384 [17:38:35<8:39:34, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 2: 67%|██████▋ | 8312/12384 [17:38:43<8:39:34, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 67%|██████▋ | 8313/12384 [17:38:43<8:39:41, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 67%|██████▋ | 8313/12384 [17:38:50<8:39:41, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 67%|██████▋ | 8314/12384 [17:38:50<8:39:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 67%|██████▋ | 8314/12384 [17:38:58<8:39:19, 7.66s/it, loss=0.0002, acc=0.9998, iter_time=5.66s]
Epoch 2: 67%|██████▋ | 8315/12384 [17:38:58<8:38:24, 7.64s/it, loss=0.0002, acc=0.9998, iter_time=5.66s]
Epoch 2: 67%|██████▋ | 8315/12384 [17:39:05<8:38:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.61s]
Epoch 2: 67%|██████▋ | 8316/12384 [17:39:05<8:37:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.61s]
Epoch 2: 67%|██████▋ | 8316/12384 [17:39:13<8:37:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 67%|██████▋ | 8317/12384 [17:39:13<8:36:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 67%|██████▋ | 8317/12384 [17:39:21<8:36:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 2: 67%|██████▋ | 8318/12384 [17:39:21<8:36:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 2: 67%|██████▋ | 8318/12384 [17:39:28<8:36:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 2: 67%|██████▋ | 8319/12384 [17:39:28<8:36:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 2: 67%|██████▋ | 8319/12384 [17:39:36<8:36:07, 7.62s/it, loss=0.0005, acc=0.9968, iter_time=7.59s]
Epoch 2: 67%|██████▋ | 8320/12384 [17:39:36<8:36:23, 7.62s/it, loss=0.0005, acc=0.9968, iter_time=7.59s]
Epoch 2: 67%|██████▋ | 8320/12384 [17:39:44<8:36:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 2: 67%|██████▋ | 8321/12384 [17:39:44<8:35:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 2: 67%|██████▋ | 8321/12384 [17:39:51<8:35:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 2: 67%|██████▋ | 8322/12384 [17:39:51<8:37:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 2: 67%|██████▋ | 8322/12384 [17:39:59<8:37:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 67%|██████▋ | 8323/12384 [17:39:59<8:36:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 67%|██████▋ | 8323/12384 [17:40:07<8:36:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 67%|██████▋ | 8324/12384 [17:40:07<8:36:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 67%|██████▋ | 8324/12384 [17:40:14<8:36:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 2: 67%|██████▋ | 8325/12384 [17:40:14<8:35:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 2: 67%|██████▋ | 8325/12384 [17:40:22<8:35:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 2: 67%|██████▋ | 8326/12384 [17:40:22<8:35:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 2: 67%|██████▋ | 8326/12384 [17:40:29<8:35:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 67%|██████▋ | 8327/12384 [17:40:29<8:34:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 67%|██████▋ | 8327/12384 [17:40:37<8:34:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.46s]
Epoch 2: 67%|██████▋ | 8328/12384 [17:40:37<8:34:04, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.46s]
Epoch 2: 67%|██████▋ | 8328/12384 [17:40:45<8:34:04, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 67%|██████▋ | 8329/12384 [17:40:45<8:36:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 67%|██████▋ | 8329/12384 [17:40:53<8:36:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 67%|██████▋ | 8330/12384 [17:40:53<8:41:49, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 67%|██████▋ | 8330/12384 [17:41:00<8:41:49, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 67%|██████▋ | 8331/12384 [17:41:00<8:39:11, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 67%|██████▋ | 8331/12384 [17:41:08<8:39:11, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.57s]
Epoch 2: 67%|██████▋ | 8332/12384 [17:41:08<8:39:11, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.57s]
Epoch 2: 67%|██████▋ | 8332/12384 [17:41:15<8:39:11, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.18s]
Epoch 2: 67%|██████▋ | 8333/12384 [17:41:15<8:37:33, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.18s]
Epoch 2: 67%|██████▋ | 8333/12384 [17:41:23<8:37:33, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.63s]
Epoch 2: 67%|██████▋ | 8334/12384 [17:41:23<8:37:06, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.63s]
Epoch 2: 67%|██████▋ | 8334/12384 [17:41:31<8:37:06, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 67%|██████▋ | 8335/12384 [17:41:31<8:43:10, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 67%|██████▋ | 8335/12384 [17:41:39<8:43:10, 7.75s/it, loss=0.0004, acc=0.9963, iter_time=7.90s]
Epoch 2: 67%|██████▋ | 8336/12384 [17:41:39<8:40:38, 7.72s/it, loss=0.0004, acc=0.9963, iter_time=7.90s]
Epoch 2: 67%|██████▋ | 8336/12384 [17:41:46<8:40:38, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=4.63s]
Epoch 2: 67%|██████▋ | 8337/12384 [17:41:46<8:38:06, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.63s]
Epoch 2: 67%|██████▋ | 8337/12384 [17:41:54<8:38:06, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 2: 67%|██████▋ | 8338/12384 [17:41:54<8:38:15, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 2: 67%|██████▋ | 8338/12384 [17:42:02<8:38:15, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 67%|██████▋ | 8339/12384 [17:42:02<8:36:52, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 67%|██████▋ | 8339/12384 [17:42:09<8:36:52, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 67%|██████▋ | 8340/12384 [17:42:09<8:35:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 67%|██████▋ | 8340/12384 [17:42:17<8:35:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 67%|██████▋ | 8341/12384 [17:42:17<8:34:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 67%|██████▋ | 8341/12384 [17:42:25<8:34:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 67%|██████▋ | 8342/12384 [17:42:25<8:35:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 67%|██████▋ | 8342/12384 [17:42:33<8:35:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 2: 67%|██████▋ | 8343/12384 [17:42:33<8:44:18, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 2: 67%|██████▋ | 8343/12384 [17:42:41<8:44:18, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 2: 67%|██████▋ | 8344/12384 [17:42:41<8:58:22, 8.00s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 2: 67%|██████▋ | 8344/12384 [17:42:49<8:58:22, 8.00s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 67%|██████▋ | 8345/12384 [17:42:49<8:50:05, 7.87s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 67%|██████▋ | 8345/12384 [17:42:56<8:50:05, 7.87s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 67%|██████▋ | 8346/12384 [17:42:56<8:45:12, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 67%|██████▋ | 8346/12384 [17:43:04<8:45:12, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 67%|██████▋ | 8347/12384 [17:43:04<8:41:07, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 67%|██████▋ | 8347/12384 [17:43:12<8:41:07, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 67%|██████▋ | 8348/12384 [17:43:12<8:37:54, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 67%|██████▋ | 8348/12384 [17:43:19<8:37:54, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 67%|██████▋ | 8349/12384 [17:43:19<8:35:58, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 67%|██████▋ | 8349/12384 [17:43:27<8:35:58, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.45s]
Epoch 2: 67%|██████▋ | 8350/12384 [17:43:27<8:36:12, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.45s]
Epoch 2: 67%|██████▋ | 8350/12384 [17:43:34<8:36:12, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 2: 67%|██████▋ | 8351/12384 [17:43:34<8:34:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 2: 67%|██████▋ | 8351/12384 [17:43:42<8:34:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 2: 67%|██████▋ | 8352/12384 [17:43:42<8:33:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 2: 67%|██████▋ | 8352/12384 [17:43:50<8:33:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.21s]
Epoch 2: 67%|██████▋ | 8353/12384 [17:43:50<8:32:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.21s]
Epoch 2: 67%|██████▋ | 8353/12384 [17:43:57<8:32:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.86s]
Epoch 2: 67%|██████▋ | 8354/12384 [17:43:57<8:32:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.86s]
Epoch 2: 67%|██████▋ | 8354/12384 [17:44:05<8:32:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 2: 67%|██████▋ | 8355/12384 [17:44:05<8:31:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 2: 67%|██████▋ | 8355/12384 [17:44:13<8:31:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 67%|██████▋ | 8356/12384 [17:44:13<8:37:07, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 67%|██████▋ | 8356/12384 [17:44:20<8:37:07, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 2: 67%|██████▋ | 8357/12384 [17:44:20<8:35:21, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 2: 67%|██████▋ | 8357/12384 [17:44:28<8:35:21, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 2: 67%|██████▋ | 8358/12384 [17:44:28<8:34:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.20s]
Epoch 2: 67%|██████▋ | 8358/12384 [17:44:36<8:34:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 2: 67%|██████▋ | 8359/12384 [17:44:36<8:32:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 2: 67%|██████▋ | 8359/12384 [17:44:43<8:32:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 68%|██████▊ | 8360/12384 [17:44:43<8:31:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 68%|██████▊ | 8360/12384 [17:44:51<8:31:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 68%|██████▊ | 8361/12384 [17:44:51<8:37:41, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 68%|██████▊ | 8361/12384 [17:44:59<8:37:41, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 68%|██████▊ | 8362/12384 [17:44:59<8:35:19, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 68%|██████▊ | 8362/12384 [17:45:06<8:35:19, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 2: 68%|██████▊ | 8363/12384 [17:45:06<8:34:05, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 2: 68%|██████▊ | 8363/12384 [17:45:14<8:34:05, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 68%|██████▊ | 8364/12384 [17:45:14<8:33:53, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 68%|██████▊ | 8364/12384 [17:45:22<8:33:53, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.77s]
Epoch 2: 68%|██████▊ | 8365/12384 [17:45:22<8:32:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.77s]
Epoch 2: 68%|██████▊ | 8365/12384 [17:45:29<8:32:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.31s]
Epoch 2: 68%|██████▊ | 8366/12384 [17:45:29<8:31:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.31s]
Epoch 2: 68%|██████▊ | 8366/12384 [17:45:37<8:31:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 2: 68%|██████▊ | 8367/12384 [17:45:37<8:31:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 2: 68%|██████▊ | 8367/12384 [17:45:45<8:31:00, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=8.98s]
Epoch 2: 68%|██████▊ | 8368/12384 [17:45:45<8:31:06, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=8.98s]
Epoch 2: 68%|██████▊ | 8368/12384 [17:45:52<8:31:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 68%|██████▊ | 8369/12384 [17:45:52<8:30:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 68%|██████▊ | 8369/12384 [17:46:00<8:30:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 68%|██████▊ | 8370/12384 [17:46:00<8:30:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 68%|██████▊ | 8370/12384 [17:46:07<8:30:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 2: 68%|██████▊ | 8371/12384 [17:46:07<8:30:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 2: 68%|██████▊ | 8371/12384 [17:46:15<8:30:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.78s]
Epoch 2: 68%|██████▊ | 8372/12384 [17:46:15<8:30:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.78s]
Epoch 2: 68%|██████▊ | 8372/12384 [17:46:23<8:30:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 2: 68%|██████▊ | 8373/12384 [17:46:23<8:29:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 2: 68%|██████▊ | 8373/12384 [17:46:30<8:29:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 2: 68%|██████▊ | 8374/12384 [17:46:30<8:29:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 2: 68%|██████▊ | 8374/12384 [17:46:38<8:29:00, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 2: 68%|██████▊ | 8375/12384 [17:46:38<8:28:51, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 2: 68%|██████▊ | 8375/12384 [17:46:45<8:28:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 68%|██████▊ | 8376/12384 [17:46:45<8:29:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 68%|██████▊ | 8376/12384 [17:46:53<8:29:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 68%|██████▊ | 8377/12384 [17:46:53<8:28:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 68%|██████▊ | 8377/12384 [17:47:01<8:28:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 68%|██████▊ | 8378/12384 [17:47:01<8:28:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 68%|██████▊ | 8378/12384 [17:47:08<8:28:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 68%|██████▊ | 8379/12384 [17:47:08<8:29:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 68%|██████▊ | 8379/12384 [17:47:16<8:29:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 68%|██████▊ | 8380/12384 [17:47:16<8:29:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 68%|██████▊ | 8380/12384 [17:47:24<8:29:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 68%|██████▊ | 8381/12384 [17:47:24<8:29:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 68%|██████▊ | 8381/12384 [17:47:32<8:29:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 2: 68%|██████▊ | 8382/12384 [17:47:32<8:34:22, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 2: 68%|██████▊ | 8382/12384 [17:47:39<8:34:22, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 68%|██████▊ | 8383/12384 [17:47:39<8:32:10, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 68%|██████▊ | 8383/12384 [17:47:47<8:32:10, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 68%|██████▊ | 8384/12384 [17:47:47<8:31:35, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 68%|██████▊ | 8384/12384 [17:47:54<8:31:35, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 68%|██████▊ | 8385/12384 [17:47:54<8:30:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 68%|██████▊ | 8385/12384 [17:48:02<8:30:14, 7.66s/it, loss=0.0008, acc=0.9977, iter_time=5.36s]
Epoch 2: 68%|██████▊ | 8386/12384 [17:48:02<8:29:19, 7.64s/it, loss=0.0008, acc=0.9977, iter_time=5.36s]
Epoch 2: 68%|██████▊ | 8386/12384 [17:48:10<8:29:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 2: 68%|██████▊ | 8387/12384 [17:48:10<8:34:41, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 2: 68%|██████▊ | 8387/12384 [17:48:18<8:34:41, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 68%|██████▊ | 8388/12384 [17:48:18<8:32:59, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 68%|██████▊ | 8388/12384 [17:48:25<8:32:59, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 68%|██████▊ | 8389/12384 [17:48:25<8:31:13, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 68%|██████▊ | 8389/12384 [17:48:33<8:31:13, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 68%|██████▊ | 8390/12384 [17:48:33<8:29:44, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 68%|██████▊ | 8390/12384 [17:48:40<8:29:44, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 2: 68%|██████▊ | 8391/12384 [17:48:40<8:28:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 2: 68%|██████▊ | 8391/12384 [17:48:48<8:28:15, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.50s]
Epoch 2: 68%|██████▊ | 8392/12384 [17:48:48<8:27:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.50s]
Epoch 2: 68%|██████▊ | 8392/12384 [17:48:56<8:27:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 68%|██████▊ | 8393/12384 [17:48:56<8:26:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 68%|██████▊ | 8393/12384 [17:49:03<8:26:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.83s]
Epoch 2: 68%|██████▊ | 8394/12384 [17:49:03<8:29:27, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.83s]
Epoch 2: 68%|██████▊ | 8394/12384 [17:49:11<8:29:27, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.83s]
Epoch 2: 68%|██████▊ | 8395/12384 [17:49:11<8:30:08, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.83s]
Epoch 2: 68%|██████▊ | 8395/12384 [17:49:19<8:30:08, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 2: 68%|██████▊ | 8396/12384 [17:49:19<8:28:51, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 2: 68%|██████▊ | 8396/12384 [17:49:26<8:28:51, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.11s]
Epoch 2: 68%|██████▊ | 8397/12384 [17:49:26<8:27:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.11s]
Epoch 2: 68%|██████▊ | 8397/12384 [17:49:34<8:27:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.09s]
Epoch 2: 68%|██████▊ | 8398/12384 [17:49:34<8:26:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.09s]
Epoch 2: 68%|██████▊ | 8398/12384 [17:49:42<8:26:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 68%|██████▊ | 8399/12384 [17:49:42<8:28:32, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 68%|██████▊ | 8399/12384 [17:49:49<8:28:32, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 2: 68%|██████▊ | 8400/12384 [17:49:49<8:27:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 2: 68%|██████▊ | 8400/12384 [17:49:57<8:27:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.19s]
Epoch 2: 68%|██████▊ | 8401/12384 [17:49:57<8:27:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.19s]
Epoch 2: 68%|██████▊ | 8401/12384 [17:50:04<8:27:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 2: 68%|██████▊ | 8402/12384 [17:50:04<8:26:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 2: 68%|██████▊ | 8402/12384 [17:50:12<8:26:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.43s]
Epoch 2: 68%|██████▊ | 8403/12384 [17:50:12<8:26:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.43s]
Epoch 2: 68%|██████▊ | 8403/12384 [17:50:20<8:26:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.86s]
Epoch 2: 68%|██████▊ | 8404/12384 [17:50:20<8:26:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.86s]
Epoch 2: 68%|██████▊ | 8404/12384 [17:50:27<8:26:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 68%|██████▊ | 8405/12384 [17:50:27<8:25:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 68%|██████▊ | 8405/12384 [17:50:35<8:25:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.93s]
Epoch 2: 68%|██████▊ | 8406/12384 [17:50:35<8:25:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.93s]
Epoch 2: 68%|██████▊ | 8406/12384 [17:50:43<8:25:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.58s]
Epoch 2: 68%|██████▊ | 8407/12384 [17:50:43<8:24:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.58s]
Epoch 2: 68%|██████▊ | 8407/12384 [17:50:50<8:24:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 68%|██████▊ | 8408/12384 [17:50:50<8:24:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 68%|██████▊ | 8408/12384 [17:50:58<8:24:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 2: 68%|██████▊ | 8409/12384 [17:50:58<8:29:38, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 2: 68%|██████▊ | 8409/12384 [17:51:06<8:29:38, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 68%|██████▊ | 8410/12384 [17:51:06<8:29:57, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 68%|██████▊ | 8410/12384 [17:51:13<8:29:57, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.44s]
Epoch 2: 68%|██████▊ | 8411/12384 [17:51:13<8:27:41, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.44s]
Epoch 2: 68%|██████▊ | 8411/12384 [17:51:21<8:27:41, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 2: 68%|██████▊ | 8412/12384 [17:51:21<8:26:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 2: 68%|██████▊ | 8412/12384 [17:51:29<8:26:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.88s]
Epoch 2: 68%|██████▊ | 8413/12384 [17:51:29<8:32:40, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=4.88s]
Epoch 2: 68%|██████▊ | 8413/12384 [17:51:37<8:32:40, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=8.59s]
Epoch 2: 68%|██████▊ | 8414/12384 [17:51:37<8:30:12, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.59s]
Epoch 2: 68%|██████▊ | 8414/12384 [17:51:44<8:30:12, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 2: 68%|██████▊ | 8415/12384 [17:51:44<8:29:37, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 2: 68%|██████▊ | 8415/12384 [17:51:52<8:29:37, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=11.67s]
Epoch 2: 68%|██████▊ | 8416/12384 [17:51:52<8:27:56, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=11.67s]
Epoch 2: 68%|██████▊ | 8416/12384 [17:52:00<8:27:56, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 68%|██████▊ | 8417/12384 [17:52:00<8:26:45, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 68%|██████▊ | 8417/12384 [17:52:07<8:26:45, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 68%|██████▊ | 8418/12384 [17:52:07<8:25:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 68%|██████▊ | 8418/12384 [17:52:15<8:25:59, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 2: 68%|██████▊ | 8419/12384 [17:52:15<8:25:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 2: 68%|██████▊ | 8419/12384 [17:52:22<8:25:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 2: 68%|██████▊ | 8420/12384 [17:52:22<8:24:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 2: 68%|██████▊ | 8420/12384 [17:52:30<8:24:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 68%|██████▊ | 8421/12384 [17:52:30<8:23:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 68%|██████▊ | 8421/12384 [17:52:38<8:23:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 68%|██████▊ | 8422/12384 [17:52:38<8:24:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 68%|██████▊ | 8422/12384 [17:52:45<8:24:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 68%|██████▊ | 8423/12384 [17:52:45<8:25:43, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 68%|██████▊ | 8423/12384 [17:52:53<8:25:43, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 68%|██████▊ | 8424/12384 [17:52:53<8:25:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 68%|██████▊ | 8424/12384 [17:53:01<8:25:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 2: 68%|██████▊ | 8425/12384 [17:53:01<8:25:59, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 2: 68%|██████▊ | 8425/12384 [17:53:08<8:25:59, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.07s]
Epoch 2: 68%|██████▊ | 8426/12384 [17:53:08<8:25:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.07s]
Epoch 2: 68%|██████▊ | 8426/12384 [17:53:16<8:25:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 68%|██████▊ | 8427/12384 [17:53:16<8:25:46, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 68%|██████▊ | 8427/12384 [17:53:24<8:25:46, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.88s]
Epoch 2: 68%|██████▊ | 8428/12384 [17:53:24<8:24:43, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.88s]
Epoch 2: 68%|██████▊ | 8428/12384 [17:53:31<8:24:43, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.52s]
Epoch 2: 68%|██████▊ | 8429/12384 [17:53:31<8:25:07, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.52s]
Epoch 2: 68%|██████▊ | 8429/12384 [17:53:39<8:25:07, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 2: 68%|██████▊ | 8430/12384 [17:53:39<8:24:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.02s]
Epoch 2: 68%|██████▊ | 8430/12384 [17:53:47<8:24:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.23s]
Epoch 2: 68%|██████▊ | 8431/12384 [17:53:47<8:23:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.23s]
Epoch 2: 68%|██████▊ | 8431/12384 [17:53:54<8:23:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 68%|██████▊ | 8432/12384 [17:53:54<8:22:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 68%|██████▊ | 8432/12384 [17:54:02<8:22:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 68%|██████▊ | 8433/12384 [17:54:02<8:22:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 68%|██████▊ | 8433/12384 [17:54:09<8:22:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 2: 68%|██████▊ | 8434/12384 [17:54:09<8:22:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.48s]
Epoch 2: 68%|██████▊ | 8434/12384 [17:54:17<8:22:12, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.07s]
Epoch 2: 68%|██████▊ | 8435/12384 [17:54:17<8:27:02, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=9.07s]
Epoch 2: 68%|██████▊ | 8435/12384 [17:54:25<8:27:02, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 68%|██████▊ | 8436/12384 [17:54:25<8:25:35, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 68%|██████▊ | 8436/12384 [17:54:33<8:25:35, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 2: 68%|██████▊ | 8437/12384 [17:54:33<8:23:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 2: 68%|██████▊ | 8437/12384 [17:54:40<8:23:35, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=8.78s]
Epoch 2: 68%|██████▊ | 8438/12384 [17:54:40<8:23:01, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.78s]
Epoch 2: 68%|██████▊ | 8438/12384 [17:54:48<8:23:01, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 2: 68%|██████▊ | 8439/12384 [17:54:48<8:23:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 2: 68%|██████▊ | 8439/12384 [17:54:56<8:23:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 2: 68%|██████▊ | 8440/12384 [17:54:56<8:27:58, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 2: 68%|██████▊ | 8440/12384 [17:55:03<8:27:58, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.54s]
Epoch 2: 68%|██████▊ | 8441/12384 [17:55:03<8:25:36, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.54s]
Epoch 2: 68%|██████▊ | 8441/12384 [17:55:11<8:25:36, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 2: 68%|██████▊ | 8442/12384 [17:55:11<8:26:05, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 2: 68%|██████▊ | 8442/12384 [17:55:19<8:26:05, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 68%|██████▊ | 8443/12384 [17:55:19<8:24:11, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 68%|██████▊ | 8443/12384 [17:55:26<8:24:11, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 2: 68%|██████▊ | 8444/12384 [17:55:26<8:22:44, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 2: 68%|██████▊ | 8444/12384 [17:55:34<8:22:44, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 2: 68%|██████▊ | 8445/12384 [17:55:34<8:23:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.45s]
Epoch 2: 68%|██████▊ | 8445/12384 [17:55:42<8:23:11, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=6.78s]
Epoch 2: 68%|██████▊ | 8446/12384 [17:55:42<8:23:27, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=6.78s]
Epoch 2: 68%|██████▊ | 8446/12384 [17:55:50<8:23:27, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.63s]
Epoch 2: 68%|██████▊ | 8447/12384 [17:55:50<8:36:58, 7.88s/it, loss=0.0000, acc=1.0000, iter_time=6.63s]
Epoch 2: 68%|██████▊ | 8447/12384 [17:55:58<8:36:58, 7.88s/it, loss=0.0000, acc=1.0000, iter_time=11.03s]
Epoch 2: 68%|██████▊ | 8448/12384 [17:55:58<8:45:51, 8.02s/it, loss=0.0000, acc=1.0000, iter_time=11.03s]
Epoch 2: 68%|██████▊ | 8448/12384 [17:56:07<8:45:51, 8.02s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 2: 68%|██████▊ | 8449/12384 [17:56:07<8:51:18, 8.10s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 2: 68%|██████▊ | 8449/12384 [17:56:15<8:51:18, 8.10s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 2: 68%|██████▊ | 8450/12384 [17:56:15<8:51:34, 8.11s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 2: 68%|██████▊ | 8450/12384 [17:56:23<8:51:34, 8.11s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 2: 68%|██████▊ | 8451/12384 [17:56:23<8:50:51, 8.10s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 2: 68%|██████▊ | 8451/12384 [17:56:31<8:50:51, 8.10s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 68%|██████▊ | 8452/12384 [17:56:31<8:47:02, 8.04s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 68%|██████▊ | 8452/12384 [17:56:39<8:47:02, 8.04s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 2: 68%|██████▊ | 8453/12384 [17:56:39<8:43:53, 8.00s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 2: 68%|██████▊ | 8453/12384 [17:56:47<8:43:53, 8.00s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 2: 68%|██████▊ | 8454/12384 [17:56:47<8:40:32, 7.95s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 2: 68%|██████▊ | 8454/12384 [17:56:54<8:40:32, 7.95s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 2: 68%|██████▊ | 8455/12384 [17:56:54<8:39:16, 7.93s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 2: 68%|██████▊ | 8455/12384 [17:57:03<8:39:16, 7.93s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 2: 68%|██████▊ | 8456/12384 [17:57:03<8:42:25, 7.98s/it, loss=0.0000, acc=1.0000, iter_time=8.50s]
Epoch 2: 68%|██████▊ | 8456/12384 [17:57:11<8:42:25, 7.98s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 68%|██████▊ | 8457/12384 [17:57:11<8:42:55, 7.99s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 68%|██████▊ | 8457/12384 [17:57:19<8:42:55, 7.99s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 68%|██████▊ | 8458/12384 [17:57:19<8:42:50, 7.99s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 68%|██████▊ | 8458/12384 [17:57:26<8:42:50, 7.99s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 2: 68%|██████▊ | 8459/12384 [17:57:26<8:39:34, 7.94s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 2: 68%|██████▊ | 8459/12384 [17:57:34<8:39:34, 7.94s/it, loss=0.0005, acc=0.9987, iter_time=7.86s]
Epoch 2: 68%|██████▊ | 8460/12384 [17:57:34<8:37:52, 7.92s/it, loss=0.0005, acc=0.9987, iter_time=7.86s]
Epoch 2: 68%|██████▊ | 8460/12384 [17:57:42<8:37:52, 7.92s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 2: 68%|██████▊ | 8461/12384 [17:57:42<8:43:02, 8.00s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 2: 68%|██████▊ | 8461/12384 [17:57:50<8:43:02, 8.00s/it, loss=0.0000, acc=1.0000, iter_time=7.14s]
Epoch 2: 68%|██████▊ | 8462/12384 [17:57:50<8:39:58, 7.95s/it, loss=0.0000, acc=1.0000, iter_time=7.14s]
Epoch 2: 68%|██████▊ | 8462/12384 [17:57:58<8:39:58, 7.95s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 2: 68%|██████▊ | 8463/12384 [17:57:58<8:37:41, 7.92s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 2: 68%|██████▊ | 8463/12384 [17:58:06<8:37:41, 7.92s/it, loss=0.0000, acc=1.0000, iter_time=8.33s]
Epoch 2: 68%|██████▊ | 8464/12384 [17:58:06<8:32:48, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=8.33s]
Epoch 2: 68%|██████▊ | 8464/12384 [17:58:13<8:32:48, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 2: 68%|██████▊ | 8465/12384 [17:58:13<8:30:26, 7.81s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 2: 68%|██████▊ | 8465/12384 [17:58:22<8:30:26, 7.81s/it, loss=0.0000, acc=1.0000, iter_time=7.76s]
Epoch 2: 68%|██████▊ | 8466/12384 [17:58:22<8:36:28, 7.91s/it, loss=0.0000, acc=1.0000, iter_time=7.76s]
Epoch 2: 68%|██████▊ | 8466/12384 [17:58:29<8:36:28, 7.91s/it, loss=0.0000, acc=1.0000, iter_time=6.36s]
Epoch 2: 68%|██████▊ | 8467/12384 [17:58:29<8:31:53, 7.84s/it, loss=0.0000, acc=1.0000, iter_time=6.36s]
Epoch 2: 68%|██████▊ | 8467/12384 [17:58:37<8:31:53, 7.84s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 2: 68%|██████▊ | 8468/12384 [17:58:37<8:28:28, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 2: 68%|██████▊ | 8468/12384 [17:58:45<8:28:28, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 2: 68%|██████▊ | 8469/12384 [17:58:45<8:26:06, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 2: 68%|██████▊ | 8469/12384 [17:58:52<8:26:06, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 2: 68%|██████▊ | 8470/12384 [17:58:52<8:25:20, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 2: 68%|██████▊ | 8470/12384 [17:59:00<8:25:20, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=9.79s]
Epoch 2: 68%|██████▊ | 8471/12384 [17:59:00<8:24:17, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=9.79s]
Epoch 2: 68%|██████▊ | 8471/12384 [17:59:08<8:24:17, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 2: 68%|██████▊ | 8472/12384 [17:59:08<8:23:31, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 2: 68%|██████▊ | 8472/12384 [17:59:15<8:23:31, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 68%|██████▊ | 8473/12384 [17:59:15<8:22:57, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 68%|██████▊ | 8473/12384 [17:59:23<8:22:57, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.00s]
Epoch 2: 68%|██████▊ | 8474/12384 [17:59:23<8:22:30, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.00s]
Epoch 2: 68%|██████▊ | 8474/12384 [17:59:31<8:22:30, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 2: 68%|██████▊ | 8475/12384 [17:59:31<8:22:50, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 2: 68%|██████▊ | 8475/12384 [17:59:39<8:22:50, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=4.66s]
Epoch 2: 68%|██████▊ | 8476/12384 [17:59:39<8:22:09, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.66s]
Epoch 2: 68%|██████▊ | 8476/12384 [17:59:46<8:22:09, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.00s]
Epoch 2: 68%|██████▊ | 8477/12384 [17:59:46<8:21:27, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.00s]
Epoch 2: 68%|██████▊ | 8477/12384 [17:59:54<8:21:27, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 2: 68%|██████▊ | 8478/12384 [17:59:54<8:23:27, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 2: 68%|██████▊ | 8478/12384 [18:00:02<8:23:27, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.98s]
Epoch 2: 68%|██████▊ | 8479/12384 [18:00:02<8:22:29, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.98s]
Epoch 2: 68%|██████▊ | 8479/12384 [18:00:09<8:22:29, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 68%|██████▊ | 8480/12384 [18:00:09<8:21:11, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 68%|██████▊ | 8480/12384 [18:00:17<8:21:11, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 68%|██████▊ | 8481/12384 [18:00:17<8:20:31, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 68%|██████▊ | 8481/12384 [18:00:25<8:20:31, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 2: 68%|██████▊ | 8482/12384 [18:00:25<8:20:46, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 2: 68%|██████▊ | 8482/12384 [18:00:33<8:20:46, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 68%|██████▊ | 8483/12384 [18:00:33<8:20:49, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 68%|██████▊ | 8483/12384 [18:00:40<8:20:49, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.23s]
Epoch 2: 69%|██████▊ | 8484/12384 [18:00:40<8:20:04, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.23s]
Epoch 2: 69%|██████▊ | 8484/12384 [18:00:48<8:20:04, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 2: 69%|██████▊ | 8485/12384 [18:00:48<8:20:05, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 2: 69%|██████▊ | 8485/12384 [18:00:56<8:20:05, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 69%|██████▊ | 8486/12384 [18:00:56<8:20:03, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 69%|██████▊ | 8486/12384 [18:01:04<8:20:03, 7.70s/it, loss=0.0002, acc=0.9991, iter_time=8.08s]
Epoch 2: 69%|██████▊ | 8487/12384 [18:01:04<8:26:37, 7.80s/it, loss=0.0002, acc=0.9991, iter_time=8.08s]
Epoch 2: 69%|██████▊ | 8487/12384 [18:01:11<8:26:37, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 2: 69%|██████▊ | 8488/12384 [18:01:11<8:26:02, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 2: 69%|██████▊ | 8488/12384 [18:01:19<8:26:02, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=6.06s]
Epoch 2: 69%|██████▊ | 8489/12384 [18:01:19<8:24:07, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=6.06s]
Epoch 2: 69%|██████▊ | 8489/12384 [18:01:27<8:24:07, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 2: 69%|██████▊ | 8490/12384 [18:01:27<8:22:51, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 2: 69%|██████▊ | 8490/12384 [18:01:35<8:22:51, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=8.36s]
Epoch 2: 69%|██████▊ | 8491/12384 [18:01:35<8:21:51, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.36s]
Epoch 2: 69%|██████▊ | 8491/12384 [18:01:42<8:21:51, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 69%|██████▊ | 8492/12384 [18:01:42<8:20:28, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 69%|██████▊ | 8492/12384 [18:01:50<8:20:28, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 69%|██████▊ | 8493/12384 [18:01:50<8:24:50, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 69%|██████▊ | 8493/12384 [18:01:58<8:24:50, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 69%|██████▊ | 8494/12384 [18:01:58<8:21:17, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 69%|██████▊ | 8494/12384 [18:02:05<8:21:17, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 2: 69%|██████▊ | 8495/12384 [18:02:05<8:19:10, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.70s]
Epoch 2: 69%|██████▊ | 8495/12384 [18:02:13<8:19:10, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 2: 69%|██████▊ | 8496/12384 [18:02:13<8:17:35, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 2: 69%|██████▊ | 8496/12384 [18:02:21<8:17:35, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 69%|██████▊ | 8497/12384 [18:02:21<8:16:15, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 69%|██████▊ | 8497/12384 [18:02:28<8:16:15, 7.66s/it, loss=0.0004, acc=0.9990, iter_time=4.00s]
Epoch 2: 69%|██████▊ | 8498/12384 [18:02:28<8:15:08, 7.64s/it, loss=0.0004, acc=0.9990, iter_time=4.00s]
Epoch 2: 69%|██████▊ | 8498/12384 [18:02:36<8:15:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.20s]
Epoch 2: 69%|██████▊ | 8499/12384 [18:02:36<8:14:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.20s]
Epoch 2: 69%|██████▊ | 8499/12384 [18:02:44<8:14:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 2: 69%|██████▊ | 8500/12384 [18:02:44<8:14:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.04s]
Epoch 2: 69%|██████▊ | 8500/12384 [18:02:51<8:14:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 2: 69%|██████▊ | 8501/12384 [18:02:51<8:13:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 2: 69%|██████▊ | 8501/12384 [18:02:59<8:13:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 2: 69%|██████▊ | 8502/12384 [18:02:59<8:12:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 2: 69%|██████▊ | 8502/12384 [18:03:06<8:12:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 2: 69%|██████▊ | 8503/12384 [18:03:06<8:12:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 2: 69%|██████▊ | 8503/12384 [18:03:14<8:12:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 69%|██████▊ | 8504/12384 [18:03:14<8:12:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 69%|██████▊ | 8504/12384 [18:03:22<8:12:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 69%|██████▊ | 8505/12384 [18:03:22<8:12:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 69%|██████▊ | 8505/12384 [18:03:29<8:12:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 69%|██████▊ | 8506/12384 [18:03:29<8:12:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 69%|██████▊ | 8506/12384 [18:03:37<8:12:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 69%|██████▊ | 8507/12384 [18:03:37<8:13:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 69%|██████▊ | 8507/12384 [18:03:45<8:13:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 2: 69%|██████▊ | 8508/12384 [18:03:45<8:14:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 2: 69%|██████▊ | 8508/12384 [18:03:52<8:14:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.05s]
Epoch 2: 69%|██████▊ | 8509/12384 [18:03:52<8:13:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.05s]
Epoch 2: 69%|██████▊ | 8509/12384 [18:04:00<8:13:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 69%|██████▊ | 8510/12384 [18:04:00<8:12:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 69%|██████▊ | 8510/12384 [18:04:07<8:12:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 69%|██████▊ | 8511/12384 [18:04:07<8:11:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 69%|██████▊ | 8511/12384 [18:04:15<8:11:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 69%|██████▊ | 8512/12384 [18:04:15<8:11:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 69%|██████▊ | 8512/12384 [18:04:23<8:11:47, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.50s]
Epoch 2: 69%|██████▊ | 8513/12384 [18:04:23<8:16:26, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.50s]
Epoch 2: 69%|██████▊ | 8513/12384 [18:04:30<8:16:26, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 69%|██████▉ | 8514/12384 [18:04:30<8:15:00, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 69%|██████▉ | 8514/12384 [18:04:38<8:15:00, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 2: 69%|██████▉ | 8515/12384 [18:04:38<8:13:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 2: 69%|██████▉ | 8515/12384 [18:04:46<8:13:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 2: 69%|██████▉ | 8516/12384 [18:04:46<8:12:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.34s]
Epoch 2: 69%|██████▉ | 8516/12384 [18:04:53<8:12:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 2: 69%|██████▉ | 8517/12384 [18:04:53<8:11:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 2: 69%|██████▉ | 8517/12384 [18:05:01<8:11:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 2: 69%|██████▉ | 8518/12384 [18:05:01<8:11:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 2: 69%|██████▉ | 8518/12384 [18:05:09<8:11:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.83s]
Epoch 2: 69%|██████▉ | 8519/12384 [18:05:09<8:17:39, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.83s]
Epoch 2: 69%|██████▉ | 8519/12384 [18:05:16<8:17:39, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.72s]
Epoch 2: 69%|██████▉ | 8520/12384 [18:05:16<8:15:24, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.72s]
Epoch 2: 69%|██████▉ | 8520/12384 [18:05:24<8:15:24, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 2: 69%|██████▉ | 8521/12384 [18:05:24<8:14:11, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 2: 69%|██████▉ | 8521/12384 [18:05:32<8:14:11, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.71s]
Epoch 2: 69%|██████▉ | 8522/12384 [18:05:32<8:13:18, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.71s]
Epoch 2: 69%|██████▉ | 8522/12384 [18:05:39<8:13:18, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.46s]
Epoch 2: 69%|██████▉ | 8523/12384 [18:05:39<8:12:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.46s]
Epoch 2: 69%|██████▉ | 8523/12384 [18:05:47<8:12:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 69%|██████▉ | 8524/12384 [18:05:47<8:11:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 69%|██████▉ | 8524/12384 [18:05:55<8:11:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.67s]
Epoch 2: 69%|██████▉ | 8525/12384 [18:05:55<8:10:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.67s]
Epoch 2: 69%|██████▉ | 8525/12384 [18:06:02<8:10:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 69%|██████▉ | 8526/12384 [18:06:02<8:10:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 69%|██████▉ | 8526/12384 [18:06:10<8:10:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.00s]
Epoch 2: 69%|██████▉ | 8527/12384 [18:06:10<8:11:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.00s]
Epoch 2: 69%|██████▉ | 8527/12384 [18:06:18<8:11:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 2: 69%|██████▉ | 8528/12384 [18:06:18<8:10:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 2: 69%|██████▉ | 8528/12384 [18:06:25<8:10:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 2: 69%|██████▉ | 8529/12384 [18:06:25<8:09:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 2: 69%|██████▉ | 8529/12384 [18:06:33<8:09:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 2: 69%|██████▉ | 8530/12384 [18:06:33<8:09:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 2: 69%|██████▉ | 8530/12384 [18:06:40<8:09:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 69%|██████▉ | 8531/12384 [18:06:40<8:09:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 69%|██████▉ | 8531/12384 [18:06:48<8:09:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 69%|██████▉ | 8532/12384 [18:06:48<8:09:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 69%|██████▉ | 8532/12384 [18:06:56<8:09:27, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.24s]
Epoch 2: 69%|██████▉ | 8533/12384 [18:06:56<8:09:31, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.24s]
Epoch 2: 69%|██████▉ | 8533/12384 [18:07:03<8:09:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 69%|██████▉ | 8534/12384 [18:07:03<8:09:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 69%|██████▉ | 8534/12384 [18:07:11<8:09:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 69%|██████▉ | 8535/12384 [18:07:11<8:08:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 69%|██████▉ | 8535/12384 [18:07:18<8:08:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 69%|██████▉ | 8536/12384 [18:07:18<8:08:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 69%|██████▉ | 8536/12384 [18:07:26<8:08:27, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 2: 69%|██████▉ | 8537/12384 [18:07:26<8:09:22, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 2: 69%|██████▉ | 8537/12384 [18:07:34<8:09:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 69%|██████▉ | 8538/12384 [18:07:34<8:08:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 69%|██████▉ | 8538/12384 [18:07:41<8:08:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.35s]
Epoch 2: 69%|██████▉ | 8539/12384 [18:07:41<8:08:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.35s]
Epoch 2: 69%|██████▉ | 8539/12384 [18:07:49<8:08:06, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=8.84s]
Epoch 2: 69%|██████▉ | 8540/12384 [18:07:49<8:07:36, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=8.84s]
Epoch 2: 69%|██████▉ | 8540/12384 [18:07:57<8:07:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 69%|██████▉ | 8541/12384 [18:07:57<8:07:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 69%|██████▉ | 8541/12384 [18:08:04<8:07:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.43s]
Epoch 2: 69%|██████▉ | 8542/12384 [18:08:04<8:07:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.43s]
Epoch 2: 69%|██████▉ | 8542/12384 [18:08:12<8:07:48, 7.62s/it, loss=0.0002, acc=0.9985, iter_time=11.79s]
Epoch 2: 69%|██████▉ | 8543/12384 [18:08:12<8:07:28, 7.61s/it, loss=0.0002, acc=0.9985, iter_time=11.79s]
Epoch 2: 69%|██████▉ | 8543/12384 [18:08:19<8:07:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 69%|██████▉ | 8544/12384 [18:08:19<8:07:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 69%|██████▉ | 8544/12384 [18:08:27<8:07:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 2: 69%|██████▉ | 8545/12384 [18:08:27<8:13:39, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 2: 69%|██████▉ | 8545/12384 [18:08:35<8:13:39, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 69%|██████▉ | 8546/12384 [18:08:35<8:11:26, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 69%|██████▉ | 8546/12384 [18:08:43<8:11:26, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 69%|██████▉ | 8547/12384 [18:08:43<8:11:19, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 69%|██████▉ | 8547/12384 [18:08:50<8:11:19, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 69%|██████▉ | 8548/12384 [18:08:50<8:09:44, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 69%|██████▉ | 8548/12384 [18:08:58<8:09:44, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 69%|██████▉ | 8549/12384 [18:08:58<8:08:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 69%|██████▉ | 8549/12384 [18:09:06<8:08:52, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 69%|██████▉ | 8550/12384 [18:09:06<8:08:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 69%|██████▉ | 8550/12384 [18:09:13<8:08:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 69%|██████▉ | 8551/12384 [18:09:13<8:07:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 69%|██████▉ | 8551/12384 [18:09:21<8:07:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 69%|██████▉ | 8552/12384 [18:09:21<8:07:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 69%|██████▉ | 8552/12384 [18:09:28<8:07:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.69s]
Epoch 2: 69%|██████▉ | 8553/12384 [18:09:28<8:05:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.69s]
Epoch 2: 69%|██████▉ | 8553/12384 [18:09:36<8:05:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 2: 69%|██████▉ | 8554/12384 [18:09:36<8:05:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 2: 69%|██████▉ | 8554/12384 [18:09:44<8:05:21, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.41s]
Epoch 2: 69%|██████▉ | 8555/12384 [18:09:44<8:05:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.41s]
Epoch 2: 69%|██████▉ | 8555/12384 [18:09:51<8:05:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.66s]
Epoch 2: 69%|██████▉ | 8556/12384 [18:09:51<8:05:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.66s]
Epoch 2: 69%|██████▉ | 8556/12384 [18:09:59<8:05:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 2: 69%|██████▉ | 8557/12384 [18:09:59<8:05:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 2: 69%|██████▉ | 8557/12384 [18:10:06<8:05:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 2: 69%|██████▉ | 8558/12384 [18:10:06<8:04:54, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 2: 69%|██████▉ | 8558/12384 [18:10:14<8:04:54, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.60s]
Epoch 2: 69%|██████▉ | 8559/12384 [18:10:14<8:04:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.60s]
Epoch 2: 69%|██████▉ | 8559/12384 [18:10:22<8:04:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 69%|██████▉ | 8560/12384 [18:10:22<8:05:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 69%|██████▉ | 8560/12384 [18:10:29<8:05:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.93s]
Epoch 2: 69%|██████▉ | 8561/12384 [18:10:29<8:05:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.93s]
Epoch 2: 69%|██████▉ | 8561/12384 [18:10:37<8:05:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 2: 69%|██████▉ | 8562/12384 [18:10:37<8:05:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 2: 69%|██████▉ | 8562/12384 [18:10:44<8:05:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 69%|██████▉ | 8563/12384 [18:10:44<8:05:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 69%|██████▉ | 8563/12384 [18:10:52<8:05:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 69%|██████▉ | 8564/12384 [18:10:52<8:05:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 69%|██████▉ | 8564/12384 [18:11:00<8:05:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 69%|██████▉ | 8565/12384 [18:11:00<8:05:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 69%|██████▉ | 8565/12384 [18:11:07<8:05:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 2: 69%|██████▉ | 8566/12384 [18:11:07<8:07:28, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.07s]
Epoch 2: 69%|██████▉ | 8566/12384 [18:11:15<8:07:28, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=11.31s]
Epoch 2: 69%|██████▉ | 8567/12384 [18:11:15<8:06:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.31s]
Epoch 2: 69%|██████▉ | 8567/12384 [18:11:23<8:06:40, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 69%|██████▉ | 8568/12384 [18:11:23<8:05:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 69%|██████▉ | 8568/12384 [18:11:30<8:05:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 69%|██████▉ | 8569/12384 [18:11:30<8:04:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 69%|██████▉ | 8569/12384 [18:11:38<8:04:58, 7.63s/it, loss=0.0001, acc=0.9986, iter_time=7.61s]
Epoch 2: 69%|██████▉ | 8570/12384 [18:11:38<8:06:01, 7.65s/it, loss=0.0001, acc=0.9986, iter_time=7.61s]
Epoch 2: 69%|██████▉ | 8570/12384 [18:11:46<8:06:01, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 69%|██████▉ | 8571/12384 [18:11:46<8:11:31, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 69%|██████▉ | 8571/12384 [18:11:54<8:11:31, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 69%|██████▉ | 8572/12384 [18:11:54<8:09:24, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 69%|██████▉ | 8572/12384 [18:12:01<8:09:24, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 2: 69%|██████▉ | 8573/12384 [18:12:01<8:07:10, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 2: 69%|██████▉ | 8573/12384 [18:12:09<8:07:10, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 2: 69%|██████▉ | 8574/12384 [18:12:09<8:05:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 2: 69%|██████▉ | 8574/12384 [18:12:16<8:05:54, 7.65s/it, loss=0.0006, acc=0.9986, iter_time=6.77s]
Epoch 2: 69%|██████▉ | 8575/12384 [18:12:16<8:04:47, 7.64s/it, loss=0.0006, acc=0.9986, iter_time=6.77s]
Epoch 2: 69%|██████▉ | 8575/12384 [18:12:24<8:04:47, 7.64s/it, loss=0.0001, acc=0.9992, iter_time=8.39s]
Epoch 2: 69%|██████▉ | 8576/12384 [18:12:24<8:04:10, 7.63s/it, loss=0.0001, acc=0.9992, iter_time=8.39s]
Epoch 2: 69%|██████▉ | 8576/12384 [18:12:32<8:04:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 69%|██████▉ | 8577/12384 [18:12:32<8:04:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 69%|██████▉ | 8577/12384 [18:12:39<8:04:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 2: 69%|██████▉ | 8578/12384 [18:12:39<8:03:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 2: 69%|██████▉ | 8578/12384 [18:12:47<8:03:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 2: 69%|██████▉ | 8579/12384 [18:12:47<8:03:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.13s]
Epoch 2: 69%|██████▉ | 8579/12384 [18:12:54<8:03:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 2: 69%|██████▉ | 8580/12384 [18:12:54<8:04:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.99s]
Epoch 2: 69%|██████▉ | 8580/12384 [18:13:02<8:04:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 2: 69%|██████▉ | 8581/12384 [18:13:02<8:03:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 2: 69%|██████▉ | 8581/12384 [18:13:10<8:03:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.97s]
Epoch 2: 69%|██████▉ | 8582/12384 [18:13:10<8:03:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.97s]
Epoch 2: 69%|██████▉ | 8582/12384 [18:13:17<8:03:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.03s]
Epoch 2: 69%|██████▉ | 8583/12384 [18:13:17<8:02:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.03s]
Epoch 2: 69%|██████▉ | 8583/12384 [18:13:25<8:02:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 2: 69%|██████▉ | 8584/12384 [18:13:25<8:04:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 2: 69%|██████▉ | 8584/12384 [18:13:33<8:04:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 2: 69%|██████▉ | 8585/12384 [18:13:33<8:03:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 2: 69%|██████▉ | 8585/12384 [18:13:40<8:03:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 69%|██████▉ | 8586/12384 [18:13:40<8:04:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 69%|██████▉ | 8586/12384 [18:13:48<8:04:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 69%|██████▉ | 8587/12384 [18:13:48<8:03:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 69%|██████▉ | 8587/12384 [18:13:56<8:03:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 2: 69%|██████▉ | 8588/12384 [18:13:56<8:02:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 2: 69%|██████▉ | 8588/12384 [18:14:03<8:02:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 69%|██████▉ | 8589/12384 [18:14:03<8:01:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 69%|██████▉ | 8589/12384 [18:14:11<8:01:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 69%|██████▉ | 8590/12384 [18:14:11<8:03:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 69%|██████▉ | 8590/12384 [18:14:18<8:03:00, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 2: 69%|██████▉ | 8591/12384 [18:14:18<8:02:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 2: 69%|██████▉ | 8591/12384 [18:14:26<8:02:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.58s]
Epoch 2: 69%|██████▉ | 8592/12384 [18:14:26<8:01:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.58s]
Epoch 2: 69%|██████▉ | 8592/12384 [18:14:34<8:01:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.48s]
Epoch 2: 69%|██████▉ | 8593/12384 [18:14:34<8:05:57, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.48s]
Epoch 2: 69%|██████▉ | 8593/12384 [18:14:41<8:05:57, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 69%|██████▉ | 8594/12384 [18:14:41<8:04:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 69%|██████▉ | 8594/12384 [18:14:49<8:04:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 69%|██████▉ | 8595/12384 [18:14:49<8:03:25, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 69%|██████▉ | 8595/12384 [18:14:57<8:03:25, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.50s]
Epoch 2: 69%|██████▉ | 8596/12384 [18:14:57<8:02:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.50s]
Epoch 2: 69%|██████▉ | 8596/12384 [18:15:05<8:02:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 2: 69%|██████▉ | 8597/12384 [18:15:05<8:07:52, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 2: 69%|██████▉ | 8597/12384 [18:15:12<8:07:52, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 69%|██████▉ | 8598/12384 [18:15:12<8:05:30, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 69%|██████▉ | 8598/12384 [18:15:20<8:05:30, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.70s]
Epoch 2: 69%|██████▉ | 8599/12384 [18:15:20<8:05:31, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.70s]
Epoch 2: 69%|██████▉ | 8599/12384 [18:15:28<8:05:31, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 69%|██████▉ | 8600/12384 [18:15:28<8:04:10, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 69%|██████▉ | 8600/12384 [18:15:35<8:04:10, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 69%|██████▉ | 8601/12384 [18:15:35<8:04:28, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 69%|██████▉ | 8601/12384 [18:15:43<8:04:28, 7.68s/it, loss=0.0003, acc=1.0000, iter_time=4.33s]
Epoch 2: 69%|██████▉ | 8602/12384 [18:15:43<8:03:06, 7.66s/it, loss=0.0003, acc=1.0000, iter_time=4.33s]
Epoch 2: 69%|██████▉ | 8602/12384 [18:15:51<8:03:06, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=11.05s]
Epoch 2: 69%|██████▉ | 8603/12384 [18:15:51<8:02:50, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=11.05s]
Epoch 2: 69%|██████▉ | 8603/12384 [18:15:58<8:02:50, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 69%|██████▉ | 8604/12384 [18:15:58<8:02:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 69%|██████▉ | 8604/12384 [18:16:06<8:02:00, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.96s]
Epoch 2: 69%|██████▉ | 8605/12384 [18:16:06<8:02:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.96s]
Epoch 2: 69%|██████▉ | 8605/12384 [18:16:14<8:02:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 2: 69%|██████▉ | 8606/12384 [18:16:14<8:02:59, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 2: 69%|██████▉ | 8606/12384 [18:16:21<8:02:59, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.13s]
Epoch 2: 70%|██████▉ | 8607/12384 [18:16:21<8:01:59, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.13s]
Epoch 2: 70%|██████▉ | 8607/12384 [18:16:29<8:01:59, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.85s]
Epoch 2: 70%|██████▉ | 8608/12384 [18:16:29<8:00:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.85s]
Epoch 2: 70%|██████▉ | 8608/12384 [18:16:36<8:00:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 70%|██████▉ | 8609/12384 [18:16:36<8:01:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 70%|██████▉ | 8609/12384 [18:16:44<8:01:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 2: 70%|██████▉ | 8610/12384 [18:16:44<8:00:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 2: 70%|██████▉ | 8610/12384 [18:16:52<8:00:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 2: 70%|██████▉ | 8611/12384 [18:16:52<7:59:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 2: 70%|██████▉ | 8611/12384 [18:16:59<7:59:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 70%|██████▉ | 8612/12384 [18:16:59<7:59:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 70%|██████▉ | 8612/12384 [18:17:07<7:59:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 2: 70%|██████▉ | 8613/12384 [18:17:07<7:58:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 2: 70%|██████▉ | 8613/12384 [18:17:15<7:58:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 2: 70%|██████▉ | 8614/12384 [18:17:15<7:58:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 2: 70%|██████▉ | 8614/12384 [18:17:22<7:58:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 70%|██████▉ | 8615/12384 [18:17:22<7:58:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 70%|██████▉ | 8615/12384 [18:17:30<7:58:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 70%|██████▉ | 8616/12384 [18:17:30<7:58:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 70%|██████▉ | 8616/12384 [18:17:37<7:58:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.60s]
Epoch 2: 70%|██████▉ | 8617/12384 [18:17:37<7:58:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.60s]
Epoch 2: 70%|██████▉ | 8617/12384 [18:17:45<7:58:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.01s]
Epoch 2: 70%|██████▉ | 8618/12384 [18:17:45<7:59:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.01s]
Epoch 2: 70%|██████▉ | 8618/12384 [18:17:53<7:59:48, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=9.25s]
Epoch 2: 70%|██████▉ | 8619/12384 [18:17:53<8:04:46, 7.73s/it, loss=0.0001, acc=0.9998, iter_time=9.25s]
Epoch 2: 70%|██████▉ | 8619/12384 [18:18:01<8:04:46, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 2: 70%|██████▉ | 8620/12384 [18:18:01<8:02:30, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 2: 70%|██████▉ | 8620/12384 [18:18:08<8:02:30, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 2: 70%|██████▉ | 8621/12384 [18:18:08<8:00:59, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 2: 70%|██████▉ | 8621/12384 [18:18:16<8:00:59, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 70%|██████▉ | 8622/12384 [18:18:16<8:01:24, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 70%|██████▉ | 8622/12384 [18:18:24<8:01:24, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 2: 70%|██████▉ | 8623/12384 [18:18:24<8:00:06, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.74s]
Epoch 2: 70%|██████▉ | 8623/12384 [18:18:32<8:00:06, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=9.03s]
Epoch 2: 70%|██████▉ | 8624/12384 [18:18:32<8:06:06, 7.76s/it, loss=0.0001, acc=1.0000, iter_time=9.03s]
Epoch 2: 70%|██████▉ | 8624/12384 [18:18:39<8:06:06, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 2: 70%|██████▉ | 8625/12384 [18:18:39<8:04:04, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 2: 70%|██████▉ | 8625/12384 [18:18:47<8:04:04, 7.73s/it, loss=0.0000, acc=0.9999, iter_time=7.67s]
Epoch 2: 70%|██████▉ | 8626/12384 [18:18:47<8:01:41, 7.69s/it, loss=0.0000, acc=0.9999, iter_time=7.67s]
Epoch 2: 70%|██████▉ | 8626/12384 [18:18:54<8:01:41, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.49s]
Epoch 2: 70%|██████▉ | 8627/12384 [18:18:54<7:59:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.49s]
Epoch 2: 70%|██████▉ | 8627/12384 [18:19:02<7:59:57, 7.66s/it, loss=0.0004, acc=0.9998, iter_time=8.53s]
Epoch 2: 70%|██████▉ | 8628/12384 [18:19:02<7:58:17, 7.64s/it, loss=0.0004, acc=0.9998, iter_time=8.53s]
Epoch 2: 70%|██████▉ | 8628/12384 [18:19:10<7:58:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 2: 70%|██████▉ | 8629/12384 [18:19:10<7:57:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 2: 70%|██████▉ | 8629/12384 [18:19:17<7:57:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 2: 70%|██████▉ | 8630/12384 [18:19:17<7:58:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 2: 70%|██████▉ | 8630/12384 [18:19:25<7:58:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 2: 70%|██████▉ | 8631/12384 [18:19:25<7:56:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.29s]
Epoch 2: 70%|██████▉ | 8631/12384 [18:19:32<7:56:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 70%|██████▉ | 8632/12384 [18:19:32<7:57:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 70%|██████▉ | 8632/12384 [18:19:40<7:57:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 70%|██████▉ | 8633/12384 [18:19:40<7:56:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 70%|██████▉ | 8633/12384 [18:19:48<7:56:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 2: 70%|██████▉ | 8634/12384 [18:19:48<7:56:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 2: 70%|██████▉ | 8634/12384 [18:19:55<7:56:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 2: 70%|██████▉ | 8635/12384 [18:19:55<7:56:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 2: 70%|██████▉ | 8635/12384 [18:20:03<7:56:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 70%|██████▉ | 8636/12384 [18:20:03<7:56:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 70%|██████▉ | 8636/12384 [18:20:11<7:56:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 70%|██████▉ | 8637/12384 [18:20:11<7:56:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 70%|██████▉ | 8637/12384 [18:20:18<7:56:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 2: 70%|██████▉ | 8638/12384 [18:20:18<7:55:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 2: 70%|██████▉ | 8638/12384 [18:20:26<7:55:45, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.94s]
Epoch 2: 70%|██████▉ | 8639/12384 [18:20:26<7:54:40, 7.60s/it, loss=0.0001, acc=1.0000, iter_time=7.94s]
Epoch 2: 70%|██████▉ | 8639/12384 [18:20:33<7:54:40, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 2: 70%|██████▉ | 8640/12384 [18:20:33<7:55:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 2: 70%|██████▉ | 8640/12384 [18:20:41<7:55:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 70%|██████▉ | 8641/12384 [18:20:41<7:54:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 70%|██████▉ | 8641/12384 [18:20:49<7:54:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 70%|██████▉ | 8642/12384 [18:20:49<7:54:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 70%|██████▉ | 8642/12384 [18:20:56<7:54:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 70%|██████▉ | 8643/12384 [18:20:56<7:54:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 70%|██████▉ | 8643/12384 [18:21:04<7:54:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 2: 70%|██████▉ | 8644/12384 [18:21:04<7:54:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 2: 70%|██████▉ | 8644/12384 [18:21:11<7:54:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 2: 70%|██████▉ | 8645/12384 [18:21:11<7:54:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 2: 70%|██████▉ | 8645/12384 [18:21:19<7:54:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 2: 70%|██████▉ | 8646/12384 [18:21:19<7:54:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 2: 70%|██████▉ | 8646/12384 [18:21:27<7:54:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 2: 70%|██████▉ | 8647/12384 [18:21:27<7:53:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 2: 70%|██████▉ | 8647/12384 [18:21:34<7:53:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 70%|██████▉ | 8648/12384 [18:21:34<7:54:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 70%|██████▉ | 8648/12384 [18:21:42<7:54:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 2: 70%|██████▉ | 8649/12384 [18:21:42<7:54:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 2: 70%|██████▉ | 8649/12384 [18:21:50<7:54:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 70%|██████▉ | 8650/12384 [18:21:50<7:59:48, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 70%|██████▉ | 8650/12384 [18:21:57<7:59:48, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 2: 70%|██████▉ | 8651/12384 [18:21:57<7:57:24, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 2: 70%|██████▉ | 8651/12384 [18:22:05<7:57:24, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 2: 70%|██████▉ | 8652/12384 [18:22:05<7:56:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 2: 70%|██████▉ | 8652/12384 [18:22:13<7:56:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 2: 70%|██████▉ | 8653/12384 [18:22:13<7:55:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.67s]
Epoch 2: 70%|██████▉ | 8653/12384 [18:22:20<7:55:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.77s]
Epoch 2: 70%|██████▉ | 8654/12384 [18:22:20<7:55:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.77s]
Epoch 2: 70%|██████▉ | 8654/12384 [18:22:28<7:55:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 70%|██████▉ | 8655/12384 [18:22:28<7:54:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 70%|██████▉ | 8655/12384 [18:22:36<7:54:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.57s]
Epoch 2: 70%|██████▉ | 8656/12384 [18:22:36<7:53:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.57s]
Epoch 2: 70%|██████▉ | 8656/12384 [18:22:43<7:53:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.99s]
Epoch 2: 70%|██████▉ | 8657/12384 [18:22:43<7:53:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.99s]
Epoch 2: 70%|██████▉ | 8657/12384 [18:22:51<7:53:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.85s]
Epoch 2: 70%|██████▉ | 8658/12384 [18:22:51<7:52:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.85s]
Epoch 2: 70%|██████▉ | 8658/12384 [18:22:58<7:52:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 2: 70%|██████▉ | 8659/12384 [18:22:58<7:52:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 2: 70%|██████▉ | 8659/12384 [18:23:06<7:52:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.14s]
Epoch 2: 70%|██████▉ | 8660/12384 [18:23:06<7:52:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.14s]
Epoch 2: 70%|██████▉ | 8660/12384 [18:23:14<7:52:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.36s]
Epoch 2: 70%|██████▉ | 8661/12384 [18:23:14<7:53:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.36s]
Epoch 2: 70%|██████▉ | 8661/12384 [18:23:21<7:53:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.79s]
Epoch 2: 70%|██████▉ | 8662/12384 [18:23:21<7:54:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.79s]
Epoch 2: 70%|██████▉ | 8662/12384 [18:23:29<7:54:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 70%|██████▉ | 8663/12384 [18:23:29<7:54:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 70%|██████▉ | 8663/12384 [18:23:37<7:54:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 70%|██████▉ | 8664/12384 [18:23:37<7:53:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 70%|██████▉ | 8664/12384 [18:23:44<7:53:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.93s]
Epoch 2: 70%|██████▉ | 8665/12384 [18:23:44<7:52:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.93s]
Epoch 2: 70%|██████▉ | 8665/12384 [18:23:52<7:52:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 2: 70%|██████▉ | 8666/12384 [18:23:52<7:52:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 2: 70%|██████▉ | 8666/12384 [18:23:59<7:52:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 70%|██████▉ | 8667/12384 [18:23:59<7:52:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 70%|██████▉ | 8667/12384 [18:24:07<7:52:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 2: 70%|██████▉ | 8668/12384 [18:24:07<7:53:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 2: 70%|██████▉ | 8668/12384 [18:24:15<7:53:14, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 2: 70%|███████ | 8669/12384 [18:24:15<7:52:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 2: 70%|███████ | 8669/12384 [18:24:22<7:52:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 70%|███████ | 8670/12384 [18:24:22<7:51:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 70%|███████ | 8670/12384 [18:24:30<7:51:50, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.92s]
Epoch 2: 70%|███████ | 8671/12384 [18:24:30<7:57:14, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.92s]
Epoch 2: 70%|███████ | 8671/12384 [18:24:38<7:57:14, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 70%|███████ | 8672/12384 [18:24:38<7:55:33, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 70%|███████ | 8672/12384 [18:24:46<7:55:33, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 70%|███████ | 8673/12384 [18:24:46<7:54:05, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 70%|███████ | 8673/12384 [18:24:53<7:54:05, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 70%|███████ | 8674/12384 [18:24:53<7:53:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 70%|███████ | 8674/12384 [18:25:01<7:53:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.80s]
Epoch 2: 70%|███████ | 8675/12384 [18:25:01<7:52:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.80s]
Epoch 2: 70%|███████ | 8675/12384 [18:25:08<7:52:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.39s]
Epoch 2: 70%|███████ | 8676/12384 [18:25:08<7:52:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.39s]
Epoch 2: 70%|███████ | 8676/12384 [18:25:16<7:52:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 70%|███████ | 8677/12384 [18:25:16<7:57:34, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 70%|███████ | 8677/12384 [18:25:24<7:57:34, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 70%|███████ | 8678/12384 [18:25:24<7:55:13, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 70%|███████ | 8678/12384 [18:25:32<7:55:13, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.05s]
Epoch 2: 70%|███████ | 8679/12384 [18:25:32<7:55:31, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.05s]
Epoch 2: 70%|███████ | 8679/12384 [18:25:39<7:55:31, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.23s]
Epoch 2: 70%|███████ | 8680/12384 [18:25:39<7:53:54, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.23s]
Epoch 2: 70%|███████ | 8680/12384 [18:25:47<7:53:54, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 70%|███████ | 8681/12384 [18:25:47<7:52:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 70%|███████ | 8681/12384 [18:25:54<7:52:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 70%|███████ | 8682/12384 [18:25:54<7:51:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 70%|███████ | 8682/12384 [18:26:02<7:51:44, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 2: 70%|███████ | 8683/12384 [18:26:02<7:51:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 2: 70%|███████ | 8683/12384 [18:26:10<7:51:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 2: 70%|███████ | 8684/12384 [18:26:10<7:50:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 2: 70%|███████ | 8684/12384 [18:26:17<7:50:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 70%|███████ | 8685/12384 [18:26:17<7:50:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 70%|███████ | 8685/12384 [18:26:25<7:50:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 70%|███████ | 8686/12384 [18:26:25<7:51:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 70%|███████ | 8686/12384 [18:26:33<7:51:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 70%|███████ | 8687/12384 [18:26:33<7:50:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 70%|███████ | 8687/12384 [18:26:40<7:50:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.48s]
Epoch 2: 70%|███████ | 8688/12384 [18:26:40<7:49:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.48s]
Epoch 2: 70%|███████ | 8688/12384 [18:26:48<7:49:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 2: 70%|███████ | 8689/12384 [18:26:48<7:49:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 2: 70%|███████ | 8689/12384 [18:26:55<7:49:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.40s]
Epoch 2: 70%|███████ | 8690/12384 [18:26:55<7:49:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.40s]
Epoch 2: 70%|███████ | 8690/12384 [18:27:03<7:49:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 2: 70%|███████ | 8691/12384 [18:27:03<7:50:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 2: 70%|███████ | 8691/12384 [18:27:11<7:50:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 2: 70%|███████ | 8692/12384 [18:27:11<7:49:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 2: 70%|███████ | 8692/12384 [18:27:18<7:49:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 2: 70%|███████ | 8693/12384 [18:27:18<7:48:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 2: 70%|███████ | 8693/12384 [18:27:26<7:48:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 2: 70%|███████ | 8694/12384 [18:27:26<7:48:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 2: 70%|███████ | 8694/12384 [18:27:34<7:48:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 2: 70%|███████ | 8695/12384 [18:27:34<7:48:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.03s]
Epoch 2: 70%|███████ | 8695/12384 [18:27:41<7:48:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.62s]
Epoch 2: 70%|███████ | 8696/12384 [18:27:41<7:48:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.62s]
Epoch 2: 70%|███████ | 8696/12384 [18:27:49<7:48:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.04s]
Epoch 2: 70%|███████ | 8697/12384 [18:27:49<7:48:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.04s]
Epoch 2: 70%|███████ | 8697/12384 [18:27:56<7:48:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 2: 70%|███████ | 8698/12384 [18:27:56<7:48:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 2: 70%|███████ | 8698/12384 [18:28:04<7:48:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 2: 70%|███████ | 8699/12384 [18:28:04<7:48:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 2: 70%|███████ | 8699/12384 [18:28:12<7:48:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 2: 70%|███████ | 8700/12384 [18:28:12<7:47:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 2: 70%|███████ | 8700/12384 [18:28:19<7:47:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 70%|███████ | 8701/12384 [18:28:19<7:47:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 70%|███████ | 8701/12384 [18:28:27<7:47:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 70%|███████ | 8702/12384 [18:28:27<7:47:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 70%|███████ | 8702/12384 [18:28:35<7:47:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.18s]
Epoch 2: 70%|███████ | 8703/12384 [18:28:35<7:55:02, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=3.18s]
Epoch 2: 70%|███████ | 8703/12384 [18:28:43<7:55:02, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=12.86s]
Epoch 2: 70%|███████ | 8704/12384 [18:28:43<7:52:53, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=12.86s]
Epoch 2: 70%|███████ | 8704/12384 [18:28:50<7:52:53, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 70%|███████ | 8705/12384 [18:28:50<7:51:01, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 70%|███████ | 8705/12384 [18:28:58<7:51:01, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 70%|███████ | 8706/12384 [18:28:58<7:50:18, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 70%|███████ | 8706/12384 [18:29:05<7:50:18, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=3.68s]
Epoch 2: 70%|███████ | 8707/12384 [18:29:05<7:48:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=3.68s]
Epoch 2: 70%|███████ | 8707/12384 [18:29:13<7:48:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 2: 70%|███████ | 8708/12384 [18:29:13<7:47:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 2: 70%|███████ | 8708/12384 [18:29:21<7:47:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 2: 70%|███████ | 8709/12384 [18:29:21<7:46:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 2: 70%|███████ | 8709/12384 [18:29:28<7:46:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 70%|███████ | 8710/12384 [18:29:28<7:46:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 70%|███████ | 8710/12384 [18:29:36<7:46:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 2: 70%|███████ | 8711/12384 [18:29:36<7:46:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 2: 70%|███████ | 8711/12384 [18:29:43<7:46:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.33s]
Epoch 2: 70%|███████ | 8712/12384 [18:29:43<7:45:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.33s]
Epoch 2: 70%|███████ | 8712/12384 [18:29:51<7:45:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 70%|███████ | 8713/12384 [18:29:51<7:46:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 70%|███████ | 8713/12384 [18:29:59<7:46:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 70%|███████ | 8714/12384 [18:29:59<7:45:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 70%|███████ | 8714/12384 [18:30:06<7:45:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 2: 70%|███████ | 8715/12384 [18:30:06<7:45:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 2: 70%|███████ | 8715/12384 [18:30:14<7:45:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 70%|███████ | 8716/12384 [18:30:14<7:45:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 70%|███████ | 8716/12384 [18:30:22<7:45:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 2: 70%|███████ | 8717/12384 [18:30:22<7:45:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 2: 70%|███████ | 8717/12384 [18:30:29<7:45:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 70%|███████ | 8718/12384 [18:30:29<7:46:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 70%|███████ | 8718/12384 [18:30:37<7:46:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 70%|███████ | 8719/12384 [18:30:37<7:47:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 70%|███████ | 8719/12384 [18:30:45<7:47:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 70%|███████ | 8720/12384 [18:30:45<7:47:48, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 70%|███████ | 8720/12384 [18:30:52<7:47:48, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 70%|███████ | 8721/12384 [18:30:52<7:47:50, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 70%|███████ | 8721/12384 [18:31:00<7:47:50, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=3.95s]
Epoch 2: 70%|███████ | 8722/12384 [18:31:00<7:46:58, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=3.95s]
Epoch 2: 70%|███████ | 8722/12384 [18:31:08<7:46:58, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 2: 70%|███████ | 8723/12384 [18:31:08<7:45:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 2: 70%|███████ | 8723/12384 [18:31:15<7:45:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 2: 70%|███████ | 8724/12384 [18:31:15<7:45:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 2: 70%|███████ | 8724/12384 [18:31:23<7:45:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 2: 70%|███████ | 8725/12384 [18:31:23<7:45:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 2: 70%|███████ | 8725/12384 [18:31:30<7:45:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 70%|███████ | 8726/12384 [18:31:30<7:44:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 70%|███████ | 8726/12384 [18:31:38<7:44:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 70%|███████ | 8727/12384 [18:31:38<7:44:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 70%|███████ | 8727/12384 [18:31:46<7:44:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 2: 70%|███████ | 8728/12384 [18:31:46<7:43:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 2: 70%|███████ | 8728/12384 [18:31:53<7:43:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 70%|███████ | 8729/12384 [18:31:53<7:49:30, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 70%|███████ | 8729/12384 [18:32:01<7:49:30, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 70%|███████ | 8730/12384 [18:32:01<7:47:06, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 70%|███████ | 8730/12384 [18:32:09<7:47:06, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 2: 71%|███████ | 8731/12384 [18:32:09<7:45:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 2: 71%|███████ | 8731/12384 [18:32:16<7:45:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 2: 71%|███████ | 8732/12384 [18:32:16<7:47:49, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 2: 71%|███████ | 8732/12384 [18:32:24<7:47:49, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.41s]
Epoch 2: 71%|███████ | 8733/12384 [18:32:24<7:46:28, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.41s]
Epoch 2: 71%|███████ | 8733/12384 [18:32:32<7:46:28, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 2: 71%|███████ | 8734/12384 [18:32:32<7:45:42, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 2: 71%|███████ | 8734/12384 [18:32:39<7:45:42, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 71%|███████ | 8735/12384 [18:32:39<7:44:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 71%|███████ | 8735/12384 [18:32:47<7:44:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 2: 71%|███████ | 8736/12384 [18:32:47<7:44:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 2: 71%|███████ | 8736/12384 [18:32:55<7:44:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 71%|███████ | 8737/12384 [18:32:55<7:43:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 71%|███████ | 8737/12384 [18:33:02<7:43:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 71%|███████ | 8738/12384 [18:33:02<7:43:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 71%|███████ | 8738/12384 [18:33:10<7:43:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 71%|███████ | 8739/12384 [18:33:10<7:42:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 71%|███████ | 8739/12384 [18:33:17<7:42:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 71%|███████ | 8740/12384 [18:33:17<7:42:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 71%|███████ | 8740/12384 [18:33:25<7:42:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 71%|███████ | 8741/12384 [18:33:25<7:42:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 71%|███████ | 8741/12384 [18:33:33<7:42:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 71%|███████ | 8742/12384 [18:33:33<7:42:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 71%|███████ | 8742/12384 [18:33:40<7:42:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.43s]
Epoch 2: 71%|███████ | 8743/12384 [18:33:40<7:44:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.43s]
Epoch 2: 71%|███████ | 8743/12384 [18:33:48<7:44:22, 7.65s/it, loss=0.0006, acc=0.9983, iter_time=10.87s]
Epoch 2: 71%|███████ | 8744/12384 [18:33:48<7:43:33, 7.64s/it, loss=0.0006, acc=0.9983, iter_time=10.87s]
Epoch 2: 71%|███████ | 8744/12384 [18:33:56<7:43:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 71%|███████ | 8745/12384 [18:33:56<7:43:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 71%|███████ | 8745/12384 [18:34:03<7:43:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 71%|███████ | 8746/12384 [18:34:03<7:42:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 71%|███████ | 8746/12384 [18:34:11<7:42:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 2: 71%|███████ | 8747/12384 [18:34:11<7:42:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 2: 71%|███████ | 8747/12384 [18:34:18<7:42:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.61s]
Epoch 2: 71%|███████ | 8748/12384 [18:34:18<7:41:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.61s]
Epoch 2: 71%|███████ | 8748/12384 [18:34:26<7:41:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 71%|███████ | 8749/12384 [18:34:26<7:41:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 71%|███████ | 8749/12384 [18:34:34<7:41:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 2: 71%|███████ | 8750/12384 [18:34:34<7:46:48, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 2: 71%|███████ | 8750/12384 [18:34:42<7:46:48, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 71%|███████ | 8751/12384 [18:34:42<7:45:01, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 71%|███████ | 8751/12384 [18:34:49<7:45:01, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 71%|███████ | 8752/12384 [18:34:49<7:43:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 71%|███████ | 8752/12384 [18:34:57<7:43:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 71%|███████ | 8753/12384 [18:34:57<7:42:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 71%|███████ | 8753/12384 [18:35:04<7:42:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.27s]
Epoch 2: 71%|███████ | 8754/12384 [18:35:04<7:41:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.27s]
Epoch 2: 71%|███████ | 8754/12384 [18:35:12<7:41:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.02s]
Epoch 2: 71%|███████ | 8755/12384 [18:35:12<7:47:23, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=11.02s]
Epoch 2: 71%|███████ | 8755/12384 [18:35:20<7:47:23, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 71%|███████ | 8756/12384 [18:35:20<7:45:48, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 71%|███████ | 8756/12384 [18:35:28<7:45:48, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 71%|███████ | 8757/12384 [18:35:28<7:44:05, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 71%|███████ | 8757/12384 [18:35:35<7:44:05, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 71%|███████ | 8758/12384 [18:35:35<7:42:40, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 71%|███████ | 8758/12384 [18:35:43<7:42:40, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 71%|███████ | 8759/12384 [18:35:43<7:43:27, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 71%|███████ | 8759/12384 [18:35:51<7:43:27, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 2: 71%|███████ | 8760/12384 [18:35:51<7:43:21, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 2: 71%|███████ | 8760/12384 [18:35:58<7:43:21, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 71%|███████ | 8761/12384 [18:35:58<7:43:00, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 71%|███████ | 8761/12384 [18:36:06<7:43:00, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 71%|███████ | 8762/12384 [18:36:06<7:41:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 71%|███████ | 8762/12384 [18:36:13<7:41:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 71%|███████ | 8763/12384 [18:36:13<7:41:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 71%|███████ | 8763/12384 [18:36:21<7:41:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 71%|███████ | 8764/12384 [18:36:21<7:40:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 71%|███████ | 8764/12384 [18:36:29<7:40:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 71%|███████ | 8765/12384 [18:36:29<7:39:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 71%|███████ | 8765/12384 [18:36:36<7:39:49, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 71%|███████ | 8766/12384 [18:36:36<7:40:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 71%|███████ | 8766/12384 [18:36:44<7:40:59, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 71%|███████ | 8767/12384 [18:36:44<7:40:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 71%|███████ | 8767/12384 [18:36:52<7:40:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 2: 71%|███████ | 8768/12384 [18:36:52<7:39:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 2: 71%|███████ | 8768/12384 [18:36:59<7:39:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 71%|███████ | 8769/12384 [18:36:59<7:39:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 71%|███████ | 8769/12384 [18:37:07<7:39:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 71%|███████ | 8770/12384 [18:37:07<7:40:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 71%|███████ | 8770/12384 [18:37:14<7:40:02, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.11s]
Epoch 2: 71%|███████ | 8771/12384 [18:37:14<7:39:15, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.11s]
Epoch 2: 71%|███████ | 8771/12384 [18:37:22<7:39:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 2: 71%|███████ | 8772/12384 [18:37:22<7:38:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.18s]
Epoch 2: 71%|███████ | 8772/12384 [18:37:30<7:38:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 71%|███████ | 8773/12384 [18:37:30<7:38:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 71%|███████ | 8773/12384 [18:37:37<7:38:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 71%|███████ | 8774/12384 [18:37:37<7:38:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 71%|███████ | 8774/12384 [18:37:45<7:38:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 71%|███████ | 8775/12384 [18:37:45<7:38:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 71%|███████ | 8775/12384 [18:37:53<7:38:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 71%|███████ | 8776/12384 [18:37:53<7:37:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 71%|███████ | 8776/12384 [18:38:00<7:37:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.99s]
Epoch 2: 71%|███████ | 8777/12384 [18:38:00<7:38:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.99s]
Epoch 2: 71%|███████ | 8777/12384 [18:38:08<7:38:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 2: 71%|███████ | 8778/12384 [18:38:08<7:37:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 2: 71%|███████ | 8778/12384 [18:38:15<7:37:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 2: 71%|███████ | 8779/12384 [18:38:15<7:37:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 2: 71%|███████ | 8779/12384 [18:38:23<7:37:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 2: 71%|███████ | 8780/12384 [18:38:23<7:37:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 2: 71%|███████ | 8780/12384 [18:38:31<7:37:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 2: 71%|███████ | 8781/12384 [18:38:31<7:43:17, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 2: 71%|███████ | 8781/12384 [18:38:39<7:43:17, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.91s]
Epoch 2: 71%|███████ | 8782/12384 [18:38:39<7:41:10, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.91s]
Epoch 2: 71%|███████ | 8782/12384 [18:38:46<7:41:10, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 71%|███████ | 8783/12384 [18:38:46<7:39:46, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 71%|███████ | 8783/12384 [18:38:54<7:39:46, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 2: 71%|███████ | 8784/12384 [18:38:54<7:40:37, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 2: 71%|███████ | 8784/12384 [18:39:01<7:40:37, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.61s]
Epoch 2: 71%|███████ | 8785/12384 [18:39:01<7:39:39, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.61s]
Epoch 2: 71%|███████ | 8785/12384 [18:39:09<7:39:39, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.96s]
Epoch 2: 71%|███████ | 8786/12384 [18:39:09<7:38:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.96s]
Epoch 2: 71%|███████ | 8786/12384 [18:39:17<7:38:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 2: 71%|███████ | 8787/12384 [18:39:17<7:38:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.89s]
Epoch 2: 71%|███████ | 8787/12384 [18:39:24<7:38:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 71%|███████ | 8788/12384 [18:39:24<7:37:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 71%|███████ | 8788/12384 [18:39:32<7:37:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 71%|███████ | 8789/12384 [18:39:32<7:36:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 71%|███████ | 8789/12384 [18:39:40<7:36:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 71%|███████ | 8790/12384 [18:39:40<7:36:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 71%|███████ | 8790/12384 [18:39:47<7:36:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 2: 71%|███████ | 8791/12384 [18:39:47<7:36:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 2: 71%|███████ | 8791/12384 [18:39:55<7:36:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 2: 71%|███████ | 8792/12384 [18:39:55<7:36:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 2: 71%|███████ | 8792/12384 [18:40:02<7:36:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.24s]
Epoch 2: 71%|███████ | 8793/12384 [18:40:02<7:36:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.24s]
Epoch 2: 71%|███████ | 8793/12384 [18:40:10<7:36:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.00s]
Epoch 2: 71%|███████ | 8794/12384 [18:40:10<7:35:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.00s]
Epoch 2: 71%|███████ | 8794/12384 [18:40:18<7:35:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 2: 71%|███████ | 8795/12384 [18:40:18<7:36:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 2: 71%|███████ | 8795/12384 [18:40:25<7:36:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.26s]
Epoch 2: 71%|███████ | 8796/12384 [18:40:25<7:36:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.26s]
Epoch 2: 71%|███████ | 8796/12384 [18:40:33<7:36:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 71%|███████ | 8797/12384 [18:40:33<7:35:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 71%|███████ | 8797/12384 [18:40:41<7:35:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 71%|███████ | 8798/12384 [18:40:41<7:35:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 71%|███████ | 8798/12384 [18:40:48<7:35:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.44s]
Epoch 2: 71%|███████ | 8799/12384 [18:40:48<7:35:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.44s]
Epoch 2: 71%|███████ | 8799/12384 [18:40:56<7:35:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 71%|███████ | 8800/12384 [18:40:56<7:35:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 71%|███████ | 8800/12384 [18:41:03<7:35:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.16s]
Epoch 2: 71%|███████ | 8801/12384 [18:41:03<7:35:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.16s]
Epoch 2: 71%|███████ | 8801/12384 [18:41:11<7:35:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.76s]
Epoch 2: 71%|███████ | 8802/12384 [18:41:11<7:36:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.76s]
Epoch 2: 71%|███████ | 8802/12384 [18:41:19<7:36:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 71%|███████ | 8803/12384 [18:41:19<7:37:06, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 71%|███████ | 8803/12384 [18:41:26<7:37:06, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.68s]
Epoch 2: 71%|███████ | 8804/12384 [18:41:26<7:36:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.68s]
Epoch 2: 71%|███████ | 8804/12384 [18:41:34<7:36:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 2: 71%|███████ | 8805/12384 [18:41:34<7:36:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 2: 71%|███████ | 8805/12384 [18:41:42<7:36:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 71%|███████ | 8806/12384 [18:41:42<7:35:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 71%|███████ | 8806/12384 [18:41:49<7:35:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.01s]
Epoch 2: 71%|███████ | 8807/12384 [18:41:49<7:34:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.01s]
Epoch 2: 71%|███████ | 8807/12384 [18:41:57<7:34:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.66s]
Epoch 2: 71%|███████ | 8808/12384 [18:41:57<7:40:10, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=11.66s]
Epoch 2: 71%|███████ | 8808/12384 [18:42:05<7:40:10, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.48s]
Epoch 2: 71%|███████ | 8809/12384 [18:42:05<7:38:07, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.48s]
Epoch 2: 71%|███████ | 8809/12384 [18:42:13<7:38:07, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.50s]
Epoch 2: 71%|███████ | 8810/12384 [18:42:13<7:37:42, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.50s]
Epoch 2: 71%|███████ | 8810/12384 [18:42:20<7:37:42, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.84s]
Epoch 2: 71%|███████ | 8811/12384 [18:42:20<7:37:03, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.84s]
Epoch 2: 71%|███████ | 8811/12384 [18:42:28<7:37:03, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 2: 71%|███████ | 8812/12384 [18:42:28<7:35:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 2: 71%|███████ | 8812/12384 [18:42:35<7:35:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 2: 71%|███████ | 8813/12384 [18:42:35<7:35:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 2: 71%|███████ | 8813/12384 [18:42:43<7:35:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.46s]
Epoch 2: 71%|███████ | 8814/12384 [18:42:43<7:35:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.46s]
Epoch 2: 71%|███████ | 8814/12384 [18:42:51<7:35:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 2: 71%|███████ | 8815/12384 [18:42:51<7:34:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 2: 71%|███████ | 8815/12384 [18:42:58<7:34:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 71%|███████ | 8816/12384 [18:42:58<7:34:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 71%|███████ | 8816/12384 [18:43:06<7:34:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 71%|███████ | 8817/12384 [18:43:06<7:33:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 71%|███████ | 8817/12384 [18:43:14<7:33:15, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 2: 71%|███████ | 8818/12384 [18:43:14<7:33:24, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 2: 71%|███████ | 8818/12384 [18:43:21<7:33:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 2: 71%|███████ | 8819/12384 [18:43:21<7:32:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 2: 71%|███████ | 8819/12384 [18:43:29<7:32:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 2: 71%|███████ | 8820/12384 [18:43:29<7:34:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 2: 71%|███████ | 8820/12384 [18:43:37<7:34:19, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 71%|███████ | 8821/12384 [18:43:37<7:34:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 71%|███████ | 8821/12384 [18:43:44<7:34:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 71%|███████ | 8822/12384 [18:43:44<7:33:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 71%|███████ | 8822/12384 [18:43:52<7:33:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 2: 71%|███████ | 8823/12384 [18:43:52<7:32:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 2: 71%|███████ | 8823/12384 [18:43:59<7:32:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.93s]
Epoch 2: 71%|███████▏ | 8824/12384 [18:43:59<7:32:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.93s]
Epoch 2: 71%|███████▏ | 8824/12384 [18:44:07<7:32:20, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 71%|███████▏ | 8825/12384 [18:44:07<7:32:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 71%|███████▏ | 8825/12384 [18:44:15<7:32:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 71%|███████▏ | 8826/12384 [18:44:15<7:31:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 71%|███████▏ | 8826/12384 [18:44:22<7:31:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 71%|███████▏ | 8827/12384 [18:44:22<7:31:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 71%|███████▏ | 8827/12384 [18:44:30<7:31:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 71%|███████▏ | 8828/12384 [18:44:30<7:31:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 71%|███████▏ | 8828/12384 [18:44:37<7:31:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 2: 71%|███████▏ | 8829/12384 [18:44:38<7:31:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 2: 71%|███████▏ | 8829/12384 [18:44:45<7:31:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 2: 71%|███████▏ | 8830/12384 [18:44:45<7:31:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 2: 71%|███████▏ | 8830/12384 [18:44:53<7:31:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 71%|███████▏ | 8831/12384 [18:44:53<7:31:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 71%|███████▏ | 8831/12384 [18:45:00<7:31:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 71%|███████▏ | 8832/12384 [18:45:00<7:31:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 71%|███████▏ | 8832/12384 [18:45:08<7:31:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 71%|███████▏ | 8833/12384 [18:45:08<7:31:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 71%|███████▏ | 8833/12384 [18:45:16<7:31:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 71%|███████▏ | 8834/12384 [18:45:16<7:37:05, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 71%|███████▏ | 8834/12384 [18:45:24<7:37:05, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 71%|███████▏ | 8835/12384 [18:45:24<7:34:28, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 71%|███████▏ | 8835/12384 [18:45:31<7:34:28, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 2: 71%|███████▏ | 8836/12384 [18:45:31<7:32:58, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 2: 71%|███████▏ | 8836/12384 [18:45:39<7:32:58, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 2: 71%|███████▏ | 8837/12384 [18:45:39<7:32:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 2: 71%|███████▏ | 8837/12384 [18:45:46<7:32:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 2: 71%|███████▏ | 8838/12384 [18:45:46<7:31:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 2: 71%|███████▏ | 8838/12384 [18:45:54<7:31:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 71%|███████▏ | 8839/12384 [18:45:54<7:30:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 71%|███████▏ | 8839/12384 [18:46:02<7:30:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 71%|███████▏ | 8840/12384 [18:46:02<7:30:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 71%|███████▏ | 8840/12384 [18:46:09<7:30:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 71%|███████▏ | 8841/12384 [18:46:09<7:29:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 71%|███████▏ | 8841/12384 [18:46:17<7:29:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 71%|███████▏ | 8842/12384 [18:46:17<7:29:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 71%|███████▏ | 8842/12384 [18:46:24<7:29:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 71%|███████▏ | 8843/12384 [18:46:24<7:29:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 71%|███████▏ | 8843/12384 [18:46:32<7:29:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 71%|███████▏ | 8844/12384 [18:46:32<7:29:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 71%|███████▏ | 8844/12384 [18:46:40<7:29:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 71%|███████▏ | 8845/12384 [18:46:40<7:30:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 71%|███████▏ | 8845/12384 [18:46:47<7:30:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.22s]
Epoch 2: 71%|███████▏ | 8846/12384 [18:46:47<7:30:50, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.22s]
Epoch 2: 71%|███████▏ | 8846/12384 [18:46:55<7:30:50, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=9.07s]
Epoch 2: 71%|███████▏ | 8847/12384 [18:46:55<7:29:39, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.07s]
Epoch 2: 71%|███████▏ | 8847/12384 [18:47:03<7:29:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 71%|███████▏ | 8848/12384 [18:47:03<7:29:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 71%|███████▏ | 8848/12384 [18:47:10<7:29:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 71%|███████▏ | 8849/12384 [18:47:10<7:29:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 71%|███████▏ | 8849/12384 [18:47:18<7:29:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 71%|███████▏ | 8850/12384 [18:47:18<7:29:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 71%|███████▏ | 8850/12384 [18:47:25<7:29:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 71%|███████▏ | 8851/12384 [18:47:25<7:28:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 71%|███████▏ | 8851/12384 [18:47:33<7:28:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 71%|███████▏ | 8852/12384 [18:47:33<7:28:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 71%|███████▏ | 8852/12384 [18:47:41<7:28:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 71%|███████▏ | 8853/12384 [18:47:41<7:27:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 71%|███████▏ | 8853/12384 [18:47:48<7:27:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 71%|███████▏ | 8854/12384 [18:47:48<7:27:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 71%|███████▏ | 8854/12384 [18:47:56<7:27:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 72%|███████▏ | 8855/12384 [18:47:56<7:28:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 72%|███████▏ | 8855/12384 [18:48:04<7:28:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 2: 72%|███████▏ | 8856/12384 [18:48:04<7:33:01, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 2: 72%|███████▏ | 8856/12384 [18:48:11<7:33:01, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=3.68s]
Epoch 2: 72%|███████▏ | 8857/12384 [18:48:11<7:31:20, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=3.68s]
Epoch 2: 72%|███████▏ | 8857/12384 [18:48:19<7:31:20, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 2: 72%|███████▏ | 8858/12384 [18:48:19<7:29:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 2: 72%|███████▏ | 8858/12384 [18:48:27<7:29:43, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=10.45s]
Epoch 2: 72%|███████▏ | 8859/12384 [18:48:27<7:28:32, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=10.45s]
Epoch 2: 72%|███████▏ | 8859/12384 [18:48:34<7:28:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 72%|███████▏ | 8860/12384 [18:48:34<7:28:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 72%|███████▏ | 8860/12384 [18:48:42<7:28:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 72%|███████▏ | 8861/12384 [18:48:42<7:33:39, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 72%|███████▏ | 8861/12384 [18:48:50<7:33:39, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 2: 72%|███████▏ | 8862/12384 [18:48:50<7:30:51, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 2: 72%|███████▏ | 8862/12384 [18:48:57<7:30:51, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 2: 72%|███████▏ | 8863/12384 [18:48:57<7:29:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 2: 72%|███████▏ | 8863/12384 [18:49:05<7:29:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 72%|███████▏ | 8864/12384 [18:49:05<7:30:02, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 72%|███████▏ | 8864/12384 [18:49:13<7:30:02, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 72%|███████▏ | 8865/12384 [18:49:13<7:28:25, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 72%|███████▏ | 8865/12384 [18:49:20<7:28:25, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 72%|███████▏ | 8866/12384 [18:49:20<7:27:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 72%|███████▏ | 8866/12384 [18:49:28<7:27:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 72%|███████▏ | 8867/12384 [18:49:28<7:27:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 72%|███████▏ | 8867/12384 [18:49:35<7:27:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 2: 72%|███████▏ | 8868/12384 [18:49:35<7:26:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 2: 72%|███████▏ | 8868/12384 [18:49:43<7:26:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.46s]
Epoch 2: 72%|███████▏ | 8869/12384 [18:49:43<7:26:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.46s]
Epoch 2: 72%|███████▏ | 8869/12384 [18:49:51<7:26:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.79s]
Epoch 2: 72%|███████▏ | 8870/12384 [18:49:51<7:26:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.79s]
Epoch 2: 72%|███████▏ | 8870/12384 [18:49:58<7:26:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 72%|███████▏ | 8871/12384 [18:49:58<7:26:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 72%|███████▏ | 8871/12384 [18:50:06<7:26:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.53s]
Epoch 2: 72%|███████▏ | 8872/12384 [18:50:06<7:27:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.53s]
Epoch 2: 72%|███████▏ | 8872/12384 [18:50:14<7:27:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 2: 72%|███████▏ | 8873/12384 [18:50:14<7:26:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 2: 72%|███████▏ | 8873/12384 [18:50:21<7:26:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 72%|███████▏ | 8874/12384 [18:50:21<7:27:53, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 72%|███████▏ | 8874/12384 [18:50:29<7:27:53, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 2: 72%|███████▏ | 8875/12384 [18:50:29<7:26:41, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.83s]
Epoch 2: 72%|███████▏ | 8875/12384 [18:50:37<7:26:41, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=9.39s]
Epoch 2: 72%|███████▏ | 8876/12384 [18:50:37<7:26:25, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=9.39s]
Epoch 2: 72%|███████▏ | 8876/12384 [18:50:44<7:26:25, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 2: 72%|███████▏ | 8877/12384 [18:50:44<7:26:01, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 2: 72%|███████▏ | 8877/12384 [18:50:52<7:26:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 2: 72%|███████▏ | 8878/12384 [18:50:52<7:25:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.46s]
Epoch 2: 72%|███████▏ | 8878/12384 [18:50:59<7:25:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 2: 72%|███████▏ | 8879/12384 [18:50:59<7:24:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 2: 72%|███████▏ | 8879/12384 [18:51:07<7:24:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.34s]
Epoch 2: 72%|███████▏ | 8880/12384 [18:51:07<7:24:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.34s]
Epoch 2: 72%|███████▏ | 8880/12384 [18:51:15<7:24:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 72%|███████▏ | 8881/12384 [18:51:15<7:30:27, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 72%|███████▏ | 8881/12384 [18:51:23<7:30:27, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 72%|███████▏ | 8882/12384 [18:51:23<7:28:24, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 72%|███████▏ | 8882/12384 [18:51:30<7:28:24, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 72%|███████▏ | 8883/12384 [18:51:30<7:27:10, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 72%|███████▏ | 8883/12384 [18:51:38<7:27:10, 7.66s/it, loss=0.0002, acc=0.9990, iter_time=5.31s]
Epoch 2: 72%|███████▏ | 8884/12384 [18:51:38<7:26:01, 7.65s/it, loss=0.0002, acc=0.9990, iter_time=5.31s]
Epoch 2: 72%|███████▏ | 8884/12384 [18:51:45<7:26:01, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.27s]
Epoch 2: 72%|███████▏ | 8885/12384 [18:51:45<7:25:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.27s]
Epoch 2: 72%|███████▏ | 8885/12384 [18:51:53<7:25:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 72%|███████▏ | 8886/12384 [18:51:53<7:24:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 72%|███████▏ | 8886/12384 [18:52:01<7:24:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 72%|███████▏ | 8887/12384 [18:52:01<7:29:58, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 72%|███████▏ | 8887/12384 [18:52:09<7:29:58, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 2: 72%|███████▏ | 8888/12384 [18:52:09<7:28:04, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 2: 72%|███████▏ | 8888/12384 [18:52:16<7:28:04, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 72%|███████▏ | 8889/12384 [18:52:16<7:26:51, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 72%|███████▏ | 8889/12384 [18:52:24<7:26:51, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 72%|███████▏ | 8890/12384 [18:52:24<7:26:30, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 72%|███████▏ | 8890/12384 [18:52:32<7:26:30, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 2: 72%|███████▏ | 8891/12384 [18:52:32<7:25:56, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 2: 72%|███████▏ | 8891/12384 [18:52:39<7:25:56, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 2: 72%|███████▏ | 8892/12384 [18:52:39<7:25:21, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 2: 72%|███████▏ | 8892/12384 [18:52:47<7:25:21, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 2: 72%|███████▏ | 8893/12384 [18:52:47<7:24:30, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 2: 72%|███████▏ | 8893/12384 [18:52:54<7:24:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 72%|███████▏ | 8894/12384 [18:52:54<7:23:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 72%|███████▏ | 8894/12384 [18:53:02<7:23:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 72%|███████▏ | 8895/12384 [18:53:02<7:23:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 72%|███████▏ | 8895/12384 [18:53:10<7:23:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 72%|███████▏ | 8896/12384 [18:53:10<7:22:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 72%|███████▏ | 8896/12384 [18:53:17<7:22:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.92s]
Epoch 2: 72%|███████▏ | 8897/12384 [18:53:17<7:22:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.92s]
Epoch 2: 72%|███████▏ | 8897/12384 [18:53:25<7:22:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 2: 72%|███████▏ | 8898/12384 [18:53:25<7:22:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 2: 72%|███████▏ | 8898/12384 [18:53:32<7:22:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.80s]
Epoch 2: 72%|███████▏ | 8899/12384 [18:53:32<7:22:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.80s]
Epoch 2: 72%|███████▏ | 8899/12384 [18:53:40<7:22:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.69s]
Epoch 2: 72%|███████▏ | 8900/12384 [18:53:40<7:22:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.69s]
Epoch 2: 72%|███████▏ | 8900/12384 [18:53:48<7:22:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 2: 72%|███████▏ | 8901/12384 [18:53:48<7:21:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 2: 72%|███████▏ | 8901/12384 [18:53:55<7:21:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 72%|███████▏ | 8902/12384 [18:53:55<7:21:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 72%|███████▏ | 8902/12384 [18:54:03<7:21:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 72%|███████▏ | 8903/12384 [18:54:03<7:21:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 72%|███████▏ | 8903/12384 [18:54:11<7:21:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 72%|███████▏ | 8904/12384 [18:54:11<7:22:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 72%|███████▏ | 8904/12384 [18:54:18<7:22:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 2: 72%|███████▏ | 8905/12384 [18:54:18<7:22:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 2: 72%|███████▏ | 8905/12384 [18:54:26<7:22:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 72%|███████▏ | 8906/12384 [18:54:26<7:26:42, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 72%|███████▏ | 8906/12384 [18:54:34<7:26:42, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 72%|███████▏ | 8907/12384 [18:54:34<7:24:56, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 72%|███████▏ | 8907/12384 [18:54:41<7:24:56, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 72%|███████▏ | 8908/12384 [18:54:41<7:23:50, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 72%|███████▏ | 8908/12384 [18:54:49<7:23:50, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 72%|███████▏ | 8909/12384 [18:54:49<7:22:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 72%|███████▏ | 8909/12384 [18:54:56<7:22:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 72%|███████▏ | 8910/12384 [18:54:56<7:21:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 72%|███████▏ | 8910/12384 [18:55:04<7:21:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 72%|███████▏ | 8911/12384 [18:55:04<7:21:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 72%|███████▏ | 8911/12384 [18:55:12<7:21:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 72%|███████▏ | 8912/12384 [18:55:12<7:21:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 72%|███████▏ | 8912/12384 [18:55:20<7:21:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 72%|███████▏ | 8913/12384 [18:55:20<7:26:35, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 72%|███████▏ | 8913/12384 [18:55:27<7:26:35, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 72%|███████▏ | 8914/12384 [18:55:27<7:24:37, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 72%|███████▏ | 8914/12384 [18:55:35<7:24:37, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 72%|███████▏ | 8915/12384 [18:55:35<7:23:35, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 72%|███████▏ | 8915/12384 [18:55:43<7:23:35, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 72%|███████▏ | 8916/12384 [18:55:43<7:24:15, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 72%|███████▏ | 8916/12384 [18:55:50<7:24:15, 7.69s/it, loss=0.0003, acc=0.9998, iter_time=7.68s]
Epoch 2: 72%|███████▏ | 8917/12384 [18:55:50<7:23:09, 7.67s/it, loss=0.0003, acc=0.9998, iter_time=7.68s]
Epoch 2: 72%|███████▏ | 8917/12384 [18:55:58<7:23:09, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 2: 72%|███████▏ | 8918/12384 [18:55:58<7:21:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 2: 72%|███████▏ | 8918/12384 [18:56:06<7:21:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 2: 72%|███████▏ | 8919/12384 [18:56:06<7:22:17, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 2: 72%|███████▏ | 8919/12384 [18:56:13<7:22:17, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 2: 72%|███████▏ | 8920/12384 [18:56:13<7:21:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 2: 72%|███████▏ | 8920/12384 [18:56:21<7:21:20, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.15s]
Epoch 2: 72%|███████▏ | 8921/12384 [18:56:21<7:20:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.15s]
Epoch 2: 72%|███████▏ | 8921/12384 [18:56:28<7:20:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 2: 72%|███████▏ | 8922/12384 [18:56:28<7:20:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 2: 72%|███████▏ | 8922/12384 [18:56:36<7:20:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 72%|███████▏ | 8923/12384 [18:56:36<7:19:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 72%|███████▏ | 8923/12384 [18:56:44<7:19:47, 7.62s/it, loss=0.0001, acc=0.9990, iter_time=5.79s]
Epoch 2: 72%|███████▏ | 8924/12384 [18:56:44<7:19:17, 7.62s/it, loss=0.0001, acc=0.9990, iter_time=5.79s]
Epoch 2: 72%|███████▏ | 8924/12384 [18:56:51<7:19:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 2: 72%|███████▏ | 8925/12384 [18:56:51<7:19:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 2: 72%|███████▏ | 8925/12384 [18:56:59<7:19:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 72%|███████▏ | 8926/12384 [18:56:59<7:18:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 72%|███████▏ | 8926/12384 [18:57:06<7:18:47, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 2: 72%|███████▏ | 8927/12384 [18:57:06<7:18:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 2: 72%|███████▏ | 8927/12384 [18:57:14<7:18:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 72%|███████▏ | 8928/12384 [18:57:14<7:18:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 72%|███████▏ | 8928/12384 [18:57:22<7:18:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.62s]
Epoch 2: 72%|███████▏ | 8929/12384 [18:57:22<7:18:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.62s]
Epoch 2: 72%|███████▏ | 8929/12384 [18:57:29<7:18:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.12s]
Epoch 2: 72%|███████▏ | 8930/12384 [18:57:29<7:18:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.12s]
Epoch 2: 72%|███████▏ | 8930/12384 [18:57:37<7:18:31, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.71s]
Epoch 2: 72%|███████▏ | 8931/12384 [18:57:37<7:18:27, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.71s]
Epoch 2: 72%|███████▏ | 8931/12384 [18:57:44<7:18:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.44s]
Epoch 2: 72%|███████▏ | 8932/12384 [18:57:44<7:17:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.44s]
Epoch 2: 72%|███████▏ | 8932/12384 [18:57:52<7:17:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 72%|███████▏ | 8933/12384 [18:57:52<7:17:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 72%|███████▏ | 8933/12384 [18:58:00<7:17:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 72%|███████▏ | 8934/12384 [18:58:00<7:17:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 72%|███████▏ | 8934/12384 [18:58:07<7:17:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 2: 72%|███████▏ | 8935/12384 [18:58:07<7:17:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.32s]
Epoch 2: 72%|███████▏ | 8935/12384 [18:58:15<7:17:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.86s]
Epoch 2: 72%|███████▏ | 8936/12384 [18:58:15<7:17:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.86s]
Epoch 2: 72%|███████▏ | 8936/12384 [18:58:23<7:17:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.99s]
Epoch 2: 72%|███████▏ | 8937/12384 [18:58:23<7:19:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.99s]
Epoch 2: 72%|███████▏ | 8937/12384 [18:58:30<7:19:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 2: 72%|███████▏ | 8938/12384 [18:58:30<7:18:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 2: 72%|███████▏ | 8938/12384 [18:58:38<7:18:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 72%|███████▏ | 8939/12384 [18:58:38<7:23:26, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 72%|███████▏ | 8939/12384 [18:58:46<7:23:26, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 2: 72%|███████▏ | 8940/12384 [18:58:46<7:21:16, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 2: 72%|███████▏ | 8940/12384 [18:58:53<7:21:16, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 72%|███████▏ | 8941/12384 [18:58:53<7:19:43, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 72%|███████▏ | 8941/12384 [18:59:01<7:19:43, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 72%|███████▏ | 8942/12384 [18:59:01<7:18:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 72%|███████▏ | 8942/12384 [18:59:09<7:18:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 72%|███████▏ | 8943/12384 [18:59:09<7:17:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 72%|███████▏ | 8943/12384 [18:59:16<7:17:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 72%|███████▏ | 8944/12384 [18:59:16<7:17:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 72%|███████▏ | 8944/12384 [18:59:24<7:17:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 72%|███████▏ | 8945/12384 [18:59:24<7:16:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 72%|███████▏ | 8945/12384 [18:59:31<7:16:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 72%|███████▏ | 8946/12384 [18:59:31<7:16:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 72%|███████▏ | 8946/12384 [18:59:39<7:16:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 72%|███████▏ | 8947/12384 [18:59:39<7:16:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 72%|███████▏ | 8947/12384 [18:59:47<7:16:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 72%|███████▏ | 8948/12384 [18:59:47<7:16:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 72%|███████▏ | 8948/12384 [18:59:54<7:16:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 2: 72%|███████▏ | 8949/12384 [18:59:54<7:15:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 2: 72%|███████▏ | 8949/12384 [19:00:02<7:15:29, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 72%|███████▏ | 8950/12384 [19:00:02<7:15:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 72%|███████▏ | 8950/12384 [19:00:09<7:15:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 2: 72%|███████▏ | 8951/12384 [19:00:09<7:15:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 2: 72%|███████▏ | 8951/12384 [19:00:17<7:15:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 72%|███████▏ | 8952/12384 [19:00:17<7:15:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 72%|███████▏ | 8952/12384 [19:00:25<7:15:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.45s]
Epoch 2: 72%|███████▏ | 8953/12384 [19:00:25<7:15:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.45s]
Epoch 2: 72%|███████▏ | 8953/12384 [19:00:32<7:15:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 2: 72%|███████▏ | 8954/12384 [19:00:32<7:15:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 2: 72%|███████▏ | 8954/12384 [19:00:40<7:15:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 2: 72%|███████▏ | 8955/12384 [19:00:40<7:15:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 2: 72%|███████▏ | 8955/12384 [19:00:48<7:15:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.18s]
Epoch 2: 72%|███████▏ | 8956/12384 [19:00:48<7:15:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.18s]
Epoch 2: 72%|███████▏ | 8956/12384 [19:00:55<7:15:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 2: 72%|███████▏ | 8957/12384 [19:00:55<7:15:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 2: 72%|███████▏ | 8957/12384 [19:01:03<7:15:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 2: 72%|███████▏ | 8958/12384 [19:01:03<7:15:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 2: 72%|███████▏ | 8958/12384 [19:01:10<7:15:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.23s]
Epoch 2: 72%|███████▏ | 8959/12384 [19:01:10<7:14:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.23s]
Epoch 2: 72%|███████▏ | 8959/12384 [19:01:18<7:14:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.74s]
Epoch 2: 72%|███████▏ | 8960/12384 [19:01:18<7:14:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.74s]
Epoch 2: 72%|███████▏ | 8960/12384 [19:01:26<7:14:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.05s]
Epoch 2: 72%|███████▏ | 8961/12384 [19:01:26<7:14:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.05s]
Epoch 2: 72%|███████▏ | 8961/12384 [19:01:33<7:14:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.21s]
Epoch 2: 72%|███████▏ | 8962/12384 [19:01:33<7:14:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.21s]
Epoch 2: 72%|███████▏ | 8962/12384 [19:01:41<7:14:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 2: 72%|███████▏ | 8963/12384 [19:01:41<7:14:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 2: 72%|███████▏ | 8963/12384 [19:01:49<7:14:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 2: 72%|███████▏ | 8964/12384 [19:01:49<7:13:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 2: 72%|███████▏ | 8964/12384 [19:01:56<7:13:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 2: 72%|███████▏ | 8965/12384 [19:01:56<7:19:29, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.14s]
Epoch 2: 72%|███████▏ | 8965/12384 [19:02:04<7:19:29, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 72%|███████▏ | 8966/12384 [19:02:04<7:17:56, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 72%|███████▏ | 8966/12384 [19:02:12<7:17:56, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 2: 72%|███████▏ | 8967/12384 [19:02:12<7:16:12, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 2: 72%|███████▏ | 8967/12384 [19:02:19<7:16:12, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 72%|███████▏ | 8968/12384 [19:02:19<7:15:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 72%|███████▏ | 8968/12384 [19:02:27<7:15:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 72%|███████▏ | 8969/12384 [19:02:27<7:14:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 72%|███████▏ | 8969/12384 [19:02:35<7:14:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 2: 72%|███████▏ | 8970/12384 [19:02:35<7:13:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 2: 72%|███████▏ | 8970/12384 [19:02:42<7:13:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 2: 72%|███████▏ | 8971/12384 [19:02:42<7:13:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 2: 72%|███████▏ | 8971/12384 [19:02:50<7:13:26, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=6.17s]
Epoch 2: 72%|███████▏ | 8972/12384 [19:02:50<7:15:30, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=6.17s]
Epoch 2: 72%|███████▏ | 8972/12384 [19:02:57<7:15:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.97s]
Epoch 2: 72%|███████▏ | 8973/12384 [19:02:57<7:14:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.97s]
Epoch 2: 72%|███████▏ | 8973/12384 [19:03:05<7:14:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.50s]
Epoch 2: 72%|███████▏ | 8974/12384 [19:03:05<7:13:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.50s]
Epoch 2: 72%|███████▏ | 8974/12384 [19:03:13<7:13:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 2: 72%|███████▏ | 8975/12384 [19:03:13<7:13:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 2: 72%|███████▏ | 8975/12384 [19:03:20<7:13:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 72%|███████▏ | 8976/12384 [19:03:20<7:13:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 72%|███████▏ | 8976/12384 [19:03:28<7:13:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 72%|███████▏ | 8977/12384 [19:03:28<7:12:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 72%|███████▏ | 8977/12384 [19:03:36<7:12:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 72%|███████▏ | 8978/12384 [19:03:36<7:12:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 72%|███████▏ | 8978/12384 [19:03:43<7:12:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 2: 73%|███████▎ | 8979/12384 [19:03:43<7:12:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 2: 73%|███████▎ | 8979/12384 [19:03:51<7:12:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 2: 73%|███████▎ | 8980/12384 [19:03:51<7:11:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 2: 73%|███████▎ | 8980/12384 [19:03:58<7:11:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 73%|███████▎ | 8981/12384 [19:03:58<7:11:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 73%|███████▎ | 8981/12384 [19:04:06<7:11:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 73%|███████▎ | 8982/12384 [19:04:06<7:11:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 73%|███████▎ | 8982/12384 [19:04:14<7:11:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.90s]
Epoch 2: 73%|███████▎ | 8983/12384 [19:04:14<7:11:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.90s]
Epoch 2: 73%|███████▎ | 8983/12384 [19:04:21<7:11:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.32s]
Epoch 2: 73%|███████▎ | 8984/12384 [19:04:21<7:11:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.32s]
Epoch 2: 73%|███████▎ | 8984/12384 [19:04:29<7:11:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 2: 73%|███████▎ | 8985/12384 [19:04:29<7:15:51, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 2: 73%|███████▎ | 8985/12384 [19:04:37<7:15:51, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 73%|███████▎ | 8986/12384 [19:04:37<7:14:35, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 73%|███████▎ | 8986/12384 [19:04:44<7:14:35, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 73%|███████▎ | 8987/12384 [19:04:44<7:13:28, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 73%|███████▎ | 8987/12384 [19:04:52<7:13:28, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 2: 73%|███████▎ | 8988/12384 [19:04:52<7:12:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 2: 73%|███████▎ | 8988/12384 [19:05:00<7:12:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 2: 73%|███████▎ | 8989/12384 [19:05:00<7:11:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 2: 73%|███████▎ | 8989/12384 [19:05:07<7:11:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 73%|███████▎ | 8990/12384 [19:05:07<7:11:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 73%|███████▎ | 8990/12384 [19:05:15<7:11:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 73%|███████▎ | 8991/12384 [19:05:15<7:11:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 73%|███████▎ | 8991/12384 [19:05:23<7:11:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 2: 73%|███████▎ | 8992/12384 [19:05:23<7:15:38, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.37s]
Epoch 2: 73%|███████▎ | 8992/12384 [19:05:30<7:15:38, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 73%|███████▎ | 8993/12384 [19:05:30<7:14:01, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 73%|███████▎ | 8993/12384 [19:05:38<7:14:01, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 73%|███████▎ | 8994/12384 [19:05:38<7:12:51, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 73%|███████▎ | 8994/12384 [19:05:46<7:12:51, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 2: 73%|███████▎ | 8995/12384 [19:05:46<7:13:36, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.58s]
Epoch 2: 73%|███████▎ | 8995/12384 [19:05:53<7:13:36, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 73%|███████▎ | 8996/12384 [19:05:53<7:12:34, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 73%|███████▎ | 8996/12384 [19:06:01<7:12:34, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 2: 73%|███████▎ | 8997/12384 [19:06:01<7:11:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 2: 73%|███████▎ | 8997/12384 [19:06:09<7:11:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 2: 73%|███████▎ | 8998/12384 [19:06:09<7:12:53, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 2: 73%|███████▎ | 8998/12384 [19:06:16<7:12:53, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 2: 73%|███████▎ | 8999/12384 [19:06:16<7:11:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 2: 73%|███████▎ | 8999/12384 [19:06:24<7:11:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 2: 73%|███████▎ | 9000/12384 [19:06:24<7:10:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 2: 73%|███████▎ | 9000/12384 [19:06:31<7:10:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.87s]
Epoch 2: 73%|███████▎ | 9001/12384 [19:06:31<7:09:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.87s]
Epoch 2: 73%|███████▎ | 9001/12384 [19:06:39<7:09:54, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.95s]
Epoch 2: 73%|███████▎ | 9002/12384 [19:06:39<7:09:42, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=10.95s]
Epoch 2: 73%|███████▎ | 9002/12384 [19:06:47<7:09:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.17s]
Epoch 2: 73%|███████▎ | 9003/12384 [19:06:47<7:09:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.17s]
Epoch 2: 73%|███████▎ | 9003/12384 [19:06:54<7:09:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 2: 73%|███████▎ | 9004/12384 [19:06:54<7:09:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 2: 73%|███████▎ | 9004/12384 [19:07:02<7:09:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.61s]
Epoch 2: 73%|███████▎ | 9005/12384 [19:07:02<7:09:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.61s]
Epoch 2: 73%|███████▎ | 9005/12384 [19:07:10<7:09:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 2: 73%|███████▎ | 9006/12384 [19:07:10<7:09:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 2: 73%|███████▎ | 9006/12384 [19:07:17<7:09:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 2: 73%|███████▎ | 9007/12384 [19:07:17<7:09:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 2: 73%|███████▎ | 9007/12384 [19:07:25<7:09:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 2: 73%|███████▎ | 9008/12384 [19:07:25<7:09:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 2: 73%|███████▎ | 9008/12384 [19:07:32<7:09:29, 7.63s/it, loss=0.0001, acc=0.9997, iter_time=7.21s]
Epoch 2: 73%|███████▎ | 9009/12384 [19:07:32<7:09:01, 7.63s/it, loss=0.0001, acc=0.9997, iter_time=7.21s]
Epoch 2: 73%|███████▎ | 9009/12384 [19:07:40<7:09:01, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 73%|███████▎ | 9010/12384 [19:07:40<7:09:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 73%|███████▎ | 9010/12384 [19:07:48<7:09:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 2: 73%|███████▎ | 9011/12384 [19:07:48<7:16:02, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 2: 73%|███████▎ | 9011/12384 [19:07:56<7:16:02, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=5.05s]
Epoch 2: 73%|███████▎ | 9012/12384 [19:07:56<7:13:55, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.05s]
Epoch 2: 73%|███████▎ | 9012/12384 [19:08:03<7:13:55, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 73%|███████▎ | 9013/12384 [19:08:03<7:11:14, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 73%|███████▎ | 9013/12384 [19:08:11<7:11:14, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 2: 73%|███████▎ | 9014/12384 [19:08:11<7:10:06, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 2: 73%|███████▎ | 9014/12384 [19:08:19<7:10:06, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 2: 73%|███████▎ | 9015/12384 [19:08:19<7:09:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 2: 73%|███████▎ | 9015/12384 [19:08:26<7:09:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 2: 73%|███████▎ | 9016/12384 [19:08:26<7:08:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 2: 73%|███████▎ | 9016/12384 [19:08:34<7:08:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.63s]
Epoch 2: 73%|███████▎ | 9017/12384 [19:08:34<7:08:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.63s]
Epoch 2: 73%|███████▎ | 9017/12384 [19:08:42<7:08:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.68s]
Epoch 2: 73%|███████▎ | 9018/12384 [19:08:42<7:13:08, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.68s]
Epoch 2: 73%|███████▎ | 9018/12384 [19:08:49<7:13:08, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.18s]
Epoch 2: 73%|███████▎ | 9019/12384 [19:08:49<7:10:51, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.18s]
Epoch 2: 73%|███████▎ | 9019/12384 [19:08:57<7:10:51, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.87s]
Epoch 2: 73%|███████▎ | 9020/12384 [19:08:57<7:09:57, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.87s]
Epoch 2: 73%|███████▎ | 9020/12384 [19:09:05<7:09:57, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 2: 73%|███████▎ | 9021/12384 [19:09:05<7:09:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 2: 73%|███████▎ | 9021/12384 [19:09:12<7:09:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 73%|███████▎ | 9022/12384 [19:09:12<7:08:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 73%|███████▎ | 9022/12384 [19:09:20<7:08:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.41s]
Epoch 2: 73%|███████▎ | 9023/12384 [19:09:20<7:07:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.41s]
Epoch 2: 73%|███████▎ | 9023/12384 [19:09:27<7:07:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.82s]
Epoch 2: 73%|███████▎ | 9024/12384 [19:09:27<7:06:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.82s]
Epoch 2: 73%|███████▎ | 9024/12384 [19:09:35<7:06:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 73%|███████▎ | 9025/12384 [19:09:35<7:07:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 73%|███████▎ | 9025/12384 [19:09:43<7:07:58, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 73%|███████▎ | 9026/12384 [19:09:43<7:07:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 73%|███████▎ | 9026/12384 [19:09:50<7:07:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 73%|███████▎ | 9027/12384 [19:09:50<7:07:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 73%|███████▎ | 9027/12384 [19:09:58<7:07:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 73%|███████▎ | 9028/12384 [19:09:58<7:06:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 73%|███████▎ | 9028/12384 [19:10:06<7:06:23, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.50s]
Epoch 2: 73%|███████▎ | 9029/12384 [19:10:06<7:05:56, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.50s]
Epoch 2: 73%|███████▎ | 9029/12384 [19:10:13<7:05:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 2: 73%|███████▎ | 9030/12384 [19:10:13<7:05:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 2: 73%|███████▎ | 9030/12384 [19:10:21<7:05:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 2: 73%|███████▎ | 9031/12384 [19:10:21<7:05:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.84s]
Epoch 2: 73%|███████▎ | 9031/12384 [19:10:28<7:05:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.79s]
Epoch 2: 73%|███████▎ | 9032/12384 [19:10:28<7:05:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.79s]
Epoch 2: 73%|███████▎ | 9032/12384 [19:10:36<7:05:21, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=7.20s]
Epoch 2: 73%|███████▎ | 9033/12384 [19:10:36<7:05:13, 7.61s/it, loss=0.0001, acc=0.9999, iter_time=7.20s]
Epoch 2: 73%|███████▎ | 9033/12384 [19:10:44<7:05:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 73%|███████▎ | 9034/12384 [19:10:44<7:04:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 73%|███████▎ | 9034/12384 [19:10:51<7:04:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 73%|███████▎ | 9035/12384 [19:10:51<7:04:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 73%|███████▎ | 9035/12384 [19:10:59<7:04:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 2: 73%|███████▎ | 9036/12384 [19:10:59<7:04:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 2: 73%|███████▎ | 9036/12384 [19:11:07<7:04:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 2: 73%|███████▎ | 9037/12384 [19:11:07<7:08:55, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.76s]
Epoch 2: 73%|███████▎ | 9037/12384 [19:11:14<7:08:55, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 73%|███████▎ | 9038/12384 [19:11:14<7:07:45, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 73%|███████▎ | 9038/12384 [19:11:22<7:07:45, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 73%|███████▎ | 9039/12384 [19:11:22<7:07:52, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 73%|███████▎ | 9039/12384 [19:11:30<7:07:52, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.38s]
Epoch 2: 73%|███████▎ | 9040/12384 [19:11:30<7:06:45, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.38s]
Epoch 2: 73%|███████▎ | 9040/12384 [19:11:37<7:06:45, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 73%|███████▎ | 9041/12384 [19:11:37<7:05:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 73%|███████▎ | 9041/12384 [19:11:45<7:05:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 73%|███████▎ | 9042/12384 [19:11:45<7:04:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 73%|███████▎ | 9042/12384 [19:11:52<7:04:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 73%|███████▎ | 9043/12384 [19:11:52<7:04:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 73%|███████▎ | 9043/12384 [19:12:00<7:04:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 73%|███████▎ | 9044/12384 [19:12:00<7:04:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 73%|███████▎ | 9044/12384 [19:12:08<7:04:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 73%|███████▎ | 9045/12384 [19:12:08<7:08:55, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 73%|███████▎ | 9045/12384 [19:12:16<7:08:55, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 73%|███████▎ | 9046/12384 [19:12:16<7:08:01, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 73%|███████▎ | 9046/12384 [19:12:23<7:08:01, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 73%|███████▎ | 9047/12384 [19:12:23<7:06:26, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 73%|███████▎ | 9047/12384 [19:12:31<7:06:26, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 73%|███████▎ | 9048/12384 [19:12:31<7:05:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 73%|███████▎ | 9048/12384 [19:12:38<7:05:32, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 73%|███████▎ | 9049/12384 [19:12:38<7:04:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 73%|███████▎ | 9049/12384 [19:12:46<7:04:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 73%|███████▎ | 9050/12384 [19:12:46<7:03:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 73%|███████▎ | 9050/12384 [19:12:54<7:03:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 73%|███████▎ | 9051/12384 [19:12:54<7:04:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 73%|███████▎ | 9051/12384 [19:13:01<7:04:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 2: 73%|███████▎ | 9052/12384 [19:13:01<7:03:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 2: 73%|███████▎ | 9052/12384 [19:13:09<7:03:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 2: 73%|███████▎ | 9053/12384 [19:13:09<7:02:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.92s]
Epoch 2: 73%|███████▎ | 9053/12384 [19:13:17<7:02:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.49s]
Epoch 2: 73%|███████▎ | 9054/12384 [19:13:17<7:02:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.49s]
Epoch 2: 73%|███████▎ | 9054/12384 [19:13:24<7:02:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 73%|███████▎ | 9055/12384 [19:13:24<7:02:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 73%|███████▎ | 9055/12384 [19:13:32<7:02:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.33s]
Epoch 2: 73%|███████▎ | 9056/12384 [19:13:32<7:01:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.33s]
Epoch 2: 73%|███████▎ | 9056/12384 [19:13:39<7:01:54, 7.61s/it, loss=0.0005, acc=0.9981, iter_time=6.20s]
Epoch 2: 73%|███████▎ | 9057/12384 [19:13:39<7:01:51, 7.61s/it, loss=0.0005, acc=0.9981, iter_time=6.20s]
Epoch 2: 73%|███████▎ | 9057/12384 [19:13:47<7:01:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 2: 73%|███████▎ | 9058/12384 [19:13:47<7:01:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 2: 73%|███████▎ | 9058/12384 [19:13:55<7:01:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.77s]
Epoch 2: 73%|███████▎ | 9059/12384 [19:13:55<7:01:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.77s]
Epoch 2: 73%|███████▎ | 9059/12384 [19:14:02<7:01:41, 7.61s/it, loss=0.0007, acc=0.9987, iter_time=7.60s]
Epoch 2: 73%|███████▎ | 9060/12384 [19:14:02<7:01:34, 7.61s/it, loss=0.0007, acc=0.9987, iter_time=7.60s]
Epoch 2: 73%|███████▎ | 9060/12384 [19:14:10<7:01:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.90s]
Epoch 2: 73%|███████▎ | 9061/12384 [19:14:10<7:01:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.90s]
Epoch 2: 73%|███████▎ | 9061/12384 [19:14:17<7:01:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.20s]
Epoch 2: 73%|███████▎ | 9062/12384 [19:14:17<7:01:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.20s]
Epoch 2: 73%|███████▎ | 9062/12384 [19:14:25<7:01:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 2: 73%|███████▎ | 9063/12384 [19:14:25<7:01:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 2: 73%|███████▎ | 9063/12384 [19:14:33<7:01:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.24s]
Epoch 2: 73%|███████▎ | 9064/12384 [19:14:33<7:01:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.24s]
Epoch 2: 73%|███████▎ | 9064/12384 [19:14:40<7:01:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.62s]
Epoch 2: 73%|███████▎ | 9065/12384 [19:14:40<7:00:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.62s]
Epoch 2: 73%|███████▎ | 9065/12384 [19:14:48<7:00:45, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 2: 73%|███████▎ | 9066/12384 [19:14:48<7:00:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.45s]
Epoch 2: 73%|███████▎ | 9066/12384 [19:14:55<7:00:22, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.32s]
Epoch 2: 73%|███████▎ | 9067/12384 [19:14:55<7:00:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.32s]
Epoch 2: 73%|███████▎ | 9067/12384 [19:15:03<7:00:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 73%|███████▎ | 9068/12384 [19:15:03<7:00:16, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 73%|███████▎ | 9068/12384 [19:15:11<7:00:16, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 2: 73%|███████▎ | 9069/12384 [19:15:11<7:00:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 2: 73%|███████▎ | 9069/12384 [19:15:18<7:00:06, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 2: 73%|███████▎ | 9070/12384 [19:15:18<7:00:01, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 2: 73%|███████▎ | 9070/12384 [19:15:26<7:00:01, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 73%|███████▎ | 9071/12384 [19:15:26<7:05:59, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 73%|███████▎ | 9071/12384 [19:15:34<7:05:59, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 2: 73%|███████▎ | 9072/12384 [19:15:34<7:04:23, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 2: 73%|███████▎ | 9072/12384 [19:15:41<7:04:23, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 73%|███████▎ | 9073/12384 [19:15:41<7:03:02, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 73%|███████▎ | 9073/12384 [19:15:49<7:03:02, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 73%|███████▎ | 9074/12384 [19:15:49<7:01:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 73%|███████▎ | 9074/12384 [19:15:57<7:01:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 73%|███████▎ | 9075/12384 [19:15:57<7:00:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 73%|███████▎ | 9075/12384 [19:16:04<7:00:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 2: 73%|███████▎ | 9076/12384 [19:16:04<6:59:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.79s]
Epoch 2: 73%|███████▎ | 9076/12384 [19:16:12<6:59:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 2: 73%|███████▎ | 9077/12384 [19:16:12<6:59:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 2: 73%|███████▎ | 9077/12384 [19:16:19<6:59:39, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 2: 73%|███████▎ | 9078/12384 [19:16:19<7:00:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 2: 73%|███████▎ | 9078/12384 [19:16:27<7:00:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 2: 73%|███████▎ | 9079/12384 [19:16:27<7:00:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 2: 73%|███████▎ | 9079/12384 [19:16:35<7:00:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 73%|███████▎ | 9080/12384 [19:16:35<7:00:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 73%|███████▎ | 9080/12384 [19:16:42<7:00:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.08s]
Epoch 2: 73%|███████▎ | 9081/12384 [19:16:42<7:00:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.08s]
Epoch 2: 73%|███████▎ | 9081/12384 [19:16:50<7:00:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.63s]
Epoch 2: 73%|███████▎ | 9082/12384 [19:16:50<7:00:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.63s]
Epoch 2: 73%|███████▎ | 9082/12384 [19:16:58<7:00:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 73%|███████▎ | 9083/12384 [19:16:58<6:59:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 73%|███████▎ | 9083/12384 [19:17:05<6:59:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 2: 73%|███████▎ | 9084/12384 [19:17:05<6:59:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 2: 73%|███████▎ | 9084/12384 [19:17:13<6:59:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 2: 73%|███████▎ | 9085/12384 [19:17:13<6:59:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 2: 73%|███████▎ | 9085/12384 [19:17:21<6:59:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 73%|███████▎ | 9086/12384 [19:17:21<6:58:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 73%|███████▎ | 9086/12384 [19:17:28<6:58:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 2: 73%|███████▎ | 9087/12384 [19:17:28<6:58:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 2: 73%|███████▎ | 9087/12384 [19:17:36<6:58:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.67s]
Epoch 2: 73%|███████▎ | 9088/12384 [19:17:36<6:59:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.67s]
Epoch 2: 73%|███████▎ | 9088/12384 [19:17:43<6:59:51, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.98s]
Epoch 2: 73%|███████▎ | 9089/12384 [19:17:43<6:59:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.98s]
Epoch 2: 73%|███████▎ | 9089/12384 [19:17:51<6:59:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 2: 73%|███████▎ | 9090/12384 [19:17:51<6:58:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 2: 73%|███████▎ | 9090/12384 [19:17:59<6:58:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.10s]
Epoch 2: 73%|███████▎ | 9091/12384 [19:17:59<6:57:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.10s]
Epoch 2: 73%|███████▎ | 9091/12384 [19:18:06<6:57:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 73%|███████▎ | 9092/12384 [19:18:06<6:57:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 73%|███████▎ | 9092/12384 [19:18:14<6:57:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 2: 73%|███████▎ | 9093/12384 [19:18:14<6:57:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 2: 73%|███████▎ | 9093/12384 [19:18:21<6:57:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.43s]
Epoch 2: 73%|███████▎ | 9094/12384 [19:18:21<6:57:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.43s]
Epoch 2: 73%|███████▎ | 9094/12384 [19:18:29<6:57:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.01s]
Epoch 2: 73%|███████▎ | 9095/12384 [19:18:29<6:57:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.01s]
Epoch 2: 73%|███████▎ | 9095/12384 [19:18:37<6:57:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 73%|███████▎ | 9096/12384 [19:18:37<6:57:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 73%|███████▎ | 9096/12384 [19:18:45<6:57:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 73%|███████▎ | 9097/12384 [19:18:45<7:02:41, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 73%|███████▎ | 9097/12384 [19:18:52<7:02:41, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 2: 73%|███████▎ | 9098/12384 [19:18:52<7:00:42, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 2: 73%|███████▎ | 9098/12384 [19:19:00<7:00:42, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 2: 73%|███████▎ | 9099/12384 [19:19:00<6:59:23, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 2: 73%|███████▎ | 9099/12384 [19:19:07<6:59:23, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.02s]
Epoch 2: 73%|███████▎ | 9100/12384 [19:19:07<6:58:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.02s]
Epoch 2: 73%|███████▎ | 9100/12384 [19:19:15<6:58:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.99s]
Epoch 2: 73%|███████▎ | 9101/12384 [19:19:15<6:57:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.99s]
Epoch 2: 73%|███████▎ | 9101/12384 [19:19:23<6:57:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 2: 73%|███████▎ | 9102/12384 [19:19:23<6:56:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 2: 73%|███████▎ | 9102/12384 [19:19:30<6:56:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 2: 74%|███████▎ | 9103/12384 [19:19:30<6:56:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 2: 74%|███████▎ | 9103/12384 [19:19:38<6:56:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 2: 74%|███████▎ | 9104/12384 [19:19:38<6:56:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.77s]
Epoch 2: 74%|███████▎ | 9104/12384 [19:19:45<6:56:15, 7.61s/it, loss=0.0003, acc=0.9986, iter_time=7.68s]
Epoch 2: 74%|███████▎ | 9105/12384 [19:19:45<6:56:11, 7.62s/it, loss=0.0003, acc=0.9986, iter_time=7.68s]
Epoch 2: 74%|███████▎ | 9105/12384 [19:19:53<6:56:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 74%|███████▎ | 9106/12384 [19:19:53<6:56:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 74%|███████▎ | 9106/12384 [19:20:01<6:56:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 2: 74%|███████▎ | 9107/12384 [19:20:01<6:55:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 2: 74%|███████▎ | 9107/12384 [19:20:08<6:55:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.02s]
Epoch 2: 74%|███████▎ | 9108/12384 [19:20:08<6:55:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.02s]
Epoch 2: 74%|███████▎ | 9108/12384 [19:20:16<6:55:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 2: 74%|███████▎ | 9109/12384 [19:20:16<6:55:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.08s]
Epoch 2: 74%|███████▎ | 9109/12384 [19:20:24<6:55:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.66s]
Epoch 2: 74%|███████▎ | 9110/12384 [19:20:24<6:57:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.66s]
Epoch 2: 74%|███████▎ | 9110/12384 [19:20:31<6:57:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 2: 74%|███████▎ | 9111/12384 [19:20:31<6:56:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 2: 74%|███████▎ | 9111/12384 [19:20:39<6:56:22, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 2: 74%|███████▎ | 9112/12384 [19:20:39<6:56:26, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 2: 74%|███████▎ | 9112/12384 [19:20:47<6:56:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.79s]
Epoch 2: 74%|███████▎ | 9113/12384 [19:20:47<6:55:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.79s]
Epoch 2: 74%|███████▎ | 9113/12384 [19:20:54<6:55:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 2: 74%|███████▎ | 9114/12384 [19:20:54<6:55:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.47s]
Epoch 2: 74%|███████▎ | 9114/12384 [19:21:02<6:55:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 2: 74%|███████▎ | 9115/12384 [19:21:02<6:55:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 2: 74%|███████▎ | 9115/12384 [19:21:09<6:55:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.80s]
Epoch 2: 74%|███████▎ | 9116/12384 [19:21:09<6:54:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.80s]
Epoch 2: 74%|███████▎ | 9116/12384 [19:21:17<6:54:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 2: 74%|███████▎ | 9117/12384 [19:21:17<6:54:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.65s]
Epoch 2: 74%|███████▎ | 9117/12384 [19:21:25<6:54:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 2: 74%|███████▎ | 9118/12384 [19:21:25<6:54:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 2: 74%|███████▎ | 9118/12384 [19:21:32<6:54:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 2: 74%|███████▎ | 9119/12384 [19:21:32<6:54:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 2: 74%|███████▎ | 9119/12384 [19:21:40<6:54:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 74%|███████▎ | 9120/12384 [19:21:40<6:53:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 74%|███████▎ | 9120/12384 [19:21:47<6:53:54, 7.61s/it, loss=0.0005, acc=0.9969, iter_time=7.63s]
Epoch 2: 74%|███████▎ | 9121/12384 [19:21:47<6:53:12, 7.60s/it, loss=0.0005, acc=0.9969, iter_time=7.63s]
Epoch 2: 74%|███████▎ | 9121/12384 [19:21:55<6:53:12, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 74%|███████▎ | 9122/12384 [19:21:55<6:53:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 74%|███████▎ | 9122/12384 [19:22:03<6:53:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 74%|███████▎ | 9123/12384 [19:22:03<7:00:02, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 74%|███████▎ | 9123/12384 [19:22:11<7:00:02, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 74%|███████▎ | 9124/12384 [19:22:11<6:59:48, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 74%|███████▎ | 9124/12384 [19:22:18<6:59:48, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 74%|███████▎ | 9125/12384 [19:22:18<6:57:57, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 74%|███████▎ | 9125/12384 [19:22:26<6:57:57, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 74%|███████▎ | 9126/12384 [19:22:26<6:56:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 74%|███████▎ | 9126/12384 [19:22:34<6:56:37, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 2: 74%|███████▎ | 9127/12384 [19:22:34<6:55:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 2: 74%|███████▎ | 9127/12384 [19:22:41<6:55:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.45s]
Epoch 2: 74%|███████▎ | 9128/12384 [19:22:41<6:54:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.45s]
Epoch 2: 74%|███████▎ | 9128/12384 [19:22:49<6:54:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 74%|███████▎ | 9129/12384 [19:22:49<6:55:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 74%|███████▎ | 9129/12384 [19:22:57<6:55:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 74%|███████▎ | 9130/12384 [19:22:57<6:55:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 74%|███████▎ | 9130/12384 [19:23:04<6:55:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 74%|███████▎ | 9131/12384 [19:23:04<6:54:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 74%|███████▎ | 9131/12384 [19:23:12<6:54:30, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 74%|███████▎ | 9132/12384 [19:23:12<6:53:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 74%|███████▎ | 9132/12384 [19:23:19<6:53:29, 7.63s/it, loss=0.0001, acc=0.9987, iter_time=7.21s]
Epoch 2: 74%|███████▎ | 9133/12384 [19:23:19<6:53:03, 7.62s/it, loss=0.0001, acc=0.9987, iter_time=7.21s]
Epoch 2: 74%|███████▎ | 9133/12384 [19:23:27<6:53:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 74%|███████▍ | 9134/12384 [19:23:27<6:52:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 74%|███████▍ | 9134/12384 [19:23:35<6:52:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 74%|███████▍ | 9135/12384 [19:23:35<6:52:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 74%|███████▍ | 9135/12384 [19:23:42<6:52:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 74%|███████▍ | 9136/12384 [19:23:42<6:52:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 74%|███████▍ | 9136/12384 [19:23:50<6:52:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 2: 74%|███████▍ | 9137/12384 [19:23:50<6:52:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.34s]
Epoch 2: 74%|███████▍ | 9137/12384 [19:23:57<6:52:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 2: 74%|███████▍ | 9138/12384 [19:23:57<6:52:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 2: 74%|███████▍ | 9138/12384 [19:24:05<6:52:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 74%|███████▍ | 9139/12384 [19:24:05<6:52:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 74%|███████▍ | 9139/12384 [19:24:13<6:52:34, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 74%|███████▍ | 9140/12384 [19:24:13<6:52:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 74%|███████▍ | 9140/12384 [19:24:20<6:52:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 2: 74%|███████▍ | 9141/12384 [19:24:20<6:51:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 2: 74%|███████▍ | 9141/12384 [19:24:28<6:51:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 2: 74%|███████▍ | 9142/12384 [19:24:28<6:55:46, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.19s]
Epoch 2: 74%|███████▍ | 9142/12384 [19:24:36<6:55:46, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 74%|███████▍ | 9143/12384 [19:24:36<6:55:22, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 74%|███████▍ | 9143/12384 [19:24:43<6:55:22, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 2: 74%|███████▍ | 9144/12384 [19:24:43<6:54:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 2: 74%|███████▍ | 9144/12384 [19:24:51<6:54:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 74%|███████▍ | 9145/12384 [19:24:51<6:52:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 74%|███████▍ | 9145/12384 [19:24:59<6:52:54, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 74%|███████▍ | 9146/12384 [19:24:59<6:51:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 74%|███████▍ | 9146/12384 [19:25:06<6:51:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 2: 74%|███████▍ | 9147/12384 [19:25:06<6:51:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 2: 74%|███████▍ | 9147/12384 [19:25:14<6:51:36, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.32s]
Epoch 2: 74%|███████▍ | 9148/12384 [19:25:14<6:50:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.32s]
Epoch 2: 74%|███████▍ | 9148/12384 [19:25:22<6:50:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 2: 74%|███████▍ | 9149/12384 [19:25:22<6:56:40, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.19s]
Epoch 2: 74%|███████▍ | 9149/12384 [19:25:30<6:56:40, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 2: 74%|███████▍ | 9150/12384 [19:25:30<6:56:51, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 2: 74%|███████▍ | 9150/12384 [19:25:37<6:56:51, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 2: 74%|███████▍ | 9151/12384 [19:25:37<6:56:30, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 2: 74%|███████▍ | 9151/12384 [19:25:45<6:56:30, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=10.91s]
Epoch 2: 74%|███████▍ | 9152/12384 [19:25:45<6:54:16, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.91s]
Epoch 2: 74%|███████▍ | 9152/12384 [19:25:53<6:54:16, 7.69s/it, loss=0.0003, acc=0.9993, iter_time=7.21s]
Epoch 2: 74%|███████▍ | 9153/12384 [19:25:53<6:52:56, 7.67s/it, loss=0.0003, acc=0.9993, iter_time=7.21s]
Epoch 2: 74%|███████▍ | 9153/12384 [19:26:00<6:52:56, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 74%|███████▍ | 9154/12384 [19:26:00<6:51:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 74%|███████▍ | 9154/12384 [19:26:08<6:51:32, 7.64s/it, loss=0.0004, acc=0.9982, iter_time=7.61s]
Epoch 2: 74%|███████▍ | 9155/12384 [19:26:08<6:50:51, 7.63s/it, loss=0.0004, acc=0.9982, iter_time=7.61s]
Epoch 2: 74%|███████▍ | 9155/12384 [19:26:15<6:50:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 74%|███████▍ | 9156/12384 [19:26:15<6:50:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 74%|███████▍ | 9156/12384 [19:26:23<6:50:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 2: 74%|███████▍ | 9157/12384 [19:26:23<6:50:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 2: 74%|███████▍ | 9157/12384 [19:26:31<6:50:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 2: 74%|███████▍ | 9158/12384 [19:26:31<6:50:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 2: 74%|███████▍ | 9158/12384 [19:26:38<6:50:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 74%|███████▍ | 9159/12384 [19:26:38<6:50:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 74%|███████▍ | 9159/12384 [19:26:46<6:50:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 2: 74%|███████▍ | 9160/12384 [19:26:46<6:49:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 2: 74%|███████▍ | 9160/12384 [19:26:53<6:49:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 74%|███████▍ | 9161/12384 [19:26:53<6:48:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 74%|███████▍ | 9161/12384 [19:27:01<6:48:44, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 2: 74%|███████▍ | 9162/12384 [19:27:01<6:49:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 2: 74%|███████▍ | 9162/12384 [19:27:09<6:49:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 2: 74%|███████▍ | 9163/12384 [19:27:09<6:49:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 2: 74%|███████▍ | 9163/12384 [19:27:16<6:49:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 74%|███████▍ | 9164/12384 [19:27:16<6:48:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 74%|███████▍ | 9164/12384 [19:27:24<6:48:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 74%|███████▍ | 9165/12384 [19:27:24<6:48:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 74%|███████▍ | 9165/12384 [19:27:32<6:48:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.22s]
Epoch 2: 74%|███████▍ | 9166/12384 [19:27:32<6:48:08, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.22s]
Epoch 2: 74%|███████▍ | 9166/12384 [19:27:39<6:48:08, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.99s]
Epoch 2: 74%|███████▍ | 9167/12384 [19:27:39<6:47:53, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=10.99s]
Epoch 2: 74%|███████▍ | 9167/12384 [19:27:47<6:47:53, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 74%|███████▍ | 9168/12384 [19:27:47<6:47:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 74%|███████▍ | 9168/12384 [19:27:54<6:47:52, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.09s]
Epoch 2: 74%|███████▍ | 9169/12384 [19:27:54<6:47:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.09s]
Epoch 2: 74%|███████▍ | 9169/12384 [19:28:02<6:47:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.48s]
Epoch 2: 74%|███████▍ | 9170/12384 [19:28:02<6:49:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.48s]
Epoch 2: 74%|███████▍ | 9170/12384 [19:28:10<6:49:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 2: 74%|███████▍ | 9171/12384 [19:28:10<6:48:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 2: 74%|███████▍ | 9171/12384 [19:28:17<6:48:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 74%|███████▍ | 9172/12384 [19:28:17<6:48:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 74%|███████▍ | 9172/12384 [19:28:25<6:48:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 2: 74%|███████▍ | 9173/12384 [19:28:25<6:49:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 2: 74%|███████▍ | 9173/12384 [19:28:33<6:49:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.46s]
Epoch 2: 74%|███████▍ | 9174/12384 [19:28:33<6:48:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.46s]
Epoch 2: 74%|███████▍ | 9174/12384 [19:28:40<6:48:43, 7.64s/it, loss=0.0003, acc=0.9999, iter_time=10.39s]
Epoch 2: 74%|███████▍ | 9175/12384 [19:28:40<6:48:20, 7.63s/it, loss=0.0003, acc=0.9999, iter_time=10.39s]
Epoch 2: 74%|███████▍ | 9175/12384 [19:28:48<6:48:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 2: 74%|███████▍ | 9176/12384 [19:28:48<6:53:07, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 2: 74%|███████▍ | 9176/12384 [19:28:56<6:53:07, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.48s]
Epoch 2: 74%|███████▍ | 9177/12384 [19:28:56<6:51:03, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.48s]
Epoch 2: 74%|███████▍ | 9177/12384 [19:29:03<6:51:03, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 74%|███████▍ | 9178/12384 [19:29:03<6:49:38, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 74%|███████▍ | 9178/12384 [19:29:11<6:49:38, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.00s]
Epoch 2: 74%|███████▍ | 9179/12384 [19:29:11<6:48:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.00s]
Epoch 2: 74%|███████▍ | 9179/12384 [19:29:19<6:48:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.65s]
Epoch 2: 74%|███████▍ | 9180/12384 [19:29:19<6:47:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.65s]
Epoch 2: 74%|███████▍ | 9180/12384 [19:29:26<6:47:39, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.15s]
Epoch 2: 74%|███████▍ | 9181/12384 [19:29:26<6:47:08, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.15s]
Epoch 2: 74%|███████▍ | 9181/12384 [19:29:34<6:47:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 74%|███████▍ | 9182/12384 [19:29:34<6:46:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 74%|███████▍ | 9182/12384 [19:29:41<6:46:36, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 74%|███████▍ | 9183/12384 [19:29:41<6:46:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 74%|███████▍ | 9183/12384 [19:29:49<6:46:39, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 74%|███████▍ | 9184/12384 [19:29:49<6:46:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 74%|███████▍ | 9184/12384 [19:29:57<6:46:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.12s]
Epoch 2: 74%|███████▍ | 9185/12384 [19:29:57<6:46:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.12s]
Epoch 2: 74%|███████▍ | 9185/12384 [19:30:04<6:46:39, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.19s]
Epoch 2: 74%|███████▍ | 9186/12384 [19:30:04<6:46:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.19s]
Epoch 2: 74%|███████▍ | 9186/12384 [19:30:12<6:46:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 74%|███████▍ | 9187/12384 [19:30:12<6:46:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 74%|███████▍ | 9187/12384 [19:30:20<6:46:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 74%|███████▍ | 9188/12384 [19:30:20<6:47:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 74%|███████▍ | 9188/12384 [19:30:27<6:47:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 2: 74%|███████▍ | 9189/12384 [19:30:27<6:46:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.50s]
Epoch 2: 74%|███████▍ | 9189/12384 [19:30:35<6:46:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.92s]
Epoch 2: 74%|███████▍ | 9190/12384 [19:30:35<6:48:12, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.92s]
Epoch 2: 74%|███████▍ | 9190/12384 [19:30:43<6:48:12, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 74%|███████▍ | 9191/12384 [19:30:43<6:47:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 74%|███████▍ | 9191/12384 [19:30:50<6:47:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 74%|███████▍ | 9192/12384 [19:30:50<6:46:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 74%|███████▍ | 9192/12384 [19:30:58<6:46:27, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.02s]
Epoch 2: 74%|███████▍ | 9193/12384 [19:30:58<6:45:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.02s]
Epoch 2: 74%|███████▍ | 9193/12384 [19:31:05<6:45:45, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.54s]
Epoch 2: 74%|███████▍ | 9194/12384 [19:31:05<6:45:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.54s]
Epoch 2: 74%|███████▍ | 9194/12384 [19:31:13<6:45:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.14s]
Epoch 2: 74%|███████▍ | 9195/12384 [19:31:13<6:49:05, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.14s]
Epoch 2: 74%|███████▍ | 9195/12384 [19:31:21<6:49:05, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.05s]
Epoch 2: 74%|███████▍ | 9196/12384 [19:31:21<6:47:34, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.05s]
Epoch 2: 74%|███████▍ | 9196/12384 [19:31:29<6:47:34, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 2: 74%|███████▍ | 9197/12384 [19:31:29<6:46:49, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 2: 74%|███████▍ | 9197/12384 [19:31:36<6:46:49, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 74%|███████▍ | 9198/12384 [19:31:36<6:46:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 74%|███████▍ | 9198/12384 [19:31:44<6:46:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 74%|███████▍ | 9199/12384 [19:31:44<6:45:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 74%|███████▍ | 9199/12384 [19:31:51<6:45:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 74%|███████▍ | 9200/12384 [19:31:51<6:44:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 74%|███████▍ | 9200/12384 [19:31:59<6:44:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 74%|███████▍ | 9201/12384 [19:31:59<6:44:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 74%|███████▍ | 9201/12384 [19:32:07<6:44:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 74%|███████▍ | 9202/12384 [19:32:07<6:50:26, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 74%|███████▍ | 9202/12384 [19:32:15<6:50:26, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=6.22s]
Epoch 2: 74%|███████▍ | 9203/12384 [19:32:15<6:48:57, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.22s]
Epoch 2: 74%|███████▍ | 9203/12384 [19:32:22<6:48:57, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 2: 74%|███████▍ | 9204/12384 [19:32:22<6:47:20, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 2: 74%|███████▍ | 9204/12384 [19:32:30<6:47:20, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 74%|███████▍ | 9205/12384 [19:32:30<6:47:31, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 74%|███████▍ | 9205/12384 [19:32:38<6:47:31, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.82s]
Epoch 2: 74%|███████▍ | 9206/12384 [19:32:38<6:47:30, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.82s]
Epoch 2: 74%|███████▍ | 9206/12384 [19:32:45<6:47:30, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 74%|███████▍ | 9207/12384 [19:32:45<6:45:50, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.58s]
Epoch 2: 74%|███████▍ | 9207/12384 [19:32:53<6:45:50, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 74%|███████▍ | 9208/12384 [19:32:53<6:45:13, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 74%|███████▍ | 9208/12384 [19:33:01<6:45:13, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 74%|███████▍ | 9209/12384 [19:33:01<6:44:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.19s]
Epoch 2: 74%|███████▍ | 9209/12384 [19:33:08<6:44:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 2: 74%|███████▍ | 9210/12384 [19:33:08<6:43:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 2: 74%|███████▍ | 9210/12384 [19:33:16<6:43:32, 7.63s/it, loss=0.0001, acc=0.9989, iter_time=9.91s]
Epoch 2: 74%|███████▍ | 9211/12384 [19:33:16<6:42:50, 7.62s/it, loss=0.0001, acc=0.9989, iter_time=9.91s]
Epoch 2: 74%|███████▍ | 9211/12384 [19:33:23<6:42:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 74%|███████▍ | 9212/12384 [19:33:23<6:42:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 74%|███████▍ | 9212/12384 [19:33:31<6:42:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 74%|███████▍ | 9213/12384 [19:33:31<6:42:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 74%|███████▍ | 9213/12384 [19:33:39<6:42:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 74%|███████▍ | 9214/12384 [19:33:39<6:42:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 74%|███████▍ | 9214/12384 [19:33:46<6:42:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 74%|███████▍ | 9215/12384 [19:33:46<6:42:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 74%|███████▍ | 9215/12384 [19:33:54<6:42:05, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 74%|███████▍ | 9216/12384 [19:33:54<6:42:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 74%|███████▍ | 9216/12384 [19:34:01<6:42:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 74%|███████▍ | 9217/12384 [19:34:01<6:42:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 74%|███████▍ | 9217/12384 [19:34:09<6:42:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 74%|███████▍ | 9218/12384 [19:34:09<6:42:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 74%|███████▍ | 9218/12384 [19:34:17<6:42:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.87s]
Epoch 2: 74%|███████▍ | 9219/12384 [19:34:17<6:41:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.87s]
Epoch 2: 74%|███████▍ | 9219/12384 [19:34:24<6:41:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.56s]
Epoch 2: 74%|███████▍ | 9220/12384 [19:34:24<6:42:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.56s]
Epoch 2: 74%|███████▍ | 9220/12384 [19:34:32<6:42:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 2: 74%|███████▍ | 9221/12384 [19:34:32<6:41:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 2: 74%|███████▍ | 9221/12384 [19:34:40<6:41:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 2: 74%|███████▍ | 9222/12384 [19:34:40<6:41:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 2: 74%|███████▍ | 9222/12384 [19:34:47<6:41:19, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 74%|███████▍ | 9223/12384 [19:34:47<6:40:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 74%|███████▍ | 9223/12384 [19:34:55<6:40:50, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 74%|███████▍ | 9224/12384 [19:34:55<6:42:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 74%|███████▍ | 9224/12384 [19:35:02<6:42:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 74%|███████▍ | 9225/12384 [19:35:02<6:41:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 74%|███████▍ | 9225/12384 [19:35:10<6:41:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 74%|███████▍ | 9226/12384 [19:35:10<6:41:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 74%|███████▍ | 9226/12384 [19:35:18<6:41:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 75%|███████▍ | 9227/12384 [19:35:18<6:42:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 75%|███████▍ | 9227/12384 [19:35:25<6:42:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 2: 75%|███████▍ | 9228/12384 [19:35:25<6:41:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.36s]
Epoch 2: 75%|███████▍ | 9228/12384 [19:35:33<6:41:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 75%|███████▍ | 9229/12384 [19:35:33<6:46:31, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 75%|███████▍ | 9229/12384 [19:35:41<6:46:31, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 75%|███████▍ | 9230/12384 [19:35:41<6:44:22, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 75%|███████▍ | 9230/12384 [19:35:49<6:44:22, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 2: 75%|███████▍ | 9231/12384 [19:35:49<6:42:27, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 2: 75%|███████▍ | 9231/12384 [19:35:56<6:42:27, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.53s]
Epoch 2: 75%|███████▍ | 9232/12384 [19:35:56<6:44:49, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.53s]
Epoch 2: 75%|███████▍ | 9232/12384 [19:36:04<6:44:49, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 2: 75%|███████▍ | 9233/12384 [19:36:04<6:43:20, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 2: 75%|███████▍ | 9233/12384 [19:36:12<6:43:20, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.50s]
Epoch 2: 75%|███████▍ | 9234/12384 [19:36:12<6:42:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.50s]
Epoch 2: 75%|███████▍ | 9234/12384 [19:36:19<6:42:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 2: 75%|███████▍ | 9235/12384 [19:36:19<6:41:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 2: 75%|███████▍ | 9235/12384 [19:36:27<6:41:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 2: 75%|███████▍ | 9236/12384 [19:36:27<6:40:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.96s]
Epoch 2: 75%|███████▍ | 9236/12384 [19:36:34<6:40:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 75%|███████▍ | 9237/12384 [19:36:34<6:40:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 75%|███████▍ | 9237/12384 [19:36:42<6:40:20, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 75%|███████▍ | 9238/12384 [19:36:42<6:39:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 75%|███████▍ | 9238/12384 [19:36:50<6:39:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 75%|███████▍ | 9239/12384 [19:36:50<6:39:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 75%|███████▍ | 9239/12384 [19:36:57<6:39:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 75%|███████▍ | 9240/12384 [19:36:57<6:39:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 75%|███████▍ | 9240/12384 [19:37:05<6:39:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.17s]
Epoch 2: 75%|███████▍ | 9241/12384 [19:37:05<6:38:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.17s]
Epoch 2: 75%|███████▍ | 9241/12384 [19:37:12<6:38:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 2: 75%|███████▍ | 9242/12384 [19:37:12<6:38:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 2: 75%|███████▍ | 9242/12384 [19:37:20<6:38:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 2: 75%|███████▍ | 9243/12384 [19:37:20<6:38:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 2: 75%|███████▍ | 9243/12384 [19:37:28<6:38:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 75%|███████▍ | 9244/12384 [19:37:28<6:38:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 75%|███████▍ | 9244/12384 [19:37:35<6:38:16, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 2: 75%|███████▍ | 9245/12384 [19:37:35<6:38:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 2: 75%|███████▍ | 9245/12384 [19:37:43<6:38:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.30s]
Epoch 2: 75%|███████▍ | 9246/12384 [19:37:43<6:38:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.30s]
Epoch 2: 75%|███████▍ | 9246/12384 [19:37:50<6:38:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 75%|███████▍ | 9247/12384 [19:37:50<6:37:33, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 75%|███████▍ | 9247/12384 [19:37:58<6:37:33, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 2: 75%|███████▍ | 9248/12384 [19:37:58<6:37:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 2: 75%|███████▍ | 9248/12384 [19:38:06<6:37:15, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 75%|███████▍ | 9249/12384 [19:38:06<6:37:14, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 75%|███████▍ | 9249/12384 [19:38:13<6:37:14, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 75%|███████▍ | 9250/12384 [19:38:13<6:37:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 75%|███████▍ | 9250/12384 [19:38:21<6:37:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 75%|███████▍ | 9251/12384 [19:38:21<6:37:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 75%|███████▍ | 9251/12384 [19:38:29<6:37:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 75%|███████▍ | 9252/12384 [19:38:29<6:37:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 75%|███████▍ | 9252/12384 [19:38:36<6:37:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 75%|███████▍ | 9253/12384 [19:38:36<6:37:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 75%|███████▍ | 9253/12384 [19:38:44<6:37:18, 7.61s/it, loss=0.0001, acc=0.9995, iter_time=7.63s]
Epoch 2: 75%|███████▍ | 9254/12384 [19:38:44<6:37:15, 7.62s/it, loss=0.0001, acc=0.9995, iter_time=7.63s]
Epoch 2: 75%|███████▍ | 9254/12384 [19:38:52<6:37:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 75%|███████▍ | 9255/12384 [19:38:52<6:42:10, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 75%|███████▍ | 9255/12384 [19:38:59<6:42:10, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 2: 75%|███████▍ | 9256/12384 [19:38:59<6:40:47, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 2: 75%|███████▍ | 9256/12384 [19:39:07<6:40:47, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.43s]
Epoch 2: 75%|███████▍ | 9257/12384 [19:39:07<6:39:40, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.43s]
Epoch 2: 75%|███████▍ | 9257/12384 [19:39:15<6:39:40, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.84s]
Epoch 2: 75%|███████▍ | 9258/12384 [19:39:15<6:38:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.84s]
Epoch 2: 75%|███████▍ | 9258/12384 [19:39:22<6:38:38, 7.65s/it, loss=0.0002, acc=0.9991, iter_time=7.32s]
Epoch 2: 75%|███████▍ | 9259/12384 [19:39:22<6:37:52, 7.64s/it, loss=0.0002, acc=0.9991, iter_time=7.32s]
Epoch 2: 75%|███████▍ | 9259/12384 [19:39:30<6:37:52, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=9.24s]
Epoch 2: 75%|███████▍ | 9260/12384 [19:39:30<6:37:19, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.24s]
Epoch 2: 75%|███████▍ | 9260/12384 [19:39:37<6:37:19, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=8.84s]
Epoch 2: 75%|███████▍ | 9261/12384 [19:39:37<6:37:25, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=8.84s]
Epoch 2: 75%|███████▍ | 9261/12384 [19:39:45<6:37:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.39s]
Epoch 2: 75%|███████▍ | 9262/12384 [19:39:45<6:37:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.39s]
Epoch 2: 75%|███████▍ | 9262/12384 [19:39:53<6:37:16, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.69s]
Epoch 2: 75%|███████▍ | 9263/12384 [19:39:53<6:37:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.69s]
Epoch 2: 75%|███████▍ | 9263/12384 [19:40:00<6:37:04, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=8.83s]
Epoch 2: 75%|███████▍ | 9264/12384 [19:40:00<6:37:16, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=8.83s]
Epoch 2: 75%|███████▍ | 9264/12384 [19:40:08<6:37:16, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 75%|███████▍ | 9265/12384 [19:40:08<6:36:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 75%|███████▍ | 9265/12384 [19:40:16<6:36:43, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 75%|███████▍ | 9266/12384 [19:40:16<6:38:10, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 75%|███████▍ | 9266/12384 [19:40:23<6:38:10, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 75%|███████▍ | 9267/12384 [19:40:23<6:37:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 75%|███████▍ | 9267/12384 [19:40:31<6:37:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 75%|███████▍ | 9268/12384 [19:40:31<6:36:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 75%|███████▍ | 9268/12384 [19:40:39<6:36:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 75%|███████▍ | 9269/12384 [19:40:39<6:36:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 75%|███████▍ | 9269/12384 [19:40:46<6:36:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 75%|███████▍ | 9270/12384 [19:40:46<6:35:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 75%|███████▍ | 9270/12384 [19:40:54<6:35:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 75%|███████▍ | 9271/12384 [19:40:54<6:35:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 75%|███████▍ | 9271/12384 [19:41:01<6:35:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 75%|███████▍ | 9272/12384 [19:41:01<6:35:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 75%|███████▍ | 9272/12384 [19:41:09<6:35:00, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 75%|███████▍ | 9273/12384 [19:41:09<6:34:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 75%|███████▍ | 9273/12384 [19:41:17<6:34:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 75%|███████▍ | 9274/12384 [19:41:17<6:34:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 75%|███████▍ | 9274/12384 [19:41:24<6:34:18, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 2: 75%|███████▍ | 9275/12384 [19:41:24<6:34:17, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 2: 75%|███████▍ | 9275/12384 [19:41:32<6:34:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 75%|███████▍ | 9276/12384 [19:41:32<6:34:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 75%|███████▍ | 9276/12384 [19:41:39<6:34:07, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 2: 75%|███████▍ | 9277/12384 [19:41:39<6:33:36, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 2: 75%|███████▍ | 9277/12384 [19:41:47<6:33:36, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 75%|███████▍ | 9278/12384 [19:41:47<6:33:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 75%|███████▍ | 9278/12384 [19:41:55<6:33:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.89s]
Epoch 2: 75%|███████▍ | 9279/12384 [19:41:55<6:33:27, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=8.89s]
Epoch 2: 75%|███████▍ | 9279/12384 [19:42:02<6:33:27, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 2: 75%|███████▍ | 9280/12384 [19:42:02<6:33:24, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 2: 75%|███████▍ | 9280/12384 [19:42:10<6:33:24, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.26s]
Epoch 2: 75%|███████▍ | 9281/12384 [19:42:10<6:38:53, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.26s]
Epoch 2: 75%|███████▍ | 9281/12384 [19:42:18<6:38:53, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.85s]
Epoch 2: 75%|███████▍ | 9282/12384 [19:42:18<6:38:29, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.85s]
Epoch 2: 75%|███████▍ | 9282/12384 [19:42:25<6:38:29, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 75%|███████▍ | 9283/12384 [19:42:25<6:36:52, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 75%|███████▍ | 9283/12384 [19:42:33<6:36:52, 7.68s/it, loss=0.0002, acc=0.9998, iter_time=7.63s]
Epoch 2: 75%|███████▍ | 9284/12384 [19:42:33<6:35:58, 7.66s/it, loss=0.0002, acc=0.9998, iter_time=7.63s]
Epoch 2: 75%|███████▍ | 9284/12384 [19:42:41<6:35:58, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 75%|███████▍ | 9285/12384 [19:42:41<6:35:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 75%|███████▍ | 9285/12384 [19:42:48<6:35:13, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 75%|███████▍ | 9286/12384 [19:42:48<6:34:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 75%|███████▍ | 9286/12384 [19:42:56<6:34:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 75%|███████▍ | 9287/12384 [19:42:56<6:34:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 75%|███████▍ | 9287/12384 [19:43:04<6:34:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 75%|███████▌ | 9288/12384 [19:43:04<6:33:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 75%|███████▌ | 9288/12384 [19:43:11<6:33:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 75%|███████▌ | 9289/12384 [19:43:11<6:34:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 75%|███████▌ | 9289/12384 [19:43:19<6:34:07, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 75%|███████▌ | 9290/12384 [19:43:19<6:33:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 75%|███████▌ | 9290/12384 [19:43:26<6:33:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 75%|███████▌ | 9291/12384 [19:43:26<6:32:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 75%|███████▌ | 9291/12384 [19:43:34<6:32:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 75%|███████▌ | 9292/12384 [19:43:34<6:34:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 75%|███████▌ | 9292/12384 [19:43:42<6:34:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 2: 75%|███████▌ | 9293/12384 [19:43:42<6:33:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 2: 75%|███████▌ | 9293/12384 [19:43:49<6:33:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.57s]
Epoch 2: 75%|███████▌ | 9294/12384 [19:43:49<6:32:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.57s]
Epoch 2: 75%|███████▌ | 9294/12384 [19:43:57<6:32:31, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.11s]
Epoch 2: 75%|███████▌ | 9295/12384 [19:43:57<6:31:54, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=4.11s]
Epoch 2: 75%|███████▌ | 9295/12384 [19:44:05<6:31:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.02s]
Epoch 2: 75%|███████▌ | 9296/12384 [19:44:05<6:31:23, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=11.02s]
Epoch 2: 75%|███████▌ | 9296/12384 [19:44:12<6:31:23, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 2: 75%|███████▌ | 9297/12384 [19:44:12<6:31:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 2: 75%|███████▌ | 9297/12384 [19:44:20<6:31:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.75s]
Epoch 2: 75%|███████▌ | 9298/12384 [19:44:20<6:35:47, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.75s]
Epoch 2: 75%|███████▌ | 9298/12384 [19:44:28<6:35:47, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 75%|███████▌ | 9299/12384 [19:44:28<6:34:24, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 75%|███████▌ | 9299/12384 [19:44:35<6:34:24, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 2: 75%|███████▌ | 9300/12384 [19:44:35<6:33:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.83s]
Epoch 2: 75%|███████▌ | 9300/12384 [19:44:43<6:33:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.37s]
Epoch 2: 75%|███████▌ | 9301/12384 [19:44:43<6:32:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.37s]
Epoch 2: 75%|███████▌ | 9301/12384 [19:44:51<6:32:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 75%|███████▌ | 9302/12384 [19:44:51<6:32:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 75%|███████▌ | 9302/12384 [19:44:58<6:32:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 75%|███████▌ | 9303/12384 [19:44:58<6:32:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 75%|███████▌ | 9303/12384 [19:45:06<6:32:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 75%|███████▌ | 9304/12384 [19:45:06<6:31:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 75%|███████▌ | 9304/12384 [19:45:14<6:31:49, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.33s]
Epoch 2: 75%|███████▌ | 9305/12384 [19:45:14<6:34:16, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.33s]
Epoch 2: 75%|███████▌ | 9305/12384 [19:45:21<6:34:16, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.70s]
Epoch 2: 75%|███████▌ | 9306/12384 [19:45:21<6:32:48, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.70s]
Epoch 2: 75%|███████▌ | 9306/12384 [19:45:29<6:32:48, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 2: 75%|███████▌ | 9307/12384 [19:45:29<6:36:13, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.77s]
Epoch 2: 75%|███████▌ | 9307/12384 [19:45:37<6:36:13, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 2: 75%|███████▌ | 9308/12384 [19:45:37<6:34:20, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.33s]
Epoch 2: 75%|███████▌ | 9308/12384 [19:45:44<6:34:20, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.97s]
Epoch 2: 75%|███████▌ | 9309/12384 [19:45:44<6:32:37, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.97s]
Epoch 2: 75%|███████▌ | 9309/12384 [19:45:52<6:32:37, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 2: 75%|███████▌ | 9310/12384 [19:45:52<6:32:48, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.37s]
Epoch 2: 75%|███████▌ | 9310/12384 [19:46:00<6:32:48, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 75%|███████▌ | 9311/12384 [19:46:00<6:31:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 75%|███████▌ | 9311/12384 [19:46:07<6:31:32, 7.64s/it, loss=0.0003, acc=0.9991, iter_time=8.01s]
Epoch 2: 75%|███████▌ | 9312/12384 [19:46:07<6:31:05, 7.64s/it, loss=0.0003, acc=0.9991, iter_time=8.01s]
Epoch 2: 75%|███████▌ | 9312/12384 [19:46:15<6:31:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 2: 75%|███████▌ | 9313/12384 [19:46:15<6:30:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 2: 75%|███████▌ | 9313/12384 [19:46:22<6:30:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 2: 75%|███████▌ | 9314/12384 [19:46:22<6:30:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 2: 75%|███████▌ | 9314/12384 [19:46:30<6:30:04, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 2: 75%|███████▌ | 9315/12384 [19:46:30<6:29:26, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 2: 75%|███████▌ | 9315/12384 [19:46:38<6:29:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 75%|███████▌ | 9316/12384 [19:46:38<6:29:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 75%|███████▌ | 9316/12384 [19:46:45<6:29:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 75%|███████▌ | 9317/12384 [19:46:45<6:29:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 75%|███████▌ | 9317/12384 [19:46:53<6:29:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 75%|███████▌ | 9318/12384 [19:46:53<6:29:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 75%|███████▌ | 9318/12384 [19:47:00<6:29:18, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 2: 75%|███████▌ | 9319/12384 [19:47:00<6:29:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.86s]
Epoch 2: 75%|███████▌ | 9319/12384 [19:47:08<6:29:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.76s]
Epoch 2: 75%|███████▌ | 9320/12384 [19:47:08<6:29:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.76s]
Epoch 2: 75%|███████▌ | 9320/12384 [19:47:16<6:29:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 75%|███████▌ | 9321/12384 [19:47:16<6:28:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 75%|███████▌ | 9321/12384 [19:47:23<6:28:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 75%|███████▌ | 9322/12384 [19:47:23<6:28:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 75%|███████▌ | 9322/12384 [19:47:31<6:28:53, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 75%|███████▌ | 9323/12384 [19:47:31<6:28:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 75%|███████▌ | 9323/12384 [19:47:39<6:28:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 75%|███████▌ | 9324/12384 [19:47:39<6:33:08, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 75%|███████▌ | 9324/12384 [19:47:46<6:33:08, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.29s]
Epoch 2: 75%|███████▌ | 9325/12384 [19:47:46<6:31:33, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.29s]
Epoch 2: 75%|███████▌ | 9325/12384 [19:47:54<6:31:33, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.68s]
Epoch 2: 75%|███████▌ | 9326/12384 [19:47:54<6:30:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.68s]
Epoch 2: 75%|███████▌ | 9326/12384 [19:48:02<6:30:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 2: 75%|███████▌ | 9327/12384 [19:48:02<6:29:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.83s]
Epoch 2: 75%|███████▌ | 9327/12384 [19:48:09<6:29:37, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 75%|███████▌ | 9328/12384 [19:48:09<6:28:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 75%|███████▌ | 9328/12384 [19:48:17<6:28:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 75%|███████▌ | 9329/12384 [19:48:17<6:28:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 75%|███████▌ | 9329/12384 [19:48:25<6:28:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 2: 75%|███████▌ | 9330/12384 [19:48:25<6:27:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 2: 75%|███████▌ | 9330/12384 [19:48:32<6:27:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.12s]
Epoch 2: 75%|███████▌ | 9331/12384 [19:48:32<6:28:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.12s]
Epoch 2: 75%|███████▌ | 9331/12384 [19:48:40<6:28:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 2: 75%|███████▌ | 9332/12384 [19:48:40<6:28:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 2: 75%|███████▌ | 9332/12384 [19:48:48<6:28:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 2: 75%|███████▌ | 9333/12384 [19:48:48<6:32:37, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 2: 75%|███████▌ | 9333/12384 [19:48:55<6:32:37, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 75%|███████▌ | 9334/12384 [19:48:55<6:30:49, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 75%|███████▌ | 9334/12384 [19:49:03<6:30:49, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 75%|███████▌ | 9335/12384 [19:49:03<6:29:42, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 75%|███████▌ | 9335/12384 [19:49:11<6:29:42, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 75%|███████▌ | 9336/12384 [19:49:11<6:28:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 75%|███████▌ | 9336/12384 [19:49:18<6:28:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 75%|███████▌ | 9337/12384 [19:49:18<6:27:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 75%|███████▌ | 9337/12384 [19:49:26<6:27:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 2: 75%|███████▌ | 9338/12384 [19:49:26<6:27:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 2: 75%|███████▌ | 9338/12384 [19:49:33<6:27:37, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.75s]
Epoch 2: 75%|███████▌ | 9339/12384 [19:49:33<6:26:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.75s]
Epoch 2: 75%|███████▌ | 9339/12384 [19:49:41<6:26:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 75%|███████▌ | 9340/12384 [19:49:41<6:26:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 75%|███████▌ | 9340/12384 [19:49:49<6:26:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 75%|███████▌ | 9341/12384 [19:49:49<6:26:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.91s]
Epoch 2: 75%|███████▌ | 9341/12384 [19:49:56<6:26:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 75%|███████▌ | 9342/12384 [19:49:56<6:26:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 75%|███████▌ | 9342/12384 [19:50:04<6:26:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 2: 75%|███████▌ | 9343/12384 [19:50:04<6:26:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 2: 75%|███████▌ | 9343/12384 [19:50:12<6:26:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.57s]
Epoch 2: 75%|███████▌ | 9344/12384 [19:50:12<6:26:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.57s]
Epoch 2: 75%|███████▌ | 9344/12384 [19:50:19<6:26:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 75%|███████▌ | 9345/12384 [19:50:19<6:26:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 75%|███████▌ | 9345/12384 [19:50:27<6:26:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 75%|███████▌ | 9346/12384 [19:50:27<6:26:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 75%|███████▌ | 9346/12384 [19:50:34<6:26:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 75%|███████▌ | 9347/12384 [19:50:34<6:25:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 75%|███████▌ | 9347/12384 [19:50:42<6:25:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 75%|███████▌ | 9348/12384 [19:50:42<6:26:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 75%|███████▌ | 9348/12384 [19:50:50<6:26:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 75%|███████▌ | 9349/12384 [19:50:50<6:26:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 75%|███████▌ | 9349/12384 [19:50:57<6:26:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 2: 76%|███████▌ | 9350/12384 [19:50:57<6:25:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.54s]
Epoch 2: 76%|███████▌ | 9350/12384 [19:51:05<6:25:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 76%|███████▌ | 9351/12384 [19:51:05<6:25:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 76%|███████▌ | 9351/12384 [19:51:13<6:25:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.75s]
Epoch 2: 76%|███████▌ | 9352/12384 [19:51:13<6:25:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.75s]
Epoch 2: 76%|███████▌ | 9352/12384 [19:51:20<6:25:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 76%|███████▌ | 9353/12384 [19:51:20<6:24:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 76%|███████▌ | 9353/12384 [19:51:28<6:24:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 76%|███████▌ | 9354/12384 [19:51:28<6:24:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 76%|███████▌ | 9354/12384 [19:51:35<6:24:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.45s]
Epoch 2: 76%|███████▌ | 9355/12384 [19:51:35<6:24:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.45s]
Epoch 2: 76%|███████▌ | 9355/12384 [19:51:43<6:24:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 2: 76%|███████▌ | 9356/12384 [19:51:43<6:23:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 2: 76%|███████▌ | 9356/12384 [19:51:51<6:23:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.10s]
Epoch 2: 76%|███████▌ | 9357/12384 [19:51:51<6:23:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.10s]
Epoch 2: 76%|███████▌ | 9357/12384 [19:51:58<6:23:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.20s]
Epoch 2: 76%|███████▌ | 9358/12384 [19:51:58<6:24:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.20s]
Epoch 2: 76%|███████▌ | 9358/12384 [19:52:06<6:24:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 76%|███████▌ | 9359/12384 [19:52:06<6:24:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 76%|███████▌ | 9359/12384 [19:52:14<6:24:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 76%|███████▌ | 9360/12384 [19:52:14<6:28:51, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 76%|███████▌ | 9360/12384 [19:52:21<6:28:51, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 2: 76%|███████▌ | 9361/12384 [19:52:21<6:26:50, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 2: 76%|███████▌ | 9361/12384 [19:52:29<6:26:50, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.95s]
Epoch 2: 76%|███████▌ | 9362/12384 [19:52:29<6:25:51, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.95s]
Epoch 2: 76%|███████▌ | 9362/12384 [19:52:37<6:25:51, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.02s]
Epoch 2: 76%|███████▌ | 9363/12384 [19:52:37<6:25:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.02s]
Epoch 2: 76%|███████▌ | 9363/12384 [19:52:44<6:25:03, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=5.54s]
Epoch 2: 76%|███████▌ | 9364/12384 [19:52:44<6:24:18, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=5.54s]
Epoch 2: 76%|███████▌ | 9364/12384 [19:52:52<6:24:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.33s]
Epoch 2: 76%|███████▌ | 9365/12384 [19:52:52<6:23:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.33s]
Epoch 2: 76%|███████▌ | 9365/12384 [19:52:59<6:23:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.29s]
Epoch 2: 76%|███████▌ | 9366/12384 [19:52:59<6:23:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.29s]
Epoch 2: 76%|███████▌ | 9366/12384 [19:53:07<6:23:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 2: 76%|███████▌ | 9367/12384 [19:53:07<6:22:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 2: 76%|███████▌ | 9367/12384 [19:53:15<6:22:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 76%|███████▌ | 9368/12384 [19:53:15<6:23:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 76%|███████▌ | 9368/12384 [19:53:22<6:23:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 76%|███████▌ | 9369/12384 [19:53:22<6:22:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 76%|███████▌ | 9369/12384 [19:53:30<6:22:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 2: 76%|███████▌ | 9370/12384 [19:53:30<6:25:33, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 2: 76%|███████▌ | 9370/12384 [19:53:38<6:25:33, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 76%|███████▌ | 9371/12384 [19:53:38<6:26:06, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 76%|███████▌ | 9371/12384 [19:53:45<6:26:06, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=5.14s]
Epoch 2: 76%|███████▌ | 9372/12384 [19:53:46<6:25:53, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=5.14s]
Epoch 2: 76%|███████▌ | 9372/12384 [19:53:53<6:25:53, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.28s]
Epoch 2: 76%|███████▌ | 9373/12384 [19:53:53<6:24:44, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.28s]
Epoch 2: 76%|███████▌ | 9373/12384 [19:54:01<6:24:44, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 2: 76%|███████▌ | 9374/12384 [19:54:01<6:23:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 2: 76%|███████▌ | 9374/12384 [19:54:08<6:23:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.94s]
Epoch 2: 76%|███████▌ | 9375/12384 [19:54:08<6:23:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.94s]
Epoch 2: 76%|███████▌ | 9375/12384 [19:54:16<6:23:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 2: 76%|███████▌ | 9376/12384 [19:54:16<6:22:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.44s]
Epoch 2: 76%|███████▌ | 9376/12384 [19:54:24<6:22:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 76%|███████▌ | 9377/12384 [19:54:24<6:22:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 76%|███████▌ | 9377/12384 [19:54:31<6:22:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.87s]
Epoch 2: 76%|███████▌ | 9378/12384 [19:54:31<6:21:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.87s]
Epoch 2: 76%|███████▌ | 9378/12384 [19:54:39<6:21:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 2: 76%|███████▌ | 9379/12384 [19:54:39<6:21:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.93s]
Epoch 2: 76%|███████▌ | 9379/12384 [19:54:46<6:21:38, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 76%|███████▌ | 9380/12384 [19:54:46<6:21:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 76%|███████▌ | 9380/12384 [19:54:54<6:21:09, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 2: 76%|███████▌ | 9381/12384 [19:54:54<6:21:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.82s]
Epoch 2: 76%|███████▌ | 9381/12384 [19:55:02<6:21:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.82s]
Epoch 2: 76%|███████▌ | 9382/12384 [19:55:02<6:21:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.82s]
Epoch 2: 76%|███████▌ | 9382/12384 [19:55:09<6:21:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 76%|███████▌ | 9383/12384 [19:55:09<6:21:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 76%|███████▌ | 9383/12384 [19:55:17<6:21:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 76%|███████▌ | 9384/12384 [19:55:17<6:20:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 76%|███████▌ | 9384/12384 [19:55:25<6:20:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 76%|███████▌ | 9385/12384 [19:55:25<6:20:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 76%|███████▌ | 9385/12384 [19:55:32<6:20:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 2: 76%|███████▌ | 9386/12384 [19:55:32<6:25:36, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 2: 76%|███████▌ | 9386/12384 [19:55:40<6:25:36, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.26s]
Epoch 2: 76%|███████▌ | 9387/12384 [19:55:40<6:24:01, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.26s]
Epoch 2: 76%|███████▌ | 9387/12384 [19:55:48<6:24:01, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 2: 76%|███████▌ | 9388/12384 [19:55:48<6:22:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 2: 76%|███████▌ | 9388/12384 [19:55:55<6:22:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 76%|███████▌ | 9389/12384 [19:55:55<6:21:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 76%|███████▌ | 9389/12384 [19:56:03<6:21:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 2: 76%|███████▌ | 9390/12384 [19:56:03<6:20:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 2: 76%|███████▌ | 9390/12384 [19:56:10<6:20:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.70s]
Epoch 2: 76%|███████▌ | 9391/12384 [19:56:10<6:20:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.70s]
Epoch 2: 76%|███████▌ | 9391/12384 [19:56:18<6:20:12, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 76%|███████▌ | 9392/12384 [19:56:18<6:20:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 76%|███████▌ | 9392/12384 [19:56:26<6:20:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.95s]
Epoch 2: 76%|███████▌ | 9393/12384 [19:56:26<6:19:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.95s]
Epoch 2: 76%|███████▌ | 9393/12384 [19:56:33<6:19:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 2: 76%|███████▌ | 9394/12384 [19:56:33<6:20:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 2: 76%|███████▌ | 9394/12384 [19:56:41<6:20:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.04s]
Epoch 2: 76%|███████▌ | 9395/12384 [19:56:41<6:19:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.04s]
Epoch 2: 76%|███████▌ | 9395/12384 [19:56:49<6:19:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.46s]
Epoch 2: 76%|███████▌ | 9396/12384 [19:56:49<6:19:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.46s]
Epoch 2: 76%|███████▌ | 9396/12384 [19:56:56<6:19:15, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 2: 76%|███████▌ | 9397/12384 [19:56:56<6:18:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.35s]
Epoch 2: 76%|███████▌ | 9397/12384 [19:57:04<6:18:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 76%|███████▌ | 9398/12384 [19:57:04<6:18:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 76%|███████▌ | 9398/12384 [19:57:11<6:18:41, 7.61s/it, loss=0.0004, acc=0.9987, iter_time=7.61s]
Epoch 2: 76%|███████▌ | 9399/12384 [19:57:11<6:19:32, 7.63s/it, loss=0.0004, acc=0.9987, iter_time=7.61s]
Epoch 2: 76%|███████▌ | 9399/12384 [19:57:19<6:19:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 76%|███████▌ | 9400/12384 [19:57:19<6:19:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 76%|███████▌ | 9400/12384 [19:57:27<6:19:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.05s]
Epoch 2: 76%|███████▌ | 9401/12384 [19:57:27<6:19:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.05s]
Epoch 2: 76%|███████▌ | 9401/12384 [19:57:34<6:19:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.10s]
Epoch 2: 76%|███████▌ | 9402/12384 [19:57:34<6:18:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.10s]
Epoch 2: 76%|███████▌ | 9402/12384 [19:57:42<6:18:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.02s]
Epoch 2: 76%|███████▌ | 9403/12384 [19:57:42<6:22:27, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.02s]
Epoch 2: 76%|███████▌ | 9403/12384 [19:57:50<6:22:27, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 2: 76%|███████▌ | 9404/12384 [19:57:50<6:20:48, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.66s]
Epoch 2: 76%|███████▌ | 9404/12384 [19:57:57<6:20:48, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=8.52s]
Epoch 2: 76%|███████▌ | 9405/12384 [19:57:57<6:19:43, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.52s]
Epoch 2: 76%|███████▌ | 9405/12384 [19:58:05<6:19:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 76%|███████▌ | 9406/12384 [19:58:05<6:19:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 76%|███████▌ | 9406/12384 [19:58:13<6:19:09, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.17s]
Epoch 2: 76%|███████▌ | 9407/12384 [19:58:13<6:20:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.17s]
Epoch 2: 76%|███████▌ | 9407/12384 [19:58:20<6:20:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 2: 76%|███████▌ | 9408/12384 [19:58:20<6:19:45, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 2: 76%|███████▌ | 9408/12384 [19:58:28<6:19:45, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.54s]
Epoch 2: 76%|███████▌ | 9409/12384 [19:58:28<6:19:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.54s]
Epoch 2: 76%|███████▌ | 9409/12384 [19:58:36<6:19:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 2: 76%|███████▌ | 9410/12384 [19:58:36<6:18:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.64s]
Epoch 2: 76%|███████▌ | 9410/12384 [19:58:43<6:18:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 2: 76%|███████▌ | 9411/12384 [19:58:43<6:17:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.71s]
Epoch 2: 76%|███████▌ | 9411/12384 [19:58:51<6:17:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 2: 76%|███████▌ | 9412/12384 [19:58:51<6:17:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 2: 76%|███████▌ | 9412/12384 [19:58:59<6:17:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 2: 76%|███████▌ | 9413/12384 [19:58:59<6:22:00, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 2: 76%|███████▌ | 9413/12384 [19:59:06<6:22:00, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 2: 76%|███████▌ | 9414/12384 [19:59:06<6:20:20, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.43s]
Epoch 2: 76%|███████▌ | 9414/12384 [19:59:14<6:20:20, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 2: 76%|███████▌ | 9415/12384 [19:59:14<6:18:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 2: 76%|███████▌ | 9415/12384 [19:59:22<6:18:55, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 76%|███████▌ | 9416/12384 [19:59:22<6:18:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 76%|███████▌ | 9416/12384 [19:59:29<6:18:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 76%|███████▌ | 9417/12384 [19:59:29<6:17:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 76%|███████▌ | 9417/12384 [19:59:37<6:17:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 76%|███████▌ | 9418/12384 [19:59:37<6:17:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 76%|███████▌ | 9418/12384 [19:59:44<6:17:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 76%|███████▌ | 9419/12384 [19:59:44<6:16:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 76%|███████▌ | 9419/12384 [19:59:52<6:16:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 76%|███████▌ | 9420/12384 [19:59:52<6:17:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 76%|███████▌ | 9420/12384 [20:00:00<6:17:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.16s]
Epoch 2: 76%|███████▌ | 9421/12384 [20:00:00<6:16:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.16s]
Epoch 2: 76%|███████▌ | 9421/12384 [20:00:07<6:16:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 2: 76%|███████▌ | 9422/12384 [20:00:07<6:16:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.59s]
Epoch 2: 76%|███████▌ | 9422/12384 [20:00:15<6:16:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 76%|███████▌ | 9423/12384 [20:00:15<6:15:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 76%|███████▌ | 9423/12384 [20:00:22<6:15:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 76%|███████▌ | 9424/12384 [20:00:22<6:15:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 76%|███████▌ | 9424/12384 [20:00:30<6:15:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.13s]
Epoch 2: 76%|███████▌ | 9425/12384 [20:00:30<6:15:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.13s]
Epoch 2: 76%|███████▌ | 9425/12384 [20:00:38<6:15:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 2: 76%|███████▌ | 9426/12384 [20:00:38<6:15:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.13s]
Epoch 2: 76%|███████▌ | 9426/12384 [20:00:45<6:15:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 76%|███████▌ | 9427/12384 [20:00:45<6:14:35, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 76%|███████▌ | 9427/12384 [20:00:53<6:14:35, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 76%|███████▌ | 9428/12384 [20:00:53<6:14:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 76%|███████▌ | 9428/12384 [20:01:01<6:14:25, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 76%|███████▌ | 9429/12384 [20:01:01<6:18:19, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 76%|███████▌ | 9429/12384 [20:01:08<6:18:19, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 76%|███████▌ | 9430/12384 [20:01:08<6:17:35, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 76%|███████▌ | 9430/12384 [20:01:16<6:17:35, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 76%|███████▌ | 9431/12384 [20:01:16<6:16:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 76%|███████▌ | 9431/12384 [20:01:24<6:16:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 76%|███████▌ | 9432/12384 [20:01:24<6:15:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 76%|███████▌ | 9432/12384 [20:01:31<6:15:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.72s]
Epoch 2: 76%|███████▌ | 9433/12384 [20:01:31<6:15:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.72s]
Epoch 2: 76%|███████▌ | 9433/12384 [20:01:39<6:15:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 2: 76%|███████▌ | 9434/12384 [20:01:39<6:14:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 2: 76%|███████▌ | 9434/12384 [20:01:46<6:14:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 76%|███████▌ | 9435/12384 [20:01:46<6:14:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 76%|███████▌ | 9435/12384 [20:01:54<6:14:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 76%|███████▌ | 9436/12384 [20:01:54<6:14:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 76%|███████▌ | 9436/12384 [20:02:02<6:14:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 76%|███████▌ | 9437/12384 [20:02:02<6:13:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 76%|███████▌ | 9437/12384 [20:02:09<6:13:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 76%|███████▌ | 9438/12384 [20:02:09<6:13:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 76%|███████▌ | 9438/12384 [20:02:17<6:13:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 2: 76%|███████▌ | 9439/12384 [20:02:17<6:18:50, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 2: 76%|███████▌ | 9439/12384 [20:02:25<6:18:50, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=11.44s]
Epoch 2: 76%|███████▌ | 9440/12384 [20:02:25<6:17:08, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=11.44s]
Epoch 2: 76%|███████▌ | 9440/12384 [20:02:32<6:17:08, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 76%|███████▌ | 9441/12384 [20:02:32<6:15:59, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 76%|███████▌ | 9441/12384 [20:02:40<6:15:59, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 76%|███████▌ | 9442/12384 [20:02:40<6:15:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 76%|███████▌ | 9442/12384 [20:02:48<6:15:30, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 76%|███████▋ | 9443/12384 [20:02:48<6:14:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 76%|███████▋ | 9443/12384 [20:02:55<6:14:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 76%|███████▋ | 9444/12384 [20:02:55<6:13:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.11s]
Epoch 2: 76%|███████▋ | 9444/12384 [20:03:03<6:13:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 2: 76%|███████▋ | 9445/12384 [20:03:03<6:13:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 2: 76%|███████▋ | 9445/12384 [20:03:11<6:13:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 76%|███████▋ | 9446/12384 [20:03:11<6:13:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 76%|███████▋ | 9446/12384 [20:03:18<6:13:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 76%|███████▋ | 9447/12384 [20:03:18<6:12:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 76%|███████▋ | 9447/12384 [20:03:26<6:12:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 76%|███████▋ | 9448/12384 [20:03:26<6:14:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 76%|███████▋ | 9448/12384 [20:03:34<6:14:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 76%|███████▋ | 9449/12384 [20:03:34<6:14:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 76%|███████▋ | 9449/12384 [20:03:41<6:14:07, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 76%|███████▋ | 9450/12384 [20:03:41<6:13:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 76%|███████▋ | 9450/12384 [20:03:49<6:13:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 76%|███████▋ | 9451/12384 [20:03:49<6:12:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 76%|███████▋ | 9451/12384 [20:03:56<6:12:43, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 76%|███████▋ | 9452/12384 [20:03:56<6:12:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 76%|███████▋ | 9452/12384 [20:04:04<6:12:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 76%|███████▋ | 9453/12384 [20:04:04<6:12:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 76%|███████▋ | 9453/12384 [20:04:12<6:12:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.55s]
Epoch 2: 76%|███████▋ | 9454/12384 [20:04:12<6:11:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.55s]
Epoch 2: 76%|███████▋ | 9454/12384 [20:04:19<6:11:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.32s]
Epoch 2: 76%|███████▋ | 9455/12384 [20:04:19<6:11:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.32s]
Epoch 2: 76%|███████▋ | 9455/12384 [20:04:27<6:11:45, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 76%|███████▋ | 9456/12384 [20:04:27<6:11:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 76%|███████▋ | 9456/12384 [20:04:34<6:11:17, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 76%|███████▋ | 9457/12384 [20:04:34<6:11:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 76%|███████▋ | 9457/12384 [20:04:42<6:11:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 76%|███████▋ | 9458/12384 [20:04:42<6:11:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 76%|███████▋ | 9458/12384 [20:04:50<6:11:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 2: 76%|███████▋ | 9459/12384 [20:04:50<6:10:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 2: 76%|███████▋ | 9459/12384 [20:04:57<6:10:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 2: 76%|███████▋ | 9460/12384 [20:04:57<6:10:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 2: 76%|███████▋ | 9460/12384 [20:05:05<6:10:51, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 76%|███████▋ | 9461/12384 [20:05:05<6:10:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 76%|███████▋ | 9461/12384 [20:05:12<6:10:36, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 76%|███████▋ | 9462/12384 [20:05:12<6:10:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 76%|███████▋ | 9462/12384 [20:05:20<6:10:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 76%|███████▋ | 9463/12384 [20:05:20<6:10:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 76%|███████▋ | 9463/12384 [20:05:28<6:10:13, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 2: 76%|███████▋ | 9464/12384 [20:05:28<6:09:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 2: 76%|███████▋ | 9464/12384 [20:05:36<6:09:55, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=4.63s]
Epoch 2: 76%|███████▋ | 9465/12384 [20:05:36<6:14:31, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.63s]
Epoch 2: 76%|███████▋ | 9465/12384 [20:05:43<6:14:31, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=11.06s]
Epoch 2: 76%|███████▋ | 9466/12384 [20:05:43<6:14:37, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=11.06s]
Epoch 2: 76%|███████▋ | 9466/12384 [20:05:51<6:14:37, 7.70s/it, loss=0.0007, acc=1.0000, iter_time=6.76s]
Epoch 2: 76%|███████▋ | 9467/12384 [20:05:51<6:14:16, 7.70s/it, loss=0.0007, acc=1.0000, iter_time=6.76s]
Epoch 2: 76%|███████▋ | 9467/12384 [20:05:59<6:14:16, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 2: 76%|███████▋ | 9468/12384 [20:05:59<6:12:42, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.53s]
Epoch 2: 76%|███████▋ | 9468/12384 [20:06:06<6:12:42, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 76%|███████▋ | 9469/12384 [20:06:06<6:11:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 76%|███████▋ | 9469/12384 [20:06:14<6:11:28, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 2: 76%|███████▋ | 9470/12384 [20:06:14<6:10:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.27s]
Epoch 2: 76%|███████▋ | 9470/12384 [20:06:21<6:10:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.69s]
Epoch 2: 76%|███████▋ | 9471/12384 [20:06:21<6:09:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.69s]
Epoch 2: 76%|███████▋ | 9471/12384 [20:06:29<6:09:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.19s]
Epoch 2: 76%|███████▋ | 9472/12384 [20:06:29<6:09:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.19s]
Epoch 2: 76%|███████▋ | 9472/12384 [20:06:37<6:09:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 76%|███████▋ | 9473/12384 [20:06:37<6:09:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 76%|███████▋ | 9473/12384 [20:06:44<6:09:20, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 77%|███████▋ | 9474/12384 [20:06:44<6:09:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 77%|███████▋ | 9474/12384 [20:06:52<6:09:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.21s]
Epoch 2: 77%|███████▋ | 9475/12384 [20:06:52<6:09:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.21s]
Epoch 2: 77%|███████▋ | 9475/12384 [20:06:59<6:09:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.01s]
Epoch 2: 77%|███████▋ | 9476/12384 [20:06:59<6:09:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.01s]
Epoch 2: 77%|███████▋ | 9476/12384 [20:07:07<6:09:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 77%|███████▋ | 9477/12384 [20:07:07<6:08:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 77%|███████▋ | 9477/12384 [20:07:15<6:08:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 2: 77%|███████▋ | 9478/12384 [20:07:15<6:09:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.65s]
Epoch 2: 77%|███████▋ | 9478/12384 [20:07:22<6:09:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.64s]
Epoch 2: 77%|███████▋ | 9479/12384 [20:07:22<6:09:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.64s]
Epoch 2: 77%|███████▋ | 9479/12384 [20:07:30<6:09:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 77%|███████▋ | 9480/12384 [20:07:30<6:08:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 77%|███████▋ | 9480/12384 [20:07:38<6:08:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.47s]
Epoch 2: 77%|███████▋ | 9481/12384 [20:07:38<6:12:19, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.47s]
Epoch 2: 77%|███████▋ | 9481/12384 [20:07:45<6:12:19, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 77%|███████▋ | 9482/12384 [20:07:45<6:11:09, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 77%|███████▋ | 9482/12384 [20:07:53<6:11:09, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 77%|███████▋ | 9483/12384 [20:07:53<6:10:12, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 77%|███████▋ | 9483/12384 [20:08:01<6:10:12, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 77%|███████▋ | 9484/12384 [20:08:01<6:10:00, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 77%|███████▋ | 9484/12384 [20:08:08<6:10:00, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 2: 77%|███████▋ | 9485/12384 [20:08:08<6:09:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 2: 77%|███████▋ | 9485/12384 [20:08:16<6:09:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 2: 77%|███████▋ | 9486/12384 [20:08:16<6:08:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 2: 77%|███████▋ | 9486/12384 [20:08:23<6:08:46, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 77%|███████▋ | 9487/12384 [20:08:23<6:08:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 77%|███████▋ | 9487/12384 [20:08:31<6:08:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 77%|███████▋ | 9488/12384 [20:08:31<6:07:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 77%|███████▋ | 9488/12384 [20:08:39<6:07:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 77%|███████▋ | 9489/12384 [20:08:39<6:08:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 77%|███████▋ | 9489/12384 [20:08:46<6:08:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 2: 77%|███████▋ | 9490/12384 [20:08:46<6:07:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 2: 77%|███████▋ | 9490/12384 [20:08:54<6:07:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 2: 77%|███████▋ | 9491/12384 [20:08:54<6:11:35, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 2: 77%|███████▋ | 9491/12384 [20:09:02<6:11:35, 7.71s/it, loss=0.0002, acc=1.0000, iter_time=8.24s]
Epoch 2: 77%|███████▋ | 9492/12384 [20:09:02<6:11:03, 7.70s/it, loss=0.0002, acc=1.0000, iter_time=8.24s]
Epoch 2: 77%|███████▋ | 9492/12384 [20:09:10<6:11:03, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.43s]
Epoch 2: 77%|███████▋ | 9493/12384 [20:09:10<6:14:04, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=8.43s]
Epoch 2: 77%|███████▋ | 9493/12384 [20:09:17<6:14:04, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 77%|███████▋ | 9494/12384 [20:09:17<6:11:42, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 77%|███████▋ | 9494/12384 [20:09:25<6:11:42, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=4.61s]
Epoch 2: 77%|███████▋ | 9495/12384 [20:09:25<6:10:08, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.61s]
Epoch 2: 77%|███████▋ | 9495/12384 [20:09:33<6:10:08, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.81s]
Epoch 2: 77%|███████▋ | 9496/12384 [20:09:33<6:10:43, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.81s]
Epoch 2: 77%|███████▋ | 9496/12384 [20:09:40<6:10:43, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 2: 77%|███████▋ | 9497/12384 [20:09:40<6:09:05, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.53s]
Epoch 2: 77%|███████▋ | 9497/12384 [20:09:48<6:09:05, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 77%|███████▋ | 9498/12384 [20:09:48<6:07:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 77%|███████▋ | 9498/12384 [20:09:56<6:07:53, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 77%|███████▋ | 9499/12384 [20:09:56<6:06:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 77%|███████▋ | 9499/12384 [20:10:03<6:06:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 77%|███████▋ | 9500/12384 [20:10:03<6:06:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 2: 77%|███████▋ | 9500/12384 [20:10:11<6:06:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.95s]
Epoch 2: 77%|███████▋ | 9501/12384 [20:10:11<6:05:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.95s]
Epoch 2: 77%|███████▋ | 9501/12384 [20:10:18<6:05:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 2: 77%|███████▋ | 9502/12384 [20:10:18<6:05:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 2: 77%|███████▋ | 9502/12384 [20:10:26<6:05:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 77%|███████▋ | 9503/12384 [20:10:26<6:05:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 77%|███████▋ | 9503/12384 [20:10:34<6:05:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 2: 77%|███████▋ | 9504/12384 [20:10:34<6:04:48, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 2: 77%|███████▋ | 9504/12384 [20:10:41<6:04:48, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 77%|███████▋ | 9505/12384 [20:10:41<6:04:32, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 77%|███████▋ | 9505/12384 [20:10:49<6:04:32, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 77%|███████▋ | 9506/12384 [20:10:49<6:05:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 77%|███████▋ | 9506/12384 [20:10:57<6:05:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 77%|███████▋ | 9507/12384 [20:10:57<6:09:31, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 77%|███████▋ | 9507/12384 [20:11:04<6:09:31, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 77%|███████▋ | 9508/12384 [20:11:04<6:08:27, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 77%|███████▋ | 9508/12384 [20:11:12<6:08:27, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 77%|███████▋ | 9509/12384 [20:11:12<6:06:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 77%|███████▋ | 9509/12384 [20:11:20<6:06:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 2: 77%|███████▋ | 9510/12384 [20:11:20<6:09:04, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 2: 77%|███████▋ | 9510/12384 [20:11:28<6:09:04, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=11.17s]
Epoch 2: 77%|███████▋ | 9511/12384 [20:11:28<6:10:46, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=11.17s]
Epoch 2: 77%|███████▋ | 9511/12384 [20:11:35<6:10:46, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 2: 77%|███████▋ | 9512/12384 [20:11:35<6:10:08, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 2: 77%|███████▋ | 9512/12384 [20:11:43<6:10:08, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 77%|███████▋ | 9513/12384 [20:11:43<6:09:27, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 77%|███████▋ | 9513/12384 [20:11:51<6:09:27, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.17s]
Epoch 2: 77%|███████▋ | 9514/12384 [20:11:51<6:08:18, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.17s]
Epoch 2: 77%|███████▋ | 9514/12384 [20:11:59<6:08:18, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.26s]
Epoch 2: 77%|███████▋ | 9515/12384 [20:11:59<6:09:38, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=10.26s]
Epoch 2: 77%|███████▋ | 9515/12384 [20:12:06<6:09:38, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=4.66s]
Epoch 2: 77%|███████▋ | 9516/12384 [20:12:06<6:07:59, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.66s]
Epoch 2: 77%|███████▋ | 9516/12384 [20:12:14<6:07:59, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 2: 77%|███████▋ | 9517/12384 [20:12:14<6:11:58, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 2: 77%|███████▋ | 9517/12384 [20:12:22<6:11:58, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=4.54s]
Epoch 2: 77%|███████▋ | 9518/12384 [20:12:22<6:09:36, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=4.54s]
Epoch 2: 77%|███████▋ | 9518/12384 [20:12:29<6:09:36, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=11.03s]
Epoch 2: 77%|███████▋ | 9519/12384 [20:12:29<6:08:22, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=11.03s]
Epoch 2: 77%|███████▋ | 9519/12384 [20:12:37<6:08:22, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 77%|███████▋ | 9520/12384 [20:12:37<6:07:47, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 77%|███████▋ | 9520/12384 [20:12:45<6:07:47, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 77%|███████▋ | 9521/12384 [20:12:45<6:07:41, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 77%|███████▋ | 9521/12384 [20:12:52<6:07:41, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 2: 77%|███████▋ | 9522/12384 [20:12:52<6:07:29, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 2: 77%|███████▋ | 9522/12384 [20:13:00<6:07:29, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.65s]
Epoch 2: 77%|███████▋ | 9523/12384 [20:13:00<6:07:11, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.65s]
Epoch 2: 77%|███████▋ | 9523/12384 [20:13:08<6:07:11, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 2: 77%|███████▋ | 9524/12384 [20:13:08<6:07:18, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 2: 77%|███████▋ | 9524/12384 [20:13:16<6:07:18, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 77%|███████▋ | 9525/12384 [20:13:16<6:06:55, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 77%|███████▋ | 9525/12384 [20:13:23<6:06:55, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 2: 77%|███████▋ | 9526/12384 [20:13:23<6:05:52, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 2: 77%|███████▋ | 9526/12384 [20:13:31<6:05:52, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 2: 77%|███████▋ | 9527/12384 [20:13:31<6:05:40, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 2: 77%|███████▋ | 9527/12384 [20:13:39<6:05:40, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 2: 77%|███████▋ | 9528/12384 [20:13:39<6:05:50, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 2: 77%|███████▋ | 9528/12384 [20:13:46<6:05:50, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.99s]
Epoch 2: 77%|███████▋ | 9529/12384 [20:13:46<6:06:07, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.99s]
Epoch 2: 77%|███████▋ | 9529/12384 [20:13:54<6:06:07, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=10.02s]
Epoch 2: 77%|███████▋ | 9530/12384 [20:13:54<6:06:08, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.02s]
Epoch 2: 77%|███████▋ | 9530/12384 [20:14:02<6:06:08, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 77%|███████▋ | 9531/12384 [20:14:02<6:06:21, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 77%|███████▋ | 9531/12384 [20:14:10<6:06:21, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 2: 77%|███████▋ | 9532/12384 [20:14:10<6:08:17, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 2: 77%|███████▋ | 9532/12384 [20:14:18<6:08:17, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 2: 77%|███████▋ | 9533/12384 [20:14:18<6:10:35, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 2: 77%|███████▋ | 9533/12384 [20:14:25<6:10:35, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 77%|███████▋ | 9534/12384 [20:14:25<6:11:04, 7.81s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 77%|███████▋ | 9534/12384 [20:14:33<6:11:04, 7.81s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 2: 77%|███████▋ | 9535/12384 [20:14:33<6:09:48, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 2: 77%|███████▋ | 9535/12384 [20:14:41<6:09:48, 7.79s/it, loss=0.0001, acc=1.0000, iter_time=8.75s]
Epoch 2: 77%|███████▋ | 9536/12384 [20:14:41<6:10:03, 7.80s/it, loss=0.0001, acc=1.0000, iter_time=8.75s]
Epoch 2: 77%|███████▋ | 9536/12384 [20:14:49<6:10:03, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 77%|███████▋ | 9537/12384 [20:14:49<6:08:26, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 77%|███████▋ | 9537/12384 [20:14:56<6:08:26, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=4.21s]
Epoch 2: 77%|███████▋ | 9538/12384 [20:14:56<6:07:45, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=4.21s]
Epoch 2: 77%|███████▋ | 9538/12384 [20:15:04<6:07:45, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=11.24s]
Epoch 2: 77%|███████▋ | 9539/12384 [20:15:04<6:06:24, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=11.24s]
Epoch 2: 77%|███████▋ | 9539/12384 [20:15:12<6:06:24, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 2: 77%|███████▋ | 9540/12384 [20:15:12<6:05:54, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.10s]
Epoch 2: 77%|███████▋ | 9540/12384 [20:15:19<6:05:54, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 2: 77%|███████▋ | 9541/12384 [20:15:19<6:05:46, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.51s]
Epoch 2: 77%|███████▋ | 9541/12384 [20:15:27<6:05:46, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 2: 77%|███████▋ | 9542/12384 [20:15:27<6:05:32, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 2: 77%|███████▋ | 9542/12384 [20:15:35<6:05:32, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.82s]
Epoch 2: 77%|███████▋ | 9543/12384 [20:15:35<6:04:48, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.82s]
Epoch 2: 77%|███████▋ | 9543/12384 [20:15:43<6:04:48, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 2: 77%|███████▋ | 9544/12384 [20:15:43<6:09:04, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 2: 77%|███████▋ | 9544/12384 [20:15:50<6:09:04, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 2: 77%|███████▋ | 9545/12384 [20:15:50<6:07:22, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 2: 77%|███████▋ | 9545/12384 [20:15:58<6:07:22, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 77%|███████▋ | 9546/12384 [20:15:58<6:06:28, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 77%|███████▋ | 9546/12384 [20:16:06<6:06:28, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 2: 77%|███████▋ | 9547/12384 [20:16:06<6:06:24, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 2: 77%|███████▋ | 9547/12384 [20:16:14<6:06:24, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 2: 77%|███████▋ | 9548/12384 [20:16:14<6:05:51, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 2: 77%|███████▋ | 9548/12384 [20:16:21<6:05:51, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 2: 77%|███████▋ | 9549/12384 [20:16:21<6:04:30, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 2: 77%|███████▋ | 9549/12384 [20:16:29<6:04:30, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.65s]
Epoch 2: 77%|███████▋ | 9550/12384 [20:16:29<6:09:13, 7.82s/it, loss=0.0000, acc=1.0000, iter_time=8.65s]
Epoch 2: 77%|███████▋ | 9550/12384 [20:16:37<6:09:13, 7.82s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 77%|███████▋ | 9551/12384 [20:16:37<6:07:42, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 77%|███████▋ | 9551/12384 [20:16:45<6:07:42, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 2: 77%|███████▋ | 9552/12384 [20:16:45<6:06:05, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 2: 77%|███████▋ | 9552/12384 [20:16:53<6:06:05, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 77%|███████▋ | 9553/12384 [20:16:53<6:05:26, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 77%|███████▋ | 9553/12384 [20:17:00<6:05:26, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 2: 77%|███████▋ | 9554/12384 [20:17:00<6:05:13, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 2: 77%|███████▋ | 9554/12384 [20:17:08<6:05:13, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=9.21s]
Epoch 2: 77%|███████▋ | 9555/12384 [20:17:08<6:04:11, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.21s]
Epoch 2: 77%|███████▋ | 9555/12384 [20:17:16<6:04:11, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 2: 77%|███████▋ | 9556/12384 [20:17:16<6:04:34, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 2: 77%|███████▋ | 9556/12384 [20:17:23<6:04:34, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 77%|███████▋ | 9557/12384 [20:17:23<6:04:01, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 77%|███████▋ | 9557/12384 [20:17:31<6:04:01, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 77%|███████▋ | 9558/12384 [20:17:31<6:03:27, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 77%|███████▋ | 9558/12384 [20:17:39<6:03:27, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 77%|███████▋ | 9559/12384 [20:17:39<6:03:44, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 77%|███████▋ | 9559/12384 [20:17:47<6:03:44, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.12s]
Epoch 2: 77%|███████▋ | 9560/12384 [20:17:47<6:03:02, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.12s]
Epoch 2: 77%|███████▋ | 9560/12384 [20:17:54<6:03:02, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 2: 77%|███████▋ | 9561/12384 [20:17:54<6:02:43, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 2: 77%|███████▋ | 9561/12384 [20:18:02<6:02:43, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 2: 77%|███████▋ | 9562/12384 [20:18:02<6:02:06, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 2: 77%|███████▋ | 9562/12384 [20:18:10<6:02:06, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 77%|███████▋ | 9563/12384 [20:18:10<6:01:22, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 77%|███████▋ | 9563/12384 [20:18:17<6:01:22, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 77%|███████▋ | 9564/12384 [20:18:17<6:01:23, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 77%|███████▋ | 9564/12384 [20:18:25<6:01:23, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 2: 77%|███████▋ | 9565/12384 [20:18:25<6:00:46, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 2: 77%|███████▋ | 9565/12384 [20:18:33<6:00:46, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.43s]
Epoch 2: 77%|███████▋ | 9566/12384 [20:18:33<6:01:00, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.43s]
Epoch 2: 77%|███████▋ | 9566/12384 [20:18:40<6:01:00, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=10.51s]
Epoch 2: 77%|███████▋ | 9567/12384 [20:18:40<6:00:20, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=10.51s]
Epoch 2: 77%|███████▋ | 9567/12384 [20:18:48<6:00:20, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.14s]
Epoch 2: 77%|███████▋ | 9568/12384 [20:18:48<6:01:05, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.14s]
Epoch 2: 77%|███████▋ | 9568/12384 [20:18:56<6:01:05, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.27s]
Epoch 2: 77%|███████▋ | 9569/12384 [20:18:56<6:01:00, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.27s]
Epoch 2: 77%|███████▋ | 9569/12384 [20:19:04<6:01:00, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.16s]
Epoch 2: 77%|███████▋ | 9570/12384 [20:19:04<6:06:42, 7.82s/it, loss=0.0000, acc=1.0000, iter_time=5.16s]
Epoch 2: 77%|███████▋ | 9570/12384 [20:19:11<6:06:42, 7.82s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 2: 77%|███████▋ | 9571/12384 [20:19:11<6:04:23, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 2: 77%|███████▋ | 9571/12384 [20:19:19<6:04:23, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 77%|███████▋ | 9572/12384 [20:19:19<6:02:50, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 77%|███████▋ | 9572/12384 [20:19:27<6:02:50, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 2: 77%|███████▋ | 9573/12384 [20:19:27<6:02:30, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=5.55s]
Epoch 2: 77%|███████▋ | 9573/12384 [20:19:35<6:02:30, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 2: 77%|███████▋ | 9574/12384 [20:19:35<6:01:39, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 2: 77%|███████▋ | 9574/12384 [20:19:42<6:01:39, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.79s]
Epoch 2: 77%|███████▋ | 9575/12384 [20:19:42<6:00:36, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.79s]
Epoch 2: 77%|███████▋ | 9575/12384 [20:19:50<6:00:36, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 2: 77%|███████▋ | 9576/12384 [20:19:50<6:00:38, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 2: 77%|███████▋ | 9576/12384 [20:19:58<6:00:38, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 77%|███████▋ | 9577/12384 [20:19:58<6:00:17, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 77%|███████▋ | 9577/12384 [20:20:05<6:00:17, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.93s]
Epoch 2: 77%|███████▋ | 9578/12384 [20:20:05<6:00:00, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.93s]
Epoch 2: 77%|███████▋ | 9578/12384 [20:20:13<6:00:00, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 2: 77%|███████▋ | 9579/12384 [20:20:13<6:00:02, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 2: 77%|███████▋ | 9579/12384 [20:20:21<6:00:02, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.57s]
Epoch 2: 77%|███████▋ | 9580/12384 [20:20:21<6:00:02, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.57s]
Epoch 2: 77%|███████▋ | 9580/12384 [20:20:28<6:00:02, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 2: 77%|███████▋ | 9581/12384 [20:20:28<5:58:40, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.41s]
Epoch 2: 77%|███████▋ | 9581/12384 [20:20:36<5:58:40, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 2: 77%|███████▋ | 9582/12384 [20:20:36<5:58:06, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.06s]
Epoch 2: 77%|███████▋ | 9582/12384 [20:20:44<5:58:06, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 77%|███████▋ | 9583/12384 [20:20:44<5:57:27, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 77%|███████▋ | 9583/12384 [20:20:51<5:57:27, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 77%|███████▋ | 9584/12384 [20:20:51<5:57:50, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 77%|███████▋ | 9584/12384 [20:20:59<5:57:50, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.04s]
Epoch 2: 77%|███████▋ | 9585/12384 [20:20:59<6:02:36, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=6.04s]
Epoch 2: 77%|███████▋ | 9585/12384 [20:21:07<6:02:36, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 2: 77%|███████▋ | 9586/12384 [20:21:07<6:04:26, 7.82s/it, loss=0.0000, acc=1.0000, iter_time=9.96s]
Epoch 2: 77%|███████▋ | 9586/12384 [20:21:15<6:04:26, 7.82s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 2: 77%|███████▋ | 9587/12384 [20:21:15<6:04:32, 7.82s/it, loss=0.0000, acc=1.0000, iter_time=6.38s]
Epoch 2: 77%|███████▋ | 9587/12384 [20:21:23<6:04:32, 7.82s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 2: 77%|███████▋ | 9588/12384 [20:21:23<6:03:10, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=9.13s]
Epoch 2: 77%|███████▋ | 9588/12384 [20:21:31<6:03:10, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=7.77s]
Epoch 2: 77%|███████▋ | 9589/12384 [20:21:31<6:02:04, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=7.77s]
Epoch 2: 77%|███████▋ | 9589/12384 [20:21:38<6:02:04, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=5.73s]
Epoch 2: 77%|███████▋ | 9590/12384 [20:21:38<6:00:33, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=5.73s]
Epoch 2: 77%|███████▋ | 9590/12384 [20:21:46<6:00:33, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=9.63s]
Epoch 2: 77%|███████▋ | 9591/12384 [20:21:46<5:59:47, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=9.63s]
Epoch 2: 77%|███████▋ | 9591/12384 [20:21:54<5:59:47, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 77%|███████▋ | 9592/12384 [20:21:54<5:59:11, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 77%|███████▋ | 9592/12384 [20:22:01<5:59:11, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.76s]
Epoch 2: 77%|███████▋ | 9593/12384 [20:22:01<5:58:55, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.76s]
Epoch 2: 77%|███████▋ | 9593/12384 [20:22:09<5:58:55, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=4.27s]
Epoch 2: 77%|███████▋ | 9594/12384 [20:22:09<5:58:42, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.27s]
Epoch 2: 77%|███████▋ | 9594/12384 [20:22:17<5:58:42, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 2: 77%|███████▋ | 9595/12384 [20:22:17<5:58:06, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 2: 77%|███████▋ | 9595/12384 [20:22:24<5:58:06, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.75s]
Epoch 2: 77%|███████▋ | 9596/12384 [20:22:24<5:59:19, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=10.75s]
Epoch 2: 77%|███████▋ | 9596/12384 [20:22:33<5:59:19, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=4.80s]
Epoch 2: 77%|███████▋ | 9597/12384 [20:22:33<6:08:52, 7.94s/it, loss=0.0000, acc=1.0000, iter_time=4.80s]
Epoch 2: 77%|███████▋ | 9597/12384 [20:22:41<6:08:52, 7.94s/it, loss=0.0000, acc=1.0000, iter_time=11.42s]
Epoch 2: 78%|███████▊ | 9598/12384 [20:22:41<6:06:23, 7.89s/it, loss=0.0000, acc=1.0000, iter_time=11.42s]
Epoch 2: 78%|███████▊ | 9598/12384 [20:22:49<6:06:23, 7.89s/it, loss=0.0000, acc=1.0000, iter_time=8.38s]
Epoch 2: 78%|███████▊ | 9599/12384 [20:22:49<6:11:57, 8.01s/it, loss=0.0000, acc=1.0000, iter_time=8.38s]
Epoch 2: 78%|███████▊ | 9599/12384 [20:22:57<6:11:57, 8.01s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 2: 78%|███████▊ | 9600/12384 [20:22:57<6:07:11, 7.91s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 2: 78%|███████▊ | 9600/12384 [20:23:04<6:07:11, 7.91s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 78%|███████▊ | 9601/12384 [20:23:04<6:04:21, 7.86s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 78%|███████▊ | 9601/12384 [20:23:12<6:04:21, 7.86s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 2: 78%|███████▊ | 9602/12384 [20:23:12<6:02:20, 7.81s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 2: 78%|███████▊ | 9602/12384 [20:23:20<6:02:20, 7.81s/it, loss=0.0000, acc=1.0000, iter_time=11.33s]
Epoch 2: 78%|███████▊ | 9603/12384 [20:23:20<6:01:03, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=11.33s]
Epoch 2: 78%|███████▊ | 9603/12384 [20:23:28<6:01:03, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 2: 78%|███████▊ | 9604/12384 [20:23:28<6:01:44, 7.81s/it, loss=0.0000, acc=1.0000, iter_time=7.84s]
Epoch 2: 78%|███████▊ | 9604/12384 [20:23:36<6:01:44, 7.81s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 78%|███████▊ | 9605/12384 [20:23:36<6:01:51, 7.81s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 78%|███████▊ | 9605/12384 [20:23:43<6:01:51, 7.81s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 2: 78%|███████▊ | 9606/12384 [20:23:43<6:01:56, 7.82s/it, loss=0.0000, acc=1.0000, iter_time=7.85s]
Epoch 2: 78%|███████▊ | 9606/12384 [20:23:51<6:01:56, 7.82s/it, loss=0.0000, acc=1.0000, iter_time=4.60s]
Epoch 2: 78%|███████▊ | 9607/12384 [20:23:51<6:02:30, 7.83s/it, loss=0.0000, acc=1.0000, iter_time=4.60s]
Epoch 2: 78%|███████▊ | 9607/12384 [20:23:59<6:02:30, 7.83s/it, loss=0.0000, acc=1.0000, iter_time=11.44s]
Epoch 2: 78%|███████▊ | 9608/12384 [20:23:59<6:02:30, 7.84s/it, loss=0.0000, acc=1.0000, iter_time=11.44s]
Epoch 2: 78%|███████▊ | 9608/12384 [20:24:07<6:02:30, 7.84s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 2: 78%|███████▊ | 9609/12384 [20:24:07<6:02:24, 7.84s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 2: 78%|███████▊ | 9609/12384 [20:24:15<6:02:24, 7.84s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 2: 78%|███████▊ | 9610/12384 [20:24:15<6:02:01, 7.83s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 2: 78%|███████▊ | 9610/12384 [20:24:23<6:02:01, 7.83s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 2: 78%|███████▊ | 9611/12384 [20:24:23<6:02:36, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 2: 78%|███████▊ | 9611/12384 [20:24:30<6:02:36, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 78%|███████▊ | 9612/12384 [20:24:30<6:02:07, 7.84s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 78%|███████▊ | 9612/12384 [20:24:38<6:02:07, 7.84s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 78%|███████▊ | 9613/12384 [20:24:38<6:01:51, 7.84s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 78%|███████▊ | 9613/12384 [20:24:46<6:01:51, 7.84s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 2: 78%|███████▊ | 9614/12384 [20:24:46<6:01:59, 7.84s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 2: 78%|███████▊ | 9614/12384 [20:24:54<6:01:59, 7.84s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 78%|███████▊ | 9615/12384 [20:24:54<5:59:36, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 78%|███████▊ | 9615/12384 [20:25:01<5:59:36, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 2: 78%|███████▊ | 9616/12384 [20:25:01<5:58:13, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 2: 78%|███████▊ | 9616/12384 [20:25:09<5:58:13, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 2: 78%|███████▊ | 9617/12384 [20:25:09<5:57:26, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=4.81s]
Epoch 2: 78%|███████▊ | 9617/12384 [20:25:17<5:57:26, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 2: 78%|███████▊ | 9618/12384 [20:25:17<5:56:22, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 2: 78%|███████▊ | 9618/12384 [20:25:25<5:56:22, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 78%|███████▊ | 9619/12384 [20:25:25<5:56:03, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 78%|███████▊ | 9619/12384 [20:25:32<5:56:03, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=4.67s]
Epoch 2: 78%|███████▊ | 9620/12384 [20:25:32<5:55:44, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=4.67s]
Epoch 2: 78%|███████▊ | 9620/12384 [20:25:40<5:55:44, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 2: 78%|███████▊ | 9621/12384 [20:25:40<5:55:07, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 2: 78%|███████▊ | 9621/12384 [20:25:48<5:55:07, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.26s]
Epoch 2: 78%|███████▊ | 9622/12384 [20:25:48<5:54:50, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.26s]
Epoch 2: 78%|███████▊ | 9622/12384 [20:25:56<5:54:50, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 2: 78%|███████▊ | 9623/12384 [20:25:56<6:00:17, 7.83s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 2: 78%|███████▊ | 9623/12384 [20:26:04<6:00:17, 7.83s/it, loss=0.0000, acc=1.0000, iter_time=8.43s]
Epoch 2: 78%|███████▊ | 9624/12384 [20:26:04<5:58:33, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=8.43s]
Epoch 2: 78%|███████▊ | 9624/12384 [20:26:11<5:58:33, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 2: 78%|███████▊ | 9625/12384 [20:26:11<5:56:49, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 2: 78%|███████▊ | 9625/12384 [20:26:19<5:56:49, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 78%|███████▊ | 9626/12384 [20:26:19<5:56:14, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 78%|███████▊ | 9626/12384 [20:26:27<5:56:14, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 2: 78%|███████▊ | 9627/12384 [20:26:27<5:54:58, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 2: 78%|███████▊ | 9627/12384 [20:26:34<5:54:58, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 78%|███████▊ | 9628/12384 [20:26:34<5:54:30, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 78%|███████▊ | 9628/12384 [20:26:42<5:54:30, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=4.37s]
Epoch 2: 78%|███████▊ | 9629/12384 [20:26:42<5:54:07, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.37s]
Epoch 2: 78%|███████▊ | 9629/12384 [20:26:50<5:54:07, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=11.01s]
Epoch 2: 78%|███████▊ | 9630/12384 [20:26:50<5:53:09, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=11.01s]
Epoch 2: 78%|███████▊ | 9630/12384 [20:26:57<5:53:09, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 78%|███████▊ | 9631/12384 [20:26:57<5:52:35, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 78%|███████▊ | 9631/12384 [20:27:05<5:52:35, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 2: 78%|███████▊ | 9632/12384 [20:27:05<5:52:41, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 2: 78%|███████▊ | 9632/12384 [20:27:13<5:52:41, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 78%|███████▊ | 9633/12384 [20:27:13<5:52:41, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 78%|███████▊ | 9633/12384 [20:27:20<5:52:41, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.70s]
Epoch 2: 78%|███████▊ | 9634/12384 [20:27:20<5:52:50, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.70s]
Epoch 2: 78%|███████▊ | 9634/12384 [20:27:28<5:52:50, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.44s]
Epoch 2: 78%|███████▊ | 9635/12384 [20:27:28<5:53:53, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.44s]
Epoch 2: 78%|███████▊ | 9635/12384 [20:27:36<5:53:53, 7.72s/it, loss=0.0004, acc=0.9991, iter_time=10.07s]
Epoch 2: 78%|███████▊ | 9636/12384 [20:27:36<5:53:21, 7.72s/it, loss=0.0004, acc=0.9991, iter_time=10.07s]
Epoch 2: 78%|███████▊ | 9636/12384 [20:27:44<5:53:21, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 78%|███████▊ | 9637/12384 [20:27:44<5:53:18, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 78%|███████▊ | 9637/12384 [20:27:51<5:53:18, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 78%|███████▊ | 9638/12384 [20:27:51<5:52:20, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 78%|███████▊ | 9638/12384 [20:27:59<5:52:20, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 2: 78%|███████▊ | 9639/12384 [20:27:59<5:52:54, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.07s]
Epoch 2: 78%|███████▊ | 9639/12384 [20:28:07<5:52:54, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 2: 78%|███████▊ | 9640/12384 [20:28:07<5:52:31, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.74s]
Epoch 2: 78%|███████▊ | 9640/12384 [20:28:14<5:52:31, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 78%|███████▊ | 9641/12384 [20:28:14<5:51:55, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 78%|███████▊ | 9641/12384 [20:28:22<5:51:55, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 78%|███████▊ | 9642/12384 [20:28:22<5:51:28, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 78%|███████▊ | 9642/12384 [20:28:30<5:51:28, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 78%|███████▊ | 9643/12384 [20:28:30<5:51:11, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 78%|███████▊ | 9643/12384 [20:28:37<5:51:11, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 78%|███████▊ | 9644/12384 [20:28:37<5:50:42, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 78%|███████▊ | 9644/12384 [20:28:45<5:50:42, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 78%|███████▊ | 9645/12384 [20:28:45<5:49:50, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 78%|███████▊ | 9645/12384 [20:28:53<5:49:50, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 78%|███████▊ | 9646/12384 [20:28:53<5:49:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 78%|███████▊ | 9646/12384 [20:29:00<5:49:06, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.80s]
Epoch 2: 78%|███████▊ | 9647/12384 [20:29:00<5:48:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.80s]
Epoch 2: 78%|███████▊ | 9647/12384 [20:29:08<5:48:23, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.84s]
Epoch 2: 78%|███████▊ | 9648/12384 [20:29:08<5:48:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.84s]
Epoch 2: 78%|███████▊ | 9648/12384 [20:29:16<5:48:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 78%|███████▊ | 9649/12384 [20:29:16<5:52:44, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 78%|███████▊ | 9649/12384 [20:29:23<5:52:44, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 2: 78%|███████▊ | 9650/12384 [20:29:23<5:51:05, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.02s]
Epoch 2: 78%|███████▊ | 9650/12384 [20:29:31<5:51:05, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 2: 78%|███████▊ | 9651/12384 [20:29:31<5:49:48, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 2: 78%|███████▊ | 9651/12384 [20:29:39<5:49:48, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 2: 78%|███████▊ | 9652/12384 [20:29:39<5:48:52, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 2: 78%|███████▊ | 9652/12384 [20:29:46<5:48:52, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 78%|███████▊ | 9653/12384 [20:29:46<5:47:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 78%|███████▊ | 9653/12384 [20:29:54<5:47:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 2: 78%|███████▊ | 9654/12384 [20:29:54<5:47:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 2: 78%|███████▊ | 9654/12384 [20:30:02<5:47:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 78%|███████▊ | 9655/12384 [20:30:02<5:46:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 78%|███████▊ | 9655/12384 [20:30:09<5:46:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 2: 78%|███████▊ | 9656/12384 [20:30:09<5:45:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.52s]
Epoch 2: 78%|███████▊ | 9656/12384 [20:30:17<5:45:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 78%|███████▊ | 9657/12384 [20:30:17<5:45:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 78%|███████▊ | 9657/12384 [20:30:24<5:45:55, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 78%|███████▊ | 9658/12384 [20:30:24<5:46:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 78%|███████▊ | 9658/12384 [20:30:32<5:46:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 78%|███████▊ | 9659/12384 [20:30:32<5:45:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 78%|███████▊ | 9659/12384 [20:30:40<5:45:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 78%|███████▊ | 9660/12384 [20:30:40<5:46:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 78%|███████▊ | 9660/12384 [20:30:47<5:46:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 2: 78%|███████▊ | 9661/12384 [20:30:47<5:45:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.15s]
Epoch 2: 78%|███████▊ | 9661/12384 [20:30:55<5:45:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.04s]
Epoch 2: 78%|███████▊ | 9662/12384 [20:30:55<5:45:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.04s]
Epoch 2: 78%|███████▊ | 9662/12384 [20:31:02<5:45:26, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.04s]
Epoch 2: 78%|███████▊ | 9663/12384 [20:31:02<5:45:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.04s]
Epoch 2: 78%|███████▊ | 9663/12384 [20:31:10<5:45:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.58s]
Epoch 2: 78%|███████▊ | 9664/12384 [20:31:10<5:45:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.58s]
Epoch 2: 78%|███████▊ | 9664/12384 [20:31:18<5:45:00, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.96s]
Epoch 2: 78%|███████▊ | 9665/12384 [20:31:18<5:45:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.96s]
Epoch 2: 78%|███████▊ | 9665/12384 [20:31:25<5:45:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.93s]
Epoch 2: 78%|███████▊ | 9666/12384 [20:31:25<5:45:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.93s]
Epoch 2: 78%|███████▊ | 9666/12384 [20:31:33<5:45:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 78%|███████▊ | 9667/12384 [20:31:33<5:45:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 78%|███████▊ | 9667/12384 [20:31:41<5:45:23, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 78%|███████▊ | 9668/12384 [20:31:41<5:45:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 78%|███████▊ | 9668/12384 [20:31:48<5:45:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 2: 78%|███████▊ | 9669/12384 [20:31:48<5:45:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 2: 78%|███████▊ | 9669/12384 [20:31:56<5:45:27, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 2: 78%|███████▊ | 9670/12384 [20:31:56<5:45:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 2: 78%|███████▊ | 9670/12384 [20:32:03<5:45:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 2: 78%|███████▊ | 9671/12384 [20:32:03<5:44:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 2: 78%|███████▊ | 9671/12384 [20:32:11<5:44:27, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.54s]
Epoch 2: 78%|███████▊ | 9672/12384 [20:32:11<5:44:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.54s]
Epoch 2: 78%|███████▊ | 9672/12384 [20:32:19<5:44:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 78%|███████▊ | 9673/12384 [20:32:19<5:44:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 78%|███████▊ | 9673/12384 [20:32:26<5:44:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.05s]
Epoch 2: 78%|███████▊ | 9674/12384 [20:32:26<5:44:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.05s]
Epoch 2: 78%|███████▊ | 9674/12384 [20:32:34<5:44:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.26s]
Epoch 2: 78%|███████▊ | 9675/12384 [20:32:34<5:48:25, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=11.26s]
Epoch 2: 78%|███████▊ | 9675/12384 [20:32:42<5:48:25, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 2: 78%|███████▊ | 9676/12384 [20:32:42<5:46:40, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 2: 78%|███████▊ | 9676/12384 [20:32:49<5:46:40, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 2: 78%|███████▊ | 9677/12384 [20:32:49<5:45:50, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.51s]
Epoch 2: 78%|███████▊ | 9677/12384 [20:32:57<5:45:50, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 78%|███████▊ | 9678/12384 [20:32:57<5:44:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 78%|███████▊ | 9678/12384 [20:33:05<5:44:33, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 2: 78%|███████▊ | 9679/12384 [20:33:05<5:44:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.47s]
Epoch 2: 78%|███████▊ | 9679/12384 [20:33:12<5:44:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 2: 78%|███████▊ | 9680/12384 [20:33:12<5:43:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.14s]
Epoch 2: 78%|███████▊ | 9680/12384 [20:33:20<5:43:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 78%|███████▊ | 9681/12384 [20:33:20<5:43:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 78%|███████▊ | 9681/12384 [20:33:27<5:43:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 78%|███████▊ | 9682/12384 [20:33:27<5:43:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 78%|███████▊ | 9682/12384 [20:33:35<5:43:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.61s]
Epoch 2: 78%|███████▊ | 9683/12384 [20:33:35<5:43:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.61s]
Epoch 2: 78%|███████▊ | 9683/12384 [20:33:43<5:43:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 2: 78%|███████▊ | 9684/12384 [20:33:43<5:42:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.23s]
Epoch 2: 78%|███████▊ | 9684/12384 [20:33:50<5:42:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 78%|███████▊ | 9685/12384 [20:33:50<5:42:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 78%|███████▊ | 9685/12384 [20:33:58<5:42:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 2: 78%|███████▊ | 9686/12384 [20:33:58<5:43:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 2: 78%|███████▊ | 9686/12384 [20:34:06<5:43:10, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.46s]
Epoch 2: 78%|███████▊ | 9687/12384 [20:34:06<5:42:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.46s]
Epoch 2: 78%|███████▊ | 9687/12384 [20:34:13<5:42:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.32s]
Epoch 2: 78%|███████▊ | 9688/12384 [20:34:13<5:42:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.32s]
Epoch 2: 78%|███████▊ | 9688/12384 [20:34:21<5:42:54, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 2: 78%|███████▊ | 9689/12384 [20:34:21<5:42:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.36s]
Epoch 2: 78%|███████▊ | 9689/12384 [20:34:29<5:42:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 2: 78%|███████▊ | 9690/12384 [20:34:29<5:42:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.90s]
Epoch 2: 78%|███████▊ | 9690/12384 [20:34:36<5:42:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.16s]
Epoch 2: 78%|███████▊ | 9691/12384 [20:34:36<5:42:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.16s]
Epoch 2: 78%|███████▊ | 9691/12384 [20:34:44<5:42:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.07s]
Epoch 2: 78%|███████▊ | 9692/12384 [20:34:44<5:41:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.07s]
Epoch 2: 78%|███████▊ | 9692/12384 [20:34:51<5:41:52, 7.62s/it, loss=0.0002, acc=0.9994, iter_time=7.63s]
Epoch 2: 78%|███████▊ | 9693/12384 [20:34:51<5:41:22, 7.61s/it, loss=0.0002, acc=0.9994, iter_time=7.63s]
Epoch 2: 78%|███████▊ | 9693/12384 [20:34:59<5:41:22, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=3.80s]
Epoch 2: 78%|███████▊ | 9694/12384 [20:34:59<5:41:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.80s]
Epoch 2: 78%|███████▊ | 9694/12384 [20:35:07<5:41:30, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.43s]
Epoch 2: 78%|███████▊ | 9695/12384 [20:35:07<5:41:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.43s]
Epoch 2: 78%|███████▊ | 9695/12384 [20:35:14<5:41:12, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 78%|███████▊ | 9696/12384 [20:35:14<5:40:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 78%|███████▊ | 9696/12384 [20:35:22<5:40:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 2: 78%|███████▊ | 9697/12384 [20:35:22<5:40:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 2: 78%|███████▊ | 9697/12384 [20:35:29<5:40:48, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.31s]
Epoch 2: 78%|███████▊ | 9698/12384 [20:35:29<5:40:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.31s]
Epoch 2: 78%|███████▊ | 9698/12384 [20:35:37<5:40:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.46s]
Epoch 2: 78%|███████▊ | 9699/12384 [20:35:37<5:40:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=5.46s]
Epoch 2: 78%|███████▊ | 9699/12384 [20:35:45<5:40:18, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.76s]
Epoch 2: 78%|███████▊ | 9700/12384 [20:35:45<5:40:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.76s]
Epoch 2: 78%|███████▊ | 9700/12384 [20:35:53<5:40:24, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 2: 78%|███████▊ | 9701/12384 [20:35:53<5:44:28, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.65s]
Epoch 2: 78%|███████▊ | 9701/12384 [20:36:00<5:44:28, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.14s]
Epoch 2: 78%|███████▊ | 9702/12384 [20:36:00<5:43:09, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.14s]
Epoch 2: 78%|███████▊ | 9702/12384 [20:36:08<5:43:09, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 2: 78%|███████▊ | 9703/12384 [20:36:08<5:42:07, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.09s]
Epoch 2: 78%|███████▊ | 9703/12384 [20:36:15<5:42:07, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.64s]
Epoch 2: 78%|███████▊ | 9704/12384 [20:36:15<5:40:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.64s]
Epoch 2: 78%|███████▊ | 9704/12384 [20:36:23<5:40:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 2: 78%|███████▊ | 9705/12384 [20:36:23<5:40:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.72s]
Epoch 2: 78%|███████▊ | 9705/12384 [20:36:31<5:40:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 2: 78%|███████▊ | 9706/12384 [20:36:31<5:40:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 2: 78%|███████▊ | 9706/12384 [20:36:38<5:40:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 78%|███████▊ | 9707/12384 [20:36:38<5:39:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 78%|███████▊ | 9707/12384 [20:36:46<5:39:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 2: 78%|███████▊ | 9708/12384 [20:36:46<5:39:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.75s]
Epoch 2: 78%|███████▊ | 9708/12384 [20:36:53<5:39:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 78%|███████▊ | 9709/12384 [20:36:53<5:39:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 78%|███████▊ | 9709/12384 [20:37:01<5:39:19, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.82s]
Epoch 2: 78%|███████▊ | 9710/12384 [20:37:01<5:39:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.82s]
Epoch 2: 78%|███████▊ | 9710/12384 [20:37:09<5:39:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 2: 78%|███████▊ | 9711/12384 [20:37:09<5:38:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 2: 78%|███████▊ | 9711/12384 [20:37:16<5:38:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 2: 78%|███████▊ | 9712/12384 [20:37:16<5:38:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.12s]
Epoch 2: 78%|███████▊ | 9712/12384 [20:37:24<5:38:57, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 78%|███████▊ | 9713/12384 [20:37:24<5:38:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 78%|███████▊ | 9713/12384 [20:37:31<5:38:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 78%|███████▊ | 9714/12384 [20:37:31<5:38:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 78%|███████▊ | 9714/12384 [20:37:39<5:38:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 78%|███████▊ | 9715/12384 [20:37:39<5:38:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 78%|███████▊ | 9715/12384 [20:37:47<5:38:59, 7.62s/it, loss=0.0002, acc=0.9980, iter_time=7.63s]
Epoch 2: 78%|███████▊ | 9716/12384 [20:37:47<5:39:05, 7.63s/it, loss=0.0002, acc=0.9980, iter_time=7.63s]
Epoch 2: 78%|███████▊ | 9716/12384 [20:37:54<5:39:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 2: 78%|███████▊ | 9717/12384 [20:37:54<5:38:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.49s]
Epoch 2: 78%|███████▊ | 9717/12384 [20:38:02<5:38:27, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.07s]
Epoch 2: 78%|███████▊ | 9718/12384 [20:38:02<5:38:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.07s]
Epoch 2: 78%|███████▊ | 9718/12384 [20:38:10<5:38:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.15s]
Epoch 2: 78%|███████▊ | 9719/12384 [20:38:10<5:39:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.15s]
Epoch 2: 78%|███████▊ | 9719/12384 [20:38:18<5:39:34, 7.65s/it, loss=0.0007, acc=0.9987, iter_time=9.65s]
Epoch 2: 78%|███████▊ | 9720/12384 [20:38:18<5:44:23, 7.76s/it, loss=0.0007, acc=0.9987, iter_time=9.65s]
Epoch 2: 78%|███████▊ | 9720/12384 [20:38:26<5:44:23, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 2: 78%|███████▊ | 9721/12384 [20:38:26<5:48:15, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 2: 78%|███████▊ | 9721/12384 [20:38:34<5:48:15, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 2: 79%|███████▊ | 9722/12384 [20:38:34<5:51:19, 7.92s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 2: 79%|███████▊ | 9722/12384 [20:38:42<5:51:19, 7.92s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 2: 79%|███████▊ | 9723/12384 [20:38:42<5:56:03, 8.03s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 2: 79%|███████▊ | 9723/12384 [20:38:50<5:56:03, 8.03s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 2: 79%|███████▊ | 9724/12384 [20:38:50<5:50:15, 7.90s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 2: 79%|███████▊ | 9724/12384 [20:38:57<5:50:15, 7.90s/it, loss=0.0000, acc=1.0000, iter_time=8.64s]
Epoch 2: 79%|███████▊ | 9725/12384 [20:38:57<5:47:39, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=8.64s]
Epoch 2: 79%|███████▊ | 9725/12384 [20:39:05<5:47:39, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=7.82s]
Epoch 2: 79%|███████▊ | 9726/12384 [20:39:05<5:47:04, 7.83s/it, loss=0.0000, acc=1.0000, iter_time=7.82s]
Epoch 2: 79%|███████▊ | 9726/12384 [20:39:13<5:47:04, 7.83s/it, loss=0.0000, acc=1.0000, iter_time=6.58s]
Epoch 2: 79%|███████▊ | 9727/12384 [20:39:13<5:46:18, 7.82s/it, loss=0.0000, acc=1.0000, iter_time=6.58s]
Epoch 2: 79%|███████▊ | 9727/12384 [20:39:22<5:46:18, 7.82s/it, loss=0.0000, acc=1.0000, iter_time=10.36s]
Epoch 2: 79%|███████▊ | 9728/12384 [20:39:22<6:04:44, 8.24s/it, loss=0.0000, acc=1.0000, iter_time=10.36s]
Epoch 2: 79%|███████▊ | 9728/12384 [20:39:30<6:04:44, 8.24s/it, loss=0.0000, acc=1.0000, iter_time=4.06s]
Epoch 2: 79%|███████▊ | 9729/12384 [20:39:30<5:56:27, 8.06s/it, loss=0.0000, acc=1.0000, iter_time=4.06s]
Epoch 2: 79%|███████▊ | 9729/12384 [20:39:37<5:56:27, 8.06s/it, loss=0.0000, acc=1.0000, iter_time=10.28s]
Epoch 2: 79%|███████▊ | 9730/12384 [20:39:37<5:50:01, 7.91s/it, loss=0.0000, acc=1.0000, iter_time=10.28s]
Epoch 2: 79%|███████▊ | 9730/12384 [20:39:45<5:50:01, 7.91s/it, loss=0.0000, acc=1.0000, iter_time=5.71s]
Epoch 2: 79%|███████▊ | 9731/12384 [20:39:45<5:46:06, 7.83s/it, loss=0.0000, acc=1.0000, iter_time=5.71s]
Epoch 2: 79%|███████▊ | 9731/12384 [20:39:53<5:46:06, 7.83s/it, loss=0.0000, acc=1.0000, iter_time=10.88s]
Epoch 2: 79%|███████▊ | 9732/12384 [20:39:53<5:46:04, 7.83s/it, loss=0.0000, acc=1.0000, iter_time=10.88s]
Epoch 2: 79%|███████▊ | 9732/12384 [20:40:00<5:46:04, 7.83s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 2: 79%|███████▊ | 9733/12384 [20:40:00<5:43:07, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=5.62s]
Epoch 2: 79%|███████▊ | 9733/12384 [20:40:08<5:43:07, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 2: 79%|███████▊ | 9734/12384 [20:40:08<5:42:06, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 2: 79%|███████▊ | 9734/12384 [20:40:16<5:42:06, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=6.19s]
Epoch 2: 79%|███████▊ | 9735/12384 [20:40:16<5:40:07, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.19s]
Epoch 2: 79%|███████▊ | 9735/12384 [20:40:23<5:40:07, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 2: 79%|███████▊ | 9736/12384 [20:40:23<5:38:43, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 2: 79%|███████▊ | 9736/12384 [20:40:31<5:38:43, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 2: 79%|███████▊ | 9737/12384 [20:40:31<5:39:11, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 2: 79%|███████▊ | 9737/12384 [20:40:39<5:39:11, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 2: 79%|███████▊ | 9738/12384 [20:40:39<5:38:18, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.34s]
Epoch 2: 79%|███████▊ | 9738/12384 [20:40:46<5:38:18, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.86s]
Epoch 2: 79%|███████▊ | 9739/12384 [20:40:46<5:37:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.86s]
Epoch 2: 79%|███████▊ | 9739/12384 [20:40:54<5:37:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 79%|███████▊ | 9740/12384 [20:40:54<5:36:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 79%|███████▊ | 9740/12384 [20:41:02<5:36:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 2: 79%|███████▊ | 9741/12384 [20:41:02<5:35:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.09s]
Epoch 2: 79%|███████▊ | 9741/12384 [20:41:09<5:35:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 2: 79%|███████▊ | 9742/12384 [20:41:09<5:35:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 2: 79%|███████▊ | 9742/12384 [20:41:17<5:35:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 79%|███████▊ | 9743/12384 [20:41:17<5:38:33, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 79%|███████▊ | 9743/12384 [20:41:25<5:38:33, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 79%|███████▊ | 9744/12384 [20:41:25<5:37:33, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 79%|███████▊ | 9744/12384 [20:41:32<5:37:33, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=5.91s]
Epoch 2: 79%|███████▊ | 9745/12384 [20:41:32<5:36:38, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=5.91s]
Epoch 2: 79%|███████▊ | 9745/12384 [20:41:40<5:36:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.29s]
Epoch 2: 79%|███████▊ | 9746/12384 [20:41:40<5:35:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.29s]
Epoch 2: 79%|███████▊ | 9746/12384 [20:41:47<5:35:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.67s]
Epoch 2: 79%|███████▊ | 9747/12384 [20:41:47<5:35:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.67s]
Epoch 2: 79%|███████▊ | 9747/12384 [20:41:55<5:35:26, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 2: 79%|███████▊ | 9748/12384 [20:41:55<5:35:09, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 2: 79%|███████▊ | 9748/12384 [20:42:03<5:35:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 79%|███████▊ | 9749/12384 [20:42:03<5:34:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 79%|███████▊ | 9749/12384 [20:42:10<5:34:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 79%|███████▊ | 9750/12384 [20:42:10<5:34:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 79%|███████▊ | 9750/12384 [20:42:18<5:34:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 79%|███████▊ | 9751/12384 [20:42:18<5:34:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 79%|███████▊ | 9751/12384 [20:42:26<5:34:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 79%|███████▊ | 9752/12384 [20:42:26<5:34:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 79%|███████▊ | 9752/12384 [20:42:33<5:34:26, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 79%|███████▉ | 9753/12384 [20:42:33<5:33:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 79%|███████▉ | 9753/12384 [20:42:41<5:33:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 79%|███████▉ | 9754/12384 [20:42:41<5:37:58, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 79%|███████▉ | 9754/12384 [20:42:49<5:37:58, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 79%|███████▉ | 9755/12384 [20:42:49<5:36:44, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.86s]
Epoch 2: 79%|███████▉ | 9755/12384 [20:42:56<5:36:44, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 2: 79%|███████▉ | 9756/12384 [20:42:56<5:35:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.76s]
Epoch 2: 79%|███████▉ | 9756/12384 [20:43:04<5:35:21, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 2: 79%|███████▉ | 9757/12384 [20:43:04<5:34:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.47s]
Epoch 2: 79%|███████▉ | 9757/12384 [20:43:12<5:34:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 2: 79%|███████▉ | 9758/12384 [20:43:12<5:34:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.09s]
Epoch 2: 79%|███████▉ | 9758/12384 [20:43:19<5:34:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 2: 79%|███████▉ | 9759/12384 [20:43:19<5:33:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.12s]
Epoch 2: 79%|███████▉ | 9759/12384 [20:43:27<5:33:53, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.00s]
Epoch 2: 79%|███████▉ | 9760/12384 [20:43:27<5:33:17, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.00s]
Epoch 2: 79%|███████▉ | 9760/12384 [20:43:34<5:33:17, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.61s]
Epoch 2: 79%|███████▉ | 9761/12384 [20:43:34<5:32:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.61s]
Epoch 2: 79%|███████▉ | 9761/12384 [20:43:42<5:32:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.58s]
Epoch 2: 79%|███████▉ | 9762/12384 [20:43:42<5:32:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.58s]
Epoch 2: 79%|███████▉ | 9762/12384 [20:43:50<5:32:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 2: 79%|███████▉ | 9763/12384 [20:43:50<5:32:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 2: 79%|███████▉ | 9763/12384 [20:43:57<5:32:48, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 2: 79%|███████▉ | 9764/12384 [20:43:57<5:32:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.85s]
Epoch 2: 79%|███████▉ | 9764/12384 [20:44:05<5:32:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 2: 79%|███████▉ | 9765/12384 [20:44:05<5:33:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.75s]
Epoch 2: 79%|███████▉ | 9765/12384 [20:44:13<5:33:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 2: 79%|███████▉ | 9766/12384 [20:44:13<5:33:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.57s]
Epoch 2: 79%|███████▉ | 9766/12384 [20:44:20<5:33:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 2: 79%|███████▉ | 9767/12384 [20:44:20<5:32:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 2: 79%|███████▉ | 9767/12384 [20:44:28<5:32:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.06s]
Epoch 2: 79%|███████▉ | 9768/12384 [20:44:28<5:32:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.06s]
Epoch 2: 79%|███████▉ | 9768/12384 [20:44:35<5:32:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.49s]
Epoch 2: 79%|███████▉ | 9769/12384 [20:44:35<5:32:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.49s]
Epoch 2: 79%|███████▉ | 9769/12384 [20:44:43<5:32:47, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 2: 79%|███████▉ | 9770/12384 [20:44:43<5:35:44, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 2: 79%|███████▉ | 9770/12384 [20:44:51<5:35:44, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 79%|███████▉ | 9771/12384 [20:44:51<5:34:22, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 79%|███████▉ | 9771/12384 [20:44:59<5:34:22, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 79%|███████▉ | 9772/12384 [20:44:59<5:33:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 79%|███████▉ | 9772/12384 [20:45:06<5:33:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 79%|███████▉ | 9773/12384 [20:45:06<5:32:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 79%|███████▉ | 9773/12384 [20:45:14<5:32:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 2: 79%|███████▉ | 9774/12384 [20:45:14<5:31:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.96s]
Epoch 2: 79%|███████▉ | 9774/12384 [20:45:21<5:31:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 2: 79%|███████▉ | 9775/12384 [20:45:21<5:31:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.22s]
Epoch 2: 79%|███████▉ | 9775/12384 [20:45:29<5:31:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 79%|███████▉ | 9776/12384 [20:45:29<5:31:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 79%|███████▉ | 9776/12384 [20:45:37<5:31:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.75s]
Epoch 2: 79%|███████▉ | 9777/12384 [20:45:37<5:31:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.75s]
Epoch 2: 79%|███████▉ | 9777/12384 [20:45:44<5:31:02, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 2: 79%|███████▉ | 9778/12384 [20:45:44<5:30:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.10s]
Epoch 2: 79%|███████▉ | 9778/12384 [20:45:52<5:30:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 79%|███████▉ | 9779/12384 [20:45:52<5:30:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 79%|███████▉ | 9779/12384 [20:45:59<5:30:31, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 2: 79%|███████▉ | 9780/12384 [20:45:59<5:30:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 2: 79%|███████▉ | 9780/12384 [20:46:07<5:30:31, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 2: 79%|███████▉ | 9781/12384 [20:46:07<5:34:49, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 2: 79%|███████▉ | 9781/12384 [20:46:15<5:34:49, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.33s]
Epoch 2: 79%|███████▉ | 9782/12384 [20:46:15<5:33:31, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.33s]
Epoch 2: 79%|███████▉ | 9782/12384 [20:46:23<5:33:31, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 79%|███████▉ | 9783/12384 [20:46:23<5:32:04, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 79%|███████▉ | 9783/12384 [20:46:30<5:32:04, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 79%|███████▉ | 9784/12384 [20:46:30<5:31:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 79%|███████▉ | 9784/12384 [20:46:38<5:31:17, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 79%|███████▉ | 9785/12384 [20:46:38<5:30:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 79%|███████▉ | 9785/12384 [20:46:45<5:30:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 79%|███████▉ | 9786/12384 [20:46:45<5:29:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 79%|███████▉ | 9786/12384 [20:46:53<5:29:58, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 79%|███████▉ | 9787/12384 [20:46:53<5:29:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 79%|███████▉ | 9787/12384 [20:47:01<5:29:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 79%|███████▉ | 9788/12384 [20:47:01<5:29:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 79%|███████▉ | 9788/12384 [20:47:08<5:29:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 79%|███████▉ | 9789/12384 [20:47:08<5:29:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 79%|███████▉ | 9789/12384 [20:47:16<5:29:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 79%|███████▉ | 9790/12384 [20:47:16<5:29:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 79%|███████▉ | 9790/12384 [20:47:23<5:29:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 79%|███████▉ | 9791/12384 [20:47:23<5:29:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 79%|███████▉ | 9791/12384 [20:47:31<5:29:04, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 79%|███████▉ | 9792/12384 [20:47:31<5:29:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 79%|███████▉ | 9792/12384 [20:47:39<5:29:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 79%|███████▉ | 9793/12384 [20:47:39<5:28:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 79%|███████▉ | 9793/12384 [20:47:46<5:28:59, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 79%|███████▉ | 9794/12384 [20:47:46<5:29:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 79%|███████▉ | 9794/12384 [20:47:54<5:29:55, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 79%|███████▉ | 9795/12384 [20:47:54<5:29:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 79%|███████▉ | 9795/12384 [20:48:02<5:29:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.05s]
Epoch 2: 79%|███████▉ | 9796/12384 [20:48:02<5:29:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.05s]
Epoch 2: 79%|███████▉ | 9796/12384 [20:48:09<5:29:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.16s]
Epoch 2: 79%|███████▉ | 9797/12384 [20:48:09<5:29:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.16s]
Epoch 2: 79%|███████▉ | 9797/12384 [20:48:17<5:29:43, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 2: 79%|███████▉ | 9798/12384 [20:48:17<5:28:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.70s]
Epoch 2: 79%|███████▉ | 9798/12384 [20:48:25<5:28:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 79%|███████▉ | 9799/12384 [20:48:25<5:28:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 79%|███████▉ | 9799/12384 [20:48:32<5:28:33, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 79%|███████▉ | 9800/12384 [20:48:32<5:27:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 79%|███████▉ | 9800/12384 [20:48:40<5:27:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 79%|███████▉ | 9801/12384 [20:48:40<5:27:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 79%|███████▉ | 9801/12384 [20:48:47<5:27:40, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 2: 79%|███████▉ | 9802/12384 [20:48:47<5:27:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 2: 79%|███████▉ | 9802/12384 [20:48:55<5:27:18, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 2: 79%|███████▉ | 9803/12384 [20:48:55<5:28:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 2: 79%|███████▉ | 9803/12384 [20:49:03<5:28:22, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.67s]
Epoch 2: 79%|███████▉ | 9804/12384 [20:49:03<5:27:58, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.67s]
Epoch 2: 79%|███████▉ | 9804/12384 [20:49:10<5:27:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 2: 79%|███████▉ | 9805/12384 [20:49:10<5:27:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 2: 79%|███████▉ | 9805/12384 [20:49:18<5:27:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 2: 79%|███████▉ | 9806/12384 [20:49:18<5:27:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 2: 79%|███████▉ | 9806/12384 [20:49:26<5:27:11, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 2: 79%|███████▉ | 9807/12384 [20:49:26<5:31:41, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 2: 79%|███████▉ | 9807/12384 [20:49:33<5:31:41, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 2: 79%|███████▉ | 9808/12384 [20:49:33<5:30:17, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.68s]
Epoch 2: 79%|███████▉ | 9808/12384 [20:49:41<5:30:17, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.29s]
Epoch 2: 79%|███████▉ | 9809/12384 [20:49:41<5:29:07, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.29s]
Epoch 2: 79%|███████▉ | 9809/12384 [20:49:49<5:29:07, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.46s]
Epoch 2: 79%|███████▉ | 9810/12384 [20:49:49<5:28:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.46s]
Epoch 2: 79%|███████▉ | 9810/12384 [20:49:56<5:28:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.14s]
Epoch 2: 79%|███████▉ | 9811/12384 [20:49:56<5:27:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.14s]
Epoch 2: 79%|███████▉ | 9811/12384 [20:50:04<5:27:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 2: 79%|███████▉ | 9812/12384 [20:50:04<5:27:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.71s]
Epoch 2: 79%|███████▉ | 9812/12384 [20:50:12<5:27:18, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 2: 79%|███████▉ | 9813/12384 [20:50:12<5:26:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.54s]
Epoch 2: 79%|███████▉ | 9813/12384 [20:50:19<5:26:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 79%|███████▉ | 9814/12384 [20:50:19<5:26:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 79%|███████▉ | 9814/12384 [20:50:27<5:26:06, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 2: 79%|███████▉ | 9815/12384 [20:50:27<5:25:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 2: 79%|███████▉ | 9815/12384 [20:50:34<5:25:43, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.84s]
Epoch 2: 79%|███████▉ | 9816/12384 [20:50:34<5:25:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.84s]
Epoch 2: 79%|███████▉ | 9816/12384 [20:50:42<5:25:32, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.36s]
Epoch 2: 79%|███████▉ | 9817/12384 [20:50:42<5:25:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.36s]
Epoch 2: 79%|███████▉ | 9817/12384 [20:50:50<5:25:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.92s]
Epoch 2: 79%|███████▉ | 9818/12384 [20:50:50<5:25:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.92s]
Epoch 2: 79%|███████▉ | 9818/12384 [20:50:57<5:25:35, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 79%|███████▉ | 9819/12384 [20:50:57<5:25:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 79%|███████▉ | 9819/12384 [20:51:05<5:25:14, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 79%|███████▉ | 9820/12384 [20:51:05<5:24:46, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 79%|███████▉ | 9820/12384 [20:51:12<5:24:46, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 79%|███████▉ | 9821/12384 [20:51:12<5:24:37, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 79%|███████▉ | 9821/12384 [20:51:20<5:24:37, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 79%|███████▉ | 9822/12384 [20:51:20<5:24:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 79%|███████▉ | 9822/12384 [20:51:28<5:24:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 2: 79%|███████▉ | 9823/12384 [20:51:28<5:25:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.84s]
Epoch 2: 79%|███████▉ | 9823/12384 [20:51:35<5:25:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.24s]
Epoch 2: 79%|███████▉ | 9824/12384 [20:51:35<5:26:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.24s]
Epoch 2: 79%|███████▉ | 9824/12384 [20:51:44<5:26:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.22s]
Epoch 2: 79%|███████▉ | 9825/12384 [20:51:44<5:35:30, 7.87s/it, loss=0.0000, acc=1.0000, iter_time=6.22s]
Epoch 2: 79%|███████▉ | 9825/12384 [20:51:53<5:35:30, 7.87s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 2: 79%|███████▉ | 9826/12384 [20:51:53<5:50:07, 8.21s/it, loss=0.0000, acc=1.0000, iter_time=8.07s]
Epoch 2: 79%|███████▉ | 9826/12384 [20:52:02<5:50:07, 8.21s/it, loss=0.0000, acc=1.0000, iter_time=10.81s]
Epoch 2: 79%|███████▉ | 9827/12384 [20:52:02<6:00:02, 8.45s/it, loss=0.0000, acc=1.0000, iter_time=10.81s]
Epoch 2: 79%|███████▉ | 9827/12384 [20:52:09<6:00:02, 8.45s/it, loss=0.0000, acc=1.0000, iter_time=8.59s]
Epoch 2: 79%|███████▉ | 9828/12384 [20:52:09<5:49:55, 8.21s/it, loss=0.0000, acc=1.0000, iter_time=8.59s]
Epoch 2: 79%|███████▉ | 9828/12384 [20:52:17<5:49:55, 8.21s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 2: 79%|███████▉ | 9829/12384 [20:52:17<5:43:10, 8.06s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 2: 79%|███████▉ | 9829/12384 [20:52:25<5:43:10, 8.06s/it, loss=0.0000, acc=1.0000, iter_time=9.31s]
Epoch 2: 79%|███████▉ | 9830/12384 [20:52:25<5:38:47, 7.96s/it, loss=0.0000, acc=1.0000, iter_time=9.31s]
Epoch 2: 79%|███████▉ | 9830/12384 [20:52:32<5:38:47, 7.96s/it, loss=0.0000, acc=1.0000, iter_time=8.67s]
Epoch 2: 79%|███████▉ | 9831/12384 [20:52:32<5:35:21, 7.88s/it, loss=0.0000, acc=1.0000, iter_time=8.67s]
Epoch 2: 79%|███████▉ | 9831/12384 [20:52:40<5:35:21, 7.88s/it, loss=0.0000, acc=1.0000, iter_time=8.14s]
Epoch 2: 79%|███████▉ | 9832/12384 [20:52:40<5:33:06, 7.83s/it, loss=0.0000, acc=1.0000, iter_time=8.14s]
Epoch 2: 79%|███████▉ | 9832/12384 [20:52:48<5:33:06, 7.83s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 2: 79%|███████▉ | 9833/12384 [20:52:48<5:36:10, 7.91s/it, loss=0.0000, acc=1.0000, iter_time=4.48s]
Epoch 2: 79%|███████▉ | 9833/12384 [20:52:56<5:36:10, 7.91s/it, loss=0.0000, acc=1.0000, iter_time=10.90s]
Epoch 2: 79%|███████▉ | 9834/12384 [20:52:56<5:33:19, 7.84s/it, loss=0.0000, acc=1.0000, iter_time=10.90s]
Epoch 2: 79%|███████▉ | 9834/12384 [20:53:04<5:33:19, 7.84s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 2: 79%|███████▉ | 9835/12384 [20:53:04<5:31:05, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=5.11s]
Epoch 2: 79%|███████▉ | 9835/12384 [20:53:11<5:31:05, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=10.26s]
Epoch 2: 79%|███████▉ | 9836/12384 [20:53:11<5:30:03, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=10.26s]
Epoch 2: 79%|███████▉ | 9836/12384 [20:53:19<5:30:03, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 79%|███████▉ | 9837/12384 [20:53:19<5:28:27, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 79%|███████▉ | 9837/12384 [20:53:27<5:28:27, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 2: 79%|███████▉ | 9838/12384 [20:53:27<5:27:12, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 2: 79%|███████▉ | 9838/12384 [20:53:34<5:27:12, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.01s]
Epoch 2: 79%|███████▉ | 9839/12384 [20:53:34<5:27:05, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.01s]
Epoch 2: 79%|███████▉ | 9839/12384 [20:53:42<5:27:05, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.06s]
Epoch 2: 79%|███████▉ | 9840/12384 [20:53:42<5:26:35, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.06s]
Epoch 2: 79%|███████▉ | 9840/12384 [20:53:50<5:26:35, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 2: 79%|███████▉ | 9841/12384 [20:53:50<5:25:47, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 2: 79%|███████▉ | 9841/12384 [20:53:57<5:25:47, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 79%|███████▉ | 9842/12384 [20:53:57<5:25:29, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 79%|███████▉ | 9842/12384 [20:54:05<5:25:29, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 79%|███████▉ | 9843/12384 [20:54:05<5:25:16, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 79%|███████▉ | 9843/12384 [20:54:13<5:25:16, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 2: 79%|███████▉ | 9844/12384 [20:54:13<5:24:47, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.60s]
Epoch 2: 79%|███████▉ | 9844/12384 [20:54:20<5:24:47, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 79%|███████▉ | 9845/12384 [20:54:20<5:24:58, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.93s]
Epoch 2: 79%|███████▉ | 9845/12384 [20:54:28<5:24:58, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 2: 80%|███████▉ | 9846/12384 [20:54:28<5:24:21, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 2: 80%|███████▉ | 9846/12384 [20:54:36<5:24:21, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 80%|███████▉ | 9847/12384 [20:54:36<5:24:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 80%|███████▉ | 9847/12384 [20:54:43<5:24:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.62s]
Epoch 2: 80%|███████▉ | 9848/12384 [20:54:43<5:24:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.62s]
Epoch 2: 80%|███████▉ | 9848/12384 [20:54:51<5:24:13, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 2: 80%|███████▉ | 9849/12384 [20:54:51<5:24:04, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 2: 80%|███████▉ | 9849/12384 [20:54:59<5:24:04, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 80%|███████▉ | 9850/12384 [20:54:59<5:24:23, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 80%|███████▉ | 9850/12384 [20:55:06<5:24:23, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 2: 80%|███████▉ | 9851/12384 [20:55:06<5:24:08, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.32s]
Epoch 2: 80%|███████▉ | 9851/12384 [20:55:14<5:24:08, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.02s]
Epoch 2: 80%|███████▉ | 9852/12384 [20:55:14<5:23:56, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.02s]
Epoch 2: 80%|███████▉ | 9852/12384 [20:55:22<5:23:56, 7.68s/it, loss=0.0007, acc=0.9972, iter_time=7.67s]
Epoch 2: 80%|███████▉ | 9853/12384 [20:55:22<5:23:40, 7.67s/it, loss=0.0007, acc=0.9972, iter_time=7.67s]
Epoch 2: 80%|███████▉ | 9853/12384 [20:55:30<5:23:40, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 80%|███████▉ | 9854/12384 [20:55:30<5:23:54, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 80%|███████▉ | 9854/12384 [20:55:37<5:23:54, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 80%|███████▉ | 9855/12384 [20:55:37<5:24:04, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 80%|███████▉ | 9855/12384 [20:55:45<5:24:04, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 80%|███████▉ | 9856/12384 [20:55:45<5:24:09, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 80%|███████▉ | 9856/12384 [20:55:53<5:24:09, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 80%|███████▉ | 9857/12384 [20:55:53<5:23:59, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 80%|███████▉ | 9857/12384 [20:56:00<5:23:59, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=3.34s]
Epoch 2: 80%|███████▉ | 9858/12384 [20:56:00<5:22:43, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=3.34s]
Epoch 2: 80%|███████▉ | 9858/12384 [20:56:08<5:22:43, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=11.94s]
Epoch 2: 80%|███████▉ | 9859/12384 [20:56:08<5:25:52, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=11.94s]
Epoch 2: 80%|███████▉ | 9859/12384 [20:56:16<5:25:52, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 80%|███████▉ | 9860/12384 [20:56:16<5:24:00, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 80%|███████▉ | 9860/12384 [20:56:23<5:24:00, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 2: 80%|███████▉ | 9861/12384 [20:56:23<5:22:47, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 2: 80%|███████▉ | 9861/12384 [20:56:31<5:22:47, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 2: 80%|███████▉ | 9862/12384 [20:56:31<5:21:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 2: 80%|███████▉ | 9862/12384 [20:56:39<5:21:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.75s]
Epoch 2: 80%|███████▉ | 9863/12384 [20:56:39<5:21:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.75s]
Epoch 2: 80%|███████▉ | 9863/12384 [20:56:46<5:21:10, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 2: 80%|███████▉ | 9864/12384 [20:56:46<5:20:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.64s]
Epoch 2: 80%|███████▉ | 9864/12384 [20:56:54<5:20:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 80%|███████▉ | 9865/12384 [20:56:54<5:20:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 80%|███████▉ | 9865/12384 [20:57:01<5:20:21, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 80%|███████▉ | 9866/12384 [20:57:01<5:19:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 80%|███████▉ | 9866/12384 [20:57:09<5:19:55, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.21s]
Epoch 2: 80%|███████▉ | 9867/12384 [20:57:09<5:20:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.21s]
Epoch 2: 80%|███████▉ | 9867/12384 [20:57:17<5:20:29, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 2: 80%|███████▉ | 9868/12384 [20:57:17<5:19:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.06s]
Epoch 2: 80%|███████▉ | 9868/12384 [20:57:24<5:19:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 80%|███████▉ | 9869/12384 [20:57:24<5:19:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 80%|███████▉ | 9869/12384 [20:57:32<5:19:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 2: 80%|███████▉ | 9870/12384 [20:57:32<5:18:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.40s]
Epoch 2: 80%|███████▉ | 9870/12384 [20:57:40<5:18:58, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.62s]
Epoch 2: 80%|███████▉ | 9871/12384 [20:57:40<5:28:46, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=9.62s]
Epoch 2: 80%|███████▉ | 9871/12384 [20:57:48<5:28:46, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 80%|███████▉ | 9872/12384 [20:57:48<5:25:48, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 80%|███████▉ | 9872/12384 [20:57:56<5:25:48, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 80%|███████▉ | 9873/12384 [20:57:56<5:23:58, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 80%|███████▉ | 9873/12384 [20:58:03<5:23:58, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=4.42s]
Epoch 2: 80%|███████▉ | 9874/12384 [20:58:03<5:22:06, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=4.42s]
Epoch 2: 80%|███████▉ | 9874/12384 [20:58:11<5:22:06, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.85s]
Epoch 2: 80%|███████▉ | 9875/12384 [20:58:11<5:21:16, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.85s]
Epoch 2: 80%|███████▉ | 9875/12384 [20:58:19<5:21:16, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 2: 80%|███████▉ | 9876/12384 [20:58:19<5:31:07, 7.92s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 2: 80%|███████▉ | 9876/12384 [20:58:27<5:31:07, 7.92s/it, loss=0.0000, acc=1.0000, iter_time=4.31s]
Epoch 2: 80%|███████▉ | 9877/12384 [20:58:27<5:27:15, 7.83s/it, loss=0.0000, acc=1.0000, iter_time=4.31s]
Epoch 2: 80%|███████▉ | 9877/12384 [20:58:36<5:27:15, 7.83s/it, loss=0.0000, acc=1.0000, iter_time=12.04s]
Epoch 2: 80%|███████▉ | 9878/12384 [20:58:36<5:38:11, 8.10s/it, loss=0.0000, acc=1.0000, iter_time=12.04s]
Epoch 2: 80%|███████▉ | 9878/12384 [20:58:43<5:38:11, 8.10s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 80%|███████▉ | 9879/12384 [20:58:43<5:31:59, 7.95s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 80%|███████▉ | 9879/12384 [20:58:51<5:31:59, 7.95s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 80%|███████▉ | 9880/12384 [20:58:51<5:27:37, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=8.01s]
Epoch 2: 80%|███████▉ | 9880/12384 [20:58:58<5:27:37, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 2: 80%|███████▉ | 9881/12384 [20:58:58<5:24:01, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 2: 80%|███████▉ | 9881/12384 [20:59:06<5:24:01, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 2: 80%|███████▉ | 9882/12384 [20:59:06<5:23:07, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 2: 80%|███████▉ | 9882/12384 [20:59:14<5:23:07, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=4.43s]
Epoch 2: 80%|███████▉ | 9883/12384 [20:59:14<5:21:23, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=4.43s]
Epoch 2: 80%|███████▉ | 9883/12384 [20:59:21<5:21:23, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.39s]
Epoch 2: 80%|███████▉ | 9884/12384 [20:59:21<5:20:04, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.39s]
Epoch 2: 80%|███████▉ | 9884/12384 [20:59:29<5:20:04, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.37s]
Epoch 2: 80%|███████▉ | 9885/12384 [20:59:29<5:23:26, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=5.37s]
Epoch 2: 80%|███████▉ | 9885/12384 [20:59:37<5:23:26, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 2: 80%|███████▉ | 9886/12384 [20:59:37<5:21:32, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.22s]
Epoch 2: 80%|███████▉ | 9886/12384 [20:59:45<5:21:32, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 80%|███████▉ | 9887/12384 [20:59:45<5:20:12, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 80%|███████▉ | 9887/12384 [20:59:52<5:20:12, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 2: 80%|███████▉ | 9888/12384 [20:59:52<5:19:34, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 2: 80%|███████▉ | 9888/12384 [21:00:00<5:19:34, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.70s]
Epoch 2: 80%|███████▉ | 9889/12384 [21:00:00<5:19:07, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.70s]
Epoch 2: 80%|███████▉ | 9889/12384 [21:00:08<5:19:07, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=10.51s]
Epoch 2: 80%|███████▉ | 9890/12384 [21:00:08<5:18:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.51s]
Epoch 2: 80%|███████▉ | 9890/12384 [21:00:15<5:18:35, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 80%|███████▉ | 9891/12384 [21:00:15<5:17:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 80%|███████▉ | 9891/12384 [21:00:23<5:17:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 2: 80%|███████▉ | 9892/12384 [21:00:23<5:17:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 2: 80%|███████▉ | 9892/12384 [21:00:30<5:17:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 2: 80%|███████▉ | 9893/12384 [21:00:30<5:17:49, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.36s]
Epoch 2: 80%|███████▉ | 9893/12384 [21:00:38<5:17:49, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 2: 80%|███████▉ | 9894/12384 [21:00:38<5:17:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.27s]
Epoch 2: 80%|███████▉ | 9894/12384 [21:00:46<5:17:16, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.00s]
Epoch 2: 80%|███████▉ | 9895/12384 [21:00:46<5:16:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.00s]
Epoch 2: 80%|███████▉ | 9895/12384 [21:00:53<5:16:37, 7.63s/it, loss=0.0005, acc=0.9978, iter_time=10.62s]
Epoch 2: 80%|███████▉ | 9896/12384 [21:00:53<5:16:44, 7.64s/it, loss=0.0005, acc=0.9978, iter_time=10.62s]
Epoch 2: 80%|███████▉ | 9896/12384 [21:01:01<5:16:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.68s]
Epoch 2: 80%|███████▉ | 9897/12384 [21:01:01<5:16:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.68s]
Epoch 2: 80%|███████▉ | 9897/12384 [21:01:09<5:16:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.70s]
Epoch 2: 80%|███████▉ | 9898/12384 [21:01:09<5:16:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.70s]
Epoch 2: 80%|███████▉ | 9898/12384 [21:01:16<5:16:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 2: 80%|███████▉ | 9899/12384 [21:01:16<5:15:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.11s]
Epoch 2: 80%|███████▉ | 9899/12384 [21:01:24<5:15:57, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 80%|███████▉ | 9900/12384 [21:01:24<5:19:21, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 80%|███████▉ | 9900/12384 [21:01:32<5:19:21, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 2: 80%|███████▉ | 9901/12384 [21:01:32<5:18:05, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.39s]
Epoch 2: 80%|███████▉ | 9901/12384 [21:01:39<5:18:05, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 2: 80%|███████▉ | 9902/12384 [21:01:39<5:17:38, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 2: 80%|███████▉ | 9902/12384 [21:01:47<5:17:38, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 2: 80%|███████▉ | 9903/12384 [21:01:47<5:16:43, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.05s]
Epoch 2: 80%|███████▉ | 9903/12384 [21:01:55<5:16:43, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.63s]
Epoch 2: 80%|███████▉ | 9904/12384 [21:01:55<5:16:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.63s]
Epoch 2: 80%|███████▉ | 9904/12384 [21:02:02<5:16:05, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 80%|███████▉ | 9905/12384 [21:02:02<5:15:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 80%|███████▉ | 9905/12384 [21:02:10<5:15:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 80%|███████▉ | 9906/12384 [21:02:10<5:15:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 80%|███████▉ | 9906/12384 [21:02:17<5:15:04, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 80%|███████▉ | 9907/12384 [21:02:17<5:14:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 80%|███████▉ | 9907/12384 [21:02:25<5:14:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 2: 80%|████████ | 9908/12384 [21:02:25<5:14:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.38s]
Epoch 2: 80%|████████ | 9908/12384 [21:02:33<5:14:33, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 80%|████████ | 9909/12384 [21:02:33<5:14:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 80%|████████ | 9909/12384 [21:02:40<5:14:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 2: 80%|████████ | 9910/12384 [21:02:40<5:15:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.74s]
Epoch 2: 80%|████████ | 9910/12384 [21:02:48<5:15:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.62s]
Epoch 2: 80%|████████ | 9911/12384 [21:02:48<5:14:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.62s]
Epoch 2: 80%|████████ | 9911/12384 [21:02:56<5:14:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.88s]
Epoch 2: 80%|████████ | 9912/12384 [21:02:56<5:18:38, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.88s]
Epoch 2: 80%|████████ | 9912/12384 [21:03:04<5:18:38, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.41s]
Epoch 2: 80%|████████ | 9913/12384 [21:03:04<5:16:54, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.41s]
Epoch 2: 80%|████████ | 9913/12384 [21:03:11<5:16:54, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 80%|████████ | 9914/12384 [21:03:11<5:17:08, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 80%|████████ | 9914/12384 [21:03:19<5:17:08, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 2: 80%|████████ | 9915/12384 [21:03:19<5:16:23, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 2: 80%|████████ | 9915/12384 [21:03:27<5:16:23, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 2: 80%|████████ | 9916/12384 [21:03:27<5:15:18, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.16s]
Epoch 2: 80%|████████ | 9916/12384 [21:03:34<5:15:18, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 2: 80%|████████ | 9917/12384 [21:03:34<5:14:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.49s]
Epoch 2: 80%|████████ | 9917/12384 [21:03:42<5:14:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 2: 80%|████████ | 9918/12384 [21:03:42<5:15:09, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.25s]
Epoch 2: 80%|████████ | 9918/12384 [21:03:50<5:15:09, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 80%|████████ | 9919/12384 [21:03:50<5:14:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 80%|████████ | 9919/12384 [21:03:57<5:14:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 80%|████████ | 9920/12384 [21:03:57<5:13:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 80%|████████ | 9920/12384 [21:04:05<5:13:35, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 2: 80%|████████ | 9921/12384 [21:04:05<5:12:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.04s]
Epoch 2: 80%|████████ | 9921/12384 [21:04:12<5:12:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.99s]
Epoch 2: 80%|████████ | 9922/12384 [21:04:12<5:13:06, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.99s]
Epoch 2: 80%|████████ | 9922/12384 [21:04:20<5:13:06, 7.63s/it, loss=0.0009, acc=0.9974, iter_time=7.95s]
Epoch 2: 80%|████████ | 9923/12384 [21:04:20<5:13:51, 7.65s/it, loss=0.0009, acc=0.9974, iter_time=7.95s]
Epoch 2: 80%|████████ | 9923/12384 [21:04:28<5:13:51, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.14s]
Epoch 2: 80%|████████ | 9924/12384 [21:04:28<5:16:00, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.14s]
Epoch 2: 80%|████████ | 9924/12384 [21:04:36<5:16:00, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.53s]
Epoch 2: 80%|████████ | 9925/12384 [21:04:36<5:17:16, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=9.53s]
Epoch 2: 80%|████████ | 9925/12384 [21:04:44<5:17:16, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.12s]
Epoch 2: 80%|████████ | 9926/12384 [21:04:44<5:21:41, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=8.12s]
Epoch 2: 80%|████████ | 9926/12384 [21:04:51<5:21:41, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=4.11s]
Epoch 2: 80%|████████ | 9927/12384 [21:04:51<5:18:45, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=4.11s]
Epoch 2: 80%|████████ | 9927/12384 [21:04:59<5:18:45, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=11.28s]
Epoch 2: 80%|████████ | 9928/12384 [21:04:59<5:19:12, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=11.28s]
Epoch 2: 80%|████████ | 9928/12384 [21:05:07<5:19:12, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=3.87s]
Epoch 2: 80%|████████ | 9929/12384 [21:05:07<5:17:06, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=3.87s]
Epoch 2: 80%|████████ | 9929/12384 [21:05:15<5:17:06, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=10.27s]
Epoch 2: 80%|████████ | 9930/12384 [21:05:15<5:16:09, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=10.27s]
Epoch 2: 80%|████████ | 9930/12384 [21:05:22<5:16:09, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=6.88s]
Epoch 2: 80%|████████ | 9931/12384 [21:05:22<5:15:31, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.88s]
Epoch 2: 80%|████████ | 9931/12384 [21:05:30<5:15:31, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.11s]
Epoch 2: 80%|████████ | 9932/12384 [21:05:30<5:14:40, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.11s]
Epoch 2: 80%|████████ | 9932/12384 [21:05:38<5:14:40, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 80%|████████ | 9933/12384 [21:05:38<5:14:29, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 80%|████████ | 9933/12384 [21:05:45<5:14:29, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 80%|████████ | 9934/12384 [21:05:45<5:13:40, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 80%|████████ | 9934/12384 [21:05:53<5:13:40, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 80%|████████ | 9935/12384 [21:05:53<5:13:44, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 80%|████████ | 9935/12384 [21:06:01<5:13:44, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 2: 80%|████████ | 9936/12384 [21:06:01<5:15:07, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.20s]
Epoch 2: 80%|████████ | 9936/12384 [21:06:09<5:15:07, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 2: 80%|████████ | 9937/12384 [21:06:09<5:15:24, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 2: 80%|████████ | 9937/12384 [21:06:17<5:15:24, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=4.89s]
Epoch 2: 80%|████████ | 9938/12384 [21:06:17<5:18:05, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=4.89s]
Epoch 2: 80%|████████ | 9938/12384 [21:06:24<5:18:05, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 2: 80%|████████ | 9939/12384 [21:06:24<5:15:49, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=9.18s]
Epoch 2: 80%|████████ | 9939/12384 [21:06:32<5:15:49, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 2: 80%|████████ | 9940/12384 [21:06:32<5:13:54, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.15s]
Epoch 2: 80%|████████ | 9940/12384 [21:06:39<5:13:54, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 80%|████████ | 9941/12384 [21:06:39<5:12:46, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 80%|████████ | 9941/12384 [21:06:47<5:12:46, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 2: 80%|████████ | 9942/12384 [21:06:47<5:11:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.28s]
Epoch 2: 80%|████████ | 9942/12384 [21:06:55<5:11:54, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 2: 80%|████████ | 9943/12384 [21:06:55<5:10:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.97s]
Epoch 2: 80%|████████ | 9943/12384 [21:07:02<5:10:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 80%|████████ | 9944/12384 [21:07:02<5:10:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 80%|████████ | 9944/12384 [21:07:10<5:10:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=3.58s]
Epoch 2: 80%|████████ | 9945/12384 [21:07:10<5:11:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=3.58s]
Epoch 2: 80%|████████ | 9945/12384 [21:07:18<5:11:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.05s]
Epoch 2: 80%|████████ | 9946/12384 [21:07:18<5:10:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=11.05s]
Epoch 2: 80%|████████ | 9946/12384 [21:07:25<5:10:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 2: 80%|████████ | 9947/12384 [21:07:25<5:10:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 2: 80%|████████ | 9947/12384 [21:07:33<5:10:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.17s]
Epoch 2: 80%|████████ | 9948/12384 [21:07:33<5:10:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.17s]
Epoch 2: 80%|████████ | 9948/12384 [21:07:40<5:10:08, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 2: 80%|████████ | 9949/12384 [21:07:40<5:10:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.73s]
Epoch 2: 80%|████████ | 9949/12384 [21:07:48<5:10:39, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 80%|████████ | 9950/12384 [21:07:48<5:09:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 80%|████████ | 9950/12384 [21:07:56<5:09:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 2: 80%|████████ | 9951/12384 [21:07:56<5:09:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.47s]
Epoch 2: 80%|████████ | 9951/12384 [21:08:03<5:09:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.10s]
Epoch 2: 80%|████████ | 9952/12384 [21:08:03<5:09:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.10s]
Epoch 2: 80%|████████ | 9952/12384 [21:08:11<5:09:12, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 80%|████████ | 9953/12384 [21:08:11<5:12:06, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 80%|████████ | 9953/12384 [21:08:19<5:12:06, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 80%|████████ | 9954/12384 [21:08:19<5:10:58, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 80%|████████ | 9954/12384 [21:08:27<5:10:58, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.19s]
Epoch 2: 80%|████████ | 9955/12384 [21:08:27<5:11:18, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.19s]
Epoch 2: 80%|████████ | 9955/12384 [21:08:34<5:11:18, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 80%|████████ | 9956/12384 [21:08:34<5:10:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 80%|████████ | 9956/12384 [21:08:42<5:10:19, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 80%|████████ | 9957/12384 [21:08:42<5:09:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 80%|████████ | 9957/12384 [21:08:49<5:09:29, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 2: 80%|████████ | 9958/12384 [21:08:49<5:09:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 2: 80%|████████ | 9958/12384 [21:08:57<5:09:26, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 80%|████████ | 9959/12384 [21:08:57<5:10:11, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 2: 80%|████████ | 9959/12384 [21:09:05<5:10:11, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 80%|████████ | 9960/12384 [21:09:05<5:09:46, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 80%|████████ | 9960/12384 [21:09:12<5:09:46, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 80%|████████ | 9961/12384 [21:09:12<5:09:01, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 80%|████████ | 9961/12384 [21:09:20<5:09:01, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 80%|████████ | 9962/12384 [21:09:20<5:08:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 80%|████████ | 9962/12384 [21:09:28<5:08:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 80%|████████ | 9963/12384 [21:09:28<5:08:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 80%|████████ | 9963/12384 [21:09:35<5:08:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 80%|████████ | 9964/12384 [21:09:35<5:07:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 80%|████████ | 9964/12384 [21:09:43<5:07:40, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=7.64s]
Epoch 2: 80%|████████ | 9965/12384 [21:09:43<5:11:18, 7.72s/it, loss=0.0001, acc=0.9998, iter_time=7.64s]
Epoch 2: 80%|████████ | 9965/12384 [21:09:51<5:11:18, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 2: 80%|████████ | 9966/12384 [21:09:51<5:10:16, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 2: 80%|████████ | 9966/12384 [21:09:59<5:10:16, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 2: 80%|████████ | 9967/12384 [21:09:59<5:10:19, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 2: 80%|████████ | 9967/12384 [21:10:06<5:10:19, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.66s]
Epoch 2: 80%|████████ | 9968/12384 [21:10:06<5:09:21, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.66s]
Epoch 2: 80%|████████ | 9968/12384 [21:10:14<5:09:21, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 80%|████████ | 9969/12384 [21:10:14<5:08:49, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.27s]
Epoch 2: 80%|████████ | 9969/12384 [21:10:21<5:08:49, 7.67s/it, loss=0.0003, acc=1.0000, iter_time=7.64s]
Epoch 2: 81%|████████ | 9970/12384 [21:10:21<5:08:07, 7.66s/it, loss=0.0003, acc=1.0000, iter_time=7.64s]
Epoch 2: 81%|████████ | 9970/12384 [21:10:29<5:08:07, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 81%|████████ | 9971/12384 [21:10:29<5:07:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 81%|████████ | 9971/12384 [21:10:37<5:07:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 81%|████████ | 9972/12384 [21:10:37<5:07:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 81%|████████ | 9972/12384 [21:10:44<5:07:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 81%|████████ | 9973/12384 [21:10:44<5:06:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 81%|████████ | 9973/12384 [21:10:52<5:06:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 81%|████████ | 9974/12384 [21:10:52<5:06:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 81%|████████ | 9974/12384 [21:11:00<5:06:19, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 81%|████████ | 9975/12384 [21:11:00<5:06:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 81%|████████ | 9975/12384 [21:11:07<5:06:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 81%|████████ | 9976/12384 [21:11:07<5:05:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 81%|████████ | 9976/12384 [21:11:15<5:05:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 81%|████████ | 9977/12384 [21:11:15<5:05:37, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 81%|████████ | 9977/12384 [21:11:22<5:05:37, 7.62s/it, loss=0.0001, acc=0.9989, iter_time=7.61s]
Epoch 2: 81%|████████ | 9978/12384 [21:11:22<5:05:22, 7.62s/it, loss=0.0001, acc=0.9989, iter_time=7.61s]
Epoch 2: 81%|████████ | 9978/12384 [21:11:30<5:05:22, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 81%|████████ | 9979/12384 [21:11:30<5:08:26, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 81%|████████ | 9979/12384 [21:11:38<5:08:26, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 81%|████████ | 9980/12384 [21:11:38<5:07:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 81%|████████ | 9980/12384 [21:11:46<5:07:15, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 2: 81%|████████ | 9981/12384 [21:11:46<5:06:48, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.33s]
Epoch 2: 81%|████████ | 9981/12384 [21:11:53<5:06:48, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.33s]
Epoch 2: 81%|████████ | 9982/12384 [21:11:53<5:06:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.33s]
Epoch 2: 81%|████████ | 9982/12384 [21:12:01<5:06:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.73s]
Epoch 2: 81%|████████ | 9983/12384 [21:12:01<5:05:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.73s]
Epoch 2: 81%|████████ | 9983/12384 [21:12:08<5:05:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.50s]
Epoch 2: 81%|████████ | 9984/12384 [21:12:08<5:05:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.50s]
Epoch 2: 81%|████████ | 9984/12384 [21:12:16<5:05:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 81%|████████ | 9985/12384 [21:12:16<5:06:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.30s]
Epoch 2: 81%|████████ | 9985/12384 [21:12:24<5:06:02, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 81%|████████ | 9986/12384 [21:12:24<5:06:18, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 81%|████████ | 9986/12384 [21:12:32<5:06:18, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 81%|████████ | 9987/12384 [21:12:32<5:09:36, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 81%|████████ | 9987/12384 [21:12:40<5:09:36, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 81%|████████ | 9988/12384 [21:12:40<5:11:51, 7.81s/it, loss=0.0000, acc=1.0000, iter_time=7.94s]
Epoch 2: 81%|████████ | 9988/12384 [21:12:47<5:11:51, 7.81s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 2: 81%|████████ | 9989/12384 [21:12:47<5:11:37, 7.81s/it, loss=0.0000, acc=1.0000, iter_time=4.30s]
Epoch 2: 81%|████████ | 9989/12384 [21:12:55<5:11:37, 7.81s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 2: 81%|████████ | 9990/12384 [21:12:55<5:11:57, 7.82s/it, loss=0.0000, acc=1.0000, iter_time=10.15s]
Epoch 2: 81%|████████ | 9990/12384 [21:13:03<5:11:57, 7.82s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 81%|████████ | 9991/12384 [21:13:03<5:15:21, 7.91s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 81%|████████ | 9991/12384 [21:13:11<5:15:21, 7.91s/it, loss=0.0000, acc=1.0000, iter_time=9.46s]
Epoch 2: 81%|████████ | 9992/12384 [21:13:11<5:13:13, 7.86s/it, loss=0.0000, acc=1.0000, iter_time=9.46s]
Epoch 2: 81%|████████ | 9992/12384 [21:13:19<5:13:13, 7.86s/it, loss=0.0001, acc=0.9999, iter_time=7.37s]
Epoch 2: 81%|████████ | 9993/12384 [21:13:19<5:11:24, 7.81s/it, loss=0.0001, acc=0.9999, iter_time=7.37s]
Epoch 2: 81%|████████ | 9993/12384 [21:13:27<5:11:24, 7.81s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 2: 81%|████████ | 9994/12384 [21:13:27<5:10:08, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 2: 81%|████████ | 9994/12384 [21:13:34<5:10:08, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 81%|████████ | 9995/12384 [21:13:34<5:09:21, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 81%|████████ | 9995/12384 [21:13:42<5:09:21, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 2: 81%|████████ | 9996/12384 [21:13:42<5:08:50, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 2: 81%|████████ | 9996/12384 [21:13:50<5:08:50, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 2: 81%|████████ | 9997/12384 [21:13:50<5:09:35, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=7.81s]
Epoch 2: 81%|████████ | 9997/12384 [21:13:58<5:09:35, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=5.58s]
Epoch 2: 81%|████████ | 9998/12384 [21:13:58<5:08:14, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=5.58s]
Epoch 2: 81%|████████ | 9998/12384 [21:14:05<5:08:14, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 2: 81%|████████ | 9999/12384 [21:14:05<5:07:18, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 2: 81%|████████ | 9999/12384 [21:14:13<5:07:18, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 2: 81%|████████ | 10000/12384 [21:14:13<5:06:19, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.60s]
Epoch 2: 81%|████████ | 10000/12384 [21:14:21<5:06:19, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.98s]
Epoch 2: 81%|████████ | 10001/12384 [21:14:21<5:06:09, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.98s]
Epoch 2: 81%|████████ | 10001/12384 [21:14:28<5:06:09, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 2: 81%|████████ | 10002/12384 [21:14:28<5:06:35, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 2: 81%|████████ | 10002/12384 [21:14:36<5:06:35, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.97s]
Epoch 2: 81%|████████ | 10003/12384 [21:14:36<5:06:02, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.97s]
Epoch 2: 81%|████████ | 10003/12384 [21:14:44<5:06:02, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 81%|████████ | 10004/12384 [21:14:44<5:05:39, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.68s]
Epoch 2: 81%|████████ | 10004/12384 [21:14:52<5:05:39, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 81%|████████ | 10005/12384 [21:14:52<5:09:02, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 81%|████████ | 10005/12384 [21:15:00<5:09:02, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=6.26s]
Epoch 2: 81%|████████ | 10006/12384 [21:15:00<5:08:06, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=6.26s]
Epoch 2: 81%|████████ | 10006/12384 [21:15:07<5:08:06, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 81%|████████ | 10007/12384 [21:15:07<5:06:49, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 81%|████████ | 10007/12384 [21:15:15<5:06:49, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=9.47s]
Epoch 2: 81%|████████ | 10008/12384 [21:15:15<5:06:19, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=9.47s]
Epoch 2: 81%|████████ | 10008/12384 [21:15:23<5:06:19, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.45s]
Epoch 2: 81%|████████ | 10009/12384 [21:15:23<5:07:56, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=7.45s]
Epoch 2: 81%|████████ | 10009/12384 [21:15:31<5:07:56, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=8.40s]
Epoch 2: 81%|████████ | 10010/12384 [21:15:31<5:14:38, 7.95s/it, loss=0.0000, acc=1.0000, iter_time=8.40s]
Epoch 2: 81%|████████ | 10010/12384 [21:15:39<5:14:38, 7.95s/it, loss=0.0000, acc=1.0000, iter_time=5.44s]
Epoch 2: 81%|████████ | 10011/12384 [21:15:39<5:10:56, 7.86s/it, loss=0.0000, acc=1.0000, iter_time=5.44s]
Epoch 2: 81%|████████ | 10011/12384 [21:15:46<5:10:56, 7.86s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 2: 81%|████████ | 10012/12384 [21:15:46<5:08:27, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=6.64s]
Epoch 2: 81%|████████ | 10012/12384 [21:15:54<5:08:27, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 2: 81%|████████ | 10013/12384 [21:15:54<5:06:51, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=9.48s]
Epoch 2: 81%|████████ | 10013/12384 [21:16:02<5:06:51, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=8.92s]
Epoch 2: 81%|████████ | 10014/12384 [21:16:02<5:06:04, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=8.92s]
Epoch 2: 81%|████████ | 10014/12384 [21:16:10<5:06:04, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 2: 81%|████████ | 10015/12384 [21:16:10<5:06:01, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.95s]
Epoch 2: 81%|████████ | 10015/12384 [21:16:17<5:06:01, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 2: 81%|████████ | 10016/12384 [21:16:17<5:05:09, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.15s]
Epoch 2: 81%|████████ | 10016/12384 [21:16:25<5:05:09, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 2: 81%|████████ | 10017/12384 [21:16:25<5:09:04, 7.83s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 2: 81%|████████ | 10017/12384 [21:16:33<5:09:04, 7.83s/it, loss=0.0000, acc=1.0000, iter_time=6.56s]
Epoch 2: 81%|████████ | 10018/12384 [21:16:33<5:07:25, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=6.56s]
Epoch 2: 81%|████████ | 10018/12384 [21:16:41<5:07:25, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=8.96s]
Epoch 2: 81%|████████ | 10019/12384 [21:16:41<5:06:52, 7.79s/it, loss=0.0000, acc=1.0000, iter_time=8.96s]
Epoch 2: 81%|████████ | 10019/12384 [21:16:49<5:06:52, 7.79s/it, loss=0.0001, acc=1.0000, iter_time=6.75s]
Epoch 2: 81%|████████ | 10020/12384 [21:16:49<5:05:45, 7.76s/it, loss=0.0001, acc=1.0000, iter_time=6.75s]
Epoch 2: 81%|████████ | 10020/12384 [21:16:56<5:05:45, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=6.58s]
Epoch 2: 81%|████████ | 10021/12384 [21:16:56<5:03:42, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.58s]
Epoch 2: 81%|████████ | 10021/12384 [21:17:04<5:03:42, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.85s]
Epoch 2: 81%|████████ | 10022/12384 [21:17:04<5:02:17, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.85s]
Epoch 2: 81%|████████ | 10022/12384 [21:17:11<5:02:17, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 2: 81%|████████ | 10023/12384 [21:17:11<5:01:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 2: 81%|████████ | 10023/12384 [21:17:19<5:01:29, 7.66s/it, loss=0.0001, acc=0.9999, iter_time=9.51s]
Epoch 2: 81%|████████ | 10024/12384 [21:17:19<5:00:45, 7.65s/it, loss=0.0001, acc=0.9999, iter_time=9.51s]
Epoch 2: 81%|████████ | 10024/12384 [21:17:27<5:00:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 81%|████████ | 10025/12384 [21:17:27<4:59:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 81%|████████ | 10025/12384 [21:17:34<4:59:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 81%|████████ | 10026/12384 [21:17:34<4:59:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 81%|████████ | 10026/12384 [21:17:42<4:59:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 2: 81%|████████ | 10027/12384 [21:17:42<4:59:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.41s]
Epoch 2: 81%|████████ | 10027/12384 [21:17:49<4:59:02, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 2: 81%|████████ | 10028/12384 [21:17:49<4:58:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=8.78s]
Epoch 2: 81%|████████ | 10028/12384 [21:17:57<4:58:49, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 81%|████████ | 10029/12384 [21:17:57<4:58:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 81%|████████ | 10029/12384 [21:18:05<4:58:41, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 81%|████████ | 10030/12384 [21:18:05<4:58:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 81%|████████ | 10030/12384 [21:18:12<4:58:34, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 81%|████████ | 10031/12384 [21:18:12<4:58:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 81%|████████ | 10031/12384 [21:18:20<4:58:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.42s]
Epoch 2: 81%|████████ | 10032/12384 [21:18:20<4:58:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.42s]
Epoch 2: 81%|████████ | 10032/12384 [21:18:27<4:58:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.65s]
Epoch 2: 81%|████████ | 10033/12384 [21:18:27<4:58:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.65s]
Epoch 2: 81%|████████ | 10033/12384 [21:18:35<4:58:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.96s]
Epoch 2: 81%|████████ | 10034/12384 [21:18:35<4:58:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.96s]
Epoch 2: 81%|████████ | 10034/12384 [21:18:43<4:58:35, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.89s]
Epoch 2: 81%|████████ | 10035/12384 [21:18:43<4:58:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.89s]
Epoch 2: 81%|████████ | 10035/12384 [21:18:50<4:58:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 2: 81%|████████ | 10036/12384 [21:18:50<4:59:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.29s]
Epoch 2: 81%|████████ | 10036/12384 [21:18:58<4:59:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.04s]
Epoch 2: 81%|████████ | 10037/12384 [21:18:58<4:58:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.04s]
Epoch 2: 81%|████████ | 10037/12384 [21:19:06<4:58:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 2: 81%|████████ | 10038/12384 [21:19:06<4:58:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 2: 81%|████████ | 10038/12384 [21:19:13<4:58:17, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 81%|████████ | 10039/12384 [21:19:13<4:58:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 81%|████████ | 10039/12384 [21:19:21<4:58:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.12s]
Epoch 2: 81%|████████ | 10040/12384 [21:19:21<5:00:12, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.12s]
Epoch 2: 81%|████████ | 10040/12384 [21:19:29<5:00:12, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 81%|████████ | 10041/12384 [21:19:29<5:01:45, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.54s]
Epoch 2: 81%|████████ | 10041/12384 [21:19:37<5:01:45, 7.73s/it, loss=0.0027, acc=0.9912, iter_time=7.67s]
Epoch 2: 81%|████████ | 10042/12384 [21:19:37<5:01:03, 7.71s/it, loss=0.0027, acc=0.9912, iter_time=7.67s]
Epoch 2: 81%|████████ | 10042/12384 [21:19:45<5:01:03, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 2: 81%|████████ | 10043/12384 [21:19:45<5:05:13, 7.82s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 2: 81%|████████ | 10043/12384 [21:19:52<5:05:13, 7.82s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 2: 81%|████████ | 10044/12384 [21:19:52<5:02:59, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=7.38s]
Epoch 2: 81%|████████ | 10044/12384 [21:20:00<5:02:59, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 2: 81%|████████ | 10045/12384 [21:20:00<5:01:45, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.28s]
Epoch 2: 81%|████████ | 10045/12384 [21:20:08<5:01:45, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=3.92s]
Epoch 2: 81%|████████ | 10046/12384 [21:20:08<5:00:27, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=3.92s]
Epoch 2: 81%|████████ | 10046/12384 [21:20:15<5:00:27, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=11.38s]
Epoch 2: 81%|████████ | 10047/12384 [21:20:15<5:00:04, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=11.38s]
Epoch 2: 81%|████████ | 10047/12384 [21:20:23<5:00:04, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 81%|████████ | 10048/12384 [21:20:23<4:59:43, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 81%|████████ | 10048/12384 [21:20:31<4:59:43, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 2: 81%|████████ | 10049/12384 [21:20:31<4:59:49, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 2: 81%|████████ | 10049/12384 [21:20:39<4:59:49, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 81%|████████ | 10050/12384 [21:20:39<5:01:29, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 81%|████████ | 10050/12384 [21:20:46<5:01:29, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 81%|████████ | 10051/12384 [21:20:46<5:01:15, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 81%|████████ | 10051/12384 [21:20:54<5:01:15, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 2: 81%|████████ | 10052/12384 [21:20:54<5:00:00, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.76s]
Epoch 2: 81%|████████ | 10052/12384 [21:21:02<5:00:00, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.65s]
Epoch 2: 81%|████████ | 10053/12384 [21:21:02<4:59:53, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.65s]
Epoch 2: 81%|████████ | 10053/12384 [21:21:09<4:59:53, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 81%|████████ | 10054/12384 [21:21:09<4:59:58, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 81%|████████ | 10054/12384 [21:21:17<4:59:58, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=4.41s]
Epoch 2: 81%|████████ | 10055/12384 [21:21:17<4:59:34, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=4.41s]
Epoch 2: 81%|████████ | 10055/12384 [21:21:25<4:59:34, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=11.47s]
Epoch 2: 81%|████████ | 10056/12384 [21:21:25<4:59:51, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=11.47s]
Epoch 2: 81%|████████ | 10056/12384 [21:21:33<4:59:51, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=5.00s]
Epoch 2: 81%|████████ | 10057/12384 [21:21:33<4:59:30, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.00s]
Epoch 2: 81%|████████ | 10057/12384 [21:21:40<4:59:30, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.01s]
Epoch 2: 81%|████████ | 10058/12384 [21:21:40<4:58:47, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.01s]
Epoch 2: 81%|████████ | 10058/12384 [21:21:48<4:58:47, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 81%|████████ | 10059/12384 [21:21:48<4:58:34, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 81%|████████ | 10059/12384 [21:21:56<4:58:34, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=6.02s]
Epoch 2: 81%|████████ | 10060/12384 [21:21:56<4:58:23, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.02s]
Epoch 2: 81%|████████ | 10060/12384 [21:22:03<4:58:23, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 2: 81%|████████ | 10061/12384 [21:22:03<4:58:26, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.81s]
Epoch 2: 81%|████████ | 10061/12384 [21:22:11<4:58:26, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.10s]
Epoch 2: 81%|████████▏ | 10062/12384 [21:22:11<4:58:37, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.10s]
Epoch 2: 81%|████████▏ | 10062/12384 [21:22:19<4:58:37, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 2: 81%|████████▏ | 10063/12384 [21:22:19<4:58:36, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.08s]
Epoch 2: 81%|████████▏ | 10063/12384 [21:22:27<4:58:36, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.49s]
Epoch 2: 81%|████████▏ | 10064/12384 [21:22:27<4:58:06, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=10.49s]
Epoch 2: 81%|████████▏ | 10064/12384 [21:22:34<4:58:06, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 2: 81%|████████▏ | 10065/12384 [21:22:34<4:58:25, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 2: 81%|████████▏ | 10065/12384 [21:22:42<4:58:25, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.82s]
Epoch 2: 81%|████████▏ | 10066/12384 [21:22:42<4:58:46, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.82s]
Epoch 2: 81%|████████▏ | 10066/12384 [21:22:50<4:58:46, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=5.63s]
Epoch 2: 81%|████████▏ | 10067/12384 [21:22:50<4:58:11, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.63s]
Epoch 2: 81%|████████▏ | 10067/12384 [21:22:58<4:58:11, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=6.05s]
Epoch 2: 81%|████████▏ | 10068/12384 [21:22:58<4:59:17, 7.75s/it, loss=0.0001, acc=1.0000, iter_time=6.05s]
Epoch 2: 81%|████████▏ | 10068/12384 [21:23:06<4:59:17, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=11.57s]
Epoch 2: 81%|████████▏ | 10069/12384 [21:23:06<5:02:45, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=11.57s]
Epoch 2: 81%|████████▏ | 10069/12384 [21:23:13<5:02:45, 7.85s/it, loss=0.0000, acc=1.0000, iter_time=5.13s]
Epoch 2: 81%|████████▏ | 10070/12384 [21:23:13<5:00:56, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=5.13s]
Epoch 2: 81%|████████▏ | 10070/12384 [21:23:21<5:00:56, 7.80s/it, loss=0.0000, acc=1.0000, iter_time=10.54s]
Epoch 2: 81%|████████▏ | 10071/12384 [21:23:21<4:58:40, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=10.54s]
Epoch 2: 81%|████████▏ | 10071/12384 [21:23:29<4:58:40, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 81%|████████▏ | 10072/12384 [21:23:29<4:57:28, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 81%|████████▏ | 10072/12384 [21:23:36<4:57:28, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 81%|████████▏ | 10073/12384 [21:23:36<4:56:10, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.26s]
Epoch 2: 81%|████████▏ | 10073/12384 [21:23:44<4:56:10, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 81%|████████▏ | 10074/12384 [21:23:44<4:54:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 81%|████████▏ | 10074/12384 [21:23:51<4:54:57, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 2: 81%|████████▏ | 10075/12384 [21:23:51<4:54:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.08s]
Epoch 2: 81%|████████▏ | 10075/12384 [21:23:59<4:54:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 2: 81%|████████▏ | 10076/12384 [21:23:59<4:54:40, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 2: 81%|████████▏ | 10076/12384 [21:24:07<4:54:40, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 81%|████████▏ | 10077/12384 [21:24:07<4:53:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 81%|████████▏ | 10077/12384 [21:24:14<4:53:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.01s]
Epoch 2: 81%|████████▏ | 10078/12384 [21:24:14<4:54:36, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=6.01s]
Epoch 2: 81%|████████▏ | 10078/12384 [21:24:22<4:54:36, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 2: 81%|████████▏ | 10079/12384 [21:24:22<4:53:58, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.13s]
Epoch 2: 81%|████████▏ | 10079/12384 [21:24:30<4:53:58, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 81%|████████▏ | 10080/12384 [21:24:30<4:53:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 81%|████████▏ | 10080/12384 [21:24:37<4:53:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 81%|████████▏ | 10081/12384 [21:24:37<4:52:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 81%|████████▏ | 10081/12384 [21:24:45<4:52:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 2: 81%|████████▏ | 10082/12384 [21:24:45<4:52:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 2: 81%|████████▏ | 10082/12384 [21:24:53<4:52:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 2: 81%|████████▏ | 10083/12384 [21:24:53<4:55:43, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.50s]
Epoch 2: 81%|████████▏ | 10083/12384 [21:25:00<4:55:43, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 81%|████████▏ | 10084/12384 [21:25:00<4:54:21, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 81%|████████▏ | 10084/12384 [21:25:08<4:54:21, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.01s]
Epoch 2: 81%|████████▏ | 10085/12384 [21:25:08<4:53:34, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.01s]
Epoch 2: 81%|████████▏ | 10085/12384 [21:25:16<4:53:34, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=11.23s]
Epoch 2: 81%|████████▏ | 10086/12384 [21:25:16<4:53:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.23s]
Epoch 2: 81%|████████▏ | 10086/12384 [21:25:23<4:53:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.00s]
Epoch 2: 81%|████████▏ | 10087/12384 [21:25:23<4:53:25, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.00s]
Epoch 2: 81%|████████▏ | 10087/12384 [21:25:31<4:53:25, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=11.70s]
Epoch 2: 81%|████████▏ | 10088/12384 [21:25:31<4:53:27, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=11.70s]
Epoch 2: 81%|████████▏ | 10088/12384 [21:25:39<4:53:27, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 81%|████████▏ | 10089/12384 [21:25:39<4:52:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 81%|████████▏ | 10089/12384 [21:25:46<4:52:36, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 81%|████████▏ | 10090/12384 [21:25:46<4:51:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 81%|████████▏ | 10090/12384 [21:25:54<4:51:51, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 81%|████████▏ | 10091/12384 [21:25:54<4:51:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 81%|████████▏ | 10091/12384 [21:26:01<4:51:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 81%|████████▏ | 10092/12384 [21:26:01<4:51:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 81%|████████▏ | 10092/12384 [21:26:09<4:51:11, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 82%|████████▏ | 10093/12384 [21:26:09<4:51:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 82%|████████▏ | 10093/12384 [21:26:17<4:51:01, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 82%|████████▏ | 10094/12384 [21:26:17<4:50:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 82%|████████▏ | 10094/12384 [21:26:24<4:50:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 2: 82%|████████▏ | 10095/12384 [21:26:24<4:50:21, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.06s]
Epoch 2: 82%|████████▏ | 10095/12384 [21:26:32<4:50:21, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=8.43s]
Epoch 2: 82%|████████▏ | 10096/12384 [21:26:32<4:54:03, 7.71s/it, loss=0.0002, acc=1.0000, iter_time=8.43s]
Epoch 2: 82%|████████▏ | 10096/12384 [21:26:40<4:54:03, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 2: 82%|████████▏ | 10097/12384 [21:26:40<4:53:29, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 2: 82%|████████▏ | 10097/12384 [21:26:48<4:53:29, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 82%|████████▏ | 10098/12384 [21:26:48<4:52:17, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 82%|████████▏ | 10098/12384 [21:26:55<4:52:17, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 82%|████████▏ | 10099/12384 [21:26:55<4:52:23, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 82%|████████▏ | 10099/12384 [21:27:03<4:52:23, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 82%|████████▏ | 10100/12384 [21:27:03<4:51:42, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.68s]
Epoch 2: 82%|████████▏ | 10100/12384 [21:27:10<4:51:42, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 2: 82%|████████▏ | 10101/12384 [21:27:10<4:51:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 2: 82%|████████▏ | 10101/12384 [21:27:18<4:51:12, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 82%|████████▏ | 10102/12384 [21:27:18<4:50:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 82%|████████▏ | 10102/12384 [21:27:26<4:50:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 82%|████████▏ | 10103/12384 [21:27:26<4:50:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 82%|████████▏ | 10103/12384 [21:27:33<4:50:22, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 82%|████████▏ | 10104/12384 [21:27:33<4:49:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 82%|████████▏ | 10104/12384 [21:27:41<4:49:58, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 82%|████████▏ | 10105/12384 [21:27:41<4:49:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.23s]
Epoch 2: 82%|████████▏ | 10105/12384 [21:27:49<4:49:44, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 2: 82%|████████▏ | 10106/12384 [21:27:49<4:49:27, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 2: 82%|████████▏ | 10106/12384 [21:27:56<4:49:27, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 2: 82%|████████▏ | 10107/12384 [21:27:56<4:49:22, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 2: 82%|████████▏ | 10107/12384 [21:28:04<4:49:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 2: 82%|████████▏ | 10108/12384 [21:28:04<4:50:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.74s]
Epoch 2: 82%|████████▏ | 10108/12384 [21:28:12<4:50:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 82%|████████▏ | 10109/12384 [21:28:12<4:49:56, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 82%|████████▏ | 10109/12384 [21:28:19<4:49:56, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.91s]
Epoch 2: 82%|████████▏ | 10110/12384 [21:28:19<4:52:33, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=7.91s]
Epoch 2: 82%|████████▏ | 10110/12384 [21:28:27<4:52:33, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 82%|████████▏ | 10111/12384 [21:28:27<4:51:18, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.67s]
Epoch 2: 82%|████████▏ | 10111/12384 [21:28:35<4:51:18, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.93s]
Epoch 2: 82%|████████▏ | 10112/12384 [21:28:35<4:50:28, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.93s]
Epoch 2: 82%|████████▏ | 10112/12384 [21:28:42<4:50:28, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 82%|████████▏ | 10113/12384 [21:28:42<4:49:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 82%|████████▏ | 10113/12384 [21:28:50<4:49:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 82%|████████▏ | 10114/12384 [21:28:50<4:49:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 82%|████████▏ | 10114/12384 [21:28:58<4:49:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 82%|████████▏ | 10115/12384 [21:28:58<4:48:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 82%|████████▏ | 10115/12384 [21:29:05<4:48:49, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.37s]
Epoch 2: 82%|████████▏ | 10116/12384 [21:29:05<4:48:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.37s]
Epoch 2: 82%|████████▏ | 10116/12384 [21:29:13<4:48:28, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 2: 82%|████████▏ | 10117/12384 [21:29:13<4:48:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.88s]
Epoch 2: 82%|████████▏ | 10117/12384 [21:29:20<4:48:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 82%|████████▏ | 10118/12384 [21:29:20<4:48:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 82%|████████▏ | 10118/12384 [21:29:28<4:48:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 82%|████████▏ | 10119/12384 [21:29:28<4:48:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 82%|████████▏ | 10119/12384 [21:29:36<4:48:07, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 82%|████████▏ | 10120/12384 [21:29:36<4:47:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.56s]
Epoch 2: 82%|████████▏ | 10120/12384 [21:29:43<4:47:40, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 2: 82%|████████▏ | 10121/12384 [21:29:43<4:47:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 2: 82%|████████▏ | 10121/12384 [21:29:51<4:47:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.44s]
Epoch 2: 82%|████████▏ | 10122/12384 [21:29:51<4:50:56, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.44s]
Epoch 2: 82%|████████▏ | 10122/12384 [21:29:59<4:50:56, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.62s]
Epoch 2: 82%|████████▏ | 10123/12384 [21:29:59<4:49:13, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.62s]
Epoch 2: 82%|████████▏ | 10123/12384 [21:30:06<4:49:13, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 2: 82%|████████▏ | 10124/12384 [21:30:06<4:48:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 2: 82%|████████▏ | 10124/12384 [21:30:14<4:48:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 2: 82%|████████▏ | 10125/12384 [21:30:14<4:47:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 2: 82%|████████▏ | 10125/12384 [21:30:22<4:47:34, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=9.01s]
Epoch 2: 82%|████████▏ | 10126/12384 [21:30:22<4:47:49, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=9.01s]
Epoch 2: 82%|████████▏ | 10126/12384 [21:30:29<4:47:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 2: 82%|████████▏ | 10127/12384 [21:30:29<4:48:34, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.78s]
Epoch 2: 82%|████████▏ | 10127/12384 [21:30:37<4:48:34, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 82%|████████▏ | 10128/12384 [21:30:37<4:47:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 82%|████████▏ | 10128/12384 [21:30:45<4:47:48, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 82%|████████▏ | 10129/12384 [21:30:45<4:47:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 82%|████████▏ | 10129/12384 [21:30:52<4:47:02, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 82%|████████▏ | 10130/12384 [21:30:52<4:46:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 82%|████████▏ | 10130/12384 [21:31:00<4:46:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 82%|████████▏ | 10131/12384 [21:31:00<4:46:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 82%|████████▏ | 10131/12384 [21:31:08<4:46:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 2: 82%|████████▏ | 10132/12384 [21:31:08<4:46:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 2: 82%|████████▏ | 10132/12384 [21:31:15<4:46:29, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 2: 82%|████████▏ | 10133/12384 [21:31:15<4:46:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 2: 82%|████████▏ | 10133/12384 [21:31:23<4:46:18, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=8.57s]
Epoch 2: 82%|████████▏ | 10134/12384 [21:31:23<4:46:55, 7.65s/it, loss=0.0001, acc=0.9998, iter_time=8.57s]
Epoch 2: 82%|████████▏ | 10134/12384 [21:31:30<4:46:55, 7.65s/it, loss=0.0002, acc=0.9992, iter_time=7.70s]
Epoch 2: 82%|████████▏ | 10135/12384 [21:31:30<4:46:17, 7.64s/it, loss=0.0002, acc=0.9992, iter_time=7.70s]
Epoch 2: 82%|████████▏ | 10135/12384 [21:31:38<4:46:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 82%|████████▏ | 10136/12384 [21:31:38<4:45:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 82%|████████▏ | 10136/12384 [21:31:46<4:45:46, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.87s]
Epoch 2: 82%|████████▏ | 10137/12384 [21:31:46<4:45:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.87s]
Epoch 2: 82%|████████▏ | 10137/12384 [21:31:53<4:45:13, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 2: 82%|████████▏ | 10138/12384 [21:31:53<4:44:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.34s]
Epoch 2: 82%|████████▏ | 10138/12384 [21:32:01<4:44:56, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 2: 82%|████████▏ | 10139/12384 [21:32:01<4:45:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.21s]
Epoch 2: 82%|████████▏ | 10139/12384 [21:32:08<4:45:14, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.46s]
Epoch 2: 82%|████████▏ | 10140/12384 [21:32:08<4:44:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=3.46s]
Epoch 2: 82%|████████▏ | 10140/12384 [21:32:16<4:44:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=11.79s]
Epoch 2: 82%|████████▏ | 10141/12384 [21:32:16<4:44:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.79s]
Epoch 2: 82%|████████▏ | 10141/12384 [21:32:24<4:44:33, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 2: 82%|████████▏ | 10142/12384 [21:32:24<4:44:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.07s]
Epoch 2: 82%|████████▏ | 10142/12384 [21:32:31<4:44:28, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.35s]
Epoch 2: 82%|████████▏ | 10143/12384 [21:32:31<4:44:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.35s]
Epoch 2: 82%|████████▏ | 10143/12384 [21:32:39<4:44:28, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.80s]
Epoch 2: 82%|████████▏ | 10144/12384 [21:32:39<4:44:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.80s]
Epoch 2: 82%|████████▏ | 10144/12384 [21:32:47<4:44:10, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 82%|████████▏ | 10145/12384 [21:32:47<4:43:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.22s]
Epoch 2: 82%|████████▏ | 10145/12384 [21:32:54<4:43:59, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 82%|████████▏ | 10146/12384 [21:32:54<4:44:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 82%|████████▏ | 10146/12384 [21:33:02<4:44:26, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 2: 82%|████████▏ | 10147/12384 [21:33:02<4:45:01, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.72s]
Epoch 2: 82%|████████▏ | 10147/12384 [21:33:10<4:45:01, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 2: 82%|████████▏ | 10148/12384 [21:33:10<4:44:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.31s]
Epoch 2: 82%|████████▏ | 10148/12384 [21:33:17<4:44:34, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.95s]
Epoch 2: 82%|████████▏ | 10149/12384 [21:33:17<4:47:56, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=9.95s]
Epoch 2: 82%|████████▏ | 10149/12384 [21:33:25<4:47:56, 7.73s/it, loss=0.0002, acc=1.0000, iter_time=7.90s]
Epoch 2: 82%|████████▏ | 10150/12384 [21:33:25<4:47:18, 7.72s/it, loss=0.0002, acc=1.0000, iter_time=7.90s]
Epoch 2: 82%|████████▏ | 10150/12384 [21:33:33<4:47:18, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 82%|████████▏ | 10151/12384 [21:33:33<4:46:17, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 82%|████████▏ | 10151/12384 [21:33:40<4:46:17, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 82%|████████▏ | 10152/12384 [21:33:40<4:45:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 82%|████████▏ | 10152/12384 [21:33:48<4:45:05, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=4.61s]
Epoch 2: 82%|████████▏ | 10153/12384 [21:33:48<4:45:24, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=4.61s]
Epoch 2: 82%|████████▏ | 10153/12384 [21:33:56<4:45:24, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 2: 82%|████████▏ | 10154/12384 [21:33:56<4:44:25, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.21s]
Epoch 2: 82%|████████▏ | 10154/12384 [21:34:03<4:44:25, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 2: 82%|████████▏ | 10155/12384 [21:34:03<4:43:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.69s]
Epoch 2: 82%|████████▏ | 10155/12384 [21:34:11<4:43:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.63s]
Epoch 2: 82%|████████▏ | 10156/12384 [21:34:11<4:43:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.63s]
Epoch 2: 82%|████████▏ | 10156/12384 [21:34:19<4:43:11, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.58s]
Epoch 2: 82%|████████▏ | 10157/12384 [21:34:19<4:43:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.58s]
Epoch 2: 82%|████████▏ | 10157/12384 [21:34:26<4:43:39, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 2: 82%|████████▏ | 10158/12384 [21:34:26<4:43:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.49s]
Epoch 2: 82%|████████▏ | 10158/12384 [21:34:34<4:43:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 2: 82%|████████▏ | 10159/12384 [21:34:34<4:42:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 2: 82%|████████▏ | 10159/12384 [21:34:41<4:42:44, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 82%|████████▏ | 10160/12384 [21:34:41<4:43:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.99s]
Epoch 2: 82%|████████▏ | 10160/12384 [21:34:49<4:43:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 82%|████████▏ | 10161/12384 [21:34:49<4:42:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.31s]
Epoch 2: 82%|████████▏ | 10161/12384 [21:34:57<4:42:53, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 82%|████████▏ | 10162/12384 [21:34:57<4:42:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 2: 82%|████████▏ | 10162/12384 [21:35:04<4:42:37, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.71s]
Epoch 2: 82%|████████▏ | 10163/12384 [21:35:04<4:42:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=3.71s]
Epoch 2: 82%|████████▏ | 10163/12384 [21:35:12<4:42:24, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.51s]
Epoch 2: 82%|████████▏ | 10164/12384 [21:35:12<4:42:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.51s]
Epoch 2: 82%|████████▏ | 10164/12384 [21:35:20<4:42:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 82%|████████▏ | 10165/12384 [21:35:20<4:42:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 82%|████████▏ | 10165/12384 [21:35:27<4:42:26, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 82%|████████▏ | 10166/12384 [21:35:27<4:42:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 82%|████████▏ | 10166/12384 [21:35:35<4:42:03, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 2: 82%|████████▏ | 10167/12384 [21:35:35<4:41:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.58s]
Epoch 2: 82%|████████▏ | 10167/12384 [21:35:43<4:41:56, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=11.22s]
Epoch 2: 82%|████████▏ | 10168/12384 [21:35:43<4:43:39, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=11.22s]
Epoch 2: 82%|████████▏ | 10168/12384 [21:35:50<4:43:39, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 2: 82%|████████▏ | 10169/12384 [21:35:50<4:44:37, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.40s]
Epoch 2: 82%|████████▏ | 10169/12384 [21:35:58<4:44:37, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 82%|████████▏ | 10170/12384 [21:35:58<4:43:54, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 82%|████████▏ | 10170/12384 [21:36:06<4:43:54, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.29s]
Epoch 2: 82%|████████▏ | 10171/12384 [21:36:06<4:43:57, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.29s]
Epoch 2: 82%|████████▏ | 10171/12384 [21:36:14<4:43:57, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 2: 82%|████████▏ | 10172/12384 [21:36:14<4:43:56, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.07s]
Epoch 2: 82%|████████▏ | 10172/12384 [21:36:21<4:43:56, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 82%|████████▏ | 10173/12384 [21:36:21<4:43:41, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 82%|████████▏ | 10173/12384 [21:36:29<4:43:41, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 82%|████████▏ | 10174/12384 [21:36:29<4:43:01, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 82%|████████▏ | 10174/12384 [21:36:37<4:43:01, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 82%|████████▏ | 10175/12384 [21:36:37<4:45:56, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 82%|████████▏ | 10175/12384 [21:36:44<4:45:56, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 82%|████████▏ | 10176/12384 [21:36:44<4:44:13, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.87s]
Epoch 2: 82%|████████▏ | 10176/12384 [21:36:52<4:44:13, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 2: 82%|████████▏ | 10177/12384 [21:36:52<4:42:57, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.41s]
Epoch 2: 82%|████████▏ | 10177/12384 [21:37:00<4:42:57, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.87s]
Epoch 2: 82%|████████▏ | 10178/12384 [21:37:00<4:41:49, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.87s]
Epoch 2: 82%|████████▏ | 10178/12384 [21:37:07<4:41:49, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 82%|████████▏ | 10179/12384 [21:37:07<4:41:03, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.59s]
Epoch 2: 82%|████████▏ | 10179/12384 [21:37:15<4:41:03, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 2: 82%|████████▏ | 10180/12384 [21:37:15<4:40:30, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 2: 82%|████████▏ | 10180/12384 [21:37:22<4:40:30, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 82%|████████▏ | 10181/12384 [21:37:22<4:40:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 82%|████████▏ | 10181/12384 [21:37:30<4:40:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 82%|████████▏ | 10182/12384 [21:37:30<4:39:47, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 2: 82%|████████▏ | 10182/12384 [21:37:38<4:39:47, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.19s]
Epoch 2: 82%|████████▏ | 10183/12384 [21:37:38<4:39:15, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.19s]
Epoch 2: 82%|████████▏ | 10183/12384 [21:37:45<4:39:15, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 82%|████████▏ | 10184/12384 [21:37:45<4:39:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 82%|████████▏ | 10184/12384 [21:37:53<4:39:03, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 82%|████████▏ | 10185/12384 [21:37:53<4:39:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 82%|████████▏ | 10185/12384 [21:38:01<4:39:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 2: 82%|████████▏ | 10186/12384 [21:38:01<4:39:03, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 2: 82%|████████▏ | 10186/12384 [21:38:08<4:39:03, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.91s]
Epoch 2: 82%|████████▏ | 10187/12384 [21:38:08<4:39:05, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.91s]
Epoch 2: 82%|████████▏ | 10187/12384 [21:38:16<4:39:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 2: 82%|████████▏ | 10188/12384 [21:38:16<4:39:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.84s]
Epoch 2: 82%|████████▏ | 10188/12384 [21:38:24<4:39:44, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 82%|████████▏ | 10189/12384 [21:38:24<4:42:15, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 82%|████████▏ | 10189/12384 [21:38:31<4:42:15, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 82%|████████▏ | 10190/12384 [21:38:31<4:41:12, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 82%|████████▏ | 10190/12384 [21:38:39<4:41:12, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 82%|████████▏ | 10191/12384 [21:38:39<4:40:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 82%|████████▏ | 10191/12384 [21:38:47<4:40:03, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 82%|████████▏ | 10192/12384 [21:38:47<4:39:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 82%|████████▏ | 10192/12384 [21:38:54<4:39:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 2: 82%|████████▏ | 10193/12384 [21:38:54<4:38:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.44s]
Epoch 2: 82%|████████▏ | 10193/12384 [21:39:02<4:38:48, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 2: 82%|████████▏ | 10194/12384 [21:39:02<4:38:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.82s]
Epoch 2: 82%|████████▏ | 10194/12384 [21:39:09<4:38:31, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 2: 82%|████████▏ | 10195/12384 [21:39:09<4:38:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.42s]
Epoch 2: 82%|████████▏ | 10195/12384 [21:39:17<4:38:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 2: 82%|████████▏ | 10196/12384 [21:39:17<4:37:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.83s]
Epoch 2: 82%|████████▏ | 10196/12384 [21:39:25<4:37:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 82%|████████▏ | 10197/12384 [21:39:25<4:37:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 82%|████████▏ | 10197/12384 [21:39:32<4:37:42, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 82%|████████▏ | 10198/12384 [21:39:32<4:38:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 82%|████████▏ | 10198/12384 [21:39:40<4:38:02, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 82%|████████▏ | 10199/12384 [21:39:40<4:37:52, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 82%|████████▏ | 10199/12384 [21:39:48<4:37:52, 7.63s/it, loss=0.0003, acc=0.9985, iter_time=8.02s]
Epoch 2: 82%|████████▏ | 10200/12384 [21:39:48<4:37:47, 7.63s/it, loss=0.0003, acc=0.9985, iter_time=8.02s]
Epoch 2: 82%|████████▏ | 10200/12384 [21:39:56<4:37:47, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 82%|████████▏ | 10201/12384 [21:39:56<4:41:13, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.29s]
Epoch 2: 82%|████████▏ | 10201/12384 [21:40:03<4:41:13, 7.73s/it, loss=0.0001, acc=1.0000, iter_time=7.93s]
Epoch 2: 82%|████████▏ | 10202/12384 [21:40:03<4:39:54, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.93s]
Epoch 2: 82%|████████▏ | 10202/12384 [21:40:11<4:39:54, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 2: 82%|████████▏ | 10203/12384 [21:40:11<4:38:28, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 2: 82%|████████▏ | 10203/12384 [21:40:18<4:38:28, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.31s]
Epoch 2: 82%|████████▏ | 10204/12384 [21:40:18<4:37:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.31s]
Epoch 2: 82%|████████▏ | 10204/12384 [21:40:26<4:37:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 82%|████████▏ | 10205/12384 [21:40:26<4:37:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 82%|████████▏ | 10205/12384 [21:40:34<4:37:09, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 2: 82%|████████▏ | 10206/12384 [21:40:34<4:37:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.98s]
Epoch 2: 82%|████████▏ | 10206/12384 [21:40:41<4:37:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 2: 82%|████████▏ | 10207/12384 [21:40:41<4:36:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.26s]
Epoch 2: 82%|████████▏ | 10207/12384 [21:40:49<4:36:49, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 82%|████████▏ | 10208/12384 [21:40:49<4:36:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.57s]
Epoch 2: 82%|████████▏ | 10208/12384 [21:40:56<4:36:29, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 82%|████████▏ | 10209/12384 [21:40:56<4:36:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 82%|████████▏ | 10209/12384 [21:41:04<4:36:10, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 2: 82%|████████▏ | 10210/12384 [21:41:04<4:35:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.56s]
Epoch 2: 82%|████████▏ | 10210/12384 [21:41:12<4:35:42, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.63s]
Epoch 2: 82%|████████▏ | 10211/12384 [21:41:12<4:35:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.63s]
Epoch 2: 82%|████████▏ | 10211/12384 [21:41:19<4:35:30, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 2: 82%|████████▏ | 10212/12384 [21:41:19<4:35:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=5.52s]
Epoch 2: 82%|████████▏ | 10212/12384 [21:41:27<4:35:37, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 2: 82%|████████▏ | 10213/12384 [21:41:27<4:35:07, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.40s]
Epoch 2: 82%|████████▏ | 10213/12384 [21:41:34<4:35:07, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 82%|████████▏ | 10214/12384 [21:41:34<4:34:53, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 82%|████████▏ | 10214/12384 [21:41:42<4:34:53, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 82%|████████▏ | 10215/12384 [21:41:42<4:37:59, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.90s]
Epoch 2: 82%|████████▏ | 10215/12384 [21:41:50<4:37:59, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 82%|████████▏ | 10216/12384 [21:41:50<4:36:56, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 2: 82%|████████▏ | 10216/12384 [21:41:58<4:36:56, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 83%|████████▎ | 10217/12384 [21:41:58<4:37:20, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.32s]
Epoch 2: 83%|████████▎ | 10217/12384 [21:42:05<4:37:20, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 83%|████████▎ | 10218/12384 [21:42:05<4:36:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 83%|████████▎ | 10218/12384 [21:42:13<4:36:11, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 83%|████████▎ | 10219/12384 [21:42:13<4:35:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 83%|████████▎ | 10219/12384 [21:42:20<4:35:36, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 2: 83%|████████▎ | 10220/12384 [21:42:20<4:34:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.08s]
Epoch 2: 83%|████████▎ | 10220/12384 [21:42:28<4:34:54, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.99s]
Epoch 2: 83%|████████▎ | 10221/12384 [21:42:28<4:34:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.99s]
Epoch 2: 83%|████████▎ | 10221/12384 [21:42:36<4:34:34, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 83%|████████▎ | 10222/12384 [21:42:36<4:34:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 83%|████████▎ | 10222/12384 [21:42:43<4:34:24, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 2: 83%|████████▎ | 10223/12384 [21:42:43<4:34:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=10.18s]
Epoch 2: 83%|████████▎ | 10223/12384 [21:42:51<4:34:13, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 83%|████████▎ | 10224/12384 [21:42:51<4:34:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 83%|████████▎ | 10224/12384 [21:42:59<4:34:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 2: 83%|████████▎ | 10225/12384 [21:42:59<4:34:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.27s]
Epoch 2: 83%|████████▎ | 10225/12384 [21:43:06<4:34:42, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.00s]
Epoch 2: 83%|████████▎ | 10226/12384 [21:43:06<4:34:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.00s]
Epoch 2: 83%|████████▎ | 10226/12384 [21:43:14<4:34:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=10.79s]
Epoch 2: 83%|████████▎ | 10227/12384 [21:43:14<4:39:02, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=10.79s]
Epoch 2: 83%|████████▎ | 10227/12384 [21:43:22<4:39:02, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 83%|████████▎ | 10228/12384 [21:43:22<4:37:55, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 83%|████████▎ | 10228/12384 [21:43:30<4:37:55, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 83%|████████▎ | 10229/12384 [21:43:30<4:37:41, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 83%|████████▎ | 10229/12384 [21:43:37<4:37:41, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 83%|████████▎ | 10230/12384 [21:43:37<4:37:03, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.69s]
Epoch 2: 83%|████████▎ | 10230/12384 [21:43:45<4:37:03, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 83%|████████▎ | 10231/12384 [21:43:45<4:36:39, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 83%|████████▎ | 10231/12384 [21:43:53<4:36:39, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 2: 83%|████████▎ | 10232/12384 [21:43:53<4:39:05, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=8.16s]
Epoch 2: 83%|████████▎ | 10232/12384 [21:44:01<4:39:05, 7.78s/it, loss=0.0000, acc=1.0000, iter_time=3.13s]
Epoch 2: 83%|████████▎ | 10233/12384 [21:44:01<4:37:33, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=3.13s]
Epoch 2: 83%|████████▎ | 10233/12384 [21:44:08<4:37:33, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=10.72s]
Epoch 2: 83%|████████▎ | 10234/12384 [21:44:08<4:35:52, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=10.72s]
Epoch 2: 83%|████████▎ | 10234/12384 [21:44:16<4:35:52, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 2: 83%|████████▎ | 10235/12384 [21:44:16<4:34:56, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.81s]
Epoch 2: 83%|████████▎ | 10235/12384 [21:44:23<4:34:56, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 83%|████████▎ | 10236/12384 [21:44:23<4:34:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 83%|████████▎ | 10236/12384 [21:44:31<4:34:19, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 83%|████████▎ | 10237/12384 [21:44:31<4:34:00, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 83%|████████▎ | 10237/12384 [21:44:39<4:34:00, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 83%|████████▎ | 10238/12384 [21:44:39<4:33:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 83%|████████▎ | 10238/12384 [21:44:46<4:33:13, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 83%|████████▎ | 10239/12384 [21:44:46<4:32:41, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 83%|████████▎ | 10239/12384 [21:44:54<4:32:41, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.98s]
Epoch 2: 83%|████████▎ | 10240/12384 [21:44:54<4:32:21, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.98s]
Epoch 2: 83%|████████▎ | 10240/12384 [21:45:02<4:32:21, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 83%|████████▎ | 10241/12384 [21:45:02<4:32:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.24s]
Epoch 2: 83%|████████▎ | 10241/12384 [21:45:09<4:32:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 83%|████████▎ | 10242/12384 [21:45:09<4:35:12, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 83%|████████▎ | 10242/12384 [21:45:17<4:35:12, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 83%|████████▎ | 10243/12384 [21:45:17<4:35:04, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 83%|████████▎ | 10243/12384 [21:45:25<4:35:04, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 83%|████████▎ | 10244/12384 [21:45:25<4:35:07, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 83%|████████▎ | 10244/12384 [21:45:33<4:35:07, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 83%|████████▎ | 10245/12384 [21:45:33<4:34:57, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.73s]
Epoch 2: 83%|████████▎ | 10245/12384 [21:45:40<4:34:57, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=2.96s]
Epoch 2: 83%|████████▎ | 10246/12384 [21:45:40<4:33:45, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=2.96s]
Epoch 2: 83%|████████▎ | 10246/12384 [21:45:48<4:33:45, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=12.01s]
Epoch 2: 83%|████████▎ | 10247/12384 [21:45:48<4:33:05, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=12.01s]
Epoch 2: 83%|████████▎ | 10247/12384 [21:45:55<4:33:05, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.33s]
Epoch 2: 83%|████████▎ | 10248/12384 [21:45:55<4:32:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.33s]
Epoch 2: 83%|████████▎ | 10248/12384 [21:46:03<4:32:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=3.72s]
Epoch 2: 83%|████████▎ | 10249/12384 [21:46:03<4:32:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=3.72s]
Epoch 2: 83%|████████▎ | 10249/12384 [21:46:11<4:32:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.17s]
Epoch 2: 83%|████████▎ | 10250/12384 [21:46:11<4:31:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.17s]
Epoch 2: 83%|████████▎ | 10250/12384 [21:46:18<4:31:55, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 2: 83%|████████▎ | 10251/12384 [21:46:18<4:31:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.53s]
Epoch 2: 83%|████████▎ | 10251/12384 [21:46:26<4:31:38, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 2: 83%|████████▎ | 10252/12384 [21:46:26<4:31:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.74s]
Epoch 2: 83%|████████▎ | 10252/12384 [21:46:34<4:31:28, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 83%|████████▎ | 10253/12384 [21:46:34<4:37:12, 7.81s/it, loss=0.0000, acc=1.0000, iter_time=7.88s]
Epoch 2: 83%|████████▎ | 10253/12384 [21:46:44<4:37:12, 7.81s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 83%|████████▎ | 10254/12384 [21:46:44<4:55:23, 8.32s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 2: 83%|████████▎ | 10254/12384 [21:46:53<4:55:23, 8.32s/it, loss=0.0001, acc=1.0000, iter_time=11.40s]
Epoch 2: 83%|████████▎ | 10255/12384 [21:46:53<5:05:24, 8.61s/it, loss=0.0001, acc=1.0000, iter_time=11.40s]
Epoch 2: 83%|████████▎ | 10255/12384 [21:47:04<5:05:24, 8.61s/it, loss=0.0000, acc=1.0000, iter_time=11.50s]
Epoch 2: 83%|████████▎ | 10256/12384 [21:47:04<5:32:51, 9.38s/it, loss=0.0000, acc=1.0000, iter_time=11.50s]
Epoch 2: 83%|████████▎ | 10256/12384 [21:47:18<5:32:51, 9.38s/it, loss=0.0000, acc=1.0000, iter_time=13.00s]
Epoch 2: 83%|████████▎ | 10257/12384 [21:47:18<6:17:31, 10.65s/it, loss=0.0000, acc=1.0000, iter_time=13.00s]
Epoch 2: 83%|████████▎ | 10257/12384 [21:47:32<6:17:31, 10.65s/it, loss=0.0000, acc=1.0000, iter_time=14.00s]
Epoch 2: 83%|████████▎ | 10258/12384 [21:47:32<6:55:05, 11.71s/it, loss=0.0000, acc=1.0000, iter_time=14.00s]
Epoch 2: 83%|████████▎ | 10258/12384 [21:47:40<6:55:05, 11.71s/it, loss=0.0000, acc=1.0000, iter_time=8.75s]
Epoch 2: 83%|████████▎ | 10259/12384 [21:47:40<6:18:48, 10.70s/it, loss=0.0000, acc=1.0000, iter_time=8.75s]
Epoch 2: 83%|████████▎ | 10259/12384 [21:47:48<6:18:48, 10.70s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 2: 83%|████████▎ | 10260/12384 [21:47:48<5:46:37, 9.79s/it, loss=0.0000, acc=1.0000, iter_time=7.75s]
Epoch 2: 83%|████████▎ | 10260/12384 [21:47:56<5:46:37, 9.79s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 83%|████████▎ | 10261/12384 [21:47:56<5:23:46, 9.15s/it, loss=0.0000, acc=1.0000, iter_time=7.67s]
Epoch 2: 83%|████████▎ | 10261/12384 [21:48:03<5:23:46, 9.15s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 2: 83%|████████▎ | 10262/12384 [21:48:03<5:07:16, 8.69s/it, loss=0.0000, acc=1.0000, iter_time=6.69s]
Epoch 2: 83%|████████▎ | 10262/12384 [21:48:11<5:07:16, 8.69s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 2: 83%|████████▎ | 10263/12384 [21:48:11<4:56:07, 8.38s/it, loss=0.0000, acc=1.0000, iter_time=8.24s]
Epoch 2: 83%|████████▎ | 10263/12384 [21:48:19<4:56:07, 8.38s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 2: 83%|████████▎ | 10264/12384 [21:48:19<4:50:18, 8.22s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 2: 83%|████████▎ | 10264/12384 [21:48:26<4:50:18, 8.22s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 83%|████████▎ | 10265/12384 [21:48:26<4:43:49, 8.04s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 83%|████████▎ | 10265/12384 [21:48:34<4:43:49, 8.04s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 83%|████████▎ | 10266/12384 [21:48:34<4:39:10, 7.91s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 2: 83%|████████▎ | 10266/12384 [21:48:42<4:39:10, 7.91s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 2: 83%|████████▎ | 10267/12384 [21:48:42<4:36:44, 7.84s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 2: 83%|████████▎ | 10267/12384 [21:48:49<4:36:44, 7.84s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 2: 83%|████████▎ | 10268/12384 [21:48:49<4:34:05, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=9.42s]
Epoch 2: 83%|████████▎ | 10268/12384 [21:48:57<4:34:05, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 2: 83%|████████▎ | 10269/12384 [21:48:57<4:32:22, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=5.35s]
Epoch 2: 83%|████████▎ | 10269/12384 [21:49:04<4:32:22, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=9.86s]
Epoch 2: 83%|████████▎ | 10270/12384 [21:49:04<4:30:56, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.86s]
Epoch 2: 83%|████████▎ | 10270/12384 [21:49:12<4:30:56, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 83%|████████▎ | 10271/12384 [21:49:12<4:30:02, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 83%|████████▎ | 10271/12384 [21:49:20<4:30:02, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 83%|████████▎ | 10272/12384 [21:49:20<4:29:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.03s]
Epoch 2: 83%|████████▎ | 10272/12384 [21:49:27<4:29:29, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 83%|████████▎ | 10273/12384 [21:49:27<4:28:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.20s]
Epoch 2: 83%|████████▎ | 10273/12384 [21:49:35<4:28:30, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 83%|████████▎ | 10274/12384 [21:49:35<4:28:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 83%|████████▎ | 10274/12384 [21:49:43<4:28:07, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 83%|████████▎ | 10275/12384 [21:49:43<4:27:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 83%|████████▎ | 10275/12384 [21:49:50<4:27:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.75s]
Epoch 2: 83%|████████▎ | 10276/12384 [21:49:50<4:29:11, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.75s]
Epoch 2: 83%|████████▎ | 10276/12384 [21:49:59<4:29:11, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=10.80s]
Epoch 2: 83%|████████▎ | 10277/12384 [21:49:59<4:43:10, 8.06s/it, loss=0.0001, acc=1.0000, iter_time=10.80s]
Epoch 2: 83%|████████▎ | 10277/12384 [21:50:08<4:43:10, 8.06s/it, loss=0.0000, acc=1.0000, iter_time=9.21s]
Epoch 2: 83%|████████▎ | 10278/12384 [21:50:08<4:53:12, 8.35s/it, loss=0.0000, acc=1.0000, iter_time=9.21s]
Epoch 2: 83%|████████▎ | 10278/12384 [21:50:17<4:53:12, 8.35s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 83%|████████▎ | 10279/12384 [21:50:17<4:56:29, 8.45s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 2: 83%|████████▎ | 10279/12384 [21:50:26<4:56:29, 8.45s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 2: 83%|████████▎ | 10280/12384 [21:50:26<5:01:06, 8.59s/it, loss=0.0000, acc=1.0000, iter_time=9.73s]
Epoch 2: 83%|████████▎ | 10280/12384 [21:50:34<5:01:06, 8.59s/it, loss=0.0000, acc=1.0000, iter_time=8.48s]
Epoch 2: 83%|████████▎ | 10281/12384 [21:50:34<4:59:55, 8.56s/it, loss=0.0000, acc=1.0000, iter_time=8.48s]
Epoch 2: 83%|████████▎ | 10281/12384 [21:50:43<4:59:55, 8.56s/it, loss=0.0000, acc=1.0000, iter_time=8.91s]
Epoch 2: 83%|████████▎ | 10282/12384 [21:50:43<4:59:19, 8.54s/it, loss=0.0000, acc=1.0000, iter_time=8.91s]
Epoch 2: 83%|████████▎ | 10282/12384 [21:50:51<4:59:19, 8.54s/it, loss=0.0001, acc=1.0000, iter_time=8.10s]
Epoch 2: 83%|████████▎ | 10283/12384 [21:50:51<4:58:34, 8.53s/it, loss=0.0001, acc=1.0000, iter_time=8.10s]
Epoch 2: 83%|████████▎ | 10283/12384 [21:51:00<4:58:34, 8.53s/it, loss=0.0000, acc=1.0000, iter_time=5.89s]
Epoch 2: 83%|████████▎ | 10284/12384 [21:51:00<4:58:22, 8.53s/it, loss=0.0000, acc=1.0000, iter_time=5.89s]
Epoch 2: 83%|████████▎ | 10284/12384 [21:51:08<4:58:22, 8.53s/it, loss=0.0000, acc=1.0000, iter_time=10.77s]
Epoch 2: 83%|████████▎ | 10285/12384 [21:51:08<4:54:57, 8.43s/it, loss=0.0000, acc=1.0000, iter_time=10.77s]
Epoch 2: 83%|████████▎ | 10285/12384 [21:51:16<4:54:57, 8.43s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 2: 83%|████████▎ | 10286/12384 [21:51:16<4:46:12, 8.19s/it, loss=0.0000, acc=1.0000, iter_time=6.73s]
Epoch 2: 83%|████████▎ | 10286/12384 [21:51:23<4:46:12, 8.19s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 2: 83%|████████▎ | 10287/12384 [21:51:23<4:39:54, 8.01s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 2: 83%|████████▎ | 10287/12384 [21:51:31<4:39:54, 8.01s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 83%|████████▎ | 10288/12384 [21:51:31<4:35:45, 7.89s/it, loss=0.0000, acc=1.0000, iter_time=7.97s]
Epoch 2: 83%|████████▎ | 10288/12384 [21:51:39<4:35:45, 7.89s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 2: 83%|████████▎ | 10289/12384 [21:51:39<4:33:45, 7.84s/it, loss=0.0000, acc=1.0000, iter_time=7.35s]
Epoch 2: 83%|████████▎ | 10289/12384 [21:51:46<4:33:45, 7.84s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 2: 83%|████████▎ | 10290/12384 [21:51:46<4:31:18, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 2: 83%|████████▎ | 10290/12384 [21:51:54<4:31:18, 7.77s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 2: 83%|████████▎ | 10291/12384 [21:51:54<4:29:35, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=10.14s]
Epoch 2: 83%|████████▎ | 10291/12384 [21:52:02<4:29:35, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 2: 83%|████████▎ | 10292/12384 [21:52:02<4:28:05, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.53s]
Epoch 2: 83%|████████▎ | 10292/12384 [21:52:09<4:28:05, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 2: 83%|████████▎ | 10293/12384 [21:52:09<4:27:40, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 2: 83%|████████▎ | 10293/12384 [21:52:17<4:27:40, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 83%|████████▎ | 10294/12384 [21:52:17<4:26:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 83%|████████▎ | 10294/12384 [21:52:24<4:26:34, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 83%|████████▎ | 10295/12384 [21:52:24<4:26:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 83%|████████▎ | 10295/12384 [21:52:32<4:26:01, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 2: 83%|████████▎ | 10296/12384 [21:52:32<4:28:40, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 2: 83%|████████▎ | 10296/12384 [21:52:40<4:28:40, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 83%|████████▎ | 10297/12384 [21:52:40<4:27:18, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.21s]
Epoch 2: 83%|████████▎ | 10297/12384 [21:52:48<4:27:18, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=7.61s]
Epoch 2: 83%|████████▎ | 10298/12384 [21:52:48<4:27:17, 7.69s/it, loss=0.0002, acc=1.0000, iter_time=7.61s]
Epoch 2: 83%|████████▎ | 10298/12384 [21:52:55<4:27:17, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 2: 83%|████████▎ | 10299/12384 [21:52:55<4:26:24, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=5.61s]
Epoch 2: 83%|████████▎ | 10299/12384 [21:53:03<4:26:24, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 2: 83%|████████▎ | 10300/12384 [21:53:03<4:25:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.39s]
Epoch 2: 83%|████████▎ | 10300/12384 [21:53:10<4:25:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 2: 83%|████████▎ | 10301/12384 [21:53:10<4:25:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 2: 83%|████████▎ | 10301/12384 [21:53:18<4:25:12, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 83%|████████▎ | 10302/12384 [21:53:18<4:24:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 83%|████████▎ | 10302/12384 [21:53:26<4:24:40, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 83%|████████▎ | 10303/12384 [21:53:26<4:24:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 2: 83%|████████▎ | 10303/12384 [21:53:33<4:24:23, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 83%|████████▎ | 10304/12384 [21:53:33<4:24:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.00s]
Epoch 2: 83%|████████▎ | 10304/12384 [21:53:41<4:24:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 83%|████████▎ | 10305/12384 [21:53:41<4:24:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 83%|████████▎ | 10305/12384 [21:53:49<4:24:04, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 2: 83%|████████▎ | 10306/12384 [21:53:49<4:27:22, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=5.09s]
Epoch 2: 83%|████████▎ | 10306/12384 [21:53:56<4:27:22, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 2: 83%|████████▎ | 10307/12384 [21:53:56<4:25:49, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=10.45s]
Epoch 2: 83%|████████▎ | 10307/12384 [21:54:04<4:25:49, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 2: 83%|████████▎ | 10308/12384 [21:54:04<4:24:56, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.28s]
Epoch 2: 83%|████████▎ | 10308/12384 [21:54:12<4:24:56, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 2: 83%|████████▎ | 10309/12384 [21:54:12<4:24:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.97s]
Epoch 2: 83%|████████▎ | 10309/12384 [21:54:19<4:24:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 2: 83%|████████▎ | 10310/12384 [21:54:19<4:23:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.82s]
Epoch 2: 83%|████████▎ | 10310/12384 [21:54:27<4:23:32, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.09s]
Epoch 2: 83%|████████▎ | 10311/12384 [21:54:27<4:23:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.09s]
Epoch 2: 83%|████████▎ | 10311/12384 [21:54:34<4:23:16, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 2: 83%|████████▎ | 10312/12384 [21:54:34<4:23:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.80s]
Epoch 2: 83%|████████▎ | 10312/12384 [21:54:42<4:23:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 83%|████████▎ | 10313/12384 [21:54:42<4:22:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 2: 83%|████████▎ | 10313/12384 [21:54:50<4:22:56, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 2: 83%|████████▎ | 10314/12384 [21:54:50<4:22:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 2: 83%|████████▎ | 10314/12384 [21:54:57<4:22:50, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 2: 83%|████████▎ | 10315/12384 [21:54:57<4:22:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.05s]
Epoch 2: 83%|████████▎ | 10315/12384 [21:55:05<4:22:41, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 83%|████████▎ | 10316/12384 [21:55:05<4:22:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 2: 83%|████████▎ | 10316/12384 [21:55:12<4:22:25, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 83%|████████▎ | 10317/12384 [21:55:12<4:22:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 83%|████████▎ | 10317/12384 [21:55:20<4:22:01, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 2: 83%|████████▎ | 10318/12384 [21:55:20<4:21:51, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=6.13s]
Epoch 2: 83%|████████▎ | 10318/12384 [21:55:28<4:21:51, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 83%|████████▎ | 10319/12384 [21:55:28<4:21:40, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=7.55s]
Epoch 2: 83%|████████▎ | 10319/12384 [21:55:35<4:21:40, 7.60s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 2: 83%|████████▎ | 10320/12384 [21:55:35<4:21:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 2: 83%|████████▎ | 10320/12384 [21:55:43<4:21:54, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.26s]
Epoch 2: 83%|████████▎ | 10321/12384 [21:55:43<4:21:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=4.26s]
Epoch 2: 83%|████████▎ | 10321/12384 [21:55:51<4:21:46, 7.61s/it, loss=0.0000, acc=1.0000, iter_time=11.34s]
Epoch 2: 83%|████████▎ | 10322/12384 [21:55:51<4:24:52, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=11.34s]
Epoch 2: 83%|████████▎ | 10322/12384 [21:55:58<4:24:52, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 83%|████████▎ | 10323/12384 [21:55:58<4:23:39, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 83%|████████▎ | 10323/12384 [21:56:06<4:23:39, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 2: 83%|████████▎ | 10324/12384 [21:56:06<4:22:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.30s]
Epoch 2: 83%|████████▎ | 10324/12384 [21:56:14<4:22:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 2: 83%|████████▎ | 10325/12384 [21:56:14<4:21:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.09s]
Epoch 2: 83%|████████▎ | 10325/12384 [21:56:21<4:21:59, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.13s]
Epoch 2: 83%|████████▎ | 10326/12384 [21:56:21<4:21:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.13s]
Epoch 2: 83%|████████▎ | 10326/12384 [21:56:29<4:21:25, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 2: 83%|████████▎ | 10327/12384 [21:56:29<4:21:08, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.31s]
Epoch 2: 83%|████████▎ | 10327/12384 [21:56:37<4:21:08, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=9.59s]
Epoch 2: 83%|████████▎ | 10328/12384 [21:56:37<4:21:56, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=9.59s]
Epoch 2: 83%|████████▎ | 10328/12384 [21:56:44<4:21:56, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 83%|████████▎ | 10329/12384 [21:56:44<4:21:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.80s]
Epoch 2: 83%|████████▎ | 10329/12384 [21:56:52<4:21:31, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 2: 83%|████████▎ | 10330/12384 [21:56:52<4:21:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.09s]
Epoch 2: 83%|████████▎ | 10330/12384 [21:56:59<4:21:15, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.85s]
Epoch 2: 83%|████████▎ | 10331/12384 [21:56:59<4:21:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.85s]
Epoch 2: 83%|████████▎ | 10331/12384 [21:57:07<4:21:00, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.81s]
Epoch 2: 83%|████████▎ | 10332/12384 [21:57:07<4:20:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.81s]
Epoch 2: 83%|████████▎ | 10332/12384 [21:57:15<4:20:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 83%|████████▎ | 10333/12384 [21:57:15<4:24:04, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.25s]
Epoch 2: 83%|████████▎ | 10333/12384 [21:57:23<4:24:04, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 83%|████████▎ | 10334/12384 [21:57:23<4:22:34, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 2: 83%|████████▎ | 10334/12384 [21:57:30<4:22:34, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 83%|████████▎ | 10335/12384 [21:57:30<4:21:38, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.92s]
Epoch 2: 83%|████████▎ | 10335/12384 [21:57:38<4:21:38, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 2: 83%|████████▎ | 10336/12384 [21:57:38<4:22:29, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=8.10s]
Epoch 2: 83%|████████▎ | 10336/12384 [21:57:46<4:22:29, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=6.95s]
Epoch 2: 83%|████████▎ | 10337/12384 [21:57:46<4:21:53, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.95s]
Epoch 2: 83%|████████▎ | 10337/12384 [21:57:53<4:21:53, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 2: 83%|████████▎ | 10338/12384 [21:57:53<4:21:12, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.90s]
Epoch 2: 83%|████████▎ | 10338/12384 [21:58:01<4:21:12, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.77s]
Epoch 2: 83%|████████▎ | 10339/12384 [21:58:01<4:21:34, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=9.77s]
Epoch 2: 83%|████████▎ | 10339/12384 [21:58:09<4:21:34, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 83%|████████▎ | 10340/12384 [21:58:09<4:20:52, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 2: 83%|████████▎ | 10340/12384 [21:58:16<4:20:52, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 2: 84%|████████▎ | 10341/12384 [21:58:16<4:20:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.51s]
Epoch 2: 84%|████████▎ | 10341/12384 [21:58:24<4:20:17, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=9.74s]
Epoch 2: 84%|████████▎ | 10342/12384 [21:58:24<4:20:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=9.74s]
Epoch 2: 84%|████████▎ | 10342/12384 [21:58:31<4:20:14, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 84%|████████▎ | 10343/12384 [21:58:31<4:19:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=6.12s]
Epoch 2: 84%|████████▎ | 10343/12384 [21:58:39<4:19:22, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 2: 84%|████████▎ | 10344/12384 [21:58:39<4:19:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.03s]
Epoch 2: 84%|████████▎ | 10344/12384 [21:58:47<4:19:09, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.52s]
Epoch 2: 84%|████████▎ | 10345/12384 [21:58:47<4:18:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=4.52s]
Epoch 2: 84%|████████▎ | 10345/12384 [21:58:54<4:18:51, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.77s]
Epoch 2: 84%|████████▎ | 10346/12384 [21:58:54<4:18:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.77s]
Epoch 2: 84%|████████▎ | 10346/12384 [21:59:02<4:18:52, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]
Epoch 2: 84%|████████▎ | 10347/12384 [21:59:02<4:19:38, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.71s]W0313 16:43:46.522000 62173 site-packages/torch/distributed/elastic/agent/server/api.py:725] Received 15 death signal, shutting down workers
+W0313 16:43:46.523000 62173 site-packages/torch/distributed/elastic/multiprocessing/api.py:908] Sending process 62352 closing signal SIGTERM
+W0313 16:43:46.524000 62173 site-packages/torch/distributed/elastic/multiprocessing/api.py:908] Sending process 62353 closing signal SIGTERM
+W0313 16:43:46.524000 62173 site-packages/torch/distributed/elastic/multiprocessing/api.py:908] Sending process 62354 closing signal SIGTERM
+W0313 16:43:46.525000 62173 site-packages/torch/distributed/elastic/multiprocessing/api.py:908] Sending process 62355 closing signal SIGTERM
+W0313 16:43:46.525000 62173 site-packages/torch/distributed/elastic/multiprocessing/api.py:908] Sending process 62356 closing signal SIGTERM
+W0313 16:43:46.525000 62173 site-packages/torch/distributed/elastic/multiprocessing/api.py:908] Sending process 62357 closing signal SIGTERM
+W0313 16:43:46.525000 62173 site-packages/torch/distributed/elastic/multiprocessing/api.py:908] Sending process 62358 closing signal SIGTERM
+W0313 16:43:46.526000 62173 site-packages/torch/distributed/elastic/multiprocessing/api.py:908] Sending process 62359 closing signal SIGTERM
+Traceback (most recent call last):
+ File "", line 198, in _run_module_as_main
+ File "", line 88, in _run_code
+ File "/workspace/hanrui/specforge/lib/python3.11/site-packages/torch/distributed/run.py", line 940, in
+ File "/workspace/hanrui/specforge/lib/python3.11/site-packages/torch/distributed/elastic/multiprocessing/errors/__init__.py", line 357, in wrapper
+ File "/workspace/hanrui/specforge/lib/python3.11/site-packages/torch/distributed/run.py", line 936, in main
+ File "/workspace/hanrui/specforge/lib/python3.11/site-packages/torch/distributed/run.py", line 927, in run
+ File "/workspace/hanrui/specforge/lib/python3.11/site-packages/torch/distributed/launcher/api.py", line 156, in __call__
+ File "/workspace/hanrui/specforge/lib/python3.11/site-packages/torch/distributed/launcher/api.py", line 284, in launch_agent
+ File "/workspace/hanrui/specforge/lib/python3.11/site-packages/torch/distributed/elastic/metrics/api.py", line 138, in wrapper
+ File "/workspace/hanrui/specforge/lib/python3.11/site-packages/torch/distributed/elastic/agent/server/api.py", line 717, in run
+ File "/workspace/hanrui/specforge/lib/python3.11/site-packages/torch/distributed/elastic/agent/server/api.py", line 881, in _invoke_run
+ File "/workspace/hanrui/specforge/lib/python3.11/site-packages/torch/distributed/elastic/multiprocessing/api.py", line 85, in _terminate_process_handler
+torch.distributed.elastic.multiprocessing.api.SignalException: Process 62173 got signal: 15
diff --git a/syxin_old/train_random_anchor.log b/syxin_old/train_random_anchor.log
new file mode 100644
index 0000000000000000000000000000000000000000..a2f6d647b948741a49a601aa862dc0a3ad744ed5
--- /dev/null
+++ b/syxin_old/train_random_anchor.log
@@ -0,0 +1,97 @@
+nohup: ignoring input
+
+*****************************************
+Setting OMP_NUM_THREADS environment variable for each process to be 1 in default, to avoid your system being overloaded, please further tune the variable for optimal performance in your application as needed.
+*****************************************
+Set TORCH_CUDA_ARCH_LIST to 9.0
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+Set TORCH_CUDA_ARCH_LIST to 9.0
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+Set TORCH_CUDA_ARCH_LIST to 9.0
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+Set TORCH_CUDA_ARCH_LIST to 9.0
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+Set TORCH_CUDA_ARCH_LIST to 9.0
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+Set TORCH_CUDA_ARCH_LIST to 9.0
+Set TORCH_CUDA_ARCH_LIST to 9.0
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+Set TORCH_CUDA_ARCH_LIST to 9.0
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+[W324 18:48:28.089205442 Utils.hpp:137] Warning: Environment variable NCCL_ASYNC_ERROR_HANDLING is deprecated; use TORCH_NCCL_ASYNC_ERROR_HANDLING instead (function operator())
+`torch_dtype` is deprecated! Use `dtype` instead!
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:08, 2.13s/it][W324 18:48:31.931154830 Utils.hpp:137] Warning: Environment variable NCCL_ASYNC_ERROR_HANDLING is deprecated; use TORCH_NCCL_ASYNC_ERROR_HANDLING instead (function operator())
+[W324 18:48:31.063963362 Utils.hpp:137] Warning: Environment variable NCCL_ASYNC_ERROR_HANDLING is deprecated; use TORCH_NCCL_ASYNC_ERROR_HANDLING instead (function operator())
+[W324 18:48:31.127784704 Utils.hpp:137] Warning: Environment variable NCCL_ASYNC_ERROR_HANDLING is deprecated; use TORCH_NCCL_ASYNC_ERROR_HANDLING instead (function operator())
+[W324 18:48:31.302012762 Utils.hpp:137] Warning: Environment variable NCCL_ASYNC_ERROR_HANDLING is deprecated; use TORCH_NCCL_ASYNC_ERROR_HANDLING instead (function operator())
+[W324 18:48:31.311609901 Utils.hpp:137] Warning: Environment variable NCCL_ASYNC_ERROR_HANDLING is deprecated; use TORCH_NCCL_ASYNC_ERROR_HANDLING instead (function operator())
+[W324 18:48:31.376922106 Utils.hpp:137] Warning: Environment variable NCCL_ASYNC_ERROR_HANDLING is deprecated; use TORCH_NCCL_ASYNC_ERROR_HANDLING instead (function operator())
+[W324 18:48:32.592823608 Utils.hpp:137] Warning: Environment variable NCCL_ASYNC_ERROR_HANDLING is deprecated; use TORCH_NCCL_ASYNC_ERROR_HANDLING instead (function operator())
+`torch_dtype` is deprecated! Use `dtype` instead!
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]`torch_dtype` is deprecated! Use `dtype` instead!
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+`torch_dtype` is deprecated! Use `dtype` instead!
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]`torch_dtype` is deprecated! Use `dtype` instead!
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+`torch_dtype` is deprecated! Use `dtype` instead!
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+`torch_dtype` is deprecated! Use `dtype` instead!
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+`torch_dtype` is deprecated! Use `dtype` instead!
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 40%|████ | 2/5 [00:04<00:07, 2.35s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:10, 2.68s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:10, 2.74s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:11, 2.78s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:11, 2.84s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:11, 2.83s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:06<00:04, 2.20s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:03<00:12, 3.17s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:03<00:12, 3.19s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:08<00:01, 1.97s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:07, 2.53s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:07, 2.62s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:07, 2.61s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:08<00:00, 1.48s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:08<00:00, 1.78s/it]
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 145.81it/s]
+
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:08, 2.72s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:08, 2.72s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:06<00:09, 3.03s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:06<00:09, 3.03s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:07<00:04, 2.45s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:07<00:05, 2.57s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:07<00:05, 2.59s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:08<00:05, 2.68s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:08<00:05, 2.69s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:09<00:02, 2.15s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:09<00:05, 2.98s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:09<00:05, 2.98s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:09<00:00, 1.59s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:09<00:00, 1.95s/it]
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 148.22it/s]
+
Loading checkpoint shards: 80%|████████ | 4/5 [00:09<00:02, 2.33s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:09<00:02, 2.32s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:10<00:02, 2.41s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:10<00:02, 2.41s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 1.75s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 1.75s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 2.09s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 2.10s/it]
+
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 148.78it/s]
Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 147.89it/s]
+
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 1.80s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 1.80s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 2.17s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 2.17s/it]
+
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 149.97it/s]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 144.76it/s]
+
Loading checkpoint shards: 80%|████████ | 4/5 [00:11<00:02, 2.70s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:11<00:02, 2.70s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:12<00:00, 2.03s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:12<00:00, 2.03s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:12<00:00, 2.43s/it]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:12<00:00, 2.43s/it]
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 147.58it/s]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 146.91it/s]
+trainable params: 30,670,848 || all params: 8,221,406,208 || trainable%: 0.3731
+trainable params: 30,670,848 || all params: 8,221,406,208 || trainable%: 0.3731
+trainable params: 30,670,848 || all params: 8,221,406,208 || trainable%: 0.3731
+trainable params: 30,670,848 || all params: 8,221,406,208 || trainable%: 0.3731
+dataset is cached at /tmp/specforge_cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkl
+/workspace/miniconda3/envs/spec/lib/python3.11/site-packages/torch/distributed/distributed_c10d.py:4876: UserWarning: barrier(): using the device under current context. You can specify `device_id` in `init_process_group` to mute this warning.
+ warnings.warn( # warn only once
+[rank0]:[W324 18:48:53.286559498 ProcessGroupNCCL.cpp:5072] Guessing device ID based on global rank. This can cause a hang if rank to GPU mapping is heterogeneous. You can specify device_id in init_process_group()
+trainable params: 30,670,848 || all params: 8,221,406,208 || trainable%: 0.3731
+trainable params: 30,670,848 || all params: 8,221,406,208 || trainable%: 0.3731
+trainable params: 30,670,848 || all params: 8,221,406,208 || trainable%: 0.3731
+trainable params: 30,670,848 || all params: 8,221,406,208 || trainable%: 0.3731
+dataset is cached at /tmp/specforge_cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkl
+dataset is cached at /tmp/specforge_cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkl
+dataset is cached at /tmp/specforge_cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkl
+dataset is cached at /tmp/specforge_cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkl
+dataset is cached at /tmp/specforge_cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkl
+dataset is cached at /tmp/specforge_cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkl
+dataset is cached at /tmp/specforge_cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkl
+[rank3]:[W324 18:49:00.755365938 Utils.hpp:112] Warning: Environment variable NCCL_ASYNC_ERROR_HANDLING is deprecated; use TORCH_NCCL_ASYNC_ERROR_HANDLING instead (function operator())
+[rank1]:[W324 18:49:00.767535335 Utils.hpp:112] Warning: Environment variable NCCL_ASYNC_ERROR_HANDLING is deprecated; use TORCH_NCCL_ASYNC_ERROR_HANDLING instead (function operator())
+[rank2]:[W324 18:49:00.770508168 Utils.hpp:112] Warning: Environment variable NCCL_ASYNC_ERROR_HANDLING is deprecated; use TORCH_NCCL_ASYNC_ERROR_HANDLING instead (function operator())
+[rank6]:[W324 18:49:00.771645742 Utils.hpp:112] Warning: Environment variable NCCL_ASYNC_ERROR_HANDLING is deprecated; use TORCH_NCCL_ASYNC_ERROR_HANDLING instead (function operator())
+[rank7]:[W324 18:49:00.772019337 Utils.hpp:112] Warning: Environment variable NCCL_ASYNC_ERROR_HANDLING is deprecated; use TORCH_NCCL_ASYNC_ERROR_HANDLING instead (function operator())
+[rank5]:[W324 18:49:00.772389239 Utils.hpp:112] Warning: Environment variable NCCL_ASYNC_ERROR_HANDLING is deprecated; use TORCH_NCCL_ASYNC_ERROR_HANDLING instead (function operator())
+[rank0]:[W324 18:49:00.772792117 Utils.hpp:112] Warning: Environment variable NCCL_ASYNC_ERROR_HANDLING is deprecated; use TORCH_NCCL_ASYNC_ERROR_HANDLING instead (function operator())
+[rank4]:[W324 18:49:00.773187057 Utils.hpp:112] Warning: Environment variable NCCL_ASYNC_ERROR_HANDLING is deprecated; use TORCH_NCCL_ASYNC_ERROR_HANDLING instead (function operator())
+
Epoch 0: 0%| | 0/99077 [00:00, ?it/s]
Epoch 0: 0%| | 0/99077 [00:01, ?it/s, loss=13.8710, acc=0.0031, iter_time=1.26s]
Epoch 0: 0%| | 1/99077 [00:01<34:23:50, 1.25s/it, loss=13.8710, acc=0.0031, iter_time=1.26s]
Epoch 0: 0%| | 1/99077 [00:01<34:23:50, 1.25s/it, loss=13.9765, acc=0.0000, iter_time=0.39s]
Epoch 0: 0%| | 2/99077 [00:01<21:12:46, 1.30it/s, loss=13.9765, acc=0.0000, iter_time=0.39s]
Epoch 0: 0%| | 2/99077 [00:02<21:12:46, 1.30it/s, loss=12.4888, acc=0.0010, iter_time=0.44s]
Epoch 0: 0%| | 3/99077 [00:02<16:55:25, 1.63it/s, loss=12.4888, acc=0.0010, iter_time=0.44s]
Epoch 0: 0%| | 3/99077 [00:02<16:55:25, 1.63it/s, loss=10.2651, acc=0.0010, iter_time=0.42s]
Epoch 0: 0%| | 4/99077 [00:02<14:53:18, 1.85it/s, loss=10.2651, acc=0.0010, iter_time=0.42s]
Epoch 0: 0%| | 4/99077 [00:02<14:53:18, 1.85it/s, loss=11.1887, acc=0.0021, iter_time=0.43s]
Epoch 0: 0%| | 5/99077 [00:02<13:45:15, 2.00it/s, loss=11.1887, acc=0.0021, iter_time=0.43s]
Epoch 0: 0%| | 5/99077 [00:03<13:45:15, 2.00it/s, loss=13.4169, acc=0.0021, iter_time=0.42s]
Epoch 0: 0%| | 6/99077 [00:03<13:04:54, 2.10it/s, loss=13.4169, acc=0.0021, iter_time=0.42s]
Epoch 0: 0%| | 6/99077 [00:03<13:04:54, 2.10it/s, loss=12.6732, acc=0.0000, iter_time=0.44s]
Epoch 0: 0%| | 7/99077 [00:03<12:39:00, 2.18it/s, loss=12.6732, acc=0.0000, iter_time=0.44s]
Epoch 0: 0%| | 7/99077 [00:04<12:39:00, 2.18it/s, loss=11.6319, acc=0.0010, iter_time=0.41s]
Epoch 0: 0%| | 8/99077 [00:04<12:22:49, 2.22it/s, loss=11.6319, acc=0.0010, iter_time=0.41s]
Epoch 0: 0%| | 8/99077 [00:05<12:22:49, 2.22it/s, loss=11.3662, acc=0.0000, iter_time=0.81s]
Epoch 0: 0%| | 9/99077 [00:05<15:18:21, 1.80it/s, loss=11.3662, acc=0.0000, iter_time=0.81s]
Epoch 0: 0%| | 9/99077 [00:05<15:18:21, 1.80it/s, loss=14.0717, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 10/99077 [00:05<14:12:13, 1.94it/s, loss=14.0717, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 10/99077 [00:05<14:12:13, 1.94it/s, loss=14.8573, acc=0.0000, iter_time=0.43s]
Epoch 0: 0%| | 11/99077 [00:05<13:27:16, 2.05it/s, loss=14.8573, acc=0.0000, iter_time=0.43s]
Epoch 0: 0%| | 11/99077 [00:06<13:27:16, 2.05it/s, loss=10.9801, acc=0.0010, iter_time=0.41s]
Epoch 0: 0%| | 12/99077 [00:06<12:52:08, 2.14it/s, loss=10.9801, acc=0.0010, iter_time=0.41s]
Epoch 0: 0%| | 12/99077 [00:06<12:52:08, 2.14it/s, loss=12.9438, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 13/99077 [00:06<12:31:40, 2.20it/s, loss=12.9438, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 13/99077 [00:07<12:31:40, 2.20it/s, loss=11.3991, acc=0.0000, iter_time=0.41s]
Epoch 0: 0%| | 14/99077 [00:07<12:19:23, 2.23it/s, loss=11.3991, acc=0.0000, iter_time=0.41s]
Epoch 0: 0%| | 14/99077 [00:07<12:19:23, 2.23it/s, loss=13.9139, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 15/99077 [00:07<12:04:31, 2.28it/s, loss=13.9139, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 15/99077 [00:08<12:04:31, 2.28it/s, loss=12.5221, acc=0.0000, iter_time=0.43s]
Epoch 0: 0%| | 16/99077 [00:08<11:58:39, 2.30it/s, loss=12.5221, acc=0.0000, iter_time=0.43s]
Epoch 0: 0%| | 16/99077 [00:08<11:58:39, 2.30it/s, loss=12.2158, acc=0.0010, iter_time=0.42s]
Epoch 0: 0%| | 17/99077 [00:08<11:56:02, 2.31it/s, loss=12.2158, acc=0.0010, iter_time=0.42s]
Epoch 0: 0%| | 17/99077 [00:08<11:56:02, 2.31it/s, loss=17.6235, acc=0.0000, iter_time=0.42s]
Epoch 0: 0%| | 18/99077 [00:08<11:39:02, 2.36it/s, loss=17.6235, acc=0.0000, iter_time=0.42s]
Epoch 0: 0%| | 18/99077 [00:09<11:39:02, 2.36it/s, loss=12.0257, acc=0.0010, iter_time=0.40s]
Epoch 0: 0%| | 19/99077 [00:09<11:33:16, 2.38it/s, loss=12.0257, acc=0.0010, iter_time=0.40s]
Epoch 0: 0%| | 19/99077 [00:09<11:33:16, 2.38it/s, loss=12.5958, acc=0.0000, iter_time=0.44s]
Epoch 0: 0%| | 20/99077 [00:09<11:38:16, 2.36it/s, loss=12.5958, acc=0.0000, iter_time=0.44s]
Epoch 0: 0%| | 20/99077 [00:10<11:38:16, 2.36it/s, loss=12.9043, acc=0.0010, iter_time=0.40s]
Epoch 0: 0%| | 21/99077 [00:10<11:40:21, 2.36it/s, loss=12.9043, acc=0.0010, iter_time=0.40s]
Epoch 0: 0%| | 21/99077 [00:10<11:40:21, 2.36it/s, loss=13.1043, acc=0.0010, iter_time=0.44s]
Epoch 0: 0%| | 22/99077 [00:10<11:42:09, 2.35it/s, loss=13.1043, acc=0.0010, iter_time=0.44s]
Epoch 0: 0%| | 22/99077 [00:10<11:42:09, 2.35it/s, loss=15.3768, acc=0.0010, iter_time=0.42s]
Epoch 0: 0%| | 23/99077 [00:10<11:44:46, 2.34it/s, loss=15.3768, acc=0.0010, iter_time=0.42s]
Epoch 0: 0%| | 23/99077 [00:11<11:44:46, 2.34it/s, loss=11.1989, acc=0.0031, iter_time=0.44s]
Epoch 0: 0%| | 24/99077 [00:11<11:47:16, 2.33it/s, loss=11.1989, acc=0.0031, iter_time=0.44s]
Epoch 0: 0%| | 24/99077 [00:11<11:47:16, 2.33it/s, loss=13.8976, acc=0.0000, iter_time=0.42s]
Epoch 0: 0%| | 25/99077 [00:11<11:46:18, 2.34it/s, loss=13.8976, acc=0.0000, iter_time=0.42s]
Epoch 0: 0%| | 25/99077 [00:12<11:46:18, 2.34it/s, loss=13.8520, acc=0.0000, iter_time=0.42s]
Epoch 0: 0%| | 26/99077 [00:12<11:45:53, 2.34it/s, loss=13.8520, acc=0.0000, iter_time=0.42s]
Epoch 0: 0%| | 26/99077 [00:12<11:45:53, 2.34it/s, loss=11.0260, acc=0.0021, iter_time=0.44s]
Epoch 0: 0%| | 27/99077 [00:12<11:45:05, 2.34it/s, loss=11.0260, acc=0.0021, iter_time=0.44s]
Epoch 0: 0%| | 27/99077 [00:13<11:45:05, 2.34it/s, loss=10.1774, acc=0.0010, iter_time=0.41s]
Epoch 0: 0%| | 28/99077 [00:13<11:36:31, 2.37it/s, loss=10.1774, acc=0.0010, iter_time=0.41s]
Epoch 0: 0%| | 28/99077 [00:13<11:36:31, 2.37it/s, loss=13.3967, acc=0.0021, iter_time=0.42s]
Epoch 0: 0%| | 29/99077 [00:13<11:32:26, 2.38it/s, loss=13.3967, acc=0.0021, iter_time=0.42s]
Epoch 0: 0%| | 29/99077 [00:13<11:32:26, 2.38it/s, loss=14.1579, acc=0.0021, iter_time=0.43s]
Epoch 0: 0%| | 30/99077 [00:13<11:36:27, 2.37it/s, loss=14.1579, acc=0.0021, iter_time=0.43s]
Epoch 0: 0%| | 30/99077 [00:14<11:36:27, 2.37it/s, loss=12.4593, acc=0.0000, iter_time=0.43s]
Epoch 0: 0%| | 31/99077 [00:14<11:38:30, 2.36it/s, loss=12.4593, acc=0.0000, iter_time=0.43s]
Epoch 0: 0%| | 31/99077 [00:14<11:38:30, 2.36it/s, loss=9.9426, acc=0.0031, iter_time=0.41s]
Epoch 0: 0%| | 32/99077 [00:14<11:34:18, 2.38it/s, loss=9.9426, acc=0.0031, iter_time=0.41s]
Epoch 0: 0%| | 32/99077 [00:15<11:34:18, 2.38it/s, loss=11.7165, acc=0.0021, iter_time=0.45s]
Epoch 0: 0%| | 33/99077 [00:15<11:39:20, 2.36it/s, loss=11.7165, acc=0.0021, iter_time=0.45s]
Epoch 0: 0%| | 33/99077 [00:15<11:39:20, 2.36it/s, loss=11.4410, acc=0.0052, iter_time=0.40s]
Epoch 0: 0%| | 34/99077 [00:15<11:41:06, 2.35it/s, loss=11.4410, acc=0.0052, iter_time=0.40s]
Epoch 0: 0%| | 34/99077 [00:16<11:41:06, 2.35it/s, loss=11.7763, acc=0.0021, iter_time=0.43s]
Epoch 0: 0%| | 35/99077 [00:16<11:41:24, 2.35it/s, loss=11.7763, acc=0.0021, iter_time=0.43s]
Epoch 0: 0%| | 35/99077 [00:16<11:41:24, 2.35it/s, loss=10.8383, acc=0.0010, iter_time=0.45s]
Epoch 0: 0%| | 36/99077 [00:16<11:43:41, 2.35it/s, loss=10.8383, acc=0.0010, iter_time=0.45s]
Epoch 0: 0%| | 36/99077 [00:17<11:43:41, 2.35it/s, loss=14.9072, acc=0.0010, iter_time=0.77s]
Epoch 0: 0%| | 37/99077 [00:17<14:54:20, 1.85it/s, loss=14.9072, acc=0.0010, iter_time=0.77s]
Epoch 0: 0%| | 37/99077 [00:17<14:54:20, 1.85it/s, loss=11.0706, acc=0.0010, iter_time=0.45s]
Epoch 0: 0%| | 38/99077 [00:17<13:58:25, 1.97it/s, loss=11.0706, acc=0.0010, iter_time=0.45s]
Epoch 0: 0%| | 38/99077 [00:18<13:58:25, 1.97it/s, loss=14.2416, acc=0.0021, iter_time=0.46s]
Epoch 0: 0%| | 39/99077 [00:18<13:19:46, 2.06it/s, loss=14.2416, acc=0.0021, iter_time=0.46s]
Epoch 0: 0%| | 39/99077 [00:18<13:19:46, 2.06it/s, loss=13.1443, acc=0.0000, iter_time=0.41s]
Epoch 0: 0%| | 40/99077 [00:18<12:50:13, 2.14it/s, loss=13.1443, acc=0.0000, iter_time=0.41s]
Epoch 0: 0%| | 40/99077 [00:18<12:50:13, 2.14it/s, loss=11.2656, acc=0.0052, iter_time=0.41s]
Epoch 0: 0%| | 41/99077 [00:18<12:18:34, 2.23it/s, loss=11.2656, acc=0.0052, iter_time=0.41s]
Epoch 0: 0%| | 41/99077 [00:19<12:18:34, 2.23it/s, loss=13.1926, acc=0.0010, iter_time=0.42s]
Epoch 0: 0%| | 42/99077 [00:19<12:08:09, 2.27it/s, loss=13.1926, acc=0.0010, iter_time=0.42s]
Epoch 0: 0%| | 42/99077 [00:19<12:08:09, 2.27it/s, loss=10.2414, acc=0.0010, iter_time=0.42s]
Epoch 0: 0%| | 43/99077 [00:19<12:01:46, 2.29it/s, loss=10.2414, acc=0.0010, iter_time=0.42s]
Epoch 0: 0%| | 43/99077 [00:20<12:01:46, 2.29it/s, loss=11.0006, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 44/99077 [00:20<11:57:07, 2.30it/s, loss=11.0006, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 44/99077 [00:20<11:57:07, 2.30it/s, loss=12.4089, acc=0.0000, iter_time=0.44s]
Epoch 0: 0%| | 45/99077 [00:20<11:53:54, 2.31it/s, loss=12.4089, acc=0.0000, iter_time=0.44s]
Epoch 0: 0%| | 45/99077 [00:21<11:53:54, 2.31it/s, loss=13.6205, acc=0.0031, iter_time=0.43s]
Epoch 0: 0%| | 46/99077 [00:21<11:51:53, 2.32it/s, loss=13.6205, acc=0.0031, iter_time=0.43s]
Epoch 0: 0%| | 46/99077 [00:21<11:51:53, 2.32it/s, loss=13.4763, acc=0.0021, iter_time=0.45s]
Epoch 0: 0%| | 47/99077 [00:21<11:52:48, 2.32it/s, loss=13.4763, acc=0.0021, iter_time=0.45s]
Epoch 0: 0%| | 47/99077 [00:21<11:52:48, 2.32it/s, loss=12.6840, acc=0.0010, iter_time=0.41s]
Epoch 0: 0%| | 48/99077 [00:21<11:51:42, 2.32it/s, loss=12.6840, acc=0.0010, iter_time=0.41s]
Epoch 0: 0%| | 48/99077 [00:22<11:51:42, 2.32it/s, loss=10.2276, acc=0.0021, iter_time=0.43s]
Epoch 0: 0%| | 49/99077 [00:22<11:47:45, 2.33it/s, loss=10.2276, acc=0.0021, iter_time=0.43s]
Epoch 0: 0%| | 49/99077 [00:22<11:47:45, 2.33it/s, loss=14.8760, acc=0.0000, iter_time=0.46s]
Epoch 0: 0%| | 50/99077 [00:22<11:48:11, 2.33it/s, loss=14.8760, acc=0.0000, iter_time=0.46s]
Epoch 0: 0%| | 50/99077 [00:23<11:48:11, 2.33it/s, loss=11.7846, acc=0.0000, iter_time=0.41s]
Epoch 0: 0%| | 51/99077 [00:23<11:48:01, 2.33it/s, loss=11.7846, acc=0.0000, iter_time=0.41s]
Epoch 0: 0%| | 51/99077 [00:23<11:48:01, 2.33it/s, loss=16.3344, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 52/99077 [00:23<11:48:50, 2.33it/s, loss=16.3344, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 52/99077 [00:24<11:48:50, 2.33it/s, loss=13.6097, acc=0.0000, iter_time=0.42s]
Epoch 0: 0%| | 53/99077 [00:24<11:47:58, 2.33it/s, loss=13.6097, acc=0.0000, iter_time=0.42s]
Epoch 0: 0%| | 53/99077 [00:24<11:47:58, 2.33it/s, loss=11.9641, acc=0.0000, iter_time=0.42s]
Epoch 0: 0%| | 54/99077 [00:24<11:38:28, 2.36it/s, loss=11.9641, acc=0.0000, iter_time=0.42s]
Epoch 0: 0%| | 54/99077 [00:24<11:38:28, 2.36it/s, loss=13.8353, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 55/99077 [00:24<11:40:44, 2.36it/s, loss=13.8353, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 55/99077 [00:25<11:40:44, 2.36it/s, loss=14.1820, acc=0.0021, iter_time=0.42s]
Epoch 0: 0%| | 56/99077 [00:25<11:38:00, 2.36it/s, loss=14.1820, acc=0.0021, iter_time=0.42s]
Epoch 0: 0%| | 56/99077 [00:25<11:38:00, 2.36it/s, loss=13.5609, acc=0.0021, iter_time=0.42s]
Epoch 0: 0%| | 57/99077 [00:25<11:40:14, 2.36it/s, loss=13.5609, acc=0.0021, iter_time=0.42s]
Epoch 0: 0%| | 57/99077 [00:26<11:40:14, 2.36it/s, loss=13.2704, acc=0.0021, iter_time=0.41s]
Epoch 0: 0%| | 58/99077 [00:26<11:42:23, 2.35it/s, loss=13.2704, acc=0.0021, iter_time=0.41s]
Epoch 0: 0%| | 58/99077 [00:26<11:42:23, 2.35it/s, loss=11.9523, acc=0.0000, iter_time=0.43s]
Epoch 0: 0%| | 59/99077 [00:26<11:40:24, 2.36it/s, loss=11.9523, acc=0.0000, iter_time=0.43s]
Epoch 0: 0%| | 59/99077 [00:27<11:40:24, 2.36it/s, loss=12.8820, acc=0.0000, iter_time=0.45s]
Epoch 0: 0%| | 60/99077 [00:27<11:42:03, 2.35it/s, loss=12.8820, acc=0.0000, iter_time=0.45s]
Epoch 0: 0%| | 60/99077 [00:27<11:42:03, 2.35it/s, loss=12.2972, acc=0.0000, iter_time=0.40s]
Epoch 0: 0%| | 61/99077 [00:27<11:44:38, 2.34it/s, loss=12.2972, acc=0.0000, iter_time=0.40s]
Epoch 0: 0%| | 61/99077 [00:28<11:44:38, 2.34it/s, loss=11.2447, acc=0.0000, iter_time=0.79s]
Epoch 0: 0%| | 62/99077 [00:28<14:50:54, 1.85it/s, loss=11.2447, acc=0.0000, iter_time=0.79s]
Epoch 0: 0%| | 62/99077 [00:28<14:50:54, 1.85it/s, loss=12.2107, acc=0.0021, iter_time=0.47s]
Epoch 0: 0%| | 63/99077 [00:28<13:58:10, 1.97it/s, loss=12.2107, acc=0.0021, iter_time=0.47s]
Epoch 0: 0%| | 63/99077 [00:29<13:58:10, 1.97it/s, loss=10.2726, acc=0.0010, iter_time=0.70s]
Epoch 0: 0%| | 64/99077 [00:29<15:17:30, 1.80it/s, loss=10.2726, acc=0.0010, iter_time=0.70s]
Epoch 0: 0%| | 64/99077 [00:29<15:17:30, 1.80it/s, loss=13.5985, acc=0.0021, iter_time=0.39s]
Epoch 0: 0%| | 65/99077 [00:29<14:15:22, 1.93it/s, loss=13.5985, acc=0.0021, iter_time=0.39s]
Epoch 0: 0%| | 65/99077 [00:30<14:15:22, 1.93it/s, loss=14.2180, acc=0.0000, iter_time=0.43s]
Epoch 0: 0%| | 66/99077 [00:30<13:29:35, 2.04it/s, loss=14.2180, acc=0.0000, iter_time=0.43s]
Epoch 0: 0%| | 66/99077 [00:30<13:29:35, 2.04it/s, loss=13.6456, acc=0.0021, iter_time=0.43s]
Epoch 0: 0%| | 67/99077 [00:30<13:00:08, 2.12it/s, loss=13.6456, acc=0.0021, iter_time=0.43s]
Epoch 0: 0%| | 67/99077 [00:31<13:00:08, 2.12it/s, loss=14.2725, acc=0.0010, iter_time=0.44s]
Epoch 0: 0%| | 68/99077 [00:31<12:38:16, 2.18it/s, loss=14.2725, acc=0.0010, iter_time=0.44s]
Epoch 0: 0%| | 68/99077 [00:31<12:38:16, 2.18it/s, loss=12.0614, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 69/99077 [00:31<12:22:29, 2.22it/s, loss=12.0614, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 69/99077 [00:31<12:22:29, 2.22it/s, loss=10.4446, acc=0.0051, iter_time=0.35s]
Epoch 0: 0%| | 70/99077 [00:31<12:11:09, 2.26it/s, loss=10.4446, acc=0.0051, iter_time=0.35s]
Epoch 0: 0%| | 70/99077 [00:32<12:11:09, 2.26it/s, loss=12.0591, acc=0.0000, iter_time=0.50s]
Epoch 0: 0%| | 71/99077 [00:32<12:05:06, 2.28it/s, loss=12.0591, acc=0.0000, iter_time=0.50s]
Epoch 0: 0%| | 71/99077 [00:32<12:05:06, 2.28it/s, loss=11.6029, acc=0.0000, iter_time=0.43s]
Epoch 0: 0%| | 72/99077 [00:32<12:01:17, 2.29it/s, loss=11.6029, acc=0.0000, iter_time=0.43s]
Epoch 0: 0%| | 72/99077 [00:33<12:01:17, 2.29it/s, loss=11.1675, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 73/99077 [00:33<11:56:05, 2.30it/s, loss=11.1675, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 73/99077 [00:33<11:56:05, 2.30it/s, loss=12.6584, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 74/99077 [00:33<11:45:34, 2.34it/s, loss=12.6584, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 74/99077 [00:34<11:45:34, 2.34it/s, loss=12.6786, acc=0.0010, iter_time=0.41s]
Epoch 0: 0%| | 75/99077 [00:34<11:45:15, 2.34it/s, loss=12.6786, acc=0.0010, iter_time=0.41s]
Epoch 0: 0%| | 75/99077 [00:34<11:45:15, 2.34it/s, loss=12.5739, acc=0.0000, iter_time=0.45s]
Epoch 0: 0%| | 76/99077 [00:34<11:47:10, 2.33it/s, loss=12.5739, acc=0.0000, iter_time=0.45s]
Epoch 0: 0%| | 76/99077 [00:34<11:47:10, 2.33it/s, loss=11.7176, acc=0.0021, iter_time=0.41s]
Epoch 0: 0%| | 77/99077 [00:34<11:37:11, 2.37it/s, loss=11.7176, acc=0.0021, iter_time=0.41s]
Epoch 0: 0%| | 77/99077 [00:35<11:37:11, 2.37it/s, loss=13.5247, acc=0.0021, iter_time=0.41s]
Epoch 0: 0%| | 78/99077 [00:35<11:31:22, 2.39it/s, loss=13.5247, acc=0.0021, iter_time=0.41s]
Epoch 0: 0%| | 78/99077 [00:35<11:31:22, 2.39it/s, loss=10.9316, acc=0.0031, iter_time=0.40s]
Epoch 0: 0%| | 79/99077 [00:35<11:23:49, 2.41it/s, loss=10.9316, acc=0.0031, iter_time=0.40s]
Epoch 0: 0%| | 79/99077 [00:36<11:23:49, 2.41it/s, loss=13.2660, acc=0.0000, iter_time=0.41s]
Epoch 0: 0%| | 80/99077 [00:36<11:31:39, 2.39it/s, loss=13.2660, acc=0.0000, iter_time=0.41s]
Epoch 0: 0%| | 80/99077 [00:36<11:31:39, 2.39it/s, loss=11.9419, acc=0.0000, iter_time=0.46s]
Epoch 0: 0%| | 81/99077 [00:36<11:37:26, 2.37it/s, loss=11.9419, acc=0.0000, iter_time=0.46s]
Epoch 0: 0%| | 81/99077 [00:37<11:37:26, 2.37it/s, loss=12.3308, acc=0.0021, iter_time=0.41s]
Epoch 0: 0%| | 82/99077 [00:37<11:39:59, 2.36it/s, loss=12.3308, acc=0.0021, iter_time=0.41s]
Epoch 0: 0%| | 82/99077 [00:37<11:39:59, 2.36it/s, loss=15.6599, acc=0.0000, iter_time=0.42s]
Epoch 0: 0%| | 83/99077 [00:37<11:42:02, 2.35it/s, loss=15.6599, acc=0.0000, iter_time=0.42s]
Epoch 0: 0%| | 83/99077 [00:37<11:42:02, 2.35it/s, loss=13.8169, acc=0.0021, iter_time=0.42s]
Epoch 0: 0%| | 84/99077 [00:37<11:43:10, 2.35it/s, loss=13.8169, acc=0.0021, iter_time=0.42s]
Epoch 0: 0%| | 84/99077 [00:38<11:43:10, 2.35it/s, loss=11.9970, acc=0.0021, iter_time=0.45s]
Epoch 0: 0%| | 85/99077 [00:38<11:44:08, 2.34it/s, loss=11.9970, acc=0.0021, iter_time=0.45s]
Epoch 0: 0%| | 85/99077 [00:38<11:44:08, 2.34it/s, loss=12.0296, acc=0.0000, iter_time=0.41s]
Epoch 0: 0%| | 86/99077 [00:38<11:45:26, 2.34it/s, loss=12.0296, acc=0.0000, iter_time=0.41s]
Epoch 0: 0%| | 86/99077 [00:39<11:45:26, 2.34it/s, loss=11.6182, acc=0.0021, iter_time=0.43s]
Epoch 0: 0%| | 87/99077 [00:39<11:45:40, 2.34it/s, loss=11.6182, acc=0.0021, iter_time=0.43s]
Epoch 0: 0%| | 87/99077 [00:39<11:45:40, 2.34it/s, loss=12.3590, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 88/99077 [00:39<11:36:37, 2.37it/s, loss=12.3590, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 88/99077 [00:40<11:36:37, 2.37it/s, loss=12.0996, acc=0.0000, iter_time=0.77s]
Epoch 0: 0%| | 89/99077 [00:40<14:51:05, 1.85it/s, loss=12.0996, acc=0.0000, iter_time=0.77s]
Epoch 0: 0%| | 89/99077 [00:40<14:51:05, 1.85it/s, loss=12.9596, acc=0.0010, iter_time=0.45s]
Epoch 0: 0%| | 90/99077 [00:40<13:43:00, 2.00it/s, loss=12.9596, acc=0.0010, iter_time=0.45s]
Epoch 0: 0%| | 90/99077 [00:41<13:43:00, 2.00it/s, loss=12.3350, acc=0.0031, iter_time=0.40s]
Epoch 0: 0%| | 91/99077 [00:41<12:57:42, 2.12it/s, loss=12.3350, acc=0.0031, iter_time=0.40s]
Epoch 0: 0%| | 91/99077 [00:41<12:57:42, 2.12it/s, loss=12.8364, acc=0.0052, iter_time=0.41s]
Epoch 0: 0%| | 92/99077 [00:41<12:36:28, 2.18it/s, loss=12.8364, acc=0.0052, iter_time=0.41s]
Epoch 0: 0%| | 92/99077 [00:42<12:36:28, 2.18it/s, loss=12.2415, acc=0.0021, iter_time=0.44s]
Epoch 0: 0%| | 93/99077 [00:42<12:21:37, 2.22it/s, loss=12.2415, acc=0.0021, iter_time=0.44s]
Epoch 0: 0%| | 93/99077 [00:42<12:21:37, 2.22it/s, loss=13.4821, acc=0.0042, iter_time=0.43s]
Epoch 0: 0%| | 94/99077 [00:42<12:10:34, 2.26it/s, loss=13.4821, acc=0.0042, iter_time=0.43s]
Epoch 0: 0%| | 94/99077 [00:42<12:10:34, 2.26it/s, loss=11.2615, acc=0.0000, iter_time=0.41s]
Epoch 0: 0%| | 95/99077 [00:42<11:55:00, 2.31it/s, loss=11.2615, acc=0.0000, iter_time=0.41s]
Epoch 0: 0%| | 95/99077 [00:43<11:55:00, 2.31it/s, loss=11.8608, acc=0.0000, iter_time=0.44s]
Epoch 0: 0%| | 96/99077 [00:43<11:53:28, 2.31it/s, loss=11.8608, acc=0.0000, iter_time=0.44s]
Epoch 0: 0%| | 96/99077 [00:43<11:53:28, 2.31it/s, loss=11.8328, acc=0.0000, iter_time=0.40s]
Epoch 0: 0%| | 97/99077 [00:43<11:50:36, 2.32it/s, loss=11.8328, acc=0.0000, iter_time=0.40s]
Epoch 0: 0%| | 97/99077 [00:44<11:50:36, 2.32it/s, loss=12.6176, acc=0.0000, iter_time=0.43s]
Epoch 0: 0%| | 98/99077 [00:44<11:49:17, 2.33it/s, loss=12.6176, acc=0.0000, iter_time=0.43s]
Epoch 0: 0%| | 98/99077 [00:44<11:49:17, 2.33it/s, loss=13.5855, acc=0.0031, iter_time=0.44s]
Epoch 0: 0%| | 99/99077 [00:44<11:48:31, 2.33it/s, loss=13.5855, acc=0.0031, iter_time=0.44s]
Epoch 0: 0%| | 99/99077 [00:45<11:48:31, 2.33it/s, loss=15.2188, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 100/99077 [00:45<11:34:22, 2.38it/s, loss=15.2188, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 100/99077 [00:45<11:34:22, 2.38it/s, loss=12.4472, acc=0.0021, iter_time=0.39s]
Epoch 0: 0%| | 101/99077 [00:45<11:40:03, 2.36it/s, loss=12.4472, acc=0.0021, iter_time=0.39s]
Epoch 0: 0%| | 101/99077 [00:45<11:40:03, 2.36it/s, loss=14.8117, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 102/99077 [00:45<11:41:44, 2.35it/s, loss=14.8117, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 102/99077 [00:46<11:41:44, 2.35it/s, loss=11.1735, acc=0.0021, iter_time=0.43s]
Epoch 0: 0%| | 103/99077 [00:46<11:41:14, 2.35it/s, loss=11.1735, acc=0.0021, iter_time=0.43s]
Epoch 0: 0%| | 103/99077 [00:46<11:41:14, 2.35it/s, loss=12.2144, acc=0.0000, iter_time=0.42s]
Epoch 0: 0%| | 104/99077 [00:46<11:44:21, 2.34it/s, loss=12.2144, acc=0.0000, iter_time=0.42s]
Epoch 0: 0%| | 104/99077 [00:47<11:44:21, 2.34it/s, loss=15.1962, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 105/99077 [00:47<11:45:57, 2.34it/s, loss=15.1962, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 105/99077 [00:47<11:45:57, 2.34it/s, loss=10.9325, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 106/99077 [00:47<11:45:25, 2.34it/s, loss=10.9325, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 106/99077 [00:48<11:45:25, 2.34it/s, loss=12.3950, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 107/99077 [00:48<11:37:35, 2.36it/s, loss=12.3950, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 107/99077 [00:48<11:37:35, 2.36it/s, loss=12.0318, acc=0.0010, iter_time=0.40s]
Epoch 0: 0%| | 108/99077 [00:48<11:39:55, 2.36it/s, loss=12.0318, acc=0.0010, iter_time=0.40s]
Epoch 0: 0%| | 108/99077 [00:48<11:39:55, 2.36it/s, loss=10.1541, acc=0.0021, iter_time=0.42s]
Epoch 0: 0%| | 109/99077 [00:48<11:36:10, 2.37it/s, loss=10.1541, acc=0.0021, iter_time=0.42s]
Epoch 0: 0%| | 109/99077 [00:49<11:36:10, 2.37it/s, loss=11.5682, acc=0.0010, iter_time=0.42s]
Epoch 0: 0%| | 110/99077 [00:49<11:37:40, 2.36it/s, loss=11.5682, acc=0.0010, iter_time=0.42s]
Epoch 0: 0%| | 110/99077 [00:49<11:37:40, 2.36it/s, loss=13.8740, acc=0.0010, iter_time=0.45s]
Epoch 0: 0%| | 111/99077 [00:49<11:40:48, 2.35it/s, loss=13.8740, acc=0.0010, iter_time=0.45s]
Epoch 0: 0%| | 111/99077 [00:50<11:40:48, 2.35it/s, loss=11.0895, acc=0.0021, iter_time=0.41s]
Epoch 0: 0%| | 112/99077 [00:50<11:41:37, 2.35it/s, loss=11.0895, acc=0.0021, iter_time=0.41s]
Epoch 0: 0%| | 112/99077 [00:50<11:41:37, 2.35it/s, loss=12.2371, acc=0.0000, iter_time=0.44s]
Epoch 0: 0%| | 113/99077 [00:50<11:43:56, 2.34it/s, loss=12.2371, acc=0.0000, iter_time=0.44s]
Epoch 0: 0%| | 113/99077 [00:51<11:43:56, 2.34it/s, loss=11.2508, acc=0.0000, iter_time=0.41s]
Epoch 0: 0%| | 114/99077 [00:51<11:46:04, 2.34it/s, loss=11.2508, acc=0.0000, iter_time=0.41s]
Epoch 0: 0%| | 114/99077 [00:51<11:46:04, 2.34it/s, loss=11.5391, acc=0.0000, iter_time=0.46s]
Epoch 0: 0%| | 115/99077 [00:51<11:47:09, 2.33it/s, loss=11.5391, acc=0.0000, iter_time=0.46s]
Epoch 0: 0%| | 115/99077 [00:52<11:47:09, 2.33it/s, loss=14.3449, acc=0.0010, iter_time=0.77s]
Epoch 0: 0%| | 116/99077 [00:52<14:38:03, 1.88it/s, loss=14.3449, acc=0.0010, iter_time=0.77s]
Epoch 0: 0%| | 116/99077 [00:52<14:38:03, 1.88it/s, loss=13.4550, acc=0.0010, iter_time=0.39s]
Epoch 0: 0%| | 117/99077 [00:52<13:37:33, 2.02it/s, loss=13.4550, acc=0.0010, iter_time=0.39s]
Epoch 0: 0%| | 117/99077 [00:53<13:37:33, 2.02it/s, loss=12.6586, acc=0.0042, iter_time=0.42s]
Epoch 0: 0%| | 118/99077 [00:53<12:59:44, 2.12it/s, loss=12.6586, acc=0.0042, iter_time=0.42s]
Epoch 0: 0%| | 118/99077 [00:53<12:59:44, 2.12it/s, loss=13.4241, acc=0.0000, iter_time=0.42s]
Epoch 0: 0%| | 119/99077 [00:53<12:34:07, 2.19it/s, loss=13.4241, acc=0.0000, iter_time=0.42s]
Epoch 0: 0%| | 119/99077 [00:53<12:34:07, 2.19it/s, loss=14.7787, acc=0.0000, iter_time=0.42s]
Epoch 0: 0%| | 120/99077 [00:53<12:10:24, 2.26it/s, loss=14.7787, acc=0.0000, iter_time=0.42s]
Epoch 0: 0%| | 120/99077 [00:54<12:10:24, 2.26it/s, loss=10.8083, acc=0.0021, iter_time=0.42s]
Epoch 0: 0%| | 121/99077 [00:54<12:01:06, 2.29it/s, loss=10.8083, acc=0.0021, iter_time=0.42s]
Epoch 0: 0%| | 121/99077 [00:54<12:01:06, 2.29it/s, loss=16.0318, acc=0.0021, iter_time=0.43s]
Epoch 0: 0%| | 122/99077 [00:54<11:58:09, 2.30it/s, loss=16.0318, acc=0.0021, iter_time=0.43s]
Epoch 0: 0%| | 122/99077 [00:55<11:58:09, 2.30it/s, loss=12.4363, acc=0.0021, iter_time=0.42s]
Epoch 0: 0%| | 123/99077 [00:55<11:56:24, 2.30it/s, loss=12.4363, acc=0.0021, iter_time=0.42s]
Epoch 0: 0%| | 123/99077 [00:55<11:56:24, 2.30it/s, loss=10.8431, acc=0.0010, iter_time=0.44s]
Epoch 0: 0%| | 124/99077 [00:55<11:53:00, 2.31it/s, loss=10.8431, acc=0.0010, iter_time=0.44s]
Epoch 0: 0%| | 124/99077 [00:56<11:53:00, 2.31it/s, loss=13.7557, acc=0.0010, iter_time=0.42s]
Epoch 0: 0%| | 125/99077 [00:56<11:45:34, 2.34it/s, loss=13.7557, acc=0.0010, iter_time=0.42s]
Epoch 0: 0%| | 125/99077 [00:56<11:45:34, 2.34it/s, loss=13.9480, acc=0.0029, iter_time=0.36s]
Epoch 0: 0%| | 126/99077 [00:56<11:45:26, 2.34it/s, loss=13.9480, acc=0.0029, iter_time=0.36s]
Epoch 0: 0%| | 126/99077 [00:56<11:45:26, 2.34it/s, loss=10.6232, acc=0.0021, iter_time=0.48s]
Epoch 0: 0%| | 127/99077 [00:56<11:36:19, 2.37it/s, loss=10.6232, acc=0.0021, iter_time=0.48s]
Epoch 0: 0%| | 127/99077 [00:57<11:36:19, 2.37it/s, loss=11.7058, acc=0.0000, iter_time=0.45s]
Epoch 0: 0%| | 128/99077 [00:57<11:42:49, 2.35it/s, loss=11.7058, acc=0.0000, iter_time=0.45s]
Epoch 0: 0%| | 128/99077 [00:57<11:42:49, 2.35it/s, loss=11.6551, acc=0.0000, iter_time=0.40s]
Epoch 0: 0%| | 129/99077 [00:57<11:35:02, 2.37it/s, loss=11.6551, acc=0.0000, iter_time=0.40s]
Epoch 0: 0%| | 129/99077 [00:58<11:35:02, 2.37it/s, loss=13.9434, acc=0.0031, iter_time=0.41s]
Epoch 0: 0%| | 130/99077 [00:58<11:37:49, 2.36it/s, loss=13.9434, acc=0.0031, iter_time=0.41s]
Epoch 0: 0%| | 130/99077 [00:58<11:37:49, 2.36it/s, loss=10.3400, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 131/99077 [00:58<11:37:56, 2.36it/s, loss=10.3400, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 131/99077 [00:58<11:37:56, 2.36it/s, loss=11.3008, acc=0.0000, iter_time=0.44s]
Epoch 0: 0%| | 132/99077 [00:58<11:42:03, 2.35it/s, loss=11.3008, acc=0.0000, iter_time=0.44s]
Epoch 0: 0%| | 132/99077 [00:59<11:42:03, 2.35it/s, loss=14.0675, acc=0.0000, iter_time=0.42s]
Epoch 0: 0%| | 133/99077 [00:59<11:41:57, 2.35it/s, loss=14.0675, acc=0.0000, iter_time=0.42s]
Epoch 0: 0%| | 133/99077 [00:59<11:41:57, 2.35it/s, loss=11.6035, acc=0.0010, iter_time=0.45s]
Epoch 0: 0%| | 134/99077 [00:59<11:43:36, 2.34it/s, loss=11.6035, acc=0.0010, iter_time=0.45s]
Epoch 0: 0%| | 134/99077 [01:00<11:43:36, 2.34it/s, loss=13.7789, acc=0.0000, iter_time=0.41s]
Epoch 0: 0%| | 135/99077 [01:00<11:45:34, 2.34it/s, loss=13.7789, acc=0.0000, iter_time=0.41s]
Epoch 0: 0%| | 135/99077 [01:00<11:45:34, 2.34it/s, loss=12.5972, acc=0.0021, iter_time=0.45s]
Epoch 0: 0%| | 136/99077 [01:00<11:45:01, 2.34it/s, loss=12.5972, acc=0.0021, iter_time=0.45s]
Epoch 0: 0%| | 136/99077 [01:01<11:45:01, 2.34it/s, loss=11.7832, acc=0.0031, iter_time=0.41s]
Epoch 0: 0%| | 137/99077 [01:01<11:47:13, 2.33it/s, loss=11.7832, acc=0.0031, iter_time=0.41s]
Epoch 0: 0%| | 137/99077 [01:01<11:47:13, 2.33it/s, loss=12.5960, acc=0.0000, iter_time=0.43s]
Epoch 0: 0%| | 138/99077 [01:01<11:37:26, 2.36it/s, loss=12.5960, acc=0.0000, iter_time=0.43s]
Epoch 0: 0%| | 138/99077 [01:01<11:37:26, 2.36it/s, loss=12.3302, acc=0.0010, iter_time=0.42s]
Epoch 0: 0%| | 139/99077 [01:01<11:40:00, 2.36it/s, loss=12.3302, acc=0.0010, iter_time=0.42s]
Epoch 0: 0%| | 139/99077 [01:02<11:40:00, 2.36it/s, loss=13.1441, acc=0.0021, iter_time=0.41s]
Epoch 0: 0%| | 140/99077 [01:02<11:41:41, 2.35it/s, loss=13.1441, acc=0.0021, iter_time=0.41s]
Epoch 0: 0%| | 140/99077 [01:02<11:41:41, 2.35it/s, loss=12.3028, acc=0.0042, iter_time=0.44s]
Epoch 0: 0%| | 141/99077 [01:02<11:40:46, 2.35it/s, loss=12.3028, acc=0.0042, iter_time=0.44s]
Epoch 0: 0%| | 141/99077 [01:03<11:40:46, 2.35it/s, loss=10.5691, acc=0.0000, iter_time=0.44s]
Epoch 0: 0%| | 142/99077 [01:03<11:43:45, 2.34it/s, loss=10.5691, acc=0.0000, iter_time=0.44s]
Epoch 0: 0%| | 142/99077 [01:04<11:43:45, 2.34it/s, loss=15.0239, acc=0.0000, iter_time=0.76s]
Epoch 0: 0%| | 143/99077 [01:04<14:43:50, 1.87it/s, loss=15.0239, acc=0.0000, iter_time=0.76s]
Epoch 0: 0%| | 143/99077 [01:04<14:43:50, 1.87it/s, loss=13.3353, acc=0.0000, iter_time=0.44s]
Epoch 0: 0%| | 144/99077 [01:04<13:50:10, 1.99it/s, loss=13.3353, acc=0.0000, iter_time=0.44s]
Epoch 0: 0%| | 144/99077 [01:04<13:50:10, 1.99it/s, loss=17.4680, acc=0.0000, iter_time=0.43s]
Epoch 0: 0%| | 145/99077 [01:04<13:12:07, 2.08it/s, loss=17.4680, acc=0.0000, iter_time=0.43s]
Epoch 0: 0%| | 145/99077 [01:05<13:12:07, 2.08it/s, loss=13.5514, acc=0.0010, iter_time=0.41s]
Epoch 0: 0%| | 146/99077 [01:05<12:38:54, 2.17it/s, loss=13.5514, acc=0.0010, iter_time=0.41s]
Epoch 0: 0%| | 146/99077 [01:05<12:38:54, 2.17it/s, loss=12.1692, acc=0.0010, iter_time=0.41s]
Epoch 0: 0%| | 147/99077 [01:05<12:07:58, 2.26it/s, loss=12.1692, acc=0.0010, iter_time=0.41s]
Epoch 0: 0%| | 147/99077 [01:06<12:07:58, 2.26it/s, loss=16.4592, acc=0.0021, iter_time=0.42s]
Epoch 0: 0%| | 148/99077 [01:06<11:56:34, 2.30it/s, loss=16.4592, acc=0.0021, iter_time=0.42s]
Epoch 0: 0%| | 148/99077 [01:06<11:56:34, 2.30it/s, loss=12.8787, acc=0.0000, iter_time=0.40s]
Epoch 0: 0%| | 149/99077 [01:06<11:54:04, 2.31it/s, loss=12.8787, acc=0.0000, iter_time=0.40s]
Epoch 0: 0%| | 149/99077 [01:06<11:54:04, 2.31it/s, loss=13.2928, acc=0.0000, iter_time=0.45s]
Epoch 0: 0%| | 150/99077 [01:06<11:37:36, 2.36it/s, loss=13.2928, acc=0.0000, iter_time=0.45s]
Epoch 0: 0%| | 150/99077 [01:07<11:37:36, 2.36it/s, loss=14.3081, acc=0.0000, iter_time=0.40s]
Epoch 0: 0%| | 151/99077 [01:07<11:41:04, 2.35it/s, loss=14.3081, acc=0.0000, iter_time=0.40s]
Epoch 0: 0%| | 151/99077 [01:07<11:41:04, 2.35it/s, loss=12.2806, acc=0.0031, iter_time=0.42s]
Epoch 0: 0%| | 152/99077 [01:07<11:44:36, 2.34it/s, loss=12.2806, acc=0.0031, iter_time=0.42s]
Epoch 0: 0%| | 152/99077 [01:08<11:44:36, 2.34it/s, loss=13.0896, acc=0.0021, iter_time=0.41s]
Epoch 0: 0%| | 153/99077 [01:08<11:37:25, 2.36it/s, loss=13.0896, acc=0.0021, iter_time=0.41s]
Epoch 0: 0%| | 153/99077 [01:08<11:37:25, 2.36it/s, loss=13.8200, acc=0.0021, iter_time=0.44s]
Epoch 0: 0%| | 154/99077 [01:08<11:40:52, 2.35it/s, loss=13.8200, acc=0.0021, iter_time=0.44s]
Epoch 0: 0%| | 154/99077 [01:09<11:40:52, 2.35it/s, loss=14.2496, acc=0.0000, iter_time=0.41s]
Epoch 0: 0%| | 155/99077 [01:09<11:32:52, 2.38it/s, loss=14.2496, acc=0.0000, iter_time=0.41s]
Epoch 0: 0%| | 155/99077 [01:09<11:32:52, 2.38it/s, loss=13.8418, acc=0.0000, iter_time=0.41s]
Epoch 0: 0%| | 156/99077 [01:09<11:32:47, 2.38it/s, loss=13.8418, acc=0.0000, iter_time=0.41s]
Epoch 0: 0%| | 156/99077 [01:09<11:32:47, 2.38it/s, loss=13.3679, acc=0.0000, iter_time=0.45s]
Epoch 0: 0%| | 157/99077 [01:09<11:38:20, 2.36it/s, loss=13.3679, acc=0.0000, iter_time=0.45s]
Epoch 0: 0%| | 157/99077 [01:10<11:38:20, 2.36it/s, loss=13.1375, acc=0.0052, iter_time=0.40s]
Epoch 0: 0%| | 158/99077 [01:10<11:38:35, 2.36it/s, loss=13.1375, acc=0.0052, iter_time=0.40s]
Epoch 0: 0%| | 158/99077 [01:10<11:38:35, 2.36it/s, loss=11.1591, acc=0.0067, iter_time=0.34s]
Epoch 0: 0%| | 159/99077 [01:10<11:40:30, 2.35it/s, loss=11.1591, acc=0.0067, iter_time=0.34s]
Epoch 0: 0%| | 159/99077 [01:11<11:40:30, 2.35it/s, loss=11.6970, acc=0.0010, iter_time=0.52s]
Epoch 0: 0%| | 160/99077 [01:11<11:43:56, 2.34it/s, loss=11.6970, acc=0.0010, iter_time=0.52s]
Epoch 0: 0%| | 160/99077 [01:11<11:43:56, 2.34it/s, loss=13.9916, acc=0.0000, iter_time=0.42s]
Epoch 0: 0%| | 161/99077 [01:11<11:42:32, 2.35it/s, loss=13.9916, acc=0.0000, iter_time=0.42s]
Epoch 0: 0%| | 161/99077 [01:12<11:42:32, 2.35it/s, loss=17.2993, acc=0.0000, iter_time=0.42s]
Epoch 0: 0%| | 162/99077 [01:12<11:32:28, 2.38it/s, loss=17.2993, acc=0.0000, iter_time=0.42s]
Epoch 0: 0%| | 162/99077 [01:12<11:32:28, 2.38it/s, loss=14.2383, acc=0.0000, iter_time=0.42s]
Epoch 0: 0%| | 163/99077 [01:12<11:38:05, 2.36it/s, loss=14.2383, acc=0.0000, iter_time=0.42s]
Epoch 0: 0%| | 163/99077 [01:12<11:38:05, 2.36it/s, loss=12.0189, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 164/99077 [01:12<11:42:02, 2.35it/s, loss=12.0189, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 164/99077 [01:13<11:42:02, 2.35it/s, loss=14.7737, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 165/99077 [01:13<11:35:07, 2.37it/s, loss=14.7737, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 165/99077 [01:13<11:35:07, 2.37it/s, loss=15.0791, acc=0.0010, iter_time=0.41s]
Epoch 0: 0%| | 166/99077 [01:13<11:39:50, 2.36it/s, loss=15.0791, acc=0.0010, iter_time=0.41s]
Epoch 0: 0%| | 166/99077 [01:14<11:39:50, 2.36it/s, loss=13.4310, acc=0.0031, iter_time=0.45s]
Epoch 0: 0%| | 167/99077 [01:14<11:43:33, 2.34it/s, loss=13.4310, acc=0.0031, iter_time=0.45s]
Epoch 0: 0%| | 167/99077 [01:14<11:43:33, 2.34it/s, loss=13.6317, acc=0.0000, iter_time=0.41s]
Epoch 0: 0%| | 168/99077 [01:14<11:35:07, 2.37it/s, loss=13.6317, acc=0.0000, iter_time=0.41s]
Epoch 0: 0%| | 168/99077 [01:15<11:35:07, 2.37it/s, loss=15.4211, acc=0.0000, iter_time=0.40s]
Epoch 0: 0%| | 169/99077 [01:15<11:38:38, 2.36it/s, loss=15.4211, acc=0.0000, iter_time=0.40s]
Epoch 0: 0%| | 169/99077 [01:15<11:38:38, 2.36it/s, loss=13.1964, acc=0.0000, iter_time=0.75s]
Epoch 0: 0%| | 170/99077 [01:15<14:36:48, 1.88it/s, loss=13.1964, acc=0.0000, iter_time=0.75s]
Epoch 0: 0%| | 170/99077 [01:16<14:36:48, 1.88it/s, loss=12.6561, acc=0.0010, iter_time=0.45s]
Epoch 0: 0%| | 171/99077 [01:16<13:31:45, 2.03it/s, loss=12.6561, acc=0.0010, iter_time=0.45s]
Epoch 0: 0%| | 171/99077 [01:16<13:31:45, 2.03it/s, loss=11.7912, acc=0.0021, iter_time=0.42s]
Epoch 0: 0%| | 172/99077 [01:16<13:00:50, 2.11it/s, loss=11.7912, acc=0.0021, iter_time=0.42s]
Epoch 0: 0%| | 172/99077 [01:17<13:00:50, 2.11it/s, loss=12.7795, acc=0.0010, iter_time=0.46s]
Epoch 0: 0%| | 173/99077 [01:17<12:39:53, 2.17it/s, loss=12.7795, acc=0.0010, iter_time=0.46s]
Epoch 0: 0%| | 173/99077 [01:17<12:39:53, 2.17it/s, loss=12.1343, acc=0.0010, iter_time=0.40s]
Epoch 0: 0%| | 174/99077 [01:17<12:14:18, 2.24it/s, loss=12.1343, acc=0.0010, iter_time=0.40s]
Epoch 0: 0%| | 174/99077 [01:17<12:14:18, 2.24it/s, loss=11.6329, acc=0.0010, iter_time=0.41s]
Epoch 0: 0%| | 175/99077 [01:17<11:51:49, 2.32it/s, loss=11.6329, acc=0.0010, iter_time=0.41s]
Epoch 0: 0%| | 175/99077 [01:18<11:51:49, 2.32it/s, loss=12.6692, acc=0.0010, iter_time=0.42s]
Epoch 0: 0%| | 176/99077 [01:18<11:49:27, 2.32it/s, loss=12.6692, acc=0.0010, iter_time=0.42s]
Epoch 0: 0%| | 176/99077 [01:18<11:49:27, 2.32it/s, loss=13.1118, acc=0.0000, iter_time=0.43s]
Epoch 0: 0%| | 177/99077 [01:18<11:50:14, 2.32it/s, loss=13.1118, acc=0.0000, iter_time=0.43s]
Epoch 0: 0%| | 177/99077 [01:19<11:50:14, 2.32it/s, loss=10.7652, acc=0.0010, iter_time=0.46s]
Epoch 0: 0%| | 178/99077 [01:19<11:51:31, 2.32it/s, loss=10.7652, acc=0.0010, iter_time=0.46s]
Epoch 0: 0%| | 178/99077 [01:19<11:51:31, 2.32it/s, loss=15.1640, acc=0.0021, iter_time=0.43s]
Epoch 0: 0%| | 179/99077 [01:19<11:50:49, 2.32it/s, loss=15.1640, acc=0.0021, iter_time=0.43s]
Epoch 0: 0%| | 179/99077 [01:20<11:50:49, 2.32it/s, loss=10.8032, acc=0.0000, iter_time=0.43s]
Epoch 0: 0%| | 180/99077 [01:20<11:50:10, 2.32it/s, loss=10.8032, acc=0.0000, iter_time=0.43s]
Epoch 0: 0%| | 180/99077 [01:20<11:50:10, 2.32it/s, loss=16.0077, acc=0.0033, iter_time=0.30s]
Epoch 0: 0%| | 181/99077 [01:20<11:35:40, 2.37it/s, loss=16.0077, acc=0.0033, iter_time=0.30s]
Epoch 0: 0%| | 181/99077 [01:20<11:35:40, 2.37it/s, loss=12.9898, acc=0.0000, iter_time=0.50s]
Epoch 0: 0%| | 182/99077 [01:20<11:34:38, 2.37it/s, loss=12.9898, acc=0.0000, iter_time=0.50s]
Epoch 0: 0%| | 182/99077 [01:21<11:34:38, 2.37it/s, loss=13.0400, acc=0.0000, iter_time=0.43s]
Epoch 0: 0%| | 183/99077 [01:21<11:28:01, 2.40it/s, loss=13.0400, acc=0.0000, iter_time=0.43s]
Epoch 0: 0%| | 183/99077 [01:21<11:28:01, 2.40it/s, loss=11.2748, acc=0.0063, iter_time=0.39s]
Epoch 0: 0%| | 184/99077 [01:21<11:23:29, 2.41it/s, loss=11.2748, acc=0.0063, iter_time=0.39s]
Epoch 0: 0%| | 184/99077 [01:22<11:23:29, 2.41it/s, loss=12.6640, acc=0.0000, iter_time=0.42s]
Epoch 0: 0%| | 185/99077 [01:22<11:27:37, 2.40it/s, loss=12.6640, acc=0.0000, iter_time=0.42s]
Epoch 0: 0%| | 185/99077 [01:22<11:27:37, 2.40it/s, loss=16.3328, acc=0.0010, iter_time=0.44s]
Epoch 0: 0%| | 186/99077 [01:22<11:35:10, 2.37it/s, loss=16.3328, acc=0.0010, iter_time=0.44s]
Epoch 0: 0%| | 186/99077 [01:22<11:35:10, 2.37it/s, loss=11.5004, acc=0.0010, iter_time=0.41s]
Epoch 0: 0%| | 187/99077 [01:22<11:38:11, 2.36it/s, loss=11.5004, acc=0.0010, iter_time=0.41s]
Epoch 0: 0%| | 187/99077 [01:23<11:38:11, 2.36it/s, loss=12.9528, acc=0.0010, iter_time=0.46s]
Epoch 0: 0%| | 188/99077 [01:23<11:41:52, 2.35it/s, loss=12.9528, acc=0.0010, iter_time=0.46s]
Epoch 0: 0%| | 188/99077 [01:23<11:41:52, 2.35it/s, loss=12.7828, acc=0.0063, iter_time=0.40s]
Epoch 0: 0%| | 189/99077 [01:23<11:38:28, 2.36it/s, loss=12.7828, acc=0.0063, iter_time=0.40s]
Epoch 0: 0%| | 189/99077 [01:24<11:38:28, 2.36it/s, loss=13.1720, acc=0.0000, iter_time=0.43s]
Epoch 0: 0%| | 190/99077 [01:24<11:43:38, 2.34it/s, loss=13.1720, acc=0.0000, iter_time=0.43s]
Epoch 0: 0%| | 190/99077 [01:24<11:43:38, 2.34it/s, loss=9.3302, acc=0.0021, iter_time=0.43s]
Epoch 0: 0%| | 191/99077 [01:24<11:31:59, 2.38it/s, loss=9.3302, acc=0.0021, iter_time=0.43s]
Epoch 0: 0%| | 191/99077 [01:25<11:31:59, 2.38it/s, loss=16.3958, acc=0.0010, iter_time=0.44s]
Epoch 0: 0%| | 192/99077 [01:25<11:38:09, 2.36it/s, loss=16.3958, acc=0.0010, iter_time=0.44s]
Epoch 0: 0%| | 192/99077 [01:25<11:38:09, 2.36it/s, loss=12.8500, acc=0.0000, iter_time=0.41s]
Epoch 0: 0%| | 193/99077 [01:25<11:41:26, 2.35it/s, loss=12.8500, acc=0.0000, iter_time=0.41s]
Epoch 0: 0%| | 193/99077 [01:25<11:41:26, 2.35it/s, loss=11.7762, acc=0.0000, iter_time=0.45s]
Epoch 0: 0%| | 194/99077 [01:25<11:44:28, 2.34it/s, loss=11.7762, acc=0.0000, iter_time=0.45s]
Epoch 0: 0%| | 194/99077 [01:26<11:44:28, 2.34it/s, loss=13.1377, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 195/99077 [01:26<11:46:40, 2.33it/s, loss=13.1377, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 195/99077 [01:26<11:46:40, 2.33it/s, loss=12.4222, acc=0.0000, iter_time=0.40s]
Epoch 0: 0%| | 196/99077 [01:26<11:45:34, 2.34it/s, loss=12.4222, acc=0.0000, iter_time=0.40s]
Epoch 0: 0%| | 196/99077 [01:27<11:45:34, 2.34it/s, loss=14.5180, acc=0.0021, iter_time=0.80s]
Epoch 0: 0%| | 197/99077 [01:27<14:44:19, 1.86it/s, loss=14.5180, acc=0.0021, iter_time=0.80s]
Epoch 0: 0%| | 197/99077 [01:27<14:44:19, 1.86it/s, loss=12.6480, acc=0.0000, iter_time=0.43s]
Epoch 0: 0%| | 198/99077 [01:27<13:44:59, 2.00it/s, loss=12.6480, acc=0.0000, iter_time=0.43s]
Epoch 0: 0%| | 198/99077 [01:28<13:44:59, 2.00it/s, loss=12.8655, acc=0.0021, iter_time=0.40s]
Epoch 0: 0%| | 199/99077 [01:28<13:10:20, 2.09it/s, loss=12.8655, acc=0.0021, iter_time=0.40s]
Epoch 0: 0%| | 199/99077 [01:28<13:10:20, 2.09it/s, loss=14.7090, acc=0.0031, iter_time=0.45s]
Epoch 0: 0%| | 200/99077 [01:28<12:30:12, 2.20it/s, loss=14.7090, acc=0.0031, iter_time=0.45s]
Epoch 0: 0%| | 200/99077 [01:29<12:30:12, 2.20it/s, loss=11.8165, acc=0.0021, iter_time=0.39s]
Epoch 0: 0%| | 201/99077 [01:29<12:18:52, 2.23it/s, loss=11.8165, acc=0.0021, iter_time=0.39s]
Epoch 0: 0%| | 201/99077 [01:29<12:18:52, 2.23it/s, loss=13.1780, acc=0.0021, iter_time=0.42s]
Epoch 0: 0%| | 202/99077 [01:29<12:04:55, 2.27it/s, loss=13.1780, acc=0.0021, iter_time=0.42s]
Epoch 0: 0%| | 202/99077 [01:30<12:04:55, 2.27it/s, loss=11.9501, acc=0.0010, iter_time=0.42s]
Epoch 0: 0%| | 203/99077 [01:30<12:00:58, 2.29it/s, loss=11.9501, acc=0.0010, iter_time=0.42s]
Epoch 0: 0%| | 203/99077 [01:30<12:00:58, 2.29it/s, loss=12.2011, acc=0.0000, iter_time=0.43s]
Epoch 0: 0%| | 204/99077 [01:30<11:52:11, 2.31it/s, loss=12.2011, acc=0.0000, iter_time=0.43s]
Epoch 0: 0%| | 204/99077 [01:30<11:52:11, 2.31it/s, loss=12.1879, acc=0.0000, iter_time=0.42s]
Epoch 0: 0%| | 205/99077 [01:30<11:49:55, 2.32it/s, loss=12.1879, acc=0.0000, iter_time=0.42s]
Epoch 0: 0%| | 205/99077 [01:31<11:49:55, 2.32it/s, loss=10.0905, acc=0.0031, iter_time=0.43s]
Epoch 0: 0%| | 206/99077 [01:31<11:50:16, 2.32it/s, loss=10.0905, acc=0.0031, iter_time=0.43s]
Epoch 0: 0%| | 206/99077 [01:31<11:50:16, 2.32it/s, loss=11.8113, acc=0.0000, iter_time=0.46s]
Epoch 0: 0%| | 207/99077 [01:31<11:50:31, 2.32it/s, loss=11.8113, acc=0.0000, iter_time=0.46s]
Epoch 0: 0%| | 207/99077 [01:32<11:50:31, 2.32it/s, loss=13.0134, acc=0.0000, iter_time=0.40s]
Epoch 0: 0%| | 208/99077 [01:32<11:52:37, 2.31it/s, loss=13.0134, acc=0.0000, iter_time=0.40s]
Epoch 0: 0%| | 208/99077 [01:32<11:52:37, 2.31it/s, loss=11.2383, acc=0.0021, iter_time=0.44s]
Epoch 0: 0%| | 209/99077 [01:32<11:51:36, 2.32it/s, loss=11.2383, acc=0.0021, iter_time=0.44s]
Epoch 0: 0%| | 209/99077 [01:33<11:51:36, 2.32it/s, loss=12.0988, acc=0.0031, iter_time=0.43s]
Epoch 0: 0%| | 210/99077 [01:33<11:41:52, 2.35it/s, loss=12.0988, acc=0.0031, iter_time=0.43s]
Epoch 0: 0%| | 210/99077 [01:33<11:41:52, 2.35it/s, loss=13.5727, acc=0.0010, iter_time=0.42s]
Epoch 0: 0%| | 211/99077 [01:33<11:36:46, 2.36it/s, loss=13.5727, acc=0.0010, iter_time=0.42s]
Epoch 0: 0%| | 211/99077 [01:33<11:36:46, 2.36it/s, loss=11.4905, acc=0.0000, iter_time=0.41s]
Epoch 0: 0%| | 212/99077 [01:33<11:31:31, 2.38it/s, loss=11.4905, acc=0.0000, iter_time=0.41s]
Epoch 0: 0%| | 212/99077 [01:34<11:31:31, 2.38it/s, loss=10.5586, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 213/99077 [01:34<11:37:02, 2.36it/s, loss=10.5586, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 213/99077 [01:34<11:37:02, 2.36it/s, loss=9.9480, acc=0.0021, iter_time=0.40s]
Epoch 0: 0%| | 214/99077 [01:34<11:40:57, 2.35it/s, loss=9.9480, acc=0.0021, iter_time=0.40s]
Epoch 0: 0%| | 214/99077 [01:35<11:40:57, 2.35it/s, loss=11.3813, acc=0.0000, iter_time=0.46s]
Epoch 0: 0%| | 215/99077 [01:35<11:43:45, 2.34it/s, loss=11.3813, acc=0.0000, iter_time=0.46s]
Epoch 0: 0%| | 215/99077 [01:35<11:43:45, 2.34it/s, loss=13.0045, acc=0.0000, iter_time=0.40s]
Epoch 0: 0%| | 216/99077 [01:35<11:45:58, 2.33it/s, loss=13.0045, acc=0.0000, iter_time=0.40s]
Epoch 0: 0%| | 216/99077 [01:36<11:45:58, 2.33it/s, loss=15.6541, acc=0.0000, iter_time=0.44s]
Epoch 0: 0%| | 217/99077 [01:36<11:46:51, 2.33it/s, loss=15.6541, acc=0.0000, iter_time=0.44s]
Epoch 0: 0%| | 217/99077 [01:36<11:46:51, 2.33it/s, loss=15.4768, acc=0.0010, iter_time=0.42s]
Epoch 0: 0%| | 218/99077 [01:36<11:47:08, 2.33it/s, loss=15.4768, acc=0.0010, iter_time=0.42s]
Epoch 0: 0%| | 218/99077 [01:36<11:47:08, 2.33it/s, loss=12.9046, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 219/99077 [01:36<11:45:15, 2.34it/s, loss=12.9046, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 219/99077 [01:37<11:45:15, 2.34it/s, loss=15.3748, acc=0.0000, iter_time=0.44s]
Epoch 0: 0%| | 220/99077 [01:37<11:46:52, 2.33it/s, loss=15.3748, acc=0.0000, iter_time=0.44s]
Epoch 0: 0%| | 220/99077 [01:37<11:46:52, 2.33it/s, loss=12.5441, acc=0.0010, iter_time=0.41s]
Epoch 0: 0%| | 221/99077 [01:37<11:41:46, 2.35it/s, loss=12.5441, acc=0.0010, iter_time=0.41s]
Epoch 0: 0%| | 221/99077 [01:38<11:41:46, 2.35it/s, loss=12.0571, acc=0.0000, iter_time=0.42s]
Epoch 0: 0%| | 222/99077 [01:38<11:31:11, 2.38it/s, loss=12.0571, acc=0.0000, iter_time=0.42s]
Epoch 0: 0%| | 222/99077 [01:38<11:31:11, 2.38it/s, loss=11.7320, acc=0.0010, iter_time=0.39s]
Epoch 0: 0%| | 223/99077 [01:38<11:25:33, 2.40it/s, loss=11.7320, acc=0.0010, iter_time=0.39s]
Epoch 0: 0%| | 223/99077 [01:39<11:25:33, 2.40it/s, loss=9.8993, acc=0.0021, iter_time=0.73s]
Epoch 0: 0%| | 224/99077 [01:39<14:16:09, 1.92it/s, loss=9.8993, acc=0.0021, iter_time=0.73s]
Epoch 0: 0%| | 224/99077 [01:39<14:16:09, 1.92it/s, loss=14.1583, acc=0.0010, iter_time=0.46s]
Epoch 0: 0%| | 225/99077 [01:39<13:23:27, 2.05it/s, loss=14.1583, acc=0.0010, iter_time=0.46s]
Epoch 0: 0%| | 225/99077 [01:40<13:23:27, 2.05it/s, loss=12.6046, acc=0.0021, iter_time=0.41s]
Epoch 0: 0%| | 226/99077 [01:40<12:54:41, 2.13it/s, loss=12.6046, acc=0.0021, iter_time=0.41s]
Epoch 0: 0%| | 226/99077 [01:40<12:54:41, 2.13it/s, loss=12.3423, acc=0.0021, iter_time=0.42s]
Epoch 0: 0%| | 227/99077 [01:40<12:35:44, 2.18it/s, loss=12.3423, acc=0.0021, iter_time=0.42s]
Epoch 0: 0%| | 227/99077 [01:41<12:35:44, 2.18it/s, loss=12.0200, acc=0.0010, iter_time=0.46s]
Epoch 0: 0%| | 228/99077 [01:41<12:22:01, 2.22it/s, loss=12.0200, acc=0.0010, iter_time=0.46s]
Epoch 0: 0%| | 228/99077 [01:41<12:22:01, 2.22it/s, loss=11.8680, acc=0.0010, iter_time=0.41s]
Epoch 0: 0%| | 229/99077 [01:41<12:09:54, 2.26it/s, loss=11.8680, acc=0.0010, iter_time=0.41s]
Epoch 0: 0%| | 229/99077 [01:41<12:09:54, 2.26it/s, loss=13.3599, acc=0.0000, iter_time=0.45s]
Epoch 0: 0%| | 230/99077 [01:41<12:03:15, 2.28it/s, loss=13.3599, acc=0.0000, iter_time=0.45s]
Epoch 0: 0%| | 230/99077 [01:42<12:03:15, 2.28it/s, loss=12.1727, acc=0.0010, iter_time=0.40s]
Epoch 0: 0%| | 231/99077 [01:42<11:53:36, 2.31it/s, loss=12.1727, acc=0.0010, iter_time=0.40s]
Epoch 0: 0%| | 231/99077 [01:42<11:53:36, 2.31it/s, loss=11.1910, acc=0.0000, iter_time=0.42s]
Epoch 0: 0%| | 232/99077 [01:42<11:52:52, 2.31it/s, loss=11.1910, acc=0.0000, iter_time=0.42s]
Epoch 0: 0%| | 232/99077 [01:43<11:52:52, 2.31it/s, loss=11.2822, acc=0.0010, iter_time=0.42s]
Epoch 0: 0%| | 233/99077 [01:43<11:52:52, 2.31it/s, loss=11.2822, acc=0.0010, iter_time=0.42s]
Epoch 0: 0%| | 233/99077 [01:43<11:52:52, 2.31it/s, loss=10.8063, acc=0.0010, iter_time=0.45s]
Epoch 0: 0%| | 234/99077 [01:43<11:49:35, 2.32it/s, loss=10.8063, acc=0.0010, iter_time=0.45s]
Epoch 0: 0%| | 234/99077 [01:44<11:49:35, 2.32it/s, loss=11.3968, acc=0.0000, iter_time=0.41s]
Epoch 0: 0%| | 235/99077 [01:44<11:46:52, 2.33it/s, loss=11.3968, acc=0.0000, iter_time=0.41s]
Epoch 0: 0%| | 235/99077 [01:44<11:46:52, 2.33it/s, loss=11.8453, acc=0.0000, iter_time=0.44s]
Epoch 0: 0%| | 236/99077 [01:44<11:45:47, 2.33it/s, loss=11.8453, acc=0.0000, iter_time=0.44s]
Epoch 0: 0%| | 236/99077 [01:44<11:45:47, 2.33it/s, loss=12.4428, acc=0.0010, iter_time=0.44s]
Epoch 0: 0%| | 237/99077 [01:44<11:46:55, 2.33it/s, loss=12.4428, acc=0.0010, iter_time=0.44s]
Epoch 0: 0%| | 237/99077 [01:45<11:46:55, 2.33it/s, loss=15.3881, acc=0.0000, iter_time=0.40s]
Epoch 0: 0%| | 238/99077 [01:45<11:35:22, 2.37it/s, loss=15.3881, acc=0.0000, iter_time=0.40s]
Epoch 0: 0%| | 238/99077 [01:45<11:35:22, 2.37it/s, loss=11.9211, acc=0.0021, iter_time=0.44s]
Epoch 0: 0%| | 239/99077 [01:45<11:37:22, 2.36it/s, loss=11.9211, acc=0.0021, iter_time=0.44s]
Epoch 0: 0%| | 239/99077 [01:46<11:37:22, 2.36it/s, loss=13.8449, acc=0.0010, iter_time=0.41s]
Epoch 0: 0%| | 240/99077 [01:46<11:39:53, 2.35it/s, loss=13.8449, acc=0.0010, iter_time=0.41s]
Epoch 0: 0%| | 240/99077 [01:46<11:39:53, 2.35it/s, loss=14.1646, acc=0.0021, iter_time=0.43s]
Epoch 0: 0%| | 241/99077 [01:46<11:42:07, 2.35it/s, loss=14.1646, acc=0.0021, iter_time=0.43s]
Epoch 0: 0%| | 241/99077 [01:47<11:42:07, 2.35it/s, loss=11.5674, acc=0.0000, iter_time=0.45s]
Epoch 0: 0%| | 242/99077 [01:47<11:45:05, 2.34it/s, loss=11.5674, acc=0.0000, iter_time=0.45s]
Epoch 0: 0%| | 242/99077 [01:47<11:45:05, 2.34it/s, loss=11.0313, acc=0.0000, iter_time=0.43s]
Epoch 0: 0%| | 243/99077 [01:47<11:46:36, 2.33it/s, loss=11.0313, acc=0.0000, iter_time=0.43s]
Epoch 0: 0%| | 243/99077 [01:47<11:46:36, 2.33it/s, loss=9.0890, acc=0.0010, iter_time=0.40s]
Epoch 0: 0%| | 244/99077 [01:47<11:47:27, 2.33it/s, loss=9.0890, acc=0.0010, iter_time=0.40s]
Epoch 0: 0%| | 244/99077 [01:48<11:47:27, 2.33it/s, loss=12.4938, acc=0.0021, iter_time=0.45s]
Epoch 0: 0%| | 245/99077 [01:48<11:40:25, 2.35it/s, loss=12.4938, acc=0.0021, iter_time=0.45s]
Epoch 0: 0%| | 245/99077 [01:48<11:40:25, 2.35it/s, loss=11.9112, acc=0.0021, iter_time=0.40s]
Epoch 0: 0%| | 246/99077 [01:48<11:28:51, 2.39it/s, loss=11.9112, acc=0.0021, iter_time=0.40s]
Epoch 0: 0%| | 246/99077 [01:49<11:28:51, 2.39it/s, loss=16.1924, acc=0.0032, iter_time=0.42s]
Epoch 0: 0%| | 247/99077 [01:49<11:35:10, 2.37it/s, loss=16.1924, acc=0.0032, iter_time=0.42s]
Epoch 0: 0%| | 247/99077 [01:49<11:35:10, 2.37it/s, loss=12.1205, acc=0.0031, iter_time=0.42s]
Epoch 0: 0%| | 248/99077 [01:49<11:39:39, 2.35it/s, loss=12.1205, acc=0.0031, iter_time=0.42s]
Epoch 0: 0%| | 248/99077 [01:50<11:39:39, 2.35it/s, loss=13.1931, acc=0.0000, iter_time=0.43s]
Epoch 0: 0%| | 249/99077 [01:50<11:41:33, 2.35it/s, loss=13.1931, acc=0.0000, iter_time=0.43s]
Epoch 0: 0%| | 249/99077 [01:50<11:41:33, 2.35it/s, loss=15.0664, acc=0.0000, iter_time=0.47s]
Epoch 0: 0%| | 250/99077 [01:50<11:43:55, 2.34it/s, loss=15.0664, acc=0.0000, iter_time=0.47s]
Epoch 0: 0%| | 250/99077 [01:51<11:43:55, 2.34it/s, loss=11.8584, acc=0.0000, iter_time=0.72s]
Epoch 0: 0%| | 251/99077 [01:51<14:46:35, 1.86it/s, loss=11.8584, acc=0.0000, iter_time=0.72s]
Epoch 0: 0%| | 251/99077 [01:51<14:46:35, 1.86it/s, loss=14.6666, acc=0.0000, iter_time=0.48s]
Epoch 0: 0%| | 252/99077 [01:51<13:52:45, 1.98it/s, loss=14.6666, acc=0.0000, iter_time=0.48s]
Epoch 0: 0%| | 252/99077 [01:52<13:52:45, 1.98it/s, loss=13.1931, acc=0.0000, iter_time=0.44s]
Epoch 0: 0%| | 253/99077 [01:52<13:16:14, 2.07it/s, loss=13.1931, acc=0.0000, iter_time=0.44s]
Epoch 0: 0%| | 253/99077 [01:52<13:16:14, 2.07it/s, loss=13.5653, acc=0.0010, iter_time=0.40s]
Epoch 0: 0%| | 254/99077 [01:52<12:44:19, 2.15it/s, loss=13.5653, acc=0.0010, iter_time=0.40s]
Epoch 0: 0%| | 254/99077 [01:52<12:44:19, 2.15it/s, loss=11.4822, acc=0.0010, iter_time=0.42s]
Epoch 0: 0%| | 255/99077 [01:52<12:27:16, 2.20it/s, loss=11.4822, acc=0.0010, iter_time=0.42s]
Epoch 0: 0%| | 255/99077 [01:53<12:27:16, 2.20it/s, loss=13.8277, acc=0.0021, iter_time=0.45s]
Epoch 0: 0%| | 256/99077 [01:53<12:13:23, 2.25it/s, loss=13.8277, acc=0.0021, iter_time=0.45s]
Epoch 0: 0%| | 256/99077 [01:53<12:13:23, 2.25it/s, loss=14.6724, acc=0.0000, iter_time=0.39s]
Epoch 0: 0%| | 257/99077 [01:53<12:05:36, 2.27it/s, loss=14.6724, acc=0.0000, iter_time=0.39s]
Epoch 0: 0%| | 257/99077 [01:54<12:05:36, 2.27it/s, loss=10.5941, acc=0.0000, iter_time=0.44s]
Epoch 0: 0%| | 258/99077 [01:54<11:59:28, 2.29it/s, loss=10.5941, acc=0.0000, iter_time=0.44s]
Epoch 0: 0%| | 258/99077 [01:54<11:59:28, 2.29it/s, loss=12.1260, acc=0.0000, iter_time=0.45s]
Epoch 0: 0%| | 259/99077 [01:54<11:56:10, 2.30it/s, loss=12.1260, acc=0.0000, iter_time=0.45s]
Epoch 0: 0%| | 259/99077 [01:55<11:56:10, 2.30it/s, loss=13.5369, acc=0.0000, iter_time=0.42s]
Epoch 0: 0%| | 260/99077 [01:55<11:53:49, 2.31it/s, loss=13.5369, acc=0.0000, iter_time=0.42s]
Epoch 0: 0%| | 260/99077 [01:55<11:53:49, 2.31it/s, loss=11.4667, acc=0.0000, iter_time=0.42s]
Epoch 0: 0%| | 261/99077 [01:55<11:41:33, 2.35it/s, loss=11.4667, acc=0.0000, iter_time=0.42s]
Epoch 0: 0%| | 261/99077 [01:55<11:41:33, 2.35it/s, loss=12.5131, acc=0.0010, iter_time=0.42s]
Epoch 0: 0%| | 262/99077 [01:55<11:44:32, 2.34it/s, loss=12.5131, acc=0.0010, iter_time=0.42s]
Epoch 0: 0%| | 262/99077 [01:56<11:44:32, 2.34it/s, loss=12.6439, acc=0.0000, iter_time=0.43s]
Epoch 0: 0%| | 263/99077 [01:56<11:39:36, 2.35it/s, loss=12.6439, acc=0.0000, iter_time=0.43s]
Epoch 0: 0%| | 263/99077 [01:56<11:39:36, 2.35it/s, loss=13.4355, acc=0.0000, iter_time=0.41s]
Epoch 0: 0%| | 264/99077 [01:56<11:31:43, 2.38it/s, loss=13.4355, acc=0.0000, iter_time=0.41s]
Epoch 0: 0%| | 264/99077 [01:57<11:31:43, 2.38it/s, loss=13.1517, acc=0.0010, iter_time=0.42s]
Epoch 0: 0%| | 265/99077 [01:57<11:37:34, 2.36it/s, loss=13.1517, acc=0.0010, iter_time=0.42s]
Epoch 0: 0%| | 265/99077 [01:57<11:37:34, 2.36it/s, loss=11.9796, acc=0.0000, iter_time=0.45s]
Epoch 0: 0%| | 266/99077 [01:57<11:41:18, 2.35it/s, loss=11.9796, acc=0.0000, iter_time=0.45s]
Epoch 0: 0%| | 266/99077 [01:58<11:41:18, 2.35it/s, loss=11.9453, acc=0.0000, iter_time=0.40s]
Epoch 0: 0%| | 267/99077 [01:58<11:45:04, 2.34it/s, loss=11.9453, acc=0.0000, iter_time=0.40s]
Epoch 0: 0%| | 267/99077 [01:58<11:45:04, 2.34it/s, loss=12.4259, acc=0.0010, iter_time=0.46s]
Epoch 0: 0%| | 268/99077 [01:58<11:46:18, 2.33it/s, loss=12.4259, acc=0.0010, iter_time=0.46s]
Epoch 0: 0%| | 268/99077 [01:58<11:46:18, 2.33it/s, loss=12.9401, acc=0.0021, iter_time=0.40s]
Epoch 0: 0%| | 269/99077 [01:58<11:34:03, 2.37it/s, loss=12.9401, acc=0.0021, iter_time=0.40s]
Epoch 0: 0%| | 269/99077 [01:59<11:34:03, 2.37it/s, loss=14.1790, acc=0.0010, iter_time=0.41s]
Epoch 0: 0%| | 270/99077 [01:59<11:26:23, 2.40it/s, loss=14.1790, acc=0.0010, iter_time=0.41s]
Epoch 0: 0%| | 270/99077 [01:59<11:26:23, 2.40it/s, loss=12.3884, acc=0.0000, iter_time=0.39s]
Epoch 0: 0%| | 271/99077 [01:59<11:16:09, 2.44it/s, loss=12.3884, acc=0.0000, iter_time=0.39s]
Epoch 0: 0%| | 271/99077 [02:00<11:16:09, 2.44it/s, loss=12.1609, acc=0.0000, iter_time=0.41s]
Epoch 0: 0%| | 272/99077 [02:00<11:22:31, 2.41it/s, loss=12.1609, acc=0.0000, iter_time=0.41s]
Epoch 0: 0%| | 272/99077 [02:00<11:22:31, 2.41it/s, loss=17.5727, acc=0.0000, iter_time=0.45s]
Epoch 0: 0%| | 273/99077 [02:00<11:28:57, 2.39it/s, loss=17.5727, acc=0.0000, iter_time=0.45s]
Epoch 0: 0%| | 273/99077 [02:00<11:28:57, 2.39it/s, loss=10.8771, acc=0.0010, iter_time=0.41s]
Epoch 0: 0%| | 274/99077 [02:00<11:33:51, 2.37it/s, loss=10.8771, acc=0.0010, iter_time=0.41s]
Epoch 0: 0%| | 274/99077 [02:01<11:33:51, 2.37it/s, loss=12.4583, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 275/99077 [02:01<11:36:03, 2.37it/s, loss=12.4583, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 275/99077 [02:01<11:36:03, 2.37it/s, loss=11.1853, acc=0.0000, iter_time=0.44s]
Epoch 0: 0%| | 276/99077 [02:01<11:39:03, 2.36it/s, loss=11.1853, acc=0.0000, iter_time=0.44s]
Epoch 0: 0%| | 276/99077 [02:02<11:39:03, 2.36it/s, loss=12.0613, acc=0.0000, iter_time=0.75s]
Epoch 0: 0%| | 277/99077 [02:02<14:41:25, 1.87it/s, loss=12.0613, acc=0.0000, iter_time=0.75s]
Epoch 0: 0%| | 277/99077 [02:03<14:41:25, 1.87it/s, loss=13.4157, acc=0.0010, iter_time=0.46s]
Epoch 0: 0%| | 278/99077 [02:03<13:50:22, 1.98it/s, loss=13.4157, acc=0.0010, iter_time=0.46s]
Epoch 0: 0%| | 278/99077 [02:03<13:50:22, 1.98it/s, loss=14.9592, acc=0.0010, iter_time=0.44s]
Epoch 0: 0%| | 279/99077 [02:03<13:11:34, 2.08it/s, loss=14.9592, acc=0.0010, iter_time=0.44s]
Epoch 0: 0%| | 279/99077 [02:03<13:11:34, 2.08it/s, loss=11.5899, acc=0.0010, iter_time=0.42s]
Epoch 0: 0%| | 280/99077 [02:03<12:42:28, 2.16it/s, loss=11.5899, acc=0.0010, iter_time=0.42s]
Epoch 0: 0%| | 280/99077 [02:04<12:42:28, 2.16it/s, loss=10.8112, acc=0.0021, iter_time=0.43s]
Epoch 0: 0%| | 281/99077 [02:04<12:19:59, 2.23it/s, loss=10.8112, acc=0.0021, iter_time=0.43s]
Epoch 0: 0%| | 281/99077 [02:04<12:19:59, 2.23it/s, loss=10.6341, acc=0.0000, iter_time=0.41s]
Epoch 0: 0%| | 282/99077 [02:04<12:09:49, 2.26it/s, loss=10.6341, acc=0.0000, iter_time=0.41s]
Epoch 0: 0%| | 282/99077 [02:05<12:09:49, 2.26it/s, loss=10.8727, acc=0.0000, iter_time=0.44s]
Epoch 0: 0%| | 283/99077 [02:05<12:02:34, 2.28it/s, loss=10.8727, acc=0.0000, iter_time=0.44s]
Epoch 0: 0%| | 283/99077 [02:05<12:02:34, 2.28it/s, loss=12.4612, acc=0.0021, iter_time=0.43s]
Epoch 0: 0%| | 284/99077 [02:05<11:57:15, 2.30it/s, loss=12.4612, acc=0.0021, iter_time=0.43s]
Epoch 0: 0%| | 284/99077 [02:06<11:57:15, 2.30it/s, loss=10.4729, acc=0.0010, iter_time=0.45s]
Epoch 0: 0%| | 285/99077 [02:06<11:55:26, 2.30it/s, loss=10.4729, acc=0.0010, iter_time=0.45s]
Epoch 0: 0%| | 285/99077 [02:06<11:55:26, 2.30it/s, loss=13.9179, acc=0.0012, iter_time=0.36s]
Epoch 0: 0%| | 286/99077 [02:06<11:51:44, 2.31it/s, loss=13.9179, acc=0.0012, iter_time=0.36s]
Epoch 0: 0%| | 286/99077 [02:06<11:51:44, 2.31it/s, loss=12.7594, acc=0.0010, iter_time=0.49s]
Epoch 0: 0%| | 287/99077 [02:06<11:50:41, 2.32it/s, loss=12.7594, acc=0.0010, iter_time=0.49s]
Epoch 0: 0%| | 287/99077 [02:07<11:50:41, 2.32it/s, loss=16.1911, acc=0.0000, iter_time=0.42s]
Epoch 0: 0%| | 288/99077 [02:07<11:50:04, 2.32it/s, loss=16.1911, acc=0.0000, iter_time=0.42s]
Epoch 0: 0%| | 288/99077 [02:07<11:50:04, 2.32it/s, loss=15.4104, acc=0.0000, iter_time=0.43s]
Epoch 0: 0%| | 289/99077 [02:07<11:47:31, 2.33it/s, loss=15.4104, acc=0.0000, iter_time=0.43s]
Epoch 0: 0%| | 289/99077 [02:08<11:47:31, 2.33it/s, loss=12.1436, acc=0.0000, iter_time=0.42s]
Epoch 0: 0%| | 290/99077 [02:08<11:41:38, 2.35it/s, loss=12.1436, acc=0.0000, iter_time=0.42s]
Epoch 0: 0%| | 290/99077 [02:08<11:41:38, 2.35it/s, loss=14.3671, acc=0.0000, iter_time=0.43s]
Epoch 0: 0%| | 291/99077 [02:08<11:40:44, 2.35it/s, loss=14.3671, acc=0.0000, iter_time=0.43s]
Epoch 0: 0%| | 291/99077 [02:09<11:40:44, 2.35it/s, loss=12.3109, acc=0.0010, iter_time=0.44s]
Epoch 0: 0%| | 292/99077 [02:09<11:43:44, 2.34it/s, loss=12.3109, acc=0.0010, iter_time=0.44s]
Epoch 0: 0%| | 292/99077 [02:09<11:43:44, 2.34it/s, loss=12.1134, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 293/99077 [02:09<11:46:10, 2.33it/s, loss=12.1134, acc=0.0010, iter_time=0.43s]
Epoch 0: 0%| | 293/99077 [02:09<11:46:10, 2.33it/s, loss=11.0256, acc=0.0021, iter_time=0.40s]
Epoch 0: 0%| | 294/99077 [02:09<11:45:12, 2.33it/s, loss=11.0256, acc=0.0021, iter_time=0.40s]
Epoch 0: 0%| | 294/99077 [02:10<11:45:12, 2.33it/s, loss=14.4205, acc=0.0010, iter_time=0.46s]
Epoch 0: 0%| | 295/99077 [02:10<11:47:10, 2.33it/s, loss=14.4205, acc=0.0010, iter_time=0.46s]
Epoch 0: 0%| | 295/99077 [02:10<11:47:10, 2.33it/s, loss=12.9786, acc=0.0010, iter_time=0.41s]
Epoch 0: 0%| | 296/99077 [02:10<11:46:36, 2.33it/s, loss=12.9786, acc=0.0010, iter_time=0.41s]
Epoch 0: 0%| | 296/99077 [02:11<11:46:36, 2.33it/s, loss=12.5237, acc=0.0021, iter_time=0.42s]
Epoch 0: 0%| | 297/99077 [02:11<11:47:22, 2.33it/s, loss=12.5237, acc=0.0021, iter_time=0.42s]
Epoch 0: 0%| | 297/99077 [02:11<11:47:22, 2.33it/s, loss=13.2488, acc=0.0010, iter_time=0.41s]
Epoch 0: 0%| | 298/99077 [02:11<11:38:51, 2.36it/s, loss=13.2488, acc=0.0010, iter_time=0.41s]
Epoch 0: 0%| | 298/99077 [02:12<11:38:51, 2.36it/s, loss=12.5601, acc=0.0031, iter_time=0.43s]
Epoch 0: 0%| | 299/99077 [02:12<11:40:56, 2.35it/s, loss=12.5601, acc=0.0031, iter_time=0.43s]
Epoch 0: 0%| | 299/99077 [02:12<12:11:02, 2.25it/s, loss=12.5601, acc=0.0031, iter_time=0.43s]
diff --git a/syxin_old/train_run.log b/syxin_old/train_run.log
new file mode 100644
index 0000000000000000000000000000000000000000..875217bbad77b589cbfd698897475d36eec01817
--- /dev/null
+++ b/syxin_old/train_run.log
@@ -0,0 +1,160 @@
+nohup: ignoring input
+
+*****************************************
+Setting OMP_NUM_THREADS environment variable for each process to be 1 in default, to avoid your system being overloaded, please further tune the variable for optimal performance in your application as needed.
+*****************************************
+Set TORCH_CUDA_ARCH_LIST to 9.0
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+Set TORCH_CUDA_ARCH_LIST to 9.0
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+Set TORCH_CUDA_ARCH_LIST to 9.0
+Set TORCH_CUDA_ARCH_LIST to 9.0
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+Set TORCH_CUDA_ARCH_LIST to 9.0
+Set TORCH_CUDA_ARCH_LIST to 9.0
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+Set TORCH_CUDA_ARCH_LIST to 9.0
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+Set TORCH_CUDA_ARCH_LIST to 9.0
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+`torch_dtype` is deprecated! Use `dtype` instead!
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]`torch_dtype` is deprecated! Use `dtype` instead!
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]`torch_dtype` is deprecated! Use `dtype` instead!
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+`torch_dtype` is deprecated! Use `dtype` instead!
+`torch_dtype` is deprecated! Use `dtype` instead!
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+`torch_dtype` is deprecated! Use `dtype` instead!
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+`torch_dtype` is deprecated! Use `dtype` instead!
+`torch_dtype` is deprecated! Use `dtype` instead!
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:09, 2.45s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:10, 2.52s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:11, 2.75s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:10, 2.53s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:10, 2.63s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:10, 2.63s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:10, 2.63s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:10, 2.65s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:04<00:07, 2.38s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:04<00:07, 2.45s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:04<00:07, 2.42s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:04<00:07, 2.47s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:04<00:07, 2.47s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:04<00:07, 2.47s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:07, 2.64s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:08, 2.68s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:06<00:04, 2.23s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:07<00:04, 2.33s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:07<00:04, 2.30s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:07<00:04, 2.33s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:07<00:04, 2.33s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:07<00:04, 2.33s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:07<00:04, 2.47s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:07<00:05, 2.58s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:08<00:01, 1.98s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:08<00:00, 1.47s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:08<00:00, 1.80s/it]
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 136.65it/s]
+
Loading checkpoint shards: 80%|████████ | 4/5 [00:08<00:02, 2.13s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:08<00:02, 2.15s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:09<00:02, 2.20s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:09<00:02, 2.18s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:09<00:02, 2.19s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:09<00:02, 2.22s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:09<00:00, 1.61s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:09<00:00, 1.92s/it]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:09<00:00, 1.62s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:09<00:00, 1.94s/it]
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 138.25it/s]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 134.12it/s]
+
Loading checkpoint shards: 80%|████████ | 4/5 [00:09<00:02, 2.32s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:09<00:00, 1.66s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:09<00:00, 1.97s/it]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 1.68s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 2.03s/it]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:09<00:00, 1.67s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:09<00:00, 1.67s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:09<00:00, 1.98s/it]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:09<00:00, 1.97s/it]
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 136.77it/s]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 135.96it/s]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 140.11it/s]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 134.90it/s]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 1.72s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 2.08s/it]
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 138.84it/s]
+trainable params: 30,670,848 || all params: 8,221,406,208 || trainable%: 0.3731
+
Generating train split: 0%| | 0/818627 [00:00, ? examples/s]
Generating train split: 3%|▎ | 21099/818627 [00:00<00:26, 30030.49 examples/s]
Generating train split: 5%|▌ | 42198/818627 [00:01<00:17, 43755.10 examples/s]
Generating train split: 8%|▊ | 63297/818627 [00:01<00:15, 49769.91 examples/s]
Generating train split: 10%|█ | 84396/818627 [00:01<00:12, 59025.10 examples/s]trainable params: 30,670,848 || all params: 8,221,406,208 || trainable%: 0.3731
+
Generating train split: 15%|█▌ | 123428/818627 [00:02<00:13, 52187.41 examples/s]
Generating train split: 18%|█▊ | 144527/818627 [00:02<00:12, 54845.71 examples/s]trainable params: 30,670,848 || all params: 8,221,406,208 || trainable%: 0.3731
+trainable params: 30,670,848 || all params: 8,221,406,208 || trainable%: 0.3731
+trainable params: 30,670,848 || all params: 8,221,406,208 || trainable%: 0.3731
+trainable params: 30,670,848 || all params: 8,221,406,208 || trainable%: 0.3731
+
Generating train split: 20%|██ | 165626/818627 [00:03<00:11, 56976.82 examples/s]trainable params: 30,670,848 || all params: 8,221,406,208 || trainable%: 0.3731
+
Generating train split: 23%|██▎ | 186725/818627 [00:03<00:09, 63670.22 examples/s]trainable params: 30,670,848 || all params: 8,221,406,208 || trainable%: 0.3731
+
Generating train split: 28%|██▊ | 225757/818627 [00:04<00:10, 55873.15 examples/s]
Generating train split: 30%|███ | 246856/818627 [00:04<00:09, 58534.11 examples/s]
Generating train split: 33%|███▎ | 267955/818627 [00:04<00:09, 61059.60 examples/s]
Generating train split: 35%|███▌ | 289054/818627 [00:05<00:07, 66219.69 examples/s]
Generating train split: 40%|████ | 328086/818627 [00:05<00:08, 56094.39 examples/s]
Generating train split: 43%|████▎ | 349185/818627 [00:06<00:07, 59947.84 examples/s]
Generating train split: 45%|████▌ | 370284/818627 [00:06<00:06, 64154.00 examples/s]
Generating train split: 48%|████▊ | 391383/818627 [00:06<00:06, 71038.98 examples/s]
Generating train split: 53%|█████▎ | 430414/818627 [00:07<00:06, 57855.95 examples/s]
Generating train split: 55%|█████▌ | 451513/818627 [00:07<00:05, 63594.79 examples/s]
Generating train split: 58%|█████▊ | 472612/818627 [00:08<00:05, 63903.25 examples/s]
Generating train split: 60%|██████ | 493711/818627 [00:08<00:04, 70582.68 examples/s]
Generating train split: 65%|██████▌ | 532742/818627 [00:09<00:04, 60344.18 examples/s]
Generating train split: 68%|██████▊ | 553841/818627 [00:09<00:04, 62926.09 examples/s]
Generating train split: 70%|███████ | 574940/818627 [00:09<00:03, 63850.58 examples/s]
Generating train split: 73%|███████▎ | 596039/818627 [00:09<00:03, 71040.78 examples/s]
Generating train split: 78%|███████▊ | 635070/818627 [00:10<00:03, 60401.73 examples/s]
Generating train split: 80%|████████ | 656169/818627 [00:10<00:02, 63395.22 examples/s]
Generating train split: 83%|████████▎ | 677268/818627 [00:11<00:02, 63964.74 examples/s]
Generating train split: 85%|████████▌ | 698367/818627 [00:11<00:01, 71087.78 examples/s]
Generating train split: 90%|█████████ | 737398/818627 [00:12<00:01, 58668.28 examples/s]
Generating train split: 93%|█████████▎| 758497/818627 [00:12<00:00, 61436.57 examples/s]
Generating train split: 95%|█████████▌| 779596/818627 [00:12<00:00, 65323.89 examples/s]
Generating train split: 98%|█████████▊| 800695/818627 [00:13<00:00, 72488.34 examples/s]
Generating train split: 100%|██████████| 818627/818627 [00:13<00:00, 62459.97 examples/s]
+dataset is cached at /tmp/specforge_cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkl
+
Map (num_proc=16): 0%| | 0/818627 [00:00, ? examples/s]/workspace/hanrui/syxin_old/Specforge/specforge/data/parse.py:84: UserWarning: The first message is from system, we will use the system prompt from the data and ignore the system prompt from the template
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/data/parse.py:84: UserWarning: The first message is from system, we will use the system prompt from the data and ignore the system prompt from the template
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/data/parse.py:84: UserWarning: The first message is from system, we will use the system prompt from the data and ignore the system prompt from the template
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/data/parse.py:84: UserWarning: The first message is from system, we will use the system prompt from the data and ignore the system prompt from the template
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/data/parse.py:84: UserWarning: The first message is from system, we will use the system prompt from the data and ignore the system prompt from the template
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/data/parse.py:84: UserWarning: The first message is from system, we will use the system prompt from the data and ignore the system prompt from the template
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/data/parse.py:84: UserWarning: The first message is from system, we will use the system prompt from the data and ignore the system prompt from the template
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/data/parse.py:84: UserWarning: The first message is from system, we will use the system prompt from the data and ignore the system prompt from the template
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/data/parse.py:84: UserWarning: The first message is from system, we will use the system prompt from the data and ignore the system prompt from the template
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/data/parse.py:84: UserWarning: The first message is from system, we will use the system prompt from the data and ignore the system prompt from the template
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/data/parse.py:84: UserWarning: The first message is from system, we will use the system prompt from the data and ignore the system prompt from the template
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/data/parse.py:84: UserWarning: The first message is from system, we will use the system prompt from the data and ignore the system prompt from the template
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/data/parse.py:84: UserWarning: The first message is from system, we will use the system prompt from the data and ignore the system prompt from the template
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/data/parse.py:84: UserWarning: The first message is from system, we will use the system prompt from the data and ignore the system prompt from the template
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/data/parse.py:84: UserWarning: The first message is from system, we will use the system prompt from the data and ignore the system prompt from the template
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/data/parse.py:84: UserWarning: The first message is from system, we will use the system prompt from the data and ignore the system prompt from the template
+ warnings.warn(
+
Map (num_proc=16): 0%| | 1000/818627 [00:14<3:22:32, 67.28 examples/s]
Map (num_proc=16): 0%| | 3000/818627 [00:15<56:50, 239.17 examples/s]
Map (num_proc=16): 0%| | 4000/818627 [00:16<39:27, 344.09 examples/s]
Map (num_proc=16): 1%| | 6000/818627 [00:16<20:12, 670.38 examples/s]
Map (num_proc=16): 1%| | 7000/818627 [00:16<15:26, 875.68 examples/s]
Map (num_proc=16): 1%| | 8000/818627 [00:16<11:45, 1149.73 examples/s]
Map (num_proc=16): 1%| | 9000/818627 [00:16<09:12, 1465.91 examples/s]
Map (num_proc=16): 1%|▏ | 12000/818627 [00:17<04:33, 2954.26 examples/s]
Map (num_proc=16): 2%|▏ | 14000/818627 [00:17<03:57, 3384.29 examples/s]
Map (num_proc=16): 2%|▏ | 15000/818627 [00:17<03:58, 3373.13 examples/s]
Map (num_proc=16): 2%|▏ | 16000/818627 [00:20<10:04, 1326.98 examples/s]
Map (num_proc=16): 2%|▏ | 17000/818627 [00:29<36:21, 367.47 examples/s]
Map (num_proc=16): 2%|▏ | 18000/818627 [00:29<29:25, 453.40 examples/s]
Map (num_proc=16): 2%|▏ | 19000/818627 [00:30<22:57, 580.50 examples/s]
Map (num_proc=16): 2%|▏ | 20000/818627 [00:30<18:10, 732.18 examples/s]
Map (num_proc=16): 3%|▎ | 21000/818627 [00:30<14:11, 936.61 examples/s]
Map (num_proc=16): 3%|▎ | 23000/818627 [00:31<08:23, 1581.73 examples/s]
Map (num_proc=16): 3%|▎ | 24000/818627 [00:31<07:01, 1886.27 examples/s]
Map (num_proc=16): 3%|▎ | 27000/818627 [00:31<04:47, 2749.47 examples/s]
Map (num_proc=16): 4%|▎ | 30000/818627 [00:32<03:04, 4271.83 examples/s]
Map (num_proc=16): 4%|▍ | 31000/818627 [00:32<03:15, 4025.64 examples/s]
Map (num_proc=16): 4%|▍ | 32000/818627 [00:33<06:12, 2112.68 examples/s]
Map (num_proc=16): 4%|▍ | 33000/818627 [00:43<32:12, 406.52 examples/s]
Map (num_proc=16): 4%|▍ | 34000/818627 [00:44<26:41, 489.98 examples/s]
Map (num_proc=16): 4%|▍ | 35000/818627 [00:44<20:59, 622.14 examples/s]
Map (num_proc=16): 4%|▍ | 36000/818627 [00:45<19:32, 667.42 examples/s]
Map (num_proc=16): 5%|▍ | 37000/818627 [00:45<14:34, 894.26 examples/s]
Map (num_proc=16): 5%|▍ | 38000/818627 [00:46<11:30, 1130.17 examples/s]
Map (num_proc=16): 5%|▍ | 39000/818627 [00:46<08:35, 1513.32 examples/s]
Map (num_proc=16): 5%|▍ | 40000/818627 [00:46<06:45, 1921.55 examples/s]
Map (num_proc=16): 5%|▌ | 41000/818627 [00:46<05:10, 2504.08 examples/s]
Map (num_proc=16): 5%|▌ | 42000/818627 [00:46<04:21, 2971.13 examples/s]
Map (num_proc=16): 5%|▌ | 43000/818627 [00:46<03:49, 3377.86 examples/s]
Map (num_proc=16): 5%|▌ | 44000/818627 [00:47<03:28, 3707.90 examples/s]
Map (num_proc=16): 5%|▌ | 45000/818627 [00:47<03:35, 3595.20 examples/s]
Map (num_proc=16): 6%|▌ | 46000/818627 [00:47<03:23, 3790.74 examples/s]
Map (num_proc=16): 6%|▌ | 47000/818627 [00:47<03:05, 4153.83 examples/s]
Map (num_proc=16): 6%|▌ | 48000/818627 [00:49<06:43, 1912.10 examples/s]
Map (num_proc=16): 6%|▌ | 49000/818627 [00:58<40:07, 319.71 examples/s]
Map (num_proc=16): 6%|▌ | 51000/818627 [00:58<22:24, 571.12 examples/s]
Map (num_proc=16): 6%|▋ | 52000/818627 [00:59<18:41, 683.31 examples/s]
Map (num_proc=16): 6%|▋ | 53000/818627 [01:00<18:12, 700.76 examples/s]
Map (num_proc=16): 7%|▋ | 54000/818627 [01:00<13:40, 932.03 examples/s]
Map (num_proc=16): 7%|▋ | 55000/818627 [01:00<11:07, 1143.98 examples/s]
Map (num_proc=16): 7%|▋ | 56000/818627 [01:01<08:25, 1508.69 examples/s]
Map (num_proc=16): 7%|▋ | 57000/818627 [01:01<06:54, 1837.61 examples/s]
Map (num_proc=16): 7%|▋ | 58000/818627 [01:01<05:23, 2350.91 examples/s]
Map (num_proc=16): 7%|▋ | 59000/818627 [01:01<05:41, 2225.23 examples/s]
Map (num_proc=16): 7%|▋ | 61000/818627 [01:02<04:13, 2990.24 examples/s]
Map (num_proc=16): 8%|▊ | 63000/818627 [01:03<04:17, 2933.29 examples/s]
Map (num_proc=16): 8%|▊ | 64000/818627 [01:03<04:20, 2896.54 examples/s]
Map (num_proc=16): 8%|▊ | 65000/818627 [01:12<31:39, 396.66 examples/s]
Map (num_proc=16): 8%|▊ | 67000/818627 [01:13<19:12, 652.31 examples/s]
Map (num_proc=16): 8%|▊ | 68000/818627 [01:13<15:23, 812.46 examples/s]
Map (num_proc=16): 8%|▊ | 69000/818627 [01:14<14:59, 833.46 examples/s]
Map (num_proc=16): 9%|▊ | 70000/818627 [01:15<15:39, 797.12 examples/s]
Map (num_proc=16): 9%|▊ | 71000/818627 [01:15<12:02, 1034.26 examples/s]
Map (num_proc=16): 9%|▉ | 72000/818627 [01:16<10:33, 1177.79 examples/s]
Map (num_proc=16): 9%|▉ | 73000/818627 [01:16<08:29, 1464.56 examples/s]
Map (num_proc=16): 9%|▉ | 76000/818627 [01:17<04:32, 2724.51 examples/s]
Map (num_proc=16): 9%|▉ | 77000/818627 [01:17<04:07, 2994.35 examples/s]
Map (num_proc=16): 10%|▉ | 78000/818627 [01:17<04:01, 3068.14 examples/s]
Map (num_proc=16): 10%|▉ | 79000/818627 [01:18<05:04, 2429.51 examples/s]
Map (num_proc=16): 10%|▉ | 81000/818627 [01:27<25:37, 479.91 examples/s]
Map (num_proc=16): 10%|█ | 82000/818627 [01:27<21:25, 573.19 examples/s]
Map (num_proc=16): 10%|█ | 83000/818627 [01:27<16:27, 744.94 examples/s]
Map (num_proc=16): 10%|█ | 84000/818627 [01:28<12:47, 957.23 examples/s]
Map (num_proc=16): 10%|█ | 85000/818627 [01:28<10:40, 1146.03 examples/s]
Map (num_proc=16): 11%|█ | 86000/818627 [01:30<14:41, 831.25 examples/s]
Map (num_proc=16): 11%|█ | 87000/818627 [01:31<12:19, 989.83 examples/s]
Map (num_proc=16): 11%|█ | 88000/818627 [01:31<09:06, 1338.04 examples/s]
Map (num_proc=16): 11%|█ | 89000/818627 [01:31<07:24, 1641.69 examples/s]
Map (num_proc=16): 11%|█ | 90000/818627 [01:31<06:37, 1832.97 examples/s]
Map (num_proc=16): 11%|█ | 91000/818627 [01:31<05:05, 2379.48 examples/s]
Map (num_proc=16): 11%|█▏ | 93000/818627 [01:32<03:34, 3380.52 examples/s]
Map (num_proc=16): 12%|█▏ | 95000/818627 [01:32<02:24, 5003.25 examples/s]
Map (num_proc=16): 12%|█▏ | 96000/818627 [01:32<03:29, 3443.05 examples/s]
Map (num_proc=16): 12%|█▏ | 97000/818627 [01:41<26:51, 447.73 examples/s]
Map (num_proc=16): 12%|█▏ | 98000/818627 [01:43<25:26, 472.02 examples/s]
Map (num_proc=16): 12%|█▏ | 99000/818627 [01:43<20:29, 585.33 examples/s]
Map (num_proc=16): 12%|█▏ | 101000/818627 [01:44<13:55, 858.57 examples/s]
Map (num_proc=16): 12%|█▏ | 102000/818627 [01:45<13:12, 903.90 examples/s]
Map (num_proc=16): 13%|█▎ | 103000/818627 [01:45<10:59, 1084.56 examples/s]
Map (num_proc=16): 13%|█▎ | 104000/818627 [01:46<08:24, 1415.86 examples/s]
Map (num_proc=16): 13%|█▎ | 105000/818627 [01:46<07:04, 1682.62 examples/s]
Map (num_proc=16): 13%|█▎ | 107000/818627 [01:46<04:31, 2620.50 examples/s]
Map (num_proc=16): 13%|█▎ | 108000/818627 [01:46<04:18, 2749.75 examples/s]
Map (num_proc=16): 13%|█▎ | 110000/818627 [01:47<03:26, 3424.57 examples/s]
Map (num_proc=16): 14%|█▎ | 112000/818627 [01:49<06:02, 1947.49 examples/s]
Map (num_proc=16): 14%|█▍ | 113000/818627 [01:56<22:39, 519.17 examples/s]
Map (num_proc=16): 14%|█▍ | 114000/818627 [01:57<20:57, 560.50 examples/s]
Map (num_proc=16): 14%|█▍ | 115000/818627 [01:58<19:31, 600.82 examples/s]
Map (num_proc=16): 14%|█▍ | 116000/818627 [01:59<14:58, 781.78 examples/s]
Map (num_proc=16): 14%|█▍ | 117000/818627 [02:00<14:24, 811.16 examples/s]
Map (num_proc=16): 14%|█▍ | 118000/818627 [02:00<10:48, 1080.97 examples/s]
Map (num_proc=16): 15%|█▍ | 119000/818627 [02:00<08:36, 1355.17 examples/s]
Map (num_proc=16): 15%|█▍ | 120000/818627 [02:00<06:52, 1694.01 examples/s]
Map (num_proc=16): 15%|█▍ | 121000/818627 [02:01<05:49, 1997.95 examples/s]
Map (num_proc=16): 15%|█▍ | 122000/818627 [02:01<04:47, 2427.26 examples/s]
Map (num_proc=16): 15%|█▌ | 123000/818627 [02:01<04:24, 2625.21 examples/s]
Map (num_proc=16): 15%|█▌ | 124000/818627 [02:01<04:02, 2859.45 examples/s]
Map (num_proc=16): 16%|█▌ | 127000/818627 [02:02<03:55, 2934.37 examples/s]
Map (num_proc=16): 16%|█▌ | 128000/818627 [02:03<05:17, 2177.69 examples/s]
Map (num_proc=16): 16%|█▌ | 129000/818627 [02:11<25:03, 458.79 examples/s]
Map (num_proc=16): 16%|█▌ | 130000/818627 [02:12<21:05, 544.24 examples/s]
Map (num_proc=16): 16%|█▌ | 131000/818627 [02:15<24:21, 470.58 examples/s]
Map (num_proc=16): 16%|█▌ | 132000/818627 [02:16<21:24, 534.47 examples/s]
Map (num_proc=16): 17%|█▋ | 137000/818627 [02:16<07:38, 1485.91 examples/s]
Map (num_proc=16): 17%|█▋ | 138000/818627 [02:17<06:36, 1715.85 examples/s]
Map (num_proc=16): 17%|█▋ | 139000/818627 [02:17<05:45, 1969.60 examples/s]
Map (num_proc=16): 17%|█▋ | 140000/818627 [02:17<05:18, 2127.37 examples/s]
Map (num_proc=16): 17%|█▋ | 141000/818627 [02:17<04:50, 2332.31 examples/s]
Map (num_proc=16): 17%|█▋ | 142000/818627 [02:18<05:49, 1933.51 examples/s]
Map (num_proc=16): 17%|█▋ | 143000/818627 [02:19<05:30, 2045.49 examples/s]
Map (num_proc=16): 18%|█▊ | 144000/818627 [02:19<04:24, 2553.31 examples/s]
Map (num_proc=16): 18%|█▊ | 145000/818627 [02:25<23:26, 478.98 examples/s]
Map (num_proc=16): 18%|█▊ | 146000/818627 [02:26<19:02, 588.51 examples/s]
Map (num_proc=16): 18%|█▊ | 147000/818627 [02:30<26:23, 424.09 examples/s]
Map (num_proc=16): 18%|█▊ | 149000/818627 [02:30<15:12, 734.07 examples/s]
Map (num_proc=16): 18%|█▊ | 150000/818627 [02:31<13:04, 852.66 examples/s]
Map (num_proc=16): 19%|█▊ | 152000/818627 [02:31<08:20, 1331.68 examples/s]
Map (num_proc=16): 19%|█▉ | 154000/818627 [02:31<05:27, 2026.73 examples/s]
Map (num_proc=16): 19%|█▉ | 155000/818627 [02:31<05:01, 2201.44 examples/s]
Map (num_proc=16): 19%|█▉ | 157000/818627 [02:32<04:46, 2306.80 examples/s]
Map (num_proc=16): 19%|█▉ | 158000/818627 [02:32<04:13, 2608.19 examples/s]
Map (num_proc=16): 19%|█▉ | 159000/818627 [02:33<04:35, 2392.63 examples/s]
Map (num_proc=16): 20%|█▉ | 160000/818627 [02:33<04:09, 2640.98 examples/s]
Map (num_proc=16): 20%|█▉ | 161000/818627 [02:40<22:05, 496.12 examples/s]
Map (num_proc=16): 20%|█▉ | 163000/818627 [02:44<22:08, 493.39 examples/s]
Map (num_proc=16): 20%|██ | 164000/818627 [02:45<19:15, 566.52 examples/s]
Map (num_proc=16): 20%|██ | 165000/818627 [02:45<15:15, 714.33 examples/s]
Map (num_proc=16): 20%|██ | 166000/818627 [02:45<12:05, 899.64 examples/s]
Map (num_proc=16): 20%|██ | 167000/818627 [02:46<09:52, 1100.62 examples/s]
Map (num_proc=16): 21%|██ | 169000/818627 [02:46<06:13, 1739.76 examples/s]
Map (num_proc=16): 21%|██ | 170000/818627 [02:46<05:02, 2144.43 examples/s]
Map (num_proc=16): 21%|██ | 173000/818627 [02:48<04:46, 2249.73 examples/s]
Map (num_proc=16): 21%|██▏ | 174000/818627 [02:48<04:19, 2485.07 examples/s]
Map (num_proc=16): 21%|██▏ | 175000/818627 [02:48<03:53, 2758.63 examples/s]
Map (num_proc=16): 21%|██▏ | 176000/818627 [02:48<04:08, 2590.10 examples/s]
Map (num_proc=16): 22%|██▏ | 177000/818627 [02:55<19:56, 536.30 examples/s]
Map (num_proc=16): 22%|██▏ | 178000/818627 [02:55<16:52, 632.53 examples/s]
Map (num_proc=16): 22%|██▏ | 179000/818627 [02:58<20:44, 513.91 examples/s]
Map (num_proc=16): 22%|██▏ | 180000/818627 [03:00<19:02, 559.16 examples/s]
Map (num_proc=16): 22%|██▏ | 181000/818627 [03:00<14:27, 734.70 examples/s]
Map (num_proc=16): 22%|██▏ | 183000/818627 [03:00<08:36, 1229.52 examples/s]
Map (num_proc=16): 22%|██▏ | 184000/818627 [03:01<07:28, 1414.58 examples/s]
Map (num_proc=16): 23%|██▎ | 187000/818627 [03:01<03:50, 2734.90 examples/s]
Map (num_proc=16): 23%|██▎ | 189000/818627 [03:02<04:18, 2434.74 examples/s]
Map (num_proc=16): 23%|██▎ | 190000/818627 [03:02<03:55, 2672.73 examples/s]
Map (num_proc=16): 23%|██▎ | 191000/818627 [03:03<05:28, 1911.89 examples/s]
Map (num_proc=16): 24%|██▎ | 193000/818627 [03:09<14:13, 732.66 examples/s]
Map (num_proc=16): 24%|██▎ | 194000/818627 [03:10<14:33, 715.46 examples/s]
Map (num_proc=16): 24%|██▍ | 195000/818627 [03:12<16:25, 632.94 examples/s]
Map (num_proc=16): 24%|██▍ | 196000/818627 [03:14<16:29, 629.27 examples/s]
Map (num_proc=16): 24%|██▍ | 197000/818627 [03:15<13:47, 751.30 examples/s]
Map (num_proc=16): 24%|██▍ | 198000/818627 [03:15<11:08, 929.03 examples/s]
Map (num_proc=16): 24%|██▍ | 199000/818627 [03:15<09:06, 1133.78 examples/s]
Map (num_proc=16): 24%|██▍ | 200000/818627 [03:16<07:04, 1456.29 examples/s]
Map (num_proc=16): 25%|██▍ | 201000/818627 [03:16<05:58, 1723.36 examples/s]
Map (num_proc=16): 25%|██▍ | 202000/818627 [03:16<04:47, 2147.57 examples/s]
Map (num_proc=16): 25%|██▍ | 203000/818627 [03:16<04:13, 2432.96 examples/s]
Map (num_proc=16): 25%|██▍ | 204000/818627 [03:17<03:39, 2796.06 examples/s]
Map (num_proc=16): 25%|██▌ | 205000/818627 [03:17<03:05, 3299.31 examples/s]
Map (num_proc=16): 25%|██▌ | 206000/818627 [03:17<03:40, 2777.51 examples/s]
Map (num_proc=16): 25%|██▌ | 207000/818627 [03:18<03:53, 2617.42 examples/s]
Map (num_proc=16): 25%|██▌ | 208000/818627 [03:18<03:13, 3157.07 examples/s]
Map (num_proc=16): 26%|██▌ | 209000/818627 [03:23<17:51, 569.17 examples/s]
Map (num_proc=16): 26%|██▌ | 210000/818627 [03:24<16:05, 630.70 examples/s]
Map (num_proc=16): 26%|██▌ | 211000/818627 [03:27<19:05, 530.29 examples/s]
Map (num_proc=16): 26%|██▌ | 212000/818627 [03:28<16:42, 605.11 examples/s]
Map (num_proc=16): 26%|██▌ | 213000/818627 [03:30<18:21, 549.91 examples/s]
Map (num_proc=16): 26%|██▌ | 214000/818627 [03:30<14:00, 719.62 examples/s]
Map (num_proc=16): 26%|██▋ | 215000/818627 [03:31<10:30, 957.26 examples/s]
Map (num_proc=16): 27%|██▋ | 217000/818627 [03:31<06:05, 1646.03 examples/s]
Map (num_proc=16): 27%|██▋ | 219000/818627 [03:31<04:35, 2175.69 examples/s]
Map (num_proc=16): 27%|██▋ | 220000/818627 [03:31<03:49, 2603.65 examples/s]
Map (num_proc=16): 27%|██▋ | 221000/818627 [03:32<03:22, 2957.96 examples/s]
Map (num_proc=16): 27%|██▋ | 222000/818627 [03:32<03:17, 3021.29 examples/s]
Map (num_proc=16): 27%|██▋ | 223000/818627 [03:33<03:55, 2528.25 examples/s]
Map (num_proc=16): 27%|██▋ | 225000/818627 [03:37<12:35, 786.04 examples/s]
Map (num_proc=16): 28%|██▊ | 226000/818627 [03:39<13:17, 743.44 examples/s]
Map (num_proc=16): 28%|██▊ | 227000/818627 [03:41<15:08, 651.43 examples/s]
Map (num_proc=16): 28%|██▊ | 228000/818627 [03:44<19:41, 500.05 examples/s]
Map (num_proc=16): 28%|██▊ | 229000/818627 [03:45<16:12, 606.40 examples/s]
Map (num_proc=16): 28%|██▊ | 230000/818627 [03:45<12:05, 811.84 examples/s]
Map (num_proc=16): 28%|██▊ | 231000/818627 [03:45<09:14, 1059.86 examples/s]
Map (num_proc=16): 28%|██▊ | 232000/818627 [03:46<07:23, 1322.74 examples/s]
Map (num_proc=16): 28%|██▊ | 233000/818627 [03:46<05:50, 1672.37 examples/s]
Map (num_proc=16): 29%|██▊ | 234000/818627 [03:46<04:33, 2134.06 examples/s]
Map (num_proc=16): 29%|██▊ | 235000/818627 [03:46<03:34, 2725.91 examples/s]
Map (num_proc=16): 29%|██▉ | 236000/818627 [03:46<03:01, 3214.81 examples/s]
Map (num_proc=16): 29%|██▉ | 237000/818627 [03:47<03:17, 2945.42 examples/s]
Map (num_proc=16): 29%|██▉ | 239000/818627 [03:48<04:50, 1995.19 examples/s]
Map (num_proc=16): 29%|██▉ | 240000/818627 [03:48<04:07, 2340.20 examples/s]
Map (num_proc=16): 29%|██▉ | 241000/818627 [03:52<11:11, 860.23 examples/s]
Map (num_proc=16): 30%|██▉ | 242000/818627 [03:53<12:15, 783.70 examples/s]
Map (num_proc=16): 30%|██▉ | 243000/818627 [03:55<12:49, 748.32 examples/s]
Map (num_proc=16): 30%|██▉ | 244000/818627 [03:59<19:46, 484.39 examples/s]
Map (num_proc=16): 30%|██▉ | 245000/818627 [03:59<15:44, 607.52 examples/s]
Map (num_proc=16): 30%|███ | 246000/818627 [04:00<12:59, 734.43 examples/s]
Map (num_proc=16): 30%|███ | 247000/818627 [04:00<09:27, 1007.46 examples/s]
Map (num_proc=16): 30%|███ | 248000/818627 [04:01<08:10, 1164.43 examples/s]
Map (num_proc=16): 30%|███ | 249000/818627 [04:01<06:28, 1465.77 examples/s]
Map (num_proc=16): 31%|███ | 251000/818627 [04:01<04:47, 1973.40 examples/s]
Map (num_proc=16): 31%|███ | 252000/818627 [04:02<04:31, 2085.01 examples/s]
Map (num_proc=16): 31%|███ | 253000/818627 [04:02<03:55, 2406.25 examples/s]
Map (num_proc=16): 31%|███ | 254000/818627 [04:03<04:36, 2039.06 examples/s]
Map (num_proc=16): 31%|███▏ | 256000/818627 [04:03<02:57, 3167.29 examples/s]
Map (num_proc=16): 31%|███▏ | 257000/818627 [04:06<09:08, 1024.46 examples/s]
Map (num_proc=16): 32%|███▏ | 258000/818627 [04:08<11:32, 809.56 examples/s]
Map (num_proc=16): 32%|███▏ | 259000/818627 [04:09<11:11, 833.19 examples/s]
Map (num_proc=16): 32%|███▏ | 260000/818627 [04:14<19:27, 478.55 examples/s]
Map (num_proc=16): 32%|███▏ | 261000/818627 [04:14<15:44, 590.58 examples/s]
Map (num_proc=16): 32%|███▏ | 262000/818627 [04:15<13:35, 682.23 examples/s]
Map (num_proc=16): 32%|███▏ | 263000/818627 [04:15<10:06, 915.94 examples/s]
Map (num_proc=16): 32%|███▏ | 264000/818627 [04:16<08:17, 1114.81 examples/s]
Map (num_proc=16): 32%|███▏ | 266000/818627 [04:16<04:51, 1896.88 examples/s]
Map (num_proc=16): 33%|███▎ | 268000/818627 [04:17<04:14, 2162.15 examples/s]
Map (num_proc=16): 33%|███▎ | 269000/818627 [04:17<03:40, 2498.09 examples/s]
Map (num_proc=16): 33%|███▎ | 270000/818627 [04:17<03:12, 2850.12 examples/s]
Map (num_proc=16): 33%|███▎ | 271000/818627 [04:18<04:44, 1926.31 examples/s]
Map (num_proc=16): 33%|███▎ | 272000/818627 [04:19<05:22, 1694.83 examples/s]
Map (num_proc=16): 33%|███▎ | 273000/818627 [04:22<10:41, 849.90 examples/s]
Map (num_proc=16): 33%|███▎ | 274000/818627 [04:22<09:57, 911.14 examples/s]
Map (num_proc=16): 34%|███▎ | 275000/818627 [04:24<10:10, 890.91 examples/s]
Map (num_proc=16): 34%|███▎ | 276000/818627 [04:28<19:06, 473.23 examples/s]
Map (num_proc=16): 34%|███▍ | 277000/818627 [04:29<14:49, 608.82 examples/s]
Map (num_proc=16): 34%|███▍ | 278000/818627 [04:29<12:13, 736.95 examples/s]
Map (num_proc=16): 34%|███▍ | 279000/818627 [04:31<11:44, 766.24 examples/s]
Map (num_proc=16): 34%|███▍ | 280000/818627 [04:31<08:33, 1049.55 examples/s]
Map (num_proc=16): 34%|███▍ | 282000/818627 [04:31<05:37, 1588.56 examples/s]
Map (num_proc=16): 35%|███▍ | 284000/818627 [04:32<04:17, 2075.25 examples/s]
Map (num_proc=16): 35%|███▍ | 286000/818627 [04:33<04:56, 1795.95 examples/s]
Map (num_proc=16): 35%|███▌ | 288000/818627 [04:34<05:15, 1682.81 examples/s]
Map (num_proc=16): 35%|███▌ | 289000/818627 [04:37<07:57, 1109.76 examples/s]
Map (num_proc=16): 35%|███▌ | 290000/818627 [04:37<06:59, 1260.34 examples/s]
Map (num_proc=16): 36%|███▌ | 291000/818627 [04:38<07:22, 1191.22 examples/s]
Map (num_proc=16): 36%|███▌ | 292000/818627 [04:43<16:00, 548.30 examples/s]
Map (num_proc=16): 36%|███▌ | 294000/818627 [04:44<12:13, 715.65 examples/s]
Map (num_proc=16): 36%|███▌ | 295000/818627 [04:45<11:33, 755.43 examples/s]
Map (num_proc=16): 36%|███▌ | 296000/818627 [04:46<09:44, 894.47 examples/s]
Map (num_proc=16): 36%|███▋ | 297000/818627 [04:46<08:02, 1080.15 examples/s]
Map (num_proc=16): 37%|███▋ | 300000/818627 [04:47<04:45, 1816.14 examples/s]
Map (num_proc=16): 37%|███▋ | 302000/818627 [04:47<03:59, 2158.99 examples/s]
Map (num_proc=16): 37%|███▋ | 303000/818627 [04:48<04:31, 1897.89 examples/s]
Map (num_proc=16): 37%|███▋ | 304000/818627 [04:49<05:46, 1483.67 examples/s]
Map (num_proc=16): 37%|███▋ | 305000/818627 [04:52<09:16, 922.26 examples/s]
Map (num_proc=16): 37%|███▋ | 306000/818627 [04:52<07:17, 1172.16 examples/s]
Map (num_proc=16): 38%|███▊ | 307000/818627 [04:53<07:39, 1112.63 examples/s]
Map (num_proc=16): 38%|███▊ | 308000/818627 [04:57<15:04, 564.72 examples/s]
Map (num_proc=16): 38%|███▊ | 309000/818627 [04:58<11:47, 720.64 examples/s]
Map (num_proc=16): 38%|███▊ | 310000/818627 [04:59<11:31, 735.91 examples/s]
Map (num_proc=16): 38%|███▊ | 311000/818627 [04:59<09:37, 878.74 examples/s]
Map (num_proc=16): 38%|███▊ | 312000/818627 [05:00<09:01, 935.59 examples/s]
Map (num_proc=16): 38%|███▊ | 314000/818627 [05:01<07:00, 1199.63 examples/s]
Map (num_proc=16): 38%|███▊ | 315000/818627 [05:02<05:56, 1412.18 examples/s]
Map (num_proc=16): 39%|███▊ | 316000/818627 [05:02<04:58, 1683.04 examples/s]
Map (num_proc=16): 39%|███▉ | 318000/818627 [05:02<03:12, 2601.54 examples/s]
Map (num_proc=16): 39%|███▉ | 319000/818627 [05:03<04:35, 1811.38 examples/s]
Map (num_proc=16): 39%|███▉ | 320000/818627 [05:05<05:54, 1405.80 examples/s]
Map (num_proc=16): 39%|███▉ | 321000/818627 [05:06<08:29, 975.77 examples/s]
Map (num_proc=16): 39%|███▉ | 322000/818627 [05:07<08:12, 1009.21 examples/s]
Map (num_proc=16): 39%|███▉ | 323000/818627 [05:08<07:46, 1061.45 examples/s]
Map (num_proc=16): 40%|███▉ | 324000/818627 [05:11<13:08, 627.05 examples/s]
Map (num_proc=16): 40%|███▉ | 325000/818627 [05:12<09:56, 827.58 examples/s]
Map (num_proc=16): 40%|███▉ | 326000/818627 [05:14<11:33, 710.30 examples/s]
Map (num_proc=16): 40%|███▉ | 327000/818627 [05:14<09:24, 870.29 examples/s]
Map (num_proc=16): 40%|████ | 328000/818627 [05:15<08:58, 911.35 examples/s]
Map (num_proc=16): 40%|████ | 329000/818627 [05:15<07:21, 1110.16 examples/s]
Map (num_proc=16): 40%|████ | 330000/818627 [05:16<06:06, 1332.38 examples/s]
Map (num_proc=16): 40%|████ | 331000/818627 [05:16<05:13, 1554.11 examples/s]
Map (num_proc=16): 41%|████ | 333000/818627 [05:17<03:56, 2057.37 examples/s]
Map (num_proc=16): 41%|████ | 335000/818627 [05:18<04:35, 1757.34 examples/s]
Map (num_proc=16): 41%|████ | 336000/818627 [05:20<06:22, 1260.87 examples/s]
Map (num_proc=16): 41%|████ | 337000/818627 [05:21<07:01, 1143.27 examples/s]
Map (num_proc=16): 41%|████▏ | 338000/818627 [05:21<06:11, 1292.30 examples/s]
Map (num_proc=16): 41%|████▏ | 339000/818627 [05:22<06:29, 1232.59 examples/s]
Map (num_proc=16): 42%|████▏ | 340000/818627 [05:26<13:18, 599.35 examples/s]
Map (num_proc=16): 42%|████▏ | 341000/818627 [05:26<09:57, 799.65 examples/s]
Map (num_proc=16): 42%|████▏ | 342000/818627 [05:29<12:56, 613.62 examples/s]
Map (num_proc=16): 42%|████▏ | 344000/818627 [05:29<07:38, 1035.50 examples/s]
Map (num_proc=16): 42%|████▏ | 345000/818627 [05:30<07:50, 1005.71 examples/s]
Map (num_proc=16): 42%|████▏ | 346000/818627 [05:31<06:39, 1182.79 examples/s]
Map (num_proc=16): 42%|████▏ | 347000/818627 [05:31<05:18, 1479.14 examples/s]
Map (num_proc=16): 43%|████▎ | 349000/818627 [05:31<03:26, 2278.26 examples/s]
Map (num_proc=16): 43%|████▎ | 350000/818627 [05:32<03:00, 2593.83 examples/s]
Map (num_proc=16): 43%|████▎ | 351000/818627 [05:34<06:49, 1140.75 examples/s]
Map (num_proc=16): 43%|████▎ | 352000/818627 [05:35<06:35, 1180.26 examples/s]
Map (num_proc=16): 43%|████▎ | 353000/818627 [05:36<07:45, 1000.36 examples/s]
Map (num_proc=16): 43%|████▎ | 354000/818627 [05:36<06:16, 1234.36 examples/s]
Map (num_proc=16): 43%|████▎ | 355000/818627 [05:38<07:03, 1094.04 examples/s]
Map (num_proc=16): 43%|████▎ | 356000/818627 [05:41<12:38, 609.95 examples/s]
Map (num_proc=16): 44%|████▎ | 357000/818627 [05:41<10:00, 768.48 examples/s]
Map (num_proc=16): 44%|████▎ | 358000/818627 [05:44<12:43, 603.11 examples/s]
Map (num_proc=16): 44%|████▍ | 359000/818627 [05:44<09:34, 799.78 examples/s]
Map (num_proc=16): 44%|████▍ | 360000/818627 [05:45<07:55, 964.90 examples/s]
Map (num_proc=16): 44%|████▍ | 361000/818627 [05:45<06:42, 1137.68 examples/s]
Map (num_proc=16): 44%|████▍ | 363000/818627 [05:45<03:46, 2009.31 examples/s]
Map (num_proc=16): 44%|████▍ | 364000/818627 [05:46<04:16, 1769.84 examples/s]
Map (num_proc=16): 45%|████▍ | 365000/818627 [05:46<03:48, 1982.70 examples/s]
Map (num_proc=16): 45%|████▍ | 366000/818627 [05:47<03:17, 2292.50 examples/s]
Map (num_proc=16): 45%|████▍ | 367000/818627 [05:48<06:02, 1246.08 examples/s]
Map (num_proc=16): 45%|████▍ | 368000/818627 [05:49<06:21, 1180.48 examples/s]
Map (num_proc=16): 45%|████▌ | 369000/818627 [05:51<06:59, 1072.49 examples/s]
Map (num_proc=16): 45%|████▌ | 370000/818627 [05:51<05:48, 1287.02 examples/s]
Map (num_proc=16): 45%|████▌ | 371000/818627 [05:52<05:51, 1275.22 examples/s]
Map (num_proc=16): 45%|████▌ | 372000/818627 [05:56<12:25, 598.86 examples/s]
Map (num_proc=16): 46%|████▌ | 374000/818627 [05:59<11:48, 627.23 examples/s]
Map (num_proc=16): 46%|████▌ | 375000/818627 [05:59<09:54, 745.66 examples/s]
Map (num_proc=16): 46%|████▌ | 376000/818627 [05:59<07:44, 952.23 examples/s]
Map (num_proc=16): 46%|████▌ | 377000/818627 [06:00<07:39, 961.59 examples/s]
Map (num_proc=16): 46%|████▋ | 379000/818627 [06:01<04:56, 1484.53 examples/s]
Map (num_proc=16): 46%|████▋ | 380000/818627 [06:01<04:33, 1602.44 examples/s]
Map (num_proc=16): 47%|████▋ | 381000/818627 [06:02<04:02, 1805.60 examples/s]
Map (num_proc=16): 47%|████▋ | 383000/818627 [06:04<05:20, 1357.24 examples/s]
Map (num_proc=16): 47%|████▋ | 384000/818627 [06:04<05:34, 1298.98 examples/s]
Map (num_proc=16): 47%|████▋ | 385000/818627 [06:05<05:46, 1250.18 examples/s]
Map (num_proc=16): 47%|████▋ | 387000/818627 [06:06<03:51, 1860.89 examples/s]
Map (num_proc=16): 47%|████▋ | 388000/818627 [06:10<09:30, 754.17 examples/s]
Map (num_proc=16): 48%|████▊ | 389000/818627 [06:10<08:12, 872.13 examples/s]
Map (num_proc=16): 48%|████▊ | 390000/818627 [06:13<12:03, 592.30 examples/s]
Map (num_proc=16): 48%|████▊ | 391000/818627 [06:14<10:02, 709.43 examples/s]
Map (num_proc=16): 48%|████▊ | 392000/818627 [06:14<07:28, 951.68 examples/s]
Map (num_proc=16): 48%|████▊ | 393000/818627 [06:15<07:35, 935.25 examples/s]
Map (num_proc=16): 48%|████▊ | 394000/818627 [06:16<05:41, 1242.54 examples/s]
Map (num_proc=16): 48%|████▊ | 395000/818627 [06:16<05:08, 1375.25 examples/s]
Map (num_proc=16): 48%|████▊ | 396000/818627 [06:17<05:24, 1303.92 examples/s]
Map (num_proc=16): 48%|████▊ | 397000/818627 [06:17<04:04, 1725.33 examples/s]
Map (num_proc=16): 49%|████▊ | 398000/818627 [06:19<06:09, 1139.84 examples/s]
Map (num_proc=16): 49%|████▊ | 399000/818627 [06:19<05:10, 1353.53 examples/s]
Map (num_proc=16): 49%|████▉ | 400000/818627 [06:19<04:28, 1560.26 examples/s]
Map (num_proc=16): 49%|████▉ | 401000/818627 [06:20<03:40, 1894.33 examples/s]
Map (num_proc=16): 49%|████▉ | 402000/818627 [06:20<02:49, 2464.81 examples/s]
Map (num_proc=16): 49%|████▉ | 404000/818627 [06:24<08:12, 841.05 examples/s]
Map (num_proc=16): 49%|████▉ | 405000/818627 [06:25<08:31, 808.61 examples/s]
Map (num_proc=16): 50%|████▉ | 406000/818627 [06:28<11:43, 586.95 examples/s]
Map (num_proc=16): 50%|████▉ | 407000/818627 [06:29<10:11, 673.09 examples/s]
Map (num_proc=16): 50%|████▉ | 409000/818627 [06:30<06:33, 1041.21 examples/s]
Map (num_proc=16): 50%|█████ | 410000/818627 [06:31<06:08, 1109.22 examples/s]
Map (num_proc=16): 50%|█████ | 411000/818627 [06:31<05:34, 1216.87 examples/s]
Map (num_proc=16): 50%|█████ | 413000/818627 [06:33<05:03, 1335.61 examples/s]
Map (num_proc=16): 51%|█████ | 414000/818627 [06:33<05:10, 1302.42 examples/s]
Map (num_proc=16): 51%|█████ | 415000/818627 [06:34<05:00, 1341.14 examples/s]
Map (num_proc=16): 51%|█████ | 416000/818627 [06:34<04:03, 1650.62 examples/s]
Map (num_proc=16): 51%|█████ | 417000/818627 [06:35<03:26, 1941.22 examples/s]
Map (num_proc=16): 51%|█████ | 418000/818627 [06:35<02:52, 2329.17 examples/s]
Map (num_proc=16): 51%|█████ | 419000/818627 [06:35<02:15, 2942.97 examples/s]
Map (num_proc=16): 51%|█████▏ | 420000/818627 [06:38<07:55, 838.76 examples/s]
Map (num_proc=16): 51%|█████▏ | 421000/818627 [06:40<08:32, 775.89 examples/s]
Map (num_proc=16): 52%|█████▏ | 422000/818627 [06:44<14:01, 471.60 examples/s]
Map (num_proc=16): 52%|█████▏ | 423000/818627 [06:44<11:00, 598.55 examples/s]
Map (num_proc=16): 52%|█████▏ | 424000/818627 [06:45<08:05, 812.43 examples/s]
Map (num_proc=16): 52%|█████▏ | 425000/818627 [06:45<06:24, 1024.89 examples/s]
Map (num_proc=16): 52%|█████▏ | 426000/818627 [06:46<06:51, 954.22 examples/s]
Map (num_proc=16): 52%|█████▏ | 427000/818627 [06:47<06:33, 994.20 examples/s]
Map (num_proc=16): 52%|█████▏ | 429000/818627 [06:48<04:23, 1477.09 examples/s]
Map (num_proc=16): 53%|█████▎ | 430000/818627 [06:48<04:14, 1525.60 examples/s]
Map (num_proc=16): 53%|█████▎ | 431000/818627 [06:49<04:41, 1375.22 examples/s]
Map (num_proc=16): 53%|█████▎ | 433000/818627 [06:49<02:53, 2217.51 examples/s]
Map (num_proc=16): 53%|█████▎ | 434000/818627 [06:50<03:45, 1707.14 examples/s]
Map (num_proc=16): 53%|█████▎ | 436000/818627 [06:52<04:49, 1323.52 examples/s]
Map (num_proc=16): 53%|█████▎ | 437000/818627 [06:54<06:22, 998.21 examples/s]
Map (num_proc=16): 54%|█████▎ | 438000/818627 [06:59<11:36, 546.23 examples/s]
Map (num_proc=16): 54%|█████▎ | 439000/818627 [06:59<08:53, 711.54 examples/s]
Map (num_proc=16): 54%|█████▎ | 440000/818627 [06:59<07:11, 877.11 examples/s]
Map (num_proc=16): 54%|█████▍ | 441000/818627 [07:00<06:35, 955.85 examples/s]
Map (num_proc=16): 54%|█████▍ | 442000/818627 [07:01<06:41, 939.07 examples/s]
Map (num_proc=16): 54%|█████▍ | 443000/818627 [07:02<05:48, 1078.96 examples/s]
Map (num_proc=16): 54%|█████▍ | 444000/818627 [07:02<04:59, 1250.36 examples/s]
Map (num_proc=16): 54%|█████▍ | 445000/818627 [07:03<04:46, 1302.57 examples/s]
Map (num_proc=16): 54%|█████▍ | 446000/818627 [07:03<03:58, 1561.58 examples/s]
Map (num_proc=16): 55%|█████▍ | 447000/818627 [07:03<03:07, 1984.00 examples/s]
Map (num_proc=16): 55%|█████▍ | 448000/818627 [07:04<02:54, 2129.56 examples/s]
Map (num_proc=16): 55%|█████▍ | 449000/818627 [07:04<02:37, 2352.73 examples/s]
Map (num_proc=16): 55%|█████▍ | 450000/818627 [07:05<03:38, 1686.66 examples/s]
Map (num_proc=16): 55%|█████▌ | 451000/818627 [07:06<03:40, 1669.93 examples/s]
Map (num_proc=16): 55%|█████▌ | 452000/818627 [07:07<04:32, 1347.04 examples/s]
Map (num_proc=16): 55%|█████▌ | 453000/818627 [07:08<04:47, 1269.88 examples/s]
Map (num_proc=16): 55%|█████▌ | 454000/818627 [07:13<13:14, 459.19 examples/s]
Map (num_proc=16): 56%|█████▌ | 455000/818627 [07:13<09:43, 623.15 examples/s]
Map (num_proc=16): 56%|█████▌ | 456000/818627 [07:15<09:03, 667.79 examples/s]
Map (num_proc=16): 56%|█████▌ | 457000/818627 [07:15<07:10, 839.72 examples/s]
Map (num_proc=16): 56%|█████▌ | 458000/818627 [07:16<06:17, 955.85 examples/s]
Map (num_proc=16): 56%|█████▌ | 459000/818627 [07:17<06:10, 969.46 examples/s]
Map (num_proc=16): 56%|█████▌ | 460000/818627 [07:17<04:58, 1201.19 examples/s]
Map (num_proc=16): 56%|█████▋ | 461000/818627 [07:17<03:43, 1600.83 examples/s]
Map (num_proc=16): 56%|█████▋ | 462000/818627 [07:18<03:15, 1827.00 examples/s]
Map (num_proc=16): 57%|█████▋ | 463000/818627 [07:18<02:50, 2087.87 examples/s]
Map (num_proc=16): 57%|█████▋ | 464000/818627 [07:19<03:33, 1658.89 examples/s]
Map (num_proc=16): 57%|█████▋ | 465000/818627 [07:19<02:43, 2165.22 examples/s]
Map (num_proc=16): 57%|█████▋ | 466000/818627 [07:20<02:53, 2036.90 examples/s]
Map (num_proc=16): 57%|█████▋ | 467000/818627 [07:21<04:07, 1421.75 examples/s]
Map (num_proc=16): 57%|█████▋ | 468000/818627 [07:21<03:56, 1485.64 examples/s]
Map (num_proc=16): 57%|█████▋ | 469000/818627 [07:22<04:00, 1451.02 examples/s]
Map (num_proc=16): 57%|█████▋ | 470000/818627 [07:27<12:02, 482.84 examples/s]
Map (num_proc=16): 58%|█████▊ | 471000/818627 [07:29<10:38, 544.29 examples/s]
Map (num_proc=16): 58%|█████▊ | 472000/818627 [07:30<09:29, 608.79 examples/s]
Map (num_proc=16): 58%|█████▊ | 473000/818627 [07:30<07:21, 782.27 examples/s]
Map (num_proc=16): 58%|█████▊ | 474000/818627 [07:31<05:58, 962.23 examples/s]
Map (num_proc=16): 58%|█████▊ | 475000/818627 [07:31<04:51, 1180.22 examples/s]
Map (num_proc=16): 58%|█████▊ | 476000/818627 [07:33<05:35, 1022.06 examples/s]
Map (num_proc=16): 58%|█████▊ | 477000/818627 [07:33<04:06, 1386.43 examples/s]
Map (num_proc=16): 59%|█████▊ | 479000/818627 [07:33<02:41, 2099.06 examples/s]
Map (num_proc=16): 59%|█████▊ | 480000/818627 [07:33<02:26, 2317.73 examples/s]
Map (num_proc=16): 59%|█████▉ | 481000/818627 [07:34<02:15, 2490.11 examples/s]
Map (num_proc=16): 59%|█████▉ | 482000/818627 [07:34<02:51, 1967.14 examples/s]
Map (num_proc=16): 59%|█████▉ | 483000/818627 [07:36<04:04, 1372.60 examples/s]
Map (num_proc=16): 59%|█████▉ | 484000/818627 [07:36<03:15, 1715.63 examples/s]
Map (num_proc=16): 59%|█████▉ | 485000/818627 [07:37<04:04, 1367.17 examples/s]
Map (num_proc=16): 59%|█████▉ | 486000/818627 [07:42<10:47, 513.64 examples/s]
Map (num_proc=16): 59%|█████▉ | 487000/818627 [07:43<10:01, 551.04 examples/s]
Map (num_proc=16): 60%|█████▉ | 488000/818627 [07:45<09:22, 587.59 examples/s]
Map (num_proc=16): 60%|█████▉ | 489000/818627 [07:46<08:00, 686.49 examples/s]
Map (num_proc=16): 60%|█████▉ | 490000/818627 [07:46<06:05, 898.83 examples/s]
Map (num_proc=16): 60%|█████▉ | 491000/818627 [07:47<05:14, 1042.22 examples/s]
Map (num_proc=16): 60%|██████ | 492000/818627 [07:47<04:27, 1221.07 examples/s]
Map (num_proc=16): 60%|██████ | 494000/818627 [07:47<02:44, 1968.59 examples/s]
Map (num_proc=16): 60%|██████ | 495000/818627 [07:48<03:00, 1791.68 examples/s]
Map (num_proc=16): 61%|██████ | 497000/818627 [07:49<02:20, 2296.31 examples/s]
Map (num_proc=16): 61%|██████ | 498000/818627 [07:49<02:36, 2047.99 examples/s]
Map (num_proc=16): 61%|██████ | 499000/818627 [07:50<02:31, 2112.48 examples/s]
Map (num_proc=16): 61%|██████ | 500000/818627 [07:50<02:17, 2319.51 examples/s]
Map (num_proc=16): 61%|██████ | 501000/818627 [07:52<04:23, 1205.24 examples/s]
Map (num_proc=16): 61%|██████▏ | 502000/818627 [07:57<10:55, 483.36 examples/s]
Map (num_proc=16): 61%|██████▏ | 503000/818627 [07:58<08:52, 592.47 examples/s]
Map (num_proc=16): 62%|██████▏ | 504000/818627 [08:00<09:53, 530.51 examples/s]
Map (num_proc=16): 62%|██████▏ | 505000/818627 [08:01<07:16, 718.56 examples/s]
Map (num_proc=16): 62%|██████▏ | 506000/818627 [08:01<05:35, 931.51 examples/s]
Map (num_proc=16): 62%|██████▏ | 507000/818627 [08:01<04:15, 1221.32 examples/s]
Map (num_proc=16): 62%|██████▏ | 508000/818627 [08:01<03:35, 1441.76 examples/s]
Map (num_proc=16): 62%|██████▏ | 509000/818627 [08:02<02:56, 1754.10 examples/s]
Map (num_proc=16): 62%|██████▏ | 510000/818627 [08:03<03:25, 1498.21 examples/s]
Map (num_proc=16): 62%|██████▏ | 511000/818627 [08:03<03:02, 1684.81 examples/s]
Map (num_proc=16): 63%|██████▎ | 512000/818627 [08:03<02:34, 1985.53 examples/s]
Map (num_proc=16): 63%|██████▎ | 513000/818627 [08:04<02:05, 2428.67 examples/s]
Map (num_proc=16): 63%|██████▎ | 514000/818627 [08:04<02:14, 2267.02 examples/s]
Map (num_proc=16): 63%|██████▎ | 515000/818627 [08:05<02:17, 2203.40 examples/s]
Map (num_proc=16): 63%|██████▎ | 516000/818627 [08:05<02:29, 2021.70 examples/s]
Map (num_proc=16): 63%|██████▎ | 517000/818627 [08:07<04:10, 1202.70 examples/s]
Map (num_proc=16): 63%|██████▎ | 518000/818627 [08:12<10:37, 471.72 examples/s]
Map (num_proc=16): 63%|██████▎ | 519000/818627 [08:12<08:17, 602.25 examples/s]
Map (num_proc=16): 64%|██████▎ | 520000/818627 [08:15<10:06, 492.19 examples/s]
Map (num_proc=16): 64%|██████▎ | 521000/818627 [08:16<07:45, 639.70 examples/s]
Map (num_proc=16): 64%|██████▍ | 523000/818627 [08:16<04:24, 1119.67 examples/s]
Map (num_proc=16): 64%|██████▍ | 524000/818627 [08:16<03:38, 1350.09 examples/s]
Map (num_proc=16): 64%|██████▍ | 525000/818627 [08:17<03:26, 1419.22 examples/s]
Map (num_proc=16): 64%|██████▍ | 526000/818627 [08:17<03:12, 1518.75 examples/s]
Map (num_proc=16): 64%|██████▍ | 527000/818627 [08:18<02:58, 1635.38 examples/s]
Map (num_proc=16): 64%|██████▍ | 528000/818627 [08:18<02:39, 1818.26 examples/s]
Map (num_proc=16): 65%|██████▍ | 530000/818627 [08:19<01:59, 2419.70 examples/s]
Map (num_proc=16): 65%|██████▍ | 531000/818627 [08:19<01:44, 2740.11 examples/s]
Map (num_proc=16): 65%|██████▍ | 532000/818627 [08:20<01:59, 2399.82 examples/s]
Map (num_proc=16): 65%|██████▌ | 533000/818627 [08:21<03:33, 1340.66 examples/s]
Map (num_proc=16): 65%|██████▌ | 534000/818627 [08:26<09:13, 514.27 examples/s]
Map (num_proc=16): 65%|██████▌ | 535000/818627 [08:28<08:14, 573.23 examples/s]
Map (num_proc=16): 65%|██████▌ | 536000/818627 [08:30<09:11, 512.51 examples/s]
Map (num_proc=16): 66%|██████▌ | 537000/818627 [08:31<07:34, 619.02 examples/s]
Map (num_proc=16): 66%|██████▌ | 538000/818627 [08:31<05:31, 847.37 examples/s]
Map (num_proc=16): 66%|██████▌ | 539000/818627 [08:31<04:07, 1130.00 examples/s]
Map (num_proc=16): 66%|██████▌ | 541000/818627 [08:32<02:57, 1564.20 examples/s]
Map (num_proc=16): 66%|██████▌ | 542000/818627 [08:32<02:46, 1665.73 examples/s]
Map (num_proc=16): 66%|██████▋ | 543000/818627 [08:33<02:45, 1669.09 examples/s]
Map (num_proc=16): 66%|██████▋ | 544000/818627 [08:33<02:17, 2003.69 examples/s]
Map (num_proc=16): 67%|██████▋ | 545000/818627 [08:34<02:17, 1982.86 examples/s]
Map (num_proc=16): 67%|██████▋ | 546000/818627 [08:34<01:51, 2438.58 examples/s]
Map (num_proc=16): 67%|██████▋ | 547000/818627 [08:34<01:42, 2662.87 examples/s]
Map (num_proc=16): 67%|██████▋ | 548000/818627 [08:34<01:28, 3048.48 examples/s]
Map (num_proc=16): 67%|██████▋ | 549000/818627 [08:35<01:58, 2282.84 examples/s]
Map (num_proc=16): 67%|██████▋ | 550000/818627 [08:41<08:46, 509.97 examples/s]
Map (num_proc=16): 67%|██████▋ | 551000/818627 [08:42<08:09, 546.48 examples/s]
Map (num_proc=16): 67%|██████▋ | 552000/818627 [08:45<10:06, 439.79 examples/s]
Map (num_proc=16): 68%|██████▊ | 554000/818627 [08:46<05:46, 763.05 examples/s]
Map (num_proc=16): 68%|██████▊ | 555000/818627 [08:46<04:34, 958.79 examples/s]
Map (num_proc=16): 68%|██████▊ | 556000/818627 [08:47<03:56, 1109.89 examples/s]
Map (num_proc=16): 68%|██████▊ | 557000/818627 [08:47<02:58, 1463.14 examples/s]
Map (num_proc=16): 68%|██████▊ | 558000/818627 [08:47<02:30, 1727.02 examples/s]
Map (num_proc=16): 68%|██████▊ | 559000/818627 [08:48<02:53, 1496.65 examples/s]
Map (num_proc=16): 68%|██████▊ | 560000/818627 [08:48<02:23, 1800.71 examples/s]
Map (num_proc=16): 69%|██████▊ | 561000/818627 [08:48<01:49, 2354.55 examples/s]
Map (num_proc=16): 69%|██████▊ | 562000/818627 [08:49<01:45, 2424.18 examples/s]
Map (num_proc=16): 69%|██████▉ | 564000/818627 [08:49<01:45, 2416.13 examples/s]
Map (num_proc=16): 69%|██████▉ | 565000/818627 [08:50<01:29, 2835.61 examples/s]
Map (num_proc=16): 69%|██████▉ | 566000/818627 [08:56<07:56, 530.45 examples/s]
Map (num_proc=16): 69%|██████▉ | 567000/818627 [08:58<08:34, 489.38 examples/s]
Map (num_proc=16): 69%|██████▉ | 568000/818627 [09:00<07:55, 527.07 examples/s]
Map (num_proc=16): 70%|██████▉ | 569000/818627 [09:00<06:21, 653.63 examples/s]
Map (num_proc=16): 70%|██████▉ | 570000/818627 [09:01<04:56, 837.62 examples/s]
Map (num_proc=16): 70%|██████▉ | 573000/818627 [09:01<02:34, 1593.11 examples/s]
Map (num_proc=16): 70%|███████ | 574000/818627 [09:03<03:07, 1301.45 examples/s]
Map (num_proc=16): 70%|███████ | 576000/818627 [09:04<02:46, 1461.15 examples/s]
Map (num_proc=16): 71%|███████ | 578000/818627 [09:04<01:52, 2139.58 examples/s]
Map (num_proc=16): 71%|███████ | 579000/818627 [09:04<01:38, 2424.08 examples/s]
Map (num_proc=16): 71%|███████ | 580000/818627 [09:04<01:26, 2762.13 examples/s]
Map (num_proc=16): 71%|███████ | 581000/818627 [09:05<01:30, 2628.87 examples/s]
Map (num_proc=16): 71%|███████ | 582000/818627 [09:10<06:42, 587.20 examples/s]
Map (num_proc=16): 71%|███████ | 583000/818627 [09:14<08:49, 444.68 examples/s]
Map (num_proc=16): 71%|███████▏ | 584000/818627 [09:14<06:40, 586.46 examples/s]
Map (num_proc=16): 71%|███████▏ | 585000/818627 [09:15<05:56, 654.90 examples/s]
Map (num_proc=16): 72%|███████▏ | 586000/818627 [09:15<04:20, 892.56 examples/s]
Map (num_proc=16): 72%|███████▏ | 588000/818627 [09:16<02:52, 1333.59 examples/s]
Map (num_proc=16): 72%|███████▏ | 589000/818627 [09:16<02:33, 1497.49 examples/s]
Map (num_proc=16): 72%|███████▏ | 590000/818627 [09:17<02:46, 1375.66 examples/s]
Map (num_proc=16): 72%|███████▏ | 591000/818627 [09:18<02:42, 1403.02 examples/s]
Map (num_proc=16): 72%|███████▏ | 592000/818627 [09:18<02:04, 1819.07 examples/s]
Map (num_proc=16): 72%|███████▏ | 593000/818627 [09:18<01:35, 2365.46 examples/s]
Map (num_proc=16): 73%|███████▎ | 594000/818627 [09:19<01:59, 1882.64 examples/s]
Map (num_proc=16): 73%|███████▎ | 597000/818627 [09:19<01:07, 3271.95 examples/s]
Map (num_proc=16): 73%|███████▎ | 598000/818627 [09:25<05:20, 688.47 examples/s]
Map (num_proc=16): 73%|███████▎ | 599000/818627 [09:29<06:58, 524.86 examples/s]
Map (num_proc=16): 73%|███████▎ | 600000/818627 [09:30<06:02, 602.54 examples/s]
Map (num_proc=16): 73%|███████▎ | 601000/818627 [09:30<04:41, 773.28 examples/s]
Map (num_proc=16): 74%|███████▎ | 602000/818627 [09:30<03:37, 997.69 examples/s]
Map (num_proc=16): 74%|███████▎ | 603000/818627 [09:31<03:35, 1001.66 examples/s]
Map (num_proc=16): 74%|███████▍ | 604000/818627 [09:31<02:39, 1343.87 examples/s]
Map (num_proc=16): 74%|███████▍ | 606000/818627 [09:32<02:23, 1477.44 examples/s]
Map (num_proc=16): 74%|███████▍ | 607000/818627 [09:33<02:08, 1643.41 examples/s]
Map (num_proc=16): 74%|███████▍ | 608000/818627 [09:33<01:58, 1778.93 examples/s]
Map (num_proc=16): 75%|███████▍ | 610000/818627 [09:34<01:34, 2214.90 examples/s]
Map (num_proc=16): 75%|███████▍ | 611000/818627 [09:34<01:46, 1956.59 examples/s]
Map (num_proc=16): 75%|███████▍ | 612000/818627 [09:35<01:28, 2338.32 examples/s]
Map (num_proc=16): 75%|███████▍ | 613000/818627 [09:35<01:11, 2892.18 examples/s]
Map (num_proc=16): 75%|███████▌ | 614000/818627 [09:40<05:57, 572.71 examples/s]
Map (num_proc=16): 75%|███████▌ | 615000/818627 [09:43<06:46, 501.06 examples/s]
Map (num_proc=16): 75%|███████▌ | 616000/818627 [09:44<05:50, 577.42 examples/s]
Map (num_proc=16): 75%|███████▌ | 617000/818627 [09:45<05:29, 611.44 examples/s]
Map (num_proc=16): 76%|███████▌ | 619000/818627 [09:46<03:11, 1041.51 examples/s]
Map (num_proc=16): 76%|███████▌ | 621000/818627 [09:46<02:14, 1471.83 examples/s]
Map (num_proc=16): 76%|███████▌ | 622000/818627 [09:47<02:07, 1538.02 examples/s]
Map (num_proc=16): 76%|███████▌ | 623000/818627 [09:48<02:32, 1282.53 examples/s]
Map (num_proc=16): 76%|███████▌ | 624000/818627 [09:48<02:02, 1592.29 examples/s]
Map (num_proc=16): 76%|███████▋ | 626000/818627 [09:49<01:29, 2149.59 examples/s]
Map (num_proc=16): 77%|███████▋ | 627000/818627 [09:49<01:27, 2188.52 examples/s]
Map (num_proc=16): 77%|███████▋ | 628000/818627 [09:49<01:20, 2380.88 examples/s]
Map (num_proc=16): 77%|███████▋ | 629000/818627 [09:50<01:27, 2163.53 examples/s]
Map (num_proc=16): 77%|███████▋ | 630000/818627 [09:55<05:19, 590.45 examples/s]
Map (num_proc=16): 77%|███████▋ | 631000/818627 [09:57<05:23, 579.94 examples/s]
Map (num_proc=16): 77%|███████▋ | 632000/818627 [09:58<05:15, 591.76 examples/s]
Map (num_proc=16): 77%|███████▋ | 633000/818627 [10:00<05:18, 582.65 examples/s]
Map (num_proc=16): 77%|███████▋ | 634000/818627 [10:00<04:06, 749.57 examples/s]
Map (num_proc=16): 78%|███████▊ | 635000/818627 [10:01<03:08, 974.14 examples/s]
Map (num_proc=16): 78%|███████▊ | 636000/818627 [10:01<02:18, 1315.05 examples/s]
Map (num_proc=16): 78%|███████▊ | 639000/818627 [10:02<01:50, 1624.96 examples/s]
Map (num_proc=16): 78%|███████▊ | 641000/818627 [10:03<01:41, 1752.05 examples/s]
Map (num_proc=16): 79%|███████▊ | 643000/818627 [10:03<01:10, 2500.28 examples/s]
Map (num_proc=16): 79%|███████▊ | 644000/818627 [10:04<01:06, 2642.92 examples/s]
Map (num_proc=16): 79%|███████▉ | 645000/818627 [10:04<01:18, 2198.44 examples/s]
Map (num_proc=16): 79%|███████▉ | 646000/818627 [10:09<04:09, 692.33 examples/s]
Map (num_proc=16): 79%|███████▉ | 647000/818627 [10:12<05:02, 568.06 examples/s]
Map (num_proc=16): 79%|███████▉ | 648000/818627 [10:12<04:04, 697.72 examples/s]
Map (num_proc=16): 79%|███████▉ | 649000/818627 [10:14<04:23, 643.01 examples/s]
Map (num_proc=16): 79%|███████▉ | 650000/818627 [10:15<03:36, 778.34 examples/s]
Map (num_proc=16): 80%|███████▉ | 651000/818627 [10:16<03:07, 895.10 examples/s]
Map (num_proc=16): 80%|███████▉ | 652000/818627 [10:16<02:22, 1170.50 examples/s]
Map (num_proc=16): 80%|████████ | 655000/818627 [10:17<01:48, 1512.28 examples/s]
Map (num_proc=16): 80%|████████ | 657000/818627 [10:18<01:38, 1647.19 examples/s]
Map (num_proc=16): 80%|████████ | 658000/818627 [10:19<01:30, 1773.94 examples/s]
Map (num_proc=16): 81%|████████ | 659000/818627 [10:19<01:31, 1741.24 examples/s]
Map (num_proc=16): 81%|████████ | 660000/818627 [10:20<01:24, 1877.00 examples/s]
Map (num_proc=16): 81%|████████ | 661000/818627 [10:23<03:10, 827.40 examples/s]
Map (num_proc=16): 81%|████████ | 662000/818627 [10:24<02:56, 888.53 examples/s]
Map (num_proc=16): 81%|████████ | 663000/818627 [10:26<03:50, 675.82 examples/s]
Map (num_proc=16): 81%|████████ | 664000/818627 [10:27<03:00, 854.72 examples/s]
Map (num_proc=16): 81%|████████ | 665000/818627 [10:30<04:28, 571.75 examples/s]
Map (num_proc=16): 81%|████████▏ | 666000/818627 [10:30<03:27, 735.15 examples/s]
Map (num_proc=16): 82%|████████▏ | 668000/818627 [10:31<02:05, 1203.31 examples/s]
Map (num_proc=16): 82%|████████▏ | 670000/818627 [10:31<01:24, 1758.99 examples/s]
Map (num_proc=16): 82%|████████▏ | 671000/818627 [10:32<01:47, 1368.12 examples/s]
Map (num_proc=16): 82%|████████▏ | 672000/818627 [10:33<01:40, 1451.83 examples/s]
Map (num_proc=16): 82%|████████▏ | 674000/818627 [10:33<01:19, 1809.14 examples/s]
Map (num_proc=16): 82%|████████▏ | 675000/818627 [10:35<01:37, 1479.40 examples/s]
Map (num_proc=16): 83%|████████▎ | 676000/818627 [10:35<01:33, 1519.03 examples/s]
Map (num_proc=16): 83%|████████▎ | 677000/818627 [10:37<02:33, 923.62 examples/s]
Map (num_proc=16): 83%|████████▎ | 678000/818627 [10:39<02:33, 917.78 examples/s]
Map (num_proc=16): 83%|████████▎ | 679000/818627 [10:42<03:46, 616.63 examples/s]
Map (num_proc=16): 83%|████████▎ | 680000/818627 [10:42<03:16, 703.73 examples/s]
Map (num_proc=16): 83%|████████▎ | 681000/818627 [10:44<03:37, 633.47 examples/s]
Map (num_proc=16): 83%|████████▎ | 682000/818627 [10:45<02:52, 789.99 examples/s]
Map (num_proc=16): 83%|████████▎ | 683000/818627 [10:45<02:17, 985.34 examples/s]
Map (num_proc=16): 84%|████████▎ | 685000/818627 [10:46<01:37, 1364.62 examples/s]
Map (num_proc=16): 84%|████████▍ | 686000/818627 [10:46<01:22, 1603.14 examples/s]
Map (num_proc=16): 84%|████████▍ | 687000/818627 [10:48<01:38, 1333.46 examples/s]
Map (num_proc=16): 84%|████████▍ | 688000/818627 [10:48<01:21, 1603.02 examples/s]
Map (num_proc=16): 84%|████████▍ | 689000/818627 [10:48<01:09, 1875.03 examples/s]
Map (num_proc=16): 84%|████████▍ | 691000/818627 [10:50<01:34, 1352.50 examples/s]
Map (num_proc=16): 85%|████████▍ | 692000/818627 [10:51<01:39, 1271.30 examples/s]
Map (num_proc=16): 85%|████████▍ | 693000/818627 [10:52<01:45, 1191.99 examples/s]
Map (num_proc=16): 85%|████████▍ | 694000/818627 [10:53<01:56, 1070.20 examples/s]
Map (num_proc=16): 85%|████████▍ | 695000/818627 [10:56<03:06, 664.40 examples/s]
Map (num_proc=16): 85%|████████▌ | 696000/818627 [10:57<02:50, 719.57 examples/s]
Map (num_proc=16): 85%|████████▌ | 697000/818627 [10:59<03:10, 637.94 examples/s]
Map (num_proc=16): 85%|████████▌ | 698000/818627 [11:00<02:24, 837.09 examples/s]
Map (num_proc=16): 85%|████████▌ | 699000/818627 [11:00<02:02, 975.41 examples/s]
Map (num_proc=16): 86%|████████▌ | 701000/818627 [11:01<01:21, 1436.38 examples/s]
Map (num_proc=16): 86%|████████▌ | 702000/818627 [11:02<01:25, 1359.27 examples/s]
Map (num_proc=16): 86%|████████▌ | 703000/818627 [11:02<01:15, 1531.90 examples/s]
Map (num_proc=16): 86%|████████▌ | 704000/818627 [11:03<01:06, 1723.94 examples/s]
Map (num_proc=16): 86%|████████▌ | 705000/818627 [11:03<01:01, 1847.57 examples/s]
Map (num_proc=16): 86%|████████▌ | 706000/818627 [11:04<01:04, 1732.88 examples/s]
Map (num_proc=16): 86%|████████▋ | 707000/818627 [11:06<01:57, 953.68 examples/s]
Map (num_proc=16): 86%|████████▋ | 708000/818627 [11:06<01:35, 1157.16 examples/s]
Map (num_proc=16): 87%|████████▋ | 709000/818627 [11:07<01:16, 1434.11 examples/s]
Map (num_proc=16): 87%|████████▋ | 710000/818627 [11:08<01:32, 1178.11 examples/s]
Map (num_proc=16): 87%|████████▋ | 711000/818627 [11:10<02:23, 748.06 examples/s]
Map (num_proc=16): 87%|████████▋ | 712000/818627 [11:13<03:04, 576.73 examples/s]
Map (num_proc=16): 87%|████████▋ | 713000/818627 [11:14<02:41, 654.95 examples/s]
Map (num_proc=16): 87%|████████▋ | 714000/818627 [11:15<02:25, 717.36 examples/s]
Map (num_proc=16): 87%|████████▋ | 715000/818627 [11:15<01:45, 986.78 examples/s]
Map (num_proc=16): 87%|████████▋ | 716000/818627 [11:15<01:21, 1252.36 examples/s]
Map (num_proc=16): 88%|████████▊ | 717000/818627 [11:17<01:41, 997.39 examples/s]
Map (num_proc=16): 88%|████████▊ | 718000/818627 [11:17<01:20, 1255.82 examples/s]
Map (num_proc=16): 88%|████████▊ | 720000/818627 [11:18<01:02, 1580.53 examples/s]
Map (num_proc=16): 88%|████████▊ | 722000/818627 [11:21<01:25, 1135.11 examples/s]
Map (num_proc=16): 88%|████████▊ | 723000/818627 [11:21<01:22, 1158.89 examples/s]
Map (num_proc=16): 88%|████████▊ | 724000/818627 [11:22<01:22, 1146.13 examples/s]
Map (num_proc=16): 89%|████████▊ | 725000/818627 [11:23<01:08, 1373.89 examples/s]
Map (num_proc=16): 89%|████████▊ | 726000/818627 [11:24<01:23, 1105.31 examples/s]
Map (num_proc=16): 89%|████████▉ | 727000/818627 [11:24<01:05, 1401.17 examples/s]
Map (num_proc=16): 89%|████████▉ | 728000/818627 [11:28<02:10, 692.59 examples/s]
Map (num_proc=16): 89%|████████▉ | 729000/818627 [11:28<01:39, 899.28 examples/s]
Map (num_proc=16): 89%|████████▉ | 730000/818627 [11:30<02:01, 731.21 examples/s]
Map (num_proc=16): 89%|████████▉ | 732000/818627 [11:31<01:24, 1021.39 examples/s]
Map (num_proc=16): 90%|████████▉ | 734000/818627 [11:32<01:06, 1273.42 examples/s]
Map (num_proc=16): 90%|████████▉ | 735000/818627 [11:32<01:02, 1334.00 examples/s]
Map (num_proc=16): 90%|████████▉ | 736000/818627 [11:33<01:02, 1315.26 examples/s]
Map (num_proc=16): 90%|█████████ | 738000/818627 [11:35<01:04, 1256.15 examples/s]
Map (num_proc=16): 90%|█████████ | 739000/818627 [11:37<01:26, 922.67 examples/s]
Map (num_proc=16): 90%|█████████ | 740000/818627 [11:37<01:10, 1117.88 examples/s]
Map (num_proc=16): 91%|█████████ | 741000/818627 [11:38<01:03, 1215.15 examples/s]
Map (num_proc=16): 91%|█████████ | 742000/818627 [11:38<00:52, 1457.76 examples/s]
Map (num_proc=16): 91%|█████████ | 743000/818627 [11:39<01:00, 1253.43 examples/s]
Map (num_proc=16): 91%|█████████ | 744000/818627 [11:42<01:37, 761.79 examples/s]
Map (num_proc=16): 91%|█████████ | 745000/818627 [11:43<01:22, 889.52 examples/s]
Map (num_proc=16): 91%|█████████ | 746000/818627 [11:45<01:49, 663.50 examples/s]
Map (num_proc=16): 91%|█████████▏| 747000/818627 [11:45<01:24, 849.41 examples/s]
Map (num_proc=16): 91%|█████████▏| 748000/818627 [11:46<01:02, 1127.99 examples/s]
Map (num_proc=16): 91%|█████████▏| 749000/818627 [11:47<01:03, 1092.66 examples/s]
Map (num_proc=16): 92%|█████████▏| 750000/818627 [11:47<01:00, 1136.48 examples/s]
Map (num_proc=16): 92%|█████████▏| 751000/818627 [11:49<01:06, 1023.60 examples/s]
Map (num_proc=16): 92%|█████████▏| 752000/818627 [11:49<00:47, 1399.11 examples/s]
Map (num_proc=16): 92%|█████████▏| 753000/818627 [11:49<00:42, 1526.52 examples/s]
Map (num_proc=16): 92%|█████████▏| 754000/818627 [11:50<00:45, 1422.10 examples/s]
Map (num_proc=16): 92%|█████████▏| 755000/818627 [11:52<01:05, 970.82 examples/s]
Map (num_proc=16): 92%|█████████▏| 756000/818627 [11:52<00:52, 1188.07 examples/s]
Map (num_proc=16): 93%|█████████▎| 758000/818627 [11:53<00:31, 1938.14 examples/s]
Map (num_proc=16): 93%|█████████▎| 759000/818627 [11:54<00:48, 1237.66 examples/s]
Map (num_proc=16): 93%|█████████▎| 760000/818627 [11:57<01:16, 766.83 examples/s]
Map (num_proc=16): 93%|█████████▎| 761000/818627 [11:58<01:07, 857.12 examples/s]
Map (num_proc=16): 93%|█████████▎| 762000/818627 [11:59<01:13, 771.13 examples/s]
Map (num_proc=16): 93%|█████████▎| 763000/818627 [12:00<01:00, 914.79 examples/s]
Map (num_proc=16): 93%|█████████▎| 764000/818627 [12:01<01:05, 828.83 examples/s]
Map (num_proc=16): 93%|█████████▎| 765000/818627 [12:02<00:51, 1049.41 examples/s]
Map (num_proc=16): 94%|█████████▎| 766000/818627 [12:02<00:44, 1190.67 examples/s]
Map (num_proc=16): 94%|█████████▎| 767000/818627 [12:03<00:46, 1119.54 examples/s]
Map (num_proc=16): 94%|█████████▍| 769000/818627 [12:04<00:31, 1570.35 examples/s]
Map (num_proc=16): 94%|█████████▍| 770000/818627 [12:04<00:26, 1864.64 examples/s]
Map (num_proc=16): 94%|█████████▍| 771000/818627 [12:06<00:38, 1233.80 examples/s]
Map (num_proc=16): 94%|█████████▍| 772000/818627 [12:07<00:39, 1167.64 examples/s]
Map (num_proc=16): 94%|█████████▍| 773000/818627 [12:07<00:30, 1517.64 examples/s]
Map (num_proc=16): 95%|█████████▍| 774000/818627 [12:07<00:24, 1817.98 examples/s]
Map (num_proc=16): 95%|█████████▍| 775000/818627 [12:09<00:43, 1006.15 examples/s]
Map (num_proc=16): 95%|█████████▍| 776000/818627 [12:11<00:55, 772.62 examples/s]
Map (num_proc=16): 95%|█████████▍| 777000/818627 [12:13<00:56, 738.62 examples/s]
Map (num_proc=16): 95%|█████████▌| 778000/818627 [12:14<00:54, 745.96 examples/s]
Map (num_proc=16): 95%|█████████▌| 779000/818627 [12:14<00:40, 967.42 examples/s]
Map (num_proc=16): 95%|█████████▌| 780000/818627 [12:17<00:52, 738.99 examples/s]
Map (num_proc=16): 95%|█████████▌| 781000/818627 [12:17<00:39, 963.69 examples/s]
Map (num_proc=16): 96%|█████████▌| 782000/818627 [12:17<00:29, 1230.70 examples/s]
Map (num_proc=16): 96%|█████████▌| 783000/818627 [12:18<00:24, 1443.97 examples/s]
Map (num_proc=16): 96%|█████████▌| 784000/818627 [12:18<00:26, 1325.98 examples/s]
Map (num_proc=16): 96%|█████████▌| 786000/818627 [12:19<00:16, 2004.56 examples/s]
Map (num_proc=16): 96%|█████████▌| 787000/818627 [12:19<00:13, 2380.06 examples/s]
Map (num_proc=16): 96%|█████████▋| 788000/818627 [12:21<00:25, 1199.25 examples/s]
Map (num_proc=16): 96%|█████████▋| 789164/818627 [12:22<00:25, 1155.33 examples/s]
Map (num_proc=16): 97%|█████████▋| 790164/818627 [12:23<00:23, 1223.14 examples/s]
Map (num_proc=16): 97%|█████████▋| 791164/818627 [12:25<00:31, 867.02 examples/s]
Map (num_proc=16): 97%|█████████▋| 792164/818627 [12:25<00:22, 1164.92 examples/s]
Map (num_proc=16): 97%|█████████▋| 793328/818627 [12:27<00:31, 808.79 examples/s]
Map (num_proc=16): 97%|█████████▋| 794328/818627 [12:28<00:27, 878.01 examples/s]
Map (num_proc=16): 97%|█████████▋| 795493/818627 [12:30<00:32, 719.58 examples/s]
Map (num_proc=16): 97%|█████████▋| 797493/818627 [12:31<00:18, 1152.03 examples/s]
Map (num_proc=16): 98%|█████████▊| 798493/818627 [12:31<00:14, 1363.23 examples/s]
Map (num_proc=16): 98%|█████████▊| 799493/818627 [12:32<00:13, 1404.64 examples/s]
Map (num_proc=16): 98%|█████████▊| 800493/818627 [12:32<00:09, 1820.57 examples/s]
Map (num_proc=16): 98%|█████████▊| 801493/818627 [12:32<00:07, 2278.21 examples/s]
Map (num_proc=16): 98%|█████████▊| 802493/818627 [12:32<00:06, 2365.50 examples/s]
Map (num_proc=16): 98%|█████████▊| 803821/818627 [12:34<00:10, 1393.91 examples/s]
Map (num_proc=16): 98%|█████████▊| 804821/818627 [12:35<00:09, 1491.32 examples/s]
Map (num_proc=16): 98%|█████████▊| 805821/818627 [12:35<00:07, 1623.12 examples/s]
Map (num_proc=16): 99%|█████████▊| 806821/818627 [12:37<00:09, 1197.73 examples/s]
Map (num_proc=16): 99%|█████████▊| 807985/818627 [12:39<00:12, 862.85 examples/s]
Map (num_proc=16): 99%|█████████▉| 808985/818627 [12:39<00:10, 953.63 examples/s]
Map (num_proc=16): 99%|█████████▉| 809150/818627 [12:40<00:11, 796.40 examples/s]
Map (num_proc=16): 99%|█████████▉| 809314/818627 [12:41<00:14, 642.08 examples/s]
Map (num_proc=16): 99%|█████████▉| 810314/818627 [12:41<00:07, 1050.65 examples/s]
Map (num_proc=16): 99%|█████████▉| 811314/818627 [12:41<00:04, 1465.11 examples/s]
Map (num_proc=16): 99%|█████████▉| 812314/818627 [12:42<00:03, 1792.62 examples/s]
Map (num_proc=16): 99%|█████████▉| 813314/818627 [12:42<00:02, 2431.36 examples/s]
Map (num_proc=16): 99%|█████████▉| 814478/818627 [12:42<00:01, 2373.55 examples/s]
Map (num_proc=16): 100%|█████████▉| 814970/818627 [12:43<00:02, 1691.06 examples/s]
Map (num_proc=16): 100%|█████████▉| 815970/818627 [12:43<00:01, 2348.92 examples/s]
Map (num_proc=16): 100%|█████████▉| 817134/818627 [12:44<00:00, 2392.13 examples/s]
Map (num_proc=16): 100%|█████████▉| 818298/818627 [12:45<00:00, 1574.09 examples/s]
Map (num_proc=16): 100%|██████████| 818627/818627 [12:46<00:00, 1067.63 examples/s]
+/workspace/miniconda3/envs/spec/lib/python3.11/site-packages/torch/distributed/distributed_c10d.py:4876: UserWarning: barrier(): using the device under current context. You can specify `device_id` in `init_process_group` to mute this warning.
+ warnings.warn( # warn only once
+[rank0]:[W323 13:02:24.876799111 ProcessGroupNCCL.cpp:5072] Guessing device ID based on global rank. This can cause a hang if rank to GPU mapping is heterogeneous. You can specify device_id in init_process_group()
+
Filter: 0%| | 0/818627 [00:00, ? examples/s]dataset is cached at /tmp/specforge_cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkldataset is cached at /tmp/specforge_cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkl
+
+dataset is cached at /tmp/specforge_cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkl
+dataset is cached at /tmp/specforge_cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkldataset is cached at /tmp/specforge_cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkl
+
+dataset is cached at /tmp/specforge_cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkl
+dataset is cached at /tmp/specforge_cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkl
+
Filter: 0%| | 2000/818627 [00:00<01:11, 11400.34 examples/s]
Filter: 0%| | 0/818627 [00:00, ? examples/s]
Filter: 0%| | 0/818627 [00:00, ? examples/s]
Filter: 0%| | 0/818627 [00:00, ? examples/s]
Filter: 0%| | 0/818627 [00:00, ? examples/s]
Filter: 0%| | 0/818627 [00:00, ? examples/s]
Filter: 0%| | 0/818627 [00:00, ? examples/s]
Filter: 0%| | 0/818627 [00:00, ? examples/s]
Filter: 0%| | 4000/818627 [00:00<01:05, 12518.10 examples/s]
Filter: 0%| | 2000/818627 [00:00<01:01, 13204.46 examples/s]
Filter: 0%| | 2000/818627 [00:00<01:01, 13277.48 examples/s]
Filter: 0%| | 2000/818627 [00:00<01:02, 13120.03 examples/s]
Filter: 0%| | 2000/818627 [00:00<01:05, 12512.49 examples/s]
Filter: 0%| | 2000/818627 [00:00<01:05, 12535.75 examples/s]
Filter: 0%| | 2000/818627 [00:00<01:05, 12423.02 examples/s]
Filter: 0%| | 2000/818627 [00:00<01:04, 12657.85 examples/s]
Filter: 1%| | 6000/818627 [00:00<01:03, 12877.81 examples/s]
Filter: 0%| | 4000/818627 [00:00<01:00, 13554.32 examples/s]
Filter: 0%| | 4000/818627 [00:00<01:00, 13570.42 examples/s]
Filter: 0%| | 4000/818627 [00:00<01:01, 13251.77 examples/s]
Filter: 0%| | 4000/818627 [00:00<01:00, 13398.59 examples/s]
Filter: 0%| | 4000/818627 [00:00<01:00, 13363.44 examples/s]
Filter: 0%| | 4000/818627 [00:00<01:02, 12949.76 examples/s]
Filter: 0%| | 4000/818627 [00:00<00:59, 13676.50 examples/s]
Filter: 1%| | 6000/818627 [00:00<00:58, 13868.97 examples/s]
Filter: 1%| | 6000/818627 [00:00<00:58, 13879.95 examples/s]
Filter: 1%| | 8000/818627 [00:00<01:02, 12891.83 examples/s]
Filter: 1%| | 6000/818627 [00:00<01:00, 13543.11 examples/s]
Filter: 1%| | 6000/818627 [00:00<00:59, 13675.20 examples/s]
Filter: 1%| | 6000/818627 [00:00<00:59, 13659.49 examples/s]
Filter: 1%| | 6000/818627 [00:00<01:01, 13297.93 examples/s]
Filter: 1%| | 6000/818627 [00:00<00:58, 13912.57 examples/s]
Filter: 1%| | 8000/818627 [00:00<00:57, 14011.63 examples/s]
Filter: 1%| | 8000/818627 [00:00<00:57, 14015.93 examples/s]
Filter: 1%| | 8000/818627 [00:00<00:58, 13831.75 examples/s]
Filter: 1%| | 10000/818627 [00:00<01:01, 13162.99 examples/s]
Filter: 1%| | 8000/818627 [00:00<00:58, 13898.62 examples/s]
Filter: 1%| | 8000/818627 [00:00<00:56, 14243.11 examples/s]
Filter: 1%| | 8000/818627 [00:00<00:58, 13811.77 examples/s]
Filter: 1%| | 8000/818627 [00:00<00:59, 13616.11 examples/s]
Filter: 1%| | 10000/818627 [00:00<00:57, 14100.08 examples/s]
Filter: 1%| | 10000/818627 [00:00<00:57, 14077.49 examples/s]
Filter: 1%| | 10000/818627 [00:00<00:57, 14000.84 examples/s]
Filter: 1%| | 10000/818627 [00:00<00:56, 14276.05 examples/s]
Filter: 1%|▏ | 12000/818627 [00:00<01:00, 13337.54 examples/s]
Filter: 1%| | 10000/818627 [00:00<00:58, 13924.02 examples/s]
Filter: 1%| | 10000/818627 [00:00<00:58, 13806.44 examples/s]
Filter: 1%| | 10000/818627 [00:00<00:58, 13783.25 examples/s]
Filter: 1%|▏ | 12000/818627 [00:00<00:57, 14136.98 examples/s]
Filter: 1%|▏ | 12000/818627 [00:00<00:57, 14069.06 examples/s]
Filter: 1%|▏ | 12000/818627 [00:00<00:55, 14405.74 examples/s]
Filter: 1%|▏ | 12000/818627 [00:00<00:57, 14029.46 examples/s]
Filter: 1%|▏ | 12000/818627 [00:00<00:57, 13961.00 examples/s]
Filter: 2%|▏ | 14000/818627 [00:01<00:59, 13479.30 examples/s]
Filter: 1%|▏ | 12000/818627 [00:00<00:58, 13878.21 examples/s]
Filter: 1%|▏ | 12000/818627 [00:00<00:58, 13798.14 examples/s]
Filter: 2%|▏ | 14000/818627 [00:00<00:56, 14158.44 examples/s]
Filter: 2%|▏ | 14000/818627 [00:01<00:57, 14113.94 examples/s]
Filter: 2%|▏ | 14000/818627 [00:00<00:55, 14511.25 examples/s]
Filter: 2%|▏ | 14000/818627 [00:01<00:57, 14009.55 examples/s]
Filter: 2%|▏ | 14000/818627 [00:01<00:56, 14138.88 examples/s]
Filter: 2%|▏ | 16000/818627 [00:01<00:58, 13649.21 examples/s]
Filter: 2%|▏ | 14000/818627 [00:01<00:57, 13945.39 examples/s]
Filter: 2%|▏ | 14000/818627 [00:01<00:58, 13746.89 examples/s]
Filter: 2%|▏ | 16000/818627 [00:01<00:55, 14590.84 examples/s]
Filter: 2%|▏ | 16000/818627 [00:01<00:56, 14176.40 examples/s]
Filter: 2%|▏ | 16000/818627 [00:01<00:56, 14148.68 examples/s]
Filter: 2%|▏ | 16000/818627 [00:01<00:56, 14121.84 examples/s]
Filter: 2%|▏ | 16000/818627 [00:01<00:56, 14254.81 examples/s]
Filter: 2%|▏ | 18000/818627 [00:01<00:58, 13803.61 examples/s]
Filter: 2%|▏ | 16000/818627 [00:01<00:57, 13997.92 examples/s]
Filter: 2%|▏ | 16000/818627 [00:01<00:57, 13867.91 examples/s]
Filter: 2%|▏ | 18000/818627 [00:01<00:55, 14508.21 examples/s]
Filter: 2%|▏ | 18000/818627 [00:01<00:56, 14153.72 examples/s]
Filter: 2%|▏ | 18000/818627 [00:01<00:56, 14085.85 examples/s]
Filter: 2%|▏ | 18000/818627 [00:01<00:56, 14215.11 examples/s]
Filter: 2%|▏ | 18000/818627 [00:01<00:56, 14236.18 examples/s]
Filter: 2%|▏ | 20000/818627 [00:01<00:57, 13917.15 examples/s]
Filter: 2%|▏ | 18000/818627 [00:01<00:57, 14028.79 examples/s]
Filter: 2%|▏ | 18000/818627 [00:01<00:57, 13949.00 examples/s]
Filter: 2%|▏ | 20000/818627 [00:01<00:55, 14504.57 examples/s]
Filter: 2%|▏ | 20000/818627 [00:01<00:56, 14131.58 examples/s]
Filter: 2%|▏ | 20000/818627 [00:01<00:56, 14018.55 examples/s]
Filter: 2%|▏ | 20000/818627 [00:01<00:55, 14262.53 examples/s]
Filter: 2%|▏ | 20000/818627 [00:01<00:55, 14321.75 examples/s]
Filter: 3%|▎ | 22000/818627 [00:01<00:56, 14004.91 examples/s]
Filter: 2%|▏ | 20000/818627 [00:01<00:56, 14077.81 examples/s]
Filter: 2%|▏ | 20000/818627 [00:01<00:57, 13888.90 examples/s]
Filter: 3%|▎ | 22000/818627 [00:01<00:54, 14538.69 examples/s]
Filter: 3%|▎ | 22000/818627 [00:01<00:56, 14185.56 examples/s]
Filter: 3%|▎ | 22000/818627 [00:01<00:56, 14131.28 examples/s]
Filter: 3%|▎ | 22000/818627 [00:01<00:55, 14303.39 examples/s]
Filter: 3%|▎ | 22000/818627 [00:01<00:55, 14246.28 examples/s]
Filter: 3%|▎ | 24000/818627 [00:01<00:56, 14048.20 examples/s]
Filter: 3%|▎ | 22000/818627 [00:01<00:56, 14120.18 examples/s]
Filter: 3%|▎ | 22000/818627 [00:01<00:56, 13996.76 examples/s]
Filter: 3%|▎ | 24000/818627 [00:01<00:54, 14564.46 examples/s]
Filter: 3%|▎ | 24000/818627 [00:01<00:55, 14212.41 examples/s]
Filter: 3%|▎ | 24000/818627 [00:01<00:55, 14323.48 examples/s]
Filter: 3%|▎ | 24000/818627 [00:01<00:56, 14077.61 examples/s]
Filter: 3%|▎ | 24000/818627 [00:01<00:55, 14211.23 examples/s]
Filter: 3%|▎ | 26000/818627 [00:01<00:56, 14074.35 examples/s]
Filter: 3%|▎ | 24000/818627 [00:01<00:56, 14155.35 examples/s]
Filter: 3%|▎ | 24000/818627 [00:01<00:56, 14055.55 examples/s]
Filter: 3%|▎ | 26000/818627 [00:01<00:54, 14551.04 examples/s]
Filter: 3%|▎ | 26000/818627 [00:01<00:55, 14335.99 examples/s]
Filter: 3%|▎ | 26000/818627 [00:01<00:55, 14182.95 examples/s]
Filter: 3%|▎ | 26000/818627 [00:01<00:55, 14298.64 examples/s]
Filter: 3%|▎ | 26000/818627 [00:01<00:56, 13967.63 examples/s]
Filter: 3%|▎ | 26000/818627 [00:01<00:55, 14174.18 examples/s]
Filter: 3%|▎ | 28000/818627 [00:02<00:56, 14091.64 examples/s]
Filter: 3%|▎ | 26000/818627 [00:01<00:56, 14088.83 examples/s]
Filter: 3%|▎ | 28000/818627 [00:01<00:54, 14415.51 examples/s]
Filter: 3%|▎ | 28000/818627 [00:01<00:55, 14325.99 examples/s]
Filter: 3%|▎ | 28000/818627 [00:01<00:55, 14335.07 examples/s]
Filter: 3%|▎ | 28000/818627 [00:01<00:56, 14016.86 examples/s]
Filter: 3%|▎ | 28000/818627 [00:01<00:56, 13902.27 examples/s]
Filter: 3%|▎ | 28000/818627 [00:02<00:55, 14192.26 examples/s]
Filter: 4%|▎ | 30000/818627 [00:02<00:56, 13977.71 examples/s]
Filter: 3%|▎ | 28000/818627 [00:02<00:56, 14106.09 examples/s]
Filter: 4%|▎ | 30000/818627 [00:02<00:54, 14364.38 examples/s]
Filter: 4%|▎ | 30000/818627 [00:02<00:55, 14323.92 examples/s]
Filter: 4%|▎ | 30000/818627 [00:02<00:54, 14375.71 examples/s]
Filter: 4%|▎ | 30000/818627 [00:02<00:55, 14117.48 examples/s]
Filter: 4%|▎ | 30000/818627 [00:02<00:56, 14031.85 examples/s]
Filter: 4%|▎ | 30000/818627 [00:02<00:55, 14193.13 examples/s]
Filter: 4%|▍ | 32000/818627 [00:02<00:56, 13925.90 examples/s]
Filter: 4%|▎ | 30000/818627 [00:02<00:55, 14107.29 examples/s]
Filter: 4%|▍ | 32000/818627 [00:02<00:54, 14433.31 examples/s]
Filter: 4%|▍ | 32000/818627 [00:02<00:55, 14278.09 examples/s]
Filter: 4%|▍ | 32000/818627 [00:02<00:54, 14373.54 examples/s]
Filter: 4%|▍ | 32000/818627 [00:02<00:55, 14159.47 examples/s]
Filter: 4%|▍ | 32000/818627 [00:02<00:55, 14113.71 examples/s]
Filter: 4%|▍ | 32000/818627 [00:02<00:55, 14216.58 examples/s]
Filter: 4%|▍ | 34000/818627 [00:02<00:56, 13902.51 examples/s]
Filter: 4%|▍ | 32000/818627 [00:02<00:56, 13981.79 examples/s]
Filter: 4%|▍ | 34000/818627 [00:02<00:54, 14463.23 examples/s]
Filter: 4%|▍ | 34000/818627 [00:02<00:55, 14229.85 examples/s]
Filter: 4%|▍ | 34000/818627 [00:02<00:55, 14255.88 examples/s]
Filter: 4%|▍ | 34000/818627 [00:02<00:55, 14186.90 examples/s]
Filter: 4%|▍ | 34000/818627 [00:02<00:55, 14152.93 examples/s]
Filter: 4%|▍ | 34000/818627 [00:02<00:55, 14218.36 examples/s]
Filter: 4%|▍ | 36000/818627 [00:02<00:55, 13986.67 examples/s]
Filter: 4%|▍ | 34000/818627 [00:02<00:56, 13920.86 examples/s]
Filter: 4%|▍ | 36000/818627 [00:02<00:54, 14485.56 examples/s]
Filter: 4%|▍ | 36000/818627 [00:02<00:54, 14238.98 examples/s]
Filter: 4%|▍ | 36000/818627 [00:02<00:54, 14317.20 examples/s]
Filter: 4%|▍ | 36000/818627 [00:02<00:54, 14240.04 examples/s]
Filter: 4%|▍ | 36000/818627 [00:02<00:55, 14212.13 examples/s]
Filter: 4%|▍ | 36000/818627 [00:02<00:55, 14203.00 examples/s]
Filter: 5%|▍ | 38000/818627 [00:02<00:55, 14049.12 examples/s]
Filter: 4%|▍ | 36000/818627 [00:02<00:56, 13971.10 examples/s]
Filter: 5%|▍ | 38000/818627 [00:02<00:53, 14518.27 examples/s]
Filter: 5%|▍ | 38000/818627 [00:02<00:54, 14353.55 examples/s]
Filter: 5%|▍ | 38000/818627 [00:02<00:54, 14267.89 examples/s]
Filter: 5%|▍ | 38000/818627 [00:02<00:54, 14275.03 examples/s]
Filter: 5%|▍ | 38000/818627 [00:02<00:54, 14280.99 examples/s]
Filter: 5%|▍ | 38000/818627 [00:02<00:54, 14223.56 examples/s]
Filter: 5%|▍ | 40000/818627 [00:02<00:55, 14003.99 examples/s]
Filter: 5%|▍ | 38000/818627 [00:02<00:56, 13901.15 examples/s]
Filter: 5%|▍ | 40000/818627 [00:02<00:53, 14489.95 examples/s]
Filter: 5%|▍ | 40000/818627 [00:02<00:54, 14285.94 examples/s]
Filter: 5%|▍ | 40000/818627 [00:02<00:54, 14240.76 examples/s]
Filter: 5%|▍ | 40000/818627 [00:02<00:54, 14302.69 examples/s]
Filter: 5%|▍ | 40000/818627 [00:02<00:54, 14292.64 examples/s]
Filter: 5%|▍ | 40000/818627 [00:02<00:54, 14183.43 examples/s]
Filter: 5%|▌ | 42000/818627 [00:03<00:55, 14075.58 examples/s]
Filter: 5%|▍ | 40000/818627 [00:02<00:56, 13878.57 examples/s]
Filter: 5%|▌ | 42000/818627 [00:02<00:53, 14553.00 examples/s]
Filter: 5%|▌ | 42000/818627 [00:02<00:54, 14171.68 examples/s]
Filter: 5%|▌ | 42000/818627 [00:02<00:55, 14053.30 examples/s]
Filter: 5%|▌ | 42000/818627 [00:02<00:55, 14067.16 examples/s]
Filter: 5%|▌ | 42000/818627 [00:02<00:55, 14104.88 examples/s]
Filter: 5%|▌ | 42000/818627 [00:02<00:55, 14072.99 examples/s]
Filter: 5%|▌ | 44000/818627 [00:03<00:55, 13974.93 examples/s]
Filter: 5%|▌ | 42000/818627 [00:03<00:56, 13857.21 examples/s]
Filter: 5%|▌ | 44000/818627 [00:03<00:53, 14454.86 examples/s]
Filter: 5%|▌ | 44000/818627 [00:03<00:55, 14008.87 examples/s]
Filter: 5%|▌ | 44000/818627 [00:03<00:55, 14010.19 examples/s]
Filter: 5%|▌ | 44000/818627 [00:03<00:54, 14180.72 examples/s]
Filter: 5%|▌ | 44000/818627 [00:03<00:55, 14070.87 examples/s]
Filter: 5%|▌ | 44000/818627 [00:03<00:55, 13991.98 examples/s]
Filter: 6%|▌ | 46000/818627 [00:03<00:54, 14049.80 examples/s]
Filter: 5%|▌ | 44000/818627 [00:03<00:55, 13955.86 examples/s]
Filter: 6%|▌ | 46000/818627 [00:03<00:53, 14494.37 examples/s]
Filter: 6%|▌ | 46000/818627 [00:03<00:54, 14122.52 examples/s]
Filter: 6%|▌ | 46000/818627 [00:03<00:54, 14098.79 examples/s]
Filter: 6%|▌ | 46000/818627 [00:03<00:54, 14255.28 examples/s]
Filter: 6%|▌ | 46000/818627 [00:03<00:54, 14175.04 examples/s]
Filter: 6%|▌ | 46000/818627 [00:03<00:55, 13943.13 examples/s]
Filter: 6%|▌ | 48000/818627 [00:03<00:54, 14108.64 examples/s]
Filter: 6%|▌ | 46000/818627 [00:03<00:55, 14029.27 examples/s]
Filter: 6%|▌ | 48000/818627 [00:03<00:53, 14521.78 examples/s]
Filter: 6%|▌ | 48000/818627 [00:03<00:54, 14209.33 examples/s]
Filter: 6%|▌ | 48000/818627 [00:03<00:54, 14057.02 examples/s]
Filter: 6%|▌ | 48000/818627 [00:03<00:54, 14178.44 examples/s]
Filter: 6%|▌ | 48000/818627 [00:03<00:55, 13989.66 examples/s]
Filter: 6%|▌ | 48000/818627 [00:03<00:54, 14016.51 examples/s]
Filter: 6%|▌ | 50000/818627 [00:03<00:54, 14034.10 examples/s]
Filter: 6%|▌ | 48000/818627 [00:03<00:54, 14065.85 examples/s]
Filter: 6%|▌ | 50000/818627 [00:03<00:52, 14541.54 examples/s]
Filter: 6%|▌ | 50000/818627 [00:03<00:54, 14225.55 examples/s]
Filter: 6%|▌ | 50000/818627 [00:03<00:54, 14152.23 examples/s]
Filter: 6%|▌ | 50000/818627 [00:03<00:53, 14253.99 examples/s]
Filter: 6%|▌ | 50000/818627 [00:03<00:55, 13889.48 examples/s]
Filter: 6%|▌ | 50000/818627 [00:03<00:55, 13963.01 examples/s]
Filter: 6%|▋ | 52000/818627 [00:03<00:54, 13957.42 examples/s]
Filter: 6%|▌ | 50000/818627 [00:03<00:54, 14102.72 examples/s]
Filter: 6%|▋ | 52000/818627 [00:03<00:52, 14569.05 examples/s]
Filter: 6%|▋ | 52000/818627 [00:03<00:53, 14203.27 examples/s]
Filter: 6%|▋ | 52000/818627 [00:03<00:53, 14274.01 examples/s]
Filter: 6%|▋ | 52000/818627 [00:03<00:53, 14220.83 examples/s]
Filter: 6%|▋ | 52000/818627 [00:03<00:54, 14014.22 examples/s]
Filter: 6%|▋ | 52000/818627 [00:03<00:54, 14029.35 examples/s]
Filter: 7%|▋ | 54000/818627 [00:03<00:55, 13835.61 examples/s]
Filter: 6%|▋ | 52000/818627 [00:03<00:54, 14053.05 examples/s]
Filter: 7%|▋ | 54000/818627 [00:03<00:52, 14523.84 examples/s]
Filter: 7%|▋ | 54000/818627 [00:03<00:53, 14211.46 examples/s]
Filter: 7%|▋ | 54000/818627 [00:03<00:54, 14158.91 examples/s]
Filter: 7%|▋ | 54000/818627 [00:03<00:53, 14159.96 examples/s]
Filter: 7%|▋ | 54000/818627 [00:03<00:54, 14012.49 examples/s]
Filter: 7%|▋ | 54000/818627 [00:03<00:55, 13791.79 examples/s]
Filter: 7%|▋ | 56000/818627 [00:04<00:55, 13818.88 examples/s]
Filter: 7%|▋ | 54000/818627 [00:03<00:54, 14100.16 examples/s]
Filter: 7%|▋ | 56000/818627 [00:03<00:52, 14526.15 examples/s]
Filter: 7%|▋ | 56000/818627 [00:03<00:53, 14238.76 examples/s]
Filter: 7%|▋ | 56000/818627 [00:03<00:53, 14199.94 examples/s]
Filter: 7%|▋ | 56000/818627 [00:03<00:53, 14216.77 examples/s]
Filter: 7%|▋ | 56000/818627 [00:03<00:53, 14140.94 examples/s]
Filter: 7%|▋ | 56000/818627 [00:04<00:55, 13802.97 examples/s]
Filter: 7%|▋ | 56000/818627 [00:04<00:54, 14110.92 examples/s]
Filter: 7%|▋ | 58000/818627 [00:04<00:54, 13897.90 examples/s]
Filter: 7%|▋ | 58000/818627 [00:04<00:52, 14523.63 examples/s]
Filter: 7%|▋ | 58000/818627 [00:04<00:53, 14237.35 examples/s]
Filter: 7%|▋ | 58000/818627 [00:04<00:53, 14216.92 examples/s]
Filter: 7%|▋ | 58000/818627 [00:04<00:53, 14228.24 examples/s]
Filter: 7%|▋ | 58000/818627 [00:04<00:53, 14124.94 examples/s]
Filter: 7%|▋ | 58000/818627 [00:04<00:54, 13915.49 examples/s]
Filter: 7%|▋ | 60000/818627 [00:04<00:54, 13991.24 examples/s]
Filter: 7%|▋ | 58000/818627 [00:04<00:53, 14123.46 examples/s]
Filter: 7%|▋ | 60000/818627 [00:04<00:52, 14556.13 examples/s]
Filter: 7%|▋ | 60000/818627 [00:04<00:53, 14224.96 examples/s]
Filter: 7%|▋ | 60000/818627 [00:04<00:53, 14122.55 examples/s]
Filter: 7%|▋ | 60000/818627 [00:04<00:53, 14109.64 examples/s]
Filter: 7%|▋ | 60000/818627 [00:04<00:53, 14214.91 examples/s]
Filter: 7%|▋ | 60000/818627 [00:04<00:54, 14004.72 examples/s]
Filter: 8%|▊ | 62000/818627 [00:04<00:53, 14069.43 examples/s]
Filter: 7%|▋ | 60000/818627 [00:04<00:54, 14002.10 examples/s]
Filter: 8%|▊ | 62000/818627 [00:04<00:51, 14570.90 examples/s]
Filter: 8%|▊ | 62000/818627 [00:04<00:53, 14207.15 examples/s]
Filter: 8%|▊ | 62000/818627 [00:04<00:53, 14152.31 examples/s]
Filter: 8%|▊ | 62000/818627 [00:04<00:53, 14087.86 examples/s]
Filter: 8%|▊ | 62000/818627 [00:04<00:52, 14280.83 examples/s]
Filter: 8%|▊ | 62000/818627 [00:04<00:53, 14060.39 examples/s]
Filter: 8%|▊ | 64000/818627 [00:04<00:53, 14126.58 examples/s]
Filter: 8%|▊ | 64000/818627 [00:04<00:51, 14557.62 examples/s]
Filter: 8%|▊ | 62000/818627 [00:04<00:54, 13895.66 examples/s]
Filter: 8%|▊ | 64000/818627 [00:04<00:53, 14205.35 examples/s]
Filter: 8%|▊ | 64000/818627 [00:04<00:53, 14170.53 examples/s]
Filter: 8%|▊ | 64000/818627 [00:04<00:53, 14171.87 examples/s]
Filter: 8%|▊ | 64000/818627 [00:04<00:53, 14005.87 examples/s]
Filter: 8%|▊ | 64000/818627 [00:04<00:53, 14101.15 examples/s]
Filter: 8%|▊ | 66000/818627 [00:04<00:53, 14144.00 examples/s]
Filter: 8%|▊ | 66000/818627 [00:04<00:51, 14560.97 examples/s]
Filter: 8%|▊ | 64000/818627 [00:04<00:54, 13948.02 examples/s]
Filter: 8%|▊ | 66000/818627 [00:04<00:53, 14196.20 examples/s]
Filter: 8%|▊ | 66000/818627 [00:04<00:53, 14074.97 examples/s]
Filter: 8%|▊ | 66000/818627 [00:04<00:53, 14081.73 examples/s]
Filter: 8%|▊ | 66000/818627 [00:04<00:53, 14119.38 examples/s]
Filter: 8%|▊ | 66000/818627 [00:04<00:53, 14134.16 examples/s]
Filter: 8%|▊ | 68000/818627 [00:04<00:52, 14184.90 examples/s]
Filter: 8%|▊ | 68000/818627 [00:04<00:51, 14551.45 examples/s]
Filter: 8%|▊ | 66000/818627 [00:04<00:54, 13770.73 examples/s]
Filter: 8%|▊ | 68000/818627 [00:04<00:53, 14072.28 examples/s]
Filter: 8%|▊ | 68000/818627 [00:04<00:53, 14129.43 examples/s]
Filter: 8%|▊ | 68000/818627 [00:04<00:53, 14141.22 examples/s]
Filter: 8%|▊ | 68000/818627 [00:04<00:54, 13786.74 examples/s]
Filter: 8%|▊ | 68000/818627 [00:04<00:53, 14142.77 examples/s]
Filter: 9%|▊ | 70000/818627 [00:04<00:51, 14549.75 examples/s]
Filter: 9%|▊ | 70000/818627 [00:05<00:52, 14224.59 examples/s]
Filter: 8%|▊ | 68000/818627 [00:04<00:54, 13815.22 examples/s]
Filter: 9%|▊ | 70000/818627 [00:04<00:53, 14080.62 examples/s]
Filter: 9%|▊ | 70000/818627 [00:04<00:52, 14165.62 examples/s]
Filter: 9%|▊ | 70000/818627 [00:04<00:52, 14178.24 examples/s]
Filter: 9%|▊ | 70000/818627 [00:04<00:53, 13910.02 examples/s]
Filter: 9%|▊ | 70000/818627 [00:04<00:52, 14175.54 examples/s]
Filter: 9%|▉ | 72000/818627 [00:04<00:51, 14590.17 examples/s]
Filter: 9%|▉ | 72000/818627 [00:05<00:52, 14094.54 examples/s]
Filter: 9%|▊ | 70000/818627 [00:05<00:54, 13772.09 examples/s]
Filter: 9%|▉ | 72000/818627 [00:05<00:52, 14188.04 examples/s]
Filter: 9%|▉ | 72000/818627 [00:05<00:52, 14112.69 examples/s]
Filter: 9%|▉ | 72000/818627 [00:05<00:52, 14208.03 examples/s]
Filter: 9%|▉ | 72000/818627 [00:05<00:53, 14024.31 examples/s]
Filter: 9%|▉ | 74000/818627 [00:05<00:51, 14589.41 examples/s]
Filter: 9%|▉ | 72000/818627 [00:05<00:52, 14203.93 examples/s]
Filter: 9%|▉ | 74000/818627 [00:05<00:52, 14143.86 examples/s]
Filter: 9%|▉ | 72000/818627 [00:05<00:53, 13862.12 examples/s]
Filter: 9%|▉ | 74000/818627 [00:05<00:52, 14144.25 examples/s]
Filter: 9%|▉ | 74000/818627 [00:05<00:52, 14090.48 examples/s]
Filter: 9%|▉ | 74000/818627 [00:05<00:53, 13982.69 examples/s]
Filter: 9%|▉ | 74000/818627 [00:05<00:52, 14094.12 examples/s]
Filter: 9%|▉ | 74000/818627 [00:05<00:52, 14226.85 examples/s]
Filter: 9%|▉ | 76000/818627 [00:05<00:52, 14102.11 examples/s]
Filter: 9%|▉ | 74000/818627 [00:05<00:53, 13904.91 examples/s]
Filter: 10%|▉ | 78000/818627 [00:05<00:52, 14055.49 examples/s]
Filter: 9%|▉ | 76000/818627 [00:05<01:26, 8566.38 examples/s]
Filter: 9%|▉ | 76000/818627 [00:05<01:32, 8061.19 examples/s]
Filter: 9%|▉ | 76000/818627 [00:05<01:32, 8032.91 examples/s]
Filter: 9%|▉ | 76000/818627 [00:05<01:32, 8069.45 examples/s]
Filter: 9%|▉ | 76000/818627 [00:05<01:36, 7734.26 examples/s]
Filter: 9%|▉ | 76000/818627 [00:05<01:32, 8019.52 examples/s]
Filter: 9%|▉ | 76000/818627 [00:05<01:52, 6574.59 examples/s]
Filter: 10%|▉ | 78000/818627 [00:05<01:17, 9569.97 examples/s]
Filter: 10%|▉ | 78000/818627 [00:05<01:20, 9230.97 examples/s]
Filter: 10%|▉ | 78000/818627 [00:05<01:20, 9216.27 examples/s]
Filter: 10%|▉ | 78000/818627 [00:05<01:20, 9245.76 examples/s]
Filter: 10%|▉ | 80000/818627 [00:06<01:29, 8283.21 examples/s]
Filter: 10%|▉ | 78000/818627 [00:05<01:22, 8947.42 examples/s]
Filter: 10%|▉ | 78000/818627 [00:05<01:20, 9196.25 examples/s]
Filter: 10%|▉ | 78000/818627 [00:05<01:34, 7842.03 examples/s]
Filter: 10%|▉ | 80000/818627 [00:06<01:09, 10572.29 examples/s]
Filter: 10%|▉ | 80000/818627 [00:06<01:11, 10281.26 examples/s]
Filter: 10%|▉ | 80000/818627 [00:06<01:11, 10295.43 examples/s]
Filter: 10%|▉ | 80000/818627 [00:06<01:11, 10281.77 examples/s]
Filter: 10%|▉ | 80000/818627 [00:06<01:13, 10070.61 examples/s]
Filter: 10%|█ | 82000/818627 [00:06<01:18, 9332.37 examples/s]
Filter: 10%|▉ | 80000/818627 [00:06<01:12, 10248.96 examples/s]
Filter: 10%|▉ | 80000/818627 [00:06<01:21, 9108.51 examples/s]
Filter: 10%|█ | 82000/818627 [00:06<01:05, 11200.20 examples/s]
Filter: 10%|█ | 82000/818627 [00:06<01:04, 11415.31 examples/s]
Filter: 10%|█ | 82000/818627 [00:06<01:05, 11221.87 examples/s]
Filter: 10%|█ | 82000/818627 [00:06<01:05, 11210.74 examples/s]
Filter: 10%|█ | 82000/818627 [00:06<01:06, 11041.83 examples/s]
Filter: 10%|█ | 84000/818627 [00:06<01:11, 10265.49 examples/s]
Filter: 10%|█ | 82000/818627 [00:06<01:11, 10278.98 examples/s]
Filter: 10%|█ | 82000/818627 [00:06<01:06, 11153.21 examples/s]
Filter: 10%|█ | 84000/818627 [00:06<01:01, 11959.27 examples/s]
Filter: 10%|█ | 84000/818627 [00:06<01:01, 11894.98 examples/s]
Filter: 10%|█ | 84000/818627 [00:06<01:01, 12019.10 examples/s]
Filter: 10%|█ | 84000/818627 [00:06<01:01, 12005.93 examples/s]
Filter: 10%|█ | 84000/818627 [00:06<01:02, 11761.87 examples/s]
Filter: 11%|█ | 86000/818627 [00:06<01:06, 11050.40 examples/s]
Filter: 10%|█ | 84000/818627 [00:06<01:05, 11292.34 examples/s]
Filter: 10%|█ | 84000/818627 [00:06<01:02, 11842.10 examples/s]
Filter: 11%|█ | 86000/818627 [00:06<00:58, 12472.06 examples/s]
Filter: 11%|█ | 86000/818627 [00:06<00:58, 12422.55 examples/s]
Filter: 11%|█ | 86000/818627 [00:06<00:58, 12527.59 examples/s]
Filter: 11%|█ | 86000/818627 [00:06<00:59, 12348.02 examples/s]
Filter: 11%|█ | 86000/818627 [00:06<00:59, 12326.06 examples/s]
Filter: 11%|█ | 88000/818627 [00:06<01:02, 11706.82 examples/s]
Filter: 11%|█ | 86000/818627 [00:06<01:00, 12142.45 examples/s]
Filter: 11%|█ | 86000/818627 [00:06<00:58, 12434.11 examples/s]
Filter: 11%|█ | 88000/818627 [00:06<00:56, 12905.68 examples/s]
Filter: 11%|█ | 88000/818627 [00:06<00:56, 12868.19 examples/s]
Filter: 11%|█ | 88000/818627 [00:06<00:56, 12962.84 examples/s]
Filter: 11%|█ | 88000/818627 [00:06<00:57, 12770.56 examples/s]
Filter: 11%|█ | 88000/818627 [00:06<00:56, 12838.62 examples/s]
Filter: 11%|█ | 88000/818627 [00:06<00:57, 12787.68 examples/s]
Filter: 11%|█ | 90000/818627 [00:06<00:59, 12193.49 examples/s]
Filter: 11%|█ | 88000/818627 [00:06<00:56, 12852.22 examples/s]
Filter: 11%|█ | 90000/818627 [00:06<00:55, 13211.78 examples/s]
Filter: 11%|█ | 90000/818627 [00:06<00:55, 13163.79 examples/s]
Filter: 11%|█ | 90000/818627 [00:06<00:55, 13078.07 examples/s]
Filter: 11%|█ | 90000/818627 [00:06<00:55, 13196.24 examples/s]
Filter: 11%|█ | 90000/818627 [00:06<00:55, 13222.28 examples/s]
Filter: 11%|█ | 90000/818627 [00:06<00:54, 13303.42 examples/s]
Filter: 11%|█ | 92000/818627 [00:06<00:57, 12634.85 examples/s]
Filter: 11%|█ | 90000/818627 [00:06<00:55, 13181.72 examples/s]
Filter: 11%|█ | 92000/818627 [00:06<00:54, 13454.83 examples/s]
Filter: 11%|█ | 92000/818627 [00:06<00:54, 13422.53 examples/s]
Filter: 11%|█ | 92000/818627 [00:06<00:54, 13290.32 examples/s]
Filter: 11%|█ | 92000/818627 [00:06<00:53, 13459.61 examples/s]
Filter: 11%|█ | 92000/818627 [00:06<00:53, 13513.37 examples/s]
Filter: 11%|█ | 92000/818627 [00:06<00:53, 13694.37 examples/s]
Filter: 11%|█▏ | 94000/818627 [00:07<00:55, 12985.88 examples/s]
Filter: 11%|█ | 92000/818627 [00:06<00:54, 13422.58 examples/s]
Filter: 11%|█▏ | 94000/818627 [00:07<00:53, 13518.16 examples/s]
Filter: 11%|█▏ | 94000/818627 [00:07<00:53, 13543.08 examples/s]
Filter: 11%|█▏ | 94000/818627 [00:07<00:52, 13730.63 examples/s]
Filter: 11%|█▏ | 94000/818627 [00:07<00:53, 13491.75 examples/s]
Filter: 11%|█▏ | 94000/818627 [00:07<00:52, 13728.41 examples/s]
Filter: 11%|█▏ | 94000/818627 [00:07<00:51, 13982.14 examples/s]
Filter: 12%|█▏ | 96000/818627 [00:07<00:54, 13154.79 examples/s]
Filter: 11%|█▏ | 94000/818627 [00:07<00:53, 13493.16 examples/s]
Filter: 12%|█▏ | 96000/818627 [00:07<00:52, 13662.38 examples/s]
Filter: 12%|█▏ | 96000/818627 [00:07<00:51, 13904.97 examples/s]
Filter: 12%|█▏ | 96000/818627 [00:07<00:52, 13713.23 examples/s]
Filter: 12%|█▏ | 96000/818627 [00:07<00:52, 13694.53 examples/s]
Filter: 12%|█▏ | 96000/818627 [00:07<00:52, 13891.57 examples/s]
Filter: 12%|█▏ | 96000/818627 [00:07<00:50, 14214.87 examples/s]
Filter: 12%|█▏ | 98000/818627 [00:07<00:54, 13136.57 examples/s]
Filter: 12%|█▏ | 96000/818627 [00:07<00:53, 13607.56 examples/s]
Filter: 12%|█▏ | 98000/818627 [00:07<00:52, 13653.84 examples/s]
Filter: 12%|█▏ | 98000/818627 [00:07<00:51, 13874.81 examples/s]
Filter: 12%|█▏ | 98000/818627 [00:07<00:52, 13736.62 examples/s]
Filter: 12%|█▏ | 98000/818627 [00:07<00:53, 13570.70 examples/s]
Filter: 12%|█▏ | 98000/818627 [00:07<00:51, 13949.13 examples/s]
Filter: 12%|█▏ | 98000/818627 [00:07<00:50, 14256.28 examples/s]
Filter: 12%|█▏ | 100000/818627 [00:07<00:53, 13390.57 examples/s]
Filter: 12%|█▏ | 98000/818627 [00:07<00:52, 13736.66 examples/s]
Filter: 12%|█▏ | 100000/818627 [00:07<00:51, 14018.99 examples/s]
Filter: 12%|█▏ | 100000/818627 [00:07<00:52, 13790.80 examples/s]
Filter: 12%|█▏ | 100000/818627 [00:07<00:51, 13892.85 examples/s]
Filter: 12%|█▏ | 100000/818627 [00:07<00:51, 14050.76 examples/s]
Filter: 12%|█▏ | 100000/818627 [00:07<00:52, 13588.70 examples/s]
Filter: 12%|█▏ | 100000/818627 [00:07<00:50, 14280.72 examples/s]
Filter: 12%|█▏ | 102000/818627 [00:07<00:53, 13471.21 examples/s]
Filter: 12%|█▏ | 100000/818627 [00:07<00:51, 13831.36 examples/s]
Filter: 12%|█▏ | 102000/818627 [00:07<00:50, 14057.56 examples/s]
Filter: 12%|█▏ | 102000/818627 [00:07<00:51, 13992.63 examples/s]
Filter: 12%|█▏ | 102000/818627 [00:07<00:51, 13852.49 examples/s]
Filter: 12%|█▏ | 102000/818627 [00:07<00:51, 13998.72 examples/s]
Filter: 12%|█▏ | 102000/818627 [00:07<00:49, 14416.64 examples/s]
Filter: 12%|█▏ | 102000/818627 [00:07<00:52, 13731.62 examples/s]
Filter: 13%|█▎ | 104000/818627 [00:07<00:52, 13612.50 examples/s]
Filter: 12%|█▏ | 102000/818627 [00:07<00:51, 13898.95 examples/s]
Filter: 13%|█▎ | 104000/818627 [00:07<00:51, 13930.96 examples/s]
Filter: 13%|█▎ | 104000/818627 [00:07<00:51, 14005.06 examples/s]
Filter: 13%|█▎ | 104000/818627 [00:07<00:51, 13939.53 examples/s]
Filter: 13%|█▎ | 104000/818627 [00:07<00:49, 14490.65 examples/s]
Filter: 13%|█▎ | 104000/818627 [00:07<00:50, 14085.03 examples/s]
Filter: 13%|█▎ | 104000/818627 [00:07<00:52, 13560.30 examples/s]
Filter: 13%|█▎ | 106000/818627 [00:08<00:52, 13636.94 examples/s]
Filter: 13%|█▎ | 104000/818627 [00:07<00:51, 13958.80 examples/s]
Filter: 13%|█▎ | 106000/818627 [00:07<00:50, 14038.80 examples/s]
Filter: 13%|█▎ | 106000/818627 [00:07<00:49, 14531.15 examples/s]
Filter: 13%|█▎ | 106000/818627 [00:07<00:51, 13897.35 examples/s]
Filter: 13%|█▎ | 106000/818627 [00:07<00:51, 13930.68 examples/s]
Filter: 13%|█▎ | 106000/818627 [00:07<00:50, 14075.59 examples/s]
Filter: 13%|█▎ | 106000/818627 [00:07<00:52, 13696.75 examples/s]
Filter: 13%|█▎ | 108000/818627 [00:08<00:51, 13760.09 examples/s]
Filter: 13%|█▎ | 106000/818627 [00:07<00:50, 13996.03 examples/s]
Filter: 13%|█▎ | 108000/818627 [00:08<00:50, 14047.79 examples/s]
Filter: 13%|█▎ | 108000/818627 [00:08<00:50, 14058.58 examples/s]
Filter: 13%|█▎ | 108000/818627 [00:08<00:49, 14396.94 examples/s]
Filter: 13%|█▎ | 108000/818627 [00:08<00:50, 13973.27 examples/s]
Filter: 13%|█▎ | 108000/818627 [00:08<00:50, 14062.67 examples/s]
Filter: 13%|█▎ | 108000/818627 [00:08<00:51, 13790.39 examples/s]
Filter: 13%|█▎ | 108000/818627 [00:08<00:50, 14039.43 examples/s]
Filter: 13%|█▎ | 110000/818627 [00:08<00:51, 13706.44 examples/s]
Filter: 13%|█▎ | 110000/818627 [00:08<00:49, 14399.74 examples/s]
Filter: 13%|█▎ | 110000/818627 [00:08<00:50, 14073.65 examples/s]
Filter: 13%|█▎ | 110000/818627 [00:08<00:50, 14123.62 examples/s]
Filter: 13%|█▎ | 110000/818627 [00:08<00:50, 14062.44 examples/s]
Filter: 13%|█▎ | 110000/818627 [00:08<00:50, 14144.06 examples/s]
Filter: 13%|█▎ | 110000/818627 [00:08<00:51, 13864.61 examples/s]
Filter: 13%|█▎ | 110000/818627 [00:08<00:50, 14059.76 examples/s]
Filter: 14%|█▎ | 112000/818627 [00:08<00:51, 13691.78 examples/s]
Filter: 14%|█▎ | 112000/818627 [00:08<00:49, 14420.79 examples/s]
Filter: 14%|█▎ | 112000/818627 [00:08<00:49, 14147.42 examples/s]
Filter: 14%|█▎ | 112000/818627 [00:08<00:49, 14138.50 examples/s]
Filter: 14%|█▎ | 112000/818627 [00:08<00:50, 14066.03 examples/s]
Filter: 14%|█▎ | 112000/818627 [00:08<00:49, 14214.20 examples/s]
Filter: 14%|█▎ | 112000/818627 [00:08<00:51, 13793.32 examples/s]
Filter: 14%|█▎ | 112000/818627 [00:08<00:50, 14093.88 examples/s]
Filter: 14%|█▍ | 114000/818627 [00:08<00:51, 13808.68 examples/s]
Filter: 14%|█▍ | 114000/818627 [00:08<00:49, 14183.10 examples/s]
Filter: 14%|█▍ | 114000/818627 [00:08<00:49, 14229.26 examples/s]
Filter: 14%|█▍ | 114000/818627 [00:08<00:50, 14049.68 examples/s]
Filter: 14%|█▍ | 114000/818627 [00:08<00:50, 14063.78 examples/s]
Filter: 14%|█▍ | 114000/818627 [00:08<00:49, 14263.73 examples/s]
Filter: 14%|█▍ | 114000/818627 [00:08<00:50, 13880.02 examples/s]
Filter: 14%|█▍ | 114000/818627 [00:08<00:49, 14109.94 examples/s]
Filter: 14%|█▍ | 116000/818627 [00:08<00:51, 13737.30 examples/s]
Filter: 14%|█▍ | 116000/818627 [00:08<00:49, 14321.11 examples/s]
Filter: 14%|█▍ | 116000/818627 [00:08<00:49, 14163.38 examples/s]
Filter: 14%|█▍ | 116000/818627 [00:08<00:49, 14169.77 examples/s]
Filter: 14%|█▍ | 116000/818627 [00:08<00:49, 14302.64 examples/s]
Filter: 14%|█▍ | 116000/818627 [00:08<00:50, 13998.93 examples/s]
Filter: 14%|█▍ | 116000/818627 [00:08<00:50, 13946.19 examples/s]
Filter: 14%|█▍ | 116000/818627 [00:08<00:50, 14009.92 examples/s]
Filter: 14%|█▍ | 118000/818627 [00:08<00:51, 13729.76 examples/s]
Filter: 14%|█▍ | 118000/818627 [00:08<00:49, 14245.22 examples/s]
Filter: 14%|█▍ | 118000/818627 [00:08<00:49, 14191.65 examples/s]
Filter: 14%|█▍ | 118000/818627 [00:08<00:49, 14231.56 examples/s]
Filter: 14%|█▍ | 118000/818627 [00:08<00:48, 14321.33 examples/s]
Filter: 14%|█▍ | 118000/818627 [00:08<00:50, 13954.35 examples/s]
Filter: 14%|█▍ | 118000/818627 [00:08<00:50, 13962.62 examples/s]
Filter: 14%|█▍ | 118000/818627 [00:08<00:49, 14039.25 examples/s]
Filter: 15%|█▍ | 120000/818627 [00:09<00:50, 13857.93 examples/s]
Filter: 15%|█▍ | 120000/818627 [00:08<00:49, 14227.77 examples/s]
Filter: 15%|█▍ | 120000/818627 [00:08<00:49, 14233.59 examples/s]
Filter: 15%|█▍ | 120000/818627 [00:08<00:49, 14120.99 examples/s]
Filter: 15%|█▍ | 120000/818627 [00:08<00:49, 14201.25 examples/s]
Filter: 15%|█▍ | 120000/818627 [00:08<00:49, 14031.09 examples/s]
Filter: 15%|█▍ | 120000/818627 [00:08<00:49, 14016.48 examples/s]
Filter: 15%|█▍ | 120000/818627 [00:08<00:49, 14017.96 examples/s]
Filter: 15%|█▍ | 122000/818627 [00:09<00:50, 13890.46 examples/s]
Filter: 15%|█▍ | 122000/818627 [00:08<00:48, 14263.26 examples/s]
Filter: 15%|█▍ | 122000/818627 [00:09<00:49, 14207.06 examples/s]
Filter: 15%|█▍ | 122000/818627 [00:09<00:49, 14144.65 examples/s]
Filter: 15%|█▍ | 122000/818627 [00:09<00:49, 14201.92 examples/s]
Filter: 15%|█▍ | 122000/818627 [00:09<00:49, 13943.10 examples/s]
Filter: 15%|█▍ | 122000/818627 [00:09<00:49, 14012.67 examples/s]
Filter: 15%|█▍ | 122000/818627 [00:09<00:49, 14051.55 examples/s]
Filter: 15%|█▌ | 124000/818627 [00:09<00:49, 13982.31 examples/s]
Filter: 15%|█▌ | 124000/818627 [00:09<00:48, 14228.98 examples/s]
Filter: 15%|█▌ | 124000/818627 [00:09<00:48, 14207.92 examples/s]
Filter: 15%|█▌ | 124000/818627 [00:09<00:49, 14041.79 examples/s]
Filter: 15%|█▌ | 124000/818627 [00:09<00:48, 14178.97 examples/s]
Filter: 15%|█▌ | 124000/818627 [00:09<00:49, 13906.36 examples/s]
Filter: 15%|█▌ | 124000/818627 [00:09<00:49, 13939.38 examples/s]
Filter: 15%|█▌ | 124000/818627 [00:09<00:50, 13878.02 examples/s]
Filter: 15%|█▌ | 126000/818627 [00:09<00:49, 13940.03 examples/s]
Filter: 15%|█▌ | 126000/818627 [00:09<00:48, 14235.53 examples/s]
Filter: 15%|█▌ | 126000/818627 [00:09<00:48, 14233.33 examples/s]
Filter: 15%|█▌ | 126000/818627 [00:09<00:48, 14261.41 examples/s]
Filter: 15%|█▌ | 126000/818627 [00:09<00:49, 14090.75 examples/s]
Filter: 15%|█▌ | 126000/818627 [00:09<00:49, 13925.29 examples/s]
Filter: 15%|█▌ | 126000/818627 [00:09<00:49, 13966.39 examples/s]
Filter: 15%|█▌ | 126000/818627 [00:09<00:49, 13924.10 examples/s]
Filter: 16%|█▌ | 128000/818627 [00:09<00:49, 13942.10 examples/s]
Filter: 16%|█▌ | 128000/818627 [00:09<00:48, 14239.05 examples/s]
Filter: 16%|█▌ | 128000/818627 [00:09<00:48, 14231.90 examples/s]
Filter: 16%|█▌ | 128000/818627 [00:09<00:48, 14265.32 examples/s]
Filter: 16%|█▌ | 128000/818627 [00:09<00:49, 14084.11 examples/s]
Filter: 16%|█▌ | 128000/818627 [00:09<00:49, 14049.48 examples/s]
Filter: 16%|█▌ | 128000/818627 [00:09<00:50, 13791.71 examples/s]
Filter: 16%|█▌ | 128000/818627 [00:09<00:49, 13841.82 examples/s]
Filter: 16%|█▌ | 130000/818627 [00:09<00:49, 13989.51 examples/s]
Filter: 16%|█▌ | 130000/818627 [00:09<00:48, 14226.35 examples/s]
Filter: 16%|█▌ | 130000/818627 [00:09<00:48, 14224.26 examples/s]
Filter: 16%|█▌ | 130000/818627 [00:09<00:48, 14278.68 examples/s]
Filter: 16%|█▌ | 130000/818627 [00:09<00:48, 14077.97 examples/s]
Filter: 16%|█▌ | 130000/818627 [00:09<00:48, 14123.21 examples/s]
Filter: 16%|█▌ | 130000/818627 [00:09<00:49, 13798.88 examples/s]
Filter: 16%|█▌ | 130000/818627 [00:09<00:49, 13921.96 examples/s]
Filter: 16%|█▌ | 132000/818627 [00:09<00:48, 14024.06 examples/s]
Filter: 16%|█▌ | 132000/818627 [00:09<00:48, 14247.38 examples/s]
Filter: 16%|█▌ | 132000/818627 [00:09<00:47, 14322.10 examples/s]
Filter: 16%|█▌ | 132000/818627 [00:09<00:48, 14131.92 examples/s]
Filter: 16%|█▌ | 132000/818627 [00:09<00:48, 14126.69 examples/s]
Filter: 16%|█▌ | 132000/818627 [00:09<00:48, 14205.52 examples/s]
Filter: 16%|█▌ | 132000/818627 [00:09<00:49, 13902.98 examples/s]
Filter: 16%|█▌ | 132000/818627 [00:09<00:49, 14009.35 examples/s]
Filter: 16%|█▋ | 134000/818627 [00:10<00:48, 14003.40 examples/s]
Filter: 16%|█▋ | 134000/818627 [00:09<00:48, 14247.81 examples/s]
Filter: 16%|█▋ | 134000/818627 [00:09<00:47, 14328.01 examples/s]
Filter: 16%|█▋ | 134000/818627 [00:09<00:48, 14227.95 examples/s]
Filter: 16%|█▋ | 134000/818627 [00:09<00:48, 14253.15 examples/s]
Filter: 16%|█▋ | 134000/818627 [00:09<00:48, 14252.97 examples/s]
Filter: 16%|█▋ | 134000/818627 [00:09<00:49, 13937.85 examples/s]
Filter: 16%|█▋ | 134000/818627 [00:09<00:49, 13936.49 examples/s]
Filter: 17%|█▋ | 136000/818627 [00:10<00:49, 13882.17 examples/s]
Filter: 17%|█▋ | 136000/818627 [00:09<00:47, 14284.97 examples/s]
Filter: 17%|█▋ | 136000/818627 [00:09<00:47, 14321.63 examples/s]
Filter: 17%|█▋ | 136000/818627 [00:09<00:47, 14236.94 examples/s]
Filter: 17%|█▋ | 136000/818627 [00:09<00:47, 14392.18 examples/s]
Filter: 17%|█▋ | 136000/818627 [00:09<00:47, 14306.40 examples/s]
Filter: 17%|█▋ | 136000/818627 [00:10<00:48, 13998.39 examples/s]
Filter: 17%|█▋ | 136000/818627 [00:10<00:48, 13998.58 examples/s]
Filter: 17%|█▋ | 138000/818627 [00:10<00:49, 13820.55 examples/s]
Filter: 17%|█▋ | 138000/818627 [00:10<00:47, 14403.39 examples/s]
Filter: 17%|█▋ | 138000/818627 [00:10<00:47, 14291.65 examples/s]
Filter: 17%|█▋ | 138000/818627 [00:10<00:47, 14240.09 examples/s]
Filter: 17%|█▋ | 138000/818627 [00:10<00:48, 13906.67 examples/s]
Filter: 17%|█▋ | 138000/818627 [00:10<00:47, 14269.31 examples/s]
Filter: 17%|█▋ | 138000/818627 [00:10<00:48, 14034.08 examples/s]
Filter: 17%|█▋ | 138000/818627 [00:10<00:48, 13940.60 examples/s]
Filter: 17%|█▋ | 140000/818627 [00:10<00:48, 13864.69 examples/s]
Filter: 17%|█▋ | 140000/818627 [00:10<00:47, 14311.22 examples/s]
Filter: 17%|█▋ | 140000/818627 [00:10<00:47, 14164.55 examples/s]
Filter: 17%|█▋ | 140000/818627 [00:10<00:47, 14195.10 examples/s]
Filter: 17%|█▋ | 140000/818627 [00:10<00:48, 13918.01 examples/s]
Filter: 17%|█▋ | 140000/818627 [00:10<00:47, 14200.59 examples/s]
Filter: 17%|█▋ | 140000/818627 [00:10<00:48, 14023.00 examples/s]
Filter: 17%|█▋ | 140000/818627 [00:10<00:48, 14000.30 examples/s]
Filter: 17%|█▋ | 142000/818627 [00:10<00:48, 13927.36 examples/s]
Filter: 17%|█▋ | 142000/818627 [00:10<00:47, 14347.05 examples/s]
Filter: 17%|█▋ | 142000/818627 [00:10<00:47, 14199.46 examples/s]
Filter: 17%|█▋ | 142000/818627 [00:10<00:47, 14113.54 examples/s]
Filter: 17%|█▋ | 142000/818627 [00:10<00:48, 14057.79 examples/s]
Filter: 17%|█▋ | 142000/818627 [00:10<00:47, 14110.72 examples/s]
Filter: 17%|█▋ | 142000/818627 [00:10<00:48, 14049.29 examples/s]
Filter: 17%|█▋ | 142000/818627 [00:10<00:48, 14044.35 examples/s]
Filter: 18%|█▊ | 144000/818627 [00:10<00:46, 14377.67 examples/s]
Filter: 18%|█▊ | 144000/818627 [00:10<00:48, 13948.47 examples/s]
Filter: 18%|█▊ | 144000/818627 [00:10<00:47, 14247.68 examples/s]
Filter: 18%|█▊ | 144000/818627 [00:10<00:47, 14195.73 examples/s]
Filter: 18%|█▊ | 144000/818627 [00:10<00:47, 14150.84 examples/s]
Filter: 18%|█▊ | 144000/818627 [00:10<00:48, 14052.04 examples/s]
Filter: 18%|█▊ | 144000/818627 [00:10<00:47, 14083.58 examples/s]
Filter: 18%|█▊ | 144000/818627 [00:10<00:48, 13964.26 examples/s]
Filter: 18%|█▊ | 146000/818627 [00:10<00:46, 14384.14 examples/s]
Filter: 18%|█▊ | 146000/818627 [00:10<00:47, 14223.92 examples/s]
Filter: 18%|█▊ | 146000/818627 [00:10<00:48, 13913.92 examples/s]
Filter: 18%|█▊ | 146000/818627 [00:10<00:47, 14229.13 examples/s]
Filter: 18%|█▊ | 146000/818627 [00:10<00:47, 14215.54 examples/s]
Filter: 18%|█▊ | 146000/818627 [00:10<00:47, 14121.47 examples/s]
Filter: 18%|█▊ | 146000/818627 [00:10<00:47, 14119.49 examples/s]
Filter: 18%|█▊ | 146000/818627 [00:10<00:48, 13769.41 examples/s]
Filter: 18%|█▊ | 148000/818627 [00:10<00:47, 14192.95 examples/s]
Filter: 18%|█▊ | 148000/818627 [00:11<00:48, 13930.81 examples/s]
Filter: 18%|█▊ | 148000/818627 [00:10<00:47, 14001.63 examples/s]
Filter: 18%|█▊ | 148000/818627 [00:10<00:47, 14115.08 examples/s]
Filter: 18%|█▊ | 148000/818627 [00:10<00:46, 14268.75 examples/s]
Filter: 18%|█▊ | 148000/818627 [00:10<00:47, 14177.11 examples/s]
Filter: 18%|█▊ | 148000/818627 [00:10<00:47, 14164.84 examples/s]
Filter: 18%|█▊ | 148000/818627 [00:10<00:48, 13755.07 examples/s]
Filter: 18%|█▊ | 150000/818627 [00:10<00:47, 14188.36 examples/s]
Filter: 18%|█▊ | 150000/818627 [00:10<00:47, 14139.67 examples/s]
Filter: 18%|█▊ | 150000/818627 [00:10<00:47, 14194.72 examples/s]
Filter: 18%|█▊ | 150000/818627 [00:11<00:47, 13955.97 examples/s]
Filter: 18%|█▊ | 150000/818627 [00:10<00:46, 14314.37 examples/s]
Filter: 18%|█▊ | 150000/818627 [00:10<00:46, 14246.51 examples/s]
Filter: 18%|█▊ | 150000/818627 [00:11<00:47, 14179.60 examples/s]
Filter: 18%|█▊ | 150000/818627 [00:11<00:48, 13863.76 examples/s]
Filter: 19%|█▊ | 152000/818627 [00:11<00:46, 14226.88 examples/s]
Filter: 19%|█▊ | 152000/818627 [00:11<00:47, 14078.05 examples/s]
Filter: 19%|█▊ | 152000/818627 [00:11<00:47, 14126.85 examples/s]
Filter: 19%|█▊ | 152000/818627 [00:11<00:46, 14235.34 examples/s]
Filter: 19%|█▊ | 152000/818627 [00:11<00:47, 13930.21 examples/s]
Filter: 19%|█▊ | 152000/818627 [00:11<00:46, 14288.27 examples/s]
Filter: 19%|█▊ | 152000/818627 [00:11<00:46, 14195.95 examples/s]
Filter: 19%|█▊ | 152000/818627 [00:11<00:47, 13918.61 examples/s]
Filter: 19%|█▉ | 154000/818627 [00:11<00:46, 14163.50 examples/s]
Filter: 19%|█▉ | 154000/818627 [00:11<00:47, 14094.87 examples/s]
Filter: 19%|█▉ | 154000/818627 [00:11<00:47, 14124.71 examples/s]
Filter: 19%|█▉ | 154000/818627 [00:11<00:46, 14189.12 examples/s]
Filter: 19%|█▉ | 154000/818627 [00:11<00:47, 13973.86 examples/s]
Filter: 19%|█▉ | 154000/818627 [00:11<00:46, 14255.99 examples/s]
Filter: 19%|█▉ | 154000/818627 [00:11<00:46, 14217.04 examples/s]
Filter: 19%|█▉ | 154000/818627 [00:11<00:47, 13954.17 examples/s]
Filter: 19%|█▉ | 156000/818627 [00:11<00:47, 14092.36 examples/s]
Filter: 19%|█▉ | 156000/818627 [00:11<00:46, 14151.01 examples/s]
Filter: 19%|█▉ | 156000/818627 [00:11<00:47, 14055.82 examples/s]
Filter: 19%|█▉ | 156000/818627 [00:11<00:46, 14142.13 examples/s]
Filter: 19%|█▉ | 156000/818627 [00:11<00:47, 13882.17 examples/s]
Filter: 19%|█▉ | 156000/818627 [00:11<00:47, 13857.86 examples/s]
Filter: 19%|█▉ | 156000/818627 [00:11<00:46, 14231.92 examples/s]
Filter: 19%|█▉ | 156000/818627 [00:11<00:47, 14003.59 examples/s]
Filter: 19%|█▉ | 158000/818627 [00:11<00:46, 14216.13 examples/s]
Filter: 19%|█▉ | 158000/818627 [00:11<00:46, 14235.97 examples/s]
Filter: 19%|█▉ | 158000/818627 [00:11<00:47, 14052.79 examples/s]
Filter: 19%|█▉ | 158000/818627 [00:11<00:47, 13996.59 examples/s]
Filter: 19%|█▉ | 158000/818627 [00:11<00:47, 13864.67 examples/s]
Filter: 19%|█▉ | 158000/818627 [00:11<00:48, 13726.97 examples/s]
Filter: 19%|█▉ | 158000/818627 [00:11<00:46, 14146.98 examples/s]
Filter: 19%|█▉ | 158000/818627 [00:11<00:47, 14031.12 examples/s]
Filter: 20%|█▉ | 160000/818627 [00:11<00:46, 14251.13 examples/s]
Filter: 20%|█▉ | 160000/818627 [00:11<00:46, 14287.04 examples/s]
Filter: 20%|█▉ | 160000/818627 [00:11<00:46, 14164.70 examples/s]
Filter: 20%|█▉ | 160000/818627 [00:11<00:46, 14122.62 examples/s]
Filter: 20%|█▉ | 160000/818627 [00:11<00:47, 13774.76 examples/s]
Filter: 20%|█▉ | 160000/818627 [00:11<00:47, 13829.53 examples/s]
Filter: 20%|█▉ | 160000/818627 [00:11<00:46, 14116.31 examples/s]
Filter: 20%|█▉ | 160000/818627 [00:11<00:46, 14050.94 examples/s]
Filter: 20%|█▉ | 162000/818627 [00:11<00:46, 14267.49 examples/s]
Filter: 20%|█▉ | 162000/818627 [00:11<00:46, 14173.22 examples/s]
Filter: 20%|█▉ | 162000/818627 [00:11<00:46, 14180.51 examples/s]
Filter: 20%|█▉ | 162000/818627 [00:11<00:46, 14084.64 examples/s]
Filter: 20%|█▉ | 162000/818627 [00:12<00:47, 13814.41 examples/s]
Filter: 20%|█▉ | 162000/818627 [00:11<00:47, 13934.62 examples/s]
Filter: 20%|█▉ | 162000/818627 [00:11<00:46, 14135.85 examples/s]
Filter: 20%|██ | 164000/818627 [00:11<00:46, 14201.95 examples/s]
Filter: 20%|██ | 164000/818627 [00:11<00:45, 14252.03 examples/s]
Filter: 20%|██ | 164000/818627 [00:11<00:46, 14141.89 examples/s]
Filter: 20%|█▉ | 162000/818627 [00:11<00:47, 13959.99 examples/s]
Filter: 20%|██ | 164000/818627 [00:11<00:46, 14091.90 examples/s]
Filter: 20%|██ | 164000/818627 [00:12<00:47, 13834.86 examples/s]
Filter: 20%|██ | 164000/818627 [00:11<00:46, 14003.07 examples/s]
Filter: 20%|██ | 164000/818627 [00:12<00:46, 14148.68 examples/s]
Filter: 20%|██ | 164000/818627 [00:12<00:46, 14030.85 examples/s]
Filter: 20%|██ | 166000/818627 [00:12<00:46, 14173.99 examples/s]
Filter: 20%|██ | 166000/818627 [00:12<00:46, 14112.22 examples/s]
Filter: 20%|██ | 166000/818627 [00:12<00:45, 14194.07 examples/s]
Filter: 20%|██ | 166000/818627 [00:12<00:46, 14111.29 examples/s]
Filter: 20%|██ | 166000/818627 [00:12<00:47, 13778.86 examples/s]
Filter: 20%|██ | 166000/818627 [00:12<00:46, 14026.25 examples/s]
Filter: 20%|██ | 166000/818627 [00:12<00:47, 13884.05 examples/s]
Filter: 21%|██ | 168000/818627 [00:12<00:45, 14228.15 examples/s]
Filter: 21%|██ | 168000/818627 [00:12<00:45, 14247.14 examples/s]
Filter: 21%|██ | 168000/818627 [00:12<00:45, 14185.99 examples/s]
Filter: 21%|██ | 168000/818627 [00:12<00:45, 14188.70 examples/s]
Filter: 20%|██ | 166000/818627 [00:12<00:46, 13990.27 examples/s]
Filter: 21%|██ | 168000/818627 [00:12<00:47, 13831.54 examples/s]
Filter: 21%|██ | 168000/818627 [00:12<00:46, 14068.36 examples/s]
Filter: 21%|██ | 168000/818627 [00:12<00:46, 13988.42 examples/s]
Filter: 21%|██ | 170000/818627 [00:12<00:45, 14298.67 examples/s]
Filter: 21%|██ | 170000/818627 [00:12<00:45, 14279.26 examples/s]
Filter: 21%|██ | 170000/818627 [00:12<00:45, 14250.75 examples/s]
Filter: 21%|██ | 170000/818627 [00:12<00:45, 14120.73 examples/s]
Filter: 21%|██ | 168000/818627 [00:12<00:46, 14043.35 examples/s]
Filter: 21%|██ | 170000/818627 [00:12<00:45, 14117.54 examples/s]
Filter: 21%|██ | 170000/818627 [00:12<00:47, 13728.60 examples/s]
Filter: 21%|██ | 170000/818627 [00:12<00:46, 14042.41 examples/s]
Filter: 21%|██ | 172000/818627 [00:12<00:45, 14304.75 examples/s]
Filter: 21%|██ | 172000/818627 [00:12<00:45, 14284.89 examples/s]
Filter: 21%|██ | 172000/818627 [00:12<00:45, 14273.01 examples/s]
Filter: 21%|██ | 172000/818627 [00:12<00:45, 14095.65 examples/s]
Filter: 21%|██ | 170000/818627 [00:12<00:46, 14088.02 examples/s]
Filter: 21%|██ | 172000/818627 [00:12<00:45, 14180.48 examples/s]
Filter: 21%|██ | 172000/818627 [00:12<00:47, 13644.66 examples/s]
Filter: 21%|██ | 172000/818627 [00:12<00:45, 14063.58 examples/s]
Filter: 21%|██▏ | 174000/818627 [00:12<00:45, 14284.13 examples/s]
Filter: 21%|██▏ | 174000/818627 [00:12<00:45, 14304.12 examples/s]
Filter: 21%|██▏ | 174000/818627 [00:12<00:45, 14207.40 examples/s]
Filter: 21%|██ | 172000/818627 [00:12<00:45, 14109.45 examples/s]
Filter: 21%|██▏ | 174000/818627 [00:12<00:46, 13981.28 examples/s]
Filter: 21%|██▏ | 174000/818627 [00:12<00:45, 14055.89 examples/s]
Filter: 21%|██▏ | 174000/818627 [00:12<00:47, 13638.25 examples/s]
Filter: 21%|██▏ | 174000/818627 [00:12<00:45, 14105.78 examples/s]
Filter: 21%|██▏ | 176000/818627 [00:12<00:44, 14338.70 examples/s]
Filter: 21%|██▏ | 176000/818627 [00:12<00:45, 14275.75 examples/s]
Filter: 21%|██▏ | 176000/818627 [00:12<00:45, 14103.08 examples/s]
Filter: 21%|██▏ | 174000/818627 [00:12<00:45, 14134.31 examples/s]
Filter: 21%|██▏ | 176000/818627 [00:12<00:46, 13844.05 examples/s]
Filter: 21%|██▏ | 176000/818627 [00:12<00:45, 14095.52 examples/s]
Filter: 21%|██▏ | 176000/818627 [00:13<00:46, 13732.43 examples/s]
Filter: 21%|██▏ | 176000/818627 [00:12<00:45, 14138.29 examples/s]
Filter: 22%|██▏ | 178000/818627 [00:12<00:44, 14351.48 examples/s]
Filter: 22%|██▏ | 178000/818627 [00:12<00:45, 14211.89 examples/s]
Filter: 21%|██▏ | 176000/818627 [00:12<00:45, 14156.05 examples/s]
Filter: 22%|██▏ | 178000/818627 [00:12<00:45, 14070.19 examples/s]
Filter: 22%|██▏ | 178000/818627 [00:12<00:45, 14014.69 examples/s]
Filter: 22%|██▏ | 178000/818627 [00:12<00:45, 14009.06 examples/s]
Filter: 22%|██▏ | 178000/818627 [00:13<00:46, 13680.60 examples/s]
Filter: 22%|██▏ | 178000/818627 [00:13<00:45, 14133.44 examples/s]
Filter: 22%|██▏ | 180000/818627 [00:13<00:44, 14341.89 examples/s]
Filter: 22%|██▏ | 180000/818627 [00:13<00:44, 14222.92 examples/s]
Filter: 22%|██▏ | 180000/818627 [00:13<00:45, 14167.85 examples/s]
Filter: 22%|██▏ | 178000/818627 [00:13<00:45, 14176.69 examples/s]
Filter: 22%|██▏ | 180000/818627 [00:13<00:45, 14129.62 examples/s]
Filter: 22%|██▏ | 180000/818627 [00:13<00:45, 14081.46 examples/s]
Filter: 22%|██▏ | 180000/818627 [00:13<00:46, 13640.32 examples/s]
Filter: 22%|██▏ | 180000/818627 [00:13<00:45, 14137.74 examples/s]
Filter: 22%|██▏ | 182000/818627 [00:13<00:44, 14318.34 examples/s]
Filter: 22%|██▏ | 182000/818627 [00:13<00:44, 14275.79 examples/s]
Filter: 22%|██▏ | 182000/818627 [00:13<00:44, 14180.61 examples/s]
Filter: 22%|██▏ | 180000/818627 [00:13<00:45, 14181.30 examples/s]
Filter: 22%|██▏ | 182000/818627 [00:13<00:45, 14105.18 examples/s]
Filter: 22%|██▏ | 182000/818627 [00:13<00:45, 14111.31 examples/s]
Filter: 22%|██▏ | 182000/818627 [00:13<00:45, 14143.58 examples/s]
Filter: 22%|██▏ | 182000/818627 [00:13<00:46, 13593.55 examples/s]
Filter: 22%|██▏ | 184000/818627 [00:13<00:44, 14125.79 examples/s]
Filter: 22%|██▏ | 184000/818627 [00:13<00:44, 14311.31 examples/s]
Filter: 22%|██▏ | 184000/818627 [00:13<00:44, 14138.79 examples/s]
Filter: 22%|██▏ | 182000/818627 [00:13<00:45, 14115.53 examples/s]
Filter: 22%|██▏ | 184000/818627 [00:13<00:45, 14069.65 examples/s]
Filter: 22%|██▏ | 184000/818627 [00:13<00:45, 14064.05 examples/s]
Filter: 22%|██▏ | 184000/818627 [00:13<00:44, 14120.03 examples/s]
Filter: 22%|██▏ | 184000/818627 [00:13<00:46, 13730.28 examples/s]
Filter: 23%|██▎ | 186000/818627 [00:13<00:44, 14310.78 examples/s]
Filter: 23%|██▎ | 186000/818627 [00:13<00:45, 14027.63 examples/s]
Filter: 23%|██▎ | 186000/818627 [00:13<00:44, 14200.68 examples/s]
Filter: 23%|██▎ | 186000/818627 [00:13<00:44, 14147.13 examples/s]
Filter: 22%|██▏ | 184000/818627 [00:13<00:45, 14092.92 examples/s]
Filter: 23%|██▎ | 186000/818627 [00:13<00:44, 14089.69 examples/s]
Filter: 23%|██▎ | 186000/818627 [00:13<00:44, 14108.71 examples/s]
Filter: 23%|██▎ | 186000/818627 [00:13<00:46, 13721.38 examples/s]
Filter: 23%|██▎ | 188000/818627 [00:13<00:44, 14306.60 examples/s]
Filter: 23%|██▎ | 188000/818627 [00:13<00:44, 14136.28 examples/s]
Filter: 23%|██▎ | 188000/818627 [00:13<00:44, 14267.59 examples/s]
Filter: 23%|██▎ | 188000/818627 [00:13<00:44, 14239.09 examples/s]
Filter: 23%|██▎ | 186000/818627 [00:13<00:44, 14097.25 examples/s]
Filter: 23%|██▎ | 188000/818627 [00:13<00:44, 14128.73 examples/s]
Filter: 23%|██▎ | 188000/818627 [00:13<00:44, 14101.18 examples/s]
Filter: 23%|██▎ | 188000/818627 [00:13<00:45, 13741.86 examples/s]
Filter: 23%|██▎ | 190000/818627 [00:13<00:44, 14252.12 examples/s]
Filter: 23%|██▎ | 190000/818627 [00:13<00:43, 14311.47 examples/s]
Filter: 23%|██▎ | 190000/818627 [00:13<00:44, 14078.76 examples/s]
Filter: 23%|██▎ | 190000/818627 [00:13<00:44, 14243.41 examples/s]
Filter: 23%|██▎ | 188000/818627 [00:13<00:45, 13950.62 examples/s]
Filter: 23%|██▎ | 190000/818627 [00:13<00:44, 14081.28 examples/s]
Filter: 23%|██▎ | 190000/818627 [00:13<00:44, 14108.91 examples/s]
Filter: 23%|██▎ | 190000/818627 [00:14<00:45, 13838.37 examples/s]
Filter: 23%|██▎ | 192000/818627 [00:13<00:44, 14183.71 examples/s]
Filter: 23%|██▎ | 192000/818627 [00:13<00:44, 14201.61 examples/s]
Filter: 23%|██▎ | 192000/818627 [00:13<00:43, 14339.49 examples/s]
Filter: 23%|██▎ | 192000/818627 [00:13<00:44, 14195.17 examples/s]
Filter: 23%|██▎ | 190000/818627 [00:13<00:44, 14026.67 examples/s]
Filter: 23%|██▎ | 192000/818627 [00:13<00:44, 14138.04 examples/s]
Filter: 23%|██▎ | 192000/818627 [00:14<00:44, 14130.82 examples/s]
Filter: 23%|██▎ | 192000/818627 [00:14<00:44, 13925.92 examples/s]
Filter: 24%|██▎ | 194000/818627 [00:14<00:43, 14282.85 examples/s]
Filter: 24%|██▎ | 194000/818627 [00:14<00:43, 14249.63 examples/s]
Filter: 24%|██▎ | 194000/818627 [00:14<00:43, 14358.40 examples/s]
Filter: 24%|██▎ | 194000/818627 [00:14<00:43, 14299.27 examples/s]
Filter: 23%|██▎ | 192000/818627 [00:14<00:44, 14078.88 examples/s]
Filter: 24%|██▎ | 194000/818627 [00:14<00:44, 14155.57 examples/s]
Filter: 24%|██▎ | 194000/818627 [00:14<00:44, 14026.74 examples/s]
Filter: 24%|██▎ | 194000/818627 [00:14<00:45, 13858.25 examples/s]
Filter: 24%|██▍ | 196000/818627 [00:14<00:43, 14318.43 examples/s]
Filter: 24%|██▍ | 196000/818627 [00:14<00:43, 14399.55 examples/s]
Filter: 24%|██▍ | 196000/818627 [00:14<00:43, 14305.83 examples/s]
Filter: 24%|██▍ | 196000/818627 [00:14<00:43, 14369.70 examples/s]
Filter: 24%|██▎ | 194000/818627 [00:14<00:44, 14122.42 examples/s]
Filter: 24%|██▍ | 196000/818627 [00:14<00:44, 14145.26 examples/s]
Filter: 24%|██▍ | 196000/818627 [00:14<00:44, 14052.02 examples/s]
Filter: 24%|██▍ | 196000/818627 [00:14<00:44, 13942.51 examples/s]
Filter: 24%|██▍ | 198000/818627 [00:14<00:43, 14333.88 examples/s]
Filter: 24%|██▍ | 198000/818627 [00:14<00:43, 14382.18 examples/s]
Filter: 24%|██▍ | 198000/818627 [00:14<00:43, 14316.89 examples/s]
Filter: 24%|██▍ | 198000/818627 [00:14<00:43, 14279.23 examples/s]
Filter: 24%|██▍ | 196000/818627 [00:14<00:44, 14004.24 examples/s]
Filter: 24%|██▍ | 198000/818627 [00:14<00:43, 14172.14 examples/s]
Filter: 24%|██▍ | 198000/818627 [00:14<00:44, 14004.05 examples/s]
Filter: 24%|██▍ | 198000/818627 [00:14<00:44, 13980.24 examples/s]
Filter: 24%|██▍ | 200000/818627 [00:14<00:43, 14353.72 examples/s]
Filter: 24%|██▍ | 200000/818627 [00:14<00:43, 14345.93 examples/s]
Filter: 24%|██▍ | 200000/818627 [00:14<00:43, 14254.13 examples/s]
Filter: 24%|██▍ | 200000/818627 [00:14<00:43, 14327.85 examples/s]
Filter: 24%|██▍ | 198000/818627 [00:14<00:44, 14055.32 examples/s]
Filter: 24%|██▍ | 200000/818627 [00:14<00:43, 14184.79 examples/s]
Filter: 24%|██▍ | 200000/818627 [00:14<00:44, 14018.39 examples/s]
Filter: 24%|██▍ | 200000/818627 [00:14<00:44, 13997.03 examples/s]
Filter: 25%|██▍ | 202000/818627 [00:14<00:42, 14372.47 examples/s]
Filter: 25%|██▍ | 202000/818627 [00:14<00:42, 14372.82 examples/s]
Filter: 25%|██▍ | 202000/818627 [00:14<00:43, 14170.03 examples/s]
Filter: 25%|██▍ | 202000/818627 [00:14<00:43, 14209.32 examples/s]
Filter: 24%|██▍ | 200000/818627 [00:14<00:43, 14077.99 examples/s]
Filter: 25%|██▍ | 202000/818627 [00:14<00:43, 14198.22 examples/s]
Filter: 25%|██▍ | 202000/818627 [00:14<00:44, 13786.18 examples/s]
Filter: 25%|██▍ | 202000/818627 [00:14<00:43, 14033.87 examples/s]
Filter: 25%|██▍ | 204000/818627 [00:14<00:42, 14391.86 examples/s]
Filter: 25%|██▍ | 204000/818627 [00:14<00:43, 14261.79 examples/s]
Filter: 25%|██▍ | 204000/818627 [00:14<00:43, 14162.26 examples/s]
Filter: 25%|██▍ | 204000/818627 [00:14<00:42, 14295.18 examples/s]
Filter: 25%|██▍ | 202000/818627 [00:14<00:43, 14118.86 examples/s]
Filter: 25%|██▍ | 204000/818627 [00:14<00:43, 14214.30 examples/s]
Filter: 25%|██▍ | 204000/818627 [00:14<00:44, 13901.87 examples/s]
Filter: 25%|██▍ | 204000/818627 [00:15<00:43, 14068.89 examples/s]
Filter: 25%|██▌ | 206000/818627 [00:14<00:42, 14285.77 examples/s]
Filter: 25%|██▌ | 206000/818627 [00:14<00:43, 14012.64 examples/s]
Filter: 25%|██▌ | 206000/818627 [00:14<00:43, 14108.92 examples/s]
Filter: 25%|██▌ | 206000/818627 [00:14<00:43, 14207.46 examples/s]
Filter: 25%|██▍ | 204000/818627 [00:14<00:43, 14025.68 examples/s]
Filter: 25%|██▌ | 206000/818627 [00:14<00:43, 14215.48 examples/s]
Filter: 25%|██▌ | 206000/818627 [00:15<00:43, 13960.62 examples/s]
Filter: 25%|██▌ | 206000/818627 [00:15<00:43, 14009.55 examples/s]
Filter: 25%|██▌ | 208000/818627 [00:15<00:42, 14277.88 examples/s]
Filter: 25%|██▌ | 208000/818627 [00:15<00:43, 14122.49 examples/s]
Filter: 25%|██▌ | 208000/818627 [00:15<00:43, 14183.21 examples/s]
Filter: 25%|██▌ | 208000/818627 [00:15<00:42, 14249.22 examples/s]
Filter: 25%|██▌ | 206000/818627 [00:15<00:43, 14055.55 examples/s]
Filter: 25%|██▌ | 208000/818627 [00:15<00:44, 13846.44 examples/s]
Filter: 25%|██▌ | 208000/818627 [00:15<00:44, 13873.82 examples/s]
Filter: 25%|██▌ | 208000/818627 [00:15<00:44, 13764.96 examples/s]
Filter: 26%|██▌ | 210000/818627 [00:15<00:42, 14257.20 examples/s]
Filter: 26%|██▌ | 210000/818627 [00:15<00:42, 14198.22 examples/s]
Filter: 26%|██▌ | 210000/818627 [00:15<00:42, 14279.73 examples/s]
Filter: 26%|██▌ | 210000/818627 [00:15<00:42, 14224.53 examples/s]
Filter: 25%|██▌ | 208000/818627 [00:15<00:44, 13863.00 examples/s]
Filter: 26%|██▌ | 210000/818627 [00:15<00:43, 13934.82 examples/s]
Filter: 26%|██▌ | 210000/818627 [00:15<00:43, 13930.45 examples/s]
Filter: 26%|██▌ | 210000/818627 [00:15<00:44, 13722.20 examples/s]
Filter: 26%|██▌ | 212000/818627 [00:15<00:42, 14232.38 examples/s]
Filter: 26%|██▌ | 212000/818627 [00:15<00:42, 14167.74 examples/s]
Filter: 26%|██▌ | 212000/818627 [00:15<00:42, 14266.68 examples/s]
Filter: 26%|██▌ | 212000/818627 [00:15<00:42, 14176.85 examples/s]
Filter: 26%|██▌ | 210000/818627 [00:15<00:44, 13800.93 examples/s]
Filter: 26%|██▌ | 212000/818627 [00:15<00:43, 13867.27 examples/s]
Filter: 26%|██▌ | 212000/818627 [00:15<00:43, 13960.23 examples/s]
Filter: 26%|██▌ | 212000/818627 [00:15<00:44, 13672.85 examples/s]
Filter: 26%|██▌ | 214000/818627 [00:15<00:42, 14217.79 examples/s]
Filter: 26%|██▌ | 214000/818627 [00:15<00:42, 14205.22 examples/s]
Filter: 26%|██▌ | 214000/818627 [00:15<00:42, 14284.61 examples/s]
Filter: 26%|██▌ | 214000/818627 [00:15<00:42, 14249.51 examples/s]
Filter: 26%|██▌ | 212000/818627 [00:15<00:43, 13847.30 examples/s]
Filter: 26%|██▌ | 214000/818627 [00:15<00:43, 13948.94 examples/s]
Filter: 26%|██▌ | 214000/818627 [00:15<00:43, 13997.94 examples/s]
Filter: 26%|██▋ | 216000/818627 [00:15<00:42, 14256.13 examples/s]
Filter: 26%|██▋ | 216000/818627 [00:15<00:42, 14260.49 examples/s]
Filter: 26%|██▌ | 214000/818627 [00:15<00:44, 13603.96 examples/s]
Filter: 26%|██▋ | 216000/818627 [00:15<00:43, 14009.11 examples/s]
Filter: 26%|██▋ | 216000/818627 [00:15<00:42, 14261.20 examples/s]
Filter: 26%|██▌ | 214000/818627 [00:15<00:43, 13771.16 examples/s]
Filter: 26%|██▋ | 216000/818627 [00:15<00:43, 14009.07 examples/s]
Filter: 26%|██▋ | 216000/818627 [00:15<00:43, 13871.47 examples/s]
Filter: 27%|██▋ | 218000/818627 [00:15<00:42, 14267.68 examples/s]
Filter: 27%|██▋ | 218000/818627 [00:15<00:42, 14107.64 examples/s]
Filter: 27%|██▋ | 218000/818627 [00:15<00:42, 14252.37 examples/s]
Filter: 27%|██▋ | 218000/818627 [00:15<00:41, 14310.37 examples/s]
Filter: 26%|██▋ | 216000/818627 [00:15<00:43, 13699.07 examples/s]
Filter: 26%|██▋ | 216000/818627 [00:15<00:43, 13740.62 examples/s]
Filter: 27%|██▋ | 218000/818627 [00:15<00:43, 13930.33 examples/s]
Filter: 27%|██▋ | 218000/818627 [00:15<00:43, 13919.45 examples/s]
Filter: 27%|██▋ | 220000/818627 [00:15<00:42, 14163.88 examples/s]
Filter: 27%|██▋ | 220000/818627 [00:15<00:41, 14294.85 examples/s]
Filter: 27%|██▋ | 220000/818627 [00:15<00:42, 14052.61 examples/s]
Filter: 27%|██▋ | 220000/818627 [00:15<00:42, 14153.05 examples/s]
Filter: 27%|██▋ | 218000/818627 [00:16<00:45, 13323.31 examples/s]
Filter: 27%|██▋ | 218000/818627 [00:15<00:43, 13831.89 examples/s]
Filter: 27%|██▋ | 220000/818627 [00:15<00:42, 14024.96 examples/s]
Filter: 27%|██▋ | 220000/818627 [00:16<00:42, 13957.17 examples/s]
Filter: 27%|██▋ | 222000/818627 [00:16<00:42, 14141.51 examples/s]
Filter: 27%|██▋ | 222000/818627 [00:16<00:41, 14206.91 examples/s]
Filter: 27%|██▋ | 222000/818627 [00:16<00:42, 14097.29 examples/s]
Filter: 27%|██▋ | 222000/818627 [00:16<00:42, 14191.21 examples/s]
Filter: 27%|██▋ | 220000/818627 [00:16<00:44, 13432.40 examples/s]
Filter: 27%|██▋ | 220000/818627 [00:16<00:43, 13888.48 examples/s]
Filter: 27%|██▋ | 222000/818627 [00:16<00:42, 13957.88 examples/s]
Filter: 27%|██▋ | 222000/818627 [00:16<00:42, 13984.61 examples/s]
Filter: 27%|██▋ | 224000/818627 [00:16<00:41, 14200.30 examples/s]
Filter: 27%|██▋ | 224000/818627 [00:16<00:41, 14190.05 examples/s]
Filter: 27%|██▋ | 224000/818627 [00:16<00:41, 14231.84 examples/s]
Filter: 27%|██▋ | 224000/818627 [00:16<00:41, 14248.04 examples/s]
Filter: 27%|██▋ | 222000/818627 [00:16<00:43, 13591.21 examples/s]
Filter: 27%|██▋ | 222000/818627 [00:16<00:42, 13932.45 examples/s]
Filter: 27%|██▋ | 224000/818627 [00:16<00:42, 13916.45 examples/s]
Filter: 27%|██▋ | 224000/818627 [00:16<00:42, 14018.99 examples/s]
Filter: 28%|██▊ | 226000/818627 [00:16<00:41, 14210.57 examples/s]
Filter: 28%|██▊ | 226000/818627 [00:16<00:41, 14253.52 examples/s]
Filter: 28%|██▊ | 226000/818627 [00:16<00:41, 14201.06 examples/s]
Filter: 28%|██▊ | 226000/818627 [00:16<00:41, 14230.97 examples/s]
Filter: 27%|██▋ | 224000/818627 [00:16<00:43, 13655.16 examples/s]
Filter: 27%|██▋ | 224000/818627 [00:16<00:42, 13973.34 examples/s]
Filter: 28%|██▊ | 226000/818627 [00:16<00:42, 13887.04 examples/s]
Filter: 28%|██▊ | 226000/818627 [00:16<00:42, 14017.41 examples/s]
Filter: 28%|██▊ | 228000/818627 [00:16<00:41, 14258.28 examples/s]
Filter: 28%|██▊ | 228000/818627 [00:16<00:41, 14274.14 examples/s]
Filter: 28%|██▊ | 228000/818627 [00:16<00:41, 14127.94 examples/s]
Filter: 28%|██▊ | 228000/818627 [00:16<00:41, 14130.06 examples/s]
Filter: 28%|██▊ | 226000/818627 [00:16<00:44, 13431.37 examples/s]
Filter: 28%|██▊ | 226000/818627 [00:16<00:42, 14009.50 examples/s]
Filter: 28%|██▊ | 228000/818627 [00:16<00:42, 13989.56 examples/s]
Filter: 28%|██▊ | 228000/818627 [00:16<00:42, 13891.12 examples/s]
Filter: 28%|██▊ | 230000/818627 [00:16<00:41, 14256.02 examples/s]
Filter: 28%|██▊ | 230000/818627 [00:16<00:41, 14155.59 examples/s]
Filter: 28%|██▊ | 230000/818627 [00:16<00:41, 14095.38 examples/s]
Filter: 28%|██▊ | 230000/818627 [00:16<00:41, 14149.62 examples/s]
Filter: 28%|██▊ | 228000/818627 [00:16<00:43, 13447.75 examples/s]
Filter: 28%|██▊ | 228000/818627 [00:16<00:42, 13936.11 examples/s]
Filter: 28%|██▊ | 230000/818627 [00:16<00:42, 14014.73 examples/s]
Filter: 28%|██▊ | 230000/818627 [00:16<00:42, 13941.55 examples/s]
Filter: 28%|██▊ | 232000/818627 [00:16<00:41, 14208.96 examples/s]
Filter: 28%|██▊ | 232000/818627 [00:16<00:41, 14218.34 examples/s]
Filter: 28%|██▊ | 232000/818627 [00:16<00:41, 14206.82 examples/s]
Filter: 28%|██▊ | 232000/818627 [00:16<00:41, 14223.12 examples/s]
Filter: 28%|██▊ | 230000/818627 [00:16<00:43, 13615.93 examples/s]
Filter: 28%|██▊ | 230000/818627 [00:16<00:42, 13852.26 examples/s]
Filter: 28%|██▊ | 232000/818627 [00:16<00:41, 14070.61 examples/s]
Filter: 29%|██▊ | 234000/818627 [00:16<00:41, 14252.57 examples/s]
Filter: 29%|██▊ | 234000/818627 [00:16<00:40, 14274.84 examples/s]
Filter: 29%|██▊ | 234000/818627 [00:16<00:41, 14214.29 examples/s]
Filter: 28%|██▊ | 232000/818627 [00:16<00:42, 13962.89 examples/s]
Filter: 29%|██▊ | 234000/818627 [00:16<00:41, 14162.63 examples/s]
Filter: 28%|██▊ | 232000/818627 [00:17<00:42, 13720.03 examples/s]
Filter: 28%|██▊ | 232000/818627 [00:16<00:42, 13909.72 examples/s]
Filter: 29%|██▊ | 234000/818627 [00:16<00:41, 14000.41 examples/s]
Filter: 29%|██▉ | 236000/818627 [00:17<00:40, 14309.73 examples/s]
Filter: 29%|██▉ | 236000/818627 [00:17<00:40, 14256.64 examples/s]
Filter: 29%|██▊ | 234000/818627 [00:17<00:41, 13986.16 examples/s]
Filter: 29%|██▉ | 236000/818627 [00:17<00:41, 14185.18 examples/s]
Filter: 29%|██▉ | 236000/818627 [00:17<00:40, 14227.08 examples/s]
Filter: 29%|██▊ | 234000/818627 [00:17<00:42, 13817.60 examples/s]
Filter: 29%|██▊ | 234000/818627 [00:17<00:41, 13947.65 examples/s]
Filter: 29%|██▉ | 236000/818627 [00:17<00:41, 14051.94 examples/s]
Filter: 29%|██▉ | 238000/818627 [00:17<00:40, 14308.58 examples/s]
Filter: 29%|██▉ | 238000/818627 [00:17<00:40, 14265.45 examples/s]
Filter: 29%|██▉ | 238000/818627 [00:17<00:40, 14265.36 examples/s]
Filter: 29%|██▉ | 238000/818627 [00:17<00:41, 14114.76 examples/s]
Filter: 29%|██▉ | 236000/818627 [00:17<00:42, 13867.43 examples/s]
Filter: 29%|██▉ | 236000/818627 [00:17<00:42, 13765.47 examples/s]
Filter: 29%|██▉ | 236000/818627 [00:17<00:42, 13809.45 examples/s]
Filter: 29%|██▉ | 238000/818627 [00:17<00:41, 13998.64 examples/s]
Filter: 29%|██▉ | 240000/818627 [00:17<00:40, 14196.75 examples/s]
Filter: 29%|██▉ | 240000/818627 [00:17<00:40, 14204.78 examples/s]
Filter: 29%|██▉ | 240000/818627 [00:17<00:40, 14264.06 examples/s]
Filter: 29%|██▉ | 240000/818627 [00:17<00:41, 14102.83 examples/s]
Filter: 29%|██▉ | 238000/818627 [00:17<00:41, 13827.27 examples/s]
Filter: 29%|██▉ | 238000/818627 [00:17<00:42, 13627.97 examples/s]
Filter: 29%|██▉ | 240000/818627 [00:17<00:41, 14070.52 examples/s]
Filter: 29%|██▉ | 238000/818627 [00:17<00:42, 13737.12 examples/s]
Filter: 30%|██▉ | 242000/818627 [00:17<00:40, 14240.43 examples/s]
Filter: 30%|██▉ | 242000/818627 [00:17<00:40, 14225.79 examples/s]
Filter: 30%|██▉ | 242000/818627 [00:17<00:40, 14302.91 examples/s]
Filter: 30%|██▉ | 242000/818627 [00:17<00:40, 14187.00 examples/s]
Filter: 29%|██▉ | 240000/818627 [00:17<00:41, 13889.66 examples/s]
Filter: 29%|██▉ | 240000/818627 [00:17<00:42, 13756.25 examples/s]
Filter: 29%|██▉ | 240000/818627 [00:17<00:41, 13825.36 examples/s]
Filter: 30%|██▉ | 242000/818627 [00:17<00:41, 13979.01 examples/s]
Filter: 30%|██▉ | 244000/818627 [00:17<00:40, 14296.38 examples/s]
Filter: 30%|██▉ | 244000/818627 [00:17<00:40, 14231.79 examples/s]
Filter: 30%|██▉ | 244000/818627 [00:17<00:40, 14243.15 examples/s]
Filter: 30%|██▉ | 244000/818627 [00:17<00:41, 13966.34 examples/s]
Filter: 30%|██▉ | 242000/818627 [00:17<00:41, 13928.08 examples/s]
Filter: 30%|██▉ | 242000/818627 [00:17<00:41, 13826.16 examples/s]
Filter: 30%|██▉ | 242000/818627 [00:17<00:41, 13861.85 examples/s]
Filter: 30%|██▉ | 244000/818627 [00:17<00:40, 14022.96 examples/s]
Filter: 30%|███ | 246000/818627 [00:17<00:40, 14178.05 examples/s]
Filter: 30%|███ | 246000/818627 [00:17<00:40, 14213.67 examples/s]
Filter: 30%|███ | 246000/818627 [00:17<00:40, 14242.56 examples/s]
Filter: 30%|███ | 246000/818627 [00:17<00:40, 14105.12 examples/s]
Filter: 30%|██▉ | 244000/818627 [00:17<00:41, 13768.69 examples/s]
Filter: 30%|██▉ | 244000/818627 [00:18<00:41, 13904.33 examples/s]
Filter: 30%|██▉ | 244000/818627 [00:17<00:41, 13872.68 examples/s]
Filter: 30%|███ | 246000/818627 [00:17<00:41, 13928.14 examples/s]
Filter: 30%|███ | 248000/818627 [00:17<00:40, 14219.14 examples/s]
Filter: 30%|███ | 248000/818627 [00:17<00:40, 14259.67 examples/s]
Filter: 30%|███ | 248000/818627 [00:17<00:40, 14174.65 examples/s]
Filter: 30%|███ | 248000/818627 [00:17<00:40, 14139.16 examples/s]
Filter: 30%|███ | 246000/818627 [00:17<00:41, 13672.44 examples/s]
Filter: 30%|███ | 246000/818627 [00:18<00:40, 13966.90 examples/s]
Filter: 30%|███ | 246000/818627 [00:17<00:41, 13904.54 examples/s]
Filter: 30%|███ | 248000/818627 [00:17<00:40, 14003.93 examples/s]
Filter: 31%|███ | 250000/818627 [00:17<00:39, 14245.39 examples/s]
Filter: 31%|███ | 250000/818627 [00:18<00:39, 14255.32 examples/s]
Filter: 31%|███ | 250000/818627 [00:18<00:40, 14193.29 examples/s]
Filter: 31%|███ | 250000/818627 [00:18<00:40, 14174.20 examples/s]
Filter: 30%|███ | 248000/818627 [00:18<00:41, 13785.41 examples/s]
Filter: 30%|███ | 248000/818627 [00:18<00:40, 13973.29 examples/s]
Filter: 31%|███ | 250000/818627 [00:18<00:40, 14055.21 examples/s]
Filter: 30%|███ | 248000/818627 [00:18<00:40, 13944.04 examples/s]
Filter: 31%|███ | 252000/818627 [00:18<00:39, 14238.64 examples/s]
Filter: 31%|███ | 252000/818627 [00:18<00:39, 14225.46 examples/s]
Filter: 31%|███ | 252000/818627 [00:18<00:39, 14200.30 examples/s]
Filter: 31%|███ | 252000/818627 [00:18<00:39, 14176.86 examples/s]
Filter: 31%|███ | 250000/818627 [00:18<00:41, 13858.61 examples/s]
Filter: 31%|███ | 250000/818627 [00:18<00:40, 14032.10 examples/s]
Filter: 31%|███ | 252000/818627 [00:18<00:40, 14104.86 examples/s]
Filter: 31%|███ | 250000/818627 [00:18<00:40, 13961.82 examples/s]
Filter: 31%|███ | 254000/818627 [00:18<00:39, 14255.02 examples/s]
Filter: 31%|███ | 254000/818627 [00:18<00:39, 14204.38 examples/s]
Filter: 31%|███ | 254000/818627 [00:18<00:39, 14260.28 examples/s]
Filter: 31%|███ | 254000/818627 [00:18<00:39, 14154.43 examples/s]
Filter: 31%|███ | 252000/818627 [00:18<00:40, 13924.48 examples/s]
Filter: 31%|███ | 252000/818627 [00:18<00:40, 13957.64 examples/s]
Filter: 31%|███ | 254000/818627 [00:18<00:39, 14133.29 examples/s]
Filter: 31%|███ | 252000/818627 [00:18<00:40, 13991.03 examples/s]
Filter: 31%|███▏ | 256000/818627 [00:18<00:39, 14249.54 examples/s]
Filter: 31%|███▏ | 256000/818627 [00:18<00:39, 14209.62 examples/s]
Filter: 31%|███▏ | 256000/818627 [00:18<00:39, 14259.94 examples/s]
Filter: 31%|███▏ | 256000/818627 [00:18<00:39, 14228.46 examples/s]
Filter: 31%|███ | 254000/818627 [00:18<00:40, 13942.17 examples/s]
Filter: 31%|███ | 254000/818627 [00:18<00:40, 13962.75 examples/s]
Filter: 31%|███▏ | 256000/818627 [00:18<00:40, 14051.54 examples/s]
Filter: 31%|███ | 254000/818627 [00:18<00:40, 14002.08 examples/s]
Filter: 32%|███▏ | 258000/818627 [00:18<00:39, 14257.81 examples/s]
Filter: 32%|███▏ | 258000/818627 [00:18<00:39, 14272.66 examples/s]
Filter: 32%|███▏ | 258000/818627 [00:18<00:39, 14225.56 examples/s]
Filter: 32%|███▏ | 258000/818627 [00:18<00:39, 14133.25 examples/s]
Filter: 31%|███▏ | 256000/818627 [00:18<00:40, 13988.30 examples/s]
Filter: 31%|███▏ | 256000/818627 [00:18<00:40, 14036.58 examples/s]
Filter: 32%|███▏ | 258000/818627 [00:18<00:39, 14096.73 examples/s]
Filter: 31%|███▏ | 256000/818627 [00:18<00:40, 14001.06 examples/s]
Filter: 32%|███▏ | 260000/818627 [00:18<00:39, 14308.78 examples/s]
Filter: 32%|███▏ | 260000/818627 [00:18<00:39, 14255.51 examples/s]
Filter: 32%|███▏ | 260000/818627 [00:18<00:39, 14197.76 examples/s]
Filter: 32%|███▏ | 260000/818627 [00:18<00:39, 14022.37 examples/s]
Filter: 32%|███▏ | 258000/818627 [00:18<00:40, 13989.70 examples/s]
Filter: 32%|███▏ | 258000/818627 [00:19<00:39, 14033.00 examples/s]
Filter: 32%|███▏ | 260000/818627 [00:18<00:39, 14013.11 examples/s]
Filter: 32%|███▏ | 258000/818627 [00:18<00:40, 13713.90 examples/s]
Filter: 32%|███▏ | 262000/818627 [00:18<00:38, 14368.39 examples/s]
Filter: 32%|███▏ | 262000/818627 [00:18<00:39, 14206.50 examples/s]
Filter: 32%|███▏ | 262000/818627 [00:18<00:39, 14197.46 examples/s]
Filter: 32%|███▏ | 262000/818627 [00:18<00:39, 14069.87 examples/s]
Filter: 32%|███▏ | 260000/818627 [00:18<00:40, 13886.48 examples/s]
Filter: 32%|███▏ | 260000/818627 [00:19<00:40, 13936.33 examples/s]
Filter: 32%|███▏ | 262000/818627 [00:18<00:40, 13885.45 examples/s]
Filter: 32%|███▏ | 260000/818627 [00:18<00:40, 13675.67 examples/s]
Filter: 32%|███▏ | 264000/818627 [00:18<00:39, 14185.25 examples/s]
Filter: 32%|███▏ | 264000/818627 [00:19<00:39, 14137.64 examples/s]
Filter: 32%|███▏ | 264000/818627 [00:19<00:39, 14173.98 examples/s]
Filter: 32%|███▏ | 264000/818627 [00:19<00:39, 13932.58 examples/s]
Filter: 32%|███▏ | 262000/818627 [00:19<00:40, 13875.18 examples/s]
Filter: 32%|███▏ | 262000/818627 [00:19<00:39, 13953.77 examples/s]
Filter: 32%|███▏ | 264000/818627 [00:19<00:39, 14013.35 examples/s]
Filter: 32%|███▏ | 266000/818627 [00:19<00:38, 14269.29 examples/s]
Filter: 32%|███▏ | 262000/818627 [00:19<00:40, 13717.18 examples/s]
Filter: 32%|███▏ | 266000/818627 [00:19<00:39, 14167.52 examples/s]
Filter: 32%|███▏ | 266000/818627 [00:19<00:38, 14188.68 examples/s]
Filter: 32%|███▏ | 266000/818627 [00:19<00:39, 13941.59 examples/s]
Filter: 32%|███▏ | 264000/818627 [00:19<00:40, 13799.96 examples/s]
Filter: 32%|███▏ | 264000/818627 [00:19<00:39, 13978.10 examples/s]
Filter: 32%|███▏ | 266000/818627 [00:19<00:39, 14099.99 examples/s]
Filter: 33%|███▎ | 268000/818627 [00:19<00:38, 14346.78 examples/s]
Filter: 32%|███▏ | 264000/818627 [00:19<00:40, 13780.81 examples/s]
Filter: 33%|███▎ | 268000/818627 [00:19<00:38, 14212.96 examples/s]
Filter: 33%|███▎ | 268000/818627 [00:19<00:38, 14187.90 examples/s]
Filter: 33%|███▎ | 268000/818627 [00:19<00:39, 14034.52 examples/s]
Filter: 32%|███▏ | 266000/818627 [00:19<00:39, 13866.28 examples/s]
Filter: 32%|███▏ | 266000/818627 [00:19<00:39, 13963.39 examples/s]
Filter: 33%|███▎ | 268000/818627 [00:19<00:39, 14029.27 examples/s]
Filter: 33%|███▎ | 270000/818627 [00:19<00:38, 14281.48 examples/s]
Filter: 33%|███▎ | 270000/818627 [00:19<00:38, 14210.49 examples/s]
Filter: 33%|███▎ | 270000/818627 [00:19<00:38, 14217.53 examples/s]
Filter: 32%|███▏ | 266000/818627 [00:19<00:39, 13826.03 examples/s]
Filter: 33%|███▎ | 270000/818627 [00:19<00:38, 14120.72 examples/s]
Filter: 33%|███▎ | 268000/818627 [00:19<00:39, 13901.39 examples/s]
Filter: 33%|███▎ | 268000/818627 [00:19<00:39, 13988.99 examples/s]
Filter: 33%|███▎ | 270000/818627 [00:19<00:38, 14106.81 examples/s]
Filter: 33%|███▎ | 272000/818627 [00:19<00:38, 14362.21 examples/s]
Filter: 33%|███▎ | 272000/818627 [00:19<00:38, 14204.51 examples/s]
Filter: 33%|███▎ | 272000/818627 [00:19<00:38, 14214.53 examples/s]
Filter: 33%|███▎ | 268000/818627 [00:19<00:39, 13860.90 examples/s]
Filter: 33%|███▎ | 272000/818627 [00:19<00:38, 14050.38 examples/s]
Filter: 33%|███▎ | 270000/818627 [00:19<00:39, 13934.81 examples/s]
Filter: 33%|███▎ | 270000/818627 [00:19<00:39, 14023.00 examples/s]
Filter: 33%|███▎ | 272000/818627 [00:19<00:38, 14164.59 examples/s]
Filter: 33%|███▎ | 274000/818627 [00:19<00:37, 14434.37 examples/s]
Filter: 33%|███▎ | 274000/818627 [00:19<00:38, 14219.81 examples/s]
Filter: 33%|███▎ | 274000/818627 [00:19<00:38, 14154.65 examples/s]
Filter: 33%|███▎ | 270000/818627 [00:19<00:39, 13872.76 examples/s]
Filter: 33%|███▎ | 274000/818627 [00:19<00:38, 14104.49 examples/s]
Filter: 33%|███▎ | 272000/818627 [00:19<00:39, 13957.33 examples/s]
Filter: 33%|███▎ | 272000/818627 [00:20<00:39, 13859.58 examples/s]
Filter: 34%|███▎ | 276000/818627 [00:19<00:37, 14470.64 examples/s]
Filter: 33%|███▎ | 274000/818627 [00:19<00:39, 13832.10 examples/s]
Filter: 34%|███▎ | 276000/818627 [00:19<00:38, 14195.13 examples/s]
Filter: 34%|███▎ | 276000/818627 [00:19<00:38, 14163.02 examples/s]
Filter: 33%|███▎ | 272000/818627 [00:19<00:39, 13724.95 examples/s]
Filter: 34%|███▎ | 276000/818627 [00:19<00:38, 14116.25 examples/s]
Filter: 33%|███▎ | 274000/818627 [00:19<00:39, 13962.67 examples/s]
Filter: 33%|███▎ | 274000/818627 [00:20<00:39, 13885.39 examples/s]
Filter: 34%|███▍ | 278000/818627 [00:19<00:37, 14445.52 examples/s]
Filter: 34%|███▎ | 276000/818627 [00:19<00:39, 13804.04 examples/s]
Filter: 34%|███▍ | 278000/818627 [00:19<00:38, 14149.32 examples/s]
Filter: 34%|███▍ | 278000/818627 [00:19<00:38, 14155.34 examples/s]
Filter: 34%|███▍ | 278000/818627 [00:20<00:38, 14115.28 examples/s]
Filter: 33%|███▎ | 274000/818627 [00:20<00:39, 13617.09 examples/s]
Filter: 34%|███▎ | 276000/818627 [00:20<00:38, 13982.11 examples/s]
Filter: 34%|███▍ | 280000/818627 [00:20<00:37, 14434.93 examples/s]
Filter: 34%|███▎ | 276000/818627 [00:20<00:38, 13922.18 examples/s]
Filter: 34%|███▍ | 278000/818627 [00:20<00:38, 13894.49 examples/s]
Filter: 34%|███▍ | 280000/818627 [00:20<00:38, 14162.57 examples/s]
Filter: 34%|███▍ | 280000/818627 [00:20<00:38, 14142.92 examples/s]
Filter: 34%|███▍ | 280000/818627 [00:20<00:38, 14140.03 examples/s]
Filter: 34%|███▎ | 276000/818627 [00:20<00:39, 13667.49 examples/s]
Filter: 34%|███▍ | 278000/818627 [00:20<00:38, 13979.12 examples/s]
Filter: 34%|███▍ | 282000/818627 [00:20<00:37, 14332.93 examples/s]
Filter: 34%|███▍ | 278000/818627 [00:20<00:38, 13908.38 examples/s]
Filter: 34%|███▍ | 280000/818627 [00:20<00:38, 13974.47 examples/s]
Filter: 34%|███▍ | 282000/818627 [00:20<00:37, 14144.21 examples/s]
Filter: 34%|███▍ | 282000/818627 [00:20<00:38, 14027.12 examples/s]
Filter: 34%|███▍ | 282000/818627 [00:20<00:37, 14140.19 examples/s]
Filter: 34%|███▍ | 278000/818627 [00:20<00:39, 13697.83 examples/s]
Filter: 34%|███▍ | 280000/818627 [00:20<00:38, 13995.26 examples/s]
Filter: 35%|███▍ | 284000/818627 [00:20<00:37, 14385.63 examples/s]
Filter: 34%|███▍ | 280000/818627 [00:20<00:38, 13916.87 examples/s]
Filter: 34%|███▍ | 282000/818627 [00:20<00:38, 14053.64 examples/s]
Filter: 35%|███▍ | 284000/818627 [00:20<00:38, 14052.34 examples/s]
Filter: 35%|███▍ | 284000/818627 [00:20<00:38, 13989.25 examples/s]
Filter: 35%|███▍ | 284000/818627 [00:20<00:37, 14153.86 examples/s]
Filter: 34%|███▍ | 280000/818627 [00:20<00:39, 13758.64 examples/s]
Filter: 34%|███▍ | 282000/818627 [00:20<00:38, 14023.50 examples/s]
Filter: 35%|███▍ | 286000/818627 [00:20<00:37, 14303.22 examples/s]
Filter: 35%|███▍ | 284000/818627 [00:20<00:37, 14127.61 examples/s]
Filter: 34%|███▍ | 282000/818627 [00:20<00:39, 13682.80 examples/s]
Filter: 35%|███▍ | 286000/818627 [00:20<00:37, 14098.56 examples/s]
Filter: 35%|███▍ | 286000/818627 [00:20<00:37, 14039.07 examples/s]
Filter: 35%|███▍ | 286000/818627 [00:20<00:37, 14197.44 examples/s]
Filter: 34%|███▍ | 282000/818627 [00:20<00:39, 13577.37 examples/s]
Filter: 35%|███▍ | 284000/818627 [00:20<00:38, 14022.60 examples/s]
Filter: 35%|███▌ | 288000/818627 [00:20<00:37, 14249.98 examples/s]
Filter: 35%|███▍ | 286000/818627 [00:20<00:37, 14176.17 examples/s]
Filter: 35%|███▍ | 284000/818627 [00:20<00:38, 13734.83 examples/s]
Filter: 35%|███▌ | 288000/818627 [00:20<00:37, 14140.06 examples/s]
Filter: 35%|███▌ | 288000/818627 [00:20<00:37, 14101.76 examples/s]
Filter: 35%|███▌ | 288000/818627 [00:20<00:37, 14213.00 examples/s]
Filter: 35%|███▍ | 284000/818627 [00:20<00:39, 13557.54 examples/s]
Filter: 35%|███▍ | 286000/818627 [00:20<00:38, 13899.30 examples/s]
Filter: 35%|███▌ | 290000/818627 [00:20<00:37, 14001.50 examples/s]
Filter: 35%|███▌ | 288000/818627 [00:20<00:37, 14177.18 examples/s]
Filter: 35%|███▍ | 286000/818627 [00:21<00:38, 13812.73 examples/s]
Filter: 35%|███▌ | 290000/818627 [00:20<00:37, 14152.89 examples/s]
Filter: 35%|███▌ | 290000/818627 [00:20<00:37, 14155.95 examples/s]
Filter: 35%|███▌ | 290000/818627 [00:20<00:37, 14234.97 examples/s]
Filter: 35%|███▍ | 286000/818627 [00:20<00:39, 13532.16 examples/s]
Filter: 35%|███▌ | 288000/818627 [00:20<00:38, 13932.94 examples/s]
Filter: 36%|███▌ | 292000/818627 [00:20<00:37, 14119.19 examples/s]
Filter: 35%|███▌ | 290000/818627 [00:20<00:37, 14200.99 examples/s]
Filter: 35%|███▌ | 288000/818627 [00:21<00:38, 13843.00 examples/s]
Filter: 36%|███▌ | 292000/818627 [00:20<00:37, 14168.75 examples/s]
Filter: 36%|███▌ | 292000/818627 [00:20<00:37, 14192.04 examples/s]
Filter: 36%|███▌ | 292000/818627 [00:20<00:36, 14258.36 examples/s]
Filter: 35%|███▌ | 288000/818627 [00:21<00:38, 13655.90 examples/s]
Filter: 35%|███▌ | 290000/818627 [00:21<00:37, 13951.94 examples/s]
Filter: 36%|███▌ | 294000/818627 [00:21<00:36, 14252.75 examples/s]
Filter: 36%|███▌ | 292000/818627 [00:21<00:37, 14216.58 examples/s]
Filter: 35%|███▌ | 290000/818627 [00:21<00:38, 13861.67 examples/s]
Filter: 36%|███▌ | 294000/818627 [00:21<00:36, 14210.74 examples/s]
Filter: 36%|███▌ | 294000/818627 [00:21<00:37, 14065.15 examples/s]
Filter: 36%|███▌ | 294000/818627 [00:21<00:36, 14282.21 examples/s]
Filter: 35%|███▌ | 290000/818627 [00:21<00:38, 13747.72 examples/s]
Filter: 36%|███▌ | 292000/818627 [00:21<00:37, 13984.79 examples/s]
Filter: 36%|███▌ | 296000/818627 [00:21<00:36, 14334.90 examples/s]
Filter: 36%|███▌ | 294000/818627 [00:21<00:36, 14242.61 examples/s]
Filter: 36%|███▌ | 296000/818627 [00:21<00:36, 14191.11 examples/s]
Filter: 36%|███▌ | 292000/818627 [00:21<00:37, 13896.10 examples/s]
Filter: 36%|███▌ | 296000/818627 [00:21<00:37, 14114.73 examples/s]
Filter: 36%|███▌ | 296000/818627 [00:21<00:36, 14213.47 examples/s]
Filter: 36%|███▌ | 292000/818627 [00:21<00:38, 13674.62 examples/s]
Filter: 36%|███▌ | 294000/818627 [00:21<00:37, 14002.49 examples/s]
Filter: 36%|███▋ | 298000/818627 [00:21<00:36, 14383.07 examples/s]
Filter: 36%|███▌ | 296000/818627 [00:21<00:36, 14229.74 examples/s]
Filter: 36%|███▋ | 298000/818627 [00:21<00:36, 14166.97 examples/s]
Filter: 36%|███▌ | 294000/818627 [00:21<00:37, 13910.11 examples/s]
Filter: 36%|███▋ | 298000/818627 [00:21<00:36, 14223.71 examples/s]
Filter: 36%|███▋ | 298000/818627 [00:21<00:37, 14027.24 examples/s]
Filter: 36%|███▌ | 294000/818627 [00:21<00:38, 13753.48 examples/s]
Filter: 36%|███▌ | 296000/818627 [00:21<00:37, 13818.38 examples/s]
Filter: 37%|███▋ | 300000/818627 [00:21<00:36, 14297.79 examples/s]
Filter: 36%|███▋ | 298000/818627 [00:21<00:36, 14110.45 examples/s]
Filter: 37%|███▋ | 300000/818627 [00:21<00:36, 14035.10 examples/s]
Filter: 37%|███▋ | 300000/818627 [00:21<00:36, 14233.81 examples/s]
Filter: 37%|███▋ | 300000/818627 [00:21<00:36, 14114.57 examples/s]
Filter: 36%|███▌ | 296000/818627 [00:21<00:37, 13789.53 examples/s]
Filter: 36%|███▌ | 296000/818627 [00:21<00:37, 13814.38 examples/s]
Filter: 36%|███▋ | 298000/818627 [00:21<00:37, 13708.05 examples/s]
Filter: 37%|███▋ | 302000/818627 [00:21<00:36, 14332.01 examples/s]
Filter: 37%|███▋ | 300000/818627 [00:21<00:36, 14147.62 examples/s]
Filter: 37%|███▋ | 302000/818627 [00:21<00:36, 14234.46 examples/s]
Filter: 37%|███▋ | 302000/818627 [00:21<00:36, 14087.20 examples/s]
Filter: 37%|███▋ | 302000/818627 [00:21<00:36, 14146.58 examples/s]
Filter: 36%|███▋ | 298000/818627 [00:21<00:37, 13847.83 examples/s]
Filter: 36%|███▋ | 298000/818627 [00:21<00:37, 13853.60 examples/s]
Filter: 37%|███▋ | 300000/818627 [00:21<00:37, 13797.54 examples/s]
Filter: 37%|███▋ | 304000/818627 [00:21<00:35, 14402.82 examples/s]
Filter: 37%|███▋ | 302000/818627 [00:21<00:36, 14074.91 examples/s]
Filter: 37%|███▋ | 304000/818627 [00:21<00:36, 14131.11 examples/s]
Filter: 37%|███▋ | 304000/818627 [00:21<00:36, 14174.83 examples/s]
Filter: 37%|███▋ | 304000/818627 [00:21<00:36, 14208.37 examples/s]
Filter: 37%|███▋ | 300000/818627 [00:22<00:37, 13860.72 examples/s]
Filter: 37%|███▋ | 300000/818627 [00:21<00:37, 13754.99 examples/s]
Filter: 37%|███▋ | 302000/818627 [00:21<00:37, 13878.45 examples/s]
Filter: 37%|███▋ | 306000/818627 [00:21<00:35, 14314.28 examples/s]
Filter: 37%|███▋ | 304000/818627 [00:21<00:36, 13997.88 examples/s]
Filter: 37%|███▋ | 306000/818627 [00:21<00:36, 14164.19 examples/s]
Filter: 37%|███▋ | 306000/818627 [00:21<00:35, 14240.26 examples/s]
Filter: 37%|███▋ | 306000/818627 [00:21<00:36, 14194.40 examples/s]
Filter: 37%|███▋ | 302000/818627 [00:22<00:37, 13720.48 examples/s]
Filter: 37%|███▋ | 302000/818627 [00:22<00:37, 13778.17 examples/s]
Filter: 37%|███▋ | 304000/818627 [00:22<00:37, 13687.89 examples/s]
Filter: 37%|███▋ | 306000/818627 [00:22<00:36, 14040.53 examples/s]
Filter: 37%|███▋ | 304000/818627 [00:22<00:37, 13583.32 examples/s]
Filter: 37%|███▋ | 304000/818627 [00:22<00:37, 13812.66 examples/s]
Filter: 37%|███▋ | 306000/818627 [00:22<00:37, 13782.62 examples/s]
Filter: 37%|███▋ | 306000/818627 [00:22<00:37, 13590.61 examples/s]
Filter: 37%|███▋ | 306000/818627 [00:22<00:37, 13811.96 examples/s]
Filter: 38%|███▊ | 308000/818627 [00:22<01:00, 8426.86 examples/s]
Filter: 38%|███▊ | 308000/818627 [00:22<00:37, 13573.18 examples/s]
Filter: 38%|███▊ | 308000/818627 [00:22<01:02, 8131.74 examples/s]
Filter: 38%|███▊ | 308000/818627 [00:22<01:02, 8124.68 examples/s]
Filter: 38%|███▊ | 308000/818627 [00:22<01:02, 8106.88 examples/s]
Filter: 38%|███▊ | 310000/818627 [00:22<00:53, 9428.46 examples/s]
Filter: 38%|███▊ | 308000/818627 [00:22<01:01, 8332.30 examples/s]
Filter: 38%|███▊ | 310000/818627 [00:22<00:37, 13694.54 examples/s]
Filter: 38%|███▊ | 310000/818627 [00:22<00:54, 9285.69 examples/s]
Filter: 38%|███▊ | 310000/818627 [00:22<00:55, 9214.16 examples/s]
Filter: 38%|███▊ | 310000/818627 [00:22<00:55, 9109.89 examples/s]
Filter: 38%|███▊ | 308000/818627 [00:22<01:00, 8425.14 examples/s]
Filter: 38%|███▊ | 312000/818627 [00:22<00:48, 10441.26 examples/s]
Filter: 38%|███▊ | 310000/818627 [00:22<00:53, 9442.74 examples/s]
Filter: 38%|███▊ | 312000/818627 [00:22<00:37, 13638.35 examples/s]
Filter: 38%|███▊ | 312000/818627 [00:22<00:49, 10304.23 examples/s]
Filter: 38%|███▊ | 312000/818627 [00:22<00:49, 10268.00 examples/s]
Filter: 38%|███▊ | 312000/818627 [00:22<00:50, 10111.69 examples/s]
Filter: 38%|███▊ | 310000/818627 [00:22<00:53, 9496.91 examples/s]
Filter: 38%|███▊ | 308000/818627 [00:22<01:02, 8128.63 examples/s]
Filter: 38%|███▊ | 314000/818627 [00:22<00:44, 11267.66 examples/s]
Filter: 38%|███▊ | 312000/818627 [00:22<00:48, 10447.92 examples/s]
Filter: 38%|███▊ | 314000/818627 [00:22<00:45, 11159.40 examples/s]
Filter: 38%|███▊ | 314000/818627 [00:22<00:45, 11168.17 examples/s]
Filter: 38%|███▊ | 314000/818627 [00:22<00:45, 11016.55 examples/s]
Filter: 38%|███▊ | 312000/818627 [00:22<00:48, 10483.19 examples/s]
Filter: 38%|███▊ | 310000/818627 [00:22<00:55, 9242.68 examples/s]
Filter: 39%|███▊ | 316000/818627 [00:22<00:41, 11987.13 examples/s]
Filter: 38%|███▊ | 314000/818627 [00:22<00:44, 11292.72 examples/s]
Filter: 39%|███▊ | 316000/818627 [00:23<00:42, 11919.35 examples/s]
Filter: 39%|███▊ | 316000/818627 [00:23<00:42, 11831.16 examples/s]
Filter: 39%|███▊ | 316000/818627 [00:23<00:42, 11823.34 examples/s]
Filter: 38%|███▊ | 312000/818627 [00:23<00:49, 10270.98 examples/s]
Filter: 38%|███▊ | 314000/818627 [00:23<00:45, 11207.75 examples/s]
Filter: 39%|███▉ | 318000/818627 [00:23<00:39, 12592.25 examples/s]
Filter: 39%|███▊ | 316000/818627 [00:23<00:41, 12018.68 examples/s]
Filter: 39%|███▉ | 318000/818627 [00:23<00:40, 12425.38 examples/s]
Filter: 39%|███▉ | 318000/818627 [00:23<00:40, 12427.39 examples/s]
Filter: 39%|███▉ | 318000/818627 [00:23<00:40, 12437.58 examples/s]
Filter: 38%|███▊ | 314000/818627 [00:23<01:01, 8224.08 examples/s]
Filter: 38%|███▊ | 314000/818627 [00:23<00:45, 11147.00 examples/s]
Filter: 39%|███▊ | 316000/818627 [00:23<00:42, 11936.56 examples/s]
Filter: 39%|███▉ | 320000/818627 [00:23<00:38, 13056.83 examples/s]
Filter: 39%|███▉ | 318000/818627 [00:23<00:39, 12577.62 examples/s]
Filter: 39%|███▉ | 320000/818627 [00:23<00:38, 12913.31 examples/s]
Filter: 39%|███▉ | 320000/818627 [00:23<00:38, 12896.75 examples/s]
Filter: 39%|███▉ | 320000/818627 [00:23<00:38, 12924.26 examples/s]
Filter: 39%|███▊ | 316000/818627 [00:23<00:53, 9422.65 examples/s]
Filter: 39%|███▉ | 318000/818627 [00:23<00:40, 12490.81 examples/s]
Filter: 39%|███▉ | 322000/818627 [00:23<00:37, 13284.35 examples/s]
Filter: 39%|███▊ | 316000/818627 [00:23<00:42, 11796.68 examples/s]
Filter: 39%|███▉ | 320000/818627 [00:23<00:38, 12925.80 examples/s]
Filter: 39%|███▉ | 322000/818627 [00:23<00:37, 13248.31 examples/s]
Filter: 39%|███▉ | 322000/818627 [00:23<00:37, 13261.20 examples/s]
Filter: 39%|███▉ | 322000/818627 [00:23<00:37, 13307.31 examples/s]
Filter: 39%|███▉ | 318000/818627 [00:23<00:47, 10507.50 examples/s]
Filter: 40%|███▉ | 324000/818627 [00:23<00:36, 13454.85 examples/s]
Filter: 39%|███▉ | 320000/818627 [00:23<00:38, 12807.95 examples/s]
Filter: 39%|███▉ | 318000/818627 [00:23<00:40, 12369.50 examples/s]
Filter: 39%|███▉ | 322000/818627 [00:23<00:37, 13174.81 examples/s]
Filter: 40%|███▉ | 324000/818627 [00:23<00:36, 13443.19 examples/s]
Filter: 40%|███▉ | 324000/818627 [00:23<00:36, 13516.69 examples/s]
Filter: 39%|███▉ | 320000/818627 [00:23<00:43, 11434.39 examples/s]
Filter: 40%|███▉ | 324000/818627 [00:23<00:36, 13474.29 examples/s]
Filter: 40%|███▉ | 326000/818627 [00:23<00:36, 13635.88 examples/s]
Filter: 39%|███▉ | 322000/818627 [00:23<00:37, 13162.95 examples/s]
Filter: 39%|███▉ | 320000/818627 [00:23<00:38, 12806.00 examples/s]
Filter: 40%|███▉ | 324000/818627 [00:23<00:36, 13396.33 examples/s]
Filter: 40%|███▉ | 326000/818627 [00:23<00:35, 13709.09 examples/s]
Filter: 40%|███▉ | 326000/818627 [00:23<00:36, 13571.97 examples/s]
Filter: 39%|███▉ | 322000/818627 [00:23<00:40, 12171.47 examples/s]
Filter: 40%|███▉ | 326000/818627 [00:23<00:36, 13675.24 examples/s]
Filter: 40%|███▉ | 324000/818627 [00:23<00:36, 13407.41 examples/s]
Filter: 40%|████ | 328000/818627 [00:23<00:35, 13642.82 examples/s]
Filter: 39%|███▉ | 322000/818627 [00:23<00:37, 13092.71 examples/s]
Filter: 40%|███▉ | 326000/818627 [00:23<00:36, 13606.26 examples/s]
Filter: 40%|████ | 328000/818627 [00:23<00:35, 13828.63 examples/s]
Filter: 40%|███▉ | 324000/818627 [00:24<00:38, 12759.83 examples/s]
Filter: 40%|████ | 328000/818627 [00:23<00:35, 13739.04 examples/s]
Filter: 40%|████ | 328000/818627 [00:23<00:35, 13864.94 examples/s]
Filter: 40%|███▉ | 326000/818627 [00:23<00:36, 13587.76 examples/s]
Filter: 40%|████ | 330000/818627 [00:23<00:35, 13702.91 examples/s]
Filter: 40%|███▉ | 324000/818627 [00:23<00:37, 13231.18 examples/s]
Filter: 40%|████ | 328000/818627 [00:23<00:35, 13755.63 examples/s]
Filter: 40%|███▉ | 326000/818627 [00:24<00:37, 13227.60 examples/s]
Filter: 40%|████ | 330000/818627 [00:24<00:35, 13924.29 examples/s]
Filter: 40%|████ | 330000/818627 [00:24<00:35, 13897.01 examples/s]
Filter: 40%|████ | 330000/818627 [00:24<00:34, 14001.62 examples/s]
Filter: 41%|████ | 332000/818627 [00:24<00:35, 13872.41 examples/s]
Filter: 40%|████ | 328000/818627 [00:24<00:36, 13557.67 examples/s]
Filter: 40%|███▉ | 326000/818627 [00:24<00:36, 13382.06 examples/s]
Filter: 40%|████ | 330000/818627 [00:24<00:35, 13868.98 examples/s]
Filter: 41%|████ | 332000/818627 [00:24<00:34, 13975.53 examples/s]
Filter: 41%|████ | 332000/818627 [00:24<00:34, 14098.20 examples/s]
Filter: 41%|████ | 332000/818627 [00:24<00:34, 13911.72 examples/s]
Filter: 40%|████ | 328000/818627 [00:24<00:36, 13260.31 examples/s]
Filter: 41%|████ | 334000/818627 [00:24<00:34, 13974.55 examples/s]
Filter: 40%|████ | 330000/818627 [00:24<00:35, 13704.80 examples/s]
Filter: 40%|████ | 328000/818627 [00:24<00:36, 13534.64 examples/s]
Filter: 41%|████ | 332000/818627 [00:24<00:34, 13920.51 examples/s]
Filter: 41%|████ | 334000/818627 [00:24<00:34, 14113.89 examples/s]
Filter: 41%|████ | 334000/818627 [00:24<00:34, 13994.58 examples/s]
Filter: 41%|████ | 334000/818627 [00:24<00:34, 14016.44 examples/s]
Filter: 40%|████ | 330000/818627 [00:24<00:36, 13548.11 examples/s]
Filter: 41%|████ | 336000/818627 [00:24<00:34, 14051.49 examples/s]
Filter: 41%|████ | 332000/818627 [00:24<00:35, 13692.60 examples/s]
Filter: 40%|████ | 330000/818627 [00:24<00:36, 13545.62 examples/s]
Filter: 41%|████ | 334000/818627 [00:24<00:35, 13765.57 examples/s]
Filter: 41%|████ | 336000/818627 [00:24<00:34, 14086.73 examples/s]
Filter: 41%|████ | 336000/818627 [00:24<00:34, 14137.91 examples/s]
Filter: 41%|████ | 332000/818627 [00:24<00:35, 13696.56 examples/s]
Filter: 41%|████ | 336000/818627 [00:24<00:34, 13830.30 examples/s]
Filter: 41%|████▏ | 338000/818627 [00:24<00:34, 14124.92 examples/s]
Filter: 41%|████ | 334000/818627 [00:24<00:35, 13814.16 examples/s]
Filter: 41%|████ | 332000/818627 [00:24<00:35, 13675.89 examples/s]
Filter: 41%|████ | 336000/818627 [00:24<00:35, 13769.39 examples/s]
Filter: 41%|████▏ | 338000/818627 [00:24<00:33, 14158.22 examples/s]
Filter: 41%|████▏ | 338000/818627 [00:24<00:34, 14116.81 examples/s]
Filter: 41%|████▏ | 338000/818627 [00:24<00:34, 13989.33 examples/s]
Filter: 41%|████ | 334000/818627 [00:24<00:35, 13769.22 examples/s]
Filter: 42%|████▏ | 340000/818627 [00:24<00:34, 13840.97 examples/s]
Filter: 41%|████ | 336000/818627 [00:24<00:34, 13889.76 examples/s]
Filter: 41%|████ | 334000/818627 [00:24<00:35, 13658.50 examples/s]
Filter: 41%|████▏ | 338000/818627 [00:24<00:34, 13873.75 examples/s]
Filter: 42%|████▏ | 340000/818627 [00:24<00:33, 14167.37 examples/s]
Filter: 42%|████▏ | 340000/818627 [00:24<00:33, 14128.75 examples/s]
Filter: 42%|████▏ | 340000/818627 [00:24<00:34, 14074.03 examples/s]
Filter: 41%|████ | 336000/818627 [00:24<00:34, 13865.18 examples/s]
Filter: 42%|████▏ | 342000/818627 [00:24<00:34, 13905.62 examples/s]
Filter: 41%|████▏ | 338000/818627 [00:24<00:34, 13829.24 examples/s]
Filter: 41%|████ | 336000/818627 [00:24<00:35, 13697.72 examples/s]
Filter: 42%|████▏ | 340000/818627 [00:24<00:34, 13915.83 examples/s]
Filter: 42%|████▏ | 342000/818627 [00:24<00:33, 14108.33 examples/s]
Filter: 42%|████▏ | 342000/818627 [00:24<00:33, 14082.98 examples/s]
Filter: 42%|████▏ | 342000/818627 [00:24<00:33, 14120.52 examples/s]
Filter: 41%|████▏ | 338000/818627 [00:25<00:34, 14039.77 examples/s]
Filter: 42%|████▏ | 344000/818627 [00:24<00:34, 13905.55 examples/s]
Filter: 42%|████▏ | 340000/818627 [00:24<00:34, 13705.13 examples/s]
Filter: 41%|████▏ | 338000/818627 [00:25<00:35, 13673.71 examples/s]
Filter: 42%|████▏ | 342000/818627 [00:25<00:34, 13981.91 examples/s]
Filter: 42%|████▏ | 344000/818627 [00:25<00:33, 14154.36 examples/s]
Filter: 42%|████▏ | 344000/818627 [00:25<00:33, 14129.34 examples/s]
Filter: 42%|████▏ | 344000/818627 [00:25<00:33, 14192.59 examples/s]
Filter: 42%|████▏ | 340000/818627 [00:25<00:34, 13949.34 examples/s]
Filter: 42%|████▏ | 346000/818627 [00:25<00:33, 14033.65 examples/s]
Filter: 42%|████▏ | 342000/818627 [00:25<00:34, 13656.12 examples/s]
Filter: 42%|████▏ | 340000/818627 [00:25<00:34, 13761.18 examples/s]
Filter: 42%|████▏ | 344000/818627 [00:25<00:33, 14011.23 examples/s]
Filter: 42%|████▏ | 346000/818627 [00:25<00:33, 14045.99 examples/s]
Filter: 42%|████▏ | 346000/818627 [00:25<00:33, 14058.29 examples/s]
Filter: 42%|████▏ | 346000/818627 [00:25<00:33, 14122.67 examples/s]
Filter: 42%|████▏ | 342000/818627 [00:25<00:34, 13960.88 examples/s]
Filter: 43%|████▎ | 348000/818627 [00:25<00:33, 14103.00 examples/s]
Filter: 42%|████▏ | 344000/818627 [00:25<00:34, 13754.62 examples/s]
Filter: 42%|████▏ | 342000/818627 [00:25<00:34, 13819.31 examples/s]
Filter: 42%|████▏ | 346000/818627 [00:25<00:33, 14036.92 examples/s]
Filter: 43%|████▎ | 348000/818627 [00:25<00:33, 13957.44 examples/s]
Filter: 43%|████▎ | 348000/818627 [00:25<00:33, 14016.94 examples/s]
Filter: 43%|████▎ | 348000/818627 [00:25<00:33, 13965.26 examples/s]
Filter: 42%|████▏ | 344000/818627 [00:25<00:33, 14003.71 examples/s]
Filter: 43%|████▎ | 350000/818627 [00:25<00:33, 14150.18 examples/s]
Filter: 42%|████▏ | 346000/818627 [00:25<00:34, 13836.18 examples/s]
Filter: 42%|████▏ | 344000/818627 [00:25<00:34, 13863.62 examples/s]
Filter: 43%|████▎ | 348000/818627 [00:25<00:33, 13951.43 examples/s]
Filter: 43%|████▎ | 350000/818627 [00:25<00:33, 14024.50 examples/s]
Filter: 43%|████▎ | 350000/818627 [00:25<00:33, 14056.58 examples/s]
Filter: 42%|████▏ | 346000/818627 [00:25<00:33, 14107.07 examples/s]
Filter: 43%|████▎ | 350000/818627 [00:25<00:33, 13947.54 examples/s]
Filter: 43%|████▎ | 352000/818627 [00:25<00:32, 14210.71 examples/s]
Filter: 43%|████▎ | 348000/818627 [00:25<00:34, 13786.27 examples/s]
Filter: 42%|████▏ | 346000/818627 [00:25<00:34, 13774.26 examples/s]
Filter: 43%|████▎ | 350000/818627 [00:25<00:33, 13884.67 examples/s]
Filter: 43%|████▎ | 348000/818627 [00:25<00:33, 14198.22 examples/s]
Filter: 43%|████▎ | 352000/818627 [00:25<00:33, 14066.57 examples/s]
Filter: 43%|████▎ | 352000/818627 [00:25<00:33, 14082.79 examples/s]
Filter: 43%|████▎ | 352000/818627 [00:25<00:33, 13999.98 examples/s]
Filter: 43%|████▎ | 354000/818627 [00:25<00:32, 14177.74 examples/s]
Filter: 43%|████▎ | 350000/818627 [00:25<00:33, 13850.88 examples/s]
Filter: 43%|████▎ | 348000/818627 [00:25<00:33, 13853.21 examples/s]
Filter: 43%|████▎ | 352000/818627 [00:25<00:33, 13848.69 examples/s]
Filter: 43%|████▎ | 350000/818627 [00:25<00:32, 14266.98 examples/s]
Filter: 43%|████▎ | 354000/818627 [00:25<00:32, 14145.54 examples/s]
Filter: 43%|████▎ | 354000/818627 [00:25<00:32, 14120.00 examples/s]
Filter: 43%|████▎ | 354000/818627 [00:25<00:33, 14004.29 examples/s]
Filter: 43%|████▎ | 356000/818627 [00:25<00:32, 14083.37 examples/s]
Filter: 43%|████▎ | 352000/818627 [00:25<00:33, 13918.21 examples/s]
Filter: 43%|████▎ | 350000/818627 [00:25<00:34, 13774.53 examples/s]
Filter: 43%|████▎ | 352000/818627 [00:26<00:33, 14078.67 examples/s]
Filter: 43%|████▎ | 356000/818627 [00:25<00:32, 14033.08 examples/s]
Filter: 43%|████▎ | 356000/818627 [00:25<00:33, 14004.30 examples/s]
Filter: 43%|████▎ | 354000/818627 [00:25<00:34, 13459.55 examples/s]
Filter: 43%|████▎ | 356000/818627 [00:25<00:33, 13981.80 examples/s]
Filter: 44%|████▎ | 358000/818627 [00:25<00:32, 14126.66 examples/s]
Filter: 43%|████▎ | 354000/818627 [00:26<00:34, 13615.72 examples/s]
Filter: 43%|████▎ | 352000/818627 [00:26<00:33, 13740.86 examples/s]
Filter: 44%|████▎ | 358000/818627 [00:26<00:32, 14074.55 examples/s]
Filter: 44%|████▎ | 358000/818627 [00:26<00:32, 14074.56 examples/s]
Filter: 43%|████▎ | 354000/818627 [00:26<00:33, 14041.12 examples/s]
Filter: 44%|████▎ | 358000/818627 [00:26<00:32, 14102.26 examples/s]
Filter: 43%|████▎ | 356000/818627 [00:26<00:34, 13411.34 examples/s]
Filter: 44%|████▍ | 360000/818627 [00:26<00:32, 14204.65 examples/s]
Filter: 43%|████▎ | 356000/818627 [00:26<00:33, 13708.91 examples/s]
Filter: 43%|████▎ | 354000/818627 [00:26<00:33, 13826.93 examples/s]
Filter: 43%|████▎ | 356000/818627 [00:26<00:32, 14158.88 examples/s]
Filter: 44%|████▍ | 360000/818627 [00:26<00:32, 14124.21 examples/s]
Filter: 44%|████▍ | 360000/818627 [00:26<00:32, 14182.60 examples/s]
Filter: 44%|████▍ | 360000/818627 [00:26<00:32, 14059.45 examples/s]
Filter: 44%|████▎ | 358000/818627 [00:26<00:33, 13617.18 examples/s]
Filter: 44%|████▍ | 362000/818627 [00:26<00:32, 14269.29 examples/s]
Filter: 44%|████▎ | 358000/818627 [00:26<00:33, 13701.91 examples/s]
Filter: 43%|████▎ | 356000/818627 [00:26<00:33, 13790.70 examples/s]
Filter: 44%|████▍ | 362000/818627 [00:26<00:32, 14155.48 examples/s]
Filter: 44%|████▎ | 358000/818627 [00:26<00:32, 14117.68 examples/s]
Filter: 44%|████▍ | 362000/818627 [00:26<00:32, 14126.87 examples/s]
Filter: 44%|████▍ | 362000/818627 [00:26<00:32, 14104.50 examples/s]
Filter: 44%|████▍ | 360000/818627 [00:26<00:33, 13631.95 examples/s]
Filter: 44%|████▍ | 364000/818627 [00:26<00:31, 14265.81 examples/s]
Filter: 44%|████▍ | 360000/818627 [00:26<00:33, 13777.42 examples/s]
Filter: 44%|████▍ | 360000/818627 [00:26<00:32, 14065.62 examples/s]
Filter: 44%|████▍ | 364000/818627 [00:26<00:32, 14088.90 examples/s]
Filter: 44%|████▍ | 364000/818627 [00:26<00:32, 14119.56 examples/s]
Filter: 44%|████▍ | 364000/818627 [00:26<00:32, 14003.76 examples/s]
Filter: 44%|████▎ | 358000/818627 [00:26<00:33, 13710.08 examples/s]
Filter: 44%|████▍ | 362000/818627 [00:26<00:33, 13619.11 examples/s]
Filter: 45%|████▍ | 366000/818627 [00:26<00:32, 14130.00 examples/s]
Filter: 44%|████▍ | 362000/818627 [00:26<00:33, 13834.54 examples/s]
Filter: 44%|████▍ | 362000/818627 [00:26<00:32, 14137.53 examples/s]
Filter: 45%|████▍ | 366000/818627 [00:26<00:32, 14079.93 examples/s]
Filter: 45%|████▍ | 366000/818627 [00:26<00:32, 14083.23 examples/s]
Filter: 45%|████▍ | 366000/818627 [00:26<00:32, 14106.26 examples/s]
Filter: 44%|████▍ | 360000/818627 [00:26<00:33, 13743.88 examples/s]
Filter: 44%|████▍ | 364000/818627 [00:26<00:33, 13610.58 examples/s]
Filter: 45%|████▍ | 368000/818627 [00:26<00:32, 14067.56 examples/s]
Filter: 44%|████▍ | 364000/818627 [00:26<00:31, 14224.25 examples/s]
Filter: 44%|████▍ | 364000/818627 [00:26<00:32, 13915.27 examples/s]
Filter: 45%|████▍ | 368000/818627 [00:26<00:31, 14137.04 examples/s]
Filter: 45%|████▍ | 368000/818627 [00:26<00:31, 14110.23 examples/s]
Filter: 45%|████▍ | 368000/818627 [00:26<00:32, 14032.30 examples/s]
Filter: 44%|████▍ | 362000/818627 [00:26<00:33, 13682.51 examples/s]
Filter: 45%|████▍ | 366000/818627 [00:26<00:32, 13772.28 examples/s]
Filter: 45%|████▌ | 370000/818627 [00:26<00:31, 14131.11 examples/s]
Filter: 45%|████▍ | 366000/818627 [00:26<00:32, 13973.60 examples/s]
Filter: 45%|████▍ | 366000/818627 [00:27<00:32, 14139.16 examples/s]
Filter: 45%|████▌ | 370000/818627 [00:26<00:31, 14179.60 examples/s]
Filter: 45%|████▌ | 370000/818627 [00:26<00:31, 14110.55 examples/s]
Filter: 45%|████▌ | 370000/818627 [00:26<00:31, 14056.51 examples/s]
Filter: 44%|████▍ | 364000/818627 [00:26<00:33, 13763.84 examples/s]
Filter: 45%|████▍ | 368000/818627 [00:26<00:32, 13882.36 examples/s]
Filter: 45%|████▌ | 372000/818627 [00:26<00:31, 14187.38 examples/s]
Filter: 45%|████▍ | 368000/818627 [00:27<00:31, 14206.51 examples/s]
Filter: 45%|████▌ | 372000/818627 [00:27<00:31, 14203.54 examples/s]
Filter: 45%|████▍ | 368000/818627 [00:27<00:32, 13907.94 examples/s]
Filter: 45%|████▌ | 372000/818627 [00:27<00:31, 14143.92 examples/s]
Filter: 45%|████▌ | 372000/818627 [00:27<00:31, 14112.46 examples/s]
Filter: 45%|████▍ | 366000/818627 [00:27<00:32, 13726.90 examples/s]
Filter: 45%|████▌ | 370000/818627 [00:27<00:32, 13836.31 examples/s]
Filter: 46%|████▌ | 374000/818627 [00:27<00:31, 14227.63 examples/s]
Filter: 45%|████▌ | 370000/818627 [00:27<00:31, 14255.02 examples/s]
Filter: 46%|████▌ | 374000/818627 [00:27<00:31, 14188.52 examples/s]
Filter: 46%|████▌ | 374000/818627 [00:27<00:31, 14162.01 examples/s]
Filter: 45%|████▌ | 370000/818627 [00:27<00:32, 13968.99 examples/s]
Filter: 46%|████▌ | 374000/818627 [00:27<00:31, 14157.58 examples/s]
Filter: 45%|████▍ | 368000/818627 [00:27<00:32, 13833.80 examples/s]
Filter: 45%|████▌ | 372000/818627 [00:27<00:32, 13907.72 examples/s]
Filter: 46%|████▌ | 376000/818627 [00:27<00:31, 14166.34 examples/s]
Filter: 45%|████▌ | 372000/818627 [00:27<00:31, 14170.86 examples/s]
Filter: 46%|████▌ | 376000/818627 [00:27<00:31, 14104.98 examples/s]
Filter: 46%|████▌ | 376000/818627 [00:27<00:31, 14098.54 examples/s]
Filter: 45%|████▌ | 372000/818627 [00:27<00:32, 13955.39 examples/s]
Filter: 46%|████▌ | 376000/818627 [00:27<00:31, 13965.92 examples/s]
Filter: 45%|████▌ | 370000/818627 [00:27<00:32, 13704.30 examples/s]
Filter: 46%|████▌ | 374000/818627 [00:27<00:32, 13656.29 examples/s]
Filter: 46%|████▌ | 378000/818627 [00:27<00:31, 14105.94 examples/s]
Filter: 46%|████▌ | 374000/818627 [00:27<00:31, 14205.70 examples/s]
Filter: 46%|████▌ | 374000/818627 [00:27<00:31, 13989.31 examples/s]
Filter: 46%|████▌ | 378000/818627 [00:27<00:31, 14070.19 examples/s]
Filter: 46%|████▌ | 378000/818627 [00:27<00:31, 14049.51 examples/s]
Filter: 46%|████▌ | 378000/818627 [00:27<00:31, 13912.38 examples/s]
Filter: 45%|████▌ | 372000/818627 [00:27<00:32, 13581.23 examples/s]
Filter: 46%|████▌ | 376000/818627 [00:27<00:32, 13705.73 examples/s]
Filter: 46%|████▋ | 380000/818627 [00:27<00:31, 13999.84 examples/s]
Filter: 46%|████▌ | 376000/818627 [00:27<00:31, 14256.74 examples/s]
Filter: 46%|████▋ | 380000/818627 [00:27<00:31, 14116.66 examples/s]
Filter: 46%|████▋ | 380000/818627 [00:27<00:31, 14106.89 examples/s]
Filter: 46%|████▌ | 376000/818627 [00:27<00:31, 14038.16 examples/s]
Filter: 46%|████▋ | 380000/818627 [00:27<00:31, 14061.18 examples/s]
Filter: 46%|████▌ | 374000/818627 [00:27<00:32, 13677.35 examples/s]
Filter: 46%|████▌ | 378000/818627 [00:27<00:32, 13720.23 examples/s]
Filter: 47%|████▋ | 382000/818627 [00:27<00:30, 14131.88 examples/s]
Filter: 46%|████▌ | 378000/818627 [00:27<00:31, 14165.95 examples/s]
Filter: 47%|████▋ | 382000/818627 [00:27<00:30, 14159.51 examples/s]
Filter: 47%|████▋ | 382000/818627 [00:27<00:30, 14153.09 examples/s]
Filter: 46%|████▌ | 378000/818627 [00:27<00:31, 14088.59 examples/s]
Filter: 47%|████▋ | 382000/818627 [00:27<00:30, 14153.12 examples/s]
Filter: 46%|████▌ | 376000/818627 [00:27<00:32, 13770.18 examples/s]
Filter: 46%|████▋ | 380000/818627 [00:27<00:31, 13838.93 examples/s]
Filter: 47%|████▋ | 384000/818627 [00:27<00:30, 14186.42 examples/s]
Filter: 46%|████▋ | 380000/818627 [00:28<00:30, 14217.39 examples/s]
Filter: 47%|████▋ | 384000/818627 [00:27<00:30, 14228.80 examples/s]
Filter: 47%|████▋ | 384000/818627 [00:27<00:30, 14176.17 examples/s]
Filter: 47%|████▋ | 384000/818627 [00:27<00:30, 14092.11 examples/s]
Filter: 46%|████▋ | 380000/818627 [00:27<00:31, 14065.18 examples/s]
Filter: 46%|████▌ | 378000/818627 [00:27<00:32, 13608.70 examples/s]
Filter: 47%|████▋ | 382000/818627 [00:27<00:31, 13688.22 examples/s]
Filter: 47%|████▋ | 386000/818627 [00:27<00:30, 14103.62 examples/s]
Filter: 47%|████▋ | 382000/818627 [00:28<00:31, 13953.63 examples/s]
Filter: 47%|████▋ | 386000/818627 [00:28<00:30, 14118.63 examples/s]
Filter: 47%|████▋ | 386000/818627 [00:28<00:30, 14082.61 examples/s]
Filter: 47%|████▋ | 382000/818627 [00:28<00:31, 13951.03 examples/s]
Filter: 47%|████▋ | 386000/818627 [00:28<00:31, 13949.57 examples/s]
Filter: 46%|████▋ | 380000/818627 [00:28<00:31, 13729.99 examples/s]
Filter: 47%|████▋ | 384000/818627 [00:28<00:31, 13823.73 examples/s]
Filter: 47%|████▋ | 388000/818627 [00:28<00:30, 14174.52 examples/s]
Filter: 47%|████▋ | 384000/818627 [00:28<00:31, 13994.53 examples/s]
Filter: 47%|████▋ | 388000/818627 [00:28<00:30, 14004.94 examples/s]
Filter: 47%|████▋ | 388000/818627 [00:28<00:30, 13973.72 examples/s]
Filter: 47%|████▋ | 388000/818627 [00:28<00:30, 14009.98 examples/s]
Filter: 47%|████▋ | 384000/818627 [00:28<00:31, 13988.97 examples/s]
Filter: 47%|████▋ | 382000/818627 [00:28<00:31, 13682.83 examples/s]
Filter: 47%|████▋ | 386000/818627 [00:28<00:31, 13777.60 examples/s]
Filter: 48%|████▊ | 390000/818627 [00:28<00:30, 13911.39 examples/s]
Filter: 47%|████▋ | 386000/818627 [00:28<00:30, 14120.16 examples/s]
Filter: 48%|████▊ | 390000/818627 [00:28<00:30, 14045.03 examples/s]
Filter: 48%|████▊ | 390000/818627 [00:28<00:30, 13966.91 examples/s]
Filter: 48%|████▊ | 390000/818627 [00:28<00:30, 13924.96 examples/s]
Filter: 47%|████▋ | 386000/818627 [00:28<00:31, 13935.37 examples/s]
Filter: 47%|████▋ | 384000/818627 [00:28<00:31, 13775.07 examples/s]
Filter: 47%|████▋ | 388000/818627 [00:28<00:31, 13677.12 examples/s]
Filter: 48%|████▊ | 392000/818627 [00:28<00:30, 13842.73 examples/s]
Filter: 47%|████▋ | 388000/818627 [00:28<00:30, 14050.65 examples/s]
Filter: 48%|████▊ | 392000/818627 [00:28<00:30, 14073.80 examples/s]
Filter: 48%|████▊ | 392000/818627 [00:28<00:30, 13975.19 examples/s]
Filter: 48%|████▊ | 392000/818627 [00:28<00:30, 13799.80 examples/s]
Filter: 47%|████▋ | 388000/818627 [00:28<00:31, 13755.50 examples/s]
Filter: 47%|████▋ | 386000/818627 [00:28<00:31, 13701.26 examples/s]
Filter: 48%|████▊ | 390000/818627 [00:28<00:31, 13683.99 examples/s]
Filter: 48%|████▊ | 394000/818627 [00:28<00:30, 13920.21 examples/s]
Filter: 48%|████▊ | 390000/818627 [00:28<00:30, 13980.67 examples/s]
Filter: 48%|████▊ | 394000/818627 [00:28<00:30, 13941.09 examples/s]
Filter: 48%|████▊ | 394000/818627 [00:28<00:30, 13937.04 examples/s]
Filter: 48%|████▊ | 394000/818627 [00:28<00:30, 13771.71 examples/s]
Filter: 48%|████▊ | 390000/818627 [00:28<00:31, 13648.23 examples/s]
Filter: 47%|████▋ | 388000/818627 [00:28<00:31, 13710.25 examples/s]
Filter: 48%|████▊ | 392000/818627 [00:28<00:31, 13708.02 examples/s]
Filter: 48%|████▊ | 396000/818627 [00:28<00:30, 13970.89 examples/s]
Filter: 48%|████▊ | 392000/818627 [00:28<00:30, 14048.83 examples/s]
Filter: 48%|████▊ | 396000/818627 [00:28<00:30, 13953.13 examples/s]
Filter: 48%|████▊ | 396000/818627 [00:28<00:30, 13983.31 examples/s]
Filter: 48%|████▊ | 396000/818627 [00:28<00:30, 13904.72 examples/s]
Filter: 48%|████▊ | 392000/818627 [00:28<00:31, 13667.93 examples/s]
Filter: 48%|████▊ | 390000/818627 [00:28<00:31, 13769.27 examples/s]
Filter: 48%|████▊ | 394000/818627 [00:28<00:30, 13767.16 examples/s]
Filter: 49%|████▊ | 398000/818627 [00:28<00:29, 14070.28 examples/s]
Filter: 48%|████▊ | 394000/818627 [00:29<00:30, 13980.80 examples/s]
Filter: 49%|████▊ | 398000/818627 [00:28<00:29, 14028.84 examples/s]
Filter: 49%|████▊ | 398000/818627 [00:28<00:30, 13925.26 examples/s]
Filter: 49%|████▊ | 398000/818627 [00:28<00:29, 14028.19 examples/s]
Filter: 48%|████▊ | 394000/818627 [00:28<00:30, 13795.02 examples/s]
Filter: 48%|████▊ | 392000/818627 [00:28<00:30, 13853.27 examples/s]
Filter: 48%|████▊ | 396000/818627 [00:28<00:30, 13871.62 examples/s]
Filter: 49%|████▉ | 400000/818627 [00:28<00:29, 14151.30 examples/s]
Filter: 48%|████▊ | 396000/818627 [00:29<00:30, 14049.38 examples/s]
Filter: 49%|████▉ | 400000/818627 [00:29<00:29, 14038.13 examples/s]
Filter: 49%|████▉ | 400000/818627 [00:29<00:29, 14028.63 examples/s]
Filter: 49%|████▉ | 400000/818627 [00:29<00:29, 14100.04 examples/s]
Filter: 48%|████▊ | 396000/818627 [00:29<00:30, 13894.42 examples/s]
Filter: 48%|████▊ | 394000/818627 [00:29<00:30, 13761.39 examples/s]
Filter: 49%|████▊ | 398000/818627 [00:29<00:30, 13944.72 examples/s]
Filter: 49%|████▉ | 402000/818627 [00:29<00:29, 14201.61 examples/s]
Filter: 49%|████▊ | 398000/818627 [00:29<00:29, 14120.48 examples/s]
Filter: 49%|████▉ | 402000/818627 [00:29<00:29, 14105.05 examples/s]
Filter: 49%|████▉ | 402000/818627 [00:29<00:29, 13959.65 examples/s]
Filter: 49%|████▉ | 402000/818627 [00:29<00:29, 14093.60 examples/s]
Filter: 49%|████▊ | 398000/818627 [00:29<00:30, 13964.87 examples/s]
Filter: 48%|████▊ | 396000/818627 [00:29<00:30, 13826.81 examples/s]
Filter: 49%|████▉ | 400000/818627 [00:29<00:29, 13981.50 examples/s]
Filter: 49%|████▉ | 404000/818627 [00:29<00:29, 14233.92 examples/s]
Filter: 49%|████▉ | 400000/818627 [00:29<00:29, 14051.79 examples/s]
Filter: 49%|████▉ | 404000/818627 [00:29<00:29, 14021.78 examples/s]
Filter: 49%|████▉ | 404000/818627 [00:29<00:29, 14159.00 examples/s]
Filter: 49%|████▉ | 404000/818627 [00:29<00:29, 14100.51 examples/s]
Filter: 49%|████▉ | 400000/818627 [00:29<00:29, 14019.25 examples/s]
Filter: 49%|████▊ | 398000/818627 [00:29<00:30, 13891.01 examples/s]
Filter: 49%|████▉ | 402000/818627 [00:29<00:29, 14018.68 examples/s]
Filter: 50%|████▉ | 406000/818627 [00:29<00:29, 14161.10 examples/s]
Filter: 49%|████▉ | 402000/818627 [00:29<00:29, 14007.02 examples/s]
Filter: 50%|████▉ | 406000/818627 [00:29<00:29, 14170.49 examples/s]
Filter: 50%|████▉ | 406000/818627 [00:29<00:29, 14204.39 examples/s]
Filter: 50%|████▉ | 406000/818627 [00:29<00:29, 14082.76 examples/s]
Filter: 49%|████▉ | 402000/818627 [00:29<00:29, 14061.71 examples/s]
Filter: 50%|████▉ | 408000/818627 [00:29<00:28, 14225.01 examples/s]
Filter: 49%|████▉ | 400000/818627 [00:29<00:30, 13796.93 examples/s]
Filter: 49%|████▉ | 404000/818627 [00:29<00:29, 13928.87 examples/s]
Filter: 49%|████▉ | 404000/818627 [00:29<00:29, 14067.87 examples/s]
Filter: 50%|████▉ | 408000/818627 [00:29<00:28, 14223.01 examples/s]
Filter: 50%|████▉ | 408000/818627 [00:29<00:28, 14184.00 examples/s]
Filter: 50%|████▉ | 408000/818627 [00:29<00:29, 14129.85 examples/s]
Filter: 49%|████▉ | 404000/818627 [00:29<00:29, 14061.97 examples/s]
Filter: 50%|█████ | 410000/818627 [00:29<00:28, 14265.43 examples/s]
Filter: 50%|████▉ | 406000/818627 [00:29<00:29, 13997.65 examples/s]
Filter: 49%|████▉ | 402000/818627 [00:29<00:30, 13752.33 examples/s]
Filter: 50%|████▉ | 406000/818627 [00:29<00:29, 13893.94 examples/s]
Filter: 50%|█████ | 410000/818627 [00:29<00:28, 14179.15 examples/s]
Filter: 50%|█████ | 410000/818627 [00:29<00:29, 14027.74 examples/s]
Filter: 50%|█████ | 410000/818627 [00:29<00:29, 14001.48 examples/s]
Filter: 50%|████▉ | 406000/818627 [00:29<00:29, 13836.86 examples/s]
Filter: 50%|█████ | 412000/818627 [00:29<00:28, 14162.87 examples/s]
Filter: 49%|████▉ | 404000/818627 [00:29<00:30, 13816.40 examples/s]
Filter: 50%|████▉ | 408000/818627 [00:29<00:29, 13904.51 examples/s]
Filter: 50%|████▉ | 408000/818627 [00:30<00:29, 13997.87 examples/s]
Filter: 50%|█████ | 412000/818627 [00:29<00:28, 14047.30 examples/s]
Filter: 50%|█████ | 412000/818627 [00:29<00:29, 14013.94 examples/s]
Filter: 50%|█████ | 412000/818627 [00:29<00:28, 14031.05 examples/s]
Filter: 50%|████▉ | 408000/818627 [00:29<00:29, 13918.94 examples/s]
Filter: 51%|█████ | 414000/818627 [00:29<00:28, 14094.85 examples/s]
Filter: 50%|█████ | 410000/818627 [00:29<00:29, 13795.04 examples/s]
Filter: 50%|████▉ | 406000/818627 [00:29<00:30, 13718.64 examples/s]
Filter: 50%|█████ | 410000/818627 [00:30<00:29, 14042.95 examples/s]
Filter: 51%|█████ | 414000/818627 [00:30<00:28, 14099.87 examples/s]
Filter: 51%|█████ | 414000/818627 [00:30<00:28, 14096.28 examples/s]
Filter: 51%|█████ | 414000/818627 [00:30<00:28, 14019.60 examples/s]
Filter: 50%|█████ | 410000/818627 [00:30<00:29, 13967.04 examples/s]
Filter: 51%|█████ | 416000/818627 [00:30<00:28, 14193.84 examples/s]
Filter: 50%|█████ | 412000/818627 [00:30<00:29, 13882.54 examples/s]
Filter: 50%|████▉ | 408000/818627 [00:30<00:29, 13800.47 examples/s]
Filter: 50%|█████ | 412000/818627 [00:30<00:28, 14133.38 examples/s]
Filter: 51%|█████ | 416000/818627 [00:30<00:28, 14116.82 examples/s]
Filter: 51%|█████ | 416000/818627 [00:30<00:28, 14136.60 examples/s]
Filter: 51%|█████ | 416000/818627 [00:30<00:28, 14115.87 examples/s]
Filter: 50%|█████ | 412000/818627 [00:30<00:29, 13936.22 examples/s]
Filter: 51%|█████ | 418000/818627 [00:30<00:28, 14138.61 examples/s]
Filter: 50%|█████ | 410000/818627 [00:30<00:29, 13840.07 examples/s]
Filter: 51%|█████ | 414000/818627 [00:30<00:29, 13765.10 examples/s]
Filter: 51%|█████ | 414000/818627 [00:30<00:28, 14200.35 examples/s]
Filter: 51%|█████ | 418000/818627 [00:30<00:28, 14183.43 examples/s]
Filter: 51%|█████ | 418000/818627 [00:30<00:28, 14157.81 examples/s]
Filter: 51%|█████ | 418000/818627 [00:30<00:28, 14193.45 examples/s]
Filter: 51%|█████ | 414000/818627 [00:30<00:28, 13955.57 examples/s]
Filter: 51%|█████▏ | 420000/818627 [00:30<00:28, 13945.37 examples/s]
Filter: 50%|█████ | 412000/818627 [00:30<00:29, 13780.72 examples/s]
Filter: 51%|█████ | 416000/818627 [00:30<00:29, 13746.48 examples/s]
Filter: 51%|█████ | 416000/818627 [00:30<00:28, 14238.17 examples/s]
Filter: 51%|█████▏ | 420000/818627 [00:30<00:28, 14208.32 examples/s]
Filter: 51%|█████▏ | 420000/818627 [00:30<00:28, 14218.85 examples/s]
Filter: 51%|█████▏ | 420000/818627 [00:30<00:27, 14250.66 examples/s]
Filter: 51%|█████ | 416000/818627 [00:30<00:28, 14001.34 examples/s]
Filter: 52%|█████▏ | 422000/818627 [00:30<00:28, 13846.54 examples/s]
Filter: 51%|█████ | 418000/818627 [00:30<00:28, 13857.62 examples/s]
Filter: 51%|█████ | 414000/818627 [00:30<00:29, 13691.81 examples/s]
Filter: 51%|█████ | 418000/818627 [00:30<00:28, 14147.50 examples/s]
Filter: 52%|█████▏ | 422000/818627 [00:30<00:27, 14219.15 examples/s]
Filter: 52%|█████▏ | 422000/818627 [00:30<00:27, 14223.68 examples/s]
Filter: 52%|█████▏ | 422000/818627 [00:30<00:27, 14294.22 examples/s]
Filter: 51%|█████ | 418000/818627 [00:30<00:28, 14049.41 examples/s]
Filter: 52%|█████▏ | 424000/818627 [00:30<00:28, 14009.89 examples/s]
Filter: 51%|█████▏ | 420000/818627 [00:30<00:28, 13943.31 examples/s]
Filter: 51%|█████ | 416000/818627 [00:30<00:29, 13713.81 examples/s]
Filter: 51%|█████▏ | 420000/818627 [00:30<00:28, 14191.21 examples/s]
Filter: 52%|█████▏ | 424000/818627 [00:30<00:27, 14228.75 examples/s]
Filter: 52%|█████▏ | 424000/818627 [00:30<00:27, 14278.66 examples/s]
Filter: 52%|█████▏ | 424000/818627 [00:30<00:27, 14221.40 examples/s]
Filter: 51%|█████▏ | 420000/818627 [00:30<00:28, 14085.07 examples/s]
Filter: 52%|█████▏ | 426000/818627 [00:30<00:27, 14141.21 examples/s]
Filter: 52%|█████▏ | 422000/818627 [00:30<00:28, 14010.74 examples/s]
Filter: 51%|█████ | 418000/818627 [00:30<00:29, 13813.32 examples/s]
Filter: 52%|█████▏ | 422000/818627 [00:31<00:28, 14112.05 examples/s]
Filter: 52%|█████▏ | 426000/818627 [00:30<00:27, 14230.02 examples/s]
Filter: 52%|█████▏ | 426000/818627 [00:30<00:27, 14268.54 examples/s]
Filter: 52%|█████▏ | 426000/818627 [00:30<00:27, 14232.25 examples/s]
Filter: 52%|█████▏ | 422000/818627 [00:30<00:28, 14107.21 examples/s]
Filter: 52%|█████▏ | 428000/818627 [00:30<00:27, 14191.54 examples/s]
Filter: 52%|█████▏ | 424000/818627 [00:30<00:28, 13897.32 examples/s]
Filter: 51%|█████▏ | 420000/818627 [00:30<00:28, 13842.09 examples/s]
Filter: 52%|█████▏ | 424000/818627 [00:31<00:28, 14045.74 examples/s]
Filter: 52%|█████▏ | 428000/818627 [00:30<00:27, 14213.12 examples/s]
Filter: 52%|█████▏ | 428000/818627 [00:30<00:27, 14188.82 examples/s]
Filter: 52%|█████▏ | 428000/818627 [00:30<00:27, 14179.39 examples/s]
Filter: 52%|█████▏ | 424000/818627 [00:31<00:27, 14129.33 examples/s]
Filter: 53%|█████▎ | 430000/818627 [00:31<00:27, 14240.09 examples/s]
Filter: 52%|█████▏ | 426000/818627 [00:31<00:28, 13935.38 examples/s]
Filter: 52%|█████▏ | 422000/818627 [00:31<00:28, 13893.87 examples/s]
Filter: 53%|█████▎ | 430000/818627 [00:31<00:27, 14207.91 examples/s]
Filter: 53%|█████▎ | 430000/818627 [00:31<00:27, 14206.79 examples/s]
Filter: 52%|█████▏ | 426000/818627 [00:31<00:28, 14008.69 examples/s]
Filter: 53%|█████▎ | 430000/818627 [00:31<00:27, 14095.24 examples/s]
Filter: 52%|█████▏ | 426000/818627 [00:31<00:27, 14076.52 examples/s]
Filter: 53%|█████▎ | 432000/818627 [00:31<00:27, 14290.64 examples/s]
Filter: 52%|█████▏ | 428000/818627 [00:31<00:28, 13842.36 examples/s]
Filter: 52%|█████▏ | 424000/818627 [00:31<00:28, 13802.49 examples/s]
Filter: 53%|█████▎ | 432000/818627 [00:31<00:27, 14214.44 examples/s]
Filter: 53%|█████▎ | 432000/818627 [00:31<00:27, 14217.17 examples/s]
Filter: 52%|█████▏ | 428000/818627 [00:31<00:27, 14096.66 examples/s]
Filter: 53%|█████▎ | 432000/818627 [00:31<00:27, 14143.18 examples/s]
Filter: 52%|█████▏ | 428000/818627 [00:31<00:28, 13928.25 examples/s]
Filter: 53%|█████▎ | 434000/818627 [00:31<00:28, 13444.91 examples/s]
Filter: 53%|█████▎ | 430000/818627 [00:31<00:28, 13799.49 examples/s]
Filter: 52%|█████▏ | 426000/818627 [00:31<00:28, 13853.07 examples/s]
Filter: 53%|█████▎ | 434000/818627 [00:31<00:27, 14200.53 examples/s]
Filter: 53%|█████▎ | 430000/818627 [00:31<00:27, 14163.98 examples/s]
Filter: 53%|█████▎ | 434000/818627 [00:31<00:27, 14200.50 examples/s]
Filter: 53%|█████▎ | 434000/818627 [00:31<00:27, 14048.64 examples/s]
Filter: 53%|█████▎ | 430000/818627 [00:31<00:27, 13901.00 examples/s]
Filter: 53%|█████▎ | 432000/818627 [00:31<00:28, 13778.71 examples/s]
Filter: 52%|█████▏ | 428000/818627 [00:31<00:28, 13891.42 examples/s]
Filter: 53%|█████▎ | 436000/818627 [00:31<00:29, 12988.10 examples/s]
Filter: 53%|█████▎ | 436000/818627 [00:31<00:26, 14210.96 examples/s]
Filter: 53%|█████▎ | 436000/818627 [00:31<00:27, 14072.67 examples/s]
Filter: 53%|█████▎ | 436000/818627 [00:31<00:27, 14107.44 examples/s]
Filter: 53%|█████▎ | 432000/818627 [00:31<00:27, 13965.81 examples/s]
Filter: 53%|█████▎ | 432000/818627 [00:31<00:27, 13974.04 examples/s]
Filter: 53%|█████▎ | 430000/818627 [00:31<00:27, 13918.27 examples/s]
Filter: 53%|█████▎ | 434000/818627 [00:31<00:27, 13758.38 examples/s]
Filter: 54%|█████▎ | 438000/818627 [00:31<00:26, 14205.94 examples/s]
Filter: 54%|█████▎ | 438000/818627 [00:31<00:29, 12864.32 examples/s]
Filter: 54%|█████▎ | 438000/818627 [00:31<00:26, 14111.11 examples/s]
Filter: 54%|█████▎ | 438000/818627 [00:31<00:26, 14147.95 examples/s]
Filter: 53%|█████▎ | 434000/818627 [00:31<00:27, 14038.42 examples/s]
Filter: 53%|█████▎ | 434000/818627 [00:31<00:27, 14032.29 examples/s]
Filter: 53%|█████▎ | 432000/818627 [00:31<00:27, 13947.58 examples/s]
Filter: 53%|█████▎ | 436000/818627 [00:31<00:27, 13739.73 examples/s]
Filter: 54%|█████▎ | 440000/818627 [00:31<00:26, 14187.25 examples/s]
Filter: 54%|█████▎ | 440000/818627 [00:31<00:26, 14142.64 examples/s]
Filter: 54%|█████▎ | 440000/818627 [00:31<00:26, 14213.96 examples/s]
Filter: 53%|█████▎ | 436000/818627 [00:32<00:27, 14012.23 examples/s]
Filter: 54%|█████▎ | 440000/818627 [00:31<00:29, 12777.92 examples/s]
Filter: 53%|█████▎ | 436000/818627 [00:31<00:27, 14069.22 examples/s]
Filter: 53%|█████▎ | 434000/818627 [00:31<00:27, 13947.42 examples/s]
Filter: 54%|█████▎ | 438000/818627 [00:31<00:27, 13840.90 examples/s]
Filter: 54%|█████▍ | 442000/818627 [00:31<00:26, 14189.08 examples/s]
Filter: 54%|█████▍ | 442000/818627 [00:31<00:26, 14108.72 examples/s]
Filter: 54%|█████▍ | 442000/818627 [00:31<00:26, 14263.10 examples/s]
Filter: 54%|█████▎ | 438000/818627 [00:32<00:27, 14083.57 examples/s]
Filter: 54%|█████▍ | 442000/818627 [00:31<00:28, 13032.74 examples/s]
Filter: 54%|█████▎ | 438000/818627 [00:32<00:27, 14092.67 examples/s]
Filter: 53%|█████▎ | 436000/818627 [00:32<00:27, 13957.79 examples/s]
Filter: 54%|█████▎ | 440000/818627 [00:32<00:27, 13787.06 examples/s]
Filter: 54%|█████▍ | 444000/818627 [00:32<00:26, 14192.46 examples/s]
Filter: 54%|█████▍ | 444000/818627 [00:32<00:26, 14244.40 examples/s]
Filter: 54%|█████▍ | 444000/818627 [00:32<00:26, 14015.11 examples/s]
Filter: 54%|█████▎ | 440000/818627 [00:32<00:26, 14163.86 examples/s]
Filter: 54%|█████▍ | 444000/818627 [00:32<00:27, 13470.70 examples/s]
Filter: 54%|█████▎ | 440000/818627 [00:32<00:26, 14105.06 examples/s]
Filter: 54%|█████▎ | 438000/818627 [00:32<00:27, 13970.27 examples/s]
Filter: 54%|█████▍ | 442000/818627 [00:32<00:27, 13768.62 examples/s]
Filter: 54%|█████▍ | 446000/818627 [00:32<00:26, 14204.91 examples/s]
Filter: 54%|█████▍ | 446000/818627 [00:32<00:26, 14244.65 examples/s]
Filter: 54%|█████▍ | 446000/818627 [00:32<00:26, 14120.07 examples/s]
Filter: 54%|█████▍ | 442000/818627 [00:32<00:26, 14204.43 examples/s]
Filter: 54%|█████▍ | 446000/818627 [00:32<00:26, 13811.33 examples/s]
Filter: 54%|█████▍ | 442000/818627 [00:32<00:26, 14010.48 examples/s]
Filter: 54%|█████▎ | 440000/818627 [00:32<00:27, 13979.48 examples/s]
Filter: 54%|█████▍ | 444000/818627 [00:32<00:27, 13869.49 examples/s]
Filter: 55%|█████▍ | 448000/818627 [00:32<00:26, 14179.23 examples/s]
Filter: 55%|█████▍ | 448000/818627 [00:32<00:26, 14200.18 examples/s]
Filter: 54%|█████▍ | 444000/818627 [00:32<00:26, 14213.76 examples/s]
Filter: 55%|█████▍ | 448000/818627 [00:32<00:26, 14062.52 examples/s]
Filter: 55%|█████▍ | 448000/818627 [00:32<00:26, 14062.71 examples/s]
Filter: 54%|█████▍ | 444000/818627 [00:32<00:26, 14037.08 examples/s]
Filter: 54%|█████▍ | 442000/818627 [00:32<00:27, 13861.09 examples/s]
Filter: 55%|█████▍ | 450000/818627 [00:32<00:26, 14064.25 examples/s]
Filter: 55%|█████▍ | 450000/818627 [00:32<00:26, 13969.36 examples/s]
Filter: 55%|█████▍ | 450000/818627 [00:32<00:26, 14001.68 examples/s]
Filter: 54%|█████▍ | 446000/818627 [00:32<00:27, 13672.15 examples/s]
Filter: 54%|█████▍ | 446000/818627 [00:32<00:26, 13997.36 examples/s]
Filter: 55%|█████▍ | 450000/818627 [00:32<00:26, 14026.93 examples/s]
Filter: 54%|█████▍ | 446000/818627 [00:32<00:26, 13974.22 examples/s]
Filter: 54%|█████▍ | 444000/818627 [00:32<00:27, 13801.01 examples/s]
Filter: 55%|█████▌ | 452000/818627 [00:32<00:26, 14074.79 examples/s]
Filter: 55%|█████▌ | 452000/818627 [00:32<00:26, 14048.82 examples/s]
Filter: 55%|█████▌ | 452000/818627 [00:32<00:26, 14069.60 examples/s]
Filter: 55%|█████▌ | 452000/818627 [00:32<00:25, 14214.07 examples/s]
Filter: 55%|█████▍ | 448000/818627 [00:32<00:26, 14055.60 examples/s]
Filter: 55%|█████▍ | 448000/818627 [00:32<00:26, 13785.22 examples/s]
Filter: 55%|█████▍ | 448000/818627 [00:32<00:26, 14046.77 examples/s]
Filter: 55%|█████▌ | 454000/818627 [00:32<00:25, 14278.87 examples/s]
Filter: 55%|█████▌ | 454000/818627 [00:32<00:25, 14147.46 examples/s]
Filter: 55%|█████▌ | 454000/818627 [00:32<00:25, 14053.38 examples/s]
Filter: 54%|█████▍ | 446000/818627 [00:32<00:27, 13754.34 examples/s]
Filter: 55%|█████▍ | 450000/818627 [00:33<00:26, 14127.27 examples/s]
Filter: 55%|█████▌ | 454000/818627 [00:32<00:25, 14037.45 examples/s]
Filter: 55%|█████▍ | 450000/818627 [00:32<00:26, 13770.62 examples/s]
Filter: 55%|█████▍ | 450000/818627 [00:32<00:26, 14081.15 examples/s]
Filter: 56%|█████▌ | 456000/818627 [00:32<00:25, 14139.04 examples/s]
Filter: 56%|█████▌ | 456000/818627 [00:32<00:25, 14000.03 examples/s]
Filter: 56%|█████▌ | 456000/818627 [00:32<00:25, 14061.76 examples/s]
Filter: 56%|█████▌ | 456000/818627 [00:32<00:25, 14048.01 examples/s]
Filter: 55%|█████▌ | 452000/818627 [00:33<00:26, 14023.92 examples/s]
Filter: 55%|█████▍ | 448000/818627 [00:32<00:27, 13721.37 examples/s]
Filter: 55%|█████▌ | 452000/818627 [00:32<00:26, 13851.87 examples/s]
Filter: 55%|█████▌ | 452000/818627 [00:33<00:26, 14086.55 examples/s]
Filter: 56%|█████▌ | 458000/818627 [00:33<00:25, 14071.54 examples/s]
Filter: 56%|█████▌ | 458000/818627 [00:33<00:25, 14058.35 examples/s]
Filter: 56%|█████▌ | 458000/818627 [00:33<00:25, 14011.54 examples/s]
Filter: 56%|█████▌ | 458000/818627 [00:33<00:25, 13979.31 examples/s]
Filter: 55%|█████▌ | 454000/818627 [00:33<00:26, 13990.38 examples/s]
Filter: 55%|█████▍ | 450000/818627 [00:33<00:27, 13651.12 examples/s]
Filter: 55%|█████▌ | 454000/818627 [00:33<00:26, 13768.88 examples/s]
Filter: 55%|█████▌ | 454000/818627 [00:33<00:25, 14104.76 examples/s]
Filter: 56%|█████▌ | 460000/818627 [00:33<00:25, 14095.74 examples/s]
Filter: 56%|█████▌ | 460000/818627 [00:33<00:25, 14175.47 examples/s]
Filter: 56%|█████▌ | 460000/818627 [00:33<00:25, 14090.89 examples/s]
Filter: 56%|█████▌ | 460000/818627 [00:33<00:25, 14082.11 examples/s]
Filter: 56%|█████▌ | 456000/818627 [00:33<00:25, 14033.91 examples/s]
Filter: 55%|█████▌ | 452000/818627 [00:33<00:26, 13721.75 examples/s]
Filter: 56%|█████▌ | 456000/818627 [00:33<00:26, 13829.08 examples/s]
Filter: 56%|█████▌ | 456000/818627 [00:33<00:25, 13985.96 examples/s]
Filter: 56%|█████▋ | 462000/818627 [00:33<00:25, 14138.99 examples/s]
Filter: 56%|█████▋ | 462000/818627 [00:33<00:25, 14168.05 examples/s]
Filter: 56%|█████▋ | 462000/818627 [00:33<00:25, 14171.99 examples/s]
Filter: 56%|█████▋ | 462000/818627 [00:33<00:25, 14157.57 examples/s]
Filter: 56%|█████▌ | 458000/818627 [00:33<00:25, 13992.33 examples/s]
Filter: 55%|█████▌ | 454000/818627 [00:33<00:26, 13797.82 examples/s]
Filter: 56%|█████▌ | 458000/818627 [00:33<00:26, 13811.96 examples/s]
Filter: 56%|█████▌ | 458000/818627 [00:33<00:25, 14009.95 examples/s]
Filter: 57%|█████▋ | 464000/818627 [00:33<00:25, 14182.06 examples/s]
Filter: 57%|█████▋ | 464000/818627 [00:33<00:25, 14093.93 examples/s]
Filter: 57%|█████▋ | 464000/818627 [00:33<00:25, 14136.32 examples/s]
Filter: 57%|█████▋ | 464000/818627 [00:33<00:25, 14063.18 examples/s]
Filter: 56%|█████▌ | 460000/818627 [00:33<00:25, 13949.34 examples/s]
Filter: 56%|█████▌ | 456000/818627 [00:33<00:26, 13728.72 examples/s]
Filter: 56%|█████▌ | 460000/818627 [00:33<00:25, 13798.41 examples/s]
Filter: 56%|█████▌ | 460000/818627 [00:33<00:25, 14021.68 examples/s]
Filter: 57%|█████▋ | 466000/818627 [00:33<00:24, 14231.27 examples/s]
Filter: 57%|█████▋ | 466000/818627 [00:33<00:24, 14196.35 examples/s]
Filter: 57%|█████▋ | 466000/818627 [00:33<00:24, 14153.14 examples/s]
Filter: 57%|█████▋ | 466000/818627 [00:33<00:24, 14141.33 examples/s]
Filter: 56%|█████▋ | 462000/818627 [00:33<00:25, 14002.61 examples/s]
Filter: 56%|█████▋ | 462000/818627 [00:33<00:25, 13766.34 examples/s]
Filter: 56%|█████▌ | 458000/818627 [00:33<00:26, 13673.53 examples/s]
Filter: 56%|█████▋ | 462000/818627 [00:33<00:25, 14010.53 examples/s]
Filter: 57%|█████▋ | 468000/818627 [00:33<00:24, 14213.17 examples/s]
Filter: 57%|█████▋ | 468000/818627 [00:33<00:24, 14179.20 examples/s]
Filter: 57%|█████▋ | 468000/818627 [00:33<00:24, 14142.99 examples/s]
Filter: 57%|█████▋ | 468000/818627 [00:33<00:24, 14182.60 examples/s]
Filter: 57%|█████▋ | 464000/818627 [00:34<00:25, 13926.91 examples/s]
Filter: 57%|█████▋ | 464000/818627 [00:33<00:25, 13833.01 examples/s]
Filter: 56%|█████▌ | 460000/818627 [00:33<00:26, 13749.49 examples/s]
Filter: 57%|█████▋ | 464000/818627 [00:33<00:25, 13985.49 examples/s]
Filter: 57%|█████▋ | 470000/818627 [00:33<00:24, 14204.66 examples/s]
Filter: 57%|█████▋ | 470000/818627 [00:33<00:24, 14173.57 examples/s]
Filter: 57%|█████▋ | 470000/818627 [00:33<00:24, 14130.82 examples/s]
Filter: 57%|█████▋ | 470000/818627 [00:33<00:24, 14013.00 examples/s]
Filter: 57%|█████▋ | 466000/818627 [00:34<00:25, 13975.16 examples/s]
Filter: 56%|█████▋ | 462000/818627 [00:33<00:25, 13782.93 examples/s]
Filter: 57%|█████▋ | 466000/818627 [00:34<00:26, 13435.74 examples/s]
Filter: 57%|█████▋ | 466000/818627 [00:34<00:25, 13996.40 examples/s]
Filter: 58%|█████▊ | 472000/818627 [00:34<00:24, 14307.52 examples/s]
Filter: 58%|█████▊ | 472000/818627 [00:34<00:24, 14065.86 examples/s]
Filter: 58%|█████▊ | 472000/818627 [00:34<00:24, 14072.55 examples/s]
Filter: 58%|█████▊ | 472000/818627 [00:34<00:24, 14089.32 examples/s]
Filter: 57%|█████▋ | 468000/818627 [00:34<00:25, 14023.61 examples/s]
Filter: 57%|█████▋ | 464000/818627 [00:34<00:25, 13808.81 examples/s]
Filter: 57%|█████▋ | 468000/818627 [00:34<00:25, 13616.76 examples/s]
Filter: 57%|█████▋ | 468000/818627 [00:34<00:25, 13975.20 examples/s]
Filter: 58%|█████▊ | 474000/818627 [00:34<00:24, 14258.57 examples/s]
Filter: 58%|█████▊ | 474000/818627 [00:34<00:24, 14116.89 examples/s]
Filter: 58%|█████▊ | 474000/818627 [00:34<00:24, 14149.49 examples/s]
Filter: 58%|█████▊ | 474000/818627 [00:34<00:24, 14116.48 examples/s]
Filter: 57%|█████▋ | 470000/818627 [00:34<00:24, 14078.61 examples/s]
Filter: 57%|█████▋ | 466000/818627 [00:34<00:25, 13842.42 examples/s]
Filter: 57%|█████▋ | 470000/818627 [00:34<00:25, 13780.00 examples/s]
Filter: 57%|█████▋ | 470000/818627 [00:34<00:24, 13978.85 examples/s]
Filter: 58%|█████▊ | 476000/818627 [00:34<00:24, 14203.05 examples/s]
Filter: 58%|█████▊ | 476000/818627 [00:34<00:24, 14162.71 examples/s]
Filter: 58%|█████▊ | 476000/818627 [00:34<00:24, 14158.89 examples/s]
Filter: 58%|█████▊ | 476000/818627 [00:34<00:24, 14165.59 examples/s]
Filter: 58%|█████▊ | 472000/818627 [00:34<00:24, 13882.30 examples/s]
Filter: 57%|█████▋ | 468000/818627 [00:34<00:25, 13860.20 examples/s]
Filter: 58%|█████▊ | 472000/818627 [00:34<00:25, 13772.08 examples/s]
Filter: 58%|█████▊ | 472000/818627 [00:34<00:24, 13881.37 examples/s]
Filter: 58%|█████▊ | 478000/818627 [00:34<00:24, 14144.30 examples/s]
Filter: 58%|█████▊ | 478000/818627 [00:34<00:24, 14017.87 examples/s]
Filter: 58%|█████▊ | 478000/818627 [00:34<00:24, 13960.07 examples/s]
Filter: 58%|█████▊ | 478000/818627 [00:34<00:24, 13939.00 examples/s]
Filter: 58%|█████▊ | 474000/818627 [00:34<00:24, 13942.57 examples/s]
Filter: 57%|█████▋ | 470000/818627 [00:34<00:25, 13893.27 examples/s]
Filter: 58%|█████▊ | 474000/818627 [00:34<00:25, 13754.75 examples/s]
Filter: 58%|█████▊ | 474000/818627 [00:34<00:24, 13924.80 examples/s]
Filter: 59%|█████▊ | 480000/818627 [00:34<00:23, 14157.36 examples/s]
Filter: 59%|█████▊ | 480000/818627 [00:34<00:24, 14053.40 examples/s]
Filter: 59%|█████▊ | 480000/818627 [00:34<00:24, 14030.56 examples/s]
Filter: 59%|█████▊ | 480000/818627 [00:34<00:24, 13917.20 examples/s]
Filter: 58%|█████▊ | 476000/818627 [00:34<00:24, 14001.15 examples/s]
Filter: 58%|█████▊ | 472000/818627 [00:34<00:25, 13783.85 examples/s]
Filter: 58%|█████▊ | 476000/818627 [00:34<00:24, 13848.17 examples/s]
Filter: 58%|█████▊ | 476000/818627 [00:34<00:24, 13914.87 examples/s]
Filter: 59%|█████▉ | 482000/818627 [00:34<00:23, 14261.73 examples/s]
Filter: 59%|█████▉ | 482000/818627 [00:34<00:23, 14090.04 examples/s]
Filter: 59%|█████▉ | 482000/818627 [00:34<00:23, 14078.15 examples/s]
Filter: 59%|█████▉ | 482000/818627 [00:34<00:24, 13999.79 examples/s]
Filter: 58%|█████▊ | 478000/818627 [00:35<00:24, 13947.13 examples/s]
Filter: 58%|█████▊ | 474000/818627 [00:34<00:25, 13777.92 examples/s]
Filter: 58%|█████▊ | 478000/818627 [00:34<00:24, 13901.27 examples/s]
Filter: 58%|█████▊ | 478000/818627 [00:34<00:24, 13956.50 examples/s]
Filter: 59%|█████▉ | 484000/818627 [00:34<00:23, 14234.38 examples/s]
Filter: 59%|█████▉ | 484000/818627 [00:34<00:23, 14084.69 examples/s]
Filter: 59%|█████▉ | 484000/818627 [00:34<00:23, 14111.61 examples/s]
Filter: 59%|█████▉ | 484000/818627 [00:34<00:23, 14059.27 examples/s]
Filter: 59%|█████▊ | 480000/818627 [00:35<00:24, 13933.71 examples/s]
Filter: 58%|█████▊ | 476000/818627 [00:35<00:24, 13799.15 examples/s]
Filter: 59%|█████▊ | 480000/818627 [00:35<00:24, 13847.47 examples/s]
Filter: 59%|█████▊ | 480000/818627 [00:35<00:24, 13957.86 examples/s]
Filter: 59%|█████▉ | 486000/818627 [00:35<00:23, 14313.35 examples/s]
Filter: 59%|█████▉ | 486000/818627 [00:35<00:23, 14085.52 examples/s]
Filter: 59%|█████▉ | 486000/818627 [00:35<00:23, 14128.55 examples/s]
Filter: 59%|█████▉ | 486000/818627 [00:35<00:23, 14073.53 examples/s]
Filter: 59%|█████▉ | 482000/818627 [00:35<00:24, 13907.23 examples/s]
Filter: 58%|█████▊ | 478000/818627 [00:35<00:24, 13835.14 examples/s]
Filter: 59%|█████▉ | 482000/818627 [00:35<00:24, 13753.29 examples/s]
Filter: 59%|█████▉ | 482000/818627 [00:35<00:24, 13942.74 examples/s]
Filter: 60%|█████▉ | 488000/818627 [00:35<00:22, 14385.89 examples/s]
Filter: 60%|█████▉ | 488000/818627 [00:35<00:23, 14000.35 examples/s]
Filter: 60%|█████▉ | 488000/818627 [00:35<00:23, 14081.78 examples/s]
Filter: 60%|█████▉ | 488000/818627 [00:35<00:23, 14013.23 examples/s]
Filter: 59%|█████▉ | 484000/818627 [00:35<00:23, 13967.52 examples/s]
Filter: 59%|█████▊ | 480000/818627 [00:35<00:24, 13864.94 examples/s]
Filter: 59%|█████▉ | 484000/818627 [00:35<00:24, 13747.94 examples/s]
Filter: 59%|█████▉ | 484000/818627 [00:35<00:24, 13847.82 examples/s]
Filter: 60%|█████▉ | 490000/818627 [00:35<00:22, 14356.87 examples/s]
Filter: 60%|█████▉ | 490000/818627 [00:35<00:23, 14054.33 examples/s]
Filter: 60%|█████▉ | 490000/818627 [00:35<00:23, 13976.44 examples/s]
Filter: 60%|█████▉ | 490000/818627 [00:35<00:23, 14047.24 examples/s]
Filter: 59%|█████▉ | 486000/818627 [00:35<00:24, 13716.68 examples/s]
Filter: 59%|█████▉ | 482000/818627 [00:35<00:24, 13860.17 examples/s]
Filter: 59%|█████▉ | 486000/818627 [00:35<00:24, 13693.29 examples/s]
Filter: 59%|█████▉ | 486000/818627 [00:35<00:24, 13848.05 examples/s]
Filter: 60%|██████ | 492000/818627 [00:35<00:22, 14258.21 examples/s]
Filter: 60%|██████ | 492000/818627 [00:35<00:23, 14067.42 examples/s]
Filter: 60%|██████ | 492000/818627 [00:35<00:23, 13946.07 examples/s]
Filter: 60%|██████ | 492000/818627 [00:35<00:23, 13974.98 examples/s]
Filter: 60%|█████▉ | 488000/818627 [00:35<00:24, 13754.07 examples/s]
Filter: 59%|█████▉ | 484000/818627 [00:35<00:24, 13744.81 examples/s]
Filter: 60%|█████▉ | 488000/818627 [00:35<00:24, 13774.50 examples/s]
Filter: 60%|█████▉ | 488000/818627 [00:35<00:24, 13756.34 examples/s]
Filter: 60%|██████ | 494000/818627 [00:35<00:22, 14333.31 examples/s]
Filter: 60%|██████ | 494000/818627 [00:35<00:23, 14107.54 examples/s]
Filter: 60%|██████ | 494000/818627 [00:35<00:23, 13988.35 examples/s]
Filter: 60%|██████ | 494000/818627 [00:35<00:23, 13763.27 examples/s]
Filter: 60%|█████▉ | 490000/818627 [00:35<00:23, 13738.57 examples/s]
Filter: 59%|█████▉ | 486000/818627 [00:35<00:24, 13804.66 examples/s]
Filter: 60%|█████▉ | 490000/818627 [00:35<00:23, 13745.35 examples/s]
Filter: 60%|█████▉ | 490000/818627 [00:35<00:23, 13854.69 examples/s]
Filter: 61%|██████ | 496000/818627 [00:35<00:22, 14284.50 examples/s]
Filter: 61%|██████ | 496000/818627 [00:35<00:22, 14127.71 examples/s]
Filter: 61%|██████ | 496000/818627 [00:35<00:22, 14046.51 examples/s]
Filter: 61%|██████ | 496000/818627 [00:35<00:23, 13760.57 examples/s]
Filter: 60%|██████ | 492000/818627 [00:36<00:23, 13897.82 examples/s]
Filter: 60%|█████▉ | 488000/818627 [00:35<00:23, 13853.91 examples/s]
Filter: 60%|██████ | 492000/818627 [00:35<00:23, 13873.99 examples/s]
Filter: 60%|██████ | 492000/818627 [00:35<00:23, 13911.37 examples/s]
Filter: 61%|██████ | 498000/818627 [00:35<00:22, 14155.98 examples/s]
Filter: 61%|██████ | 498000/818627 [00:35<00:22, 14165.64 examples/s]
Filter: 61%|██████ | 498000/818627 [00:35<00:22, 14109.51 examples/s]
Filter: 61%|██████ | 498000/818627 [00:35<00:23, 13838.05 examples/s]
Filter: 60%|██████ | 494000/818627 [00:36<00:23, 13881.50 examples/s]
Filter: 60%|█████▉ | 490000/818627 [00:36<00:23, 13864.03 examples/s]
Filter: 60%|██████ | 494000/818627 [00:36<00:23, 13900.06 examples/s]
Filter: 60%|██████ | 494000/818627 [00:36<00:23, 13810.00 examples/s]
Filter: 61%|██████ | 500000/818627 [00:36<00:22, 13967.06 examples/s]
Filter: 61%|██████ | 500000/818627 [00:36<00:22, 13942.88 examples/s]
Filter: 61%|██████ | 500000/818627 [00:36<00:23, 13844.49 examples/s]
Filter: 61%|██████ | 500000/818627 [00:36<00:23, 13729.33 examples/s]
Filter: 61%|██████ | 496000/818627 [00:36<00:23, 14000.75 examples/s]
Filter: 60%|██████ | 492000/818627 [00:36<00:23, 13885.29 examples/s]
Filter: 61%|██████ | 496000/818627 [00:36<00:23, 13793.89 examples/s]
Filter: 61%|██████ | 496000/818627 [00:36<00:23, 13818.65 examples/s]
Filter: 61%|██████▏ | 502000/818627 [00:36<00:22, 13974.52 examples/s]
Filter: 61%|██████▏ | 502000/818627 [00:36<00:22, 13913.32 examples/s]
Filter: 61%|██████▏ | 502000/818627 [00:36<00:23, 13488.19 examples/s]
Filter: 61%|██████▏ | 502000/818627 [00:36<00:23, 13702.22 examples/s]
Filter: 61%|██████ | 498000/818627 [00:36<00:22, 13952.30 examples/s]
Filter: 60%|██████ | 494000/818627 [00:36<00:23, 13704.60 examples/s]
Filter: 61%|██████ | 498000/818627 [00:36<00:23, 13726.43 examples/s]
Filter: 61%|██████ | 498000/818627 [00:36<00:23, 13851.67 examples/s]
Filter: 62%|██████▏ | 504000/818627 [00:36<00:22, 14034.40 examples/s]
Filter: 62%|██████▏ | 504000/818627 [00:36<00:22, 13968.90 examples/s]
Filter: 62%|██████▏ | 504000/818627 [00:36<00:23, 13556.51 examples/s]
Filter: 62%|██████▏ | 504000/818627 [00:36<00:22, 13736.76 examples/s]
Filter: 61%|██████ | 500000/818627 [00:36<00:22, 14059.38 examples/s]
Filter: 61%|██████ | 496000/818627 [00:36<00:23, 13755.71 examples/s]
Filter: 61%|██████ | 500000/818627 [00:36<00:23, 13789.70 examples/s]
Filter: 61%|██████ | 500000/818627 [00:36<00:23, 13748.69 examples/s]
Filter: 62%|██████▏ | 506000/818627 [00:36<00:22, 14056.89 examples/s]
Filter: 62%|██████▏ | 506000/818627 [00:36<00:22, 14036.11 examples/s]
Filter: 62%|██████▏ | 506000/818627 [00:36<00:22, 13617.27 examples/s]
Filter: 62%|██████▏ | 506000/818627 [00:36<00:22, 13762.17 examples/s]
Filter: 61%|██████▏ | 502000/818627 [00:36<00:22, 14140.47 examples/s]
Filter: 61%|██████ | 498000/818627 [00:36<00:23, 13818.34 examples/s]
Filter: 61%|██████▏ | 502000/818627 [00:36<00:22, 13890.73 examples/s]
Filter: 61%|██████▏ | 502000/818627 [00:36<00:22, 13803.78 examples/s]
Filter: 62%|██████▏ | 508000/818627 [00:36<00:22, 14076.36 examples/s]
Filter: 62%|██████▏ | 508000/818627 [00:36<00:22, 14078.38 examples/s]
Filter: 62%|██████▏ | 508000/818627 [00:36<00:22, 13792.85 examples/s]
Filter: 62%|██████▏ | 508000/818627 [00:36<00:22, 13894.68 examples/s]
Filter: 62%|██████▏ | 504000/818627 [00:36<00:22, 14165.38 examples/s]
Filter: 61%|██████ | 500000/818627 [00:36<00:22, 13860.04 examples/s]
Filter: 62%|██████▏ | 504000/818627 [00:36<00:22, 13986.33 examples/s]
Filter: 62%|██████▏ | 504000/818627 [00:36<00:22, 13763.65 examples/s]
Filter: 62%|██████▏ | 510000/818627 [00:36<00:21, 14231.66 examples/s]
Filter: 62%|██████▏ | 510000/818627 [00:36<00:21, 14128.47 examples/s]
Filter: 62%|██████▏ | 506000/818627 [00:37<00:22, 14202.48 examples/s]
Filter: 62%|██████▏ | 510000/818627 [00:36<00:22, 13827.16 examples/s]
Filter: 62%|██████▏ | 510000/818627 [00:36<00:22, 13859.60 examples/s]
Filter: 61%|██████▏ | 502000/818627 [00:36<00:22, 13900.23 examples/s]
Filter: 62%|██████▏ | 506000/818627 [00:36<00:22, 14055.23 examples/s]
Filter: 62%|██████▏ | 506000/818627 [00:36<00:22, 13843.51 examples/s]
Filter: 63%|██████▎ | 512000/818627 [00:36<00:21, 14315.22 examples/s]
Filter: 63%|██████▎ | 512000/818627 [00:36<00:21, 14140.54 examples/s]
Filter: 62%|██████▏ | 508000/818627 [00:37<00:21, 14225.05 examples/s]
Filter: 63%|██████▎ | 512000/818627 [00:36<00:22, 13934.68 examples/s]
Filter: 63%|██████▎ | 512000/818627 [00:36<00:22, 13763.02 examples/s]
Filter: 62%|██████▏ | 504000/818627 [00:37<00:22, 13934.40 examples/s]
Filter: 62%|██████▏ | 508000/818627 [00:37<00:22, 13986.55 examples/s]
Filter: 62%|██████▏ | 508000/818627 [00:37<00:22, 13903.25 examples/s]
Filter: 63%|██████▎ | 514000/818627 [00:37<00:21, 14373.84 examples/s]
Filter: 63%|██████▎ | 514000/818627 [00:37<00:21, 14152.16 examples/s]
Filter: 62%|██████▏ | 510000/818627 [00:37<00:21, 14253.96 examples/s]
Filter: 63%|██████▎ | 514000/818627 [00:37<00:21, 13961.41 examples/s]
Filter: 63%|██████▎ | 514000/818627 [00:37<00:21, 13878.29 examples/s]
Filter: 62%|██████▏ | 506000/818627 [00:37<00:22, 13838.75 examples/s]
Filter: 62%|██████▏ | 510000/818627 [00:37<00:22, 13929.59 examples/s]
Filter: 63%|██████▎ | 516000/818627 [00:37<00:21, 14397.81 examples/s]
Filter: 62%|██████▏ | 510000/818627 [00:37<00:22, 13955.02 examples/s]
Filter: 63%|██████▎ | 516000/818627 [00:37<00:21, 13957.46 examples/s]
Filter: 63%|██████▎ | 512000/818627 [00:37<00:21, 14163.17 examples/s]
Filter: 63%|██████▎ | 516000/818627 [00:37<00:21, 13935.00 examples/s]
Filter: 63%|██████▎ | 516000/818627 [00:37<00:21, 13940.58 examples/s]
Filter: 62%|██████▏ | 508000/818627 [00:37<00:22, 13841.11 examples/s]
Filter: 63%|██████▎ | 512000/818627 [00:37<00:22, 13727.45 examples/s]
Filter: 63%|██████▎ | 518000/818627 [00:37<00:21, 14296.97 examples/s]
Filter: 63%|██████▎ | 512000/818627 [00:37<00:22, 13798.69 examples/s]
Filter: 63%|██████▎ | 518000/818627 [00:37<00:21, 13907.25 examples/s]
Filter: 63%|██████▎ | 514000/818627 [00:37<00:21, 14061.63 examples/s]
Filter: 63%|██████▎ | 518000/818627 [00:37<00:21, 14025.74 examples/s]
Filter: 63%|██████▎ | 518000/818627 [00:37<00:21, 13994.64 examples/s]
Filter: 62%|██████▏ | 510000/818627 [00:37<00:22, 13888.80 examples/s]
Filter: 64%|██████▎ | 520000/818627 [00:37<00:20, 14300.51 examples/s]
Filter: 63%|██████▎ | 514000/818627 [00:37<00:22, 13836.24 examples/s]
Filter: 63%|██████▎ | 514000/818627 [00:37<00:21, 13899.77 examples/s]
Filter: 64%|██████▎ | 520000/818627 [00:37<00:21, 13856.76 examples/s]
Filter: 63%|██████▎ | 516000/818627 [00:37<00:21, 14021.08 examples/s]
Filter: 64%|██████▎ | 520000/818627 [00:37<00:21, 14050.92 examples/s]
Filter: 64%|██████▎ | 520000/818627 [00:37<00:21, 13913.85 examples/s]
Filter: 63%|██████▎ | 512000/818627 [00:37<00:22, 13923.63 examples/s]
Filter: 64%|██████▍ | 522000/818627 [00:37<00:20, 14325.43 examples/s]
Filter: 63%|██████▎ | 516000/818627 [00:37<00:21, 13906.76 examples/s]
Filter: 63%|██████▎ | 516000/818627 [00:37<00:21, 13989.97 examples/s]
Filter: 64%|██████▍ | 522000/818627 [00:37<00:21, 13965.89 examples/s]
Filter: 63%|██████▎ | 518000/818627 [00:37<00:21, 14111.51 examples/s]
Filter: 64%|██████▍ | 522000/818627 [00:37<00:21, 14079.00 examples/s]
Filter: 64%|██████▍ | 522000/818627 [00:37<00:21, 14028.78 examples/s]
Filter: 63%|██████▎ | 514000/818627 [00:37<00:21, 13964.73 examples/s]
Filter: 64%|██████▍ | 524000/818627 [00:37<00:20, 14355.80 examples/s]
Filter: 63%|██████▎ | 518000/818627 [00:37<00:21, 13972.74 examples/s]
Filter: 63%|██████▎ | 518000/818627 [00:37<00:21, 13715.89 examples/s]
Filter: 64%|██████▍ | 524000/818627 [00:37<00:20, 14050.31 examples/s]
Filter: 64%|██████▎ | 520000/818627 [00:38<00:21, 14072.95 examples/s]
Filter: 64%|██████▍ | 524000/818627 [00:37<00:21, 14007.90 examples/s]
Filter: 64%|██████▍ | 524000/818627 [00:37<00:21, 13946.62 examples/s]
Filter: 64%|██████▍ | 526000/818627 [00:37<00:20, 14360.88 examples/s]
Filter: 63%|██████▎ | 516000/818627 [00:37<00:21, 14014.08 examples/s]
Filter: 64%|██████▎ | 520000/818627 [00:37<00:21, 14032.66 examples/s]
Filter: 64%|██████▎ | 520000/818627 [00:37<00:21, 13776.20 examples/s]
Filter: 64%|██████▍ | 526000/818627 [00:37<00:20, 14103.73 examples/s]
Filter: 64%|██████▍ | 522000/818627 [00:38<00:21, 14040.61 examples/s]
Filter: 64%|██████▍ | 526000/818627 [00:37<00:20, 13959.34 examples/s]
Filter: 64%|██████▍ | 526000/818627 [00:37<00:21, 13918.42 examples/s]
Filter: 63%|██████▎ | 518000/818627 [00:38<00:21, 14036.05 examples/s]
Filter: 64%|██████▍ | 528000/818627 [00:38<00:20, 14252.46 examples/s]
Filter: 64%|██████▍ | 522000/818627 [00:38<00:21, 13944.07 examples/s]
Filter: 64%|██████▍ | 522000/818627 [00:38<00:21, 13887.95 examples/s]
Filter: 64%|██████▍ | 528000/818627 [00:38<00:20, 14160.22 examples/s]
Filter: 64%|██████▍ | 524000/818627 [00:38<00:20, 14165.49 examples/s]
Filter: 64%|██████▍ | 528000/818627 [00:38<00:20, 13950.07 examples/s]
Filter: 64%|██████▍ | 528000/818627 [00:38<00:20, 13907.29 examples/s]
Filter: 65%|██████▍ | 530000/818627 [00:38<00:20, 14164.31 examples/s]
Filter: 64%|██████▎ | 520000/818627 [00:38<00:21, 13950.33 examples/s]
Filter: 64%|██████▍ | 524000/818627 [00:38<00:21, 13998.49 examples/s]
Filter: 64%|██████▍ | 524000/818627 [00:38<00:21, 13955.64 examples/s]
Filter: 65%|██████▍ | 530000/818627 [00:38<00:20, 14153.13 examples/s]
Filter: 64%|██████▍ | 526000/818627 [00:38<00:20, 14227.00 examples/s]
Filter: 65%|██████▍ | 530000/818627 [00:38<00:20, 14048.02 examples/s]
Filter: 65%|██████▍ | 530000/818627 [00:38<00:20, 13983.25 examples/s]
Filter: 65%|██████▍ | 532000/818627 [00:38<00:20, 14136.48 examples/s]
Filter: 64%|██████▍ | 522000/818627 [00:38<00:21, 14006.02 examples/s]
Filter: 64%|██████▍ | 526000/818627 [00:38<00:21, 13914.96 examples/s]
Filter: 64%|██████▍ | 526000/818627 [00:38<00:20, 13996.64 examples/s]
Filter: 65%|██████▍ | 532000/818627 [00:38<00:20, 14060.52 examples/s]
Filter: 64%|██████▍ | 528000/818627 [00:38<00:20, 14166.54 examples/s]
Filter: 65%|██████▍ | 532000/818627 [00:38<00:20, 14105.22 examples/s]
Filter: 65%|██████▍ | 532000/818627 [00:38<00:20, 14052.75 examples/s]
Filter: 65%|██████▌ | 534000/818627 [00:38<00:19, 14234.33 examples/s]
Filter: 64%|██████▍ | 524000/818627 [00:38<00:20, 14034.35 examples/s]
Filter: 64%|██████▍ | 528000/818627 [00:38<00:20, 13981.42 examples/s]
Filter: 64%|██████▍ | 528000/818627 [00:38<00:20, 14030.98 examples/s]
Filter: 65%|██████▌ | 534000/818627 [00:38<00:20, 14112.91 examples/s]
Filter: 65%|██████▍ | 530000/818627 [00:38<00:20, 14097.50 examples/s]
Filter: 65%|██████▌ | 534000/818627 [00:38<00:20, 14167.03 examples/s]
Filter: 65%|██████▌ | 534000/818627 [00:38<00:20, 13976.70 examples/s]
Filter: 65%|██████▌ | 536000/818627 [00:38<00:19, 14167.15 examples/s]
Filter: 64%|██████▍ | 526000/818627 [00:38<00:21, 13915.22 examples/s]
Filter: 65%|██████▍ | 530000/818627 [00:38<00:20, 14020.33 examples/s]
Filter: 65%|██████▍ | 530000/818627 [00:38<00:20, 14056.52 examples/s]
Filter: 65%|██████▌ | 536000/818627 [00:38<00:19, 14134.65 examples/s]
Filter: 65%|██████▍ | 532000/818627 [00:38<00:20, 14192.02 examples/s]
Filter: 65%|██████▌ | 536000/818627 [00:38<00:19, 14210.26 examples/s]
Filter: 65%|██████▌ | 536000/818627 [00:38<00:20, 14018.93 examples/s]
Filter: 66%|██████▌ | 538000/818627 [00:38<00:19, 14239.73 examples/s]
Filter: 64%|██████▍ | 528000/818627 [00:38<00:20, 13951.93 examples/s]
Filter: 65%|██████▍ | 532000/818627 [00:38<00:20, 14056.96 examples/s]
Filter: 65%|██████▍ | 532000/818627 [00:38<00:20, 13935.67 examples/s]
Filter: 66%|██████▌ | 538000/818627 [00:38<00:19, 14170.61 examples/s]
Filter: 65%|██████▌ | 534000/818627 [00:39<00:19, 14267.82 examples/s]
Filter: 66%|██████▌ | 538000/818627 [00:38<00:20, 13885.91 examples/s]
Filter: 66%|██████▌ | 538000/818627 [00:38<00:20, 13933.88 examples/s]
Filter: 66%|██████▌ | 540000/818627 [00:38<00:19, 14300.51 examples/s]
Filter: 65%|██████▍ | 530000/818627 [00:38<00:20, 13975.52 examples/s]
Filter: 65%|██████▌ | 534000/818627 [00:38<00:20, 14072.91 examples/s]
Filter: 65%|██████▌ | 534000/818627 [00:38<00:20, 13884.08 examples/s]
Filter: 66%|██████▌ | 540000/818627 [00:38<00:19, 14060.86 examples/s]
Filter: 65%|██████▌ | 536000/818627 [00:39<00:20, 14060.15 examples/s]
Filter: 66%|██████▌ | 540000/818627 [00:38<00:20, 13824.32 examples/s]
Filter: 66%|██████▌ | 540000/818627 [00:38<00:20, 13837.97 examples/s]
Filter: 65%|██████▍ | 532000/818627 [00:39<00:20, 13764.83 examples/s]
Filter: 65%|██████▌ | 536000/818627 [00:39<00:20, 13954.34 examples/s]
Filter: 65%|██████▌ | 536000/818627 [00:39<00:20, 13940.28 examples/s]
Filter: 66%|██████▌ | 538000/818627 [00:39<00:19, 14045.48 examples/s]
Filter: 65%|██████▌ | 534000/818627 [00:39<00:20, 13840.90 examples/s]
Filter: 66%|██████▌ | 538000/818627 [00:39<00:20, 13867.12 examples/s]
Filter: 66%|██████▌ | 538000/818627 [00:39<00:20, 13981.53 examples/s]
Filter: 66%|██████▌ | 540000/818627 [00:39<00:19, 14147.57 examples/s]
Filter: 65%|██████▌ | 536000/818627 [00:39<00:20, 13878.01 examples/s]
Filter: 66%|██████▌ | 542000/818627 [00:39<00:32, 8482.67 examples/s]
Filter: 66%|██████▌ | 540000/818627 [00:39<00:20, 13778.69 examples/s]
Filter: 66%|██████▌ | 540000/818627 [00:39<00:19, 14011.17 examples/s]
Filter: 66%|██████▌ | 542000/818627 [00:39<00:19, 13837.39 examples/s]
Filter: 66%|██████▌ | 542000/818627 [00:39<00:34, 8080.00 examples/s]
Filter: 66%|██████▌ | 538000/818627 [00:39<00:20, 13930.52 examples/s]
Filter: 66%|██████▌ | 542000/818627 [00:39<00:34, 8068.61 examples/s]
Filter: 66%|██████▋ | 544000/818627 [00:39<00:28, 9612.62 examples/s]
Filter: 66%|██████▌ | 542000/818627 [00:39<00:34, 8054.31 examples/s]
Filter: 66%|██████▋ | 544000/818627 [00:39<00:19, 13985.46 examples/s]
Filter: 66%|██████▋ | 544000/818627 [00:39<00:29, 9186.62 examples/s]
Filter: 66%|██████▌ | 540000/818627 [00:39<00:19, 13953.50 examples/s]
Filter: 66%|██████▋ | 544000/818627 [00:39<00:29, 9236.11 examples/s]
Filter: 67%|██████▋ | 546000/818627 [00:39<00:25, 10569.51 examples/s]
Filter: 66%|██████▋ | 544000/818627 [00:39<00:29, 9213.67 examples/s]
Filter: 67%|██████▋ | 546000/818627 [00:39<00:26, 10246.55 examples/s]
Filter: 67%|██████▋ | 546000/818627 [00:39<00:26, 10300.80 examples/s]
Filter: 67%|██████▋ | 546000/818627 [00:39<00:26, 10274.74 examples/s]
Filter: 67%|██████▋ | 548000/818627 [00:39<00:23, 11358.44 examples/s]
Filter: 66%|██████▌ | 542000/818627 [00:39<00:32, 8500.12 examples/s]
Filter: 66%|██████▌ | 542000/818627 [00:39<00:34, 8033.16 examples/s]
Filter: 67%|██████▋ | 548000/818627 [00:39<00:24, 11171.04 examples/s]
Filter: 67%|██████▋ | 548000/818627 [00:39<00:24, 11222.80 examples/s]
Filter: 67%|██████▋ | 548000/818627 [00:39<00:24, 11187.44 examples/s]
Filter: 67%|██████▋ | 550000/818627 [00:39<00:22, 12008.22 examples/s]
Filter: 66%|██████▋ | 544000/818627 [00:39<00:28, 9592.73 examples/s]
Filter: 66%|██████▋ | 544000/818627 [00:39<00:29, 9193.50 examples/s]
Filter: 67%|██████▋ | 550000/818627 [00:40<00:22, 11923.95 examples/s]
Filter: 67%|██████▋ | 550000/818627 [00:40<00:22, 11877.17 examples/s]
Filter: 67%|██████▋ | 552000/818627 [00:40<00:21, 12639.65 examples/s]
Filter: 67%|██████▋ | 550000/818627 [00:40<00:22, 11856.36 examples/s]
Filter: 67%|██████▋ | 546000/818627 [00:40<00:35, 7760.77 examples/s]
Filter: 67%|██████▋ | 546000/818627 [00:40<00:25, 10573.24 examples/s]
Filter: 66%|██████▌ | 542000/818627 [00:40<00:33, 8143.31 examples/s]
Filter: 67%|██████▋ | 546000/818627 [00:40<00:26, 10255.23 examples/s]
Filter: 67%|██████▋ | 552000/818627 [00:40<00:21, 12510.24 examples/s]
Filter: 67%|██████▋ | 552000/818627 [00:40<00:21, 12494.36 examples/s]
Filter: 68%|██████▊ | 554000/818627 [00:40<00:20, 13112.39 examples/s]
Filter: 67%|██████▋ | 552000/818627 [00:40<00:21, 12451.92 examples/s]
Filter: 67%|██████▋ | 548000/818627 [00:40<00:30, 8888.43 examples/s]
Filter: 67%|██████▋ | 548000/818627 [00:40<00:23, 11342.30 examples/s]
Filter: 66%|██████▋ | 544000/818627 [00:40<00:30, 9145.45 examples/s]
Filter: 67%|██████▋ | 548000/818627 [00:40<00:24, 11100.93 examples/s]
Filter: 68%|██████▊ | 554000/818627 [00:40<00:20, 12853.51 examples/s]
Filter: 68%|██████▊ | 554000/818627 [00:40<00:20, 12895.15 examples/s]
Filter: 68%|██████▊ | 556000/818627 [00:40<00:19, 13461.73 examples/s]
Filter: 68%|██████▊ | 554000/818627 [00:40<00:20, 12834.71 examples/s]
Filter: 67%|██████▋ | 550000/818627 [00:40<00:27, 9903.61 examples/s]
Filter: 67%|██████▋ | 550000/818627 [00:40<00:22, 11950.31 examples/s]
Filter: 67%|██████▋ | 546000/818627 [00:40<00:26, 10202.21 examples/s]
Filter: 67%|██████▋ | 550000/818627 [00:40<00:22, 11858.61 examples/s]
Filter: 68%|██████▊ | 556000/818627 [00:40<00:19, 13134.88 examples/s]
Filter: 68%|██████▊ | 558000/818627 [00:40<00:18, 13730.23 examples/s]
Filter: 68%|██████▊ | 556000/818627 [00:40<00:19, 13270.33 examples/s]
Filter: 68%|██████▊ | 556000/818627 [00:40<00:19, 13192.71 examples/s]
Filter: 67%|██████▋ | 552000/818627 [00:40<00:24, 10891.69 examples/s]
Filter: 67%|██████▋ | 552000/818627 [00:40<00:21, 12458.52 examples/s]
Filter: 67%|██████▋ | 548000/818627 [00:40<00:24, 11028.08 examples/s]
Filter: 67%|██████▋ | 552000/818627 [00:40<00:21, 12315.39 examples/s]
Filter: 68%|██████▊ | 558000/818627 [00:40<00:19, 13311.77 examples/s]
Filter: 68%|██████▊ | 558000/818627 [00:40<00:19, 13559.84 examples/s]
Filter: 68%|██████▊ | 560000/818627 [00:40<00:18, 13837.14 examples/s]
Filter: 68%|██████▊ | 558000/818627 [00:40<00:19, 13423.61 examples/s]
Filter: 68%|██████▊ | 554000/818627 [00:40<00:22, 11616.03 examples/s]
Filter: 68%|██████▊ | 554000/818627 [00:40<00:20, 12890.76 examples/s]
Filter: 67%|██████▋ | 550000/818627 [00:40<00:22, 11767.62 examples/s]
Filter: 68%|██████▊ | 554000/818627 [00:40<00:20, 12805.95 examples/s]
Filter: 68%|██████▊ | 560000/818627 [00:40<00:19, 13560.18 examples/s]
Filter: 68%|██████▊ | 560000/818627 [00:40<00:18, 13712.09 examples/s]
Filter: 69%|██████▊ | 562000/818627 [00:40<00:18, 13914.52 examples/s]
Filter: 68%|██████▊ | 560000/818627 [00:40<00:19, 13608.38 examples/s]
Filter: 68%|██████▊ | 556000/818627 [00:40<00:21, 12205.65 examples/s]
Filter: 68%|██████▊ | 556000/818627 [00:40<00:19, 13226.48 examples/s]
Filter: 67%|██████▋ | 552000/818627 [00:40<00:21, 12273.31 examples/s]
Filter: 68%|██████▊ | 556000/818627 [00:40<00:20, 13020.06 examples/s]
Filter: 69%|██████▊ | 562000/818627 [00:40<00:18, 13733.84 examples/s]
Filter: 69%|██████▉ | 564000/818627 [00:40<00:18, 14060.10 examples/s]
Filter: 69%|██████▊ | 562000/818627 [00:40<00:18, 13871.28 examples/s]
Filter: 69%|██████▊ | 562000/818627 [00:40<00:18, 13737.17 examples/s]
Filter: 68%|██████▊ | 558000/818627 [00:41<00:20, 12696.53 examples/s]
Filter: 68%|██████▊ | 558000/818627 [00:40<00:19, 13353.03 examples/s]
Filter: 68%|██████▊ | 554000/818627 [00:40<00:20, 12668.06 examples/s]
Filter: 68%|██████▊ | 558000/818627 [00:40<00:19, 13200.78 examples/s]
Filter: 69%|██████▉ | 564000/818627 [00:41<00:18, 13870.88 examples/s]
Filter: 69%|██████▉ | 566000/818627 [00:41<00:17, 14171.57 examples/s]
Filter: 69%|██████▉ | 564000/818627 [00:41<00:18, 13940.86 examples/s]
Filter: 69%|██████▉ | 564000/818627 [00:41<00:18, 13837.80 examples/s]
Filter: 68%|██████▊ | 560000/818627 [00:41<00:19, 13108.61 examples/s]
Filter: 68%|██████▊ | 560000/818627 [00:41<00:19, 13558.14 examples/s]
Filter: 68%|██████▊ | 556000/818627 [00:41<00:20, 13032.48 examples/s]
Filter: 68%|██████▊ | 560000/818627 [00:41<00:19, 13449.04 examples/s]
Filter: 69%|██████▉ | 566000/818627 [00:41<00:18, 13970.52 examples/s]
Filter: 69%|██████▉ | 568000/818627 [00:41<00:17, 14251.29 examples/s]
Filter: 69%|██████▉ | 566000/818627 [00:41<00:18, 13931.54 examples/s]
Filter: 69%|██████▉ | 566000/818627 [00:41<00:18, 13960.78 examples/s]
Filter: 69%|██████▊ | 562000/818627 [00:41<00:19, 13326.08 examples/s]
Filter: 69%|██████▊ | 562000/818627 [00:41<00:18, 13714.91 examples/s]
Filter: 68%|██████▊ | 558000/818627 [00:41<00:19, 13323.95 examples/s]
Filter: 69%|██████▊ | 562000/818627 [00:41<00:18, 13604.39 examples/s]
Filter: 69%|██████▉ | 568000/818627 [00:41<00:17, 14070.73 examples/s]
Filter: 70%|██████▉ | 570000/818627 [00:41<00:17, 14245.63 examples/s]
Filter: 69%|██████▉ | 568000/818627 [00:41<00:18, 13912.76 examples/s]
Filter: 69%|██████▉ | 568000/818627 [00:41<00:17, 14007.45 examples/s]
Filter: 69%|██████▉ | 564000/818627 [00:41<00:18, 13465.37 examples/s]
Filter: 69%|██████▉ | 564000/818627 [00:41<00:18, 13798.38 examples/s]
Filter: 68%|██████▊ | 560000/818627 [00:41<00:19, 13526.14 examples/s]
Filter: 69%|██████▉ | 564000/818627 [00:41<00:18, 13755.93 examples/s]
Filter: 70%|██████▉ | 570000/818627 [00:41<00:17, 14116.62 examples/s]
Filter: 70%|██████▉ | 572000/818627 [00:41<00:17, 14296.07 examples/s]
Filter: 70%|██████▉ | 570000/818627 [00:41<00:17, 14000.39 examples/s]
Filter: 70%|██████▉ | 570000/818627 [00:41<00:17, 14051.17 examples/s]
Filter: 69%|██████▉ | 566000/818627 [00:41<00:19, 13222.25 examples/s]
Filter: 69%|██████▉ | 566000/818627 [00:41<00:18, 13853.15 examples/s]
Filter: 69%|██████▊ | 562000/818627 [00:41<00:18, 13669.21 examples/s]
Filter: 69%|██████▉ | 566000/818627 [00:41<00:18, 13666.46 examples/s]
Filter: 70%|██████▉ | 572000/818627 [00:41<00:17, 14141.59 examples/s]
Filter: 70%|███████ | 574000/818627 [00:41<00:17, 14334.66 examples/s]
Filter: 70%|██████▉ | 572000/818627 [00:41<00:17, 14073.07 examples/s]
Filter: 70%|██████▉ | 572000/818627 [00:41<00:17, 14071.65 examples/s]
Filter: 69%|██████▉ | 568000/818627 [00:41<00:18, 13455.27 examples/s]
Filter: 69%|██████▉ | 568000/818627 [00:41<00:18, 13918.54 examples/s]
Filter: 69%|██████▉ | 564000/818627 [00:41<00:18, 13778.44 examples/s]
Filter: 69%|██████▉ | 568000/818627 [00:41<00:18, 13784.50 examples/s]
Filter: 70%|███████ | 574000/818627 [00:41<00:17, 14185.06 examples/s]
Filter: 70%|███████ | 576000/818627 [00:41<00:16, 14339.79 examples/s]
Filter: 70%|███████ | 574000/818627 [00:41<00:17, 14140.34 examples/s]
Filter: 70%|███████ | 574000/818627 [00:41<00:17, 14079.97 examples/s]
Filter: 70%|██████▉ | 570000/818627 [00:41<00:18, 13502.10 examples/s]
Filter: 70%|██████▉ | 570000/818627 [00:41<00:18, 13712.87 examples/s]
Filter: 69%|██████▉ | 566000/818627 [00:41<00:18, 13840.09 examples/s]
Filter: 70%|██████▉ | 570000/818627 [00:41<00:17, 13818.90 examples/s]
Filter: 70%|███████ | 576000/818627 [00:41<00:17, 14142.04 examples/s]
Filter: 71%|███████ | 578000/818627 [00:41<00:16, 14194.92 examples/s]
Filter: 70%|███████ | 576000/818627 [00:41<00:17, 14145.11 examples/s]
Filter: 70%|███████ | 576000/818627 [00:41<00:17, 14095.43 examples/s]
Filter: 70%|██████▉ | 572000/818627 [00:42<00:18, 13680.13 examples/s]
Filter: 70%|██████▉ | 572000/818627 [00:41<00:17, 13779.22 examples/s]
Filter: 69%|██████▉ | 568000/818627 [00:41<00:18, 13903.67 examples/s]
Filter: 70%|██████▉ | 572000/818627 [00:41<00:17, 13876.11 examples/s]
Filter: 71%|███████ | 578000/818627 [00:41<00:16, 14179.56 examples/s]
Filter: 71%|███████ | 580000/818627 [00:41<00:16, 14125.58 examples/s]
Filter: 71%|███████ | 578000/818627 [00:42<00:16, 14203.90 examples/s]
Filter: 71%|███████ | 578000/818627 [00:42<00:17, 13936.55 examples/s]
Filter: 70%|███████ | 574000/818627 [00:42<00:17, 13714.02 examples/s]
Filter: 70%|███████ | 574000/818627 [00:42<00:17, 13853.97 examples/s]
Filter: 70%|██████▉ | 570000/818627 [00:42<00:17, 13964.65 examples/s]
Filter: 71%|███████ | 580000/818627 [00:42<00:16, 14208.26 examples/s]
Filter: 70%|███████ | 574000/818627 [00:42<00:17, 13838.22 examples/s]
Filter: 71%|███████ | 582000/818627 [00:42<00:16, 14193.26 examples/s]
Filter: 71%|███████ | 580000/818627 [00:42<00:16, 14250.47 examples/s]
Filter: 71%|███████ | 580000/818627 [00:42<00:17, 14029.20 examples/s]
Filter: 70%|███████ | 576000/818627 [00:42<00:17, 13727.80 examples/s]
Filter: 70%|███████ | 576000/818627 [00:42<00:17, 13825.15 examples/s]
Filter: 70%|██████▉ | 572000/818627 [00:42<00:17, 14005.39 examples/s]
Filter: 71%|███████ | 582000/818627 [00:42<00:16, 14102.60 examples/s]
Filter: 70%|███████ | 576000/818627 [00:42<00:17, 13786.60 examples/s]
Filter: 71%|███████▏ | 584000/818627 [00:42<00:16, 14119.07 examples/s]
Filter: 71%|███████ | 582000/818627 [00:42<00:16, 14284.19 examples/s]
Filter: 71%|███████ | 582000/818627 [00:42<00:16, 14088.65 examples/s]
Filter: 71%|███████ | 578000/818627 [00:42<00:17, 13896.71 examples/s]
Filter: 71%|███████ | 578000/818627 [00:42<00:17, 13899.49 examples/s]
Filter: 70%|███████ | 574000/818627 [00:42<00:17, 13832.14 examples/s]
Filter: 71%|███████▏ | 584000/818627 [00:42<00:16, 14014.29 examples/s]
Filter: 71%|███████ | 578000/818627 [00:42<00:17, 13760.34 examples/s]
Filter: 71%|███████▏ | 584000/818627 [00:42<00:16, 14184.31 examples/s]
Filter: 72%|███████▏ | 586000/818627 [00:42<00:17, 13679.05 examples/s]
Filter: 71%|███████▏ | 584000/818627 [00:42<00:16, 13985.26 examples/s]
Filter: 71%|███████ | 580000/818627 [00:42<00:17, 13852.27 examples/s]
Filter: 71%|███████ | 580000/818627 [00:42<00:17, 13689.53 examples/s]
Filter: 70%|███████ | 576000/818627 [00:42<00:17, 13869.77 examples/s]
Filter: 72%|███████▏ | 586000/818627 [00:42<00:16, 14116.86 examples/s]
Filter: 71%|███████ | 580000/818627 [00:42<00:17, 13724.12 examples/s]
Filter: 72%|███████▏ | 586000/818627 [00:42<00:16, 14238.31 examples/s]
Filter: 72%|███████▏ | 588000/818627 [00:42<00:16, 13853.53 examples/s]
Filter: 72%|███████▏ | 586000/818627 [00:42<00:16, 13920.30 examples/s]
Filter: 71%|███████ | 582000/818627 [00:42<00:17, 13814.89 examples/s]
Filter: 71%|███████ | 582000/818627 [00:42<00:17, 13726.30 examples/s]
Filter: 71%|███████ | 578000/818627 [00:42<00:17, 13820.40 examples/s]
Filter: 72%|███████▏ | 588000/818627 [00:42<00:16, 14048.51 examples/s]
Filter: 71%|███████ | 582000/818627 [00:42<00:17, 13800.24 examples/s]
Filter: 72%|███████▏ | 588000/818627 [00:42<00:16, 14248.02 examples/s]
Filter: 72%|███████▏ | 590000/818627 [00:42<00:16, 13983.75 examples/s]
Filter: 72%|███████▏ | 588000/818627 [00:42<00:16, 14000.83 examples/s]
Filter: 71%|███████▏ | 584000/818627 [00:43<00:16, 13919.01 examples/s]
Filter: 71%|███████▏ | 584000/818627 [00:42<00:16, 13809.80 examples/s]
Filter: 71%|███████ | 580000/818627 [00:42<00:17, 13902.67 examples/s]
Filter: 72%|███████▏ | 590000/818627 [00:42<00:16, 14121.57 examples/s]
Filter: 71%|███████▏ | 584000/818627 [00:42<00:17, 13688.64 examples/s]
Filter: 72%|███████▏ | 590000/818627 [00:42<00:16, 14153.72 examples/s]
Filter: 72%|███████▏ | 592000/818627 [00:42<00:16, 13986.05 examples/s]
Filter: 72%|███████▏ | 590000/818627 [00:42<00:16, 14081.28 examples/s]
Filter: 72%|███████▏ | 586000/818627 [00:43<00:16, 13990.47 examples/s]
Filter: 72%|███████▏ | 586000/818627 [00:42<00:16, 13886.15 examples/s]
Filter: 71%|███████ | 582000/818627 [00:42<00:16, 13950.00 examples/s]
Filter: 72%|███████▏ | 592000/818627 [00:42<00:15, 14181.33 examples/s]
Filter: 72%|███████▏ | 592000/818627 [00:43<00:15, 14216.95 examples/s]
Filter: 72%|███████▏ | 586000/818627 [00:43<00:16, 13692.27 examples/s]
Filter: 73%|███████▎ | 594000/818627 [00:42<00:16, 13988.02 examples/s]
Filter: 72%|███████▏ | 592000/818627 [00:43<00:16, 14134.84 examples/s]
Filter: 72%|███████▏ | 588000/818627 [00:43<00:16, 14023.70 examples/s]
Filter: 72%|███████▏ | 588000/818627 [00:43<00:16, 13924.08 examples/s]
Filter: 71%|███████▏ | 584000/818627 [00:43<00:16, 13984.44 examples/s]
Filter: 73%|███████▎ | 594000/818627 [00:43<00:15, 14200.88 examples/s]
Filter: 73%|███████▎ | 594000/818627 [00:43<00:15, 14249.59 examples/s]
Filter: 72%|███████▏ | 588000/818627 [00:43<00:16, 13799.17 examples/s]
Filter: 73%|███████▎ | 596000/818627 [00:43<00:15, 14100.38 examples/s]
Filter: 73%|███████▎ | 594000/818627 [00:43<00:15, 14150.41 examples/s]
Filter: 72%|███████▏ | 590000/818627 [00:43<00:16, 13803.10 examples/s]
Filter: 72%|███████▏ | 590000/818627 [00:43<00:16, 13955.83 examples/s]
Filter: 73%|███████▎ | 596000/818627 [00:43<00:15, 14083.94 examples/s]
Filter: 72%|███████▏ | 586000/818627 [00:43<00:16, 13882.26 examples/s]
Filter: 73%|███████▎ | 596000/818627 [00:43<00:15, 14151.88 examples/s]
Filter: 72%|███████▏ | 590000/818627 [00:43<00:16, 13898.43 examples/s]
Filter: 73%|███████▎ | 598000/818627 [00:43<00:15, 14081.68 examples/s]
Filter: 73%|███████▎ | 596000/818627 [00:43<00:15, 14065.47 examples/s]
Filter: 72%|███████▏ | 592000/818627 [00:43<00:16, 13782.20 examples/s]
Filter: 72%|███████▏ | 592000/818627 [00:43<00:16, 13956.27 examples/s]
Filter: 73%|███████▎ | 598000/818627 [00:43<00:15, 14139.88 examples/s]
Filter: 72%|███████▏ | 588000/818627 [00:43<00:16, 13915.95 examples/s]
Filter: 73%|███████▎ | 598000/818627 [00:43<00:15, 14184.08 examples/s]
Filter: 72%|███████▏ | 592000/818627 [00:43<00:16, 13918.30 examples/s]
Filter: 73%|███████▎ | 600000/818627 [00:43<00:15, 14162.25 examples/s]
Filter: 73%|███████▎ | 598000/818627 [00:43<00:15, 14038.57 examples/s]
Filter: 73%|███████▎ | 594000/818627 [00:43<00:16, 13803.56 examples/s]
Filter: 73%|███████▎ | 594000/818627 [00:43<00:16, 13992.52 examples/s]
Filter: 73%|███████▎ | 600000/818627 [00:43<00:15, 14074.23 examples/s]
Filter: 72%|███████▏ | 590000/818627 [00:43<00:16, 13961.85 examples/s]
Filter: 73%|███████▎ | 600000/818627 [00:43<00:15, 14211.65 examples/s]
Filter: 74%|███████▎ | 602000/818627 [00:43<00:15, 14253.97 examples/s]
Filter: 73%|███████▎ | 594000/818627 [00:43<00:16, 13886.71 examples/s]
Filter: 73%|███████▎ | 600000/818627 [00:43<00:15, 13931.50 examples/s]
Filter: 73%|███████▎ | 596000/818627 [00:43<00:16, 13883.87 examples/s]
Filter: 73%|███████▎ | 596000/818627 [00:43<00:15, 14010.93 examples/s]
Filter: 72%|███████▏ | 592000/818627 [00:43<00:16, 14000.08 examples/s]
Filter: 74%|███████▎ | 602000/818627 [00:43<00:15, 13996.62 examples/s]
Filter: 74%|███████▎ | 602000/818627 [00:43<00:15, 14249.29 examples/s]
Filter: 74%|███████▍ | 604000/818627 [00:43<00:14, 14320.32 examples/s]
Filter: 73%|███████▎ | 596000/818627 [00:43<00:15, 13942.52 examples/s]
Filter: 74%|███████▎ | 602000/818627 [00:43<00:15, 14020.86 examples/s]
Filter: 73%|███████▎ | 598000/818627 [00:44<00:16, 13758.81 examples/s]
Filter: 73%|███████▎ | 598000/818627 [00:43<00:15, 13816.26 examples/s]
Filter: 74%|███████▍ | 604000/818627 [00:43<00:15, 14055.64 examples/s]
Filter: 73%|███████▎ | 594000/818627 [00:43<00:16, 14016.51 examples/s]
Filter: 74%|███████▍ | 604000/818627 [00:43<00:15, 14171.76 examples/s]
Filter: 74%|███████▍ | 606000/818627 [00:43<00:14, 14201.88 examples/s]
Filter: 73%|███████▎ | 598000/818627 [00:43<00:15, 13860.02 examples/s]
Filter: 74%|███████▍ | 604000/818627 [00:43<00:15, 14079.63 examples/s]
Filter: 73%|███████▎ | 600000/818627 [00:44<00:15, 13824.05 examples/s]
Filter: 73%|███████▎ | 600000/818627 [00:43<00:15, 13814.52 examples/s]
Filter: 74%|███████▍ | 606000/818627 [00:43<00:15, 14046.22 examples/s]
Filter: 73%|███████▎ | 596000/818627 [00:43<00:15, 13991.25 examples/s]
Filter: 74%|███████▍ | 606000/818627 [00:43<00:15, 14164.08 examples/s]
Filter: 74%|███████▍ | 608000/818627 [00:43<00:14, 14256.23 examples/s]
Filter: 73%|███████▎ | 600000/818627 [00:44<00:15, 13766.56 examples/s]
Filter: 74%|███████▍ | 606000/818627 [00:44<00:15, 14046.05 examples/s]
Filter: 74%|███████▎ | 602000/818627 [00:44<00:15, 13927.92 examples/s]
Filter: 74%|███████▎ | 602000/818627 [00:44<00:15, 13889.19 examples/s]
Filter: 74%|███████▍ | 608000/818627 [00:44<00:14, 14090.86 examples/s]
Filter: 73%|███████▎ | 598000/818627 [00:44<00:15, 13996.06 examples/s]
Filter: 74%|███████▍ | 608000/818627 [00:44<00:14, 14080.20 examples/s]
Filter: 75%|███████▍ | 610000/818627 [00:44<00:14, 14099.74 examples/s]
Filter: 74%|███████▎ | 602000/818627 [00:44<00:15, 13820.73 examples/s]
Filter: 74%|███████▍ | 608000/818627 [00:44<00:14, 14083.38 examples/s]
Filter: 74%|███████▍ | 604000/818627 [00:44<00:15, 13994.91 examples/s]
Filter: 74%|███████▍ | 604000/818627 [00:44<00:15, 13940.10 examples/s]
Filter: 75%|███████▍ | 610000/818627 [00:44<00:14, 14130.74 examples/s]
Filter: 73%|███████▎ | 600000/818627 [00:44<00:15, 13822.91 examples/s]
Filter: 75%|███████▍ | 610000/818627 [00:44<00:14, 14048.90 examples/s]
Filter: 75%|███████▍ | 612000/818627 [00:44<00:14, 14193.73 examples/s]
Filter: 74%|███████▍ | 604000/818627 [00:44<00:15, 13661.19 examples/s]
Filter: 75%|███████▍ | 610000/818627 [00:44<00:14, 14014.12 examples/s]
Filter: 74%|███████▍ | 606000/818627 [00:44<00:15, 13861.19 examples/s]
Filter: 75%|███████▍ | 612000/818627 [00:44<00:14, 14044.41 examples/s]
Filter: 74%|███████▍ | 606000/818627 [00:44<00:15, 13844.63 examples/s]
Filter: 74%|███████▎ | 602000/818627 [00:44<00:15, 13908.53 examples/s]
Filter: 75%|███████▌ | 614000/818627 [00:44<00:14, 14020.42 examples/s]
Filter: 75%|███████▍ | 612000/818627 [00:44<00:14, 13914.90 examples/s]
Filter: 74%|███████▍ | 606000/818627 [00:44<00:15, 13750.50 examples/s]
Filter: 75%|███████▍ | 612000/818627 [00:44<00:14, 14081.94 examples/s]
Filter: 74%|███████▍ | 608000/818627 [00:44<00:15, 13807.28 examples/s]
Filter: 75%|███████▌ | 614000/818627 [00:44<00:14, 14125.47 examples/s]
Filter: 74%|███████▍ | 608000/818627 [00:44<00:15, 13894.71 examples/s]
Filter: 74%|███████▍ | 604000/818627 [00:44<00:15, 13872.91 examples/s]
Filter: 75%|███████▌ | 616000/818627 [00:44<00:14, 14040.43 examples/s]
Filter: 75%|███████▌ | 614000/818627 [00:44<00:14, 13939.04 examples/s]
Filter: 75%|███████▌ | 614000/818627 [00:44<00:14, 14139.46 examples/s]
Filter: 74%|███████▍ | 608000/818627 [00:44<00:15, 13387.77 examples/s]
Filter: 75%|███████▌ | 616000/818627 [00:44<00:14, 14192.03 examples/s]
Filter: 75%|███████▍ | 610000/818627 [00:44<00:15, 13901.14 examples/s]
Filter: 75%|███████▍ | 610000/818627 [00:44<00:14, 13959.68 examples/s]
Filter: 74%|███████▍ | 606000/818627 [00:44<00:15, 13800.77 examples/s]
Filter: 75%|███████▌ | 618000/818627 [00:44<00:14, 14154.53 examples/s]
Filter: 75%|███████▌ | 616000/818627 [00:44<00:14, 13878.68 examples/s]
Filter: 75%|███████▌ | 616000/818627 [00:44<00:14, 14161.80 examples/s]
Filter: 75%|███████▍ | 610000/818627 [00:44<00:15, 13464.79 examples/s]
Filter: 75%|███████▍ | 612000/818627 [00:45<00:14, 13992.53 examples/s]
Filter: 75%|███████▌ | 618000/818627 [00:44<00:14, 14093.31 examples/s]
Filter: 75%|███████▍ | 612000/818627 [00:44<00:14, 13977.04 examples/s]
Filter: 76%|███████▌ | 620000/818627 [00:44<00:13, 14248.76 examples/s]
Filter: 74%|███████▍ | 608000/818627 [00:44<00:15, 13897.23 examples/s]
Filter: 75%|███████▌ | 618000/818627 [00:44<00:14, 14031.89 examples/s]
Filter: 75%|███████▌ | 618000/818627 [00:44<00:14, 14180.00 examples/s]
Filter: 75%|███████▍ | 612000/818627 [00:44<00:15, 13537.09 examples/s]
Filter: 75%|███████▌ | 614000/818627 [00:45<00:14, 13884.18 examples/s]
Filter: 76%|███████▌ | 620000/818627 [00:44<00:14, 14028.99 examples/s]
Filter: 75%|███████▌ | 614000/818627 [00:44<00:14, 13878.15 examples/s]
Filter: 76%|███████▌ | 622000/818627 [00:44<00:13, 14335.27 examples/s]
Filter: 75%|███████▍ | 610000/818627 [00:44<00:14, 13977.09 examples/s]
Filter: 76%|███████▌ | 620000/818627 [00:44<00:14, 14142.69 examples/s]
Filter: 76%|███████▌ | 620000/818627 [00:45<00:14, 13942.04 examples/s]
Filter: 75%|███████▌ | 614000/818627 [00:45<00:14, 13706.53 examples/s]
Filter: 76%|███████▌ | 622000/818627 [00:45<00:13, 14109.56 examples/s]
Filter: 75%|███████▌ | 616000/818627 [00:45<00:14, 13842.31 examples/s]
Filter: 76%|███████▌ | 624000/818627 [00:45<00:13, 14386.26 examples/s]
Filter: 75%|███████▌ | 616000/818627 [00:45<00:14, 13932.06 examples/s]
Filter: 75%|███████▍ | 612000/818627 [00:45<00:14, 14021.57 examples/s]
Filter: 76%|███████▌ | 622000/818627 [00:45<00:13, 14101.24 examples/s]
Filter: 76%|███████▌ | 622000/818627 [00:45<00:14, 13780.98 examples/s]
Filter: 75%|███████▌ | 616000/818627 [00:45<00:14, 13715.89 examples/s]
Filter: 76%|███████▌ | 624000/818627 [00:45<00:13, 14016.02 examples/s]
Filter: 76%|███████▋ | 626000/818627 [00:45<00:13, 14415.18 examples/s]
Filter: 75%|███████▌ | 618000/818627 [00:45<00:14, 13926.11 examples/s]
Filter: 75%|███████▌ | 618000/818627 [00:45<00:14, 13973.39 examples/s]
Filter: 75%|███████▌ | 614000/818627 [00:45<00:14, 14051.84 examples/s]
Filter: 76%|███████▌ | 624000/818627 [00:45<00:13, 14150.65 examples/s]
Filter: 76%|███████▌ | 624000/818627 [00:45<00:14, 13787.02 examples/s]
Filter: 75%|███████▌ | 618000/818627 [00:45<00:14, 13831.53 examples/s]
Filter: 77%|███████▋ | 628000/818627 [00:45<00:13, 14466.02 examples/s]
Filter: 76%|███████▋ | 626000/818627 [00:45<00:13, 14093.38 examples/s]
Filter: 76%|███████▌ | 620000/818627 [00:45<00:14, 13875.88 examples/s]
Filter: 76%|███████▋ | 626000/818627 [00:45<00:13, 14225.82 examples/s]
Filter: 75%|███████▌ | 616000/818627 [00:45<00:14, 14063.84 examples/s]
Filter: 76%|███████▌ | 620000/818627 [00:45<00:14, 13763.83 examples/s]
Filter: 76%|███████▋ | 626000/818627 [00:45<00:13, 13933.98 examples/s]
Filter: 76%|███████▌ | 620000/818627 [00:45<00:14, 13899.20 examples/s]
Filter: 77%|███████▋ | 630000/818627 [00:45<00:13, 14436.68 examples/s]
Filter: 77%|███████▋ | 628000/818627 [00:45<00:13, 14006.49 examples/s]
Filter: 76%|███████▌ | 622000/818627 [00:45<00:14, 13831.06 examples/s]
Filter: 75%|███████▌ | 618000/818627 [00:45<00:14, 14070.41 examples/s]
Filter: 77%|███████▋ | 628000/818627 [00:45<00:13, 14140.45 examples/s]
Filter: 76%|███████▌ | 622000/818627 [00:45<00:14, 13738.36 examples/s]
Filter: 77%|███████▋ | 628000/818627 [00:45<00:13, 13883.43 examples/s]
Filter: 76%|███████▌ | 622000/818627 [00:45<00:14, 13953.53 examples/s]
Filter: 77%|███████▋ | 632000/818627 [00:45<00:12, 14465.37 examples/s]
Filter: 77%|███████▋ | 630000/818627 [00:45<00:13, 14060.61 examples/s]
Filter: 76%|███████▌ | 624000/818627 [00:45<00:13, 13939.38 examples/s]
Filter: 77%|███████▋ | 630000/818627 [00:45<00:13, 14198.67 examples/s]
Filter: 76%|███████▌ | 620000/818627 [00:45<00:14, 13953.47 examples/s]
Filter: 76%|███████▌ | 624000/818627 [00:45<00:14, 13836.38 examples/s]
Filter: 77%|███████▋ | 630000/818627 [00:45<00:13, 13973.26 examples/s]
Filter: 76%|███████▌ | 624000/818627 [00:45<00:14, 13879.70 examples/s]
Filter: 77%|███████▋ | 634000/818627 [00:45<00:12, 14439.48 examples/s]
Filter: 77%|███████▋ | 632000/818627 [00:45<00:13, 14118.58 examples/s]
Filter: 76%|███████▋ | 626000/818627 [00:46<00:13, 13999.15 examples/s]
Filter: 77%|███████▋ | 632000/818627 [00:45<00:13, 14133.26 examples/s]
Filter: 76%|███████▌ | 622000/818627 [00:45<00:14, 14000.35 examples/s]
Filter: 76%|███████▋ | 626000/818627 [00:45<00:13, 13912.96 examples/s]
Filter: 77%|███████▋ | 632000/818627 [00:45<00:13, 14048.78 examples/s]
Filter: 76%|███████▋ | 626000/818627 [00:45<00:13, 13866.53 examples/s]
Filter: 78%|███████▊ | 636000/818627 [00:45<00:12, 14448.80 examples/s]
Filter: 77%|███████▋ | 634000/818627 [00:45<00:13, 14032.70 examples/s]
Filter: 77%|███████▋ | 628000/818627 [00:46<00:13, 14042.16 examples/s]
Filter: 77%|███████▋ | 634000/818627 [00:45<00:12, 14202.08 examples/s]
Filter: 76%|███████▌ | 624000/818627 [00:45<00:13, 14017.93 examples/s]
Filter: 77%|███████▋ | 628000/818627 [00:45<00:13, 13966.81 examples/s]
Filter: 77%|███████▋ | 634000/818627 [00:46<00:13, 13992.59 examples/s]
Filter: 77%|███████▋ | 628000/818627 [00:46<00:13, 13968.87 examples/s]
Filter: 78%|███████▊ | 638000/818627 [00:46<00:12, 14459.44 examples/s]
Filter: 78%|███████▊ | 636000/818627 [00:46<00:12, 14055.28 examples/s]
Filter: 77%|███████▋ | 630000/818627 [00:46<00:13, 14068.84 examples/s]
Filter: 78%|███████▊ | 636000/818627 [00:46<00:12, 14214.90 examples/s]
Filter: 77%|███████▋ | 630000/818627 [00:46<00:13, 13991.01 examples/s]
Filter: 76%|███████▋ | 626000/818627 [00:46<00:13, 13936.34 examples/s]
Filter: 78%|███████▊ | 636000/818627 [00:46<00:13, 13888.36 examples/s]
Filter: 77%|███████▋ | 630000/818627 [00:46<00:13, 13828.35 examples/s]
Filter: 78%|███████▊ | 640000/818627 [00:46<00:12, 14303.39 examples/s]
Filter: 78%|███████▊ | 638000/818627 [00:46<00:12, 14062.93 examples/s]
Filter: 77%|███████▋ | 632000/818627 [00:46<00:13, 14104.41 examples/s]
Filter: 78%|███████▊ | 638000/818627 [00:46<00:12, 14205.55 examples/s]
Filter: 77%|███████▋ | 632000/818627 [00:46<00:13, 14010.17 examples/s]
Filter: 77%|███████▋ | 628000/818627 [00:46<00:13, 13900.74 examples/s]
Filter: 78%|███████▊ | 638000/818627 [00:46<00:13, 13835.62 examples/s]
Filter: 77%|███████▋ | 632000/818627 [00:46<00:13, 13906.29 examples/s]
Filter: 78%|███████▊ | 642000/818627 [00:46<00:12, 14233.96 examples/s]
Filter: 78%|███████▊ | 640000/818627 [00:46<00:12, 14091.23 examples/s]
Filter: 77%|███████▋ | 634000/818627 [00:46<00:13, 14130.80 examples/s]
Filter: 78%|███████▊ | 640000/818627 [00:46<00:12, 14214.07 examples/s]
Filter: 77%|███████▋ | 634000/818627 [00:46<00:13, 14020.79 examples/s]
Filter: 77%|███████▋ | 630000/818627 [00:46<00:13, 13800.28 examples/s]
Filter: 78%|███████▊ | 640000/818627 [00:46<00:12, 13902.47 examples/s]
Filter: 77%|███████▋ | 634000/818627 [00:46<00:13, 13978.36 examples/s]
Filter: 79%|███████▊ | 644000/818627 [00:46<00:12, 14066.93 examples/s]
Filter: 78%|███████▊ | 642000/818627 [00:46<00:12, 13978.72 examples/s]
Filter: 78%|███████▊ | 636000/818627 [00:46<00:13, 13879.04 examples/s]
Filter: 78%|███████▊ | 642000/818627 [00:46<00:12, 13969.25 examples/s]
Filter: 78%|███████▊ | 636000/818627 [00:46<00:13, 13797.75 examples/s]
Filter: 77%|███████▋ | 632000/818627 [00:46<00:13, 13748.31 examples/s]
Filter: 78%|███████▊ | 642000/818627 [00:46<00:12, 13877.48 examples/s]
Filter: 78%|███████▊ | 636000/818627 [00:46<00:13, 13897.61 examples/s]
Filter: 79%|███████▉ | 646000/818627 [00:46<00:12, 14194.75 examples/s]
Filter: 79%|███████▊ | 644000/818627 [00:46<00:12, 14007.61 examples/s]
Filter: 78%|███████▊ | 638000/818627 [00:46<00:12, 13966.51 examples/s]
Filter: 79%|███████▊ | 644000/818627 [00:46<00:12, 14055.20 examples/s]
Filter: 78%|███████▊ | 638000/818627 [00:46<00:13, 13862.40 examples/s]
Filter: 77%|███████▋ | 634000/818627 [00:46<00:13, 13708.68 examples/s]
Filter: 79%|███████▊ | 644000/818627 [00:46<00:12, 13909.98 examples/s]
Filter: 78%|███████▊ | 638000/818627 [00:46<00:12, 13986.78 examples/s]
Filter: 79%|███████▉ | 648000/818627 [00:46<00:11, 14308.61 examples/s]
Filter: 79%|███████▉ | 646000/818627 [00:46<00:12, 14116.78 examples/s]
Filter: 78%|███████▊ | 640000/818627 [00:47<00:12, 14004.48 examples/s]
Filter: 79%|███████▉ | 646000/818627 [00:46<00:12, 13733.76 examples/s]
Filter: 78%|███████▊ | 640000/818627 [00:46<00:12, 13912.57 examples/s]
Filter: 78%|███████▊ | 636000/818627 [00:46<00:13, 13801.56 examples/s]
Filter: 79%|███████▉ | 646000/818627 [00:46<00:12, 13973.72 examples/s]
Filter: 78%|███████▊ | 640000/818627 [00:46<00:12, 14045.13 examples/s]
Filter: 79%|███████▉ | 650000/818627 [00:46<00:11, 14386.22 examples/s]
Filter: 78%|███████▊ | 642000/818627 [00:47<00:12, 14053.35 examples/s]
Filter: 79%|███████▉ | 648000/818627 [00:46<00:12, 14021.85 examples/s]
Filter: 79%|███████▉ | 648000/818627 [00:46<00:12, 13798.21 examples/s]
Filter: 78%|███████▊ | 642000/818627 [00:46<00:12, 13958.16 examples/s]
Filter: 78%|███████▊ | 638000/818627 [00:47<00:13, 13854.00 examples/s]
Filter: 79%|███████▉ | 648000/818627 [00:47<00:12, 14038.38 examples/s]
Filter: 78%|███████▊ | 642000/818627 [00:47<00:12, 14088.82 examples/s]
Filter: 80%|███████▉ | 652000/818627 [00:47<00:11, 14437.63 examples/s]
Filter: 79%|███████▊ | 644000/818627 [00:47<00:12, 14084.23 examples/s]
Filter: 79%|███████▉ | 650000/818627 [00:47<00:11, 14096.47 examples/s]
Filter: 79%|███████▉ | 650000/818627 [00:47<00:12, 13935.39 examples/s]
Filter: 79%|███████▊ | 644000/818627 [00:47<00:12, 13897.03 examples/s]
Filter: 78%|███████▊ | 640000/818627 [00:47<00:12, 13765.52 examples/s]
Filter: 79%|███████▉ | 650000/818627 [00:47<00:12, 13983.17 examples/s]
Filter: 79%|███████▊ | 644000/818627 [00:47<00:12, 14117.05 examples/s]
Filter: 80%|███████▉ | 654000/818627 [00:47<00:11, 14451.52 examples/s]
Filter: 80%|███████▉ | 652000/818627 [00:47<00:11, 14089.69 examples/s]
Filter: 79%|███████▉ | 646000/818627 [00:47<00:12, 13974.86 examples/s]
Filter: 80%|███████▉ | 652000/818627 [00:47<00:11, 13947.99 examples/s]
Filter: 79%|███████▉ | 646000/818627 [00:47<00:12, 13897.41 examples/s]
Filter: 78%|███████▊ | 642000/818627 [00:47<00:12, 13772.06 examples/s]
Filter: 80%|███████▉ | 652000/818627 [00:47<00:11, 14001.59 examples/s]
Filter: 79%|███████▉ | 646000/818627 [00:47<00:12, 14009.50 examples/s]
Filter: 80%|████████ | 656000/818627 [00:47<00:11, 14403.54 examples/s]
Filter: 80%|███████▉ | 654000/818627 [00:47<00:11, 14123.68 examples/s]
Filter: 79%|███████▉ | 648000/818627 [00:47<00:12, 14015.77 examples/s]
Filter: 80%|███████▉ | 654000/818627 [00:47<00:11, 14006.12 examples/s]
Filter: 79%|███████▉ | 648000/818627 [00:47<00:12, 13811.73 examples/s]
Filter: 79%|███████▊ | 644000/818627 [00:47<00:12, 13817.70 examples/s]
Filter: 80%|███████▉ | 654000/818627 [00:47<00:11, 14038.63 examples/s]
Filter: 79%|███████▉ | 648000/818627 [00:47<00:12, 14064.38 examples/s]
Filter: 80%|████████ | 658000/818627 [00:47<00:11, 14370.93 examples/s]
Filter: 80%|████████ | 656000/818627 [00:47<00:11, 14028.47 examples/s]
Filter: 79%|███████▉ | 650000/818627 [00:47<00:12, 13936.52 examples/s]
Filter: 80%|████████ | 656000/818627 [00:47<00:11, 13933.52 examples/s]
Filter: 79%|███████▉ | 650000/818627 [00:47<00:12, 13889.56 examples/s]
Filter: 79%|███████▉ | 646000/818627 [00:47<00:12, 13822.56 examples/s]
Filter: 79%|███████▉ | 650000/818627 [00:47<00:11, 14101.31 examples/s]
Filter: 80%|████████ | 656000/818627 [00:47<00:11, 13903.26 examples/s]
Filter: 81%|████████ | 660000/818627 [00:47<00:11, 14393.96 examples/s]
Filter: 80%|███████▉ | 652000/818627 [00:47<00:11, 13996.57 examples/s]
Filter: 80%|████████ | 658000/818627 [00:47<00:11, 14028.54 examples/s]
Filter: 80%|████████ | 658000/818627 [00:47<00:11, 13964.14 examples/s]
Filter: 80%|███████▉ | 652000/818627 [00:47<00:12, 13821.18 examples/s]
Filter: 79%|███████▉ | 648000/818627 [00:47<00:12, 13860.05 examples/s]
Filter: 80%|████████ | 658000/818627 [00:47<00:11, 13970.52 examples/s]
Filter: 80%|███████▉ | 652000/818627 [00:47<00:11, 14029.77 examples/s]
Filter: 81%|████████ | 662000/818627 [00:47<00:10, 14431.24 examples/s]
Filter: 81%|████████ | 660000/818627 [00:47<00:11, 14012.05 examples/s]
Filter: 80%|███████▉ | 654000/818627 [00:48<00:11, 13905.16 examples/s]
Filter: 81%|████████ | 660000/818627 [00:47<00:11, 13906.40 examples/s]
Filter: 80%|███████▉ | 654000/818627 [00:47<00:11, 13880.18 examples/s]
Filter: 79%|███████▉ | 650000/818627 [00:47<00:12, 13895.41 examples/s]
Filter: 81%|████████ | 660000/818627 [00:47<00:11, 14024.99 examples/s]
Filter: 81%|████████ | 664000/818627 [00:47<00:10, 14459.76 examples/s]
Filter: 80%|███████▉ | 654000/818627 [00:47<00:11, 13931.18 examples/s]
Filter: 81%|████████ | 662000/818627 [00:47<00:11, 14078.65 examples/s]
Filter: 80%|████████ | 656000/818627 [00:48<00:11, 13843.60 examples/s]
Filter: 81%|████████ | 662000/818627 [00:47<00:11, 13853.58 examples/s]
Filter: 80%|████████ | 656000/818627 [00:48<00:11, 13936.26 examples/s]
Filter: 80%|███████▉ | 652000/818627 [00:48<00:11, 13922.53 examples/s]
Filter: 81%|████████▏ | 666000/818627 [00:48<00:10, 14475.17 examples/s]
Filter: 81%|████████ | 662000/818627 [00:48<00:11, 14048.14 examples/s]
Filter: 80%|████████ | 656000/818627 [00:48<00:11, 14026.95 examples/s]
Filter: 81%|████████ | 664000/818627 [00:48<00:10, 14132.26 examples/s]
Filter: 80%|████████ | 658000/818627 [00:48<00:11, 13934.61 examples/s]
Filter: 81%|████████ | 664000/818627 [00:48<00:11, 13925.98 examples/s]
Filter: 80%|████████ | 658000/818627 [00:48<00:11, 13862.42 examples/s]
Filter: 80%|███████▉ | 654000/818627 [00:48<00:11, 13832.71 examples/s]
Filter: 82%|████████▏ | 668000/818627 [00:48<00:10, 14524.70 examples/s]
Filter: 81%|████████ | 664000/818627 [00:48<00:10, 14068.83 examples/s]
Filter: 80%|████████ | 658000/818627 [00:48<00:11, 13960.39 examples/s]
Filter: 81%|████████▏ | 666000/818627 [00:48<00:10, 14165.01 examples/s]
Filter: 81%|████████ | 660000/818627 [00:48<00:11, 13998.33 examples/s]
Filter: 81%|████████▏ | 666000/818627 [00:48<00:10, 13989.65 examples/s]
Filter: 81%|████████ | 660000/818627 [00:48<00:11, 13927.58 examples/s]
Filter: 80%|████████ | 656000/818627 [00:48<00:11, 13743.98 examples/s]
Filter: 82%|████████▏ | 670000/818627 [00:48<00:10, 14531.86 examples/s]
Filter: 81%|████████▏ | 666000/818627 [00:48<00:10, 14050.66 examples/s]
Filter: 81%|████████ | 660000/818627 [00:48<00:11, 14008.35 examples/s]
Filter: 82%|████████▏ | 668000/818627 [00:48<00:10, 14174.39 examples/s]
Filter: 81%|████████ | 662000/818627 [00:48<00:11, 14048.14 examples/s]
Filter: 82%|████████▏ | 668000/818627 [00:48<00:10, 13894.92 examples/s]
Filter: 81%|████████ | 662000/818627 [00:48<00:11, 13844.42 examples/s]
Filter: 82%|████████▏ | 672000/818627 [00:48<00:10, 14514.39 examples/s]
Filter: 80%|████████ | 658000/818627 [00:48<00:11, 13800.31 examples/s]
Filter: 82%|████████▏ | 668000/818627 [00:48<00:10, 14036.13 examples/s]
Filter: 81%|████████ | 662000/818627 [00:48<00:11, 14034.15 examples/s]
Filter: 82%|████████▏ | 670000/818627 [00:48<00:10, 14206.20 examples/s]
Filter: 81%|████████ | 664000/818627 [00:48<00:11, 13937.38 examples/s]
Filter: 82%|████████▏ | 670000/818627 [00:48<00:10, 13788.74 examples/s]
Filter: 81%|████████ | 664000/818627 [00:48<00:11, 13918.27 examples/s]
Filter: 82%|████████▏ | 674000/818627 [00:48<00:09, 14526.44 examples/s]
Filter: 81%|████████ | 660000/818627 [00:48<00:11, 13869.32 examples/s]
Filter: 82%|████████▏ | 670000/818627 [00:48<00:10, 13958.76 examples/s]
Filter: 81%|████████ | 664000/818627 [00:48<00:11, 13945.86 examples/s]
Filter: 82%|████████▏ | 672000/818627 [00:48<00:10, 13986.59 examples/s]
Filter: 81%|████████▏ | 666000/818627 [00:48<00:10, 13880.17 examples/s]
Filter: 82%|████████▏ | 672000/818627 [00:48<00:10, 13677.45 examples/s]
Filter: 81%|████████▏ | 666000/818627 [00:48<00:11, 13809.88 examples/s]
Filter: 83%|████████▎ | 676000/818627 [00:48<00:09, 14376.14 examples/s]
Filter: 81%|████████ | 662000/818627 [00:48<00:11, 13699.24 examples/s]
Filter: 82%|████████▏ | 672000/818627 [00:48<00:10, 14041.85 examples/s]
Filter: 81%|████████▏ | 666000/818627 [00:48<00:10, 13997.49 examples/s]
Filter: 82%|████████▏ | 674000/818627 [00:48<00:10, 13970.34 examples/s]
Filter: 82%|████████▏ | 668000/818627 [00:49<00:10, 13967.95 examples/s]
Filter: 82%|████████▏ | 674000/818627 [00:48<00:10, 13838.39 examples/s]
Filter: 83%|████████▎ | 678000/818627 [00:48<00:09, 14425.84 examples/s]
Filter: 82%|████████▏ | 668000/818627 [00:48<00:10, 13879.76 examples/s]
Filter: 81%|████████ | 664000/818627 [00:48<00:11, 13810.68 examples/s]
Filter: 82%|████████▏ | 674000/818627 [00:48<00:10, 13997.46 examples/s]
Filter: 82%|████████▏ | 668000/818627 [00:48<00:10, 13899.30 examples/s]
Filter: 83%|████████▎ | 676000/818627 [00:48<00:10, 14071.57 examples/s]
Filter: 82%|████████▏ | 670000/818627 [00:49<00:10, 13897.79 examples/s]
Filter: 83%|████████▎ | 676000/818627 [00:48<00:10, 13957.45 examples/s]
Filter: 83%|████████▎ | 680000/818627 [00:48<00:09, 14443.89 examples/s]
Filter: 82%|████████▏ | 670000/818627 [00:49<00:10, 13940.62 examples/s]
Filter: 81%|████████▏ | 666000/818627 [00:49<00:10, 13892.35 examples/s]
Filter: 83%|████████▎ | 676000/818627 [00:49<00:10, 14076.88 examples/s]
Filter: 82%|████████▏ | 670000/818627 [00:49<00:10, 13958.06 examples/s]
Filter: 83%|████████▎ | 678000/818627 [00:49<00:09, 14161.57 examples/s]
Filter: 82%|████████▏ | 672000/818627 [00:49<00:10, 13988.55 examples/s]
Filter: 83%|████████▎ | 678000/818627 [00:49<00:10, 14037.33 examples/s]
Filter: 83%|████████▎ | 682000/818627 [00:49<00:09, 14333.08 examples/s]
Filter: 82%|████████▏ | 672000/818627 [00:49<00:10, 13868.13 examples/s]
Filter: 82%|████████▏ | 668000/818627 [00:49<00:10, 13889.28 examples/s]
Filter: 83%|████████▎ | 678000/818627 [00:49<00:09, 14103.67 examples/s]
Filter: 82%|████████▏ | 672000/818627 [00:49<00:10, 14008.19 examples/s]
Filter: 83%|████████▎ | 680000/818627 [00:49<00:09, 14125.12 examples/s]
Filter: 83%|████████▎ | 680000/818627 [00:49<00:09, 14104.56 examples/s]
Filter: 82%|████████▏ | 674000/818627 [00:49<00:10, 13820.89 examples/s]
Filter: 84%|████████▎ | 684000/818627 [00:49<00:09, 14357.58 examples/s]
Filter: 82%|████████▏ | 674000/818627 [00:49<00:10, 13926.06 examples/s]
Filter: 82%|████████▏ | 670000/818627 [00:49<00:10, 13947.41 examples/s]
Filter: 83%|████████▎ | 680000/818627 [00:49<00:09, 14152.62 examples/s]
Filter: 82%|████████▏ | 674000/818627 [00:49<00:10, 13910.28 examples/s]
Filter: 83%|████████▎ | 682000/818627 [00:49<00:09, 14150.07 examples/s]
Filter: 83%|████████▎ | 682000/818627 [00:49<00:09, 14145.32 examples/s]
Filter: 83%|████████▎ | 676000/818627 [00:49<00:10, 13876.72 examples/s]
Filter: 84%|████████▍ | 686000/818627 [00:49<00:09, 14255.03 examples/s]
Filter: 83%|████████▎ | 676000/818627 [00:49<00:10, 13966.31 examples/s]
Filter: 82%|████████▏ | 672000/818627 [00:49<00:10, 14000.84 examples/s]
Filter: 83%|████████▎ | 682000/818627 [00:49<00:09, 14171.03 examples/s]
Filter: 83%|████████▎ | 676000/818627 [00:49<00:10, 13958.70 examples/s]
Filter: 84%|████████▎ | 684000/818627 [00:49<00:09, 14185.47 examples/s]
Filter: 84%|████████▎ | 684000/818627 [00:49<00:09, 14183.60 examples/s]
Filter: 83%|████████▎ | 678000/818627 [00:49<00:10, 13952.33 examples/s]
Filter: 84%|████████▍ | 688000/818627 [00:49<00:09, 14330.30 examples/s]
Filter: 83%|████████▎ | 678000/818627 [00:49<00:10, 13875.21 examples/s]
Filter: 82%|████████▏ | 674000/818627 [00:49<00:10, 14048.21 examples/s]
Filter: 84%|████████▎ | 684000/818627 [00:49<00:09, 14194.99 examples/s]
Filter: 83%|████████▎ | 678000/818627 [00:49<00:10, 13809.07 examples/s]
Filter: 84%|████████▍ | 686000/818627 [00:49<00:09, 14235.17 examples/s]
Filter: 84%|████████▍ | 686000/818627 [00:49<00:09, 14204.34 examples/s]
Filter: 83%|████████▎ | 680000/818627 [00:49<00:10, 13856.63 examples/s]
Filter: 84%|████████▍ | 690000/818627 [00:49<00:08, 14361.33 examples/s]
Filter: 83%|████████▎ | 680000/818627 [00:49<00:09, 13933.55 examples/s]
Filter: 83%|████████▎ | 676000/818627 [00:49<00:10, 14055.75 examples/s]
Filter: 84%|████████▍ | 686000/818627 [00:49<00:09, 14223.21 examples/s]
Filter: 83%|████████▎ | 680000/818627 [00:49<00:10, 13729.70 examples/s]
Filter: 84%|████████▍ | 688000/818627 [00:49<00:09, 14276.32 examples/s]
Filter: 84%|████████▍ | 688000/818627 [00:49<00:09, 14235.16 examples/s]
Filter: 83%|████████▎ | 682000/818627 [00:50<00:09, 13949.00 examples/s]
Filter: 85%|████████▍ | 692000/818627 [00:49<00:08, 14408.20 examples/s]
Filter: 83%|████████▎ | 682000/818627 [00:49<00:09, 13976.81 examples/s]
Filter: 83%|████████▎ | 678000/818627 [00:49<00:10, 14060.35 examples/s]
Filter: 84%|████████▍ | 688000/818627 [00:49<00:09, 14192.54 examples/s]
Filter: 83%|████████▎ | 682000/818627 [00:49<00:09, 13831.69 examples/s]
Filter: 84%|████████▍ | 690000/818627 [00:49<00:09, 14289.23 examples/s]
Filter: 84%|████████▍ | 690000/818627 [00:49<00:09, 14217.79 examples/s]
Filter: 85%|████████▍ | 694000/818627 [00:49<00:08, 14434.58 examples/s]
Filter: 84%|████████▎ | 684000/818627 [00:50<00:09, 13866.63 examples/s]
Filter: 84%|████████▎ | 684000/818627 [00:50<00:09, 13873.79 examples/s]
Filter: 84%|████████▍ | 690000/818627 [00:50<00:09, 14191.48 examples/s]
Filter: 83%|████████▎ | 680000/818627 [00:50<00:09, 14065.38 examples/s]
Filter: 84%|████████▎ | 684000/818627 [00:50<00:09, 13889.65 examples/s]
Filter: 85%|████████▍ | 692000/818627 [00:50<00:08, 14230.51 examples/s]
Filter: 85%|████████▍ | 692000/818627 [00:50<00:08, 14178.61 examples/s]
Filter: 85%|████████▌ | 696000/818627 [00:50<00:08, 14419.56 examples/s]
Filter: 84%|████████▍ | 686000/818627 [00:50<00:09, 13952.06 examples/s]
Filter: 84%|████████▍ | 686000/818627 [00:50<00:09, 13796.77 examples/s]
Filter: 83%|████████▎ | 682000/818627 [00:50<00:09, 14027.05 examples/s]
Filter: 85%|████████▍ | 692000/818627 [00:50<00:09, 13990.41 examples/s]
Filter: 84%|████████▍ | 686000/818627 [00:50<00:09, 13905.81 examples/s]
Filter: 85%|████████▍ | 694000/818627 [00:50<00:08, 14225.23 examples/s]
Filter: 85%|████████▍ | 694000/818627 [00:50<00:08, 14186.79 examples/s]
Filter: 85%|████████▌ | 698000/818627 [00:50<00:08, 14397.34 examples/s]
Filter: 84%|████████▍ | 688000/818627 [00:50<00:09, 14037.89 examples/s]
Filter: 84%|████████▍ | 688000/818627 [00:50<00:09, 13877.83 examples/s]
Filter: 84%|████████▎ | 684000/818627 [00:50<00:09, 14014.29 examples/s]
Filter: 85%|████████▍ | 694000/818627 [00:50<00:08, 14023.98 examples/s]
Filter: 84%|████████▍ | 688000/818627 [00:50<00:09, 13838.41 examples/s]
Filter: 85%|████████▌ | 696000/818627 [00:50<00:08, 14212.58 examples/s]
Filter: 85%|████████▌ | 696000/818627 [00:50<00:08, 14200.66 examples/s]
Filter: 86%|████████▌ | 700000/818627 [00:50<00:08, 14401.99 examples/s]
Filter: 84%|████████▍ | 690000/818627 [00:50<00:09, 14081.64 examples/s]
Filter: 84%|████████▍ | 690000/818627 [00:50<00:09, 13938.84 examples/s]
Filter: 85%|████████▌ | 696000/818627 [00:50<00:08, 14092.89 examples/s]
Filter: 84%|████████▍ | 686000/818627 [00:50<00:09, 13901.37 examples/s]
Filter: 84%|████████▍ | 690000/818627 [00:50<00:09, 13907.39 examples/s]
Filter: 85%|████████▌ | 698000/818627 [00:50<00:08, 14258.71 examples/s]
Filter: 85%|████████▌ | 698000/818627 [00:50<00:08, 14206.92 examples/s]
Filter: 86%|████████▌ | 702000/818627 [00:50<00:08, 14277.63 examples/s]
Filter: 85%|████████▍ | 692000/818627 [00:50<00:08, 14105.29 examples/s]
Filter: 85%|████████▍ | 692000/818627 [00:50<00:09, 13969.32 examples/s]
Filter: 85%|████████▌ | 698000/818627 [00:50<00:08, 14099.99 examples/s]
Filter: 84%|████████▍ | 688000/818627 [00:50<00:09, 13846.88 examples/s]
Filter: 85%|████████▍ | 692000/818627 [00:50<00:09, 13821.45 examples/s]
Filter: 86%|████████▌ | 700000/818627 [00:50<00:08, 14243.38 examples/s]
Filter: 86%|████████▌ | 700000/818627 [00:50<00:08, 14201.46 examples/s]
Filter: 86%|████████▌ | 704000/818627 [00:50<00:08, 14303.35 examples/s]
Filter: 85%|████████▍ | 694000/818627 [00:50<00:08, 14090.02 examples/s]
Filter: 85%|████████▍ | 694000/818627 [00:50<00:08, 13998.38 examples/s]
Filter: 86%|████████▌ | 700000/818627 [00:50<00:08, 14099.64 examples/s]
Filter: 84%|████████▍ | 690000/818627 [00:50<00:09, 13844.94 examples/s]
Filter: 85%|████████▍ | 694000/818627 [00:50<00:08, 13878.86 examples/s]
Filter: 86%|████████▌ | 702000/818627 [00:50<00:08, 13913.22 examples/s]
Filter: 86%|████████▌ | 702000/818627 [00:50<00:08, 14203.72 examples/s]
Filter: 86%|████████▌ | 706000/818627 [00:50<00:07, 14354.69 examples/s]
Filter: 85%|████████▌ | 696000/818627 [00:51<00:08, 14117.36 examples/s]
Filter: 85%|████████▌ | 696000/818627 [00:50<00:08, 14018.91 examples/s]
Filter: 86%|████████▌ | 702000/818627 [00:50<00:08, 14137.80 examples/s]
Filter: 85%|████████▍ | 692000/818627 [00:50<00:09, 13933.70 examples/s]
Filter: 85%|████████▌ | 696000/818627 [00:50<00:08, 13918.88 examples/s]
Filter: 86%|████████▌ | 704000/818627 [00:50<00:08, 14013.02 examples/s]
Filter: 86%|████████▌ | 704000/818627 [00:50<00:08, 14224.65 examples/s]
Filter: 86%|████████▋ | 708000/818627 [00:50<00:07, 14395.13 examples/s]
Filter: 85%|████████▌ | 698000/818627 [00:51<00:08, 14160.51 examples/s]
Filter: 86%|████████▌ | 704000/818627 [00:51<00:08, 14180.34 examples/s]
Filter: 85%|████████▌ | 698000/818627 [00:51<00:08, 13900.13 examples/s]
Filter: 85%|████████▍ | 694000/818627 [00:51<00:08, 13971.31 examples/s]
Filter: 85%|████████▌ | 698000/818627 [00:51<00:08, 13850.80 examples/s]
Filter: 86%|████████▌ | 706000/818627 [00:51<00:07, 14109.78 examples/s]
Filter: 87%|████████▋ | 710000/818627 [00:51<00:07, 14425.30 examples/s]
Filter: 86%|████████▌ | 706000/818627 [00:51<00:07, 14242.29 examples/s]
Filter: 86%|████████▌ | 700000/818627 [00:51<00:08, 14187.63 examples/s]
Filter: 86%|████████▌ | 706000/818627 [00:51<00:07, 14214.86 examples/s]
Filter: 86%|████████▌ | 700000/818627 [00:51<00:08, 13847.05 examples/s]
Filter: 85%|████████▌ | 696000/818627 [00:51<00:08, 14015.15 examples/s]
Filter: 86%|████████▌ | 700000/818627 [00:51<00:08, 13946.43 examples/s]
Filter: 86%|████████▋ | 708000/818627 [00:51<00:07, 14177.41 examples/s]
Filter: 87%|████████▋ | 712000/818627 [00:51<00:07, 14438.93 examples/s]
Filter: 86%|████████▋ | 708000/818627 [00:51<00:07, 14246.65 examples/s]
Filter: 86%|████████▌ | 702000/818627 [00:51<00:08, 14196.24 examples/s]
Filter: 86%|████████▋ | 708000/818627 [00:51<00:07, 14218.30 examples/s]
Filter: 86%|████████▌ | 702000/818627 [00:51<00:08, 13833.92 examples/s]
Filter: 85%|████████▌ | 698000/818627 [00:51<00:08, 14031.44 examples/s]
Filter: 86%|████████▌ | 702000/818627 [00:51<00:08, 13988.30 examples/s]
Filter: 87%|████████▋ | 710000/818627 [00:51<00:07, 14228.40 examples/s]
Filter: 87%|████████▋ | 714000/818627 [00:51<00:07, 14435.60 examples/s]
Filter: 87%|████████▋ | 710000/818627 [00:51<00:07, 14124.75 examples/s]
Filter: 86%|████████▌ | 704000/818627 [00:51<00:08, 14179.09 examples/s]
Filter: 87%|████████▋ | 710000/818627 [00:51<00:07, 14102.11 examples/s]
Filter: 86%|████████▌ | 700000/818627 [00:51<00:08, 14065.40 examples/s]
Filter: 86%|████████▌ | 704000/818627 [00:51<00:08, 13879.58 examples/s]
Filter: 86%|████████▌ | 704000/818627 [00:51<00:08, 13996.57 examples/s]
Filter: 87%|████████▋ | 712000/818627 [00:51<00:07, 14239.12 examples/s]
Filter: 87%|████████▋ | 716000/818627 [00:51<00:07, 14427.11 examples/s]
Filter: 87%|████████▋ | 712000/818627 [00:51<00:07, 14139.51 examples/s]
Filter: 86%|████████▌ | 706000/818627 [00:51<00:07, 14086.91 examples/s]
Filter: 87%|████████▋ | 712000/818627 [00:51<00:07, 14137.32 examples/s]
Filter: 86%|████████▌ | 706000/818627 [00:51<00:08, 13923.71 examples/s]
Filter: 86%|████████▌ | 702000/818627 [00:51<00:08, 13939.66 examples/s]
Filter: 87%|████████▋ | 714000/818627 [00:51<00:07, 14258.65 examples/s]
Filter: 86%|████████▌ | 706000/818627 [00:51<00:08, 13996.88 examples/s]
Filter: 88%|████████▊ | 718000/818627 [00:51<00:06, 14435.04 examples/s]
Filter: 87%|████████▋ | 714000/818627 [00:51<00:07, 14161.91 examples/s]
Filter: 86%|████████▋ | 708000/818627 [00:51<00:07, 14123.87 examples/s]
Filter: 87%|████████▋ | 714000/818627 [00:51<00:07, 14172.65 examples/s]
Filter: 86%|████████▋ | 708000/818627 [00:51<00:07, 13963.06 examples/s]
Filter: 86%|████████▌ | 704000/818627 [00:51<00:08, 13952.85 examples/s]
Filter: 87%|████████▋ | 716000/818627 [00:51<00:07, 14164.19 examples/s]
Filter: 86%|████████▋ | 708000/818627 [00:51<00:07, 13898.28 examples/s]
Filter: 88%|████████▊ | 720000/818627 [00:51<00:07, 14042.82 examples/s]
Filter: 87%|████████▋ | 716000/818627 [00:51<00:07, 14142.60 examples/s]
Filter: 87%|████████▋ | 710000/818627 [00:52<00:07, 14138.95 examples/s]
Filter: 87%|████████▋ | 716000/818627 [00:51<00:07, 14187.62 examples/s]
Filter: 87%|████████▋ | 710000/818627 [00:51<00:07, 14005.66 examples/s]
Filter: 86%|████████▌ | 706000/818627 [00:51<00:08, 13999.41 examples/s]
Filter: 88%|████████▊ | 718000/818627 [00:51<00:07, 14089.50 examples/s]
Filter: 87%|████████▋ | 710000/818627 [00:51<00:07, 13957.78 examples/s]
Filter: 88%|████████▊ | 722000/818627 [00:51<00:06, 14138.22 examples/s]
Filter: 88%|████████▊ | 718000/818627 [00:51<00:07, 14168.64 examples/s]
Filter: 87%|████████▋ | 712000/818627 [00:52<00:07, 13987.18 examples/s]
Filter: 88%|████████▊ | 718000/818627 [00:52<00:07, 14140.54 examples/s]
Filter: 87%|████████▋ | 712000/818627 [00:52<00:07, 14014.23 examples/s]
Filter: 86%|████████▋ | 708000/818627 [00:52<00:07, 14015.38 examples/s]
Filter: 88%|████████▊ | 720000/818627 [00:52<00:06, 14135.69 examples/s]
Filter: 87%|████████▋ | 712000/818627 [00:52<00:07, 13923.31 examples/s]
Filter: 88%|████████▊ | 724000/818627 [00:52<00:06, 14083.40 examples/s]
Filter: 88%|████████▊ | 720000/818627 [00:52<00:06, 14195.21 examples/s]
Filter: 87%|████████▋ | 714000/818627 [00:52<00:07, 14064.23 examples/s]
Filter: 88%|████████▊ | 720000/818627 [00:52<00:07, 13893.37 examples/s]
Filter: 87%|████████▋ | 714000/818627 [00:52<00:07, 13983.27 examples/s]
Filter: 87%|████████▋ | 710000/818627 [00:52<00:07, 13767.94 examples/s]
Filter: 88%|████████▊ | 722000/818627 [00:52<00:06, 14096.53 examples/s]
Filter: 87%|████████▋ | 714000/818627 [00:52<00:07, 13840.10 examples/s]
Filter: 88%|████████▊ | 722000/818627 [00:52<00:06, 14191.23 examples/s]
Filter: 89%|████████▊ | 726000/818627 [00:52<00:06, 14046.51 examples/s]
Filter: 87%|████████▋ | 716000/818627 [00:52<00:07, 13984.71 examples/s]
Filter: 88%|████████▊ | 722000/818627 [00:52<00:06, 13869.68 examples/s]
Filter: 87%|████████▋ | 716000/818627 [00:52<00:07, 13987.56 examples/s]
Filter: 87%|████████▋ | 712000/818627 [00:52<00:07, 13840.15 examples/s]
Filter: 88%|████████▊ | 724000/818627 [00:52<00:06, 13916.76 examples/s]
Filter: 87%|████████▋ | 716000/818627 [00:52<00:07, 13814.26 examples/s]
Filter: 89%|████████▉ | 728000/818627 [00:52<00:06, 14133.92 examples/s]
Filter: 88%|████████▊ | 724000/818627 [00:52<00:06, 14192.99 examples/s]
Filter: 88%|████████▊ | 718000/818627 [00:52<00:07, 14060.61 examples/s]
Filter: 88%|████████▊ | 724000/818627 [00:52<00:06, 13864.21 examples/s]
Filter: 88%|████████▊ | 718000/818627 [00:52<00:07, 13963.95 examples/s]
Filter: 87%|████████▋ | 714000/818627 [00:52<00:07, 13894.89 examples/s]
Filter: 89%|████████▊ | 726000/818627 [00:52<00:06, 13790.27 examples/s]
Filter: 89%|████████▉ | 730000/818627 [00:52<00:06, 13923.46 examples/s]
Filter: 89%|████████▊ | 726000/818627 [00:52<00:06, 13968.60 examples/s]
Filter: 88%|████████▊ | 718000/818627 [00:52<00:07, 13380.14 examples/s]
Filter: 88%|████████▊ | 720000/818627 [00:52<00:07, 13739.87 examples/s]
Filter: 89%|████████▊ | 726000/818627 [00:52<00:06, 13857.36 examples/s]
Filter: 88%|████████▊ | 720000/818627 [00:52<00:07, 13895.35 examples/s]
Filter: 87%|████████▋ | 716000/818627 [00:52<00:07, 13832.27 examples/s]
Filter: 89%|████████▉ | 728000/818627 [00:52<00:06, 13969.16 examples/s]
Filter: 89%|████████▉ | 732000/818627 [00:52<00:06, 14059.12 examples/s]
Filter: 89%|████████▉ | 728000/818627 [00:52<00:06, 14056.47 examples/s]
Filter: 88%|████████▊ | 720000/818627 [00:52<00:07, 13578.67 examples/s]
Filter: 88%|████████▊ | 722000/818627 [00:52<00:06, 13866.37 examples/s]
Filter: 89%|████████▉ | 728000/818627 [00:52<00:06, 13855.13 examples/s]
Filter: 88%|████████▊ | 722000/818627 [00:52<00:06, 13940.78 examples/s]
Filter: 88%|████████▊ | 718000/818627 [00:52<00:07, 13913.92 examples/s]
Filter: 89%|████████▉ | 730000/818627 [00:52<00:06, 13934.65 examples/s]
Filter: 90%|████████▉ | 734000/818627 [00:52<00:05, 14156.49 examples/s]
Filter: 89%|████████▉ | 730000/818627 [00:52<00:06, 14094.84 examples/s]
Filter: 88%|████████▊ | 722000/818627 [00:52<00:07, 13594.33 examples/s]
Filter: 88%|████████▊ | 724000/818627 [00:53<00:06, 13962.89 examples/s]
Filter: 89%|████████▉ | 730000/818627 [00:52<00:06, 13917.43 examples/s]
Filter: 88%|████████▊ | 724000/818627 [00:52<00:06, 13975.81 examples/s]
Filter: 88%|████████▊ | 720000/818627 [00:52<00:07, 13947.76 examples/s]
Filter: 89%|████████▉ | 732000/818627 [00:52<00:06, 14013.30 examples/s]
Filter: 90%|████████▉ | 736000/818627 [00:52<00:05, 14189.30 examples/s]
Filter: 89%|████████▉ | 732000/818627 [00:52<00:06, 14121.75 examples/s]
Filter: 88%|████████▊ | 724000/818627 [00:52<00:06, 13609.61 examples/s]
Filter: 89%|████████▊ | 726000/818627 [00:53<00:06, 14018.32 examples/s]
Filter: 89%|████████▉ | 732000/818627 [00:53<00:06, 14007.09 examples/s]
Filter: 89%|████████▊ | 726000/818627 [00:53<00:06, 13757.14 examples/s]
Filter: 88%|████████▊ | 722000/818627 [00:53<00:06, 13995.22 examples/s]
Filter: 90%|████████▉ | 734000/818627 [00:53<00:06, 14101.35 examples/s]
Filter: 90%|█████████ | 738000/818627 [00:53<00:05, 14241.45 examples/s]
Filter: 90%|████████▉ | 734000/818627 [00:53<00:05, 14169.27 examples/s]
Filter: 89%|████████▊ | 726000/818627 [00:53<00:06, 13614.45 examples/s]
Filter: 89%|████████▉ | 728000/818627 [00:53<00:06, 13988.87 examples/s]
Filter: 90%|████████▉ | 734000/818627 [00:53<00:06, 13958.92 examples/s]
Filter: 89%|████████▉ | 728000/818627 [00:53<00:06, 13846.54 examples/s]
Filter: 88%|████████▊ | 724000/818627 [00:53<00:06, 13914.08 examples/s]
Filter: 90%|████████▉ | 736000/818627 [00:53<00:05, 14157.50 examples/s]
Filter: 90%|█████████ | 740000/818627 [00:53<00:05, 14267.55 examples/s]
Filter: 90%|████████▉ | 736000/818627 [00:53<00:05, 14207.32 examples/s]
Filter: 89%|████████▉ | 728000/818627 [00:53<00:06, 13763.07 examples/s]
Filter: 89%|████████▉ | 730000/818627 [00:53<00:06, 14011.91 examples/s]
Filter: 90%|████████▉ | 736000/818627 [00:53<00:05, 13909.29 examples/s]
Filter: 89%|████████▉ | 730000/818627 [00:53<00:06, 13899.05 examples/s]
Filter: 89%|████████▊ | 726000/818627 [00:53<00:06, 13984.43 examples/s]
Filter: 90%|█████████ | 738000/818627 [00:53<00:05, 14208.31 examples/s]
Filter: 91%|█████████ | 742000/818627 [00:53<00:05, 14207.19 examples/s]
Filter: 90%|█████████ | 738000/818627 [00:53<00:05, 14211.22 examples/s]
Filter: 89%|████████▉ | 730000/818627 [00:53<00:06, 13744.18 examples/s]
Filter: 89%|████████▉ | 732000/818627 [00:53<00:06, 14059.52 examples/s]
Filter: 90%|█████████ | 738000/818627 [00:53<00:05, 14010.59 examples/s]
Filter: 89%|████████▉ | 732000/818627 [00:53<00:06, 13952.65 examples/s]
Filter: 89%|████████▉ | 728000/818627 [00:53<00:06, 14038.16 examples/s]
Filter: 90%|█████████ | 740000/818627 [00:53<00:05, 14242.94 examples/s]
Filter: 91%|█████████ | 744000/818627 [00:53<00:05, 14295.13 examples/s]
Filter: 90%|█████████ | 740000/818627 [00:53<00:05, 14240.78 examples/s]
Filter: 89%|████████▉ | 732000/818627 [00:53<00:06, 13872.53 examples/s]
Filter: 90%|████████▉ | 734000/818627 [00:53<00:06, 14103.36 examples/s]
Filter: 90%|█████████ | 740000/818627 [00:53<00:05, 14088.86 examples/s]
Filter: 89%|████████▉ | 730000/818627 [00:53<00:06, 14046.84 examples/s]
Filter: 90%|████████▉ | 734000/818627 [00:53<00:06, 13867.69 examples/s]
Filter: 91%|█████████ | 742000/818627 [00:53<00:05, 14172.43 examples/s]
Filter: 91%|█████████ | 746000/818627 [00:53<00:05, 14237.08 examples/s]
Filter: 91%|█████████ | 742000/818627 [00:53<00:05, 14161.01 examples/s]
Filter: 90%|████████▉ | 734000/818627 [00:53<00:06, 13940.16 examples/s]
Filter: 90%|████████▉ | 736000/818627 [00:53<00:05, 14080.63 examples/s]
Filter: 91%|█████████ | 742000/818627 [00:53<00:05, 14044.26 examples/s]
Filter: 89%|████████▉ | 732000/818627 [00:53<00:06, 14083.06 examples/s]
Filter: 90%|████████▉ | 736000/818627 [00:53<00:05, 13919.88 examples/s]
Filter: 91%|█████████ | 744000/818627 [00:53<00:05, 14157.01 examples/s]
Filter: 91%|█████████▏| 748000/818627 [00:53<00:04, 14190.79 examples/s]
Filter: 91%|█████████ | 744000/818627 [00:53<00:05, 14214.89 examples/s]
Filter: 90%|████████▉ | 736000/818627 [00:53<00:05, 13982.53 examples/s]
Filter: 90%|█████████ | 738000/818627 [00:54<00:05, 13984.64 examples/s]
Filter: 91%|█████████ | 744000/818627 [00:53<00:05, 14102.33 examples/s]
Filter: 90%|████████▉ | 734000/818627 [00:53<00:06, 14080.03 examples/s]
Filter: 90%|█████████ | 738000/818627 [00:53<00:05, 13982.62 examples/s]
Filter: 91%|█████████ | 746000/818627 [00:53<00:05, 14221.05 examples/s]
Filter: 92%|█████████▏| 750000/818627 [00:53<00:04, 14168.82 examples/s]
Filter: 91%|█████████ | 746000/818627 [00:53<00:05, 14251.62 examples/s]
Filter: 90%|█████████ | 738000/818627 [00:53<00:05, 13535.62 examples/s]
Filter: 90%|█████████ | 740000/818627 [00:54<00:05, 13681.38 examples/s]
Filter: 91%|█████████ | 746000/818627 [00:54<00:05, 14164.75 examples/s]
Filter: 90%|████████▉ | 736000/818627 [00:54<00:05, 14080.74 examples/s]
Filter: 90%|█████████ | 740000/818627 [00:54<00:05, 13889.87 examples/s]
Filter: 91%|█████████▏| 748000/818627 [00:54<00:04, 14271.56 examples/s]
Filter: 92%|█████████▏| 752000/818627 [00:54<00:04, 14287.40 examples/s]
Filter: 91%|█████████▏| 748000/818627 [00:54<00:04, 14294.73 examples/s]
Filter: 90%|█████████ | 740000/818627 [00:54<00:05, 13602.60 examples/s]
Filter: 91%|█████████ | 742000/818627 [00:54<00:05, 13685.84 examples/s]
Filter: 91%|█████████▏| 748000/818627 [00:54<00:05, 14086.12 examples/s]
Filter: 90%|█████████ | 738000/818627 [00:54<00:05, 13985.92 examples/s]
Filter: 91%|█████████ | 742000/818627 [00:54<00:05, 13980.31 examples/s]
Filter: 92%|█████████▏| 750000/818627 [00:54<00:04, 14300.16 examples/s]
Filter: 92%|█████████▏| 754000/818627 [00:54<00:04, 14238.05 examples/s]
Filter: 92%|█████████▏| 750000/818627 [00:54<00:04, 14310.20 examples/s]
Filter: 91%|█████████ | 742000/818627 [00:54<00:05, 13744.40 examples/s]
Filter: 91%|█████████ | 744000/818627 [00:54<00:05, 13831.53 examples/s]
Filter: 92%|█████████▏| 750000/818627 [00:54<00:04, 13792.31 examples/s]
Filter: 90%|█████████ | 740000/818627 [00:54<00:05, 14047.00 examples/s]
Filter: 91%|█████████ | 744000/818627 [00:54<00:05, 13913.51 examples/s]
Filter: 92%|█████████▏| 752000/818627 [00:54<00:04, 14321.06 examples/s]
Filter: 92%|█████████▏| 752000/818627 [00:54<00:04, 14299.81 examples/s]
Filter: 92%|█████████▏| 756000/818627 [00:54<00:04, 14181.63 examples/s]
Filter: 91%|█████████ | 744000/818627 [00:54<00:05, 13717.36 examples/s]
Filter: 91%|█████████ | 746000/818627 [00:54<00:05, 13830.17 examples/s]
Filter: 92%|█████████▏| 752000/818627 [00:54<00:04, 13916.35 examples/s]
Filter: 91%|█████████ | 742000/818627 [00:54<00:05, 14093.29 examples/s]
Filter: 92%|█████████▏| 754000/818627 [00:54<00:04, 14340.44 examples/s]
Filter: 93%|█████████▎| 758000/818627 [00:54<00:04, 14275.80 examples/s]
Filter: 91%|█████████ | 746000/818627 [00:54<00:05, 13703.14 examples/s]
Filter: 92%|█████████▏| 754000/818627 [00:54<00:04, 14286.96 examples/s]
Filter: 91%|█████████ | 746000/818627 [00:54<00:05, 13723.35 examples/s]
Filter: 91%|█████████▏| 748000/818627 [00:54<00:05, 13798.11 examples/s]
Filter: 92%|█████████▏| 754000/818627 [00:54<00:04, 14021.69 examples/s]
Filter: 91%|█████████ | 744000/818627 [00:54<00:05, 13970.54 examples/s]
Filter: 92%|█████████▏| 756000/818627 [00:54<00:04, 13965.57 examples/s]
Filter: 91%|█████████▏| 748000/818627 [00:54<00:05, 13822.58 examples/s]
Filter: 93%|█████████▎| 760000/818627 [00:54<00:04, 14072.79 examples/s]
Filter: 92%|█████████▏| 756000/818627 [00:54<00:04, 14140.80 examples/s]
Filter: 92%|█████████▏| 750000/818627 [00:54<00:04, 13790.16 examples/s]
Filter: 91%|█████████▏| 748000/818627 [00:54<00:05, 13601.40 examples/s]
Filter: 92%|█████████▏| 756000/818627 [00:54<00:04, 13960.37 examples/s]
Filter: 91%|█████████ | 746000/818627 [00:54<00:05, 13903.51 examples/s]
Filter: 93%|█████████▎| 762000/818627 [00:54<00:03, 14182.89 examples/s]
Filter: 93%|█████████▎| 758000/818627 [00:54<00:04, 13958.05 examples/s]
Filter: 92%|█████████▏| 750000/818627 [00:54<00:04, 13790.68 examples/s]
Filter: 93%|█████████▎| 758000/818627 [00:54<00:04, 14088.58 examples/s]
Filter: 92%|█████████▏| 752000/818627 [00:55<00:04, 13898.76 examples/s]
Filter: 92%|█████████▏| 750000/818627 [00:54<00:05, 13643.10 examples/s]
Filter: 93%|█████████▎| 758000/818627 [00:54<00:04, 13953.24 examples/s]
Filter: 91%|█████████▏| 748000/818627 [00:54<00:05, 13980.51 examples/s]
Filter: 93%|█████████▎| 764000/818627 [00:54<00:03, 14262.88 examples/s]
Filter: 93%|█████████▎| 760000/818627 [00:54<00:04, 14079.19 examples/s]
Filter: 93%|█████████▎| 760000/818627 [00:54<00:04, 14150.01 examples/s]
Filter: 92%|█████████▏| 752000/818627 [00:54<00:04, 13891.78 examples/s]
Filter: 92%|█████████▏| 754000/818627 [00:55<00:04, 13972.45 examples/s]
Filter: 92%|█████████▏| 752000/818627 [00:54<00:04, 13761.84 examples/s]
Filter: 93%|█████████▎| 760000/818627 [00:55<00:04, 13875.57 examples/s]
Filter: 92%|█████████▏| 750000/818627 [00:55<00:04, 13956.06 examples/s]
Filter: 93%|█████████▎| 762000/818627 [00:55<00:04, 14121.56 examples/s]
Filter: 94%|█████████▎| 766000/818627 [00:55<00:03, 14193.79 examples/s]
Filter: 93%|█████████▎| 762000/818627 [00:55<00:04, 14154.02 examples/s]
Filter: 92%|█████████▏| 754000/818627 [00:55<00:04, 13966.62 examples/s]
Filter: 92%|█████████▏| 756000/818627 [00:55<00:04, 14025.92 examples/s]
Filter: 92%|█████████▏| 754000/818627 [00:55<00:04, 13718.20 examples/s]
Filter: 93%|█████████▎| 762000/818627 [00:55<00:04, 13981.11 examples/s]
Filter: 92%|█████████▏| 752000/818627 [00:55<00:04, 14003.12 examples/s]
Filter: 94%|█████████▍| 768000/818627 [00:55<00:03, 14254.73 examples/s]
Filter: 93%|█████████▎| 764000/818627 [00:55<00:03, 14175.92 examples/s]
Filter: 93%|█████████▎| 764000/818627 [00:55<00:03, 14188.59 examples/s]
Filter: 92%|█████████▏| 756000/818627 [00:55<00:04, 14000.88 examples/s]
Filter: 93%|█████████▎| 758000/818627 [00:55<00:04, 13970.92 examples/s]
Filter: 92%|█████████▏| 756000/818627 [00:55<00:04, 13793.13 examples/s]
Filter: 93%|█████████▎| 764000/818627 [00:55<00:03, 14003.43 examples/s]
Filter: 92%|█████████▏| 754000/818627 [00:55<00:04, 14003.95 examples/s]
Filter: 94%|█████████▎| 766000/818627 [00:55<00:03, 14172.06 examples/s]
Filter: 94%|█████████▍| 770000/818627 [00:55<00:03, 14152.05 examples/s]
Filter: 94%|█████████▎| 766000/818627 [00:55<00:03, 14198.46 examples/s]
Filter: 93%|█████████▎| 758000/818627 [00:55<00:04, 13882.18 examples/s]
Filter: 93%|█████████▎| 760000/818627 [00:55<00:04, 14036.63 examples/s]
Filter: 93%|█████████▎| 758000/818627 [00:55<00:04, 13765.91 examples/s]
Filter: 94%|█████████▎| 766000/818627 [00:55<00:03, 14095.32 examples/s]
Filter: 94%|█████████▍| 768000/818627 [00:55<00:03, 14207.47 examples/s]
Filter: 92%|█████████▏| 756000/818627 [00:55<00:04, 14043.74 examples/s]
Filter: 94%|█████████▍| 772000/818627 [00:55<00:03, 14091.93 examples/s]
Filter: 94%|█████████▍| 768000/818627 [00:55<00:03, 14191.86 examples/s]
Filter: 93%|█████████▎| 760000/818627 [00:55<00:04, 13781.55 examples/s]
Filter: 93%|█████████▎| 762000/818627 [00:55<00:04, 14070.05 examples/s]
Filter: 93%|█████████▎| 760000/818627 [00:55<00:04, 13846.06 examples/s]
Filter: 94%|█████████▍| 768000/818627 [00:55<00:03, 14132.64 examples/s]
Filter: 94%|█████████▍| 770000/818627 [00:55<00:03, 14202.59 examples/s]
Filter: 93%|█████████▎| 758000/818627 [00:55<00:04, 14078.76 examples/s]
Filter: 94%|█████████▍| 770000/818627 [00:55<00:03, 14176.88 examples/s]
Filter: 93%|█████████▎| 762000/818627 [00:55<00:04, 13739.72 examples/s]
Filter: 93%|█████████▎| 764000/818627 [00:55<00:03, 13912.02 examples/s]
Filter: 93%|█████████▎| 762000/818627 [00:55<00:04, 13913.63 examples/s]
Filter: 94%|█████████▍| 770000/818627 [00:55<00:03, 13999.77 examples/s]
Filter: 94%|█████████▍| 772000/818627 [00:55<00:03, 14213.94 examples/s]
Filter: 93%|█████████▎| 760000/818627 [00:55<00:04, 14101.78 examples/s]
Filter: 94%|█████████▍| 772000/818627 [00:55<00:03, 14071.41 examples/s]
Filter: 93%|█████████▎| 764000/818627 [00:55<00:03, 13801.09 examples/s]
Filter: 94%|█████████▎| 766000/818627 [00:56<00:03, 13977.49 examples/s]
Filter: 93%|█████████▎| 764000/818627 [00:55<00:03, 13969.23 examples/s]
Filter: 94%|█████████▍| 772000/818627 [00:55<00:03, 13925.23 examples/s]
Filter: 93%|█████████▎| 762000/818627 [00:55<00:04, 14114.22 examples/s]
Filter: 94%|█████████▎| 766000/818627 [00:55<00:03, 13869.05 examples/s]
Filter: 95%|█████████▍| 774000/818627 [00:55<00:05, 8449.82 examples/s]
Filter: 94%|█████████▍| 768000/818627 [00:56<00:03, 14020.97 examples/s]
Filter: 94%|█████████▎| 766000/818627 [00:56<00:03, 13852.22 examples/s]
Filter: 93%|█████████▎| 764000/818627 [00:56<00:03, 14114.54 examples/s]
Filter: 94%|█████████▍| 768000/818627 [00:56<00:03, 13924.12 examples/s]
Filter: 95%|█████████▍| 776000/818627 [00:56<00:04, 9515.08 examples/s]
Filter: 94%|█████████▍| 770000/818627 [00:56<00:03, 14086.45 examples/s]
Filter: 94%|█████████▍| 768000/818627 [00:56<00:03, 13902.25 examples/s]
Filter: 94%|█████████▎| 766000/818627 [00:56<00:03, 14090.80 examples/s]
Filter: 94%|█████████▍| 770000/818627 [00:56<00:03, 13976.21 examples/s]
Filter: 95%|█████████▌| 778000/818627 [00:56<00:03, 10492.68 examples/s]
Filter: 95%|█████████▍| 774000/818627 [00:56<00:05, 8204.71 examples/s]
Filter: 95%|█████████▍| 774000/818627 [00:56<00:05, 8147.72 examples/s]
Filter: 94%|█████████▍| 772000/818627 [00:56<00:03, 14119.00 examples/s]
Filter: 94%|█████████▍| 770000/818627 [00:56<00:03, 13761.97 examples/s]
Filter: 94%|█████████▍| 768000/818627 [00:56<00:03, 14078.14 examples/s]
Filter: 94%|█████████▍| 772000/818627 [00:56<00:03, 14017.76 examples/s]
Filter: 95%|█████████▌| 780000/818627 [00:56<00:03, 11331.46 examples/s]
Filter: 95%|█████████▍| 774000/818627 [00:56<00:05, 8108.21 examples/s]
Filter: 95%|█████████▍| 776000/818627 [00:56<00:04, 9313.08 examples/s]
Filter: 95%|█████████▍| 776000/818627 [00:56<00:04, 9287.75 examples/s]
Filter: 95%|█████████▍| 774000/818627 [00:56<00:03, 14185.42 examples/s]
Filter: 94%|█████████▍| 772000/818627 [00:56<00:03, 13731.10 examples/s]
Filter: 94%|█████████▍| 770000/818627 [00:56<00:03, 14090.78 examples/s]
Filter: 96%|█████████▌| 782000/818627 [00:56<00:03, 12107.46 examples/s]
Filter: 95%|█████████▍| 776000/818627 [00:56<00:04, 9201.20 examples/s]
Filter: 95%|█████████▌| 778000/818627 [00:56<00:03, 10355.82 examples/s]
Filter: 95%|█████████▌| 778000/818627 [00:56<00:03, 10343.14 examples/s]
Filter: 95%|█████████▍| 776000/818627 [00:56<00:03, 14181.32 examples/s]
Filter: 94%|█████████▍| 772000/818627 [00:56<00:03, 14096.82 examples/s]
Filter: 96%|█████████▌| 784000/818627 [00:56<00:02, 12723.69 examples/s]
Filter: 95%|█████████▌| 778000/818627 [00:56<00:03, 10200.17 examples/s]
Filter: 95%|█████████▌| 780000/818627 [00:56<00:03, 11267.35 examples/s]
Filter: 95%|█████████▌| 780000/818627 [00:56<00:03, 11188.43 examples/s]
Filter: 95%|█████████▌| 778000/818627 [00:56<00:02, 14178.65 examples/s]
Filter: 96%|█████████▌| 786000/818627 [00:56<00:02, 13180.04 examples/s]
Filter: 95%|█████████▍| 774000/818627 [00:56<00:05, 8616.84 examples/s]
Filter: 95%|█████████▌| 780000/818627 [00:56<00:03, 11061.16 examples/s]
Filter: 96%|█████████▌| 782000/818627 [00:56<00:03, 11831.96 examples/s]
Filter: 96%|█████████▌| 782000/818627 [00:56<00:03, 11944.61 examples/s]
Filter: 95%|█████████▍| 774000/818627 [00:56<00:05, 8205.54 examples/s]
Filter: 96%|█████████▋| 788000/818627 [00:56<00:02, 13403.54 examples/s]
Filter: 95%|█████████▍| 776000/818627 [00:56<00:04, 9618.33 examples/s]
Filter: 96%|█████████▌| 782000/818627 [00:56<00:03, 11813.93 examples/s]
Filter: 96%|█████████▌| 784000/818627 [00:56<00:02, 12446.21 examples/s]
Filter: 96%|█████████▌| 784000/818627 [00:56<00:02, 12537.80 examples/s]
Filter: 97%|█████████▋| 790000/818627 [00:57<00:02, 13546.26 examples/s]
Filter: 95%|█████████▍| 776000/818627 [00:57<00:04, 9251.55 examples/s]
Filter: 95%|█████████▌| 778000/818627 [00:57<00:03, 10597.39 examples/s]
Filter: 95%|█████████▍| 774000/818627 [00:57<00:05, 8111.42 examples/s]
Filter: 96%|█████████▌| 784000/818627 [00:57<00:02, 12334.94 examples/s]
Filter: 96%|█████████▌| 786000/818627 [00:57<00:02, 12887.75 examples/s]
Filter: 96%|█████████▌| 786000/818627 [00:57<00:02, 12733.91 examples/s]
Filter: 95%|█████████▌| 780000/818627 [00:57<00:04, 8380.94 examples/s]
Filter: 97%|█████████▋| 792000/818627 [00:57<00:01, 13649.70 examples/s]
Filter: 95%|█████████▌| 778000/818627 [00:57<00:03, 10197.84 examples/s]
Filter: 95%|█████████▌| 780000/818627 [00:57<00:03, 11377.25 examples/s]
Filter: 96%|█████████▋| 788000/818627 [00:57<00:02, 13216.20 examples/s]
Filter: 96%|█████████▌| 786000/818627 [00:57<00:02, 12686.31 examples/s]
Filter: 95%|█████████▍| 776000/818627 [00:57<00:04, 9173.85 examples/s]
Filter: 96%|█████████▋| 788000/818627 [00:57<00:02, 12994.61 examples/s]
Filter: 96%|█████████▌| 782000/818627 [00:57<00:03, 9474.17 examples/s]
Filter: 97%|█████████▋| 794000/818627 [00:57<00:01, 13792.97 examples/s]
Filter: 95%|█████████▌| 780000/818627 [00:57<00:03, 11019.14 examples/s]
Filter: 96%|█████████▌| 782000/818627 [00:57<00:03, 12018.64 examples/s]
Filter: 97%|█████████▋| 790000/818627 [00:57<00:02, 13459.55 examples/s]
Filter: 96%|█████████▋| 788000/818627 [00:57<00:02, 13049.88 examples/s]
Filter: 95%|█████████▌| 778000/818627 [00:57<00:03, 10189.79 examples/s]
Filter: 97%|█████████▋| 790000/818627 [00:57<00:02, 13338.12 examples/s]
Filter: 96%|█████████▌| 784000/818627 [00:57<00:03, 10514.82 examples/s]
Filter: 97%|█████████▋| 796000/818627 [00:57<00:01, 13840.82 examples/s]
Filter: 96%|█████████▌| 782000/818627 [00:57<00:03, 11688.96 examples/s]
Filter: 96%|█████████▌| 784000/818627 [00:57<00:02, 12465.74 examples/s]
Filter: 97%|█████████▋| 792000/818627 [00:57<00:01, 13557.49 examples/s]
Filter: 97%|█████████▋| 790000/818627 [00:57<00:02, 13375.02 examples/s]
Filter: 95%|█████████▌| 780000/818627 [00:57<00:03, 11107.24 examples/s]
Filter: 97%|█████████▋| 792000/818627 [00:57<00:01, 13468.04 examples/s]
Filter: 96%|█████████▌| 786000/818627 [00:57<00:02, 11336.85 examples/s]
Filter: 97%|█████████▋| 798000/818627 [00:57<00:01, 13881.02 examples/s]
Filter: 96%|█████████▌| 784000/818627 [00:57<00:02, 12235.18 examples/s]
Filter: 96%|█████████▌| 786000/818627 [00:57<00:02, 12909.19 examples/s]
Filter: 97%|█████████▋| 792000/818627 [00:57<00:01, 13491.17 examples/s]
Filter: 97%|█████████▋| 794000/818627 [00:57<00:01, 13544.59 examples/s]
Filter: 96%|█████████▌| 782000/818627 [00:57<00:03, 11705.12 examples/s]
Filter: 97%|█████████▋| 794000/818627 [00:57<00:01, 13693.61 examples/s]
Filter: 96%|█████████▋| 788000/818627 [00:57<00:02, 11948.58 examples/s]
Filter: 98%|█████████▊| 800000/818627 [00:57<00:01, 14030.20 examples/s]
Filter: 96%|█████████▌| 786000/818627 [00:57<00:02, 12640.78 examples/s]
Filter: 96%|█████████▋| 788000/818627 [00:57<00:02, 13144.41 examples/s]
Filter: 97%|█████████▋| 794000/818627 [00:57<00:01, 13698.01 examples/s]
Filter: 97%|█████████▋| 796000/818627 [00:57<00:01, 13699.25 examples/s]
Filter: 96%|█████████▌| 784000/818627 [00:57<00:02, 12305.44 examples/s]
Filter: 97%|█████████▋| 796000/818627 [00:57<00:01, 13849.93 examples/s]
Filter: 97%|█████████▋| 790000/818627 [00:58<00:02, 12456.08 examples/s]
Filter: 98%|█████████▊| 802000/818627 [00:57<00:01, 14025.48 examples/s]
Filter: 96%|█████████▋| 788000/818627 [00:57<00:02, 13081.14 examples/s]
Filter: 97%|█████████▋| 790000/818627 [00:57<00:02, 13390.50 examples/s]
Filter: 97%|█████████▋| 796000/818627 [00:57<00:01, 13840.70 examples/s]
Filter: 97%|█████████▋| 798000/818627 [00:57<00:01, 13743.82 examples/s]
Filter: 97%|█████████▋| 798000/818627 [00:57<00:01, 13935.17 examples/s]
Filter: 96%|█████████▌| 786000/818627 [00:57<00:02, 12718.93 examples/s]
Filter: 97%|█████████▋| 792000/818627 [00:58<00:02, 12824.77 examples/s]
Filter: 98%|█████████▊| 804000/818627 [00:58<00:01, 14023.47 examples/s]
Filter: 97%|█████████▋| 790000/818627 [00:58<00:02, 13267.24 examples/s]
Filter: 97%|█████████▋| 792000/818627 [00:58<00:01, 13576.26 examples/s]
Filter: 97%|█████████▋| 798000/818627 [00:58<00:01, 13925.12 examples/s]
Filter: 98%|█████████▊| 800000/818627 [00:58<00:01, 13884.91 examples/s]
Filter: 98%|█████████▊| 800000/818627 [00:58<00:01, 13911.18 examples/s]
Filter: 96%|█████████▋| 788000/818627 [00:58<00:02, 13072.12 examples/s]
Filter: 97%|█████████▋| 794000/818627 [00:58<00:01, 13214.93 examples/s]
Filter: 98%|█████████▊| 806000/818627 [00:58<00:00, 14014.03 examples/s]
Filter: 98%|█████████▊| 800000/818627 [00:58<00:01, 13990.63 examples/s]
Filter: 97%|█████████▋| 794000/818627 [00:58<00:01, 13603.45 examples/s]
Filter: 97%|█████████▋| 792000/818627 [00:58<00:01, 13326.78 examples/s]
Filter: 98%|█████████▊| 802000/818627 [00:58<00:01, 13968.65 examples/s]
Filter: 98%|█████████▊| 802000/818627 [00:58<00:01, 14003.59 examples/s]
Filter: 97%|█████████▋| 790000/818627 [00:58<00:02, 13333.17 examples/s]
Filter: 97%|█████████▋| 796000/818627 [00:58<00:01, 13409.01 examples/s]
Filter: 99%|█████████▊| 808000/818627 [00:58<00:00, 14146.00 examples/s]
Filter: 98%|█████████▊| 802000/818627 [00:58<00:01, 14050.45 examples/s]
Filter: 97%|█████████▋| 796000/818627 [00:58<00:01, 13761.55 examples/s]
Filter: 98%|█████████▊| 804000/818627 [00:58<00:01, 14056.47 examples/s]
Filter: 97%|█████████▋| 794000/818627 [00:58<00:01, 13563.44 examples/s]
Filter: 98%|█████████▊| 804000/818627 [00:58<00:01, 14069.67 examples/s]
Filter: 97%|█████████▋| 792000/818627 [00:58<00:01, 13508.30 examples/s]
Filter: 97%|█████████▋| 798000/818627 [00:58<00:01, 13533.80 examples/s]
Filter: 99%|█████████▉| 810000/818627 [00:58<00:00, 14089.53 examples/s]
Filter: 98%|█████████▊| 804000/818627 [00:58<00:01, 14034.41 examples/s]
Filter: 97%|█████████▋| 798000/818627 [00:58<00:01, 13846.67 examples/s]
Filter: 98%|█████████▊| 806000/818627 [00:58<00:00, 14057.81 examples/s]
Filter: 97%|█████████▋| 796000/818627 [00:58<00:01, 13564.61 examples/s]
Filter: 98%|█████████▊| 806000/818627 [00:58<00:00, 13990.75 examples/s]
Filter: 97%|█████████▋| 794000/818627 [00:58<00:01, 13454.65 examples/s]
Filter: 98%|█████████▊| 800000/818627 [00:58<00:01, 13750.78 examples/s]
Filter: 99%|█████████▉| 812000/818627 [00:58<00:00, 13768.71 examples/s]
Filter: 98%|█████████▊| 806000/818627 [00:58<00:00, 14089.10 examples/s]
Filter: 99%|█████████▊| 808000/818627 [00:58<00:00, 13993.14 examples/s]
Filter: 98%|█████████▊| 800000/818627 [00:58<00:01, 13812.57 examples/s]
Filter: 97%|█████████▋| 798000/818627 [00:58<00:01, 13592.12 examples/s]
Filter: 99%|█████████▊| 808000/818627 [00:58<00:00, 13941.56 examples/s]
Filter: 97%|█████████▋| 796000/818627 [00:58<00:01, 13613.08 examples/s]
Filter: 98%|█████████▊| 802000/818627 [00:58<00:01, 13797.49 examples/s]
Filter: 99%|█████████▉| 814000/818627 [00:58<00:00, 13939.78 examples/s]
Filter: 99%|█████████▊| 808000/818627 [00:58<00:00, 14114.25 examples/s]
Filter: 99%|█████████▉| 810000/818627 [00:58<00:00, 13936.59 examples/s]
Filter: 98%|█████████▊| 802000/818627 [00:58<00:01, 13794.97 examples/s]
Filter: 98%|█████████▊| 800000/818627 [00:58<00:01, 13738.01 examples/s]
Filter: 99%|█████████▉| 810000/818627 [00:58<00:00, 14012.05 examples/s]
Filter: 97%|█████████▋| 798000/818627 [00:58<00:01, 13726.08 examples/s]
Filter: 98%|█████████▊| 804000/818627 [00:59<00:01, 13818.47 examples/s]
Filter: 100%|█████████▉| 816000/818627 [00:58<00:00, 13816.86 examples/s]
Filter: 99%|█████████▉| 810000/818627 [00:58<00:00, 13881.68 examples/s]
Filter: 99%|█████████▉| 812000/818627 [00:58<00:00, 13829.60 examples/s]
Filter: 98%|█████████▊| 802000/818627 [00:58<00:01, 13707.71 examples/s]
Filter: 98%|█████████▊| 804000/818627 [00:58<00:01, 13639.49 examples/s]
Filter: 99%|█████████▉| 812000/818627 [00:58<00:00, 13841.25 examples/s]
Filter: 98%|█████████▊| 800000/818627 [00:58<00:01, 13680.39 examples/s]
Filter: 98%|█████████▊| 806000/818627 [00:59<00:00, 13727.04 examples/s]
Filter: 100%|█████████▉| 818000/818627 [00:59<00:00, 13990.28 examples/s]
Filter: 99%|█████████▉| 812000/818627 [00:59<00:00, 13969.05 examples/s]
Filter: 99%|█████████▉| 814000/818627 [00:59<00:00, 13768.02 examples/s]
Filter: 98%|█████████▊| 804000/818627 [00:59<00:01, 13716.60 examples/s]
Filter: 98%|█████████▊| 806000/818627 [00:59<00:00, 13653.11 examples/s]
Filter: 99%|█████████▉| 814000/818627 [00:59<00:00, 13958.05 examples/s]
Filter: 100%|██████████| 818627/818627 [00:59<00:00, 13851.89 examples/s]
+
Filter: 98%|█████████▊| 802000/818627 [00:59<00:01, 13771.81 examples/s]
Filter: 99%|█████████▊| 808000/818627 [00:59<00:00, 13791.16 examples/s]
Filter: 99%|█████████▉| 814000/818627 [00:59<00:00, 14019.92 examples/s]
Filter: 100%|█████████▉| 816000/818627 [00:59<00:00, 13881.29 examples/s]
Filter: 98%|█████████▊| 806000/818627 [00:59<00:00, 13840.48 examples/s]
Filter: 100%|█████████▉| 816000/818627 [00:59<00:00, 14026.15 examples/s]
Filter: 99%|█████████▊| 808000/818627 [00:59<00:00, 13778.20 examples/s]
Filter: 98%|█████████▊| 804000/818627 [00:59<00:01, 13827.55 examples/s]
Filter: 99%|█████████▉| 810000/818627 [00:59<00:00, 13839.27 examples/s]
Filter: 100%|█████████▉| 816000/818627 [00:59<00:00, 13891.53 examples/s]
Filter: 100%|█████████▉| 818000/818627 [00:59<00:00, 13831.64 examples/s]
Filter: 100%|█████████▉| 818000/818627 [00:59<00:00, 14028.45 examples/s]
Filter: 99%|█████████▊| 808000/818627 [00:59<00:00, 13823.34 examples/s]
Filter: 99%|█████████▉| 810000/818627 [00:59<00:00, 13761.90 examples/s]
Filter: 98%|█████████▊| 806000/818627 [00:59<00:00, 13831.57 examples/s]
Filter: 100%|██████████| 818627/818627 [00:59<00:00, 13771.47 examples/s]
+
Filter: 100%|██████████| 818627/818627 [00:59<00:00, 13771.52 examples/s]
+
Filter: 99%|█████████▉| 812000/818627 [00:59<00:00, 13975.74 examples/s]
Filter: 100%|█████████▉| 818000/818627 [00:59<00:00, 13787.82 examples/s]
Filter: 99%|█████████▉| 812000/818627 [00:59<00:00, 13875.20 examples/s]
Filter: 99%|█████████▉| 810000/818627 [00:59<00:00, 13799.23 examples/s]
Filter: 99%|█████████▊| 808000/818627 [00:59<00:00, 13755.04 examples/s]
Filter: 100%|██████████| 818627/818627 [00:59<00:00, 13740.27 examples/s]
+
Filter: 99%|█████████▉| 814000/818627 [00:59<00:00, 13776.73 examples/s]
Filter: 99%|█████████▉| 812000/818627 [00:59<00:00, 13883.95 examples/s]
Filter: 99%|█████████▉| 814000/818627 [00:59<00:00, 13869.39 examples/s]
Filter: 99%|█████████▉| 810000/818627 [00:59<00:00, 13863.41 examples/s]
Filter: 100%|█████████▉| 816000/818627 [00:59<00:00, 13761.42 examples/s]
Filter: 99%|█████████▉| 814000/818627 [00:59<00:00, 13940.70 examples/s]
Filter: 100%|█████████▉| 816000/818627 [00:59<00:00, 13828.92 examples/s]
Filter: 99%|█████████▉| 812000/818627 [00:59<00:00, 13852.26 examples/s]
Filter: 100%|█████████▉| 818000/818627 [01:00<00:00, 13943.71 examples/s]
Filter: 100%|██████████| 818627/818627 [01:00<00:00, 13612.65 examples/s]
+
Filter: 100%|█████████▉| 816000/818627 [00:59<00:00, 14002.18 examples/s]
Filter: 100%|█████████▉| 818000/818627 [00:59<00:00, 13907.97 examples/s]
Filter: 99%|█████████▉| 814000/818627 [00:59<00:00, 13958.43 examples/s]
Filter: 100%|██████████| 818627/818627 [01:00<00:00, 13639.97 examples/s]
+
Filter: 100%|█████████▉| 818000/818627 [01:00<00:00, 14072.60 examples/s]
Filter: 100%|█████████▉| 816000/818627 [01:00<00:00, 14055.33 examples/s]
Filter: 100%|██████████| 818627/818627 [01:00<00:00, 13609.43 examples/s]
+
Filter: 100%|█████████▉| 818000/818627 [01:00<00:00, 13904.67 examples/s]
Filter: 100%|██████████| 818627/818627 [01:00<00:00, 13569.88 examples/s]
+
Epoch 0: 0%| | 0/12384 [00:00, ?it/s]
Epoch 0: 0%| | 0/12384 [00:07, ?it/s, loss=25.6497, acc=0.0005, iter_time=7.42s]
Epoch 0: 0%| | 1/12384 [00:07<27:03:35, 7.87s/it, loss=25.6497, acc=0.0005, iter_time=7.42s]
Epoch 0: 0%| | 1/12384 [00:15<27:03:35, 7.87s/it, loss=24.4383, acc=0.0003, iter_time=6.22s]
Epoch 0: 0%| | 2/12384 [00:15<25:46:16, 7.49s/it, loss=24.4383, acc=0.0003, iter_time=6.22s]
Epoch 0: 0%| | 2/12384 [00:22<25:46:16, 7.49s/it, loss=27.3238, acc=0.0007, iter_time=8.31s]
Epoch 0: 0%| | 3/12384 [00:22<25:22:05, 7.38s/it, loss=27.3238, acc=0.0007, iter_time=8.31s]
Epoch 0: 0%| | 3/12384 [00:29<25:22:05, 7.38s/it, loss=25.5323, acc=0.0009, iter_time=4.43s]
Epoch 0: 0%| | 4/12384 [00:29<25:08:40, 7.31s/it, loss=25.5323, acc=0.0009, iter_time=4.43s]
Epoch 0: 0%| | 4/12384 [00:36<25:08:40, 7.31s/it, loss=24.9663, acc=0.0007, iter_time=10.03s]
Epoch 0: 0%| | 5/12384 [00:36<25:07:42, 7.31s/it, loss=24.9663, acc=0.0007, iter_time=10.03s]
Epoch 0: 0%| | 5/12384 [00:44<25:07:42, 7.31s/it, loss=25.6308, acc=0.0010, iter_time=7.29s]
Epoch 0: 0%| | 6/12384 [00:44<25:02:08, 7.28s/it, loss=25.6308, acc=0.0010, iter_time=7.29s]
Epoch 0: 0%| | 6/12384 [00:51<25:02:08, 7.28s/it, loss=25.3157, acc=0.0013, iter_time=7.29s]
Epoch 0: 0%| | 7/12384 [00:51<25:01:49, 7.28s/it, loss=25.3157, acc=0.0013, iter_time=7.29s]
Epoch 0: 0%| | 7/12384 [00:58<25:01:49, 7.28s/it, loss=25.7164, acc=0.0010, iter_time=7.85s]
Epoch 0: 0%| | 8/12384 [00:58<25:13:42, 7.34s/it, loss=25.7164, acc=0.0010, iter_time=7.85s]
Epoch 0: 0%| | 8/12384 [01:06<25:13:42, 7.34s/it, loss=23.5843, acc=0.0014, iter_time=4.82s]
Epoch 0: 0%| | 9/12384 [01:06<25:07:13, 7.31s/it, loss=23.5843, acc=0.0014, iter_time=4.82s]
Epoch 0: 0%| | 9/12384 [01:13<25:07:13, 7.31s/it, loss=26.5867, acc=0.0009, iter_time=9.27s]
Epoch 0: 0%| | 10/12384 [01:13<25:02:38, 7.29s/it, loss=26.5867, acc=0.0009, iter_time=9.27s]
Epoch 0: 0%| | 10/12384 [01:20<25:02:38, 7.29s/it, loss=25.7749, acc=0.0000, iter_time=7.24s]
Epoch 0: 0%| | 11/12384 [01:20<24:59:22, 7.27s/it, loss=25.7749, acc=0.0000, iter_time=7.24s]
Epoch 0: 0%| | 11/12384 [01:27<24:59:22, 7.27s/it, loss=25.6492, acc=0.0004, iter_time=7.24s]
Epoch 0: 0%| | 12/12384 [01:27<24:57:15, 7.26s/it, loss=25.6492, acc=0.0004, iter_time=7.24s]
Epoch 0: 0%| | 12/12384 [01:35<24:57:15, 7.26s/it, loss=25.6676, acc=0.0011, iter_time=4.88s]
Epoch 0: 0%| | 13/12384 [01:35<24:55:01, 7.25s/it, loss=25.6676, acc=0.0011, iter_time=4.88s]
Epoch 0: 0%| | 13/12384 [01:42<24:55:01, 7.25s/it, loss=24.9120, acc=0.0014, iter_time=8.03s]
Epoch 0: 0%| | 14/12384 [01:42<24:53:30, 7.24s/it, loss=24.9120, acc=0.0014, iter_time=8.03s]
Epoch 0: 0%| | 14/12384 [01:49<24:53:30, 7.24s/it, loss=24.5085, acc=0.0015, iter_time=8.79s]
Epoch 0: 0%| | 15/12384 [01:49<24:53:13, 7.24s/it, loss=24.5085, acc=0.0015, iter_time=8.79s]
Epoch 0: 0%| | 15/12384 [01:56<24:53:13, 7.24s/it, loss=26.1575, acc=0.0000, iter_time=7.11s]
Epoch 0: 0%| | 16/12384 [01:56<24:53:26, 7.24s/it, loss=26.1575, acc=0.0000, iter_time=7.11s]
Epoch 0: 0%| | 16/12384 [02:03<24:53:26, 7.24s/it, loss=25.1220, acc=0.0009, iter_time=6.29s]
Epoch 0: 0%| | 17/12384 [02:03<24:53:01, 7.24s/it, loss=25.1220, acc=0.0009, iter_time=6.29s]
Epoch 0: 0%| | 17/12384 [02:11<24:53:01, 7.24s/it, loss=24.7204, acc=0.0011, iter_time=8.33s]
Epoch 0: 0%| | 18/12384 [02:11<24:53:26, 7.25s/it, loss=24.7204, acc=0.0011, iter_time=8.33s]
Epoch 0: 0%| | 18/12384 [02:18<24:53:26, 7.25s/it, loss=25.7300, acc=0.0004, iter_time=6.18s]
Epoch 0: 0%| | 19/12384 [02:18<24:58:58, 7.27s/it, loss=25.7300, acc=0.0004, iter_time=6.18s]
Epoch 0: 0%| | 19/12384 [02:25<24:58:58, 7.27s/it, loss=25.3883, acc=0.0011, iter_time=8.41s]
Epoch 0: 0%| | 20/12384 [02:25<24:57:11, 7.27s/it, loss=25.3883, acc=0.0011, iter_time=8.41s]
Epoch 0: 0%| | 20/12384 [02:33<24:57:11, 7.27s/it, loss=25.3092, acc=0.0002, iter_time=7.33s]
Epoch 0: 0%| | 21/12384 [02:33<25:19:33, 7.37s/it, loss=25.3092, acc=0.0002, iter_time=7.33s]
Epoch 0: 0%| | 21/12384 [02:40<25:19:33, 7.37s/it, loss=25.6943, acc=0.0011, iter_time=7.56s]
Epoch 0: 0%| | 22/12384 [02:40<25:11:45, 7.34s/it, loss=25.6943, acc=0.0011, iter_time=7.56s]
Epoch 0: 0%| | 22/12384 [02:47<25:11:45, 7.34s/it, loss=26.9137, acc=0.0004, iter_time=7.25s]
Epoch 0: 0%| | 23/12384 [02:47<25:06:06, 7.31s/it, loss=26.9137, acc=0.0004, iter_time=7.25s]
Epoch 0: 0%| | 23/12384 [02:55<25:06:06, 7.31s/it, loss=25.6135, acc=0.0014, iter_time=7.64s]
Epoch 0: 0%| | 24/12384 [02:55<25:02:34, 7.29s/it, loss=25.6135, acc=0.0014, iter_time=7.64s]
Epoch 0: 0%| | 24/12384 [03:02<25:02:34, 7.29s/it, loss=26.1792, acc=0.0009, iter_time=6.87s]
Epoch 0: 0%| | 25/12384 [03:02<25:01:00, 7.29s/it, loss=26.1792, acc=0.0009, iter_time=6.87s]
Epoch 0: 0%| | 25/12384 [03:09<25:01:00, 7.29s/it, loss=25.4236, acc=0.0010, iter_time=7.25s]
Epoch 0: 0%| | 26/12384 [03:09<24:59:08, 7.28s/it, loss=25.4236, acc=0.0010, iter_time=7.25s]
Epoch 0: 0%| | 26/12384 [03:16<24:59:08, 7.28s/it, loss=25.8779, acc=0.0008, iter_time=7.27s]
Epoch 0: 0%| | 27/12384 [03:16<24:57:22, 7.27s/it, loss=25.8779, acc=0.0008, iter_time=7.27s]
Epoch 0: 0%| | 27/12384 [03:24<24:57:22, 7.27s/it, loss=25.2761, acc=0.0002, iter_time=4.21s]
Epoch 0: 0%| | 28/12384 [03:24<24:55:54, 7.26s/it, loss=25.2761, acc=0.0002, iter_time=4.21s]
Epoch 0: 0%| | 28/12384 [03:31<24:55:54, 7.26s/it, loss=24.7261, acc=0.0006, iter_time=10.28s]
Epoch 0: 0%| | 29/12384 [03:31<24:55:29, 7.26s/it, loss=24.7261, acc=0.0006, iter_time=10.28s]
Epoch 0: 0%| | 29/12384 [03:38<24:55:29, 7.26s/it, loss=26.0604, acc=0.0012, iter_time=6.71s]
Epoch 0: 0%| | 30/12384 [03:38<24:53:52, 7.26s/it, loss=26.0604, acc=0.0012, iter_time=6.71s]
Epoch 0: 0%| | 30/12384 [03:45<24:53:52, 7.26s/it, loss=25.6512, acc=0.0013, iter_time=7.79s]
Epoch 0: 0%| | 31/12384 [03:45<24:53:34, 7.25s/it, loss=25.6512, acc=0.0013, iter_time=7.79s]
Epoch 0: 0%| | 31/12384 [03:53<24:53:34, 7.25s/it, loss=25.4752, acc=0.0010, iter_time=7.65s]
Epoch 0: 0%| | 32/12384 [03:53<24:53:27, 7.25s/it, loss=25.4752, acc=0.0010, iter_time=7.65s]
Epoch 0: 0%| | 32/12384 [04:00<24:53:27, 7.25s/it, loss=26.0732, acc=0.0004, iter_time=6.86s]
Epoch 0: 0%| | 33/12384 [04:00<24:53:16, 7.25s/it, loss=26.0732, acc=0.0004, iter_time=6.86s]
Epoch 0: 0%| | 33/12384 [04:07<24:53:16, 7.25s/it, loss=26.2147, acc=0.0006, iter_time=7.27s]
Epoch 0: 0%| | 34/12384 [04:07<24:53:29, 7.26s/it, loss=26.2147, acc=0.0006, iter_time=7.27s]
Epoch 0: 0%| | 34/12384 [04:14<24:53:29, 7.26s/it, loss=25.3158, acc=0.0018, iter_time=5.68s]
Epoch 0: 0%| | 35/12384 [04:14<24:51:20, 7.25s/it, loss=25.3158, acc=0.0018, iter_time=5.68s]
Epoch 0: 0%| | 35/12384 [04:22<24:51:20, 7.25s/it, loss=25.3095, acc=0.0006, iter_time=8.80s]
Epoch 0: 0%| | 36/12384 [04:22<24:52:17, 7.25s/it, loss=25.3095, acc=0.0006, iter_time=8.80s]
Epoch 0: 0%| | 36/12384 [04:29<24:52:17, 7.25s/it, loss=26.7242, acc=0.0006, iter_time=7.26s]
Epoch 0: 0%| | 37/12384 [04:29<24:52:10, 7.25s/it, loss=26.7242, acc=0.0006, iter_time=7.26s]
Epoch 0: 0%| | 37/12384 [04:36<24:52:10, 7.25s/it, loss=24.7830, acc=0.0007, iter_time=3.49s]
Epoch 0: 0%| | 38/12384 [04:36<24:52:14, 7.25s/it, loss=24.7830, acc=0.0007, iter_time=3.49s]
Epoch 0: 0%| | 38/12384 [04:43<24:52:14, 7.25s/it, loss=26.1911, acc=0.0006, iter_time=11.00s]
Epoch 0: 0%| | 39/12384 [04:43<24:51:17, 7.25s/it, loss=26.1911, acc=0.0006, iter_time=11.00s]
Epoch 0: 0%| | 39/12384 [04:51<24:51:17, 7.25s/it, loss=26.6228, acc=0.0004, iter_time=7.63s]
Epoch 0: 0%| | 40/12384 [04:51<24:50:52, 7.25s/it, loss=26.6228, acc=0.0004, iter_time=7.63s]
Epoch 0: 0%| | 40/12384 [04:58<24:50:52, 7.25s/it, loss=26.3213, acc=0.0003, iter_time=6.85s]
Epoch 0: 0%| | 41/12384 [04:58<24:50:44, 7.25s/it, loss=26.3213, acc=0.0003, iter_time=6.85s]
Epoch 0: 0%| | 41/12384 [05:05<24:50:44, 7.25s/it, loss=25.6779, acc=0.0007, iter_time=7.24s]
Epoch 0: 0%| | 42/12384 [05:05<24:50:51, 7.25s/it, loss=25.6779, acc=0.0007, iter_time=7.24s]
Epoch 0: 0%| | 42/12384 [05:12<24:50:51, 7.25s/it, loss=25.1938, acc=0.0003, iter_time=6.75s]
Epoch 0: 0%| | 43/12384 [05:12<24:50:51, 7.25s/it, loss=25.1938, acc=0.0003, iter_time=6.75s]
Epoch 0: 0%| | 43/12384 [05:20<24:50:51, 7.25s/it, loss=26.5261, acc=0.0019, iter_time=7.76s]
Epoch 0: 0%| | 44/12384 [05:20<24:50:08, 7.25s/it, loss=26.5261, acc=0.0019, iter_time=7.76s]
Epoch 0: 0%| | 44/12384 [05:27<24:50:08, 7.25s/it, loss=24.9753, acc=0.0005, iter_time=7.24s]
Epoch 0: 0%| | 45/12384 [05:27<24:49:44, 7.24s/it, loss=24.9753, acc=0.0005, iter_time=7.24s]
Epoch 0: 0%| | 45/12384 [05:34<24:49:44, 7.24s/it, loss=25.4438, acc=0.0005, iter_time=4.87s]
Epoch 0: 0%| | 46/12384 [05:34<24:46:59, 7.23s/it, loss=25.4438, acc=0.0005, iter_time=4.87s]
Epoch 0: 0%| | 46/12384 [05:41<24:46:59, 7.23s/it, loss=24.4372, acc=0.0011, iter_time=9.57s]
Epoch 0: 0%| | 47/12384 [05:41<24:47:22, 7.23s/it, loss=24.4372, acc=0.0011, iter_time=9.57s]
Epoch 0: 0%| | 47/12384 [05:49<24:47:22, 7.23s/it, loss=24.4923, acc=0.0013, iter_time=7.65s]
Epoch 0: 0%| | 48/12384 [05:49<24:48:55, 7.24s/it, loss=24.4923, acc=0.0013, iter_time=7.65s]
Epoch 0: 0%| | 48/12384 [05:56<24:48:55, 7.24s/it, loss=25.7376, acc=0.0007, iter_time=5.25s]
Epoch 0: 0%| | 49/12384 [05:56<24:53:36, 7.27s/it, loss=25.7376, acc=0.0007, iter_time=5.25s]
Epoch 0: 0%| | 49/12384 [06:03<24:53:36, 7.27s/it, loss=25.5508, acc=0.0010, iter_time=9.31s]
Epoch 0: 0%| | 50/12384 [06:03<24:51:52, 7.26s/it, loss=25.5508, acc=0.0010, iter_time=9.31s]
Epoch 0: 0%| | 50/12384 [06:10<24:51:52, 7.26s/it, loss=24.6517, acc=0.0011, iter_time=4.49s]
Epoch 0: 0%| | 51/12384 [06:10<24:50:53, 7.25s/it, loss=24.6517, acc=0.0011, iter_time=4.49s]
Epoch 0: 0%| | 51/12384 [06:18<24:50:53, 7.25s/it, loss=26.7249, acc=0.0002, iter_time=9.02s]
Epoch 0: 0%| | 52/12384 [06:18<24:48:17, 7.24s/it, loss=26.7249, acc=0.0002, iter_time=9.02s]
Epoch 0: 0%| | 52/12384 [06:25<24:48:17, 7.24s/it, loss=25.1032, acc=0.0008, iter_time=7.81s]
Epoch 0: 0%| | 53/12384 [06:25<24:49:07, 7.25s/it, loss=25.1032, acc=0.0008, iter_time=7.81s]
Epoch 0: 0%| | 53/12384 [06:32<24:49:07, 7.25s/it, loss=25.9677, acc=0.0010, iter_time=4.72s]
Epoch 0: 0%| | 54/12384 [06:32<24:49:54, 7.25s/it, loss=25.9677, acc=0.0010, iter_time=4.72s]
Epoch 0: 0%| | 54/12384 [06:39<24:49:54, 7.25s/it, loss=24.8746, acc=0.0004, iter_time=9.83s]
Epoch 0: 0%| | 55/12384 [06:39<24:52:17, 7.26s/it, loss=24.8746, acc=0.0004, iter_time=9.83s]
Epoch 0: 0%| | 55/12384 [06:47<24:52:17, 7.26s/it, loss=25.2453, acc=0.0004, iter_time=7.64s]
Epoch 0: 0%| | 56/12384 [06:47<24:51:22, 7.26s/it, loss=25.2453, acc=0.0004, iter_time=7.64s]
Epoch 0: 0%| | 56/12384 [06:54<24:51:22, 7.26s/it, loss=24.1171, acc=0.0013, iter_time=6.07s]
Epoch 0: 0%| | 57/12384 [06:54<24:46:43, 7.24s/it, loss=24.1171, acc=0.0013, iter_time=6.07s]
Epoch 0: 0%| | 57/12384 [07:01<24:46:43, 7.24s/it, loss=25.7877, acc=0.0010, iter_time=4.90s]
Epoch 0: 0%| | 58/12384 [07:01<24:47:18, 7.24s/it, loss=25.7877, acc=0.0010, iter_time=4.90s]
Epoch 0: 0%| | 58/12384 [07:08<24:47:18, 7.24s/it, loss=24.9161, acc=0.0011, iter_time=10.32s]
Epoch 0: 0%| | 59/12384 [07:08<24:47:08, 7.24s/it, loss=24.9161, acc=0.0011, iter_time=10.32s]
Epoch 0: 0%| | 59/12384 [07:16<24:47:08, 7.24s/it, loss=24.8615, acc=0.0005, iter_time=7.25s]
Epoch 0: 0%| | 60/12384 [07:16<24:47:53, 7.24s/it, loss=24.8615, acc=0.0005, iter_time=7.25s]
Epoch 0: 0%| | 60/12384 [07:23<24:47:53, 7.24s/it, loss=25.7963, acc=0.0004, iter_time=6.39s]
Epoch 0: 0%| | 61/12384 [07:23<24:47:46, 7.24s/it, loss=25.7963, acc=0.0004, iter_time=6.39s]
Epoch 0: 0%| | 61/12384 [07:30<24:47:46, 7.24s/it, loss=25.4569, acc=0.0008, iter_time=6.48s]
Epoch 0: 1%| | 62/12384 [07:30<24:47:13, 7.24s/it, loss=25.4569, acc=0.0008, iter_time=6.48s]
Epoch 0: 1%| | 62/12384 [07:37<24:47:13, 7.24s/it, loss=23.8285, acc=0.0003, iter_time=8.86s]
Epoch 0: 1%| | 63/12384 [07:37<24:47:50, 7.25s/it, loss=23.8285, acc=0.0003, iter_time=8.86s]
Epoch 0: 1%| | 63/12384 [07:45<24:47:50, 7.25s/it, loss=24.9708, acc=0.0014, iter_time=7.34s]
Epoch 0: 1%| | 64/12384 [07:45<24:46:58, 7.24s/it, loss=24.9708, acc=0.0014, iter_time=7.34s]
Epoch 0: 1%| | 64/12384 [07:52<24:46:58, 7.24s/it, loss=26.5769, acc=0.0011, iter_time=6.65s]
Epoch 0: 1%| | 65/12384 [07:52<24:46:22, 7.24s/it, loss=26.5769, acc=0.0011, iter_time=6.65s]
Epoch 0: 1%| | 65/12384 [07:59<24:46:22, 7.24s/it, loss=26.3202, acc=0.0011, iter_time=7.73s]
Epoch 0: 1%| | 66/12384 [07:59<24:46:34, 7.24s/it, loss=26.3202, acc=0.0011, iter_time=7.73s]
Epoch 0: 1%| | 66/12384 [08:06<24:46:34, 7.24s/it, loss=26.4568, acc=0.0007, iter_time=7.25s]
Epoch 0: 1%| | 67/12384 [08:06<24:47:17, 7.25s/it, loss=26.4568, acc=0.0007, iter_time=7.25s]
Epoch 0: 1%| | 67/12384 [08:14<24:47:17, 7.25s/it, loss=24.0713, acc=0.0008, iter_time=7.25s]
Epoch 0: 1%| | 68/12384 [08:14<24:47:27, 7.25s/it, loss=24.0713, acc=0.0008, iter_time=7.25s]
Epoch 0: 1%| | 68/12384 [08:21<24:47:27, 7.25s/it, loss=26.1297, acc=0.0008, iter_time=6.17s]
Epoch 0: 1%| | 69/12384 [08:21<24:46:04, 7.24s/it, loss=26.1297, acc=0.0008, iter_time=6.17s]
Epoch 0: 1%| | 69/12384 [08:28<24:46:04, 7.24s/it, loss=25.1814, acc=0.0004, iter_time=8.30s]
Epoch 0: 1%| | 70/12384 [08:28<24:46:18, 7.24s/it, loss=25.1814, acc=0.0004, iter_time=8.30s]
Epoch 0: 1%| | 70/12384 [08:35<24:46:18, 7.24s/it, loss=25.3554, acc=0.0012, iter_time=7.24s]
Epoch 0: 1%| | 71/12384 [08:35<24:46:09, 7.24s/it, loss=25.3554, acc=0.0012, iter_time=7.24s]
Epoch 0: 1%| | 71/12384 [08:43<24:46:09, 7.24s/it, loss=26.4846, acc=0.0008, iter_time=7.64s]
Epoch 0: 1%| | 72/12384 [08:43<24:46:47, 7.25s/it, loss=26.4846, acc=0.0008, iter_time=7.64s]
Epoch 0: 1%| | 72/12384 [08:50<24:46:47, 7.25s/it, loss=25.3087, acc=0.0013, iter_time=4.99s]
Epoch 0: 1%| | 73/12384 [08:50<24:48:08, 7.25s/it, loss=25.3087, acc=0.0013, iter_time=4.99s]
Epoch 0: 1%| | 73/12384 [08:57<24:48:08, 7.25s/it, loss=25.8696, acc=0.0007, iter_time=9.14s]
Epoch 0: 1%| | 74/12384 [08:57<24:47:27, 7.25s/it, loss=25.8696, acc=0.0007, iter_time=9.14s]
Epoch 0: 1%| | 74/12384 [09:04<24:47:27, 7.25s/it, loss=25.4730, acc=0.0010, iter_time=7.26s]
Epoch 0: 1%| | 75/12384 [09:04<24:47:57, 7.25s/it, loss=25.4730, acc=0.0010, iter_time=7.26s]
Epoch 0: 1%| | 75/12384 [09:12<24:47:57, 7.25s/it, loss=25.9954, acc=0.0000, iter_time=6.67s]
Epoch 0: 1%| | 76/12384 [09:12<24:46:05, 7.24s/it, loss=25.9954, acc=0.0000, iter_time=6.67s]
Epoch 0: 1%| | 76/12384 [09:19<24:46:05, 7.24s/it, loss=25.1234, acc=0.0011, iter_time=6.97s]
Epoch 0: 1%| | 77/12384 [09:19<24:47:05, 7.25s/it, loss=25.1234, acc=0.0011, iter_time=6.97s]
Epoch 0: 1%| | 77/12384 [09:26<24:47:05, 7.25s/it, loss=24.7491, acc=0.0007, iter_time=8.08s]
Epoch 0: 1%| | 78/12384 [09:26<24:45:33, 7.24s/it, loss=24.7491, acc=0.0007, iter_time=8.08s]
Epoch 0: 1%| | 78/12384 [09:33<24:45:33, 7.24s/it, loss=25.9329, acc=0.0006, iter_time=7.24s]
Epoch 0: 1%| | 79/12384 [09:33<24:45:19, 7.24s/it, loss=25.9329, acc=0.0006, iter_time=7.24s]
Epoch 0: 1%| | 79/12384 [09:41<24:45:19, 7.24s/it, loss=24.6874, acc=0.0018, iter_time=7.10s]
Epoch 0: 1%| | 80/12384 [09:41<24:44:59, 7.24s/it, loss=24.6874, acc=0.0018, iter_time=7.10s]
Epoch 0: 1%| | 80/12384 [09:48<24:44:59, 7.24s/it, loss=25.7239, acc=0.0006, iter_time=4.80s]
Epoch 0: 1%| | 81/12384 [09:48<24:45:03, 7.24s/it, loss=25.7239, acc=0.0006, iter_time=4.80s]
Epoch 0: 1%| | 81/12384 [09:55<24:45:03, 7.24s/it, loss=25.8323, acc=0.0006, iter_time=9.80s]
Epoch 0: 1%| | 82/12384 [09:55<24:45:41, 7.25s/it, loss=25.8323, acc=0.0006, iter_time=9.80s]
Epoch 0: 1%| | 82/12384 [10:02<24:45:41, 7.25s/it, loss=24.6073, acc=0.0011, iter_time=7.29s]
Epoch 0: 1%| | 83/12384 [10:02<24:46:03, 7.25s/it, loss=24.6073, acc=0.0011, iter_time=7.29s]
Epoch 0: 1%| | 83/12384 [10:09<24:46:03, 7.25s/it, loss=25.9912, acc=0.0005, iter_time=6.97s]
Epoch 0: 1%| | 84/12384 [10:09<24:44:38, 7.24s/it, loss=25.9912, acc=0.0005, iter_time=6.97s]
Epoch 0: 1%| | 84/12384 [10:17<24:44:38, 7.24s/it, loss=25.8104, acc=0.0005, iter_time=7.49s]
Epoch 0: 1%| | 85/12384 [10:17<24:43:46, 7.24s/it, loss=25.8104, acc=0.0005, iter_time=7.49s]
Epoch 0: 1%| | 85/12384 [10:24<24:43:46, 7.24s/it, loss=25.5907, acc=0.0000, iter_time=7.23s]
Epoch 0: 1%| | 86/12384 [10:24<24:43:26, 7.24s/it, loss=25.5907, acc=0.0000, iter_time=7.23s]
Epoch 0: 1%| | 86/12384 [10:31<24:43:26, 7.24s/it, loss=26.5948, acc=0.0009, iter_time=7.24s]
Epoch 0: 1%| | 87/12384 [10:31<24:47:26, 7.26s/it, loss=26.5948, acc=0.0009, iter_time=7.24s]
Epoch 0: 1%| | 87/12384 [10:39<24:47:26, 7.26s/it, loss=25.5724, acc=0.0004, iter_time=7.70s]
Epoch 0: 1%| | 88/12384 [10:39<24:47:41, 7.26s/it, loss=25.5724, acc=0.0004, iter_time=7.70s]
Epoch 0: 1%| | 88/12384 [10:46<24:47:41, 7.26s/it, loss=24.6367, acc=0.0009, iter_time=5.27s]
Epoch 0: 1%| | 89/12384 [10:46<24:47:03, 7.26s/it, loss=24.6367, acc=0.0009, iter_time=5.27s]
Epoch 0: 1%| | 89/12384 [10:53<24:47:03, 7.26s/it, loss=24.2505, acc=0.0012, iter_time=8.85s]
Epoch 0: 1%| | 90/12384 [10:53<24:45:40, 7.25s/it, loss=24.2505, acc=0.0012, iter_time=8.85s]
Epoch 0: 1%| | 90/12384 [11:00<24:45:40, 7.25s/it, loss=26.7861, acc=0.0012, iter_time=7.27s]
Epoch 0: 1%| | 91/12384 [11:00<24:46:49, 7.26s/it, loss=26.7861, acc=0.0012, iter_time=7.27s]
Epoch 0: 1%| | 91/12384 [11:08<24:46:49, 7.26s/it, loss=24.3304, acc=0.0012, iter_time=7.25s]
Epoch 0: 1%| | 92/12384 [11:08<24:46:38, 7.26s/it, loss=24.3304, acc=0.0012, iter_time=7.25s]
Epoch 0: 1%| | 92/12384 [11:15<24:46:38, 7.26s/it, loss=26.2561, acc=0.0007, iter_time=5.69s]
Epoch 0: 1%| | 93/12384 [11:15<24:45:51, 7.25s/it, loss=26.2561, acc=0.0007, iter_time=5.69s]
Epoch 0: 1%| | 93/12384 [11:22<24:45:51, 7.25s/it, loss=25.0205, acc=0.0013, iter_time=8.80s]
Epoch 0: 1%| | 94/12384 [11:22<24:44:52, 7.25s/it, loss=25.0205, acc=0.0013, iter_time=8.80s]
Epoch 0: 1%| | 94/12384 [11:29<24:44:52, 7.25s/it, loss=26.0604, acc=0.0012, iter_time=5.94s]
Epoch 0: 1%| | 95/12384 [11:29<24:43:22, 7.24s/it, loss=26.0604, acc=0.0012, iter_time=5.94s]
Epoch 0: 1%| | 95/12384 [11:37<24:43:22, 7.24s/it, loss=25.8327, acc=0.0003, iter_time=8.40s]
Epoch 0: 1%| | 96/12384 [11:37<24:44:01, 7.25s/it, loss=25.8327, acc=0.0003, iter_time=8.40s]
Epoch 0: 1%| | 96/12384 [11:44<24:44:01, 7.25s/it, loss=25.7407, acc=0.0004, iter_time=4.80s]
Epoch 0: 1%| | 97/12384 [11:44<24:44:23, 7.25s/it, loss=25.7407, acc=0.0004, iter_time=4.80s]
Epoch 0: 1%| | 97/12384 [11:51<24:44:23, 7.25s/it, loss=24.6398, acc=0.0008, iter_time=9.83s]
Epoch 0: 1%| | 98/12384 [11:51<24:43:52, 7.25s/it, loss=24.6398, acc=0.0008, iter_time=9.83s]
Epoch 0: 1%| | 98/12384 [11:59<24:43:52, 7.25s/it, loss=25.8374, acc=0.0004, iter_time=7.30s]
Epoch 0: 1%| | 99/12384 [11:59<25:00:21, 7.33s/it, loss=25.8374, acc=0.0004, iter_time=7.30s]
Epoch 0: 1%| | 99/12384 [12:06<25:00:21, 7.33s/it, loss=24.4787, acc=0.0002, iter_time=7.85s]
Epoch 0: 1%| | 100/12384 [12:06<24:55:01, 7.30s/it, loss=24.4787, acc=0.0002, iter_time=7.85s]
Epoch 0: 1%| | 100/12384 [12:13<24:55:01, 7.30s/it, loss=26.2808, acc=0.0007, iter_time=6.86s]
Epoch 0: 1%| | 101/12384 [12:13<24:51:55, 7.29s/it, loss=26.2808, acc=0.0007, iter_time=6.86s]
Epoch 0: 1%| | 101/12384 [12:20<24:51:55, 7.29s/it, loss=25.5292, acc=0.0003, iter_time=7.25s]
Epoch 0: 1%| | 102/12384 [12:20<24:49:11, 7.27s/it, loss=25.5292, acc=0.0003, iter_time=7.25s]
Epoch 0: 1%| | 102/12384 [12:28<24:49:11, 7.27s/it, loss=24.7556, acc=0.0012, iter_time=7.25s]
Epoch 0: 1%| | 103/12384 [12:28<24:47:47, 7.27s/it, loss=24.7556, acc=0.0012, iter_time=7.25s]
Epoch 0: 1%| | 103/12384 [12:35<24:47:47, 7.27s/it, loss=24.5222, acc=0.0009, iter_time=7.65s]
Epoch 0: 1%| | 104/12384 [12:35<24:47:23, 7.27s/it, loss=24.5222, acc=0.0009, iter_time=7.65s]
Epoch 0: 1%| | 104/12384 [12:42<24:47:23, 7.27s/it, loss=25.7881, acc=0.0008, iter_time=4.75s]
Epoch 0: 1%| | 105/12384 [12:42<24:44:57, 7.26s/it, loss=25.7881, acc=0.0008, iter_time=4.75s]
Epoch 0: 1%| | 105/12384 [12:49<24:44:57, 7.26s/it, loss=24.2179, acc=0.0007, iter_time=8.55s]
Epoch 0: 1%| | 106/12384 [12:49<24:46:52, 7.27s/it, loss=24.2179, acc=0.0007, iter_time=8.55s]
Epoch 0: 1%| | 106/12384 [12:57<24:46:52, 7.27s/it, loss=25.2753, acc=0.0006, iter_time=8.08s]
Epoch 0: 1%| | 107/12384 [12:57<24:45:38, 7.26s/it, loss=25.2753, acc=0.0006, iter_time=8.08s]
Epoch 0: 1%| | 107/12384 [13:04<24:45:38, 7.26s/it, loss=23.8982, acc=0.0015, iter_time=7.26s]
Epoch 0: 1%| | 108/12384 [13:04<24:45:00, 7.26s/it, loss=23.8982, acc=0.0015, iter_time=7.26s]
Epoch 0: 1%| | 108/12384 [13:11<24:45:00, 7.26s/it, loss=24.9451, acc=0.0011, iter_time=7.25s]
Epoch 0: 1%| | 109/12384 [13:11<24:44:08, 7.25s/it, loss=24.9451, acc=0.0011, iter_time=7.25s]
Epoch 0: 1%| | 109/12384 [13:18<24:44:08, 7.25s/it, loss=24.2399, acc=0.0012, iter_time=7.25s]
Epoch 0: 1%| | 110/12384 [13:18<24:43:46, 7.25s/it, loss=24.2399, acc=0.0012, iter_time=7.25s]
Epoch 0: 1%| | 110/12384 [13:26<24:43:46, 7.25s/it, loss=24.5482, acc=0.0006, iter_time=7.32s]
Epoch 0: 1%| | 111/12384 [13:26<24:48:37, 7.28s/it, loss=24.5482, acc=0.0006, iter_time=7.32s]
Epoch 0: 1%| | 111/12384 [13:33<24:48:37, 7.28s/it, loss=24.6159, acc=0.0011, iter_time=7.64s]
Epoch 0: 1%| | 112/12384 [13:33<24:46:39, 7.27s/it, loss=24.6159, acc=0.0011, iter_time=7.64s]
Epoch 0: 1%| | 112/12384 [13:40<24:46:39, 7.27s/it, loss=24.9661, acc=0.0007, iter_time=4.96s]
Epoch 0: 1%| | 113/12384 [13:40<24:45:09, 7.26s/it, loss=24.9661, acc=0.0007, iter_time=4.96s]
Epoch 0: 1%| | 113/12384 [13:47<24:45:09, 7.26s/it, loss=23.9603, acc=0.0010, iter_time=5.83s]
Epoch 0: 1%| | 114/12384 [13:47<24:44:07, 7.26s/it, loss=23.9603, acc=0.0010, iter_time=5.83s]
Epoch 0: 1%| | 114/12384 [13:55<24:44:07, 7.26s/it, loss=25.1833, acc=0.0010, iter_time=7.48s]
Epoch 0: 1%| | 115/12384 [13:55<24:42:44, 7.25s/it, loss=25.1833, acc=0.0010, iter_time=7.48s]
Epoch 0: 1%| | 115/12384 [14:02<24:42:44, 7.25s/it, loss=24.7678, acc=0.0012, iter_time=10.03s]
Epoch 0: 1%| | 116/12384 [14:02<24:41:41, 7.25s/it, loss=24.7678, acc=0.0012, iter_time=10.03s]
Epoch 0: 1%| | 116/12384 [14:09<24:41:41, 7.25s/it, loss=25.1418, acc=0.0007, iter_time=7.53s]
Epoch 0: 1%| | 117/12384 [14:09<24:42:13, 7.25s/it, loss=25.1418, acc=0.0007, iter_time=7.53s]
Epoch 0: 1%| | 117/12384 [14:16<24:42:13, 7.25s/it, loss=25.1265, acc=0.0002, iter_time=7.23s]
Epoch 0: 1%| | 118/12384 [14:16<24:40:32, 7.24s/it, loss=25.1265, acc=0.0002, iter_time=7.23s]
Epoch 0: 1%| | 118/12384 [14:24<24:40:32, 7.24s/it, loss=25.7655, acc=0.0009, iter_time=6.15s]
Epoch 0: 1%| | 119/12384 [14:24<24:39:52, 7.24s/it, loss=25.7655, acc=0.0009, iter_time=6.15s]
Epoch 0: 1%| | 119/12384 [14:31<24:39:52, 7.24s/it, loss=24.9375, acc=0.0007, iter_time=8.69s]
Epoch 0: 1%| | 120/12384 [14:31<24:39:07, 7.24s/it, loss=24.9375, acc=0.0007, iter_time=8.69s]
Epoch 0: 1%| | 120/12384 [14:38<24:39:07, 7.24s/it, loss=24.9806, acc=0.0010, iter_time=6.84s]
Epoch 0: 1%| | 121/12384 [14:38<24:38:55, 7.24s/it, loss=24.9806, acc=0.0010, iter_time=6.84s]
Epoch 0: 1%| | 121/12384 [14:45<24:38:55, 7.24s/it, loss=25.6743, acc=0.0008, iter_time=7.25s]
Epoch 0: 1%| | 122/12384 [14:45<24:38:58, 7.24s/it, loss=25.6743, acc=0.0008, iter_time=7.25s]
Epoch 0: 1%| | 122/12384 [14:52<24:38:58, 7.24s/it, loss=26.0748, acc=0.0005, iter_time=3.88s]
Epoch 0: 1%| | 123/12384 [14:52<24:38:40, 7.24s/it, loss=26.0748, acc=0.0005, iter_time=3.88s]
Epoch 0: 1%| | 123/12384 [15:00<24:38:40, 7.24s/it, loss=25.7487, acc=0.0014, iter_time=10.82s]
Epoch 0: 1%| | 124/12384 [15:00<24:52:38, 7.30s/it, loss=25.7487, acc=0.0014, iter_time=10.82s]
Epoch 0: 1%| | 124/12384 [15:07<24:52:38, 7.30s/it, loss=26.6740, acc=0.0005, iter_time=7.25s]
Epoch 0: 1%| | 125/12384 [15:07<24:49:50, 7.29s/it, loss=26.6740, acc=0.0005, iter_time=7.25s]
Epoch 0: 1%| | 125/12384 [15:14<24:49:50, 7.29s/it, loss=26.0283, acc=0.0007, iter_time=3.85s]
Epoch 0: 1%| | 126/12384 [15:14<24:46:25, 7.28s/it, loss=26.0283, acc=0.0007, iter_time=3.85s]
Epoch 0: 1%| | 126/12384 [15:22<24:46:25, 7.28s/it, loss=24.9161, acc=0.0009, iter_time=10.65s]
Epoch 0: 1%| | 127/12384 [15:22<24:44:47, 7.27s/it, loss=24.9161, acc=0.0009, iter_time=10.65s]
Epoch 0: 1%| | 127/12384 [15:29<24:44:47, 7.27s/it, loss=26.3718, acc=0.0008, iter_time=7.63s]
Epoch 0: 1%| | 128/12384 [15:29<24:43:48, 7.26s/it, loss=26.3718, acc=0.0008, iter_time=7.63s]
Epoch 0: 1%| | 128/12384 [15:36<24:43:48, 7.26s/it, loss=25.1223, acc=0.0010, iter_time=6.88s]
Epoch 0: 1%| | 129/12384 [15:36<24:43:19, 7.26s/it, loss=25.1223, acc=0.0010, iter_time=6.88s]
Epoch 0: 1%| | 129/12384 [15:43<24:43:19, 7.26s/it, loss=25.4832, acc=0.0003, iter_time=3.89s]
Epoch 0: 1%| | 130/12384 [15:43<24:41:40, 7.25s/it, loss=25.4832, acc=0.0003, iter_time=3.89s]
Epoch 0: 1%| | 130/12384 [15:51<24:41:40, 7.25s/it, loss=24.9629, acc=0.0021, iter_time=10.59s]
Epoch 0: 1%| | 131/12384 [15:51<24:41:27, 7.25s/it, loss=24.9629, acc=0.0021, iter_time=10.59s]
Epoch 0: 1%| | 131/12384 [15:58<24:41:27, 7.25s/it, loss=24.9183, acc=0.0016, iter_time=7.26s]
Epoch 0: 1%| | 132/12384 [15:58<24:40:23, 7.25s/it, loss=24.9183, acc=0.0016, iter_time=7.26s]
Epoch 0: 1%| | 132/12384 [16:05<24:40:23, 7.25s/it, loss=26.3849, acc=0.0005, iter_time=7.25s]
Epoch 0: 1%| | 133/12384 [16:05<24:40:42, 7.25s/it, loss=26.3849, acc=0.0005, iter_time=7.25s]
Epoch 0: 1%| | 133/12384 [16:12<24:40:42, 7.25s/it, loss=25.2442, acc=0.0001, iter_time=7.26s]
Epoch 0: 1%| | 134/12384 [16:12<24:41:10, 7.25s/it, loss=25.2442, acc=0.0001, iter_time=7.26s]
Epoch 0: 1%| | 134/12384 [16:20<24:41:10, 7.25s/it, loss=25.4194, acc=0.0010, iter_time=7.25s]
Epoch 0: 1%| | 135/12384 [16:20<24:40:07, 7.25s/it, loss=25.4194, acc=0.0010, iter_time=7.25s]W0323 13:19:51.617000 11145 site-packages/torch/distributed/elastic/agent/server/api.py:725] Received 15 death signal, shutting down workers
+W0323 13:19:51.635000 11145 site-packages/torch/distributed/elastic/multiprocessing/api.py:908] Sending process 11250 closing signal SIGTERM
+W0323 13:19:51.635000 11145 site-packages/torch/distributed/elastic/multiprocessing/api.py:908] Sending process 11251 closing signal SIGTERM
+W0323 13:19:51.636000 11145 site-packages/torch/distributed/elastic/multiprocessing/api.py:908] Sending process 11252 closing signal SIGTERM
+W0323 13:19:51.636000 11145 site-packages/torch/distributed/elastic/multiprocessing/api.py:908] Sending process 11253 closing signal SIGTERM
+W0323 13:19:51.636000 11145 site-packages/torch/distributed/elastic/multiprocessing/api.py:908] Sending process 11254 closing signal SIGTERM
+W0323 13:19:51.636000 11145 site-packages/torch/distributed/elastic/multiprocessing/api.py:908] Sending process 11255 closing signal SIGTERM
+W0323 13:19:51.636000 11145 site-packages/torch/distributed/elastic/multiprocessing/api.py:908] Sending process 11256 closing signal SIGTERM
+W0323 13:19:51.637000 11145 site-packages/torch/distributed/elastic/multiprocessing/api.py:908] Sending process 11257 closing signal SIGTERM
+Traceback (most recent call last):
+ File "", line 198, in _run_module_as_main
+ File "", line 88, in _run_code
+ File "/workspace/miniconda3/envs/spec/lib/python3.11/site-packages/torch/distributed/run.py", line 940, in
+ main()
+ File "/workspace/miniconda3/envs/spec/lib/python3.11/site-packages/torch/distributed/elastic/multiprocessing/errors/__init__.py", line 357, in wrapper
+ return f(*args, **kwargs)
+ ^^^^^^^^^^^^^^^^^^
+ File "/workspace/miniconda3/envs/spec/lib/python3.11/site-packages/torch/distributed/run.py", line 936, in main
+ run(args)
+ File "/workspace/miniconda3/envs/spec/lib/python3.11/site-packages/torch/distributed/run.py", line 927, in run
+ elastic_launch(
+ File "/workspace/miniconda3/envs/spec/lib/python3.11/site-packages/torch/distributed/launcher/api.py", line 156, in __call__
+ return launch_agent(self._config, self._entrypoint, list(args))
+ ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+ File "/workspace/miniconda3/envs/spec/lib/python3.11/site-packages/torch/distributed/launcher/api.py", line 284, in launch_agent
+ result = agent.run()
+ ^^^^^^^^^^^
+ File "/workspace/miniconda3/envs/spec/lib/python3.11/site-packages/torch/distributed/elastic/metrics/api.py", line 138, in wrapper
+ result = f(*args, **kwargs)
+ ^^^^^^^^^^^^^^^^^^
+ File "/workspace/miniconda3/envs/spec/lib/python3.11/site-packages/torch/distributed/elastic/agent/server/api.py", line 717, in run
+ result = self._invoke_run(role)
+ ^^^^^^^^^^^^^^^^^^^^^^
+ File "/workspace/miniconda3/envs/spec/lib/python3.11/site-packages/torch/distributed/elastic/agent/server/api.py", line 881, in _invoke_run
+ time.sleep(monitor_interval)
+ File "/workspace/miniconda3/envs/spec/lib/python3.11/site-packages/torch/distributed/elastic/multiprocessing/api.py", line 85, in _terminate_process_handler
+ raise SignalException(f"Process {os.getpid()} got signal: {sigval}", sigval=sigval)
+torch.distributed.elastic.multiprocessing.api.SignalException: Process 11145 got signal: 15
diff --git a/syxin_old/training.log b/syxin_old/training.log
new file mode 100644
index 0000000000000000000000000000000000000000..77201ad0c9ea32123830c750c52f4233a882e15c
--- /dev/null
+++ b/syxin_old/training.log
@@ -0,0 +1,118 @@
+nohup: ignoring input
+
+*****************************************
+Setting OMP_NUM_THREADS environment variable for each process to be 1 in default, to avoid your system being overloaded, please further tune the variable for optimal performance in your application as needed.
+*****************************************
+Set TORCH_CUDA_ARCH_LIST to 9.0
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+Set TORCH_CUDA_ARCH_LIST to 9.0
+Set TORCH_CUDA_ARCH_LIST to 9.0
+Set TORCH_CUDA_ARCH_LIST to 9.0
+Set TORCH_CUDA_ARCH_LIST to 9.0
+Set TORCH_CUDA_ARCH_LIST to 9.0
+Set TORCH_CUDA_ARCH_LIST to 9.0
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+Set TORCH_CUDA_ARCH_LIST to 9.0
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+/workspace/hanrui/syxin_old/Specforge/specforge/modeling/draft/llama3_eagle.py:29: UserWarning: flash_attn is not found, falling back to flex_attention. Please install flash_attn if you want to use the flash attention backend.
+ warnings.warn(
+`torch_dtype` is deprecated! Use `dtype` instead!
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+`torch_dtype` is deprecated! Use `dtype` instead!
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]`torch_dtype` is deprecated! Use `dtype` instead!
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+`torch_dtype` is deprecated! Use `dtype` instead!
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+`torch_dtype` is deprecated! Use `dtype` instead!
+`torch_dtype` is deprecated! Use `dtype` instead!
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+`torch_dtype` is deprecated! Use `dtype` instead!
+`torch_dtype` is deprecated! Use `dtype` instead!
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+The following generation flags are not valid and may be ignored: ['output_hidden_states']. Set `TRANSFORMERS_VERBOSITY=info` for more details.
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:09, 2.43s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:10, 2.56s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:10, 2.52s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:10, 2.55s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:10, 2.57s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:09, 2.50s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:10, 2.52s/it]
Loading checkpoint shards: 20%|██ | 1/5 [00:02<00:10, 2.70s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:04<00:07, 2.41s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:07, 2.52s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:07, 2.58s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:07, 2.60s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:07, 2.59s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:07, 2.58s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:07, 2.57s/it]
Loading checkpoint shards: 40%|████ | 2/5 [00:05<00:08, 2.80s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:07<00:04, 2.38s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:07<00:04, 2.49s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:07<00:04, 2.49s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:07<00:05, 2.52s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:07<00:05, 2.51s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:07<00:05, 2.53s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:07<00:05, 2.51s/it]
Loading checkpoint shards: 60%|██████ | 3/5 [00:08<00:05, 2.71s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:08<00:02, 2.14s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:09<00:02, 2.26s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:09<00:00, 1.59s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:09<00:00, 1.91s/it]
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 138.33it/s]
+
Loading checkpoint shards: 80%|████████ | 4/5 [00:09<00:02, 2.23s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:09<00:02, 2.23s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 1.73s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 2.04s/it]
+
Loading checkpoint shards: 80%|████████ | 4/5 [00:09<00:02, 2.30s/it]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 80%|████████ | 4/5 [00:09<00:02, 2.31s/it]
Loading checkpoint shards: 80%|████████ | 4/5 [00:09<00:02, 2.32s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 134.33it/s]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 1.67s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 2.01s/it]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 1.67s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 2.01s/it]
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 133.65it/s]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 138.59it/s]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 1.72s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 2.05s/it]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 1.72s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 2.06s/it]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 1.73s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 2.06s/it]
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 80%|████████ | 4/5 [00:10<00:02, 2.47s/it]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 138.20it/s]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 139.54it/s]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 134.23it/s]
+
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 1.82s/it]
Loading checkpoint shards: 100%|██████████| 5/5 [00:10<00:00, 2.19s/it]
+
Loading checkpoint shards: 0%| | 0/5 [00:00, ?it/s]
Loading checkpoint shards: 100%|██████████| 5/5 [00:00<00:00, 134.21it/s]
+trainable params: 15,335,424 || all params: 8,206,070,784 || trainable%: 0.1869
+trainable params: 15,335,424 || all params: 8,206,070,784 || trainable%: 0.1869
+trainable params: 15,335,424 || all params: 8,206,070,784 || trainable%: 0.1869
+trainable params: 15,335,424 || all params: 8,206,070,784 || trainable%: 0.1869
+trainable params: 15,335,424 || all params: 8,206,070,784 || trainable%: 0.1869
+trainable params: 15,335,424 || all params: 8,206,070,784 || trainable%: 0.1869
+trainable params: 15,335,424 || all params: 8,206,070,784 || trainable%: 0.1869
+trainable params: 15,335,424 || all params: 8,206,070,784 || trainable%: 0.1869
+dataset is cached at /tmp/specforge_cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkl
+/workspace/hanrui/specforge/lib/python3.11/site-packages/torch/distributed/distributed_c10d.py:4876: UserWarning: barrier(): using the device under current context. You can specify `device_id` in `init_process_group` to mute this warning.
+ warnings.warn( # warn only once
+[rank0]:[W310 08:22:07.434083485 ProcessGroupNCCL.cpp:5072] Guessing device ID based on global rank. This can cause a hang if rank to GPU mapping is heterogeneous. You can specify device_id in init_process_group()
+dataset is cached at /tmp/specforge_cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkldataset is cached at /tmp/specforge_cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkldataset is cached at /tmp/specforge_cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkl
+
+
+dataset is cached at /tmp/specforge_cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkl
+dataset is cached at /tmp/specforge_cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkl
+dataset is cached at /tmp/specforge_cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkl
+dataset is cached at /tmp/specforge_cache/processed_dataset/b2b7bdc9eb8a4170c0d33f03d2bf640b.pkl
+
Epoch 0: 0%| | 0/12384 [00:00, ?it/s]
Epoch 0: 0%| | 0/12384 [00:08, ?it/s, loss=11.4616, acc=0.0002, iter_time=7.95s]
Epoch 0: 0%| | 1/12384 [00:08<28:52:24, 8.39s/it, loss=11.4616, acc=0.0002, iter_time=7.95s]
Epoch 0: 0%| | 1/12384 [00:16<28:52:24, 8.39s/it, loss=10.6726, acc=0.0003, iter_time=6.47s]
Epoch 0: 0%| | 2/12384 [00:16<27:23:24, 7.96s/it, loss=10.6726, acc=0.0003, iter_time=6.47s]
Epoch 0: 0%| | 2/12384 [00:23<27:23:24, 7.96s/it, loss=10.4985, acc=0.0011, iter_time=8.86s]
Epoch 0: 0%| | 3/12384 [00:23<26:55:47, 7.83s/it, loss=10.4985, acc=0.0011, iter_time=8.86s]
Epoch 0: 0%| | 3/12384 [00:31<26:55:47, 7.83s/it, loss=12.4512, acc=0.0002, iter_time=4.60s]
Epoch 0: 0%| | 4/12384 [00:31<26:42:04, 7.76s/it, loss=12.4512, acc=0.0002, iter_time=4.60s]
Epoch 0: 0%| | 4/12384 [00:39<26:42:04, 7.76s/it, loss=10.6913, acc=0.0007, iter_time=10.74s]
Epoch 0: 0%| | 5/12384 [00:39<26:37:07, 7.74s/it, loss=10.6913, acc=0.0007, iter_time=10.74s]
Epoch 0: 0%| | 5/12384 [00:46<26:37:07, 7.74s/it, loss=10.7935, acc=0.0006, iter_time=7.67s]
Epoch 0: 0%| | 6/12384 [00:46<26:30:41, 7.71s/it, loss=10.7935, acc=0.0006, iter_time=7.67s]
Epoch 0: 0%| | 6/12384 [00:54<26:30:41, 7.71s/it, loss=12.5651, acc=0.0002, iter_time=7.69s]
Epoch 0: 0%| | 7/12384 [00:54<26:29:17, 7.70s/it, loss=12.5651, acc=0.0002, iter_time=7.69s]
Epoch 0: 0%| | 7/12384 [01:02<26:29:17, 7.70s/it, loss=11.6807, acc=0.0003, iter_time=8.32s]
Epoch 0: 0%| | 8/12384 [01:02<26:39:38, 7.76s/it, loss=11.6807, acc=0.0003, iter_time=8.32s]
Epoch 0: 0%| | 8/12384 [01:09<26:39:38, 7.76s/it, loss=11.3789, acc=0.0005, iter_time=4.95s]
Epoch 0: 0%| | 9/12384 [01:09<26:32:57, 7.72s/it, loss=11.3789, acc=0.0005, iter_time=4.95s]
Epoch 0: 0%| | 9/12384 [01:17<26:32:57, 7.72s/it, loss=10.5343, acc=0.0003, iter_time=10.35s]
Epoch 0: 0%| | 10/12384 [01:17<26:52:52, 7.82s/it, loss=10.5343, acc=0.0003, iter_time=10.35s]
Epoch 0: 0%| | 10/12384 [01:25<26:52:52, 7.82s/it, loss=11.6157, acc=0.0004, iter_time=7.60s]
Epoch 0: 0%| | 11/12384 [01:25<26:39:20, 7.76s/it, loss=11.6157, acc=0.0004, iter_time=7.60s]
Epoch 0: 0%| | 11/12384 [01:33<26:39:20, 7.76s/it, loss=11.2005, acc=0.0002, iter_time=7.61s]
Epoch 0: 0%| | 12/12384 [01:33<26:30:56, 7.72s/it, loss=11.2005, acc=0.0002, iter_time=7.61s]
Epoch 0: 0%| | 12/12384 [01:40<26:30:56, 7.72s/it, loss=11.8510, acc=0.0011, iter_time=5.03s]
Epoch 0: 0%| | 13/12384 [01:40<26:28:03, 7.70s/it, loss=11.8510, acc=0.0011, iter_time=5.03s]
Epoch 0: 0%| | 13/12384 [01:48<26:28:03, 7.70s/it, loss=12.6667, acc=0.0004, iter_time=8.56s]
Epoch 0: 0%| | 14/12384 [01:48<26:24:01, 7.68s/it, loss=12.6667, acc=0.0004, iter_time=8.56s]
Epoch 0: 0%| | 14/12384 [01:56<26:24:01, 7.68s/it, loss=11.3266, acc=0.0002, iter_time=9.36s]
Epoch 0: 0%| | 15/12384 [01:56<26:21:37, 7.67s/it, loss=11.3266, acc=0.0002, iter_time=9.36s]
Epoch 0: 0%| | 15/12384 [02:03<26:21:37, 7.67s/it, loss=12.2026, acc=0.0000, iter_time=7.61s]
Epoch 0: 0%| | 16/12384 [02:03<26:18:20, 7.66s/it, loss=12.2026, acc=0.0000, iter_time=7.61s]
Epoch 0: 0%| | 16/12384 [02:11<26:18:20, 7.66s/it, loss=10.7707, acc=0.0003, iter_time=6.47s]
Epoch 0: 0%| | 17/12384 [02:11<26:16:34, 7.65s/it, loss=10.7707, acc=0.0003, iter_time=6.47s]
Epoch 0: 0%| | 17/12384 [02:19<26:16:34, 7.65s/it, loss=10.9714, acc=0.0001, iter_time=8.84s]
Epoch 0: 0%| | 18/12384 [02:19<26:15:13, 7.64s/it, loss=10.9714, acc=0.0001, iter_time=8.84s]
Epoch 0: 0%| | 18/12384 [02:26<26:15:13, 7.64s/it, loss=11.0658, acc=0.0002, iter_time=6.42s]
Epoch 0: 0%| | 19/12384 [02:26<26:18:08, 7.66s/it, loss=11.0658, acc=0.0002, iter_time=6.42s]
Epoch 0: 0%| | 19/12384 [02:34<26:18:08, 7.66s/it, loss=10.9882, acc=0.0011, iter_time=8.88s]
Epoch 0: 0%| | 20/12384 [02:34<26:18:16, 7.66s/it, loss=10.9882, acc=0.0011, iter_time=8.88s]
Epoch 0: 0%| | 20/12384 [02:42<26:18:16, 7.66s/it, loss=11.3002, acc=0.0000, iter_time=7.65s]
Epoch 0: 0%| | 21/12384 [02:42<26:14:15, 7.64s/it, loss=11.3002, acc=0.0000, iter_time=7.65s]
Epoch 0: 0%| | 21/12384 [02:49<26:14:15, 7.64s/it, loss=10.9236, acc=0.0005, iter_time=7.62s]
Epoch 0: 0%| | 22/12384 [02:49<26:14:09, 7.64s/it, loss=10.9236, acc=0.0005, iter_time=7.62s]
Epoch 0: 0%| | 22/12384 [02:57<26:14:09, 7.64s/it, loss=11.6876, acc=0.0004, iter_time=7.64s]
Epoch 0: 0%| | 23/12384 [02:57<26:13:31, 7.64s/it, loss=11.6876, acc=0.0004, iter_time=7.64s]
Epoch 0: 0%| | 23/12384 [03:04<26:13:31, 7.64s/it, loss=10.1433, acc=0.0008, iter_time=8.02s]
Epoch 0: 0%| | 24/12384 [03:04<26:12:22, 7.63s/it, loss=10.1433, acc=0.0008, iter_time=8.02s]
Epoch 0: 0%| | 24/12384 [03:12<26:12:22, 7.63s/it, loss=11.4336, acc=0.0007, iter_time=7.26s]
Epoch 0: 0%| | 25/12384 [03:12<26:12:18, 7.63s/it, loss=11.4336, acc=0.0007, iter_time=7.26s]
Epoch 0: 0%| | 25/12384 [03:20<26:12:18, 7.63s/it, loss=11.4074, acc=0.0004, iter_time=7.63s]
Epoch 0: 0%| | 26/12384 [03:20<26:12:54, 7.64s/it, loss=11.4074, acc=0.0004, iter_time=7.63s]
Epoch 0: 0%| | 26/12384 [03:27<26:12:54, 7.64s/it, loss=11.0375, acc=0.0009, iter_time=7.64s]
Epoch 0: 0%| | 27/12384 [03:27<26:12:45, 7.64s/it, loss=11.0375, acc=0.0009, iter_time=7.64s]
Epoch 0: 0%| | 27/12384 [03:35<26:12:45, 7.64s/it, loss=13.4672, acc=0.0000, iter_time=4.34s]
Epoch 0: 0%| | 28/12384 [03:35<26:12:58, 7.64s/it, loss=13.4672, acc=0.0000, iter_time=4.34s]
Epoch 0: 0%| | 28/12384 [03:43<26:12:58, 7.64s/it, loss=10.7064, acc=0.0000, iter_time=10.95s]
Epoch 0: 0%| | 29/12384 [03:43<26:15:30, 7.65s/it, loss=10.7064, acc=0.0000, iter_time=10.95s]
Epoch 0: 0%| | 29/12384 [03:50<26:15:30, 7.65s/it, loss=10.6316, acc=0.0007, iter_time=7.05s]
Epoch 0: 0%| | 30/12384 [03:50<26:15:49, 7.65s/it, loss=10.6316, acc=0.0007, iter_time=7.05s]
Epoch 0: 0%| | 30/12384 [03:58<26:15:49, 7.65s/it, loss=10.6725, acc=0.0005, iter_time=8.31s]
Epoch 0: 0%| | 31/12384 [03:58<26:18:34, 7.67s/it, loss=10.6725, acc=0.0005, iter_time=8.31s]
Epoch 0: 0%| | 31/12384 [04:06<26:18:34, 7.67s/it, loss=11.1389, acc=0.0004, iter_time=8.08s]
Epoch 0: 0%| | 32/12384 [04:06<26:18:20, 7.67s/it, loss=11.1389, acc=0.0004, iter_time=8.08s]
Epoch 0: 0%| | 32/12384 [04:13<26:18:20, 7.67s/it, loss=11.0649, acc=0.0006, iter_time=7.25s]
Epoch 0: 0%| | 33/12384 [04:13<26:16:12, 7.66s/it, loss=11.0649, acc=0.0006, iter_time=7.25s]
Epoch 0: 0%| | 33/12384 [04:21<26:16:12, 7.66s/it, loss=10.9385, acc=0.0015, iter_time=7.64s]
Epoch 0: 0%| | 34/12384 [04:21<26:16:33, 7.66s/it, loss=10.9385, acc=0.0015, iter_time=7.64s]
Epoch 0: 0%| | 34/12384 [04:29<26:16:33, 7.66s/it, loss=11.5272, acc=0.0016, iter_time=5.92s]
Epoch 0: 0%| | 35/12384 [04:29<26:15:45, 7.66s/it, loss=11.5272, acc=0.0016, iter_time=5.92s]
Epoch 0: 0%| | 35/12384 [04:37<26:15:45, 7.66s/it, loss=10.9093, acc=0.0003, iter_time=9.69s]
Epoch 0: 0%| | 36/12384 [04:37<26:32:15, 7.74s/it, loss=10.9093, acc=0.0003, iter_time=9.69s]
Epoch 0: 0%| | 36/12384 [04:45<26:32:15, 7.74s/it, loss=12.0866, acc=0.0007, iter_time=7.66s]
Epoch 0: 0%| | 37/12384 [04:45<26:49:10, 7.82s/it, loss=12.0866, acc=0.0007, iter_time=7.66s]
Epoch 0: 0%| | 37/12384 [04:52<26:49:10, 7.82s/it, loss=12.0058, acc=0.0010, iter_time=4.01s]
Epoch 0: 0%| | 38/12384 [04:52<26:39:22, 7.77s/it, loss=12.0058, acc=0.0010, iter_time=4.01s]
Epoch 0: 0%| | 38/12384 [05:00<26:39:22, 7.77s/it, loss=11.0774, acc=0.0005, iter_time=11.59s]
Epoch 0: 0%| | 39/12384 [05:00<26:30:19, 7.73s/it, loss=11.0774, acc=0.0005, iter_time=11.59s]
Epoch 0: 0%| | 39/12384 [05:07<26:30:19, 7.73s/it, loss=11.2613, acc=0.0001, iter_time=8.04s]
Epoch 0: 0%| | 40/12384 [05:07<26:25:19, 7.71s/it, loss=11.2613, acc=0.0001, iter_time=8.04s]
Epoch 0: 0%| | 40/12384 [05:15<26:25:19, 7.71s/it, loss=10.6729, acc=0.0005, iter_time=7.24s]
Epoch 0: 0%| | 41/12384 [05:15<26:20:47, 7.68s/it, loss=10.6729, acc=0.0005, iter_time=7.24s]
Epoch 0: 0%| | 41/12384 [05:23<26:20:47, 7.68s/it, loss=10.2672, acc=0.0007, iter_time=7.62s]
Epoch 0: 0%| | 42/12384 [05:23<26:15:46, 7.66s/it, loss=10.2672, acc=0.0007, iter_time=7.62s]
Epoch 0: 0%| | 42/12384 [05:30<26:15:46, 7.66s/it, loss=11.5034, acc=0.0001, iter_time=7.04s]
Epoch 0: 0%| | 43/12384 [05:30<26:15:27, 7.66s/it, loss=11.5034, acc=0.0001, iter_time=7.04s]
Epoch 0: 0%| | 43/12384 [05:38<26:15:27, 7.66s/it, loss=11.4143, acc=0.0005, iter_time=8.24s]
Epoch 0: 0%| | 44/12384 [05:38<26:12:08, 7.64s/it, loss=11.4143, acc=0.0005, iter_time=8.24s]
Epoch 0: 0%| | 44/12384 [05:46<26:12:08, 7.64s/it, loss=11.8333, acc=0.0000, iter_time=7.62s]
Epoch 0: 0%| | 45/12384 [05:46<26:10:39, 7.64s/it, loss=11.8333, acc=0.0000, iter_time=7.62s]
Epoch 0: 0%| | 45/12384 [05:53<26:10:39, 7.64s/it, loss=12.4923, acc=0.0009, iter_time=4.75s]
Epoch 0: 0%| | 46/12384 [05:53<26:10:04, 7.64s/it, loss=12.4923, acc=0.0009, iter_time=4.75s]
Epoch 0: 0%| | 46/12384 [06:01<26:10:04, 7.64s/it, loss=10.7213, acc=0.0009, iter_time=10.48s]
Epoch 0: 0%| | 47/12384 [06:01<26:09:32, 7.63s/it, loss=10.7213, acc=0.0009, iter_time=10.48s]
Epoch 0: 0%| | 47/12384 [06:08<26:09:32, 7.63s/it, loss=11.5314, acc=0.0005, iter_time=8.04s]
Epoch 0: 0%| | 48/12384 [06:08<26:08:16, 7.63s/it, loss=11.5314, acc=0.0005, iter_time=8.04s]
Epoch 0: 0%| | 48/12384 [06:16<26:08:16, 7.63s/it, loss=12.5196, acc=0.0004, iter_time=5.45s]
Epoch 0: 0%| | 49/12384 [06:16<26:10:43, 7.64s/it, loss=12.5196, acc=0.0004, iter_time=5.45s]
Epoch 0: 0%| | 49/12384 [06:24<26:10:43, 7.64s/it, loss=12.3785, acc=0.0006, iter_time=9.85s]
Epoch 0: 0%| | 50/12384 [06:24<26:09:30, 7.64s/it, loss=12.3785, acc=0.0006, iter_time=9.85s]
Epoch 0: 0%| | 50/12384 [06:31<26:09:30, 7.64s/it, loss=11.2568, acc=0.0005, iter_time=4.59s]
Epoch 0: 0%| | 51/12384 [06:31<26:09:54, 7.64s/it, loss=11.2568, acc=0.0005, iter_time=4.59s]
Epoch 0: 0%| | 51/12384 [06:39<26:09:54, 7.64s/it, loss=12.6810, acc=0.0005, iter_time=9.62s]
Epoch 0: 0%| | 52/12384 [06:39<26:08:42, 7.63s/it, loss=12.6810, acc=0.0005, iter_time=9.62s]
Epoch 0: 0%| | 52/12384 [06:47<26:08:42, 7.63s/it, loss=11.2767, acc=0.0006, iter_time=8.28s]
Epoch 0: 0%| | 53/12384 [06:47<26:07:18, 7.63s/it, loss=11.2767, acc=0.0006, iter_time=8.28s]
Epoch 0: 0%| | 53/12384 [06:54<26:07:18, 7.63s/it, loss=12.0088, acc=0.0004, iter_time=4.82s]
Epoch 0: 0%| | 54/12384 [06:54<26:06:35, 7.62s/it, loss=12.0088, acc=0.0004, iter_time=4.82s]
Epoch 0: 0%| | 54/12384 [07:02<26:06:35, 7.62s/it, loss=12.1385, acc=0.0004, iter_time=10.43s]
Epoch 0: 0%| | 55/12384 [07:02<26:07:25, 7.63s/it, loss=12.1385, acc=0.0004, iter_time=10.43s]
Epoch 0: 0%| | 55/12384 [07:10<26:07:25, 7.63s/it, loss=10.7962, acc=0.0001, iter_time=8.01s]
Epoch 0: 0%| | 56/12384 [07:10<26:12:48, 7.65s/it, loss=10.7962, acc=0.0001, iter_time=8.01s]
Epoch 0: 0%| | 56/12384 [07:17<26:12:48, 7.65s/it, loss=11.5871, acc=0.0005, iter_time=6.45s]
Epoch 0: 0%| | 57/12384 [07:17<26:10:12, 7.64s/it, loss=11.5871, acc=0.0005, iter_time=6.45s]
Epoch 0: 0%| | 57/12384 [07:25<26:10:12, 7.64s/it, loss=14.1009, acc=0.0005, iter_time=5.16s]
Epoch 0: 0%| | 58/12384 [07:25<26:10:08, 7.64s/it, loss=14.1009, acc=0.0005, iter_time=5.16s]
Epoch 0: 0%| | 58/12384 [07:33<26:10:08, 7.64s/it, loss=10.7893, acc=0.0008, iter_time=10.96s]
Epoch 0: 0%| | 59/12384 [07:33<26:08:22, 7.64s/it, loss=10.7893, acc=0.0008, iter_time=10.96s]
Epoch 0: 0%| | 59/12384 [07:40<26:08:22, 7.64s/it, loss=10.9049, acc=0.0003, iter_time=7.62s]
Epoch 0: 0%| | 60/12384 [07:40<26:05:26, 7.62s/it, loss=10.9049, acc=0.0003, iter_time=7.62s]
Epoch 0: 0%| | 60/12384 [07:48<26:05:26, 7.62s/it, loss=11.4199, acc=0.0004, iter_time=6.67s]
Epoch 0: 0%| | 61/12384 [07:48<26:09:03, 7.64s/it, loss=11.4199, acc=0.0004, iter_time=6.67s]
Epoch 0: 0%| | 61/12384 [07:56<26:09:03, 7.64s/it, loss=13.1510, acc=0.0002, iter_time=7.12s]
Epoch 0: 1%| | 62/12384 [07:56<26:28:37, 7.74s/it, loss=13.1510, acc=0.0002, iter_time=7.12s]
Epoch 0: 1%| | 62/12384 [08:03<26:28:37, 7.74s/it, loss=10.5607, acc=0.0006, iter_time=9.46s]
Epoch 0: 1%| | 63/12384 [08:03<26:21:20, 7.70s/it, loss=10.5607, acc=0.0006, iter_time=9.46s]
Epoch 0: 1%| | 63/12384 [08:11<26:21:20, 7.70s/it, loss=11.2135, acc=0.0007, iter_time=7.68s]
Epoch 0: 1%| | 64/12384 [08:11<26:17:46, 7.68s/it, loss=11.2135, acc=0.0007, iter_time=7.68s]
Epoch 0: 1%| | 64/12384 [08:19<26:17:46, 7.68s/it, loss=11.6287, acc=0.0007, iter_time=7.01s]
Epoch 0: 1%| | 65/12384 [08:19<26:14:43, 7.67s/it, loss=11.6287, acc=0.0007, iter_time=7.01s]
Epoch 0: 1%| | 65/12384 [08:26<26:14:43, 7.67s/it, loss=11.7011, acc=0.0006, iter_time=8.20s]
Epoch 0: 1%| | 66/12384 [08:26<26:13:16, 7.66s/it, loss=11.7011, acc=0.0006, iter_time=8.20s]
Epoch 0: 1%| | 66/12384 [08:34<26:13:16, 7.66s/it, loss=11.1116, acc=0.0009, iter_time=7.66s]
Epoch 0: 1%| | 67/12384 [08:34<26:10:08, 7.65s/it, loss=11.1116, acc=0.0009, iter_time=7.66s]
Epoch 0: 1%| | 67/12384 [08:42<26:10:08, 7.65s/it, loss=10.5857, acc=0.0003, iter_time=7.62s]
Epoch 0: 1%| | 68/12384 [08:42<26:08:44, 7.64s/it, loss=10.5857, acc=0.0003, iter_time=7.62s]
Epoch 0: 1%| | 68/12384 [08:49<26:08:44, 7.64s/it, loss=12.2984, acc=0.0002, iter_time=6.42s]
Epoch 0: 1%| | 69/12384 [08:49<26:10:22, 7.65s/it, loss=12.2984, acc=0.0002, iter_time=6.42s]
Epoch 0: 1%| | 69/12384 [08:57<26:10:22, 7.65s/it, loss=10.6612, acc=0.0003, iter_time=8.87s]
Epoch 0: 1%| | 70/12384 [08:57<26:10:57, 7.65s/it, loss=10.6612, acc=0.0003, iter_time=8.87s]
Epoch 0: 1%| | 70/12384 [09:05<26:10:57, 7.65s/it, loss=10.8825, acc=0.0005, iter_time=7.65s]
Epoch 0: 1%| | 71/12384 [09:05<26:10:27, 7.65s/it, loss=10.8825, acc=0.0005, iter_time=7.65s]
Epoch 0: 1%| | 71/12384 [09:12<26:10:27, 7.65s/it, loss=10.7391, acc=0.0006, iter_time=8.04s]
Epoch 0: 1%| | 72/12384 [09:12<26:08:05, 7.64s/it, loss=10.7391, acc=0.0006, iter_time=8.04s]
Epoch 0: 1%| | 72/12384 [09:20<26:08:05, 7.64s/it, loss=12.1920, acc=0.0007, iter_time=5.13s]
Epoch 0: 1%| | 73/12384 [09:20<26:11:50, 7.66s/it, loss=12.1920, acc=0.0007, iter_time=5.13s]
Epoch 0: 1%| | 73/12384 [09:27<26:11:50, 7.66s/it, loss=10.5516, acc=0.0004, iter_time=9.80s]
Epoch 0: 1%| | 74/12384 [09:27<26:10:12, 7.65s/it, loss=10.5516, acc=0.0004, iter_time=9.80s]
Epoch 0: 1%| | 74/12384 [09:35<26:10:12, 7.65s/it, loss=10.1934, acc=0.0006, iter_time=7.66s]
Epoch 0: 1%| | 75/12384 [09:35<26:13:17, 7.67s/it, loss=10.1934, acc=0.0006, iter_time=7.66s]
Epoch 0: 1%| | 75/12384 [09:43<26:13:17, 7.67s/it, loss=11.6410, acc=0.0000, iter_time=7.04s]
Epoch 0: 1%| | 76/12384 [09:43<26:09:20, 7.65s/it, loss=11.6410, acc=0.0000, iter_time=7.04s]
Epoch 0: 1%| | 76/12384 [09:50<26:09:20, 7.65s/it, loss=10.9323, acc=0.0004, iter_time=7.31s]
Epoch 0: 1%| | 77/12384 [09:50<26:07:08, 7.64s/it, loss=10.9323, acc=0.0004, iter_time=7.31s]
Epoch 0: 1%| | 77/12384 [09:58<26:07:08, 7.64s/it, loss=11.0105, acc=0.0003, iter_time=8.54s]
Epoch 0: 1%| | 78/12384 [09:58<26:05:41, 7.63s/it, loss=11.0105, acc=0.0003, iter_time=8.54s]
Epoch 0: 1%| | 78/12384 [10:06<26:05:41, 7.63s/it, loss=10.8721, acc=0.0004, iter_time=7.63s]
Epoch 0: 1%| | 79/12384 [10:06<26:05:22, 7.63s/it, loss=10.8721, acc=0.0004, iter_time=7.63s]
Epoch 0: 1%| | 79/12384 [10:13<26:05:22, 7.63s/it, loss=11.3602, acc=0.0013, iter_time=7.61s]
Epoch 0: 1%| | 80/12384 [10:13<26:05:57, 7.64s/it, loss=11.3602, acc=0.0013, iter_time=7.61s]
Epoch 0: 1%| | 80/12384 [10:21<26:05:57, 7.64s/it, loss=12.4490, acc=0.0004, iter_time=4.84s]
Epoch 0: 1%| | 81/12384 [10:21<26:05:10, 7.63s/it, loss=12.4490, acc=0.0004, iter_time=4.84s]
Epoch 0: 1%| | 81/12384 [10:29<26:05:10, 7.63s/it, loss=11.2284, acc=0.0006, iter_time=10.44s]
Epoch 0: 1%| | 82/12384 [10:29<26:04:56, 7.63s/it, loss=11.2284, acc=0.0006, iter_time=10.44s]
Epoch 0: 1%| | 82/12384 [10:36<26:04:56, 7.63s/it, loss=11.5251, acc=0.0009, iter_time=7.66s]
Epoch 0: 1%| | 83/12384 [10:36<26:05:22, 7.64s/it, loss=11.5251, acc=0.0009, iter_time=7.66s]
Epoch 0: 1%| | 83/12384 [10:44<26:05:22, 7.64s/it, loss=11.2945, acc=0.0005, iter_time=7.31s]
Epoch 0: 1%| | 84/12384 [10:44<26:05:29, 7.64s/it, loss=11.2945, acc=0.0005, iter_time=7.31s]
Epoch 0: 1%| | 84/12384 [10:51<26:05:29, 7.64s/it, loss=10.4840, acc=0.0002, iter_time=7.96s]
Epoch 0: 1%| | 85/12384 [10:51<26:04:50, 7.63s/it, loss=10.4840, acc=0.0002, iter_time=7.96s]
Epoch 0: 1%| | 85/12384 [10:59<26:04:50, 7.63s/it, loss=10.6111, acc=0.0000, iter_time=7.63s]
Epoch 0: 1%| | 86/12384 [10:59<26:04:25, 7.63s/it, loss=10.6111, acc=0.0000, iter_time=7.63s]
Epoch 0: 1%| | 86/12384 [11:07<26:04:25, 7.63s/it, loss=10.8529, acc=0.0007, iter_time=7.63s]
Epoch 0: 1%| | 87/12384 [11:07<26:06:07, 7.64s/it, loss=10.8529, acc=0.0007, iter_time=7.63s]
Epoch 0: 1%| | 87/12384 [11:14<26:06:07, 7.64s/it, loss=11.2738, acc=0.0003, iter_time=8.06s]
Epoch 0: 1%| | 88/12384 [11:14<26:05:24, 7.64s/it, loss=11.2738, acc=0.0003, iter_time=8.06s]
Epoch 0: 1%| | 88/12384 [11:22<26:05:24, 7.64s/it, loss=11.2256, acc=0.0007, iter_time=5.78s]
Epoch 0: 1%| | 89/12384 [11:22<26:25:48, 7.74s/it, loss=11.2256, acc=0.0007, iter_time=5.78s]
Epoch 0: 1%| | 89/12384 [11:30<26:25:48, 7.74s/it, loss=11.0972, acc=0.0007, iter_time=9.42s]
Epoch 0: 1%| | 90/12384 [11:30<26:19:15, 7.71s/it, loss=11.0972, acc=0.0007, iter_time=9.42s]
Epoch 0: 1%| | 90/12384 [11:38<26:19:15, 7.71s/it, loss=10.9571, acc=0.0001, iter_time=7.64s]
Epoch 0: 1%| | 91/12384 [11:38<26:13:34, 7.68s/it, loss=10.9571, acc=0.0001, iter_time=7.64s]
Epoch 0: 1%| | 91/12384 [11:45<26:13:34, 7.68s/it, loss=10.6801, acc=0.0009, iter_time=7.60s]
Epoch 0: 1%| | 92/12384 [11:45<26:09:53, 7.66s/it, loss=10.6801, acc=0.0009, iter_time=7.60s]
Epoch 0: 1%| | 92/12384 [11:53<26:09:53, 7.66s/it, loss=12.3925, acc=0.0003, iter_time=5.89s]
Epoch 0: 1%| | 93/12384 [11:53<26:09:45, 7.66s/it, loss=12.3925, acc=0.0003, iter_time=5.89s]
Epoch 0: 1%| | 93/12384 [12:01<26:09:45, 7.66s/it, loss=10.8816, acc=0.0004, iter_time=9.39s]
Epoch 0: 1%| | 94/12384 [12:01<26:08:02, 7.66s/it, loss=10.8816, acc=0.0004, iter_time=9.39s]
Epoch 0: 1%| | 94/12384 [12:08<26:08:02, 7.66s/it, loss=12.1385, acc=0.0006, iter_time=6.20s]
Epoch 0: 1%| | 95/12384 [12:08<26:08:16, 7.66s/it, loss=12.1385, acc=0.0006, iter_time=6.20s]
Epoch 0: 1%| | 95/12384 [12:16<26:08:16, 7.66s/it, loss=12.2838, acc=0.0003, iter_time=9.09s]
Epoch 0: 1%| | 96/12384 [12:16<26:07:25, 7.65s/it, loss=12.2838, acc=0.0003, iter_time=9.09s]
Epoch 0: 1%| | 96/12384 [12:23<26:07:25, 7.65s/it, loss=12.4777, acc=0.0002, iter_time=4.85s]
Epoch 0: 1%| | 97/12384 [12:23<26:06:29, 7.65s/it, loss=12.4777, acc=0.0002, iter_time=4.85s]
Epoch 0: 1%| | 97/12384 [12:31<26:06:29, 7.65s/it, loss=11.9554, acc=0.0004, iter_time=10.47s]
Epoch 0: 1%| | 98/12384 [12:31<26:04:05, 7.64s/it, loss=11.9554, acc=0.0004, iter_time=10.47s]
Epoch 0: 1%| | 98/12384 [12:39<26:04:05, 7.64s/it, loss=10.9768, acc=0.0004, iter_time=7.63s]
Epoch 0: 1%| | 99/12384 [12:39<26:04:48, 7.64s/it, loss=10.9768, acc=0.0004, iter_time=7.63s]
Epoch 0: 1%| | 99/12384 [12:46<26:04:48, 7.64s/it, loss=10.7849, acc=0.0000, iter_time=8.05s]
Epoch 0: 1%| | 100/12384 [12:46<26:03:52, 7.64s/it, loss=10.7849, acc=0.0000, iter_time=8.05s]
Epoch 0: 1%| | 100/12384 [12:54<26:03:52, 7.64s/it, loss=11.4376, acc=0.0003, iter_time=7.24s]
Epoch 0: 1%| | 101/12384 [12:54<26:03:53, 7.64s/it, loss=11.4376, acc=0.0003, iter_time=7.24s]
Epoch 0: 1%| | 101/12384 [13:02<26:03:53, 7.64s/it, loss=11.4607, acc=0.0003, iter_time=7.64s]
Epoch 0: 1%| | 102/12384 [13:02<26:05:40, 7.65s/it, loss=11.4607, acc=0.0003, iter_time=7.64s]
Epoch 0: 1%| | 102/12384 [13:09<26:05:40, 7.65s/it, loss=11.0372, acc=0.0003, iter_time=7.66s]
Epoch 0: 1%| | 103/12384 [13:09<26:04:55, 7.65s/it, loss=11.0372, acc=0.0003, iter_time=7.66s]
Epoch 0: 1%| | 103/12384 [13:17<26:04:55, 7.65s/it, loss=11.2025, acc=0.0004, iter_time=8.03s]
Epoch 0: 1%| | 104/12384 [13:17<26:04:11, 7.64s/it, loss=11.2025, acc=0.0004, iter_time=8.03s]
Epoch 0: 1%| | 104/12384 [13:25<26:04:11, 7.64s/it, loss=12.3039, acc=0.0006, iter_time=4.90s]
Epoch 0: 1%| | 105/12384 [13:25<26:04:23, 7.64s/it, loss=12.3039, acc=0.0006, iter_time=4.90s]
Epoch 0: 1%| | 105/12384 [13:32<26:04:23, 7.64s/it, loss=10.6288, acc=0.0004, iter_time=9.11s]
Epoch 0: 1%| | 106/12384 [13:32<26:06:49, 7.66s/it, loss=10.6288, acc=0.0004, iter_time=9.11s]
Epoch 0: 1%| | 106/12384 [13:40<26:06:49, 7.66s/it, loss=11.4025, acc=0.0003, iter_time=8.57s]
Epoch 0: 1%| | 107/12384 [13:40<26:11:31, 7.68s/it, loss=11.4025, acc=0.0003, iter_time=8.57s]
Epoch 0: 1%| | 107/12384 [13:48<26:11:31, 7.68s/it, loss=10.4986, acc=0.0008, iter_time=7.75s]
Epoch 0: 1%| | 108/12384 [13:48<26:08:36, 7.67s/it, loss=10.4986, acc=0.0008, iter_time=7.75s]
Epoch 0: 1%| | 108/12384 [13:55<26:08:36, 7.67s/it, loss=10.0305, acc=0.0009, iter_time=7.62s]
Epoch 0: 1%| | 109/12384 [13:55<26:06:18, 7.66s/it, loss=10.0305, acc=0.0009, iter_time=7.62s]
Epoch 0: 1%| | 109/12384 [14:03<26:06:18, 7.66s/it, loss=10.4411, acc=0.0003, iter_time=7.66s]
Epoch 0: 1%| | 110/12384 [14:03<26:05:16, 7.65s/it, loss=10.4411, acc=0.0003, iter_time=7.66s]
Epoch 0: 1%| | 110/12384 [14:11<26:05:16, 7.65s/it, loss=11.6141, acc=0.0005, iter_time=7.70s]
Epoch 0: 1%| | 111/12384 [14:11<26:08:19, 7.67s/it, loss=11.6141, acc=0.0005, iter_time=7.70s]
Epoch 0: 1%| | 111/12384 [14:18<26:08:19, 7.67s/it, loss=11.2663, acc=0.0000, iter_time=8.01s]
Epoch 0: 1%| | 112/12384 [14:18<26:06:23, 7.66s/it, loss=11.2663, acc=0.0000, iter_time=8.01s]
Epoch 0: 1%| | 112/12384 [14:26<26:06:23, 7.66s/it, loss=11.4721, acc=0.0005, iter_time=5.13s]
Epoch 0: 1%| | 113/12384 [14:26<26:04:23, 7.65s/it, loss=11.4721, acc=0.0005, iter_time=5.13s]
Epoch 0: 1%| | 113/12384 [14:34<26:04:23, 7.65s/it, loss=11.8473, acc=0.0004, iter_time=6.20s]
Epoch 0: 1%| | 114/12384 [14:34<26:02:36, 7.64s/it, loss=11.8473, acc=0.0004, iter_time=6.20s]
Epoch 0: 1%| | 114/12384 [14:41<26:02:36, 7.64s/it, loss=11.5466, acc=0.0006, iter_time=7.83s]
Epoch 0: 1%| | 115/12384 [14:41<26:01:00, 7.63s/it, loss=11.5466, acc=0.0006, iter_time=7.83s]
Epoch 0: 1%| | 115/12384 [14:49<26:01:00, 7.63s/it, loss=11.3700, acc=0.0006, iter_time=10.94s]
Epoch 0: 1%| | 116/12384 [14:49<26:23:31, 7.74s/it, loss=11.3700, acc=0.0006, iter_time=10.94s]
Epoch 0: 1%| | 116/12384 [14:57<26:23:31, 7.74s/it, loss=10.0672, acc=0.0009, iter_time=8.01s]
Epoch 0: 1%| | 117/12384 [14:57<26:14:58, 7.70s/it, loss=10.0672, acc=0.0009, iter_time=8.01s]
Epoch 0: 1%| | 117/12384 [15:04<26:14:58, 7.70s/it, loss=10.2974, acc=0.0002, iter_time=7.60s]
Epoch 0: 1%| | 118/12384 [15:04<26:12:54, 7.69s/it, loss=10.2974, acc=0.0002, iter_time=7.60s]
Epoch 0: 1%| | 118/12384 [15:12<26:12:54, 7.69s/it, loss=11.7279, acc=0.0002, iter_time=6.46s]
Epoch 0: 1%| | 119/12384 [15:12<26:11:26, 7.69s/it, loss=11.7279, acc=0.0002, iter_time=6.46s]
Epoch 0: 1%| | 119/12384 [15:20<26:11:26, 7.69s/it, loss=9.5479, acc=0.0020, iter_time=9.27s]
Epoch 0: 1%| | 120/12384 [15:20<26:11:33, 7.69s/it, loss=9.5479, acc=0.0020, iter_time=9.27s]
Epoch 0: 1%| | 120/12384 [15:27<26:11:33, 7.69s/it, loss=11.3597, acc=0.0003, iter_time=7.29s]
Epoch 0: 1%| | 121/12384 [15:27<26:06:25, 7.66s/it, loss=11.3597, acc=0.0003, iter_time=7.29s]
Epoch 0: 1%| | 121/12384 [15:35<26:06:25, 7.66s/it, loss=10.2827, acc=0.0015, iter_time=7.62s]
Epoch 0: 1%| | 122/12384 [15:35<26:04:38, 7.66s/it, loss=10.2827, acc=0.0015, iter_time=7.62s]
Epoch 0: 1%| | 122/12384 [15:43<26:04:38, 7.66s/it, loss=11.4825, acc=0.0000, iter_time=4.05s]
Epoch 0: 1%| | 123/12384 [15:43<26:01:14, 7.64s/it, loss=11.4825, acc=0.0000, iter_time=4.05s]
Epoch 0: 1%| | 123/12384 [15:50<26:01:14, 7.64s/it, loss=10.4938, acc=0.0008, iter_time=11.19s]
Epoch 0: 1%| | 124/12384 [15:50<26:02:12, 7.65s/it, loss=10.4938, acc=0.0008, iter_time=11.19s]
Epoch 0: 1%| | 124/12384 [15:58<26:02:12, 7.65s/it, loss=10.7784, acc=0.0002, iter_time=7.65s]
Epoch 0: 1%| | 125/12384 [15:58<25:59:50, 7.63s/it, loss=10.7784, acc=0.0002, iter_time=7.65s]
Epoch 0: 1%| | 125/12384 [16:06<25:59:50, 7.63s/it, loss=11.1809, acc=0.0004, iter_time=4.00s]
Epoch 0: 1%| | 126/12384 [16:06<26:03:43, 7.65s/it, loss=11.1809, acc=0.0004, iter_time=4.00s]
Epoch 0: 1%| | 126/12384 [16:13<26:03:43, 7.65s/it, loss=9.8621, acc=0.0010, iter_time=11.32s]
Epoch 0: 1%| | 127/12384 [16:13<26:04:01, 7.66s/it, loss=9.8621, acc=0.0010, iter_time=11.32s]
Epoch 0: 1%| | 127/12384 [16:21<26:04:01, 7.66s/it, loss=9.6572, acc=0.0019, iter_time=8.05s]
Epoch 0: 1%| | 128/12384 [16:21<26:03:51, 7.66s/it, loss=9.6572, acc=0.0019, iter_time=8.05s]
Epoch 0: 1%| | 128/12384 [16:29<26:03:51, 7.66s/it, loss=9.7301, acc=0.0003, iter_time=7.26s]
Epoch 0: 1%| | 129/12384 [16:29<26:03:13, 7.65s/it, loss=9.7301, acc=0.0003, iter_time=7.26s]
Epoch 0: 1%| | 129/12384 [16:36<26:03:13, 7.65s/it, loss=11.0160, acc=0.0008, iter_time=4.07s]
Epoch 0: 1%| | 130/12384 [16:36<26:01:29, 7.65s/it, loss=11.0160, acc=0.0008, iter_time=4.07s]
Epoch 0: 1%| | 130/12384 [16:44<26:01:29, 7.65s/it, loss=10.1317, acc=0.0012, iter_time=11.20s]
Epoch 0: 1%| | 131/12384 [16:44<25:58:40, 7.63s/it, loss=10.1317, acc=0.0012, iter_time=11.20s]
Epoch 0: 1%| | 131/12384 [16:51<25:58:40, 7.63s/it, loss=10.1372, acc=0.0007, iter_time=7.62s]
Epoch 0: 1%| | 132/12384 [16:51<25:58:53, 7.63s/it, loss=10.1372, acc=0.0007, iter_time=7.62s]
Epoch 0: 1%| | 132/12384 [16:59<25:58:53, 7.63s/it, loss=11.0534, acc=0.0004, iter_time=7.64s]
Epoch 0: 1%| | 133/12384 [16:59<25:57:38, 7.63s/it, loss=11.0534, acc=0.0004, iter_time=7.64s]
Epoch 0: 1%| | 133/12384 [17:07<25:57:38, 7.63s/it, loss=10.4665, acc=0.0001, iter_time=7.62s]
Epoch 0: 1%| | 134/12384 [17:07<25:57:10, 7.63s/it, loss=10.4665, acc=0.0001, iter_time=7.62s]
Epoch 0: 1%| | 134/12384 [17:14<25:57:10, 7.63s/it, loss=10.1935, acc=0.0002, iter_time=7.61s]
Epoch 0: 1%| | 135/12384 [17:14<25:57:13, 7.63s/it, loss=10.1935, acc=0.0002, iter_time=7.61s]
Epoch 0: 1%| | 135/12384 [17:22<25:57:13, 7.63s/it, loss=10.0622, acc=0.0014, iter_time=8.00s]
Epoch 0: 1%| | 136/12384 [17:22<25:55:40, 7.62s/it, loss=10.0622, acc=0.0014, iter_time=8.00s]
Epoch 0: 1%| | 136/12384 [17:30<25:55:40, 7.62s/it, loss=9.8737, acc=0.0004, iter_time=7.23s]
Epoch 0: 1%| | 137/12384 [17:30<25:55:40, 7.62s/it, loss=9.8737, acc=0.0004, iter_time=7.23s]
Epoch 0: 1%| | 137/12384 [17:37<25:55:40, 7.62s/it, loss=9.8373, acc=0.0002, iter_time=7.60s]
Epoch 0: 1%| | 138/12384 [17:37<25:57:43, 7.63s/it, loss=9.8373, acc=0.0002, iter_time=7.60s]
Epoch 0: 1%| | 138/12384 [17:45<25:57:43, 7.63s/it, loss=11.1797, acc=0.0004, iter_time=5.42s]
Epoch 0: 1%| | 139/12384 [17:45<25:57:27, 7.63s/it, loss=11.1797, acc=0.0004, iter_time=5.42s]
Epoch 0: 1%| | 139/12384 [17:52<25:57:27, 7.63s/it, loss=10.2283, acc=0.0009, iter_time=9.90s]
Epoch 0: 1%| | 140/12384 [17:52<25:57:42, 7.63s/it, loss=10.2283, acc=0.0009, iter_time=9.90s]
Epoch 0: 1%| | 140/12384 [18:00<25:57:42, 7.63s/it, loss=9.6406, acc=0.0007, iter_time=7.62s]
Epoch 0: 1%| | 141/12384 [18:00<25:56:35, 7.63s/it, loss=9.6406, acc=0.0007, iter_time=7.62s]
Epoch 0: 1%| | 141/12384 [18:08<25:56:35, 7.63s/it, loss=9.4581, acc=0.0005, iter_time=7.94s]
Epoch 0: 1%| | 142/12384 [18:08<26:15:45, 7.72s/it, loss=9.4581, acc=0.0005, iter_time=7.94s]
Epoch 0: 1%| | 142/12384 [18:16<26:15:45, 7.72s/it, loss=10.2313, acc=0.0004, iter_time=7.64s]
Epoch 0: 1%| | 143/12384 [18:16<26:10:37, 7.70s/it, loss=10.2313, acc=0.0004, iter_time=7.64s]
Epoch 0: 1%| | 143/12384 [18:23<26:10:37, 7.70s/it, loss=10.6638, acc=0.0008, iter_time=8.01s]
Epoch 0: 1%| | 144/12384 [18:23<26:04:59, 7.67s/it, loss=10.6638, acc=0.0008, iter_time=8.01s]
Epoch 0: 1%| | 144/12384 [18:31<26:04:59, 7.67s/it, loss=10.3811, acc=0.0003, iter_time=5.72s]
Epoch 0: 1%| | 145/12384 [18:31<26:04:45, 7.67s/it, loss=10.3811, acc=0.0003, iter_time=5.72s]
Epoch 0: 1%| | 145/12384 [18:39<26:04:45, 7.67s/it, loss=10.4208, acc=0.0005, iter_time=7.06s]
Epoch 0: 1%| | 146/12384 [18:39<26:03:27, 7.67s/it, loss=10.4208, acc=0.0005, iter_time=7.06s]
Epoch 0: 1%| | 146/12384 [18:46<26:03:27, 7.67s/it, loss=10.2973, acc=0.0005, iter_time=9.76s]
Epoch 0: 1%| | 147/12384 [18:46<26:03:35, 7.67s/it, loss=10.2973, acc=0.0005, iter_time=9.76s]
Epoch 0: 1%| | 147/12384 [18:54<26:03:35, 7.67s/it, loss=10.8811, acc=0.0005, iter_time=5.57s]
Epoch 0: 1%| | 148/12384 [18:54<26:01:39, 7.66s/it, loss=10.8811, acc=0.0005, iter_time=5.57s]
Epoch 0: 1%| | 148/12384 [19:02<26:01:39, 7.66s/it, loss=9.8736, acc=0.0004, iter_time=9.75s]
Epoch 0: 1%| | 149/12384 [19:02<26:01:06, 7.66s/it, loss=9.8736, acc=0.0004, iter_time=9.75s]
Epoch 0: 1%| | 149/12384 [19:09<26:01:06, 7.66s/it, loss=9.4176, acc=0.0008, iter_time=8.07s]
Epoch 0: 1%| | 150/12384 [19:09<25:59:58, 7.65s/it, loss=9.4176, acc=0.0008, iter_time=8.07s]
Epoch 0: 1%| | 150/12384 [19:17<25:59:58, 7.65s/it, loss=9.5935, acc=0.0012, iter_time=7.24s]
Epoch 0: 1%| | 151/12384 [19:17<26:00:40, 7.65s/it, loss=9.5935, acc=0.0012, iter_time=7.24s]
Epoch 0: 1%| | 151/12384 [19:24<26:00:40, 7.65s/it, loss=10.0799, acc=0.0001, iter_time=8.03s]
Epoch 0: 1%| | 152/12384 [19:24<25:57:28, 7.64s/it, loss=10.0799, acc=0.0001, iter_time=8.03s]
Epoch 0: 1%| | 152/12384 [19:32<25:57:28, 7.64s/it, loss=10.7032, acc=0.0000, iter_time=5.11s]
Epoch 0: 1%| | 153/12384 [19:32<25:58:43, 7.65s/it, loss=10.7032, acc=0.0000, iter_time=5.11s]
Epoch 0: 1%| | 153/12384 [19:40<25:58:43, 7.65s/it, loss=11.3994, acc=0.0005, iter_time=7.22s]
Epoch 0: 1%| | 154/12384 [19:40<25:57:32, 7.64s/it, loss=11.3994, acc=0.0005, iter_time=7.22s]
Epoch 0: 1%| | 154/12384 [19:47<25:57:32, 7.64s/it, loss=9.8630, acc=0.0006, iter_time=9.57s]
Epoch 0: 1%|▏ | 155/12384 [19:47<25:57:18, 7.64s/it, loss=9.8630, acc=0.0006, iter_time=9.57s]
Epoch 0: 1%|▏ | 155/12384 [19:55<25:57:18, 7.64s/it, loss=9.9163, acc=0.0012, iter_time=4.86s]
Epoch 0: 1%|▏ | 156/12384 [19:55<25:54:38, 7.63s/it, loss=9.9163, acc=0.0012, iter_time=4.86s]
Epoch 0: 1%|▏ | 156/12384 [20:03<25:54:38, 7.63s/it, loss=10.2178, acc=0.0009, iter_time=10.06s]
Epoch 0: 1%|▏ | 157/12384 [20:03<25:54:09, 7.63s/it, loss=10.2178, acc=0.0009, iter_time=10.06s]
Epoch 0: 1%|▏ | 157/12384 [20:10<25:54:09, 7.63s/it, loss=8.8109, acc=0.0006, iter_time=8.55s]
Epoch 0: 1%|▏ | 158/12384 [20:10<25:54:06, 7.63s/it, loss=8.8109, acc=0.0006, iter_time=8.55s]
Epoch 0: 1%|▏ | 158/12384 [20:18<25:54:06, 7.63s/it, loss=9.9846, acc=0.0005, iter_time=7.64s]
Epoch 0: 1%|▏ | 159/12384 [20:18<25:54:16, 7.63s/it, loss=9.9846, acc=0.0005, iter_time=7.64s]
Epoch 0: 1%|▏ | 159/12384 [20:26<25:54:16, 7.63s/it, loss=10.0358, acc=0.0004, iter_time=8.01s]
Epoch 0: 1%|▏ | 160/12384 [20:26<25:54:33, 7.63s/it, loss=10.0358, acc=0.0004, iter_time=8.01s]
Epoch 0: 1%|▏ | 160/12384 [20:33<25:54:33, 7.63s/it, loss=10.1687, acc=0.0002, iter_time=4.45s]
Epoch 0: 1%|▏ | 161/12384 [20:33<25:56:01, 7.64s/it, loss=10.1687, acc=0.0002, iter_time=4.45s]
Epoch 0: 1%|▏ | 161/12384 [20:41<25:56:01, 7.64s/it, loss=9.5081, acc=0.0001, iter_time=9.61s]
Epoch 0: 1%|▏ | 162/12384 [20:41<25:55:16, 7.64s/it, loss=9.5081, acc=0.0001, iter_time=9.61s]
Epoch 0: 1%|▏ | 162/12384 [20:48<25:55:16, 7.64s/it, loss=10.1441, acc=0.0009, iter_time=8.48s]
Epoch 0: 1%|▏ | 163/12384 [20:48<25:54:59, 7.63s/it, loss=10.1441, acc=0.0009, iter_time=8.48s]
Epoch 0: 1%|▏ | 163/12384 [20:56<25:54:59, 7.63s/it, loss=9.8535, acc=0.0006, iter_time=5.60s]
Epoch 0: 1%|▏ | 164/12384 [20:56<25:56:47, 7.64s/it, loss=9.8535, acc=0.0006, iter_time=5.60s]
Epoch 0: 1%|▏ | 164/12384 [21:04<25:56:47, 7.64s/it, loss=9.5386, acc=0.0011, iter_time=8.18s]
Epoch 0: 1%|▏ | 165/12384 [21:04<25:54:40, 7.63s/it, loss=9.5386, acc=0.0011, iter_time=8.18s]
Epoch 0: 1%|▏ | 165/12384 [21:11<25:54:40, 7.63s/it, loss=10.1718, acc=0.0001, iter_time=7.61s]
Epoch 0: 1%|▏ | 166/12384 [21:11<25:54:19, 7.63s/it, loss=10.1718, acc=0.0001, iter_time=7.61s]
Epoch 0: 1%|▏ | 166/12384 [21:19<25:54:19, 7.63s/it, loss=9.0794, acc=0.0002, iter_time=9.46s]
Epoch 0: 1%|▏ | 167/12384 [21:19<26:16:06, 7.74s/it, loss=9.0794, acc=0.0002, iter_time=9.46s]
Epoch 0: 1%|▏ | 167/12384 [21:27<26:16:06, 7.74s/it, loss=10.0714, acc=0.0000, iter_time=7.65s]
Epoch 0: 1%|▏ | 168/12384 [21:27<26:09:28, 7.71s/it, loss=10.0714, acc=0.0000, iter_time=7.65s]
Epoch 0: 1%|▏ | 168/12384 [21:35<26:09:28, 7.71s/it, loss=9.7891, acc=0.0004, iter_time=4.80s]
Epoch 0: 1%|▏ | 169/12384 [21:35<26:03:41, 7.68s/it, loss=9.7891, acc=0.0004, iter_time=4.80s]
Epoch 0: 1%|▏ | 169/12384 [21:42<26:03:41, 7.68s/it, loss=11.7103, acc=0.0006, iter_time=7.71s]
Epoch 0: 1%|▏ | 170/12384 [21:42<26:02:47, 7.68s/it, loss=11.7103, acc=0.0006, iter_time=7.71s]
Epoch 0: 1%|▏ | 170/12384 [21:50<26:02:47, 7.68s/it, loss=9.3130, acc=0.0011, iter_time=10.46s]
Epoch 0: 1%|▏ | 171/12384 [21:50<26:03:50, 7.68s/it, loss=9.3130, acc=0.0011, iter_time=10.46s]
Epoch 0: 1%|▏ | 171/12384 [21:58<26:03:50, 7.68s/it, loss=9.5550, acc=0.0006, iter_time=7.13s]
Epoch 0: 1%|▏ | 172/12384 [21:58<26:04:05, 7.68s/it, loss=9.5550, acc=0.0006, iter_time=7.13s]
Epoch 0: 1%|▏ | 172/12384 [22:05<26:04:05, 7.68s/it, loss=8.9668, acc=0.0003, iter_time=8.24s]
Epoch 0: 1%|▏ | 173/12384 [22:05<26:01:45, 7.67s/it, loss=8.9668, acc=0.0003, iter_time=8.24s]
Epoch 0: 1%|▏ | 173/12384 [22:13<26:01:45, 7.67s/it, loss=11.1200, acc=0.0010, iter_time=6.44s]
Epoch 0: 1%|▏ | 174/12384 [22:13<26:01:11, 7.67s/it, loss=11.1200, acc=0.0010, iter_time=6.44s]
Epoch 0: 1%|▏ | 174/12384 [22:21<26:01:11, 7.67s/it, loss=9.4657, acc=0.0002, iter_time=7.11s]
Epoch 0: 1%|▏ | 175/12384 [22:21<25:58:09, 7.66s/it, loss=9.4657, acc=0.0002, iter_time=7.11s]
Epoch 0: 1%|▏ | 175/12384 [22:28<25:58:09, 7.66s/it, loss=9.2463, acc=0.0005, iter_time=9.79s]
Epoch 0: 1%|▏ | 176/12384 [22:28<25:56:57, 7.65s/it, loss=9.2463, acc=0.0005, iter_time=9.79s]
Epoch 0: 1%|▏ | 176/12384 [22:36<25:56:57, 7.65s/it, loss=9.1595, acc=0.0007, iter_time=7.24s]
Epoch 0: 1%|▏ | 177/12384 [22:36<25:54:34, 7.64s/it, loss=9.1595, acc=0.0007, iter_time=7.24s]
Epoch 0: 1%|▏ | 177/12384 [22:43<25:54:34, 7.64s/it, loss=9.4691, acc=0.0010, iter_time=5.81s]
Epoch 0: 1%|▏ | 178/12384 [22:43<25:51:50, 7.63s/it, loss=9.4691, acc=0.0010, iter_time=5.81s]
Epoch 0: 1%|▏ | 178/12384 [22:51<25:51:50, 7.63s/it, loss=9.2089, acc=0.0009, iter_time=9.41s]
Epoch 0: 1%|▏ | 179/12384 [22:51<25:54:16, 7.64s/it, loss=9.2089, acc=0.0009, iter_time=9.41s]
Epoch 0: 1%|▏ | 179/12384 [22:59<25:54:16, 7.64s/it, loss=9.3071, acc=0.0003, iter_time=7.67s]
Epoch 0: 1%|▏ | 180/12384 [22:59<25:52:58, 7.64s/it, loss=9.3071, acc=0.0003, iter_time=7.67s]
Epoch 0: 1%|▏ | 180/12384 [23:06<25:52:58, 7.64s/it, loss=9.2088, acc=0.0019, iter_time=7.62s]
Epoch 0: 1%|▏ | 181/12384 [23:06<25:53:54, 7.64s/it, loss=9.2088, acc=0.0019, iter_time=7.62s]
Epoch 0: 1%|▏ | 181/12384 [23:14<25:53:54, 7.64s/it, loss=9.0347, acc=0.0000, iter_time=5.58s]
Epoch 0: 1%|▏ | 182/12384 [23:14<25:53:41, 7.64s/it, loss=9.0347, acc=0.0000, iter_time=5.58s]
Epoch 0: 1%|▏ | 182/12384 [23:22<25:53:41, 7.64s/it, loss=8.9288, acc=0.0003, iter_time=7.97s]
Epoch 0: 1%|▏ | 183/12384 [23:22<25:55:01, 7.65s/it, loss=8.9288, acc=0.0003, iter_time=7.97s]
Epoch 0: 1%|▏ | 183/12384 [23:29<25:55:01, 7.65s/it, loss=9.0327, acc=0.0004, iter_time=9.80s]
Epoch 0: 1%|▏ | 184/12384 [23:29<25:55:15, 7.65s/it, loss=9.0327, acc=0.0004, iter_time=9.80s]
Epoch 0: 1%|▏ | 184/12384 [23:37<25:55:15, 7.65s/it, loss=9.1654, acc=0.0003, iter_time=7.26s]
Epoch 0: 1%|▏ | 185/12384 [23:37<25:55:05, 7.65s/it, loss=9.1654, acc=0.0003, iter_time=7.26s]
Epoch 0: 1%|▏ | 185/12384 [23:45<25:55:05, 7.65s/it, loss=8.8745, acc=0.0000, iter_time=4.37s]
Epoch 0: 2%|▏ | 186/12384 [23:45<25:59:27, 7.67s/it, loss=8.8745, acc=0.0000, iter_time=4.37s]
Epoch 0: 2%|▏ | 186/12384 [23:52<25:59:27, 7.67s/it, loss=8.9560, acc=0.0007, iter_time=11.00s]
Epoch 0: 2%|▏ | 187/12384 [23:52<25:56:24, 7.66s/it, loss=8.9560, acc=0.0007, iter_time=11.00s]
Epoch 0: 2%|▏ | 187/12384 [24:00<25:56:24, 7.66s/it, loss=8.7837, acc=0.0015, iter_time=7.64s]
Epoch 0: 2%|▏ | 188/12384 [24:00<25:59:04, 7.67s/it, loss=8.7837, acc=0.0015, iter_time=7.64s]
Epoch 0: 2%|▏ | 188/12384 [24:08<25:59:04, 7.67s/it, loss=9.0256, acc=0.0023, iter_time=5.96s]
Epoch 0: 2%|▏ | 189/12384 [24:08<25:57:07, 7.66s/it, loss=9.0256, acc=0.0023, iter_time=5.96s]
Epoch 0: 2%|▏ | 189/12384 [24:15<25:57:07, 7.66s/it, loss=9.4618, acc=0.0007, iter_time=9.04s]
Epoch 0: 2%|▏ | 190/12384 [24:15<25:56:23, 7.66s/it, loss=9.4618, acc=0.0007, iter_time=9.04s]
Epoch 0: 2%|▏ | 190/12384 [24:23<25:56:23, 7.66s/it, loss=8.8491, acc=0.0006, iter_time=7.97s]
Epoch 0: 2%|▏ | 191/12384 [24:23<25:54:09, 7.65s/it, loss=8.8491, acc=0.0006, iter_time=7.97s]
Epoch 0: 2%|▏ | 191/12384 [24:31<25:54:09, 7.65s/it, loss=9.3567, acc=0.0000, iter_time=7.60s]
Epoch 0: 2%|▏ | 192/12384 [24:31<25:54:00, 7.65s/it, loss=9.3567, acc=0.0000, iter_time=7.60s]
Epoch 0: 2%|▏ | 192/12384 [24:39<25:54:00, 7.65s/it, loss=8.7066, acc=0.0010, iter_time=7.97s]
Epoch 0: 2%|▏ | 193/12384 [24:39<26:13:47, 7.75s/it, loss=8.7066, acc=0.0010, iter_time=7.97s]
Epoch 0: 2%|▏ | 193/12384 [24:46<26:13:47, 7.75s/it, loss=9.0475, acc=0.0007, iter_time=7.68s]
Epoch 0: 2%|▏ | 194/12384 [24:46<26:08:06, 7.72s/it, loss=9.0475, acc=0.0007, iter_time=7.68s]
Epoch 0: 2%|▏ | 194/12384 [24:54<26:08:06, 7.72s/it, loss=9.0842, acc=0.0005, iter_time=5.57s]
Epoch 0: 2%|▏ | 195/12384 [24:54<26:03:40, 7.70s/it, loss=9.0842, acc=0.0005, iter_time=5.57s]
Epoch 0: 2%|▏ | 195/12384 [25:01<26:03:40, 7.70s/it, loss=8.1855, acc=0.0004, iter_time=9.71s]
Epoch 0: 2%|▏ | 196/12384 [25:01<25:59:19, 7.68s/it, loss=8.1855, acc=0.0004, iter_time=9.71s]
Epoch 0: 2%|▏ | 196/12384 [25:09<25:59:19, 7.68s/it, loss=8.0778, acc=0.0012, iter_time=7.63s]
Epoch 0: 2%|▏ | 197/12384 [25:09<25:55:00, 7.66s/it, loss=8.0778, acc=0.0012, iter_time=7.63s]
Epoch 0: 2%|▏ | 197/12384 [25:17<25:55:00, 7.66s/it, loss=8.8967, acc=0.0010, iter_time=7.35s]
Epoch 0: 2%|▏ | 198/12384 [25:17<25:59:45, 7.68s/it, loss=8.8967, acc=0.0010, iter_time=7.35s]
Epoch 0: 2%|▏ | 198/12384 [25:24<25:59:45, 7.68s/it, loss=9.0389, acc=0.0004, iter_time=7.99s]
Epoch 0: 2%|▏ | 199/12384 [25:24<25:55:17, 7.66s/it, loss=9.0389, acc=0.0004, iter_time=7.99s]
Epoch 0: 2%|▏ | 199/12384 [25:32<25:55:17, 7.66s/it, loss=9.1124, acc=0.0009, iter_time=8.07s]
Epoch 0: 2%|▏ | 200/12384 [25:32<25:55:07, 7.66s/it, loss=9.1124, acc=0.0009, iter_time=8.07s]
Epoch 0: 2%|▏ | 200/12384 [25:40<25:55:07, 7.66s/it, loss=8.4466, acc=0.0007, iter_time=6.24s]
Epoch 0: 2%|▏ | 201/12384 [25:40<25:53:28, 7.65s/it, loss=8.4466, acc=0.0007, iter_time=6.24s]
Epoch 0: 2%|▏ | 201/12384 [25:47<25:53:28, 7.65s/it, loss=8.7056, acc=0.0011, iter_time=8.61s]
Epoch 0: 2%|▏ | 202/12384 [25:47<25:52:45, 7.65s/it, loss=8.7056, acc=0.0011, iter_time=8.61s]
Epoch 0: 2%|▏ | 202/12384 [25:55<25:52:45, 7.65s/it, loss=8.5991, acc=0.0011, iter_time=7.66s]
Epoch 0: 2%|▏ | 203/12384 [25:55<25:51:32, 7.64s/it, loss=8.5991, acc=0.0011, iter_time=7.66s]
Epoch 0: 2%|▏ | 203/12384 [26:03<25:51:32, 7.64s/it, loss=8.7091, acc=0.0012, iter_time=7.30s]
Epoch 0: 2%|▏ | 204/12384 [26:03<25:49:56, 7.64s/it, loss=8.7091, acc=0.0012, iter_time=7.30s]
Epoch 0: 2%|▏ | 204/12384 [26:10<25:49:56, 7.64s/it, loss=8.7888, acc=0.0019, iter_time=7.01s]
Epoch 0: 2%|▏ | 205/12384 [26:10<25:52:18, 7.65s/it, loss=8.7888, acc=0.0019, iter_time=7.01s]
Epoch 0: 2%|▏ | 205/12384 [26:18<25:52:18, 7.65s/it, loss=9.4526, acc=0.0002, iter_time=5.57s]
Epoch 0: 2%|▏ | 206/12384 [26:18<25:52:19, 7.65s/it, loss=9.4526, acc=0.0002, iter_time=5.57s]
Epoch 0: 2%|▏ | 206/12384 [26:26<25:52:19, 7.65s/it, loss=8.4342, acc=0.0012, iter_time=10.67s]
Epoch 0: 2%|▏ | 207/12384 [26:26<25:50:36, 7.64s/it, loss=8.4342, acc=0.0012, iter_time=10.67s]
Epoch 0: 2%|▏ | 207/12384 [26:33<25:50:36, 7.64s/it, loss=8.3416, acc=0.0008, iter_time=7.58s]
Epoch 0: 2%|▏ | 208/12384 [26:33<25:48:59, 7.63s/it, loss=8.3416, acc=0.0008, iter_time=7.58s]
Epoch 0: 2%|▏ | 208/12384 [26:41<25:48:59, 7.63s/it, loss=8.3990, acc=0.0019, iter_time=5.93s]
Epoch 0: 2%|▏ | 209/12384 [26:41<25:47:45, 7.63s/it, loss=8.3990, acc=0.0019, iter_time=5.93s]
Epoch 0: 2%|▏ | 209/12384 [26:48<25:47:45, 7.63s/it, loss=8.1943, acc=0.0015, iter_time=6.07s]
Epoch 0: 2%|▏ | 210/12384 [26:48<25:47:02, 7.62s/it, loss=8.1943, acc=0.0015, iter_time=6.07s]
Epoch 0: 2%|▏ | 210/12384 [26:56<25:47:02, 7.62s/it, loss=8.5613, acc=0.0008, iter_time=10.91s]
Epoch 0: 2%|▏ | 211/12384 [26:56<25:49:23, 7.64s/it, loss=8.5613, acc=0.0008, iter_time=10.91s]
Epoch 0: 2%|▏ | 211/12384 [27:04<25:49:23, 7.64s/it, loss=8.1708, acc=0.0016, iter_time=7.68s]
Epoch 0: 2%|▏ | 212/12384 [27:04<25:50:05, 7.64s/it, loss=8.1708, acc=0.0016, iter_time=7.68s]
Epoch 0: 2%|▏ | 212/12384 [27:11<25:50:05, 7.64s/it, loss=8.1459, acc=0.0007, iter_time=7.64s]
Epoch 0: 2%|▏ | 213/12384 [27:11<25:48:42, 7.63s/it, loss=8.1459, acc=0.0007, iter_time=7.64s]
Epoch 0: 2%|▏ | 213/12384 [27:19<25:48:42, 7.63s/it, loss=8.5384, acc=0.0014, iter_time=4.30s]
Epoch 0: 2%|▏ | 214/12384 [27:19<25:48:03, 7.63s/it, loss=8.5384, acc=0.0014, iter_time=4.30s]
Epoch 0: 2%|▏ | 214/12384 [27:27<25:48:03, 7.63s/it, loss=8.1967, acc=0.0009, iter_time=10.94s]
Epoch 0: 2%|▏ | 215/12384 [27:27<25:47:52, 7.63s/it, loss=8.1967, acc=0.0009, iter_time=10.94s]
Epoch 0: 2%|▏ | 215/12384 [27:34<25:47:52, 7.63s/it, loss=9.2198, acc=0.0004, iter_time=7.59s]
Epoch 0: 2%|▏ | 216/12384 [27:34<25:46:40, 7.63s/it, loss=9.2198, acc=0.0004, iter_time=7.59s]
Epoch 0: 2%|▏ | 216/12384 [27:42<25:46:40, 7.63s/it, loss=8.2690, acc=0.0009, iter_time=4.80s]
Epoch 0: 2%|▏ | 217/12384 [27:42<25:47:47, 7.63s/it, loss=8.2690, acc=0.0009, iter_time=4.80s]
Epoch 0: 2%|▏ | 217/12384 [27:50<25:47:47, 7.63s/it, loss=7.8197, acc=0.0006, iter_time=8.26s]
Epoch 0: 2%|▏ | 218/12384 [27:50<25:50:16, 7.65s/it, loss=7.8197, acc=0.0006, iter_time=8.26s]
Epoch 0: 2%|▏ | 218/12384 [27:58<25:50:16, 7.65s/it, loss=8.0925, acc=0.0007, iter_time=10.22s]
Epoch 0: 2%|▏ | 219/12384 [27:58<26:11:49, 7.75s/it, loss=8.0925, acc=0.0007, iter_time=10.22s]
Epoch 0: 2%|▏ | 219/12384 [28:05<26:11:49, 7.75s/it, loss=8.1300, acc=0.0019, iter_time=7.70s]
Epoch 0: 2%|▏ | 220/12384 [28:05<26:02:22, 7.71s/it, loss=8.1300, acc=0.0019, iter_time=7.70s]
Epoch 0: 2%|▏ | 220/12384 [28:13<26:02:22, 7.71s/it, loss=7.9561, acc=0.0015, iter_time=7.61s]
Epoch 0: 2%|▏ | 221/12384 [28:13<25:56:33, 7.68s/it, loss=7.9561, acc=0.0015, iter_time=7.61s]
Epoch 0: 2%|▏ | 221/12384 [28:20<25:56:33, 7.68s/it, loss=8.0051, acc=0.0010, iter_time=7.60s]
Epoch 0: 2%|▏ | 222/12384 [28:20<25:55:49, 7.68s/it, loss=8.0051, acc=0.0010, iter_time=7.60s]
Epoch 0: 2%|▏ | 222/12384 [28:28<25:55:49, 7.68s/it, loss=8.2760, acc=0.0003, iter_time=7.68s]
Epoch 0: 2%|▏ | 223/12384 [28:28<25:54:58, 7.67s/it, loss=8.2760, acc=0.0003, iter_time=7.68s]
Epoch 0: 2%|▏ | 223/12384 [28:36<25:54:58, 7.67s/it, loss=8.1733, acc=0.0003, iter_time=8.06s]
Epoch 0: 2%|▏ | 224/12384 [28:36<25:54:30, 7.67s/it, loss=8.1733, acc=0.0003, iter_time=8.06s]
Epoch 0: 2%|▏ | 224/12384 [28:43<25:54:30, 7.67s/it, loss=8.0470, acc=0.0007, iter_time=7.27s]
Epoch 0: 2%|▏ | 225/12384 [28:43<25:50:46, 7.65s/it, loss=8.0470, acc=0.0007, iter_time=7.27s]
Epoch 0: 2%|▏ | 225/12384 [28:51<25:50:46, 7.65s/it, loss=7.5724, acc=0.0013, iter_time=7.62s]
Epoch 0: 2%|▏ | 226/12384 [28:51<25:48:04, 7.64s/it, loss=7.5724, acc=0.0013, iter_time=7.62s]
Epoch 0: 2%|▏ | 226/12384 [28:59<25:48:04, 7.64s/it, loss=8.4081, acc=0.0011, iter_time=6.12s]
Epoch 0: 2%|▏ | 227/12384 [28:59<25:48:26, 7.64s/it, loss=8.4081, acc=0.0011, iter_time=6.12s]
Epoch 0: 2%|▏ | 227/12384 [29:06<25:48:26, 7.64s/it, loss=8.6103, acc=0.0008, iter_time=9.11s]
Epoch 0: 2%|▏ | 228/12384 [29:06<25:46:50, 7.63s/it, loss=8.6103, acc=0.0008, iter_time=9.11s]
Epoch 0: 2%|▏ | 228/12384 [29:14<25:46:50, 7.63s/it, loss=7.8253, acc=0.0011, iter_time=7.64s]
Epoch 0: 2%|▏ | 229/12384 [29:14<25:47:33, 7.64s/it, loss=7.8253, acc=0.0011, iter_time=7.64s]
Epoch 0: 2%|▏ | 229/12384 [29:21<25:47:33, 7.64s/it, loss=8.3221, acc=0.0004, iter_time=7.64s]
Epoch 0: 2%|▏ | 230/12384 [29:21<25:45:26, 7.63s/it, loss=8.3221, acc=0.0004, iter_time=7.64s]
Epoch 0: 2%|▏ | 230/12384 [29:29<25:45:26, 7.63s/it, loss=7.7024, acc=0.0009, iter_time=7.58s]
Epoch 0: 2%|▏ | 231/12384 [29:29<25:44:38, 7.63s/it, loss=7.7024, acc=0.0009, iter_time=7.58s]
Epoch 0: 2%|▏ | 231/12384 [29:37<25:44:38, 7.63s/it, loss=7.7472, acc=0.0008, iter_time=8.02s]
Epoch 0: 2%|▏ | 232/12384 [29:37<25:47:42, 7.64s/it, loss=7.7472, acc=0.0008, iter_time=8.02s]
Epoch 0: 2%|▏ | 232/12384 [29:44<25:47:42, 7.64s/it, loss=7.7262, acc=0.0011, iter_time=7.31s]
Epoch 0: 2%|▏ | 233/12384 [29:44<25:48:58, 7.65s/it, loss=7.7262, acc=0.0011, iter_time=7.31s]
Epoch 0: 2%|▏ | 233/12384 [29:52<25:48:58, 7.65s/it, loss=7.4931, acc=0.0028, iter_time=7.41s]
Epoch 0: 2%|▏ | 234/12384 [29:52<25:50:21, 7.66s/it, loss=7.4931, acc=0.0028, iter_time=7.41s]
Epoch 0: 2%|▏ | 234/12384 [30:00<25:50:21, 7.66s/it, loss=7.4022, acc=0.0014, iter_time=7.93s]
Epoch 0: 2%|▏ | 235/12384 [30:00<25:48:15, 7.65s/it, loss=7.4022, acc=0.0014, iter_time=7.93s]
Epoch 0: 2%|▏ | 235/12384 [30:07<25:48:15, 7.65s/it, loss=7.7223, acc=0.0014, iter_time=7.59s]
Epoch 0: 2%|▏ | 236/12384 [30:07<25:45:43, 7.63s/it, loss=7.7223, acc=0.0014, iter_time=7.59s]
Epoch 0: 2%|▏ | 236/12384 [30:15<25:45:43, 7.63s/it, loss=7.8947, acc=0.0015, iter_time=4.31s]
Epoch 0: 2%|▏ | 237/12384 [30:15<25:46:15, 7.64s/it, loss=7.8947, acc=0.0015, iter_time=4.31s]
Epoch 0: 2%|▏ | 237/12384 [30:23<25:46:15, 7.64s/it, loss=7.7654, acc=0.0010, iter_time=9.74s]
Epoch 0: 2%|▏ | 238/12384 [30:23<25:47:31, 7.64s/it, loss=7.7654, acc=0.0010, iter_time=9.74s]
Epoch 0: 2%|▏ | 238/12384 [30:30<25:47:31, 7.64s/it, loss=7.4437, acc=0.0005, iter_time=8.88s]
Epoch 0: 2%|▏ | 239/12384 [30:30<25:47:04, 7.64s/it, loss=7.4437, acc=0.0005, iter_time=8.88s]
Epoch 0: 2%|▏ | 239/12384 [30:38<25:47:04, 7.64s/it, loss=7.7818, acc=0.0017, iter_time=7.71s]
Epoch 0: 2%|▏ | 240/12384 [30:38<25:47:28, 7.65s/it, loss=7.7818, acc=0.0017, iter_time=7.71s]
Epoch 0: 2%|▏ | 240/12384 [30:46<25:47:28, 7.65s/it, loss=7.3091, acc=0.0018, iter_time=7.57s]
Epoch 0: 2%|▏ | 241/12384 [30:46<25:48:50, 7.65s/it, loss=7.3091, acc=0.0018, iter_time=7.57s]
Epoch 0: 2%|▏ | 241/12384 [30:53<25:48:50, 7.65s/it, loss=7.3295, acc=0.0004, iter_time=7.66s]
Epoch 0: 2%|▏ | 242/12384 [30:53<25:47:11, 7.65s/it, loss=7.3295, acc=0.0004, iter_time=7.66s]
Epoch 0: 2%|▏ | 242/12384 [31:01<25:47:11, 7.65s/it, loss=7.2502, acc=0.0021, iter_time=5.10s]
Epoch 0: 2%|▏ | 243/12384 [31:01<25:47:23, 7.65s/it, loss=7.2502, acc=0.0021, iter_time=5.10s]
Epoch 0: 2%|▏ | 243/12384 [31:09<25:47:23, 7.65s/it, loss=7.8696, acc=0.0010, iter_time=10.20s]
Epoch 0: 2%|▏ | 244/12384 [31:09<25:45:32, 7.64s/it, loss=7.8696, acc=0.0010, iter_time=10.20s]
Epoch 0: 2%|▏ | 244/12384 [31:16<25:45:32, 7.64s/it, loss=7.1887, acc=0.0007, iter_time=6.46s]
Epoch 0: 2%|▏ | 245/12384 [31:16<26:04:58, 7.74s/it, loss=7.1887, acc=0.0007, iter_time=6.46s]
Epoch 0: 2%|▏ | 245/12384 [31:24<26:04:58, 7.74s/it, loss=7.3708, acc=0.0018, iter_time=9.11s]
Epoch 0: 2%|▏ | 246/12384 [31:24<26:00:05, 7.71s/it, loss=7.3708, acc=0.0018, iter_time=9.11s]
Epoch 0: 2%|▏ | 246/12384 [31:32<26:00:05, 7.71s/it, loss=7.8745, acc=0.0013, iter_time=7.66s]
Epoch 0: 2%|▏ | 247/12384 [31:32<25:56:15, 7.69s/it, loss=7.8745, acc=0.0013, iter_time=7.66s]
Epoch 0: 2%|▏ | 247/12384 [31:39<25:56:15, 7.69s/it, loss=7.2406, acc=0.0013, iter_time=7.64s]
Epoch 0: 2%|▏ | 248/12384 [31:39<25:54:27, 7.69s/it, loss=7.2406, acc=0.0013, iter_time=7.64s]
Epoch 0: 2%|▏ | 248/12384 [31:47<25:54:27, 7.69s/it, loss=7.3163, acc=0.0023, iter_time=7.34s]
Epoch 0: 2%|▏ | 249/12384 [31:47<25:50:08, 7.66s/it, loss=7.3163, acc=0.0023, iter_time=7.34s]
Epoch 0: 2%|▏ | 249/12384 [31:55<25:50:08, 7.66s/it, loss=7.6082, acc=0.0018, iter_time=8.41s]
Epoch 0: 2%|▏ | 250/12384 [31:55<25:51:22, 7.67s/it, loss=7.6082, acc=0.0018, iter_time=8.41s]
Epoch 0: 2%|▏ | 250/12384 [32:02<25:51:22, 7.67s/it, loss=7.2558, acc=0.0005, iter_time=7.23s]
Epoch 0: 2%|▏ | 251/12384 [32:02<25:50:15, 7.67s/it, loss=7.2558, acc=0.0005, iter_time=7.23s]
Epoch 0: 2%|▏ | 251/12384 [32:10<25:50:15, 7.67s/it, loss=7.6217, acc=0.0037, iter_time=7.64s]
Epoch 0: 2%|▏ | 252/12384 [32:10<25:50:25, 7.67s/it, loss=7.6217, acc=0.0037, iter_time=7.64s]
Epoch 0: 2%|▏ | 252/12384 [32:18<25:50:25, 7.67s/it, loss=7.3812, acc=0.0011, iter_time=7.77s]
Epoch 0: 2%|▏ | 253/12384 [32:18<25:52:09, 7.68s/it, loss=7.3812, acc=0.0011, iter_time=7.77s]
Epoch 0: 2%|▏ | 253/12384 [32:25<25:52:09, 7.68s/it, loss=7.3565, acc=0.0025, iter_time=7.60s]
Epoch 0: 2%|▏ | 254/12384 [32:25<25:48:52, 7.66s/it, loss=7.3565, acc=0.0025, iter_time=7.60s]
Epoch 0: 2%|▏ | 254/12384 [32:33<25:48:52, 7.66s/it, loss=7.2157, acc=0.0006, iter_time=7.65s]
Epoch 0: 2%|▏ | 255/12384 [32:33<25:48:10, 7.66s/it, loss=7.2157, acc=0.0006, iter_time=7.65s]
Epoch 0: 2%|▏ | 255/12384 [32:41<25:48:10, 7.66s/it, loss=7.7335, acc=0.0032, iter_time=8.03s]
Epoch 0: 2%|▏ | 256/12384 [32:41<25:47:10, 7.65s/it, loss=7.7335, acc=0.0032, iter_time=8.03s]
Epoch 0: 2%|▏ | 256/12384 [32:48<25:47:10, 7.65s/it, loss=7.2015, acc=0.0031, iter_time=7.33s]
Epoch 0: 2%|▏ | 257/12384 [32:48<25:50:04, 7.67s/it, loss=7.2015, acc=0.0031, iter_time=7.33s]
Epoch 0: 2%|▏ | 257/12384 [32:56<25:50:04, 7.67s/it, loss=7.1932, acc=0.0012, iter_time=4.10s]
Epoch 0: 2%|▏ | 258/12384 [32:56<25:47:00, 7.65s/it, loss=7.1932, acc=0.0012, iter_time=4.10s]
Epoch 0: 2%|▏ | 258/12384 [33:04<25:47:00, 7.65s/it, loss=7.2090, acc=0.0023, iter_time=8.53s]
Epoch 0: 2%|▏ | 259/12384 [33:04<25:48:05, 7.66s/it, loss=7.2090, acc=0.0023, iter_time=8.53s]
Epoch 0: 2%|▏ | 259/12384 [33:11<25:48:05, 7.66s/it, loss=7.0185, acc=0.0026, iter_time=8.88s]
Epoch 0: 2%|▏ | 260/12384 [33:11<25:45:49, 7.65s/it, loss=7.0185, acc=0.0026, iter_time=8.88s]
Epoch 0: 2%|▏ | 260/12384 [33:19<25:45:49, 7.65s/it, loss=6.9527, acc=0.0025, iter_time=9.03s]
Epoch 0: 2%|▏ | 261/12384 [33:19<25:45:03, 7.65s/it, loss=6.9527, acc=0.0025, iter_time=9.03s]
Epoch 0: 2%|▏ | 261/12384 [33:27<25:45:03, 7.65s/it, loss=7.0574, acc=0.0020, iter_time=7.67s]
Epoch 0: 2%|▏ | 262/12384 [33:27<25:45:16, 7.65s/it, loss=7.0574, acc=0.0020, iter_time=7.67s]
Epoch 0: 2%|▏ | 262/12384 [33:34<25:45:16, 7.65s/it, loss=7.2073, acc=0.0025, iter_time=7.63s]
Epoch 0: 2%|▏ | 263/12384 [33:34<25:48:03, 7.66s/it, loss=7.2073, acc=0.0025, iter_time=7.63s]
Epoch 0: 2%|▏ | 263/12384 [33:42<25:48:03, 7.66s/it, loss=7.3061, acc=0.0012, iter_time=8.09s]
Epoch 0: 2%|▏ | 264/12384 [33:42<25:44:58, 7.65s/it, loss=7.3061, acc=0.0012, iter_time=8.09s]
Epoch 0: 2%|▏ | 264/12384 [33:50<25:44:58, 7.65s/it, loss=7.0960, acc=0.0025, iter_time=7.21s]
Epoch 0: 2%|▏ | 265/12384 [33:50<25:46:19, 7.66s/it, loss=7.0960, acc=0.0025, iter_time=7.21s]
Epoch 0: 2%|▏ | 265/12384 [33:57<25:46:19, 7.66s/it, loss=6.9338, acc=0.0029, iter_time=5.62s]
Epoch 0: 2%|▏ | 266/12384 [33:57<25:46:25, 7.66s/it, loss=6.9338, acc=0.0029, iter_time=5.62s]
Epoch 0: 2%|▏ | 266/12384 [34:05<25:46:25, 7.66s/it, loss=6.8391, acc=0.0025, iter_time=9.73s]
Epoch 0: 2%|▏ | 267/12384 [34:05<25:43:47, 7.64s/it, loss=6.8391, acc=0.0025, iter_time=9.73s]
Epoch 0: 2%|▏ | 267/12384 [34:13<25:43:47, 7.64s/it, loss=7.1970, acc=0.0025, iter_time=5.53s]
Epoch 0: 2%|▏ | 268/12384 [34:13<25:42:40, 7.64s/it, loss=7.1970, acc=0.0025, iter_time=5.53s]
Epoch 0: 2%|▏ | 268/12384 [34:20<25:42:40, 7.64s/it, loss=7.0222, acc=0.0014, iter_time=7.73s]
Epoch 0: 2%|▏ | 269/12384 [34:20<25:41:18, 7.63s/it, loss=7.0222, acc=0.0014, iter_time=7.73s]
Epoch 0: 2%|▏ | 269/12384 [34:28<25:41:18, 7.63s/it, loss=6.9741, acc=0.0025, iter_time=9.60s]
Epoch 0: 2%|▏ | 270/12384 [34:28<25:42:21, 7.64s/it, loss=6.9741, acc=0.0025, iter_time=9.60s]
Epoch 0: 2%|▏ | 270/12384 [34:35<25:42:21, 7.64s/it, loss=7.2850, acc=0.0027, iter_time=7.68s]
Epoch 0: 2%|▏ | 271/12384 [34:35<25:45:43, 7.66s/it, loss=7.2850, acc=0.0027, iter_time=7.68s]
Epoch 0: 2%|▏ | 271/12384 [34:43<25:45:43, 7.66s/it, loss=7.3393, acc=0.0022, iter_time=8.00s]
Epoch 0: 2%|▏ | 272/12384 [34:43<26:05:41, 7.76s/it, loss=7.3393, acc=0.0022, iter_time=8.00s]
Epoch 0: 2%|▏ | 272/12384 [34:51<26:05:41, 7.76s/it, loss=6.7739, acc=0.0020, iter_time=7.68s]
Epoch 0: 2%|▏ | 273/12384 [34:51<25:58:03, 7.72s/it, loss=6.7739, acc=0.0020, iter_time=7.68s]
Epoch 0: 2%|▏ | 273/12384 [34:59<25:58:03, 7.72s/it, loss=6.9052, acc=0.0031, iter_time=7.63s]
Epoch 0: 2%|▏ | 274/12384 [34:59<25:52:15, 7.69s/it, loss=6.9052, acc=0.0031, iter_time=7.63s]
Epoch 0: 2%|▏ | 274/12384 [35:06<25:52:15, 7.69s/it, loss=6.9783, acc=0.0027, iter_time=7.61s]
Epoch 0: 2%|▏ | 275/12384 [35:06<25:47:34, 7.67s/it, loss=6.9783, acc=0.0027, iter_time=7.61s]
Epoch 0: 2%|▏ | 275/12384 [35:14<25:47:34, 7.67s/it, loss=7.3331, acc=0.0043, iter_time=7.61s]
Epoch 0: 2%|▏ | 276/12384 [35:14<25:45:53, 7.66s/it, loss=7.3331, acc=0.0043, iter_time=7.61s]
Epoch 0: 2%|▏ | 276/12384 [35:22<25:45:53, 7.66s/it, loss=6.9467, acc=0.0037, iter_time=7.65s]
Epoch 0: 2%|▏ | 277/12384 [35:22<25:43:51, 7.65s/it, loss=6.9467, acc=0.0037, iter_time=7.65s]
Epoch 0: 2%|▏ | 277/12384 [35:29<25:43:51, 7.65s/it, loss=6.8180, acc=0.0021, iter_time=7.61s]
Epoch 0: 2%|▏ | 278/12384 [35:29<25:43:24, 7.65s/it, loss=6.8180, acc=0.0021, iter_time=7.61s]
Epoch 0: 2%|▏ | 278/12384 [35:37<25:43:24, 7.65s/it, loss=6.8739, acc=0.0022, iter_time=7.66s]
Epoch 0: 2%|▏ | 279/12384 [35:37<25:43:12, 7.65s/it, loss=6.8739, acc=0.0022, iter_time=7.66s]
Epoch 0: 2%|▏ | 279/12384 [35:45<25:43:12, 7.65s/it, loss=7.0975, acc=0.0034, iter_time=7.73s]
Epoch 0: 2%|▏ | 280/12384 [35:45<25:40:40, 7.64s/it, loss=7.0975, acc=0.0034, iter_time=7.73s]
Epoch 0: 2%|▏ | 280/12384 [35:52<25:40:40, 7.64s/it, loss=7.0766, acc=0.0038, iter_time=7.50s]
Epoch 0: 2%|▏ | 281/12384 [35:52<25:40:49, 7.64s/it, loss=7.0766, acc=0.0038, iter_time=7.50s]
Epoch 0: 2%|▏ | 281/12384 [36:00<25:40:49, 7.64s/it, loss=6.6622, acc=0.0049, iter_time=7.04s]
Epoch 0: 2%|▏ | 282/12384 [36:00<25:38:44, 7.63s/it, loss=6.6622, acc=0.0049, iter_time=7.04s]
Epoch 0: 2%|▏ | 282/12384 [36:07<25:38:44, 7.63s/it, loss=7.0217, acc=0.0012, iter_time=5.96s]
Epoch 0: 2%|▏ | 283/12384 [36:07<25:41:08, 7.64s/it, loss=7.0217, acc=0.0012, iter_time=5.96s]
Epoch 0: 2%|▏ | 283/12384 [36:15<25:41:08, 7.64s/it, loss=6.9411, acc=0.0038, iter_time=9.92s]
Epoch 0: 2%|▏ | 284/12384 [36:15<25:38:59, 7.63s/it, loss=6.9411, acc=0.0038, iter_time=9.92s]
Epoch 0: 2%|▏ | 284/12384 [36:23<25:38:59, 7.63s/it, loss=7.3455, acc=0.0022, iter_time=7.63s]
Epoch 0: 2%|▏ | 285/12384 [36:23<25:38:43, 7.63s/it, loss=7.3455, acc=0.0022, iter_time=7.63s]
Epoch 0: 2%|▏ | 285/12384 [36:30<25:38:43, 7.63s/it, loss=6.8002, acc=0.0029, iter_time=7.63s]
Epoch 0: 2%|▏ | 286/12384 [36:30<25:39:46, 7.64s/it, loss=6.8002, acc=0.0029, iter_time=7.63s]
Epoch 0: 2%|▏ | 286/12384 [36:38<25:39:46, 7.64s/it, loss=6.7756, acc=0.0042, iter_time=7.65s]
Epoch 0: 2%|▏ | 287/12384 [36:38<25:37:32, 7.63s/it, loss=6.7756, acc=0.0042, iter_time=7.65s]
Epoch 0: 2%|▏ | 287/12384 [36:46<25:37:32, 7.63s/it, loss=7.3387, acc=0.0033, iter_time=7.99s]
Epoch 0: 2%|▏ | 288/12384 [36:46<25:38:22, 7.63s/it, loss=7.3387, acc=0.0033, iter_time=7.99s]
Epoch 0: 2%|▏ | 288/12384 [36:53<25:38:22, 7.63s/it, loss=6.7459, acc=0.0030, iter_time=6.96s]
Epoch 0: 2%|▏ | 289/12384 [36:53<25:35:55, 7.62s/it, loss=6.7459, acc=0.0030, iter_time=6.96s]
Epoch 0: 2%|▏ | 289/12384 [37:01<25:35:55, 7.62s/it, loss=6.3971, acc=0.0034, iter_time=7.90s]
Epoch 0: 2%|▏ | 290/12384 [37:01<25:37:36, 7.63s/it, loss=6.3971, acc=0.0034, iter_time=7.90s]
Epoch 0: 2%|▏ | 290/12384 [37:08<25:37:36, 7.63s/it, loss=6.7184, acc=0.0072, iter_time=7.63s]
Epoch 0: 2%|▏ | 291/12384 [37:08<25:38:29, 7.63s/it, loss=6.7184, acc=0.0072, iter_time=7.63s]
Epoch 0: 2%|▏ | 291/12384 [37:16<25:38:29, 7.63s/it, loss=6.7790, acc=0.0035, iter_time=7.64s]
Epoch 0: 2%|▏ | 292/12384 [37:16<25:39:30, 7.64s/it, loss=6.7790, acc=0.0035, iter_time=7.64s]
Epoch 0: 2%|▏ | 292/12384 [37:24<25:39:30, 7.64s/it, loss=6.5072, acc=0.0040, iter_time=7.66s]
Epoch 0: 2%|▏ | 293/12384 [37:24<25:38:43, 7.64s/it, loss=6.5072, acc=0.0040, iter_time=7.66s]
Epoch 0: 2%|▏ | 293/12384 [37:31<25:38:43, 7.64s/it, loss=6.6935, acc=0.0026, iter_time=5.07s]
Epoch 0: 2%|▏ | 294/12384 [37:31<25:40:16, 7.64s/it, loss=6.6935, acc=0.0026, iter_time=5.07s]
Epoch 0: 2%|▏ | 294/12384 [37:39<25:40:16, 7.64s/it, loss=6.3948, acc=0.0052, iter_time=8.13s]
Epoch 0: 2%|▏ | 295/12384 [37:39<25:38:37, 7.64s/it, loss=6.3948, acc=0.0052, iter_time=8.13s]
Epoch 0: 2%|▏ | 295/12384 [37:47<25:38:37, 7.64s/it, loss=6.7583, acc=0.0028, iter_time=9.71s]
Epoch 0: 2%|▏ | 296/12384 [37:47<25:40:48, 7.65s/it, loss=6.7583, acc=0.0028, iter_time=9.71s]
Epoch 0: 2%|▏ | 296/12384 [37:54<25:40:48, 7.65s/it, loss=6.1203, acc=0.0043, iter_time=7.66s]
Epoch 0: 2%|▏ | 297/12384 [37:54<25:39:54, 7.64s/it, loss=6.1203, acc=0.0043, iter_time=7.66s]
Epoch 0: 2%|▏ | 297/12384 [38:02<25:39:54, 7.64s/it, loss=7.0972, acc=0.0035, iter_time=7.96s]
Epoch 0: 2%|▏ | 298/12384 [38:02<26:00:03, 7.74s/it, loss=7.0972, acc=0.0035, iter_time=7.96s]
Epoch 0: 2%|▏ | 298/12384 [38:10<26:00:03, 7.74s/it, loss=6.2468, acc=0.0040, iter_time=7.07s]
Epoch 0: 2%|▏ | 299/12384 [38:10<25:54:47, 7.72s/it, loss=6.2468, acc=0.0040, iter_time=7.07s]
Epoch 0: 2%|▏ | 299/12384 [38:18<25:54:47, 7.72s/it, loss=6.3538, acc=0.0050, iter_time=8.72s]
Epoch 0: 2%|▏ | 300/12384 [38:18<25:52:28, 7.71s/it, loss=6.3538, acc=0.0050, iter_time=8.72s]
Epoch 0: 2%|▏ | 300/12384 [38:25<25:52:28, 7.71s/it, loss=5.8291, acc=0.0066, iter_time=4.60s]
Epoch 0: 2%|▏ | 301/12384 [38:25<25:49:18, 7.69s/it, loss=5.8291, acc=0.0066, iter_time=4.60s]
Epoch 0: 2%|▏ | 301/12384 [38:33<25:49:18, 7.69s/it, loss=6.3087, acc=0.0032, iter_time=10.30s]
Epoch 0: 2%|▏ | 302/12384 [38:33<25:48:30, 7.69s/it, loss=6.3087, acc=0.0032, iter_time=10.30s]
Epoch 0: 2%|▏ | 302/12384 [38:41<25:48:30, 7.69s/it, loss=6.6376, acc=0.0032, iter_time=5.61s]
Epoch 0: 2%|▏ | 303/12384 [38:41<25:42:30, 7.66s/it, loss=6.6376, acc=0.0032, iter_time=5.61s]
Epoch 0: 2%|▏ | 303/12384 [38:48<25:42:30, 7.66s/it, loss=6.8154, acc=0.0040, iter_time=10.00s]
Epoch 0: 2%|▏ | 304/12384 [38:48<25:41:36, 7.66s/it, loss=6.8154, acc=0.0040, iter_time=10.00s]
Epoch 0: 2%|▏ | 304/12384 [38:56<25:41:36, 7.66s/it, loss=5.8010, acc=0.0080, iter_time=4.22s]
Epoch 0: 2%|▏ | 305/12384 [38:56<25:39:34, 7.65s/it, loss=5.8010, acc=0.0080, iter_time=4.22s]
Epoch 0: 2%|▏ | 305/12384 [39:03<25:39:34, 7.65s/it, loss=6.6645, acc=0.0055, iter_time=10.67s]
Epoch 0: 2%|▏ | 306/12384 [39:03<25:38:25, 7.64s/it, loss=6.6645, acc=0.0055, iter_time=10.67s]
Epoch 0: 2%|▏ | 306/12384 [39:11<25:38:25, 7.64s/it, loss=6.6756, acc=0.0038, iter_time=5.32s]
Epoch 0: 2%|▏ | 307/12384 [39:11<25:34:56, 7.63s/it, loss=6.6756, acc=0.0038, iter_time=5.32s]
Epoch 0: 2%|▏ | 307/12384 [39:19<25:34:56, 7.63s/it, loss=6.4505, acc=0.0060, iter_time=9.92s]
Epoch 0: 2%|▏ | 308/12384 [39:19<25:36:27, 7.63s/it, loss=6.4505, acc=0.0060, iter_time=9.92s]
Epoch 0: 2%|▏ | 308/12384 [39:26<25:36:27, 7.63s/it, loss=6.1419, acc=0.0045, iter_time=4.76s]
Epoch 0: 2%|▏ | 309/12384 [39:26<25:35:33, 7.63s/it, loss=6.1419, acc=0.0045, iter_time=4.76s]
Epoch 0: 2%|▏ | 309/12384 [39:34<25:35:33, 7.63s/it, loss=5.9926, acc=0.0045, iter_time=6.99s]
Epoch 0: 3%|▎ | 310/12384 [39:34<25:37:26, 7.64s/it, loss=5.9926, acc=0.0045, iter_time=6.99s]
Epoch 0: 3%|▎ | 310/12384 [39:42<25:37:26, 7.64s/it, loss=6.0707, acc=0.0056, iter_time=11.17s]
Epoch 0: 3%|▎ | 311/12384 [39:42<25:36:56, 7.64s/it, loss=6.0707, acc=0.0056, iter_time=11.17s]
Epoch 0: 3%|▎ | 311/12384 [39:49<25:36:56, 7.64s/it, loss=6.5124, acc=0.0036, iter_time=7.74s]
Epoch 0: 3%|▎ | 312/12384 [39:49<25:37:29, 7.64s/it, loss=6.5124, acc=0.0036, iter_time=7.74s]
Epoch 0: 3%|▎ | 312/12384 [39:57<25:37:29, 7.64s/it, loss=5.6124, acc=0.0070, iter_time=5.01s]
Epoch 0: 3%|▎ | 313/12384 [39:57<25:39:13, 7.65s/it, loss=5.6124, acc=0.0070, iter_time=5.01s]
Epoch 0: 3%|▎ | 313/12384 [40:05<25:39:13, 7.65s/it, loss=6.2550, acc=0.0054, iter_time=10.20s]
Epoch 0: 3%|▎ | 314/12384 [40:05<25:39:13, 7.65s/it, loss=6.2550, acc=0.0054, iter_time=10.20s]
Epoch 0: 3%|▎ | 314/12384 [40:12<25:39:13, 7.65s/it, loss=5.9709, acc=0.0075, iter_time=5.64s]
Epoch 0: 3%|▎ | 315/12384 [40:12<25:40:12, 7.66s/it, loss=5.9709, acc=0.0075, iter_time=5.64s]
Epoch 0: 3%|▎ | 315/12384 [40:20<25:40:12, 7.66s/it, loss=6.4455, acc=0.0052, iter_time=9.69s]
Epoch 0: 3%|▎ | 316/12384 [40:20<25:41:19, 7.66s/it, loss=6.4455, acc=0.0052, iter_time=9.69s]
Epoch 0: 3%|▎ | 316/12384 [40:28<25:41:19, 7.66s/it, loss=5.5123, acc=0.0076, iter_time=5.37s]
Epoch 0: 3%|▎ | 317/12384 [40:28<25:42:23, 7.67s/it, loss=5.5123, acc=0.0076, iter_time=5.37s]
Epoch 0: 3%|▎ | 317/12384 [40:35<25:42:23, 7.67s/it, loss=5.9083, acc=0.0054, iter_time=10.00s]
Epoch 0: 3%|▎ | 318/12384 [40:35<25:43:43, 7.68s/it, loss=5.9083, acc=0.0054, iter_time=10.00s]
Epoch 0: 3%|▎ | 318/12384 [40:43<25:43:43, 7.68s/it, loss=5.7044, acc=0.0059, iter_time=4.80s]
Epoch 0: 3%|▎ | 319/12384 [40:43<25:43:38, 7.68s/it, loss=5.7044, acc=0.0059, iter_time=4.80s]
Epoch 0: 3%|▎ | 319/12384 [40:51<25:43:38, 7.68s/it, loss=6.1768, acc=0.0078, iter_time=10.52s]
Epoch 0: 3%|▎ | 320/12384 [40:51<25:42:00, 7.67s/it, loss=6.1768, acc=0.0078, iter_time=10.52s]
Epoch 0: 3%|▎ | 320/12384 [40:58<25:42:00, 7.67s/it, loss=5.7468, acc=0.0071, iter_time=7.68s]
Epoch 0: 3%|▎ | 321/12384 [40:58<25:39:49, 7.66s/it, loss=5.7468, acc=0.0071, iter_time=7.68s]
Epoch 0: 3%|▎ | 321/12384 [41:06<25:39:49, 7.66s/it, loss=5.8584, acc=0.0098, iter_time=4.80s]
Epoch 0: 3%|▎ | 322/12384 [41:06<25:35:59, 7.64s/it, loss=5.8584, acc=0.0098, iter_time=4.80s]
Epoch 0: 3%|▎ | 322/12384 [41:14<25:35:59, 7.64s/it, loss=6.2379, acc=0.0060, iter_time=10.44s]
Epoch 0: 3%|▎ | 323/12384 [41:14<25:35:57, 7.64s/it, loss=6.2379, acc=0.0060, iter_time=10.44s]
Epoch 0: 3%|▎ | 323/12384 [41:21<25:35:57, 7.64s/it, loss=5.9168, acc=0.0098, iter_time=7.30s]
Epoch 0: 3%|▎ | 324/12384 [41:21<25:36:27, 7.64s/it, loss=5.9168, acc=0.0098, iter_time=7.30s]
Epoch 0: 3%|▎ | 324/12384 [41:29<25:36:27, 7.64s/it, loss=5.6638, acc=0.0060, iter_time=8.30s]
Epoch 0: 3%|▎ | 325/12384 [41:29<25:54:59, 7.74s/it, loss=5.6638, acc=0.0060, iter_time=8.30s]
Epoch 0: 3%|▎ | 325/12384 [41:37<25:54:59, 7.74s/it, loss=5.8490, acc=0.0072, iter_time=7.62s]
Epoch 0: 3%|▎ | 326/12384 [41:37<25:50:37, 7.72s/it, loss=5.8490, acc=0.0072, iter_time=7.62s]
Epoch 0: 3%|▎ | 326/12384 [41:44<25:50:37, 7.72s/it, loss=5.6499, acc=0.0070, iter_time=7.66s]
Epoch 0: 3%|▎ | 327/12384 [41:44<25:45:52, 7.69s/it, loss=5.6499, acc=0.0070, iter_time=7.66s]
Epoch 0: 3%|▎ | 327/12384 [41:52<25:45:52, 7.69s/it, loss=5.8528, acc=0.0058, iter_time=8.03s]
Epoch 0: 3%|▎ | 328/12384 [41:52<25:40:44, 7.67s/it, loss=5.8528, acc=0.0058, iter_time=8.03s]
Epoch 0: 3%|▎ | 328/12384 [42:00<25:40:44, 7.67s/it, loss=5.3495, acc=0.0093, iter_time=7.22s]
Epoch 0: 3%|▎ | 329/12384 [42:00<25:39:31, 7.66s/it, loss=5.3495, acc=0.0093, iter_time=7.22s]
Epoch 0: 3%|▎ | 329/12384 [42:07<25:39:31, 7.66s/it, loss=5.3448, acc=0.0088, iter_time=7.64s]
Epoch 0: 3%|▎ | 330/12384 [42:07<25:37:29, 7.65s/it, loss=5.3448, acc=0.0088, iter_time=7.64s]
Epoch 0: 3%|▎ | 330/12384 [42:15<25:37:29, 7.65s/it, loss=5.8485, acc=0.0064, iter_time=7.66s]
Epoch 0: 3%|▎ | 331/12384 [42:15<25:35:47, 7.65s/it, loss=5.8485, acc=0.0064, iter_time=7.66s]
Epoch 0: 3%|▎ | 331/12384 [42:23<25:35:47, 7.65s/it, loss=5.9459, acc=0.0068, iter_time=7.62s]
Epoch 0: 3%|▎ | 332/12384 [42:23<25:35:17, 7.64s/it, loss=5.9459, acc=0.0068, iter_time=7.62s]
Epoch 0: 3%|▎ | 332/12384 [42:30<25:35:17, 7.64s/it, loss=5.4085, acc=0.0101, iter_time=7.63s]
Epoch 0: 3%|▎ | 333/12384 [42:30<25:37:01, 7.65s/it, loss=5.4085, acc=0.0101, iter_time=7.63s]
Epoch 0: 3%|▎ | 333/12384 [42:38<25:37:01, 7.65s/it, loss=5.3133, acc=0.0101, iter_time=5.07s]
Epoch 0: 3%|▎ | 334/12384 [42:38<25:36:06, 7.65s/it, loss=5.3133, acc=0.0101, iter_time=5.07s]
Epoch 0: 3%|▎ | 334/12384 [42:46<25:36:06, 7.65s/it, loss=5.3288, acc=0.0072, iter_time=10.25s]
Epoch 0: 3%|▎ | 335/12384 [42:46<25:36:47, 7.65s/it, loss=5.3288, acc=0.0072, iter_time=10.25s]
Epoch 0: 3%|▎ | 335/12384 [42:53<25:36:47, 7.65s/it, loss=5.7861, acc=0.0081, iter_time=8.04s]
Epoch 0: 3%|▎ | 336/12384 [42:53<25:34:58, 7.64s/it, loss=5.7861, acc=0.0081, iter_time=8.04s]
Epoch 0: 3%|▎ | 336/12384 [43:01<25:34:58, 7.64s/it, loss=5.7992, acc=0.0069, iter_time=7.23s]
Epoch 0: 3%|▎ | 337/12384 [43:01<25:38:53, 7.66s/it, loss=5.7992, acc=0.0069, iter_time=7.23s]
Epoch 0: 3%|▎ | 337/12384 [43:09<25:38:53, 7.66s/it, loss=6.0970, acc=0.0070, iter_time=7.73s]
Epoch 0: 3%|▎ | 338/12384 [43:09<25:40:20, 7.67s/it, loss=6.0970, acc=0.0070, iter_time=7.73s]
Epoch 0: 3%|▎ | 338/12384 [43:16<25:40:20, 7.67s/it, loss=5.6665, acc=0.0068, iter_time=7.69s]
Epoch 0: 3%|▎ | 339/12384 [43:16<25:38:39, 7.66s/it, loss=5.6665, acc=0.0068, iter_time=7.69s]
Epoch 0: 3%|▎ | 339/12384 [43:24<25:38:39, 7.66s/it, loss=5.7326, acc=0.0087, iter_time=5.86s]
Epoch 0: 3%|▎ | 340/12384 [43:24<25:38:37, 7.66s/it, loss=5.7326, acc=0.0087, iter_time=5.86s]
Epoch 0: 3%|▎ | 340/12384 [43:32<25:38:37, 7.66s/it, loss=5.4915, acc=0.0102, iter_time=9.45s]
Epoch 0: 3%|▎ | 341/12384 [43:32<25:38:16, 7.66s/it, loss=5.4915, acc=0.0102, iter_time=9.45s]
Epoch 0: 3%|▎ | 341/12384 [43:39<25:38:16, 7.66s/it, loss=5.7700, acc=0.0064, iter_time=7.67s]
Epoch 0: 3%|▎ | 342/12384 [43:39<25:37:02, 7.66s/it, loss=5.7700, acc=0.0064, iter_time=7.67s]
Epoch 0: 3%|▎ | 342/12384 [43:47<25:37:02, 7.66s/it, loss=5.6819, acc=0.0080, iter_time=7.63s]
Epoch 0: 3%|▎ | 343/12384 [43:47<25:34:27, 7.65s/it, loss=5.6819, acc=0.0080, iter_time=7.63s]
Epoch 0: 3%|▎ | 343/12384 [43:54<25:34:27, 7.65s/it, loss=5.4848, acc=0.0113, iter_time=8.01s]
Epoch 0: 3%|▎ | 344/12384 [43:54<25:33:07, 7.64s/it, loss=5.4848, acc=0.0113, iter_time=8.01s]
Epoch 0: 3%|▎ | 344/12384 [44:02<25:33:07, 7.64s/it, loss=5.6680, acc=0.0124, iter_time=7.25s]
Epoch 0: 3%|▎ | 345/12384 [44:02<25:33:43, 7.64s/it, loss=5.6680, acc=0.0124, iter_time=7.25s]
Epoch 0: 3%|▎ | 345/12384 [44:10<25:33:43, 7.64s/it, loss=5.4482, acc=0.0082, iter_time=7.64s]
Epoch 0: 3%|▎ | 346/12384 [44:10<25:33:42, 7.64s/it, loss=5.4482, acc=0.0082, iter_time=7.64s]
Epoch 0: 3%|▎ | 346/12384 [44:17<25:33:42, 7.64s/it, loss=5.3382, acc=0.0116, iter_time=7.65s]
Epoch 0: 3%|▎ | 347/12384 [44:17<25:30:54, 7.63s/it, loss=5.3382, acc=0.0116, iter_time=7.65s]
Epoch 0: 3%|▎ | 347/12384 [44:25<25:30:54, 7.63s/it, loss=5.9495, acc=0.0055, iter_time=7.62s]
Epoch 0: 3%|▎ | 348/12384 [44:25<25:30:03, 7.63s/it, loss=5.9495, acc=0.0055, iter_time=7.62s]
Epoch 0: 3%|▎ | 348/12384 [44:33<25:30:03, 7.63s/it, loss=5.5126, acc=0.0067, iter_time=7.60s]
Epoch 0: 3%|▎ | 349/12384 [44:33<25:30:12, 7.63s/it, loss=5.5126, acc=0.0067, iter_time=7.60s]
Epoch 0: 3%|▎ | 349/12384 [44:40<25:30:12, 7.63s/it, loss=5.4053, acc=0.0117, iter_time=8.02s]
Epoch 0: 3%|▎ | 350/12384 [44:40<25:28:43, 7.62s/it, loss=5.4053, acc=0.0117, iter_time=8.02s]
Epoch 0: 3%|▎ | 350/12384 [44:48<25:28:43, 7.62s/it, loss=5.0049, acc=0.0102, iter_time=7.57s]
Epoch 0: 3%|▎ | 351/12384 [44:48<25:50:39, 7.73s/it, loss=5.0049, acc=0.0102, iter_time=7.57s]
Epoch 0: 3%|▎ | 351/12384 [44:56<25:50:39, 7.73s/it, loss=4.9376, acc=0.0129, iter_time=7.60s]
Epoch 0: 3%|▎ | 352/12384 [44:56<25:44:47, 7.70s/it, loss=4.9376, acc=0.0129, iter_time=7.60s]
Epoch 0: 3%|▎ | 352/12384 [45:03<25:44:47, 7.70s/it, loss=5.2557, acc=0.0145, iter_time=7.66s]
Epoch 0: 3%|▎ | 353/12384 [45:03<25:40:11, 7.68s/it, loss=5.2557, acc=0.0145, iter_time=7.66s]
Epoch 0: 3%|▎ | 353/12384 [45:11<25:40:11, 7.68s/it, loss=4.6446, acc=0.0172, iter_time=7.64s]
Epoch 0: 3%|▎ | 354/12384 [45:11<25:35:22, 7.66s/it, loss=4.6446, acc=0.0172, iter_time=7.64s]
Epoch 0: 3%|▎ | 354/12384 [45:19<25:35:22, 7.66s/it, loss=4.7147, acc=0.0130, iter_time=7.60s]
Epoch 0: 3%|▎ | 355/12384 [45:19<25:33:58, 7.65s/it, loss=4.7147, acc=0.0130, iter_time=7.60s]
Epoch 0: 3%|▎ | 355/12384 [45:26<25:33:58, 7.65s/it, loss=5.1595, acc=0.0100, iter_time=3.61s]
Epoch 0: 3%|▎ | 356/12384 [45:26<25:37:44, 7.67s/it, loss=5.1595, acc=0.0100, iter_time=3.61s]
Epoch 0: 3%|▎ | 356/12384 [45:34<25:37:44, 7.67s/it, loss=5.1754, acc=0.0106, iter_time=11.74s]
Epoch 0: 3%|▎ | 357/12384 [45:34<25:34:07, 7.65s/it, loss=5.1754, acc=0.0106, iter_time=11.74s]
Epoch 0: 3%|▎ | 357/12384 [45:42<25:34:07, 7.65s/it, loss=5.2104, acc=0.0132, iter_time=7.60s]
Epoch 0: 3%|▎ | 358/12384 [45:42<25:33:46, 7.65s/it, loss=5.2104, acc=0.0132, iter_time=7.60s]
Epoch 0: 3%|▎ | 358/12384 [45:49<25:33:46, 7.65s/it, loss=5.5443, acc=0.0122, iter_time=7.68s]
Epoch 0: 3%|▎ | 359/12384 [45:49<25:32:20, 7.65s/it, loss=5.5443, acc=0.0122, iter_time=7.68s]
Epoch 0: 3%|▎ | 359/12384 [45:57<25:32:20, 7.65s/it, loss=4.6941, acc=0.0179, iter_time=7.56s]
Epoch 0: 3%|▎ | 360/12384 [45:57<25:30:07, 7.64s/it, loss=4.6941, acc=0.0179, iter_time=7.56s]
Epoch 0: 3%|▎ | 360/12384 [46:05<25:30:07, 7.64s/it, loss=5.2813, acc=0.0146, iter_time=7.65s]
Epoch 0: 3%|▎ | 361/12384 [46:05<25:28:42, 7.63s/it, loss=5.2813, acc=0.0146, iter_time=7.65s]
Epoch 0: 3%|▎ | 361/12384 [46:12<25:28:42, 7.63s/it, loss=4.4687, acc=0.0203, iter_time=5.53s]
Epoch 0: 3%|▎ | 362/12384 [46:12<25:32:07, 7.65s/it, loss=4.4687, acc=0.0203, iter_time=5.53s]
Epoch 0: 3%|▎ | 362/12384 [46:20<25:32:07, 7.65s/it, loss=4.8078, acc=0.0235, iter_time=9.80s]
Epoch 0: 3%|▎ | 363/12384 [46:20<25:32:04, 7.65s/it, loss=4.8078, acc=0.0235, iter_time=9.80s]
Epoch 0: 3%|▎ | 363/12384 [46:28<25:32:04, 7.65s/it, loss=4.4958, acc=0.0183, iter_time=7.63s]
Epoch 0: 3%|▎ | 364/12384 [46:28<25:30:55, 7.64s/it, loss=4.4958, acc=0.0183, iter_time=7.63s]
Epoch 0: 3%|▎ | 364/12384 [46:35<25:30:55, 7.64s/it, loss=5.0373, acc=0.0105, iter_time=7.66s]
Epoch 0: 3%|▎ | 365/12384 [46:35<25:29:15, 7.63s/it, loss=5.0373, acc=0.0105, iter_time=7.66s]
Epoch 0: 3%|▎ | 365/12384 [46:43<25:29:15, 7.63s/it, loss=4.6957, acc=0.0158, iter_time=7.60s]
Epoch 0: 3%|▎ | 366/12384 [46:43<25:31:48, 7.65s/it, loss=4.6957, acc=0.0158, iter_time=7.60s]
Epoch 0: 3%|▎ | 366/12384 [46:50<25:31:48, 7.65s/it, loss=4.7914, acc=0.0158, iter_time=7.70s]
Epoch 0: 3%|▎ | 367/12384 [46:50<25:29:35, 7.64s/it, loss=4.7914, acc=0.0158, iter_time=7.70s]
Epoch 0: 3%|▎ | 367/12384 [46:58<25:29:35, 7.64s/it, loss=4.8600, acc=0.0196, iter_time=7.59s]
Epoch 0: 3%|▎ | 368/12384 [46:58<25:30:08, 7.64s/it, loss=4.8600, acc=0.0196, iter_time=7.59s]
Epoch 0: 3%|▎ | 368/12384 [47:06<25:30:08, 7.64s/it, loss=4.6137, acc=0.0147, iter_time=7.68s]
Epoch 0: 3%|▎ | 369/12384 [47:06<25:37:18, 7.68s/it, loss=4.6137, acc=0.0147, iter_time=7.68s]
Epoch 0: 3%|▎ | 369/12384 [47:13<25:37:18, 7.68s/it, loss=4.9908, acc=0.0129, iter_time=7.73s]
Epoch 0: 3%|▎ | 370/12384 [47:13<25:33:52, 7.66s/it, loss=4.9908, acc=0.0129, iter_time=7.73s]
Epoch 0: 3%|▎ | 370/12384 [47:21<25:33:52, 7.66s/it, loss=4.8862, acc=0.0132, iter_time=7.66s]
Epoch 0: 3%|▎ | 371/12384 [47:21<25:32:29, 7.65s/it, loss=4.8862, acc=0.0132, iter_time=7.66s]
Epoch 0: 3%|▎ | 371/12384 [47:29<25:32:29, 7.65s/it, loss=4.9949, acc=0.0125, iter_time=7.61s]
Epoch 0: 3%|▎ | 372/12384 [47:29<25:29:35, 7.64s/it, loss=4.9949, acc=0.0125, iter_time=7.61s]
Epoch 0: 3%|▎ | 372/12384 [47:36<25:29:35, 7.64s/it, loss=4.9881, acc=0.0133, iter_time=7.64s]
Epoch 0: 3%|▎ | 373/12384 [47:36<25:30:03, 7.64s/it, loss=4.9881, acc=0.0133, iter_time=7.64s]
Epoch 0: 3%|▎ | 373/12384 [47:44<25:30:03, 7.64s/it, loss=4.7250, acc=0.0206, iter_time=4.32s]
Epoch 0: 3%|▎ | 374/12384 [47:44<25:29:53, 7.64s/it, loss=4.7250, acc=0.0206, iter_time=4.32s]
Epoch 0: 3%|▎ | 374/12384 [47:52<25:29:53, 7.64s/it, loss=5.1235, acc=0.0125, iter_time=10.95s]
Epoch 0: 3%|▎ | 375/12384 [47:52<25:28:39, 7.64s/it, loss=5.1235, acc=0.0125, iter_time=10.95s]
Epoch 0: 3%|▎ | 375/12384 [47:59<25:28:39, 7.64s/it, loss=5.1166, acc=0.0131, iter_time=8.01s]
Epoch 0: 3%|▎ | 376/12384 [47:59<25:29:48, 7.64s/it, loss=5.1166, acc=0.0131, iter_time=8.01s]
Epoch 0: 3%|▎ | 376/12384 [48:07<25:29:48, 7.64s/it, loss=5.0236, acc=0.0119, iter_time=7.56s]
Epoch 0: 3%|▎ | 377/12384 [48:07<25:47:08, 7.73s/it, loss=5.0236, acc=0.0119, iter_time=7.56s]
Epoch 0: 3%|▎ | 377/12384 [48:15<25:47:08, 7.73s/it, loss=4.2411, acc=0.0275, iter_time=4.34s]
Epoch 0: 3%|▎ | 378/12384 [48:15<25:37:55, 7.69s/it, loss=4.2411, acc=0.0275, iter_time=4.34s]
Epoch 0: 3%|▎ | 378/12384 [48:22<25:37:55, 7.69s/it, loss=4.5981, acc=0.0179, iter_time=10.23s]
Epoch 0: 3%|▎ | 379/12384 [48:22<25:37:33, 7.68s/it, loss=4.5981, acc=0.0179, iter_time=10.23s]
Epoch 0: 3%|▎ | 379/12384 [48:30<25:37:33, 7.68s/it, loss=5.0602, acc=0.0156, iter_time=7.47s]
Epoch 0: 3%|▎ | 380/12384 [48:30<25:36:04, 7.68s/it, loss=5.0602, acc=0.0156, iter_time=7.47s]
Epoch 0: 3%|▎ | 380/12384 [48:38<25:36:04, 7.68s/it, loss=4.7217, acc=0.0143, iter_time=8.51s]
Epoch 0: 3%|▎ | 381/12384 [48:38<25:32:56, 7.66s/it, loss=4.7217, acc=0.0143, iter_time=8.51s]
Epoch 0: 3%|▎ | 381/12384 [48:45<25:32:56, 7.66s/it, loss=4.8477, acc=0.0153, iter_time=7.63s]
Epoch 0: 3%|▎ | 382/12384 [48:45<25:30:49, 7.65s/it, loss=4.8477, acc=0.0153, iter_time=7.63s]
Epoch 0: 3%|▎ | 382/12384 [48:53<25:30:49, 7.65s/it, loss=4.2739, acc=0.0184, iter_time=7.65s]
Epoch 0: 3%|▎ | 383/12384 [48:53<25:31:10, 7.66s/it, loss=4.2739, acc=0.0184, iter_time=7.65s]
Epoch 0: 3%|▎ | 383/12384 [49:01<25:31:10, 7.66s/it, loss=4.7012, acc=0.0205, iter_time=8.04s]
Epoch 0: 3%|▎ | 384/12384 [49:01<25:28:24, 7.64s/it, loss=4.7012, acc=0.0205, iter_time=8.04s]
Epoch 0: 3%|▎ | 384/12384 [49:08<25:28:24, 7.64s/it, loss=4.2782, acc=0.0249, iter_time=7.27s]
Epoch 0: 3%|▎ | 385/12384 [49:08<25:29:26, 7.65s/it, loss=4.2782, acc=0.0249, iter_time=7.27s]
Epoch 0: 3%|▎ | 385/12384 [49:16<25:29:26, 7.65s/it, loss=4.4541, acc=0.0239, iter_time=7.62s]
Epoch 0: 3%|▎ | 386/12384 [49:16<25:28:25, 7.64s/it, loss=4.4541, acc=0.0239, iter_time=7.62s]
Epoch 0: 3%|▎ | 386/12384 [49:24<25:28:25, 7.64s/it, loss=4.2846, acc=0.0287, iter_time=6.77s]
Epoch 0: 3%|▎ | 387/12384 [49:24<25:28:19, 7.64s/it, loss=4.2846, acc=0.0287, iter_time=6.77s]
Epoch 0: 3%|▎ | 387/12384 [49:31<25:28:19, 7.64s/it, loss=4.1714, acc=0.0222, iter_time=8.50s]
Epoch 0: 3%|▎ | 388/12384 [49:31<25:27:30, 7.64s/it, loss=4.1714, acc=0.0222, iter_time=8.50s]
Epoch 0: 3%|▎ | 388/12384 [49:39<25:27:30, 7.64s/it, loss=4.2648, acc=0.0199, iter_time=7.63s]
Epoch 0: 3%|▎ | 389/12384 [49:39<25:31:02, 7.66s/it, loss=4.2648, acc=0.0199, iter_time=7.63s]
Epoch 0: 3%|▎ | 389/12384 [49:47<25:31:02, 7.66s/it, loss=4.3564, acc=0.0300, iter_time=7.40s]
Epoch 0: 3%|▎ | 390/12384 [49:47<25:27:13, 7.64s/it, loss=4.3564, acc=0.0300, iter_time=7.40s]
Epoch 0: 3%|▎ | 390/12384 [49:54<25:27:13, 7.64s/it, loss=4.5471, acc=0.0209, iter_time=7.91s]
Epoch 0: 3%|▎ | 391/12384 [49:54<25:27:37, 7.64s/it, loss=4.5471, acc=0.0209, iter_time=7.91s]
Epoch 0: 3%|▎ | 391/12384 [50:02<25:27:37, 7.64s/it, loss=4.4058, acc=0.0166, iter_time=8.04s]
Epoch 0: 3%|▎ | 392/12384 [50:02<25:28:59, 7.65s/it, loss=4.4058, acc=0.0166, iter_time=8.04s]
Epoch 0: 3%|▎ | 392/12384 [50:10<25:28:59, 7.65s/it, loss=4.1021, acc=0.0195, iter_time=7.38s]
Epoch 0: 3%|▎ | 393/12384 [50:10<25:32:59, 7.67s/it, loss=4.1021, acc=0.0195, iter_time=7.38s]
Epoch 0: 3%|▎ | 393/12384 [50:17<25:32:59, 7.67s/it, loss=4.2500, acc=0.0247, iter_time=6.98s]
Epoch 0: 3%|▎ | 394/12384 [50:17<25:31:09, 7.66s/it, loss=4.2500, acc=0.0247, iter_time=6.98s]
Epoch 0: 3%|▎ | 394/12384 [50:25<25:31:09, 7.66s/it, loss=4.0351, acc=0.0294, iter_time=5.35s]
Epoch 0: 3%|▎ | 395/12384 [50:25<25:32:56, 7.67s/it, loss=4.0351, acc=0.0294, iter_time=5.35s]
Epoch 0: 3%|▎ | 395/12384 [50:33<25:32:56, 7.67s/it, loss=4.0351, acc=0.0264, iter_time=10.65s]
Epoch 0: 3%|▎ | 396/12384 [50:33<25:32:00, 7.67s/it, loss=4.0351, acc=0.0264, iter_time=10.65s]
Epoch 0: 3%|▎ | 396/12384 [50:40<25:32:00, 7.67s/it, loss=3.8231, acc=0.0282, iter_time=7.63s]
Epoch 0: 3%|▎ | 397/12384 [50:40<25:29:23, 7.66s/it, loss=3.8231, acc=0.0282, iter_time=7.63s]
Epoch 0: 3%|▎ | 397/12384 [50:48<25:29:23, 7.66s/it, loss=4.3682, acc=0.0196, iter_time=7.65s]
Epoch 0: 3%|▎ | 398/12384 [50:48<25:31:08, 7.66s/it, loss=4.3682, acc=0.0196, iter_time=7.65s]
Epoch 0: 3%|▎ | 398/12384 [50:56<25:31:08, 7.66s/it, loss=3.7488, acc=0.0245, iter_time=6.43s]
Epoch 0: 3%|▎ | 399/12384 [50:56<25:29:10, 7.66s/it, loss=3.7488, acc=0.0245, iter_time=6.43s]
Epoch 0: 3%|▎ | 399/12384 [51:03<25:29:10, 7.66s/it, loss=4.3565, acc=0.0228, iter_time=9.42s]
Epoch 0: 3%|▎ | 400/12384 [51:03<25:35:48, 7.69s/it, loss=4.3565, acc=0.0228, iter_time=9.42s]
Epoch 0: 3%|▎ | 400/12384 [51:11<25:35:48, 7.69s/it, loss=3.7938, acc=0.0266, iter_time=7.20s]
Epoch 0: 3%|▎ | 401/12384 [51:11<25:31:45, 7.67s/it, loss=3.7938, acc=0.0266, iter_time=7.20s]
Epoch 0: 3%|▎ | 401/12384 [51:19<25:31:45, 7.67s/it, loss=4.2312, acc=0.0216, iter_time=7.64s]
Epoch 0: 3%|▎ | 402/12384 [51:19<25:31:52, 7.67s/it, loss=4.2312, acc=0.0216, iter_time=7.64s]
Epoch 0: 3%|▎ | 402/12384 [51:27<25:31:52, 7.67s/it, loss=3.9393, acc=0.0294, iter_time=8.02s]
Epoch 0: 3%|▎ | 403/12384 [51:27<25:53:43, 7.78s/it, loss=3.9393, acc=0.0294, iter_time=8.02s]
Epoch 0: 3%|▎ | 403/12384 [51:34<25:53:43, 7.78s/it, loss=4.2445, acc=0.0226, iter_time=6.81s]
Epoch 0: 3%|▎ | 404/12384 [51:34<25:45:49, 7.74s/it, loss=4.2445, acc=0.0226, iter_time=6.81s]
Epoch 0: 3%|▎ | 404/12384 [51:42<25:45:49, 7.74s/it, loss=3.7501, acc=0.0291, iter_time=7.12s]
Epoch 0: 3%|▎ | 405/12384 [51:42<25:43:25, 7.73s/it, loss=3.7501, acc=0.0291, iter_time=7.12s]
Epoch 0: 3%|▎ | 405/12384 [51:50<25:43:25, 7.73s/it, loss=3.5726, acc=0.0380, iter_time=7.14s]
Epoch 0: 3%|▎ | 406/12384 [51:50<25:38:49, 7.71s/it, loss=3.5726, acc=0.0380, iter_time=7.14s]
Epoch 0: 3%|▎ | 406/12384 [51:57<25:38:49, 7.71s/it, loss=4.2236, acc=0.0188, iter_time=9.66s]
Epoch 0: 3%|▎ | 407/12384 [51:57<25:35:21, 7.69s/it, loss=4.2236, acc=0.0188, iter_time=9.66s]
Epoch 0: 3%|▎ | 407/12384 [52:05<25:35:21, 7.69s/it, loss=3.8117, acc=0.0293, iter_time=8.06s]
Epoch 0: 3%|▎ | 408/12384 [52:05<25:33:23, 7.68s/it, loss=3.8117, acc=0.0293, iter_time=8.06s]
Epoch 0: 3%|▎ | 408/12384 [52:13<25:33:23, 7.68s/it, loss=3.6982, acc=0.0342, iter_time=7.23s]
Epoch 0: 3%|▎ | 409/12384 [52:13<25:30:38, 7.67s/it, loss=3.6982, acc=0.0342, iter_time=7.23s]
Epoch 0: 3%|▎ | 409/12384 [52:20<25:30:38, 7.67s/it, loss=3.5757, acc=0.0318, iter_time=7.67s]
Epoch 0: 3%|▎ | 410/12384 [52:20<25:33:26, 7.68s/it, loss=3.5757, acc=0.0318, iter_time=7.67s]
Epoch 0: 3%|▎ | 410/12384 [52:28<25:33:26, 7.68s/it, loss=3.8740, acc=0.0279, iter_time=7.70s]
Epoch 0: 3%|▎ | 411/12384 [52:28<25:32:28, 7.68s/it, loss=3.8740, acc=0.0279, iter_time=7.70s]
Epoch 0: 3%|▎ | 411/12384 [52:36<25:32:28, 7.68s/it, loss=3.5094, acc=0.0339, iter_time=7.09s]
Epoch 0: 3%|▎ | 412/12384 [52:36<25:30:37, 7.67s/it, loss=3.5094, acc=0.0339, iter_time=7.09s]
Epoch 0: 3%|▎ | 412/12384 [52:43<25:30:37, 7.67s/it, loss=3.2465, acc=0.0371, iter_time=4.61s]
Epoch 0: 3%|▎ | 413/12384 [52:43<25:29:09, 7.66s/it, loss=3.2465, acc=0.0371, iter_time=4.61s]
Epoch 0: 3%|▎ | 413/12384 [52:51<25:29:09, 7.66s/it, loss=2.8904, acc=0.0574, iter_time=8.40s]
Epoch 0: 3%|▎ | 414/12384 [52:51<25:28:28, 7.66s/it, loss=2.8904, acc=0.0574, iter_time=8.40s]
Epoch 0: 3%|▎ | 414/12384 [52:59<25:28:28, 7.66s/it, loss=3.6628, acc=0.0276, iter_time=10.50s]
Epoch 0: 3%|▎ | 415/12384 [52:59<25:25:31, 7.65s/it, loss=3.6628, acc=0.0276, iter_time=10.50s]
Epoch 0: 3%|▎ | 415/12384 [53:06<25:25:31, 7.65s/it, loss=3.8821, acc=0.0325, iter_time=8.01s]
Epoch 0: 3%|▎ | 416/12384 [53:06<25:26:24, 7.65s/it, loss=3.8821, acc=0.0325, iter_time=8.01s]
Epoch 0: 3%|▎ | 416/12384 [53:14<25:26:24, 7.65s/it, loss=3.2570, acc=0.0432, iter_time=4.50s]
Epoch 0: 3%|▎ | 417/12384 [53:14<25:28:00, 7.66s/it, loss=3.2570, acc=0.0432, iter_time=4.50s]
Epoch 0: 3%|▎ | 417/12384 [53:22<25:28:00, 7.66s/it, loss=3.5080, acc=0.0288, iter_time=10.45s]
Epoch 0: 3%|▎ | 418/12384 [53:22<25:30:13, 7.67s/it, loss=3.5080, acc=0.0288, iter_time=10.45s]
Epoch 0: 3%|▎ | 418/12384 [53:29<25:30:13, 7.67s/it, loss=3.0909, acc=0.0365, iter_time=7.70s]
Epoch 0: 3%|▎ | 419/12384 [53:29<25:27:52, 7.66s/it, loss=3.0909, acc=0.0365, iter_time=7.70s]
Epoch 0: 3%|▎ | 419/12384 [53:37<25:27:52, 7.66s/it, loss=3.4928, acc=0.0372, iter_time=7.65s]
Epoch 0: 3%|▎ | 420/12384 [53:37<25:27:45, 7.66s/it, loss=3.4928, acc=0.0372, iter_time=7.65s]
Epoch 0: 3%|▎ | 420/12384 [53:45<25:27:45, 7.66s/it, loss=3.4464, acc=0.0396, iter_time=7.65s]
Epoch 0: 3%|▎ | 421/12384 [53:45<25:25:33, 7.65s/it, loss=3.4464, acc=0.0396, iter_time=7.65s]
Epoch 0: 3%|▎ | 421/12384 [53:52<25:25:33, 7.65s/it, loss=3.3146, acc=0.0343, iter_time=7.63s]
Epoch 0: 3%|▎ | 422/12384 [53:52<25:22:39, 7.64s/it, loss=3.3146, acc=0.0343, iter_time=7.63s]
Epoch 0: 3%|▎ | 422/12384 [54:00<25:22:39, 7.64s/it, loss=3.3239, acc=0.0348, iter_time=6.66s]
Epoch 0: 3%|▎ | 423/12384 [54:00<25:23:53, 7.64s/it, loss=3.3239, acc=0.0348, iter_time=6.66s]
Epoch 0: 3%|▎ | 423/12384 [54:07<25:23:53, 7.64s/it, loss=3.2749, acc=0.0364, iter_time=8.56s]
Epoch 0: 3%|▎ | 424/12384 [54:07<25:22:46, 7.64s/it, loss=3.2749, acc=0.0364, iter_time=8.56s]
Epoch 0: 3%|▎ | 424/12384 [54:15<25:22:46, 7.64s/it, loss=3.0364, acc=0.0451, iter_time=7.66s]
Epoch 0: 3%|▎ | 425/12384 [54:15<25:22:33, 7.64s/it, loss=3.0364, acc=0.0451, iter_time=7.66s]
Epoch 0: 3%|▎ | 425/12384 [54:23<25:22:33, 7.64s/it, loss=3.0444, acc=0.0412, iter_time=7.65s]
Epoch 0: 3%|▎ | 426/12384 [54:23<25:21:50, 7.64s/it, loss=3.0444, acc=0.0412, iter_time=7.65s]
Epoch 0: 3%|▎ | 426/12384 [54:30<25:21:50, 7.64s/it, loss=3.2301, acc=0.0386, iter_time=7.72s]
Epoch 0: 3%|▎ | 427/12384 [54:30<25:26:05, 7.66s/it, loss=3.2301, acc=0.0386, iter_time=7.72s]
Epoch 0: 3%|▎ | 427/12384 [54:38<25:26:05, 7.66s/it, loss=3.2357, acc=0.0334, iter_time=7.62s]
Epoch 0: 3%|▎ | 428/12384 [54:38<25:22:50, 7.64s/it, loss=3.2357, acc=0.0334, iter_time=7.62s]
Epoch 0: 3%|▎ | 428/12384 [54:46<25:22:50, 7.64s/it, loss=3.1309, acc=0.0459, iter_time=5.59s]
Epoch 0: 3%|▎ | 429/12384 [54:46<25:44:00, 7.75s/it, loss=3.1309, acc=0.0459, iter_time=5.59s]
Epoch 0: 3%|▎ | 429/12384 [54:54<25:44:00, 7.75s/it, loss=2.9865, acc=0.0453, iter_time=10.01s]
Epoch 0: 3%|▎ | 430/12384 [54:54<25:38:28, 7.72s/it, loss=2.9865, acc=0.0453, iter_time=10.01s]
Epoch 0: 3%|▎ | 430/12384 [55:01<25:38:28, 7.72s/it, loss=3.1372, acc=0.0429, iter_time=7.65s]
Epoch 0: 3%|▎ | 431/12384 [55:01<25:37:07, 7.72s/it, loss=3.1372, acc=0.0429, iter_time=7.65s]
Epoch 0: 3%|▎ | 431/12384 [55:09<25:37:07, 7.72s/it, loss=3.2819, acc=0.0415, iter_time=8.11s]
Epoch 0: 3%|▎ | 432/12384 [55:09<25:33:47, 7.70s/it, loss=3.2819, acc=0.0415, iter_time=8.11s]
Epoch 0: 3%|▎ | 432/12384 [55:17<25:33:47, 7.70s/it, loss=3.0646, acc=0.0505, iter_time=7.26s]
Epoch 0: 3%|▎ | 433/12384 [55:17<25:31:41, 7.69s/it, loss=3.0646, acc=0.0505, iter_time=7.26s]
Epoch 0: 3%|▎ | 433/12384 [55:24<25:31:41, 7.69s/it, loss=3.4927, acc=0.0437, iter_time=7.74s]
Epoch 0: 4%|▎ | 434/12384 [55:24<25:29:55, 7.68s/it, loss=3.4927, acc=0.0437, iter_time=7.74s]
Epoch 0: 4%|▎ | 434/12384 [55:32<25:29:55, 7.68s/it, loss=3.1577, acc=0.0383, iter_time=7.62s]
Epoch 0: 4%|▎ | 435/12384 [55:32<25:28:53, 7.68s/it, loss=3.1577, acc=0.0383, iter_time=7.62s]
Epoch 0: 4%|▎ | 435/12384 [55:40<25:28:53, 7.68s/it, loss=2.9042, acc=0.0446, iter_time=7.64s]
Epoch 0: 4%|▎ | 436/12384 [55:40<25:23:48, 7.65s/it, loss=2.9042, acc=0.0446, iter_time=7.64s]
Epoch 0: 4%|▎ | 436/12384 [55:47<25:23:48, 7.65s/it, loss=2.8476, acc=0.0494, iter_time=7.62s]
Epoch 0: 4%|▎ | 437/12384 [55:47<25:24:27, 7.66s/it, loss=2.8476, acc=0.0494, iter_time=7.62s]
Epoch 0: 4%|▎ | 437/12384 [55:55<25:24:27, 7.66s/it, loss=2.5513, acc=0.0720, iter_time=4.37s]
Epoch 0: 4%|▎ | 438/12384 [55:55<25:24:39, 7.66s/it, loss=2.5513, acc=0.0720, iter_time=4.37s]
Epoch 0: 4%|▎ | 438/12384 [56:03<25:24:39, 7.66s/it, loss=3.1866, acc=0.0466, iter_time=10.93s]
Epoch 0: 4%|▎ | 439/12384 [56:03<25:22:33, 7.65s/it, loss=3.1866, acc=0.0466, iter_time=10.93s]
Epoch 0: 4%|▎ | 439/12384 [56:10<25:22:33, 7.65s/it, loss=3.7266, acc=0.0348, iter_time=8.02s]
Epoch 0: 4%|▎ | 440/12384 [56:10<25:21:13, 7.64s/it, loss=3.7266, acc=0.0348, iter_time=8.02s]
Epoch 0: 4%|▎ | 440/12384 [56:18<25:21:13, 7.64s/it, loss=2.6208, acc=0.0580, iter_time=4.90s]
Epoch 0: 4%|▎ | 441/12384 [56:18<25:19:17, 7.63s/it, loss=2.6208, acc=0.0580, iter_time=4.90s]
Epoch 0: 4%|▎ | 441/12384 [56:25<25:19:17, 7.63s/it, loss=2.8994, acc=0.0426, iter_time=9.96s]
Epoch 0: 4%|▎ | 442/12384 [56:25<25:18:06, 7.63s/it, loss=2.8994, acc=0.0426, iter_time=9.96s]
Epoch 0: 4%|▎ | 442/12384 [56:33<25:18:06, 7.63s/it, loss=2.9250, acc=0.0597, iter_time=5.03s]
Epoch 0: 4%|▎ | 443/12384 [56:33<25:19:24, 7.63s/it, loss=2.9250, acc=0.0597, iter_time=5.03s]
Epoch 0: 4%|▎ | 443/12384 [56:41<25:19:24, 7.63s/it, loss=3.0754, acc=0.0495, iter_time=9.93s]
Epoch 0: 4%|▎ | 444/12384 [56:41<25:18:40, 7.63s/it, loss=3.0754, acc=0.0495, iter_time=9.93s]
Epoch 0: 4%|▎ | 444/12384 [56:48<25:18:40, 7.63s/it, loss=2.9707, acc=0.0498, iter_time=7.93s]
Epoch 0: 4%|▎ | 445/12384 [56:48<25:17:50, 7.63s/it, loss=2.9707, acc=0.0498, iter_time=7.93s]
Epoch 0: 4%|▎ | 445/12384 [56:56<25:17:50, 7.63s/it, loss=2.7525, acc=0.0550, iter_time=7.62s]
Epoch 0: 4%|▎ | 446/12384 [56:56<25:16:04, 7.62s/it, loss=2.7525, acc=0.0550, iter_time=7.62s]
Epoch 0: 4%|▎ | 446/12384 [57:04<25:16:04, 7.62s/it, loss=3.1286, acc=0.0480, iter_time=7.60s]
Epoch 0: 4%|▎ | 447/12384 [57:04<25:14:50, 7.61s/it, loss=3.1286, acc=0.0480, iter_time=7.60s]
Epoch 0: 4%|▎ | 447/12384 [57:11<25:14:50, 7.61s/it, loss=2.8419, acc=0.0528, iter_time=7.54s]
Epoch 0: 4%|▎ | 448/12384 [57:11<25:14:05, 7.61s/it, loss=2.8419, acc=0.0528, iter_time=7.54s]
Epoch 0: 4%|▎ | 448/12384 [57:19<25:14:05, 7.61s/it, loss=2.3611, acc=0.0641, iter_time=7.65s]
Epoch 0: 4%|▎ | 449/12384 [57:19<25:15:34, 7.62s/it, loss=2.3611, acc=0.0641, iter_time=7.65s]
Epoch 0: 4%|▎ | 449/12384 [57:26<25:15:34, 7.62s/it, loss=2.8634, acc=0.0636, iter_time=8.04s]
Epoch 0: 4%|▎ | 450/12384 [57:26<25:14:47, 7.62s/it, loss=2.8634, acc=0.0636, iter_time=8.04s]
Epoch 0: 4%|▎ | 450/12384 [57:34<25:14:47, 7.62s/it, loss=2.6805, acc=0.0543, iter_time=7.21s]
Epoch 0: 4%|▎ | 451/12384 [57:34<25:16:42, 7.63s/it, loss=2.6805, acc=0.0543, iter_time=7.21s]
Epoch 0: 4%|▎ | 451/12384 [57:42<25:16:42, 7.63s/it, loss=2.7589, acc=0.0638, iter_time=7.65s]
Epoch 0: 4%|▎ | 452/12384 [57:42<25:18:12, 7.63s/it, loss=2.7589, acc=0.0638, iter_time=7.65s]
Epoch 0: 4%|▎ | 452/12384 [57:49<25:18:12, 7.63s/it, loss=2.5675, acc=0.0499, iter_time=7.38s]
Epoch 0: 4%|▎ | 453/12384 [57:49<25:19:49, 7.64s/it, loss=2.5675, acc=0.0499, iter_time=7.38s]
Epoch 0: 4%|▎ | 453/12384 [57:57<25:19:49, 7.64s/it, loss=2.9277, acc=0.0398, iter_time=7.96s]
Epoch 0: 4%|▎ | 454/12384 [57:57<25:18:56, 7.64s/it, loss=2.9277, acc=0.0398, iter_time=7.96s]
Epoch 0: 4%|▎ | 454/12384 [58:05<25:18:56, 7.64s/it, loss=2.5893, acc=0.0614, iter_time=7.62s]
Epoch 0: 4%|▎ | 455/12384 [58:05<25:18:51, 7.64s/it, loss=2.5893, acc=0.0614, iter_time=7.62s]
Epoch 0: 4%|▎ | 455/12384 [58:13<25:18:51, 7.64s/it, loss=2.7613, acc=0.0720, iter_time=8.34s]
Epoch 0: 4%|▎ | 456/12384 [58:13<25:39:03, 7.74s/it, loss=2.7613, acc=0.0720, iter_time=8.34s]
Epoch 0: 4%|▎ | 456/12384 [58:20<25:39:03, 7.74s/it, loss=2.6479, acc=0.0560, iter_time=7.30s]
Epoch 0: 4%|▎ | 457/12384 [58:20<25:32:43, 7.71s/it, loss=2.6479, acc=0.0560, iter_time=7.30s]
Epoch 0: 4%|▎ | 457/12384 [58:28<25:32:43, 7.71s/it, loss=2.1886, acc=0.0814, iter_time=5.28s]
Epoch 0: 4%|▎ | 458/12384 [58:28<25:32:53, 7.71s/it, loss=2.1886, acc=0.0814, iter_time=5.28s]
Epoch 0: 4%|▎ | 458/12384 [58:36<25:32:53, 7.71s/it, loss=2.3791, acc=0.0607, iter_time=10.05s]
Epoch 0: 4%|▎ | 459/12384 [58:36<25:28:02, 7.69s/it, loss=2.3791, acc=0.0607, iter_time=10.05s]
Epoch 0: 4%|▎ | 459/12384 [58:43<25:28:02, 7.69s/it, loss=2.1744, acc=0.0658, iter_time=7.66s]
Epoch 0: 4%|▎ | 460/12384 [58:43<25:24:42, 7.67s/it, loss=2.1744, acc=0.0658, iter_time=7.66s]
Epoch 0: 4%|▎ | 460/12384 [58:51<25:24:42, 7.67s/it, loss=2.9240, acc=0.0432, iter_time=7.63s]
Epoch 0: 4%|▎ | 461/12384 [58:51<25:21:46, 7.66s/it, loss=2.9240, acc=0.0432, iter_time=7.63s]
Epoch 0: 4%|▎ | 461/12384 [58:58<25:21:46, 7.66s/it, loss=2.4064, acc=0.0642, iter_time=7.63s]
Epoch 0: 4%|▎ | 462/12384 [58:58<25:21:49, 7.66s/it, loss=2.4064, acc=0.0642, iter_time=7.63s]
Epoch 0: 4%|▎ | 462/12384 [59:06<25:21:49, 7.66s/it, loss=2.2047, acc=0.0689, iter_time=5.08s]
Epoch 0: 4%|▎ | 463/12384 [59:06<25:19:56, 7.65s/it, loss=2.2047, acc=0.0689, iter_time=5.08s]
Epoch 0: 4%|▎ | 463/12384 [59:14<25:19:56, 7.65s/it, loss=2.6974, acc=0.0564, iter_time=10.58s]
Epoch 0: 4%|▎ | 464/12384 [59:14<25:23:11, 7.67s/it, loss=2.6974, acc=0.0564, iter_time=10.58s]
Epoch 0: 4%|▎ | 464/12384 [59:21<25:23:11, 7.67s/it, loss=2.0215, acc=0.0805, iter_time=4.25s]
Epoch 0: 4%|▍ | 465/12384 [59:21<25:21:02, 7.66s/it, loss=2.0215, acc=0.0805, iter_time=4.25s]
Epoch 0: 4%|▍ | 465/12384 [59:29<25:21:02, 7.66s/it, loss=2.1350, acc=0.0804, iter_time=8.90s]
Epoch 0: 4%|▍ | 466/12384 [59:29<25:20:03, 7.65s/it, loss=2.1350, acc=0.0804, iter_time=8.90s]
Epoch 0: 4%|▍ | 466/12384 [59:37<25:20:03, 7.65s/it, loss=1.8644, acc=0.0877, iter_time=7.17s]
Epoch 0: 4%|▍ | 467/12384 [59:37<25:19:16, 7.65s/it, loss=1.8644, acc=0.0877, iter_time=7.17s]
Epoch 0: 4%|▍ | 467/12384 [59:44<25:19:16, 7.65s/it, loss=2.3691, acc=0.0603, iter_time=9.93s]
Epoch 0: 4%|▍ | 468/12384 [59:44<25:17:20, 7.64s/it, loss=2.3691, acc=0.0603, iter_time=9.93s]
Epoch 0: 4%|▍ | 468/12384 [59:52<25:17:20, 7.64s/it, loss=2.5097, acc=0.0765, iter_time=7.62s]
Epoch 0: 4%|▍ | 469/12384 [59:52<25:16:52, 7.64s/it, loss=2.5097, acc=0.0765, iter_time=7.62s]
Epoch 0: 4%|▍ | 469/12384 [1:00:00<25:16:52, 7.64s/it, loss=2.3412, acc=0.0614, iter_time=7.64s]
Epoch 0: 4%|▍ | 470/12384 [1:00:00<25:17:42, 7.64s/it, loss=2.3412, acc=0.0614, iter_time=7.64s]
Epoch 0: 4%|▍ | 470/12384 [1:00:07<25:17:42, 7.64s/it, loss=2.4188, acc=0.0616, iter_time=7.63s]
Epoch 0: 4%|▍ | 471/12384 [1:00:07<25:17:57, 7.65s/it, loss=2.4188, acc=0.0616, iter_time=7.63s]
Epoch 0: 4%|▍ | 471/12384 [1:00:15<25:17:57, 7.65s/it, loss=2.3378, acc=0.0728, iter_time=7.60s]
Epoch 0: 4%|▍ | 472/12384 [1:00:15<25:16:22, 7.64s/it, loss=2.3378, acc=0.0728, iter_time=7.60s]
Epoch 0: 4%|▍ | 472/12384 [1:00:23<25:16:22, 7.64s/it, loss=2.0764, acc=0.0804, iter_time=7.69s]
Epoch 0: 4%|▍ | 473/12384 [1:00:23<25:15:48, 7.64s/it, loss=2.0764, acc=0.0804, iter_time=7.69s]
Epoch 0: 4%|▍ | 473/12384 [1:00:30<25:15:48, 7.64s/it, loss=1.9360, acc=0.0943, iter_time=6.75s]
Epoch 0: 4%|▍ | 474/12384 [1:00:30<25:17:34, 7.65s/it, loss=1.9360, acc=0.0943, iter_time=6.75s]
Epoch 0: 4%|▍ | 474/12384 [1:00:38<25:17:34, 7.65s/it, loss=1.9062, acc=0.0851, iter_time=7.92s]
Epoch 0: 4%|▍ | 475/12384 [1:00:38<25:15:16, 7.63s/it, loss=1.9062, acc=0.0851, iter_time=7.92s]
Epoch 0: 4%|▍ | 475/12384 [1:00:45<25:15:16, 7.63s/it, loss=2.1786, acc=0.0661, iter_time=8.23s]
Epoch 0: 4%|▍ | 476/12384 [1:00:45<25:16:11, 7.64s/it, loss=2.1786, acc=0.0661, iter_time=8.23s]
Epoch 0: 4%|▍ | 476/12384 [1:00:53<25:16:11, 7.64s/it, loss=2.6808, acc=0.0632, iter_time=5.05s]
Epoch 0: 4%|▍ | 477/12384 [1:00:53<25:20:18, 7.66s/it, loss=2.6808, acc=0.0632, iter_time=5.05s]
Epoch 0: 4%|▍ | 477/12384 [1:01:01<25:20:18, 7.66s/it, loss=2.1899, acc=0.0762, iter_time=10.31s]
Epoch 0: 4%|▍ | 478/12384 [1:01:01<25:21:22, 7.67s/it, loss=2.1899, acc=0.0762, iter_time=10.31s]
Epoch 0: 4%|▍ | 478/12384 [1:01:08<25:21:22, 7.67s/it, loss=2.0382, acc=0.0792, iter_time=7.67s]
Epoch 0: 4%|▍ | 479/12384 [1:01:08<25:17:54, 7.65s/it, loss=2.0382, acc=0.0792, iter_time=7.67s]
Epoch 0: 4%|▍ | 479/12384 [1:01:16<25:17:54, 7.65s/it, loss=2.1239, acc=0.0640, iter_time=8.01s]
Epoch 0: 4%|▍ | 480/12384 [1:01:16<25:17:39, 7.65s/it, loss=2.1239, acc=0.0640, iter_time=8.01s]
Epoch 0: 4%|▍ | 480/12384 [1:01:24<25:17:39, 7.65s/it, loss=1.8730, acc=0.0906, iter_time=5.69s]
Epoch 0: 4%|▍ | 481/12384 [1:01:24<25:16:10, 7.64s/it, loss=1.8730, acc=0.0906, iter_time=5.69s]
Epoch 0: 4%|▍ | 481/12384 [1:01:32<25:16:10, 7.64s/it, loss=1.7140, acc=0.1096, iter_time=6.45s]
Epoch 0: 4%|▍ | 482/12384 [1:01:32<25:38:55, 7.76s/it, loss=1.7140, acc=0.1096, iter_time=6.45s]
Epoch 0: 4%|▍ | 482/12384 [1:01:39<25:38:55, 7.76s/it, loss=1.8818, acc=0.1072, iter_time=7.94s]
Epoch 0: 4%|▍ | 483/12384 [1:01:39<25:33:20, 7.73s/it, loss=1.8818, acc=0.1072, iter_time=7.94s]
Epoch 0: 4%|▍ | 483/12384 [1:01:47<25:33:20, 7.73s/it, loss=1.8504, acc=0.0905, iter_time=9.27s]
Epoch 0: 4%|▍ | 484/12384 [1:01:47<25:29:08, 7.71s/it, loss=1.8504, acc=0.0905, iter_time=9.27s]
Epoch 0: 4%|▍ | 484/12384 [1:01:55<25:29:08, 7.71s/it, loss=2.3645, acc=0.0783, iter_time=8.87s]
Epoch 0: 4%|▍ | 485/12384 [1:01:55<25:24:33, 7.69s/it, loss=2.3645, acc=0.0783, iter_time=8.87s]
Epoch 0: 4%|▍ | 485/12384 [1:02:02<25:24:33, 7.69s/it, loss=2.0253, acc=0.0711, iter_time=7.64s]
Epoch 0: 4%|▍ | 486/12384 [1:02:02<25:21:34, 7.67s/it, loss=2.0253, acc=0.0711, iter_time=7.64s]
Epoch 0: 4%|▍ | 486/12384 [1:02:10<25:21:34, 7.67s/it, loss=1.8402, acc=0.0922, iter_time=7.62s]
Epoch 0: 4%|▍ | 487/12384 [1:02:10<25:18:25, 7.66s/it, loss=1.8402, acc=0.0922, iter_time=7.62s]
Epoch 0: 4%|▍ | 487/12384 [1:02:18<25:18:25, 7.66s/it, loss=2.3611, acc=0.0677, iter_time=8.05s]
Epoch 0: 4%|▍ | 488/12384 [1:02:18<25:17:37, 7.65s/it, loss=2.3611, acc=0.0677, iter_time=8.05s]
Epoch 0: 4%|▍ | 488/12384 [1:02:25<25:17:37, 7.65s/it, loss=1.8946, acc=0.1047, iter_time=7.23s]
Epoch 0: 4%|▍ | 489/12384 [1:02:25<25:15:22, 7.64s/it, loss=1.8946, acc=0.1047, iter_time=7.23s]
Epoch 0: 4%|▍ | 489/12384 [1:02:33<25:15:22, 7.64s/it, loss=1.8590, acc=0.0874, iter_time=7.63s]
Epoch 0: 4%|▍ | 490/12384 [1:02:33<25:15:18, 7.64s/it, loss=1.8590, acc=0.0874, iter_time=7.63s]
Epoch 0: 4%|▍ | 490/12384 [1:02:41<25:15:18, 7.64s/it, loss=1.9773, acc=0.1019, iter_time=7.66s]
Epoch 0: 4%|▍ | 491/12384 [1:02:41<25:16:13, 7.65s/it, loss=1.9773, acc=0.1019, iter_time=7.66s]
Epoch 0: 4%|▍ | 491/12384 [1:02:48<25:16:13, 7.65s/it, loss=1.5691, acc=0.1026, iter_time=7.74s]
Epoch 0: 4%|▍ | 492/12384 [1:02:48<25:19:21, 7.67s/it, loss=1.5691, acc=0.1026, iter_time=7.74s]
Epoch 0: 4%|▍ | 492/12384 [1:02:56<25:19:21, 7.67s/it, loss=1.7926, acc=0.0978, iter_time=7.63s]
Epoch 0: 4%|▍ | 493/12384 [1:02:56<25:16:38, 7.65s/it, loss=1.7926, acc=0.0978, iter_time=7.63s]
Epoch 0: 4%|▍ | 493/12384 [1:03:04<25:16:38, 7.65s/it, loss=2.1797, acc=0.0721, iter_time=7.62s]
Epoch 0: 4%|▍ | 494/12384 [1:03:04<25:17:48, 7.66s/it, loss=2.1797, acc=0.0721, iter_time=7.62s]
Epoch 0: 4%|▍ | 494/12384 [1:03:11<25:17:48, 7.66s/it, loss=2.0808, acc=0.0790, iter_time=7.67s]
Epoch 0: 4%|▍ | 495/12384 [1:03:11<25:17:14, 7.66s/it, loss=2.0808, acc=0.0790, iter_time=7.67s]
Epoch 0: 4%|▍ | 495/12384 [1:03:19<25:17:14, 7.66s/it, loss=2.2031, acc=0.0782, iter_time=8.10s]
Epoch 0: 4%|▍ | 496/12384 [1:03:19<25:18:08, 7.66s/it, loss=2.2031, acc=0.0782, iter_time=8.10s]
Epoch 0: 4%|▍ | 496/12384 [1:03:27<25:18:08, 7.66s/it, loss=1.7503, acc=0.1270, iter_time=6.93s]
Epoch 0: 4%|▍ | 497/12384 [1:03:27<25:17:23, 7.66s/it, loss=1.7503, acc=0.1270, iter_time=6.93s]
Epoch 0: 4%|▍ | 497/12384 [1:03:34<25:17:23, 7.66s/it, loss=1.7370, acc=0.0869, iter_time=7.92s]
Epoch 0: 4%|▍ | 498/12384 [1:03:34<25:15:02, 7.65s/it, loss=1.7370, acc=0.0869, iter_time=7.92s]
Epoch 0: 4%|▍ | 498/12384 [1:03:42<25:15:02, 7.65s/it, loss=2.2853, acc=0.0846, iter_time=7.66s]
Epoch 0: 4%|▍ | 499/12384 [1:03:42<25:13:21, 7.64s/it, loss=2.2853, acc=0.0846, iter_time=7.66s]
Epoch 0: 4%|▍ | 499/12384 [1:03:49<25:13:21, 7.64s/it, loss=1.5637, acc=0.0990, iter_time=8.00s]
Epoch 0: 4%|▍ | 500/12384 [1:03:50<25:25:18, 7.70s/it, loss=1.5637, acc=0.0990, iter_time=8.00s]
Epoch 0: 4%|▍ | 500/12384 [1:03:57<25:25:18, 7.70s/it, loss=1.9870, acc=0.0964, iter_time=7.46s]
Epoch 0: 4%|▍ | 501/12384 [1:03:57<25:20:35, 7.68s/it, loss=1.9870, acc=0.0964, iter_time=7.46s]
Epoch 0: 4%|▍ | 501/12384 [1:04:05<25:20:35, 7.68s/it, loss=1.5320, acc=0.1148, iter_time=6.78s]
Epoch 0: 4%|▍ | 502/12384 [1:04:05<25:19:51, 7.67s/it, loss=1.5320, acc=0.1148, iter_time=6.78s]
Epoch 0: 4%|▍ | 502/12384 [1:04:13<25:19:51, 7.67s/it, loss=1.6261, acc=0.0951, iter_time=7.55s]
Epoch 0: 4%|▍ | 503/12384 [1:04:13<25:17:47, 7.66s/it, loss=1.6261, acc=0.0951, iter_time=7.55s]
Epoch 0: 4%|▍ | 503/12384 [1:04:20<25:17:47, 7.66s/it, loss=1.4938, acc=0.1099, iter_time=8.54s]
Epoch 0: 4%|▍ | 504/12384 [1:04:20<25:14:29, 7.65s/it, loss=1.4938, acc=0.1099, iter_time=8.54s]
Epoch 0: 4%|▍ | 504/12384 [1:04:28<25:14:29, 7.65s/it, loss=1.7771, acc=0.1023, iter_time=7.67s]
Epoch 0: 4%|▍ | 505/12384 [1:04:28<25:12:02, 7.64s/it, loss=1.7771, acc=0.1023, iter_time=7.67s]
Epoch 0: 4%|▍ | 505/12384 [1:04:35<25:12:02, 7.64s/it, loss=1.6810, acc=0.1148, iter_time=7.60s]
Epoch 0: 4%|▍ | 506/12384 [1:04:35<25:10:43, 7.63s/it, loss=1.6810, acc=0.1148, iter_time=7.60s]
Epoch 0: 4%|▍ | 506/12384 [1:04:43<25:10:43, 7.63s/it, loss=1.5150, acc=0.1185, iter_time=7.63s]
Epoch 0: 4%|▍ | 507/12384 [1:04:43<25:12:23, 7.64s/it, loss=1.5150, acc=0.1185, iter_time=7.63s]
Epoch 0: 4%|▍ | 507/12384 [1:04:51<25:12:23, 7.64s/it, loss=1.5239, acc=0.1060, iter_time=7.66s]
Epoch 0: 4%|▍ | 508/12384 [1:04:51<25:10:50, 7.63s/it, loss=1.5239, acc=0.1060, iter_time=7.66s]
Epoch 0: 4%|▍ | 508/12384 [1:04:59<25:10:50, 7.63s/it, loss=1.5047, acc=0.1262, iter_time=7.95s]
Epoch 0: 4%|▍ | 509/12384 [1:04:59<25:30:52, 7.73s/it, loss=1.5047, acc=0.1262, iter_time=7.95s]
Epoch 0: 4%|▍ | 509/12384 [1:05:06<25:30:52, 7.73s/it, loss=1.8039, acc=0.1183, iter_time=7.66s]
Epoch 0: 4%|▍ | 510/12384 [1:05:06<25:24:40, 7.70s/it, loss=1.8039, acc=0.1183, iter_time=7.66s]
Epoch 0: 4%|▍ | 510/12384 [1:05:14<25:24:40, 7.70s/it, loss=1.6836, acc=0.1040, iter_time=7.60s]
Epoch 0: 4%|▍ | 511/12384 [1:05:14<25:18:24, 7.67s/it, loss=1.6836, acc=0.1040, iter_time=7.60s]
Epoch 0: 4%|▍ | 511/12384 [1:05:22<25:18:24, 7.67s/it, loss=1.4030, acc=0.1384, iter_time=7.70s]
Epoch 0: 4%|▍ | 512/12384 [1:05:22<25:20:09, 7.68s/it, loss=1.4030, acc=0.1384, iter_time=7.70s]
Epoch 0: 4%|▍ | 512/12384 [1:05:29<25:20:09, 7.68s/it, loss=1.4032, acc=0.1294, iter_time=7.60s]
Epoch 0: 4%|▍ | 513/12384 [1:05:29<25:16:35, 7.67s/it, loss=1.4032, acc=0.1294, iter_time=7.60s]
Epoch 0: 4%|▍ | 513/12384 [1:05:37<25:16:35, 7.67s/it, loss=1.3707, acc=0.1583, iter_time=7.66s]
Epoch 0: 4%|▍ | 514/12384 [1:05:37<25:16:22, 7.66s/it, loss=1.3707, acc=0.1583, iter_time=7.66s]
Epoch 0: 4%|▍ | 514/12384 [1:05:45<25:16:22, 7.66s/it, loss=1.1802, acc=0.1476, iter_time=7.70s]
Epoch 0: 4%|▍ | 515/12384 [1:05:45<25:17:33, 7.67s/it, loss=1.1802, acc=0.1476, iter_time=7.70s]
Epoch 0: 4%|▍ | 515/12384 [1:05:52<25:17:33, 7.67s/it, loss=1.4299, acc=0.1386, iter_time=5.39s]
Epoch 0: 4%|▍ | 516/12384 [1:05:52<25:16:08, 7.67s/it, loss=1.4299, acc=0.1386, iter_time=5.39s]
Epoch 0: 4%|▍ | 516/12384 [1:06:00<25:16:08, 7.67s/it, loss=1.4811, acc=0.1189, iter_time=7.71s]
Epoch 0: 4%|▍ | 517/12384 [1:06:00<25:21:03, 7.69s/it, loss=1.4811, acc=0.1189, iter_time=7.71s]
Epoch 0: 4%|▍ | 517/12384 [1:06:08<25:21:03, 7.69s/it, loss=1.3481, acc=0.1673, iter_time=7.67s]
Epoch 0: 4%|▍ | 518/12384 [1:06:08<25:17:24, 7.67s/it, loss=1.3481, acc=0.1673, iter_time=7.67s]
Epoch 0: 4%|▍ | 518/12384 [1:06:15<25:17:24, 7.67s/it, loss=1.5646, acc=0.1122, iter_time=9.89s]
Epoch 0: 4%|▍ | 519/12384 [1:06:15<25:16:26, 7.67s/it, loss=1.5646, acc=0.1122, iter_time=9.89s]
Epoch 0: 4%|▍ | 519/12384 [1:06:23<25:16:26, 7.67s/it, loss=1.2987, acc=0.1386, iter_time=8.08s]
Epoch 0: 4%|▍ | 520/12384 [1:06:23<25:15:20, 7.66s/it, loss=1.2987, acc=0.1386, iter_time=8.08s]
Epoch 0: 4%|▍ | 520/12384 [1:06:31<25:15:20, 7.66s/it, loss=1.3657, acc=0.1161, iter_time=6.35s]
Epoch 0: 4%|▍ | 521/12384 [1:06:31<25:15:28, 7.66s/it, loss=1.3657, acc=0.1161, iter_time=6.35s]
Epoch 0: 4%|▍ | 521/12384 [1:06:38<25:15:28, 7.66s/it, loss=1.2062, acc=0.1535, iter_time=8.55s]
Epoch 0: 4%|▍ | 522/12384 [1:06:38<25:13:49, 7.66s/it, loss=1.2062, acc=0.1535, iter_time=8.55s]
Epoch 0: 4%|▍ | 522/12384 [1:06:46<25:13:49, 7.66s/it, loss=1.2758, acc=0.1454, iter_time=7.65s]
Epoch 0: 4%|▍ | 523/12384 [1:06:46<25:12:01, 7.65s/it, loss=1.2758, acc=0.1454, iter_time=7.65s]
Epoch 0: 4%|▍ | 523/12384 [1:06:53<25:12:01, 7.65s/it, loss=1.2117, acc=0.1257, iter_time=5.83s]
Epoch 0: 4%|▍ | 524/12384 [1:06:53<25:11:32, 7.65s/it, loss=1.2117, acc=0.1257, iter_time=5.83s]
Epoch 0: 4%|▍ | 524/12384 [1:07:01<25:11:32, 7.65s/it, loss=1.4545, acc=0.1447, iter_time=8.59s]
Epoch 0: 4%|▍ | 525/12384 [1:07:01<25:16:09, 7.67s/it, loss=1.4545, acc=0.1447, iter_time=8.59s]
Epoch 0: 4%|▍ | 525/12384 [1:07:09<25:16:09, 7.67s/it, loss=1.0486, acc=0.1929, iter_time=7.63s]
Epoch 0: 4%|▍ | 526/12384 [1:07:09<25:14:50, 7.66s/it, loss=1.0486, acc=0.1929, iter_time=7.63s]
Epoch 0: 4%|▍ | 526/12384 [1:07:16<25:14:50, 7.66s/it, loss=1.2718, acc=0.1351, iter_time=8.60s]
Epoch 0: 4%|▍ | 527/12384 [1:07:16<25:12:15, 7.65s/it, loss=1.2718, acc=0.1351, iter_time=8.60s]
Epoch 0: 4%|▍ | 527/12384 [1:07:24<25:12:15, 7.65s/it, loss=1.2497, acc=0.1386, iter_time=8.01s]
Epoch 0: 4%|▍ | 528/12384 [1:07:24<25:11:41, 7.65s/it, loss=1.2497, acc=0.1386, iter_time=8.01s]
Epoch 0: 4%|▍ | 528/12384 [1:07:32<25:11:41, 7.65s/it, loss=1.0450, acc=0.2315, iter_time=5.73s]
Epoch 0: 4%|▍ | 529/12384 [1:07:32<25:11:20, 7.65s/it, loss=1.0450, acc=0.2315, iter_time=5.73s]
Epoch 0: 4%|▍ | 529/12384 [1:07:39<25:11:20, 7.65s/it, loss=1.1168, acc=0.1592, iter_time=8.55s]
Epoch 0: 4%|▍ | 530/12384 [1:07:39<25:10:04, 7.64s/it, loss=1.1168, acc=0.1592, iter_time=8.55s]
Epoch 0: 4%|▍ | 530/12384 [1:07:47<25:10:04, 7.64s/it, loss=1.1135, acc=0.1942, iter_time=7.33s]
Epoch 0: 4%|▍ | 531/12384 [1:07:47<25:10:01, 7.64s/it, loss=1.1135, acc=0.1942, iter_time=7.33s]
Epoch 0: 4%|▍ | 531/12384 [1:07:55<25:10:01, 7.64s/it, loss=1.1992, acc=0.1433, iter_time=8.58s]
Epoch 0: 4%|▍ | 532/12384 [1:07:55<25:13:53, 7.66s/it, loss=1.1992, acc=0.1433, iter_time=8.58s]
Epoch 0: 4%|▍ | 532/12384 [1:08:02<25:13:53, 7.66s/it, loss=1.0983, acc=0.1781, iter_time=6.61s]
Epoch 0: 4%|▍ | 533/12384 [1:08:02<25:11:17, 7.65s/it, loss=1.0983, acc=0.1781, iter_time=6.61s]
Epoch 0: 4%|▍ | 533/12384 [1:08:10<25:11:17, 7.65s/it, loss=1.1803, acc=0.1655, iter_time=8.71s]
Epoch 0: 4%|▍ | 534/12384 [1:08:10<25:11:47, 7.65s/it, loss=1.1803, acc=0.1655, iter_time=8.71s]
Epoch 0: 4%|▍ | 534/12384 [1:08:18<25:11:47, 7.65s/it, loss=1.3010, acc=0.1560, iter_time=7.15s]
Epoch 0: 4%|▍ | 535/12384 [1:08:18<25:30:05, 7.75s/it, loss=1.3010, acc=0.1560, iter_time=7.15s]
Epoch 0: 4%|▍ | 535/12384 [1:08:26<25:30:05, 7.75s/it, loss=1.3130, acc=0.1668, iter_time=8.47s]
Epoch 0: 4%|▍ | 536/12384 [1:08:26<25:24:29, 7.72s/it, loss=1.3130, acc=0.1668, iter_time=8.47s]
Epoch 0: 4%|▍ | 536/12384 [1:08:33<25:24:29, 7.72s/it, loss=1.0739, acc=0.1849, iter_time=7.67s]
Epoch 0: 4%|▍ | 537/12384 [1:08:33<25:18:47, 7.69s/it, loss=1.0739, acc=0.1849, iter_time=7.67s]
Epoch 0: 4%|▍ | 537/12384 [1:08:41<25:18:47, 7.69s/it, loss=0.9642, acc=0.2393, iter_time=7.07s]
Epoch 0: 4%|▍ | 538/12384 [1:08:41<25:17:07, 7.68s/it, loss=0.9642, acc=0.2393, iter_time=7.07s]
Epoch 0: 4%|▍ | 538/12384 [1:08:49<25:17:07, 7.68s/it, loss=1.1014, acc=0.1750, iter_time=8.22s]
Epoch 0: 4%|▍ | 539/12384 [1:08:49<25:14:01, 7.67s/it, loss=1.1014, acc=0.1750, iter_time=8.22s]
Epoch 0: 4%|▍ | 539/12384 [1:08:56<25:14:01, 7.67s/it, loss=1.0269, acc=0.1964, iter_time=7.65s]
Epoch 0: 4%|▍ | 540/12384 [1:08:56<25:13:27, 7.67s/it, loss=1.0269, acc=0.1964, iter_time=7.65s]
Epoch 0: 4%|▍ | 540/12384 [1:09:04<25:13:27, 7.67s/it, loss=1.0619, acc=0.2396, iter_time=5.85s]
Epoch 0: 4%|▍ | 541/12384 [1:09:04<25:16:54, 7.69s/it, loss=1.0619, acc=0.2396, iter_time=5.85s]
Epoch 0: 4%|▍ | 541/12384 [1:09:12<25:16:54, 7.69s/it, loss=1.0353, acc=0.2250, iter_time=9.52s]
Epoch 0: 4%|▍ | 542/12384 [1:09:12<25:14:13, 7.67s/it, loss=1.0353, acc=0.2250, iter_time=9.52s]
Epoch 0: 4%|▍ | 542/12384 [1:09:19<25:14:13, 7.67s/it, loss=1.2098, acc=0.1728, iter_time=7.64s]
Epoch 0: 4%|▍ | 543/12384 [1:09:19<25:11:36, 7.66s/it, loss=1.2098, acc=0.1728, iter_time=7.64s]
Epoch 0: 4%|▍ | 543/12384 [1:09:27<25:11:36, 7.66s/it, loss=1.0547, acc=0.1759, iter_time=8.02s]
Epoch 0: 4%|▍ | 544/12384 [1:09:27<25:09:47, 7.65s/it, loss=1.0547, acc=0.1759, iter_time=8.02s]
Epoch 0: 4%|▍ | 544/12384 [1:09:35<25:09:47, 7.65s/it, loss=0.9190, acc=0.2185, iter_time=3.87s]
Epoch 0: 4%|▍ | 545/12384 [1:09:35<25:09:37, 7.65s/it, loss=0.9190, acc=0.2185, iter_time=3.87s]
Epoch 0: 4%|▍ | 545/12384 [1:09:42<25:09:37, 7.65s/it, loss=1.3871, acc=0.1515, iter_time=11.01s]
Epoch 0: 4%|▍ | 546/12384 [1:09:42<25:07:06, 7.64s/it, loss=1.3871, acc=0.1515, iter_time=11.01s]
Epoch 0: 4%|▍ | 546/12384 [1:09:50<25:07:06, 7.64s/it, loss=0.8361, acc=0.2270, iter_time=7.65s]
Epoch 0: 4%|▍ | 547/12384 [1:09:50<25:06:51, 7.64s/it, loss=0.8361, acc=0.2270, iter_time=7.65s]
Epoch 0: 4%|▍ | 547/12384 [1:09:57<25:06:51, 7.64s/it, loss=1.1352, acc=0.1755, iter_time=7.30s]
Epoch 0: 4%|▍ | 548/12384 [1:09:57<25:07:55, 7.64s/it, loss=1.1352, acc=0.1755, iter_time=7.30s]
Epoch 0: 4%|▍ | 548/12384 [1:10:05<25:07:55, 7.64s/it, loss=1.0154, acc=0.2016, iter_time=7.96s]
Epoch 0: 4%|▍ | 549/12384 [1:10:05<25:05:44, 7.63s/it, loss=1.0154, acc=0.2016, iter_time=7.96s]
Epoch 0: 4%|▍ | 549/12384 [1:10:13<25:05:44, 7.63s/it, loss=1.0715, acc=0.2152, iter_time=8.04s]
Epoch 0: 4%|▍ | 550/12384 [1:10:13<25:06:09, 7.64s/it, loss=1.0715, acc=0.2152, iter_time=8.04s]
Epoch 0: 4%|▍ | 550/12384 [1:10:20<25:06:09, 7.64s/it, loss=0.9247, acc=0.2230, iter_time=5.12s]
Epoch 0: 4%|▍ | 551/12384 [1:10:20<25:05:22, 7.63s/it, loss=0.9247, acc=0.2230, iter_time=5.12s]
Epoch 0: 4%|▍ | 551/12384 [1:10:28<25:05:22, 7.63s/it, loss=0.9215, acc=0.2149, iter_time=10.11s]
Epoch 0: 4%|▍ | 552/12384 [1:10:28<25:04:53, 7.63s/it, loss=0.9215, acc=0.2149, iter_time=10.11s]
Epoch 0: 4%|▍ | 552/12384 [1:10:36<25:04:53, 7.63s/it, loss=0.8211, acc=0.2492, iter_time=7.23s]
Epoch 0: 4%|▍ | 553/12384 [1:10:36<25:04:05, 7.63s/it, loss=0.8211, acc=0.2492, iter_time=7.23s]
Epoch 0: 4%|▍ | 553/12384 [1:10:43<25:04:05, 7.63s/it, loss=1.0839, acc=0.2324, iter_time=7.66s]
Epoch 0: 4%|▍ | 554/12384 [1:10:43<25:04:50, 7.63s/it, loss=1.0839, acc=0.2324, iter_time=7.66s]
Epoch 0: 4%|▍ | 554/12384 [1:10:51<25:04:50, 7.63s/it, loss=0.9729, acc=0.2124, iter_time=7.31s]
Epoch 0: 4%|▍ | 555/12384 [1:10:51<25:03:22, 7.63s/it, loss=0.9729, acc=0.2124, iter_time=7.31s]
Epoch 0: 4%|▍ | 555/12384 [1:10:58<25:03:22, 7.63s/it, loss=0.7429, acc=0.2806, iter_time=5.57s]
Epoch 0: 4%|▍ | 556/12384 [1:10:58<25:03:14, 7.63s/it, loss=0.7429, acc=0.2806, iter_time=5.57s]
Epoch 0: 4%|▍ | 556/12384 [1:11:06<25:03:14, 7.63s/it, loss=0.9001, acc=0.2481, iter_time=9.97s]
Epoch 0: 4%|▍ | 557/12384 [1:11:06<25:03:57, 7.63s/it, loss=0.9001, acc=0.2481, iter_time=9.97s]
Epoch 0: 4%|▍ | 557/12384 [1:11:14<25:03:57, 7.63s/it, loss=0.8742, acc=0.2299, iter_time=7.64s]
Epoch 0: 5%|▍ | 558/12384 [1:11:14<25:04:17, 7.63s/it, loss=0.8742, acc=0.2299, iter_time=7.64s]
Epoch 0: 5%|▍ | 558/12384 [1:11:21<25:04:17, 7.63s/it, loss=0.8940, acc=0.2662, iter_time=7.63s]
Epoch 0: 5%|▍ | 559/12384 [1:11:21<25:04:39, 7.63s/it, loss=0.8940, acc=0.2662, iter_time=7.63s]
Epoch 0: 5%|▍ | 559/12384 [1:11:29<25:04:39, 7.63s/it, loss=0.7924, acc=0.2755, iter_time=7.65s]
Epoch 0: 5%|▍ | 560/12384 [1:11:29<25:07:08, 7.65s/it, loss=0.7924, acc=0.2755, iter_time=7.65s]
Epoch 0: 5%|▍ | 560/12384 [1:11:37<25:07:08, 7.65s/it, loss=0.7921, acc=0.3057, iter_time=7.98s]
Epoch 0: 5%|▍ | 561/12384 [1:11:37<25:26:43, 7.75s/it, loss=0.7921, acc=0.3057, iter_time=7.98s]
Epoch 0: 5%|▍ | 561/12384 [1:11:45<25:26:43, 7.75s/it, loss=0.6653, acc=0.3116, iter_time=7.69s]
Epoch 0: 5%|▍ | 562/12384 [1:11:45<25:20:26, 7.72s/it, loss=0.6653, acc=0.3116, iter_time=7.69s]
Epoch 0: 5%|▍ | 562/12384 [1:11:52<25:20:26, 7.72s/it, loss=0.7885, acc=0.2770, iter_time=7.10s]
Epoch 0: 5%|▍ | 563/12384 [1:11:52<25:16:42, 7.70s/it, loss=0.7885, acc=0.2770, iter_time=7.10s]
Epoch 0: 5%|▍ | 563/12384 [1:12:00<25:16:42, 7.70s/it, loss=0.6566, acc=0.3586, iter_time=6.40s]
Epoch 0: 5%|▍ | 564/12384 [1:12:00<25:14:28, 7.69s/it, loss=0.6566, acc=0.3586, iter_time=6.40s]
Epoch 0: 5%|▍ | 564/12384 [1:12:08<25:14:28, 7.69s/it, loss=0.6048, acc=0.3385, iter_time=7.36s]
Epoch 0: 5%|▍ | 565/12384 [1:12:08<25:10:16, 7.67s/it, loss=0.6048, acc=0.3385, iter_time=7.36s]
Epoch 0: 5%|▍ | 565/12384 [1:12:15<25:10:16, 7.67s/it, loss=0.7702, acc=0.2858, iter_time=9.73s]
Epoch 0: 5%|▍ | 566/12384 [1:12:15<25:08:33, 7.66s/it, loss=0.7702, acc=0.2858, iter_time=9.73s]
Epoch 0: 5%|▍ | 566/12384 [1:12:23<25:08:33, 7.66s/it, loss=0.6689, acc=0.3683, iter_time=3.88s]
Epoch 0: 5%|▍ | 567/12384 [1:12:23<25:07:46, 7.66s/it, loss=0.6689, acc=0.3683, iter_time=3.88s]
Epoch 0: 5%|▍ | 567/12384 [1:12:31<25:07:46, 7.66s/it, loss=0.8656, acc=0.2532, iter_time=11.79s]
Epoch 0: 5%|▍ | 568/12384 [1:12:31<25:07:39, 7.66s/it, loss=0.8656, acc=0.2532, iter_time=11.79s]
Epoch 0: 5%|▍ | 568/12384 [1:12:38<25:07:39, 7.66s/it, loss=0.5556, acc=0.4360, iter_time=5.19s]
Epoch 0: 5%|▍ | 569/12384 [1:12:38<25:10:33, 7.67s/it, loss=0.5556, acc=0.4360, iter_time=5.19s]
Epoch 0: 5%|▍ | 569/12384 [1:12:46<25:10:33, 7.67s/it, loss=0.6650, acc=0.3469, iter_time=9.78s]
Epoch 0: 5%|▍ | 570/12384 [1:12:46<25:06:09, 7.65s/it, loss=0.6650, acc=0.3469, iter_time=9.78s]
Epoch 0: 5%|▍ | 570/12384 [1:12:53<25:06:09, 7.65s/it, loss=0.6787, acc=0.3174, iter_time=7.60s]
Epoch 0: 5%|▍ | 571/12384 [1:12:53<25:02:46, 7.63s/it, loss=0.6787, acc=0.3174, iter_time=7.60s]
Epoch 0: 5%|▍ | 571/12384 [1:13:01<25:02:46, 7.63s/it, loss=0.6823, acc=0.3189, iter_time=6.18s]
Epoch 0: 5%|▍ | 572/12384 [1:13:01<25:02:20, 7.63s/it, loss=0.6823, acc=0.3189, iter_time=6.18s]
Epoch 0: 5%|▍ | 572/12384 [1:13:09<25:02:20, 7.63s/it, loss=0.6189, acc=0.3393, iter_time=9.04s]
Epoch 0: 5%|▍ | 573/12384 [1:13:09<25:00:04, 7.62s/it, loss=0.6189, acc=0.3393, iter_time=9.04s]
Epoch 0: 5%|▍ | 573/12384 [1:13:16<25:00:04, 7.62s/it, loss=0.6919, acc=0.3102, iter_time=7.62s]
Epoch 0: 5%|▍ | 574/12384 [1:13:16<25:01:22, 7.63s/it, loss=0.6919, acc=0.3102, iter_time=7.62s]
Epoch 0: 5%|▍ | 574/12384 [1:13:24<25:01:22, 7.63s/it, loss=0.6962, acc=0.2823, iter_time=7.64s]
Epoch 0: 5%|▍ | 575/12384 [1:13:24<25:01:18, 7.63s/it, loss=0.6962, acc=0.2823, iter_time=7.64s]
Epoch 0: 5%|▍ | 575/12384 [1:13:32<25:01:18, 7.63s/it, loss=0.7182, acc=0.2974, iter_time=8.01s]
Epoch 0: 5%|▍ | 576/12384 [1:13:32<24:59:54, 7.62s/it, loss=0.7182, acc=0.2974, iter_time=8.01s]
Epoch 0: 5%|▍ | 576/12384 [1:13:39<24:59:54, 7.62s/it, loss=0.7195, acc=0.3184, iter_time=6.00s]
Epoch 0: 5%|▍ | 577/12384 [1:13:39<25:01:44, 7.63s/it, loss=0.7195, acc=0.3184, iter_time=6.00s]
Epoch 0: 5%|▍ | 577/12384 [1:13:47<25:01:44, 7.63s/it, loss=0.5484, acc=0.3960, iter_time=5.53s]
Epoch 0: 5%|▍ | 578/12384 [1:13:47<25:00:46, 7.63s/it, loss=0.5484, acc=0.3960, iter_time=5.53s]
Epoch 0: 5%|▍ | 578/12384 [1:13:55<25:00:46, 7.63s/it, loss=0.5956, acc=0.4156, iter_time=8.19s]
Epoch 0: 5%|▍ | 579/12384 [1:13:55<25:04:22, 7.65s/it, loss=0.5956, acc=0.4156, iter_time=8.19s]
Epoch 0: 5%|▍ | 579/12384 [1:14:02<25:04:22, 7.65s/it, loss=0.5682, acc=0.3444, iter_time=10.49s]
Epoch 0: 5%|▍ | 580/12384 [1:14:02<25:02:46, 7.64s/it, loss=0.5682, acc=0.3444, iter_time=10.49s]
Epoch 0: 5%|▍ | 580/12384 [1:14:10<25:02:46, 7.64s/it, loss=0.5496, acc=0.4052, iter_time=7.59s]
Epoch 0: 5%|▍ | 581/12384 [1:14:10<25:00:41, 7.63s/it, loss=0.5496, acc=0.4052, iter_time=7.59s]
Epoch 0: 5%|▍ | 581/12384 [1:14:17<25:00:41, 7.63s/it, loss=0.6160, acc=0.3355, iter_time=7.62s]
Epoch 0: 5%|▍ | 582/12384 [1:14:17<25:02:43, 7.64s/it, loss=0.6160, acc=0.3355, iter_time=7.62s]
Epoch 0: 5%|▍ | 582/12384 [1:14:25<25:02:43, 7.64s/it, loss=0.7119, acc=0.3244, iter_time=7.65s]
Epoch 0: 5%|▍ | 583/12384 [1:14:25<25:02:10, 7.64s/it, loss=0.7119, acc=0.3244, iter_time=7.65s]
Epoch 0: 5%|▍ | 583/12384 [1:14:33<25:02:10, 7.64s/it, loss=0.6709, acc=0.3242, iter_time=8.04s]
Epoch 0: 5%|▍ | 584/12384 [1:14:33<25:02:46, 7.64s/it, loss=0.6709, acc=0.3242, iter_time=8.04s]
Epoch 0: 5%|▍ | 584/12384 [1:14:40<25:02:46, 7.64s/it, loss=0.6783, acc=0.3475, iter_time=6.95s]
Epoch 0: 5%|▍ | 585/12384 [1:14:40<25:03:34, 7.65s/it, loss=0.6783, acc=0.3475, iter_time=6.95s]
Epoch 0: 5%|▍ | 585/12384 [1:14:48<25:03:34, 7.65s/it, loss=0.5960, acc=0.4014, iter_time=7.95s]
Epoch 0: 5%|▍ | 586/12384 [1:14:48<25:00:06, 7.63s/it, loss=0.5960, acc=0.4014, iter_time=7.95s]
Epoch 0: 5%|▍ | 586/12384 [1:14:56<25:00:06, 7.63s/it, loss=0.3958, acc=0.5014, iter_time=5.40s]
Epoch 0: 5%|▍ | 587/12384 [1:14:56<25:19:14, 7.73s/it, loss=0.3958, acc=0.5014, iter_time=5.40s]
Epoch 0: 5%|▍ | 587/12384 [1:15:04<25:19:14, 7.73s/it, loss=0.5950, acc=0.3516, iter_time=10.16s]
Epoch 0: 5%|▍ | 588/12384 [1:15:04<25:13:55, 7.70s/it, loss=0.5950, acc=0.3516, iter_time=10.16s]
Epoch 0: 5%|▍ | 588/12384 [1:15:11<25:13:55, 7.70s/it, loss=0.4965, acc=0.4395, iter_time=7.63s]
Epoch 0: 5%|▍ | 589/12384 [1:15:11<25:09:42, 7.68s/it, loss=0.4965, acc=0.4395, iter_time=7.63s]
Epoch 0: 5%|▍ | 589/12384 [1:15:19<25:09:42, 7.68s/it, loss=0.5482, acc=0.4071, iter_time=7.35s]
Epoch 0: 5%|▍ | 590/12384 [1:15:19<25:07:35, 7.67s/it, loss=0.5482, acc=0.4071, iter_time=7.35s]
Epoch 0: 5%|▍ | 590/12384 [1:15:26<25:07:35, 7.67s/it, loss=0.5106, acc=0.4397, iter_time=7.93s]
Epoch 0: 5%|▍ | 591/12384 [1:15:26<25:04:16, 7.65s/it, loss=0.5106, acc=0.4397, iter_time=7.93s]
Epoch 0: 5%|▍ | 591/12384 [1:15:34<25:04:16, 7.65s/it, loss=0.5197, acc=0.4329, iter_time=7.61s]
Epoch 0: 5%|▍ | 592/12384 [1:15:34<25:04:07, 7.65s/it, loss=0.5197, acc=0.4329, iter_time=7.61s]
Epoch 0: 5%|▍ | 592/12384 [1:15:42<25:04:07, 7.65s/it, loss=0.4506, acc=0.4788, iter_time=5.93s]
Epoch 0: 5%|▍ | 593/12384 [1:15:42<25:03:26, 7.65s/it, loss=0.4506, acc=0.4788, iter_time=5.93s]
Epoch 0: 5%|▍ | 593/12384 [1:15:49<25:03:26, 7.65s/it, loss=0.4671, acc=0.4699, iter_time=6.23s]
Epoch 0: 5%|▍ | 594/12384 [1:15:49<25:03:28, 7.65s/it, loss=0.4671, acc=0.4699, iter_time=6.23s]
Epoch 0: 5%|▍ | 594/12384 [1:15:57<25:03:28, 7.65s/it, loss=0.3762, acc=0.4901, iter_time=9.68s]
Epoch 0: 5%|▍ | 595/12384 [1:15:57<25:02:26, 7.65s/it, loss=0.3762, acc=0.4901, iter_time=9.68s]
Epoch 0: 5%|▍ | 595/12384 [1:16:05<25:02:26, 7.65s/it, loss=0.6318, acc=0.4473, iter_time=8.77s]
Epoch 0: 5%|▍ | 596/12384 [1:16:05<25:02:30, 7.65s/it, loss=0.6318, acc=0.4473, iter_time=8.77s]
Epoch 0: 5%|▍ | 596/12384 [1:16:12<25:02:30, 7.65s/it, loss=0.4220, acc=0.5015, iter_time=7.72s]
Epoch 0: 5%|▍ | 597/12384 [1:16:12<25:05:04, 7.66s/it, loss=0.4220, acc=0.5015, iter_time=7.72s]
Epoch 0: 5%|▍ | 597/12384 [1:16:20<25:05:04, 7.66s/it, loss=0.4720, acc=0.4488, iter_time=7.02s]
Epoch 0: 5%|▍ | 598/12384 [1:16:20<25:02:10, 7.65s/it, loss=0.4720, acc=0.4488, iter_time=7.02s]
Epoch 0: 5%|▍ | 598/12384 [1:16:28<25:02:10, 7.65s/it, loss=0.4471, acc=0.4765, iter_time=8.24s]
Epoch 0: 5%|▍ | 599/12384 [1:16:28<25:02:04, 7.65s/it, loss=0.4471, acc=0.4765, iter_time=8.24s]
Epoch 0: 5%|▍ | 599/12384 [1:16:35<25:02:04, 7.65s/it, loss=0.4545, acc=0.4907, iter_time=8.04s]
Epoch 0: 5%|▍ | 600/12384 [1:16:35<25:01:31, 7.65s/it, loss=0.4545, acc=0.4907, iter_time=8.04s]
Epoch 0: 5%|▍ | 600/12384 [1:16:43<25:01:31, 7.65s/it, loss=0.3590, acc=0.5658, iter_time=7.21s]
Epoch 0: 5%|▍ | 601/12384 [1:16:43<24:58:57, 7.63s/it, loss=0.3590, acc=0.5658, iter_time=7.21s]
Epoch 0: 5%|▍ | 601/12384 [1:16:51<24:58:57, 7.63s/it, loss=0.3608, acc=0.5635, iter_time=4.77s]
Epoch 0: 5%|▍ | 602/12384 [1:16:51<24:59:41, 7.64s/it, loss=0.3608, acc=0.5635, iter_time=4.77s]
Epoch 0: 5%|▍ | 602/12384 [1:16:58<24:59:41, 7.64s/it, loss=0.4167, acc=0.4805, iter_time=10.47s]
Epoch 0: 5%|▍ | 603/12384 [1:16:58<24:59:09, 7.64s/it, loss=0.4167, acc=0.4805, iter_time=10.47s]
Epoch 0: 5%|▍ | 603/12384 [1:17:06<24:59:09, 7.64s/it, loss=0.3339, acc=0.5512, iter_time=7.66s]
Epoch 0: 5%|▍ | 604/12384 [1:17:06<25:00:31, 7.64s/it, loss=0.3339, acc=0.5512, iter_time=7.66s]
Epoch 0: 5%|▍ | 604/12384 [1:17:13<25:00:31, 7.64s/it, loss=0.3723, acc=0.6058, iter_time=6.45s]
Epoch 0: 5%|▍ | 605/12384 [1:17:13<24:58:34, 7.63s/it, loss=0.3723, acc=0.6058, iter_time=6.45s]
Epoch 0: 5%|▍ | 605/12384 [1:17:21<24:58:34, 7.63s/it, loss=0.4356, acc=0.4972, iter_time=8.80s]
Epoch 0: 5%|▍ | 606/12384 [1:17:21<24:58:41, 7.63s/it, loss=0.4356, acc=0.4972, iter_time=8.80s]
Epoch 0: 5%|▍ | 606/12384 [1:17:29<24:58:41, 7.63s/it, loss=0.3879, acc=0.5585, iter_time=7.63s]
Epoch 0: 5%|▍ | 607/12384 [1:17:29<24:59:41, 7.64s/it, loss=0.3879, acc=0.5585, iter_time=7.63s]
Epoch 0: 5%|▍ | 607/12384 [1:17:36<24:59:41, 7.64s/it, loss=0.4014, acc=0.5559, iter_time=7.64s]
Epoch 0: 5%|▍ | 608/12384 [1:17:36<25:00:20, 7.64s/it, loss=0.4014, acc=0.5559, iter_time=7.64s]
Epoch 0: 5%|▍ | 608/12384 [1:17:44<25:00:20, 7.64s/it, loss=0.3320, acc=0.5873, iter_time=7.68s]
Epoch 0: 5%|▍ | 609/12384 [1:17:44<24:58:37, 7.64s/it, loss=0.3320, acc=0.5873, iter_time=7.68s]
Epoch 0: 5%|▍ | 609/12384 [1:17:52<24:58:37, 7.64s/it, loss=0.4512, acc=0.5488, iter_time=4.07s]
Epoch 0: 5%|▍ | 610/12384 [1:17:52<24:59:21, 7.64s/it, loss=0.4512, acc=0.5488, iter_time=4.07s]
Epoch 0: 5%|▍ | 610/12384 [1:17:59<24:59:21, 7.64s/it, loss=0.3436, acc=0.5503, iter_time=11.19s]
Epoch 0: 5%|▍ | 611/12384 [1:17:59<25:00:45, 7.65s/it, loss=0.3436, acc=0.5503, iter_time=11.19s]
Epoch 0: 5%|▍ | 611/12384 [1:18:07<25:00:45, 7.65s/it, loss=0.2757, acc=0.6474, iter_time=7.72s]
Epoch 0: 5%|▍ | 612/12384 [1:18:07<25:01:53, 7.65s/it, loss=0.2757, acc=0.6474, iter_time=7.72s]
Epoch 0: 5%|▍ | 612/12384 [1:18:15<25:01:53, 7.65s/it, loss=0.3746, acc=0.5754, iter_time=7.92s]
Epoch 0: 5%|▍ | 613/12384 [1:18:15<25:19:13, 7.74s/it, loss=0.3746, acc=0.5754, iter_time=7.92s]
Epoch 0: 5%|▍ | 613/12384 [1:18:23<25:19:13, 7.74s/it, loss=0.3046, acc=0.5813, iter_time=6.71s]
Epoch 0: 5%|▍ | 614/12384 [1:18:23<25:12:10, 7.71s/it, loss=0.3046, acc=0.5813, iter_time=6.71s]
Epoch 0: 5%|▍ | 614/12384 [1:18:30<25:12:10, 7.71s/it, loss=0.3546, acc=0.5911, iter_time=5.79s]
Epoch 0: 5%|▍ | 615/12384 [1:18:30<25:07:42, 7.69s/it, loss=0.3546, acc=0.5911, iter_time=5.79s]
Epoch 0: 5%|▍ | 615/12384 [1:18:38<25:07:42, 7.69s/it, loss=0.2801, acc=0.6547, iter_time=10.86s]
Epoch 0: 5%|▍ | 616/12384 [1:18:38<25:06:35, 7.68s/it, loss=0.2801, acc=0.6547, iter_time=10.86s]
Epoch 0: 5%|▍ | 616/12384 [1:18:45<25:06:35, 7.68s/it, loss=0.3847, acc=0.5504, iter_time=7.21s]
Epoch 0: 5%|▍ | 617/12384 [1:18:45<25:03:00, 7.66s/it, loss=0.3847, acc=0.5504, iter_time=7.21s]
Epoch 0: 5%|▍ | 617/12384 [1:18:53<25:03:00, 7.66s/it, loss=0.2462, acc=0.6632, iter_time=5.85s]
Epoch 0: 5%|▍ | 618/12384 [1:18:53<25:01:59, 7.66s/it, loss=0.2462, acc=0.6632, iter_time=5.85s]
Epoch 0: 5%|▍ | 618/12384 [1:19:01<25:01:59, 7.66s/it, loss=0.3307, acc=0.6648, iter_time=9.42s]
Epoch 0: 5%|▍ | 619/12384 [1:19:01<25:00:27, 7.65s/it, loss=0.3307, acc=0.6648, iter_time=9.42s]
Epoch 0: 5%|▍ | 619/12384 [1:19:08<25:00:27, 7.65s/it, loss=0.3192, acc=0.5956, iter_time=7.64s]
Epoch 0: 5%|▌ | 620/12384 [1:19:08<24:56:30, 7.63s/it, loss=0.3192, acc=0.5956, iter_time=7.64s]
Epoch 0: 5%|▌ | 620/12384 [1:19:16<24:56:30, 7.63s/it, loss=0.2890, acc=0.6224, iter_time=7.60s]
Epoch 0: 5%|▌ | 621/12384 [1:19:16<24:55:58, 7.63s/it, loss=0.2890, acc=0.6224, iter_time=7.60s]
Epoch 0: 5%|▌ | 621/12384 [1:19:24<24:55:58, 7.63s/it, loss=0.2759, acc=0.6690, iter_time=7.63s]
Epoch 0: 5%|▌ | 622/12384 [1:19:24<24:57:59, 7.64s/it, loss=0.2759, acc=0.6690, iter_time=7.63s]
Epoch 0: 5%|▌ | 622/12384 [1:19:31<24:57:59, 7.64s/it, loss=0.2857, acc=0.6261, iter_time=7.66s]
Epoch 0: 5%|▌ | 623/12384 [1:19:31<24:57:50, 7.64s/it, loss=0.2857, acc=0.6261, iter_time=7.66s]
Epoch 0: 5%|▌ | 623/12384 [1:19:39<24:57:50, 7.64s/it, loss=0.2741, acc=0.6090, iter_time=8.04s]
Epoch 0: 5%|▌ | 624/12384 [1:19:39<25:00:58, 7.66s/it, loss=0.2741, acc=0.6090, iter_time=8.04s]
Epoch 0: 5%|▌ | 624/12384 [1:19:47<25:00:58, 7.66s/it, loss=0.3084, acc=0.5810, iter_time=7.30s]
Epoch 0: 5%|▌ | 625/12384 [1:19:47<24:59:33, 7.65s/it, loss=0.3084, acc=0.5810, iter_time=7.30s]
Epoch 0: 5%|▌ | 625/12384 [1:19:54<24:59:33, 7.65s/it, loss=0.2274, acc=0.7522, iter_time=4.04s]
Epoch 0: 5%|▌ | 626/12384 [1:19:54<24:56:39, 7.64s/it, loss=0.2274, acc=0.7522, iter_time=4.04s]
Epoch 0: 5%|▌ | 626/12384 [1:20:02<24:56:39, 7.64s/it, loss=0.2724, acc=0.6851, iter_time=11.17s]
Epoch 0: 5%|▌ | 627/12384 [1:20:02<24:55:59, 7.63s/it, loss=0.2724, acc=0.6851, iter_time=11.17s]
Epoch 0: 5%|▌ | 627/12384 [1:20:09<24:55:59, 7.63s/it, loss=0.2737, acc=0.6208, iter_time=7.65s]
Epoch 0: 5%|▌ | 628/12384 [1:20:09<24:54:54, 7.63s/it, loss=0.2737, acc=0.6208, iter_time=7.65s]
Epoch 0: 5%|▌ | 628/12384 [1:20:17<24:54:54, 7.63s/it, loss=0.2697, acc=0.6223, iter_time=7.62s]
Epoch 0: 5%|▌ | 629/12384 [1:20:17<24:54:39, 7.63s/it, loss=0.2697, acc=0.6223, iter_time=7.62s]
Epoch 0: 5%|▌ | 629/12384 [1:20:25<24:54:39, 7.63s/it, loss=0.3092, acc=0.6069, iter_time=7.65s]
Epoch 0: 5%|▌ | 630/12384 [1:20:25<24:56:20, 7.64s/it, loss=0.3092, acc=0.6069, iter_time=7.65s]
Epoch 0: 5%|▌ | 630/12384 [1:20:32<24:56:20, 7.64s/it, loss=0.2454, acc=0.6816, iter_time=7.64s]
Epoch 0: 5%|▌ | 631/12384 [1:20:32<24:56:58, 7.64s/it, loss=0.2454, acc=0.6816, iter_time=7.64s]
Epoch 0: 5%|▌ | 631/12384 [1:20:40<24:56:58, 7.64s/it, loss=0.3183, acc=0.5691, iter_time=8.04s]
Epoch 0: 5%|▌ | 632/12384 [1:20:40<24:56:56, 7.64s/it, loss=0.3183, acc=0.5691, iter_time=8.04s]
Epoch 0: 5%|▌ | 632/12384 [1:20:48<24:56:56, 7.64s/it, loss=0.2355, acc=0.6794, iter_time=7.25s]
Epoch 0: 5%|▌ | 633/12384 [1:20:48<24:56:52, 7.64s/it, loss=0.2355, acc=0.6794, iter_time=7.25s]
Epoch 0: 5%|▌ | 633/12384 [1:20:55<24:56:52, 7.64s/it, loss=0.2374, acc=0.6964, iter_time=7.63s]
Epoch 0: 5%|▌ | 634/12384 [1:20:55<24:57:06, 7.64s/it, loss=0.2374, acc=0.6964, iter_time=7.63s]
Epoch 0: 5%|▌ | 634/12384 [1:21:03<24:57:06, 7.64s/it, loss=0.2305, acc=0.6784, iter_time=7.66s]
Epoch 0: 5%|▌ | 635/12384 [1:21:03<24:58:33, 7.65s/it, loss=0.2305, acc=0.6784, iter_time=7.66s]
Epoch 0: 5%|▌ | 635/12384 [1:21:11<24:58:33, 7.65s/it, loss=0.1761, acc=0.7745, iter_time=7.67s]
Epoch 0: 5%|▌ | 636/12384 [1:21:11<24:59:50, 7.66s/it, loss=0.1761, acc=0.7745, iter_time=7.67s]
Epoch 0: 5%|▌ | 636/12384 [1:21:18<24:59:50, 7.66s/it, loss=0.1990, acc=0.7060, iter_time=7.68s]
Epoch 0: 5%|▌ | 637/12384 [1:21:18<24:57:25, 7.65s/it, loss=0.1990, acc=0.7060, iter_time=7.68s]
Epoch 0: 5%|▌ | 637/12384 [1:21:26<24:57:25, 7.65s/it, loss=0.2891, acc=0.6542, iter_time=7.66s]
Epoch 0: 5%|▌ | 638/12384 [1:21:26<25:01:05, 7.67s/it, loss=0.2891, acc=0.6542, iter_time=7.66s]
Epoch 0: 5%|▌ | 638/12384 [1:21:35<25:01:05, 7.67s/it, loss=0.2287, acc=0.6787, iter_time=8.48s]
Epoch 0: 5%|▌ | 639/12384 [1:21:35<25:54:06, 7.94s/it, loss=0.2287, acc=0.6787, iter_time=8.48s]
Epoch 0: 5%|▌ | 639/12384 [1:21:43<25:54:06, 7.94s/it, loss=0.2104, acc=0.7418, iter_time=8.11s]
Epoch 0: 5%|▌ | 640/12384 [1:21:43<25:58:16, 7.96s/it, loss=0.2104, acc=0.7418, iter_time=8.11s]
Epoch 0: 5%|▌ | 640/12384 [1:21:50<25:58:16, 7.96s/it, loss=0.2158, acc=0.6936, iter_time=7.65s]
Epoch 0: 5%|▌ | 641/12384 [1:21:50<25:42:47, 7.88s/it, loss=0.2158, acc=0.6936, iter_time=7.65s]
Epoch 0: 5%|▌ | 641/12384 [1:21:58<25:42:47, 7.88s/it, loss=0.1843, acc=0.7471, iter_time=7.73s]
Epoch 0: 5%|▌ | 642/12384 [1:21:58<25:26:42, 7.80s/it, loss=0.1843, acc=0.7471, iter_time=7.73s]
Epoch 0: 5%|▌ | 642/12384 [1:22:06<25:26:42, 7.80s/it, loss=0.2027, acc=0.7683, iter_time=6.67s]
Epoch 0: 5%|▌ | 643/12384 [1:22:06<25:17:14, 7.75s/it, loss=0.2027, acc=0.7683, iter_time=6.67s]
Epoch 0: 5%|▌ | 643/12384 [1:22:13<25:17:14, 7.75s/it, loss=0.1985, acc=0.7134, iter_time=8.56s]
Epoch 0: 5%|▌ | 644/12384 [1:22:13<25:08:42, 7.71s/it, loss=0.1985, acc=0.7134, iter_time=8.56s]
Epoch 0: 5%|▌ | 644/12384 [1:22:21<25:08:42, 7.71s/it, loss=0.1784, acc=0.7264, iter_time=7.64s]
Epoch 0: 5%|▌ | 645/12384 [1:22:21<25:04:52, 7.69s/it, loss=0.1784, acc=0.7264, iter_time=7.64s]
Epoch 0: 5%|▌ | 645/12384 [1:22:28<25:04:52, 7.69s/it, loss=0.1879, acc=0.7621, iter_time=7.62s]
Epoch 0: 5%|▌ | 646/12384 [1:22:28<25:00:38, 7.67s/it, loss=0.1879, acc=0.7621, iter_time=7.62s]
Epoch 0: 5%|▌ | 646/12384 [1:22:36<25:00:38, 7.67s/it, loss=0.1737, acc=0.7515, iter_time=7.63s]
Epoch 0: 5%|▌ | 647/12384 [1:22:36<24:58:09, 7.66s/it, loss=0.1737, acc=0.7515, iter_time=7.63s]
Epoch 0: 5%|▌ | 647/12384 [1:22:44<24:58:09, 7.66s/it, loss=0.1593, acc=0.7533, iter_time=8.02s]
Epoch 0: 5%|▌ | 648/12384 [1:22:44<24:54:37, 7.64s/it, loss=0.1593, acc=0.7533, iter_time=8.02s]
Epoch 0: 5%|▌ | 648/12384 [1:22:51<24:54:37, 7.64s/it, loss=0.1462, acc=0.7813, iter_time=7.21s]
Epoch 0: 5%|▌ | 649/12384 [1:22:51<24:52:36, 7.63s/it, loss=0.1462, acc=0.7813, iter_time=7.21s]
Epoch 0: 5%|▌ | 649/12384 [1:22:59<24:52:36, 7.63s/it, loss=0.5466, acc=0.6792, iter_time=8.10s]
Epoch 0: 5%|▌ | 650/12384 [1:22:59<24:56:29, 7.65s/it, loss=0.5466, acc=0.6792, iter_time=8.10s]
Epoch 0: 5%|▌ | 650/12384 [1:23:07<24:56:29, 7.65s/it, loss=0.1704, acc=0.7695, iter_time=7.24s]
Epoch 0: 5%|▌ | 651/12384 [1:23:07<24:59:51, 7.67s/it, loss=0.1704, acc=0.7695, iter_time=7.24s]
Epoch 0: 5%|▌ | 651/12384 [1:23:14<24:59:51, 7.67s/it, loss=0.1583, acc=0.7768, iter_time=7.70s]
Epoch 0: 5%|▌ | 652/12384 [1:23:14<24:57:30, 7.66s/it, loss=0.1583, acc=0.7768, iter_time=7.70s]
Epoch 0: 5%|▌ | 652/12384 [1:23:22<24:57:30, 7.66s/it, loss=0.2298, acc=0.7080, iter_time=7.64s]
Epoch 0: 5%|▌ | 653/12384 [1:23:22<24:55:59, 7.65s/it, loss=0.2298, acc=0.7080, iter_time=7.64s]
Epoch 0: 5%|▌ | 653/12384 [1:23:30<24:55:59, 7.65s/it, loss=0.1883, acc=0.7259, iter_time=4.84s]
Epoch 0: 5%|▌ | 654/12384 [1:23:30<24:54:47, 7.65s/it, loss=0.1883, acc=0.7259, iter_time=4.84s]
Epoch 0: 5%|▌ | 654/12384 [1:23:37<24:54:47, 7.65s/it, loss=0.1999, acc=0.7265, iter_time=10.41s]
Epoch 0: 5%|▌ | 655/12384 [1:23:37<24:53:51, 7.64s/it, loss=0.1999, acc=0.7265, iter_time=10.41s]
Epoch 0: 5%|▌ | 655/12384 [1:23:45<24:53:51, 7.64s/it, loss=0.1884, acc=0.7112, iter_time=8.01s]
Epoch 0: 5%|▌ | 656/12384 [1:23:45<24:58:08, 7.66s/it, loss=0.1884, acc=0.7112, iter_time=8.01s]
Epoch 0: 5%|▌ | 656/12384 [1:23:53<24:58:08, 7.66s/it, loss=0.1850, acc=0.7239, iter_time=7.35s]
Epoch 0: 5%|▌ | 657/12384 [1:23:53<24:54:59, 7.65s/it, loss=0.1850, acc=0.7239, iter_time=7.35s]
Epoch 0: 5%|▌ | 657/12384 [1:24:00<24:54:59, 7.65s/it, loss=0.1589, acc=0.7934, iter_time=7.59s]
Epoch 0: 5%|▌ | 658/12384 [1:24:00<24:51:10, 7.63s/it, loss=0.1589, acc=0.7934, iter_time=7.59s]
Epoch 0: 5%|▌ | 658/12384 [1:24:08<24:51:10, 7.63s/it, loss=0.1807, acc=0.7450, iter_time=7.62s]
Epoch 0: 5%|▌ | 659/12384 [1:24:08<24:53:02, 7.64s/it, loss=0.1807, acc=0.7450, iter_time=7.62s]
Epoch 0: 5%|▌ | 659/12384 [1:24:15<24:53:02, 7.64s/it, loss=0.1695, acc=0.7443, iter_time=6.70s]
Epoch 0: 5%|▌ | 660/12384 [1:24:15<24:52:43, 7.64s/it, loss=0.1695, acc=0.7443, iter_time=6.70s]
Epoch 0: 5%|▌ | 660/12384 [1:24:23<24:52:43, 7.64s/it, loss=0.1544, acc=0.7608, iter_time=8.60s]
Epoch 0: 5%|▌ | 661/12384 [1:24:23<24:52:39, 7.64s/it, loss=0.1544, acc=0.7608, iter_time=8.60s]
Epoch 0: 5%|▌ | 661/12384 [1:24:31<24:52:39, 7.64s/it, loss=0.1465, acc=0.7956, iter_time=7.64s]
Epoch 0: 5%|▌ | 662/12384 [1:24:31<24:52:13, 7.64s/it, loss=0.1465, acc=0.7956, iter_time=7.64s]
Epoch 0: 5%|▌ | 662/12384 [1:24:38<24:52:13, 7.64s/it, loss=0.2700, acc=0.7387, iter_time=4.85s]
Epoch 0: 5%|▌ | 663/12384 [1:24:38<24:52:28, 7.64s/it, loss=0.2700, acc=0.7387, iter_time=4.85s]
Epoch 0: 5%|▌ | 663/12384 [1:24:46<24:52:28, 7.64s/it, loss=0.1463, acc=0.7929, iter_time=10.38s]
Epoch 0: 5%|▌ | 664/12384 [1:24:46<24:51:12, 7.63s/it, loss=0.1463, acc=0.7929, iter_time=10.38s]
Epoch 0: 5%|▌ | 664/12384 [1:24:54<24:51:12, 7.63s/it, loss=0.2011, acc=0.7511, iter_time=7.66s]
Epoch 0: 5%|▌ | 665/12384 [1:24:54<24:49:41, 7.63s/it, loss=0.2011, acc=0.7511, iter_time=7.66s]
Epoch 0: 5%|▌ | 665/12384 [1:25:01<24:49:41, 7.63s/it, loss=0.1036, acc=0.8381, iter_time=7.92s]
Epoch 0: 5%|▌ | 666/12384 [1:25:01<25:06:07, 7.71s/it, loss=0.1036, acc=0.8381, iter_time=7.92s]
Epoch 0: 5%|▌ | 666/12384 [1:25:09<25:06:07, 7.71s/it, loss=0.1327, acc=0.8042, iter_time=4.23s]
Epoch 0: 5%|▌ | 667/12384 [1:25:09<25:00:36, 7.68s/it, loss=0.1327, acc=0.8042, iter_time=4.23s]
Epoch 0: 5%|▌ | 667/12384 [1:25:17<25:00:36, 7.68s/it, loss=0.1302, acc=0.8088, iter_time=10.99s]
Epoch 0: 5%|▌ | 668/12384 [1:25:17<24:56:54, 7.67s/it, loss=0.1302, acc=0.8088, iter_time=10.99s]
Epoch 0: 5%|▌ | 668/12384 [1:25:24<24:56:54, 7.67s/it, loss=0.0870, acc=0.8783, iter_time=7.63s]
Epoch 0: 5%|▌ | 669/12384 [1:25:24<24:54:18, 7.65s/it, loss=0.0870, acc=0.8783, iter_time=7.63s]
Epoch 0: 5%|▌ | 669/12384 [1:25:32<24:54:18, 7.65s/it, loss=0.1286, acc=0.8579, iter_time=5.56s]
Epoch 0: 5%|▌ | 670/12384 [1:25:32<24:52:04, 7.64s/it, loss=0.1286, acc=0.8579, iter_time=5.56s]
Epoch 0: 5%|▌ | 670/12384 [1:25:40<24:52:04, 7.64s/it, loss=0.1241, acc=0.8032, iter_time=9.44s]
Epoch 0: 5%|▌ | 671/12384 [1:25:40<24:49:59, 7.63s/it, loss=0.1241, acc=0.8032, iter_time=9.44s]
Epoch 0: 5%|▌ | 671/12384 [1:25:47<24:49:59, 7.63s/it, loss=0.1622, acc=0.8018, iter_time=7.83s]
Epoch 0: 5%|▌ | 672/12384 [1:25:47<24:50:36, 7.64s/it, loss=0.1622, acc=0.8018, iter_time=7.83s]
Epoch 0: 5%|▌ | 672/12384 [1:25:55<24:50:36, 7.64s/it, loss=0.1058, acc=0.8327, iter_time=6.69s]
Epoch 0: 5%|▌ | 673/12384 [1:25:55<24:48:24, 7.63s/it, loss=0.1058, acc=0.8327, iter_time=6.69s]
Epoch 0: 5%|▌ | 673/12384 [1:26:02<24:48:24, 7.63s/it, loss=0.1210, acc=0.8160, iter_time=5.04s]
Epoch 0: 5%|▌ | 674/12384 [1:26:02<24:46:49, 7.62s/it, loss=0.1210, acc=0.8160, iter_time=5.04s]
Epoch 0: 5%|▌ | 674/12384 [1:26:10<24:46:49, 7.62s/it, loss=0.1089, acc=0.8183, iter_time=11.10s]
Epoch 0: 5%|▌ | 675/12384 [1:26:10<24:46:43, 7.62s/it, loss=0.1089, acc=0.8183, iter_time=11.10s]
Epoch 0: 5%|▌ | 675/12384 [1:26:18<24:46:43, 7.62s/it, loss=0.1180, acc=0.8083, iter_time=7.63s]
Epoch 0: 5%|▌ | 676/12384 [1:26:18<24:47:31, 7.62s/it, loss=0.1180, acc=0.8083, iter_time=7.63s]
Epoch 0: 5%|▌ | 676/12384 [1:26:25<24:47:31, 7.62s/it, loss=0.1031, acc=0.8541, iter_time=7.63s]
Epoch 0: 5%|▌ | 677/12384 [1:26:25<24:45:33, 7.61s/it, loss=0.1031, acc=0.8541, iter_time=7.63s]
Epoch 0: 5%|▌ | 677/12384 [1:26:33<24:45:33, 7.61s/it, loss=0.1068, acc=0.8435, iter_time=7.60s]
Epoch 0: 5%|▌ | 678/12384 [1:26:33<24:46:14, 7.62s/it, loss=0.1068, acc=0.8435, iter_time=7.60s]
Epoch 0: 5%|▌ | 678/12384 [1:26:41<24:46:14, 7.62s/it, loss=0.2316, acc=0.7498, iter_time=5.90s]
Epoch 0: 5%|▌ | 679/12384 [1:26:41<24:50:06, 7.64s/it, loss=0.2316, acc=0.7498, iter_time=5.90s]
Epoch 0: 5%|▌ | 679/12384 [1:26:48<24:50:06, 7.64s/it, loss=0.1292, acc=0.8201, iter_time=9.40s]
Epoch 0: 5%|▌ | 680/12384 [1:26:48<24:50:21, 7.64s/it, loss=0.1292, acc=0.8201, iter_time=9.40s]
Epoch 0: 5%|▌ | 680/12384 [1:26:56<24:50:21, 7.64s/it, loss=0.1082, acc=0.8327, iter_time=7.72s]
Epoch 0: 5%|▌ | 681/12384 [1:26:56<24:51:59, 7.65s/it, loss=0.1082, acc=0.8327, iter_time=7.72s]
Epoch 0: 5%|▌ | 681/12384 [1:27:04<24:51:59, 7.65s/it, loss=0.1277, acc=0.8374, iter_time=4.84s]
Epoch 0: 6%|▌ | 682/12384 [1:27:04<24:50:16, 7.64s/it, loss=0.1277, acc=0.8374, iter_time=4.84s]
Epoch 0: 6%|▌ | 682/12384 [1:27:11<24:50:16, 7.64s/it, loss=0.1247, acc=0.7995, iter_time=10.39s]
Epoch 0: 6%|▌ | 683/12384 [1:27:11<24:50:26, 7.64s/it, loss=0.1247, acc=0.7995, iter_time=10.39s]
Epoch 0: 6%|▌ | 683/12384 [1:27:19<24:50:26, 7.64s/it, loss=0.1036, acc=0.8508, iter_time=6.42s]
Epoch 0: 6%|▌ | 684/12384 [1:27:19<24:49:39, 7.64s/it, loss=0.1036, acc=0.8508, iter_time=6.42s]
Epoch 0: 6%|▌ | 684/12384 [1:27:26<24:49:39, 7.64s/it, loss=0.1177, acc=0.8069, iter_time=7.94s]
Epoch 0: 6%|▌ | 685/12384 [1:27:26<24:47:02, 7.63s/it, loss=0.1177, acc=0.8069, iter_time=7.94s]
Epoch 0: 6%|▌ | 685/12384 [1:27:34<24:47:02, 7.63s/it, loss=0.1126, acc=0.8421, iter_time=8.53s]
Epoch 0: 6%|▌ | 686/12384 [1:27:34<24:48:19, 7.63s/it, loss=0.1126, acc=0.8421, iter_time=8.53s]
Epoch 0: 6%|▌ | 686/12384 [1:27:42<24:48:19, 7.63s/it, loss=0.1070, acc=0.8501, iter_time=7.64s]
Epoch 0: 6%|▌ | 687/12384 [1:27:42<24:50:35, 7.65s/it, loss=0.1070, acc=0.8501, iter_time=7.64s]
Epoch 0: 6%|▌ | 687/12384 [1:27:49<24:50:35, 7.65s/it, loss=0.1305, acc=0.7891, iter_time=8.06s]
Epoch 0: 6%|▌ | 688/12384 [1:27:49<24:48:56, 7.64s/it, loss=0.1305, acc=0.7891, iter_time=8.06s]
Epoch 0: 6%|▌ | 688/12384 [1:27:57<24:48:56, 7.64s/it, loss=0.0905, acc=0.8557, iter_time=7.36s]
Epoch 0: 6%|▌ | 689/12384 [1:27:57<24:53:38, 7.66s/it, loss=0.0905, acc=0.8557, iter_time=7.36s]
Epoch 0: 6%|▌ | 689/12384 [1:28:05<24:53:38, 7.66s/it, loss=0.0984, acc=0.8304, iter_time=6.40s]
Epoch 0: 6%|▌ | 690/12384 [1:28:05<24:51:24, 7.65s/it, loss=0.0984, acc=0.8304, iter_time=6.40s]
Epoch 0: 6%|▌ | 690/12384 [1:28:12<24:51:24, 7.65s/it, loss=0.0924, acc=0.8252, iter_time=8.84s]
Epoch 0: 6%|▌ | 691/12384 [1:28:12<24:51:44, 7.65s/it, loss=0.0924, acc=0.8252, iter_time=8.84s]
Epoch 0: 6%|▌ | 691/12384 [1:28:20<24:51:44, 7.65s/it, loss=0.0950, acc=0.8587, iter_time=7.66s]
Epoch 0: 6%|▌ | 692/12384 [1:28:20<24:49:29, 7.64s/it, loss=0.0950, acc=0.8587, iter_time=7.66s]
Epoch 0: 6%|▌ | 692/12384 [1:28:28<24:49:29, 7.64s/it, loss=0.1179, acc=0.7997, iter_time=7.94s]
Epoch 0: 6%|▌ | 693/12384 [1:28:28<25:08:25, 7.74s/it, loss=0.1179, acc=0.7997, iter_time=7.94s]
Epoch 0: 6%|▌ | 693/12384 [1:28:36<25:08:25, 7.74s/it, loss=0.0900, acc=0.8538, iter_time=7.08s]
Epoch 0: 6%|▌ | 694/12384 [1:28:36<25:00:02, 7.70s/it, loss=0.0900, acc=0.8538, iter_time=7.08s]
Epoch 0: 6%|▌ | 694/12384 [1:28:43<25:00:02, 7.70s/it, loss=0.0796, acc=0.8855, iter_time=4.61s]
Epoch 0: 6%|▌ | 695/12384 [1:28:43<24:53:38, 7.67s/it, loss=0.0796, acc=0.8855, iter_time=4.61s]
Epoch 0: 6%|▌ | 695/12384 [1:28:51<24:53:38, 7.67s/it, loss=0.0898, acc=0.8556, iter_time=11.22s]
Epoch 0: 6%|▌ | 696/12384 [1:28:51<24:49:06, 7.64s/it, loss=0.0898, acc=0.8556, iter_time=11.22s]
Epoch 0: 6%|▌ | 696/12384 [1:28:58<24:49:06, 7.64s/it, loss=0.0742, acc=0.9220, iter_time=4.88s]
Epoch 0: 6%|▌ | 697/12384 [1:28:58<24:47:54, 7.64s/it, loss=0.0742, acc=0.9220, iter_time=4.88s]
Epoch 0: 6%|▌ | 697/12384 [1:29:06<24:47:54, 7.64s/it, loss=0.0700, acc=0.9074, iter_time=8.46s]
Epoch 0: 6%|▌ | 698/12384 [1:29:06<24:49:52, 7.65s/it, loss=0.0700, acc=0.9074, iter_time=8.46s]
Epoch 0: 6%|▌ | 698/12384 [1:29:14<24:49:52, 7.65s/it, loss=0.1078, acc=0.8478, iter_time=8.52s]
Epoch 0: 6%|▌ | 699/12384 [1:29:14<24:46:45, 7.63s/it, loss=0.1078, acc=0.8478, iter_time=8.52s]
Epoch 0: 6%|▌ | 699/12384 [1:29:21<24:46:45, 7.63s/it, loss=0.0870, acc=0.8846, iter_time=8.96s]
Epoch 0: 6%|▌ | 700/12384 [1:29:21<24:45:54, 7.63s/it, loss=0.0870, acc=0.8846, iter_time=8.96s]
Epoch 0: 6%|▌ | 700/12384 [1:29:29<24:45:54, 7.63s/it, loss=0.0963, acc=0.8636, iter_time=7.20s]
Epoch 0: 6%|▌ | 701/12384 [1:29:29<24:44:46, 7.63s/it, loss=0.0963, acc=0.8636, iter_time=7.20s]
Epoch 0: 6%|▌ | 701/12384 [1:29:36<24:44:46, 7.63s/it, loss=0.0899, acc=0.8464, iter_time=7.63s]
Epoch 0: 6%|▌ | 702/12384 [1:29:36<24:44:36, 7.63s/it, loss=0.0899, acc=0.8464, iter_time=7.63s]
Epoch 0: 6%|▌ | 702/12384 [1:29:44<24:44:36, 7.63s/it, loss=0.0659, acc=0.8993, iter_time=7.62s]
Epoch 0: 6%|▌ | 703/12384 [1:29:44<24:44:40, 7.63s/it, loss=0.0659, acc=0.8993, iter_time=7.62s]
Epoch 0: 6%|▌ | 703/12384 [1:29:52<24:44:40, 7.63s/it, loss=0.0636, acc=0.9133, iter_time=7.61s]
Epoch 0: 6%|▌ | 704/12384 [1:29:52<24:45:31, 7.63s/it, loss=0.0636, acc=0.9133, iter_time=7.61s]
Epoch 0: 6%|▌ | 704/12384 [1:29:59<24:45:31, 7.63s/it, loss=0.0882, acc=0.8802, iter_time=5.10s]
Epoch 0: 6%|▌ | 705/12384 [1:29:59<24:45:50, 7.63s/it, loss=0.0882, acc=0.8802, iter_time=5.10s]
Epoch 0: 6%|▌ | 705/12384 [1:30:07<24:45:50, 7.63s/it, loss=0.0552, acc=0.9215, iter_time=10.19s]
Epoch 0: 6%|▌ | 706/12384 [1:30:07<24:44:24, 7.63s/it, loss=0.0552, acc=0.9215, iter_time=10.19s]
Epoch 0: 6%|▌ | 706/12384 [1:30:15<24:44:24, 7.63s/it, loss=0.0729, acc=0.8890, iter_time=7.63s]
Epoch 0: 6%|▌ | 707/12384 [1:30:15<24:45:26, 7.63s/it, loss=0.0729, acc=0.8890, iter_time=7.63s]
Epoch 0: 6%|▌ | 707/12384 [1:30:22<24:45:26, 7.63s/it, loss=0.0743, acc=0.8881, iter_time=7.62s]
Epoch 0: 6%|▌ | 708/12384 [1:30:22<24:44:36, 7.63s/it, loss=0.0743, acc=0.8881, iter_time=7.62s]
Epoch 0: 6%|▌ | 708/12384 [1:30:30<24:44:36, 7.63s/it, loss=0.0683, acc=0.8922, iter_time=7.65s]
Epoch 0: 6%|▌ | 709/12384 [1:30:30<24:43:40, 7.62s/it, loss=0.0683, acc=0.8922, iter_time=7.65s]
Epoch 0: 6%|▌ | 709/12384 [1:30:38<24:43:40, 7.62s/it, loss=0.0779, acc=0.8605, iter_time=4.74s]
Epoch 0: 6%|▌ | 710/12384 [1:30:38<24:44:15, 7.63s/it, loss=0.0779, acc=0.8605, iter_time=4.74s]
Epoch 0: 6%|▌ | 710/12384 [1:30:45<24:44:15, 7.63s/it, loss=0.0851, acc=0.8623, iter_time=10.49s]
Epoch 0: 6%|▌ | 711/12384 [1:30:45<24:45:14, 7.63s/it, loss=0.0851, acc=0.8623, iter_time=10.49s]
Epoch 0: 6%|▌ | 711/12384 [1:30:53<24:45:14, 7.63s/it, loss=0.1700, acc=0.8449, iter_time=8.04s]
Epoch 0: 6%|▌ | 712/12384 [1:30:53<24:45:44, 7.64s/it, loss=0.1700, acc=0.8449, iter_time=8.04s]
Epoch 0: 6%|▌ | 712/12384 [1:31:00<24:45:44, 7.64s/it, loss=0.1078, acc=0.8213, iter_time=7.23s]
Epoch 0: 6%|▌ | 713/12384 [1:31:00<24:45:00, 7.63s/it, loss=0.1078, acc=0.8213, iter_time=7.23s]
Epoch 0: 6%|▌ | 713/12384 [1:31:08<24:45:00, 7.63s/it, loss=0.0854, acc=0.8348, iter_time=7.01s]
Epoch 0: 6%|▌ | 714/12384 [1:31:08<24:45:39, 7.64s/it, loss=0.0854, acc=0.8348, iter_time=7.01s]
Epoch 0: 6%|▌ | 714/12384 [1:31:16<24:45:39, 7.64s/it, loss=0.0721, acc=0.8963, iter_time=8.30s]
Epoch 0: 6%|▌ | 715/12384 [1:31:16<24:46:52, 7.65s/it, loss=0.0721, acc=0.8963, iter_time=8.30s]
Epoch 0: 6%|▌ | 715/12384 [1:31:23<24:46:52, 7.65s/it, loss=0.0602, acc=0.9016, iter_time=7.66s]
Epoch 0: 6%|▌ | 716/12384 [1:31:23<24:44:33, 7.63s/it, loss=0.0602, acc=0.9016, iter_time=7.66s]
Epoch 0: 6%|▌ | 716/12384 [1:31:31<24:44:33, 7.63s/it, loss=0.0475, acc=0.9400, iter_time=7.61s]
Epoch 0: 6%|▌ | 717/12384 [1:31:31<24:43:56, 7.63s/it, loss=0.0475, acc=0.9400, iter_time=7.61s]
Epoch 0: 6%|▌ | 717/12384 [1:31:39<24:43:56, 7.63s/it, loss=0.0821, acc=0.8669, iter_time=5.83s]
Epoch 0: 6%|▌ | 718/12384 [1:31:39<24:47:11, 7.65s/it, loss=0.0821, acc=0.8669, iter_time=5.83s]
Epoch 0: 6%|▌ | 718/12384 [1:31:47<24:47:11, 7.65s/it, loss=0.0577, acc=0.9257, iter_time=9.48s]
Epoch 0: 6%|▌ | 719/12384 [1:31:47<25:02:04, 7.73s/it, loss=0.0577, acc=0.9257, iter_time=9.48s]
Epoch 0: 6%|▌ | 719/12384 [1:31:54<25:02:04, 7.73s/it, loss=0.0791, acc=0.8718, iter_time=8.29s]
Epoch 0: 6%|▌ | 720/12384 [1:31:54<24:57:03, 7.70s/it, loss=0.0791, acc=0.8718, iter_time=8.29s]
Epoch 0: 6%|▌ | 720/12384 [1:32:02<24:57:03, 7.70s/it, loss=0.1032, acc=0.8775, iter_time=7.24s]
Epoch 0: 6%|▌ | 721/12384 [1:32:02<24:51:42, 7.67s/it, loss=0.1032, acc=0.8775, iter_time=7.24s]
Epoch 0: 6%|▌ | 721/12384 [1:32:09<24:51:42, 7.67s/it, loss=0.0505, acc=0.9189, iter_time=6.42s]
Epoch 0: 6%|▌ | 722/12384 [1:32:09<24:47:12, 7.65s/it, loss=0.0505, acc=0.9189, iter_time=6.42s]
Epoch 0: 6%|▌ | 722/12384 [1:32:17<24:47:12, 7.65s/it, loss=0.0540, acc=0.9087, iter_time=8.80s]
Epoch 0: 6%|▌ | 723/12384 [1:32:17<24:45:45, 7.64s/it, loss=0.0540, acc=0.9087, iter_time=8.80s]
Epoch 0: 6%|▌ | 723/12384 [1:32:25<24:45:45, 7.64s/it, loss=0.0382, acc=0.9305, iter_time=7.64s]
Epoch 0: 6%|▌ | 724/12384 [1:32:25<24:44:41, 7.64s/it, loss=0.0382, acc=0.9305, iter_time=7.64s]
Epoch 0: 6%|▌ | 724/12384 [1:32:32<24:44:41, 7.64s/it, loss=0.0724, acc=0.8542, iter_time=4.25s]
Epoch 0: 6%|▌ | 725/12384 [1:32:32<24:45:24, 7.64s/it, loss=0.0724, acc=0.8542, iter_time=4.25s]
Epoch 0: 6%|▌ | 725/12384 [1:32:40<24:45:24, 7.64s/it, loss=0.0610, acc=0.9049, iter_time=11.01s]
Epoch 0: 6%|▌ | 726/12384 [1:32:40<24:43:10, 7.63s/it, loss=0.0610, acc=0.9049, iter_time=11.01s]
Epoch 0: 6%|▌ | 726/12384 [1:32:48<24:43:10, 7.63s/it, loss=0.0618, acc=0.9024, iter_time=7.63s]
Epoch 0: 6%|▌ | 727/12384 [1:32:48<24:41:11, 7.62s/it, loss=0.0618, acc=0.9024, iter_time=7.63s]
Epoch 0: 6%|▌ | 727/12384 [1:32:55<24:41:11, 7.62s/it, loss=0.0476, acc=0.9378, iter_time=7.57s]
Epoch 0: 6%|▌ | 728/12384 [1:32:55<24:41:34, 7.63s/it, loss=0.0476, acc=0.9378, iter_time=7.57s]
Epoch 0: 6%|▌ | 728/12384 [1:33:03<24:41:34, 7.63s/it, loss=0.0640, acc=0.8811, iter_time=7.68s]
Epoch 0: 6%|▌ | 729/12384 [1:33:03<24:41:03, 7.62s/it, loss=0.0640, acc=0.8811, iter_time=7.68s]
Epoch 0: 6%|▌ | 729/12384 [1:33:10<24:41:03, 7.62s/it, loss=0.0732, acc=0.8555, iter_time=7.59s]
Epoch 0: 6%|▌ | 730/12384 [1:33:10<24:40:30, 7.62s/it, loss=0.0732, acc=0.8555, iter_time=7.59s]
Epoch 0: 6%|▌ | 730/12384 [1:33:18<24:40:30, 7.62s/it, loss=0.1067, acc=0.8770, iter_time=4.56s]
Epoch 0: 6%|▌ | 731/12384 [1:33:18<24:42:32, 7.63s/it, loss=0.1067, acc=0.8770, iter_time=4.56s]
Epoch 0: 6%|▌ | 731/12384 [1:33:26<24:42:32, 7.63s/it, loss=0.0435, acc=0.9228, iter_time=7.91s]
Epoch 0: 6%|▌ | 732/12384 [1:33:26<24:49:14, 7.67s/it, loss=0.0435, acc=0.9228, iter_time=7.91s]
Epoch 0: 6%|▌ | 732/12384 [1:33:33<24:49:14, 7.67s/it, loss=0.0788, acc=0.8607, iter_time=10.56s]
Epoch 0: 6%|▌ | 733/12384 [1:33:33<24:47:25, 7.66s/it, loss=0.0788, acc=0.8607, iter_time=10.56s]
Epoch 0: 6%|▌ | 733/12384 [1:33:41<24:47:25, 7.66s/it, loss=0.0610, acc=0.8936, iter_time=6.16s]
Epoch 0: 6%|▌ | 734/12384 [1:33:41<24:46:09, 7.65s/it, loss=0.0610, acc=0.8936, iter_time=6.16s]
Epoch 0: 6%|▌ | 734/12384 [1:33:49<24:46:09, 7.65s/it, loss=0.0510, acc=0.9132, iter_time=7.92s]
Epoch 0: 6%|▌ | 735/12384 [1:33:49<24:45:02, 7.65s/it, loss=0.0510, acc=0.9132, iter_time=7.92s]
Epoch 0: 6%|▌ | 735/12384 [1:33:56<24:45:02, 7.65s/it, loss=0.0514, acc=0.9083, iter_time=9.25s]
Epoch 0: 6%|▌ | 736/12384 [1:33:56<24:46:00, 7.65s/it, loss=0.0514, acc=0.9083, iter_time=9.25s]
Epoch 0: 6%|▌ | 736/12384 [1:34:04<24:46:00, 7.65s/it, loss=0.0416, acc=0.9112, iter_time=4.95s]
Epoch 0: 6%|▌ | 737/12384 [1:34:04<24:42:48, 7.64s/it, loss=0.0416, acc=0.9112, iter_time=4.95s]
Epoch 0: 6%|▌ | 737/12384 [1:34:12<24:42:48, 7.64s/it, loss=0.0671, acc=0.9069, iter_time=9.90s]
Epoch 0: 6%|▌ | 738/12384 [1:34:12<24:42:37, 7.64s/it, loss=0.0671, acc=0.9069, iter_time=9.90s]
Epoch 0: 6%|▌ | 738/12384 [1:34:19<24:42:37, 7.64s/it, loss=0.0615, acc=0.8817, iter_time=7.66s]
Epoch 0: 6%|▌ | 739/12384 [1:34:19<24:44:39, 7.65s/it, loss=0.0615, acc=0.8817, iter_time=7.66s]
Epoch 0: 6%|▌ | 739/12384 [1:34:27<24:44:39, 7.65s/it, loss=0.0525, acc=0.9135, iter_time=5.90s]
Epoch 0: 6%|▌ | 740/12384 [1:34:27<24:47:19, 7.66s/it, loss=0.0525, acc=0.9135, iter_time=5.90s]
Epoch 0: 6%|▌ | 740/12384 [1:34:35<24:47:19, 7.66s/it, loss=0.2883, acc=0.8236, iter_time=9.47s]
Epoch 0: 6%|▌ | 741/12384 [1:34:35<24:44:20, 7.65s/it, loss=0.2883, acc=0.8236, iter_time=9.47s]
Epoch 0: 6%|▌ | 741/12384 [1:34:42<24:44:20, 7.65s/it, loss=0.0424, acc=0.9257, iter_time=7.59s]
Epoch 0: 6%|▌ | 742/12384 [1:34:42<24:42:15, 7.64s/it, loss=0.0424, acc=0.9257, iter_time=7.59s]
Epoch 0: 6%|▌ | 742/12384 [1:34:50<24:42:15, 7.64s/it, loss=0.1948, acc=0.8517, iter_time=7.62s]
Epoch 0: 6%|▌ | 743/12384 [1:34:50<24:41:33, 7.64s/it, loss=0.1948, acc=0.8517, iter_time=7.62s]
Epoch 0: 6%|▌ | 743/12384 [1:34:58<24:41:33, 7.64s/it, loss=0.0475, acc=0.9171, iter_time=8.04s]
Epoch 0: 6%|▌ | 744/12384 [1:34:58<24:40:17, 7.63s/it, loss=0.0475, acc=0.9171, iter_time=8.04s]
Epoch 0: 6%|▌ | 744/12384 [1:35:05<24:40:17, 7.63s/it, loss=0.0418, acc=0.9287, iter_time=7.52s]
Epoch 0: 6%|▌ | 745/12384 [1:35:05<24:58:51, 7.73s/it, loss=0.0418, acc=0.9287, iter_time=7.52s]
Epoch 0: 6%|▌ | 745/12384 [1:35:13<24:58:51, 7.73s/it, loss=0.0360, acc=0.9375, iter_time=7.68s]
Epoch 0: 6%|▌ | 746/12384 [1:35:13<24:57:01, 7.72s/it, loss=0.0360, acc=0.9375, iter_time=7.68s]
Epoch 0: 6%|▌ | 746/12384 [1:35:21<24:57:01, 7.72s/it, loss=0.0492, acc=0.9099, iter_time=7.68s]
Epoch 0: 6%|▌ | 747/12384 [1:35:21<24:51:00, 7.69s/it, loss=0.0492, acc=0.9099, iter_time=7.68s]
Epoch 0: 6%|▌ | 747/12384 [1:35:28<24:51:00, 7.69s/it, loss=0.0421, acc=0.9237, iter_time=7.61s]
Epoch 0: 6%|▌ | 748/12384 [1:35:28<24:47:09, 7.67s/it, loss=0.0421, acc=0.9237, iter_time=7.61s]
Epoch 0: 6%|▌ | 748/12384 [1:35:36<24:47:09, 7.67s/it, loss=0.0499, acc=0.9035, iter_time=7.03s]
Epoch 0: 6%|▌ | 749/12384 [1:35:36<24:42:50, 7.65s/it, loss=0.0499, acc=0.9035, iter_time=7.03s]
Epoch 0: 6%|▌ | 749/12384 [1:35:44<24:42:50, 7.65s/it, loss=0.0404, acc=0.9213, iter_time=8.59s]
Epoch 0: 6%|▌ | 750/12384 [1:35:44<24:41:44, 7.64s/it, loss=0.0404, acc=0.9213, iter_time=8.59s]
Epoch 0: 6%|▌ | 750/12384 [1:35:51<24:41:44, 7.64s/it, loss=0.0422, acc=0.9309, iter_time=4.63s]
Epoch 0: 6%|▌ | 751/12384 [1:35:51<24:39:00, 7.63s/it, loss=0.0422, acc=0.9309, iter_time=4.63s]
Epoch 0: 6%|▌ | 751/12384 [1:35:59<24:39:00, 7.63s/it, loss=0.0383, acc=0.9451, iter_time=10.54s]
Epoch 0: 6%|▌ | 752/12384 [1:35:59<24:39:12, 7.63s/it, loss=0.0383, acc=0.9451, iter_time=10.54s]
Epoch 0: 6%|▌ | 752/12384 [1:36:06<24:39:12, 7.63s/it, loss=0.0451, acc=0.9196, iter_time=7.27s]
Epoch 0: 6%|▌ | 753/12384 [1:36:06<24:39:29, 7.63s/it, loss=0.0451, acc=0.9196, iter_time=7.27s]
Epoch 0: 6%|▌ | 753/12384 [1:36:14<24:39:29, 7.63s/it, loss=0.0458, acc=0.9211, iter_time=7.64s]
Epoch 0: 6%|▌ | 754/12384 [1:36:14<24:40:17, 7.64s/it, loss=0.0458, acc=0.9211, iter_time=7.64s]
Epoch 0: 6%|▌ | 754/12384 [1:36:22<24:40:17, 7.64s/it, loss=0.0374, acc=0.9325, iter_time=7.64s]
Epoch 0: 6%|▌ | 755/12384 [1:36:22<24:40:36, 7.64s/it, loss=0.0374, acc=0.9325, iter_time=7.64s]
Epoch 0: 6%|▌ | 755/12384 [1:36:29<24:40:36, 7.64s/it, loss=0.2386, acc=0.8100, iter_time=7.64s]
Epoch 0: 6%|▌ | 756/12384 [1:36:29<24:39:46, 7.64s/it, loss=0.2386, acc=0.8100, iter_time=7.64s]
Epoch 0: 6%|▌ | 756/12384 [1:36:37<24:39:46, 7.64s/it, loss=0.0359, acc=0.9196, iter_time=6.43s]
Epoch 0: 6%|▌ | 757/12384 [1:36:37<24:36:51, 7.62s/it, loss=0.0359, acc=0.9196, iter_time=6.43s]
Epoch 0: 6%|▌ | 757/12384 [1:36:45<24:36:51, 7.62s/it, loss=0.0413, acc=0.9169, iter_time=5.04s]
Epoch 0: 6%|▌ | 758/12384 [1:36:45<24:36:17, 7.62s/it, loss=0.0413, acc=0.9169, iter_time=5.04s]
Epoch 0: 6%|▌ | 758/12384 [1:36:52<24:36:17, 7.62s/it, loss=0.0432, acc=0.9119, iter_time=11.35s]
Epoch 0: 6%|▌ | 759/12384 [1:36:52<24:34:29, 7.61s/it, loss=0.0432, acc=0.9119, iter_time=11.35s]
Epoch 0: 6%|▌ | 759/12384 [1:37:00<24:34:29, 7.61s/it, loss=0.0478, acc=0.9104, iter_time=7.99s]
Epoch 0: 6%|▌ | 760/12384 [1:37:00<24:36:19, 7.62s/it, loss=0.0478, acc=0.9104, iter_time=7.99s]
Epoch 0: 6%|▌ | 760/12384 [1:37:07<24:36:19, 7.62s/it, loss=0.0376, acc=0.9337, iter_time=7.24s]
Epoch 0: 6%|▌ | 761/12384 [1:37:07<24:37:37, 7.63s/it, loss=0.0376, acc=0.9337, iter_time=7.24s]
Epoch 0: 6%|▌ | 761/12384 [1:37:15<24:37:37, 7.63s/it, loss=0.0319, acc=0.9420, iter_time=7.67s]
Epoch 0: 6%|▌ | 762/12384 [1:37:15<24:36:26, 7.62s/it, loss=0.0319, acc=0.9420, iter_time=7.67s]
Epoch 0: 6%|▌ | 762/12384 [1:37:23<24:36:26, 7.62s/it, loss=0.0306, acc=0.9524, iter_time=7.58s]
Epoch 0: 6%|▌ | 763/12384 [1:37:23<24:34:05, 7.61s/it, loss=0.0306, acc=0.9524, iter_time=7.58s]
Epoch 0: 6%|▌ | 763/12384 [1:37:30<24:34:05, 7.61s/it, loss=0.0217, acc=0.9687, iter_time=4.47s]
Epoch 0: 6%|▌ | 764/12384 [1:37:30<24:36:08, 7.62s/it, loss=0.0217, acc=0.9687, iter_time=4.47s]
Epoch 0: 6%|▌ | 764/12384 [1:37:38<24:36:08, 7.62s/it, loss=0.0435, acc=0.9098, iter_time=10.17s]
Epoch 0: 6%|▌ | 765/12384 [1:37:38<24:34:32, 7.61s/it, loss=0.0435, acc=0.9098, iter_time=10.17s]
Epoch 0: 6%|▌ | 765/12384 [1:37:46<24:34:32, 7.61s/it, loss=0.0369, acc=0.9183, iter_time=6.73s]
Epoch 0: 6%|▌ | 766/12384 [1:37:46<24:35:48, 7.62s/it, loss=0.0369, acc=0.9183, iter_time=6.73s]
Epoch 0: 6%|▌ | 766/12384 [1:37:53<24:35:48, 7.62s/it, loss=0.0226, acc=0.9585, iter_time=6.53s]
Epoch 0: 6%|▌ | 767/12384 [1:37:53<24:35:49, 7.62s/it, loss=0.0226, acc=0.9585, iter_time=6.53s]
Epoch 0: 6%|▌ | 767/12384 [1:38:01<24:35:49, 7.62s/it, loss=0.0323, acc=0.9444, iter_time=10.59s]
Epoch 0: 6%|▌ | 768/12384 [1:38:01<24:38:55, 7.64s/it, loss=0.0323, acc=0.9444, iter_time=10.59s]
Epoch 0: 6%|▌ | 768/12384 [1:38:09<24:38:55, 7.64s/it, loss=0.0343, acc=0.9373, iter_time=7.30s]
Epoch 0: 6%|▌ | 769/12384 [1:38:09<24:38:52, 7.64s/it, loss=0.0343, acc=0.9373, iter_time=7.30s]
Epoch 0: 6%|▌ | 769/12384 [1:38:16<24:38:52, 7.64s/it, loss=0.0251, acc=0.9559, iter_time=7.65s]
Epoch 0: 6%|▌ | 770/12384 [1:38:16<24:38:04, 7.64s/it, loss=0.0251, acc=0.9559, iter_time=7.65s]
Epoch 0: 6%|▌ | 770/12384 [1:38:24<24:38:04, 7.64s/it, loss=0.0246, acc=0.9612, iter_time=7.94s]
Epoch 0: 6%|▌ | 771/12384 [1:38:24<24:59:50, 7.75s/it, loss=0.0246, acc=0.9612, iter_time=7.94s]
Epoch 0: 6%|▌ | 771/12384 [1:38:32<24:59:50, 7.75s/it, loss=0.0601, acc=0.8999, iter_time=7.70s]
Epoch 0: 6%|▌ | 772/12384 [1:38:32<24:51:15, 7.71s/it, loss=0.0601, acc=0.8999, iter_time=7.70s]
Epoch 0: 6%|▌ | 772/12384 [1:38:39<24:51:15, 7.71s/it, loss=0.0359, acc=0.9443, iter_time=7.60s]
Epoch 0: 6%|▌ | 773/12384 [1:38:39<24:44:39, 7.67s/it, loss=0.0359, acc=0.9443, iter_time=7.60s]
Epoch 0: 6%|▌ | 773/12384 [1:38:47<24:44:39, 7.67s/it, loss=0.0329, acc=0.9437, iter_time=7.58s]
Epoch 0: 6%|▋ | 774/12384 [1:38:47<24:40:25, 7.65s/it, loss=0.0329, acc=0.9437, iter_time=7.58s]
Epoch 0: 6%|▋ | 774/12384 [1:38:55<24:40:25, 7.65s/it, loss=0.0413, acc=0.9204, iter_time=7.63s]
Epoch 0: 6%|▋ | 775/12384 [1:38:55<24:38:11, 7.64s/it, loss=0.0413, acc=0.9204, iter_time=7.63s]
Epoch 0: 6%|▋ | 775/12384 [1:39:02<24:38:11, 7.64s/it, loss=0.0435, acc=0.9154, iter_time=7.64s]
Epoch 0: 6%|▋ | 776/12384 [1:39:02<24:41:52, 7.66s/it, loss=0.0435, acc=0.9154, iter_time=7.64s]
Epoch 0: 6%|▋ | 776/12384 [1:39:10<24:41:52, 7.66s/it, loss=0.0415, acc=0.9187, iter_time=7.66s]
Epoch 0: 6%|▋ | 777/12384 [1:39:10<24:45:14, 7.68s/it, loss=0.0415, acc=0.9187, iter_time=7.66s]
Epoch 0: 6%|▋ | 777/12384 [1:39:18<24:45:14, 7.68s/it, loss=0.0216, acc=0.9552, iter_time=7.74s]
Epoch 0: 6%|▋ | 778/12384 [1:39:18<24:42:22, 7.66s/it, loss=0.0216, acc=0.9552, iter_time=7.74s]
Epoch 0: 6%|▋ | 778/12384 [1:39:25<24:42:22, 7.66s/it, loss=0.0148, acc=0.9775, iter_time=7.63s]
Epoch 0: 6%|▋ | 779/12384 [1:39:25<24:40:21, 7.65s/it, loss=0.0148, acc=0.9775, iter_time=7.63s]
Epoch 0: 6%|▋ | 779/12384 [1:39:33<24:40:21, 7.65s/it, loss=0.0324, acc=0.9460, iter_time=7.65s]
Epoch 0: 6%|▋ | 780/12384 [1:39:33<24:38:24, 7.64s/it, loss=0.0324, acc=0.9460, iter_time=7.65s]
Epoch 0: 6%|▋ | 780/12384 [1:39:40<24:38:24, 7.64s/it, loss=0.0238, acc=0.9511, iter_time=7.60s]
Epoch 0: 6%|▋ | 781/12384 [1:39:40<24:36:47, 7.64s/it, loss=0.0238, acc=0.9511, iter_time=7.60s]
Epoch 0: 6%|▋ | 781/12384 [1:39:48<24:36:47, 7.64s/it, loss=0.0370, acc=0.9297, iter_time=7.65s]
Epoch 0: 6%|▋ | 782/12384 [1:39:48<24:36:28, 7.64s/it, loss=0.0370, acc=0.9297, iter_time=7.65s]
Epoch 0: 6%|▋ | 782/12384 [1:39:56<24:36:28, 7.64s/it, loss=0.0324, acc=0.9425, iter_time=7.60s]
Epoch 0: 6%|▋ | 783/12384 [1:39:56<24:37:43, 7.64s/it, loss=0.0324, acc=0.9425, iter_time=7.60s]
Epoch 0: 6%|▋ | 783/12384 [1:40:03<24:37:43, 7.64s/it, loss=0.0326, acc=0.9294, iter_time=8.04s]
Epoch 0: 6%|▋ | 784/12384 [1:40:03<24:37:34, 7.64s/it, loss=0.0326, acc=0.9294, iter_time=8.04s]
Epoch 0: 6%|▋ | 784/12384 [1:40:11<24:37:34, 7.64s/it, loss=0.0227, acc=0.9600, iter_time=7.24s]
Epoch 0: 6%|▋ | 785/12384 [1:40:11<24:35:05, 7.63s/it, loss=0.0227, acc=0.9600, iter_time=7.24s]
Epoch 0: 6%|▋ | 785/12384 [1:40:19<24:35:05, 7.63s/it, loss=0.0224, acc=0.9444, iter_time=4.49s]
Epoch 0: 6%|▋ | 786/12384 [1:40:19<24:34:26, 7.63s/it, loss=0.0224, acc=0.9444, iter_time=4.49s]
Epoch 0: 6%|▋ | 786/12384 [1:40:26<24:34:26, 7.63s/it, loss=0.0280, acc=0.9426, iter_time=7.69s]
Epoch 0: 6%|▋ | 787/12384 [1:40:26<24:33:20, 7.62s/it, loss=0.0280, acc=0.9426, iter_time=7.69s]
Epoch 0: 6%|▋ | 787/12384 [1:40:34<24:33:20, 7.62s/it, loss=0.0509, acc=0.9484, iter_time=10.66s]
Epoch 0: 6%|▋ | 788/12384 [1:40:34<24:33:31, 7.62s/it, loss=0.0509, acc=0.9484, iter_time=10.66s]
Epoch 0: 6%|▋ | 788/12384 [1:40:42<24:33:31, 7.62s/it, loss=0.0369, acc=0.9292, iter_time=5.66s]
Epoch 0: 6%|▋ | 789/12384 [1:40:42<24:34:25, 7.63s/it, loss=0.0369, acc=0.9292, iter_time=5.66s]
Epoch 0: 6%|▋ | 789/12384 [1:40:49<24:34:25, 7.63s/it, loss=0.0209, acc=0.9621, iter_time=9.60s]
Epoch 0: 6%|▋ | 790/12384 [1:40:49<24:33:11, 7.62s/it, loss=0.0209, acc=0.9621, iter_time=9.60s]
Epoch 0: 6%|▋ | 790/12384 [1:40:57<24:33:11, 7.62s/it, loss=0.0131, acc=0.9784, iter_time=7.63s]
Epoch 0: 6%|▋ | 791/12384 [1:40:57<24:33:43, 7.63s/it, loss=0.0131, acc=0.9784, iter_time=7.63s]
Epoch 0: 6%|▋ | 791/12384 [1:41:04<24:33:43, 7.63s/it, loss=0.0366, acc=0.9400, iter_time=8.03s]
Epoch 0: 6%|▋ | 792/12384 [1:41:04<24:36:42, 7.64s/it, loss=0.0366, acc=0.9400, iter_time=8.03s]
Epoch 0: 6%|▋ | 792/12384 [1:41:12<24:36:42, 7.64s/it, loss=0.0259, acc=0.9537, iter_time=7.29s]
Epoch 0: 6%|▋ | 793/12384 [1:41:12<24:35:23, 7.64s/it, loss=0.0259, acc=0.9537, iter_time=7.29s]
Epoch 0: 6%|▋ | 793/12384 [1:41:20<24:35:23, 7.64s/it, loss=0.0289, acc=0.9530, iter_time=7.62s]
Epoch 0: 6%|▋ | 794/12384 [1:41:20<24:34:26, 7.63s/it, loss=0.0289, acc=0.9530, iter_time=7.62s]
Epoch 0: 6%|▋ | 794/12384 [1:41:27<24:34:26, 7.63s/it, loss=0.0270, acc=0.9490, iter_time=7.63s]
Epoch 0: 6%|▋ | 795/12384 [1:41:27<24:32:28, 7.62s/it, loss=0.0270, acc=0.9490, iter_time=7.63s]
Epoch 0: 6%|▋ | 795/12384 [1:41:35<24:32:28, 7.62s/it, loss=0.0203, acc=0.9541, iter_time=6.98s]
Epoch 0: 6%|▋ | 796/12384 [1:41:35<24:34:21, 7.63s/it, loss=0.0203, acc=0.9541, iter_time=6.98s]
Epoch 0: 6%|▋ | 796/12384 [1:41:43<24:34:21, 7.63s/it, loss=0.0223, acc=0.9582, iter_time=7.37s]
Epoch 0: 6%|▋ | 797/12384 [1:41:43<24:55:27, 7.74s/it, loss=0.0223, acc=0.9582, iter_time=7.37s]
Epoch 0: 6%|▋ | 797/12384 [1:41:51<24:55:27, 7.74s/it, loss=0.0206, acc=0.9566, iter_time=7.97s]
Epoch 0: 6%|▋ | 798/12384 [1:41:51<24:49:17, 7.71s/it, loss=0.0206, acc=0.9566, iter_time=7.97s]
Epoch 0: 6%|▋ | 798/12384 [1:41:58<24:49:17, 7.71s/it, loss=0.0391, acc=0.9308, iter_time=8.58s]
Epoch 0: 6%|▋ | 799/12384 [1:41:58<24:44:52, 7.69s/it, loss=0.0391, acc=0.9308, iter_time=8.58s]
Epoch 0: 6%|▋ | 799/12384 [1:42:06<24:44:52, 7.69s/it, loss=0.0208, acc=0.9563, iter_time=8.09s]
Epoch 0: 6%|▋ | 800/12384 [1:42:06<24:42:33, 7.68s/it, loss=0.0208, acc=0.9563, iter_time=8.09s]
Epoch 0: 6%|▋ | 800/12384 [1:42:14<24:42:33, 7.68s/it, loss=0.0147, acc=0.9859, iter_time=6.97s]
Epoch 0: 6%|▋ | 801/12384 [1:42:14<24:38:48, 7.66s/it, loss=0.0147, acc=0.9859, iter_time=6.97s]
Epoch 0: 6%|▋ | 801/12384 [1:42:21<24:38:48, 7.66s/it, loss=0.0229, acc=0.9482, iter_time=7.84s]
Epoch 0: 6%|▋ | 802/12384 [1:42:21<24:36:18, 7.65s/it, loss=0.0229, acc=0.9482, iter_time=7.84s]
Epoch 0: 6%|▋ | 802/12384 [1:42:29<24:36:18, 7.65s/it, loss=0.0218, acc=0.9426, iter_time=7.63s]
Epoch 0: 6%|▋ | 803/12384 [1:42:29<24:33:55, 7.64s/it, loss=0.0218, acc=0.9426, iter_time=7.63s]
Epoch 0: 6%|▋ | 803/12384 [1:42:36<24:33:55, 7.64s/it, loss=0.0136, acc=0.9779, iter_time=4.58s]
Epoch 0: 6%|▋ | 804/12384 [1:42:36<24:31:23, 7.62s/it, loss=0.0136, acc=0.9779, iter_time=4.58s]
Epoch 0: 6%|▋ | 804/12384 [1:42:44<24:31:23, 7.62s/it, loss=0.1282, acc=0.8586, iter_time=10.63s]
Epoch 0: 7%|▋ | 805/12384 [1:42:44<24:32:52, 7.63s/it, loss=0.1282, acc=0.8586, iter_time=10.63s]
Epoch 0: 7%|▋ | 805/12384 [1:42:52<24:32:52, 7.63s/it, loss=0.0136, acc=0.9759, iter_time=5.35s]
Epoch 0: 7%|▋ | 806/12384 [1:42:52<24:31:08, 7.62s/it, loss=0.0136, acc=0.9759, iter_time=5.35s]
Epoch 0: 7%|▋ | 806/12384 [1:42:59<24:31:08, 7.62s/it, loss=0.0248, acc=0.9474, iter_time=9.89s]
Epoch 0: 7%|▋ | 807/12384 [1:42:59<24:30:53, 7.62s/it, loss=0.0248, acc=0.9474, iter_time=9.89s]
Epoch 0: 7%|▋ | 807/12384 [1:43:07<24:30:53, 7.62s/it, loss=0.0343, acc=0.9413, iter_time=8.01s]
Epoch 0: 7%|▋ | 808/12384 [1:43:07<24:31:35, 7.63s/it, loss=0.0343, acc=0.9413, iter_time=8.01s]
Epoch 0: 7%|▋ | 808/12384 [1:43:14<24:31:35, 7.63s/it, loss=0.0203, acc=0.9623, iter_time=7.24s]
Epoch 0: 7%|▋ | 809/12384 [1:43:14<24:29:47, 7.62s/it, loss=0.0203, acc=0.9623, iter_time=7.24s]
Epoch 0: 7%|▋ | 809/12384 [1:43:22<24:29:47, 7.62s/it, loss=0.0209, acc=0.9636, iter_time=7.31s]
Epoch 0: 7%|▋ | 810/12384 [1:43:22<24:30:05, 7.62s/it, loss=0.0209, acc=0.9636, iter_time=7.31s]
Epoch 0: 7%|▋ | 810/12384 [1:43:30<24:30:05, 7.62s/it, loss=0.0101, acc=0.9779, iter_time=7.62s]
Epoch 0: 7%|▋ | 811/12384 [1:43:30<24:29:12, 7.62s/it, loss=0.0101, acc=0.9779, iter_time=7.62s]
Epoch 0: 7%|▋ | 811/12384 [1:43:37<24:29:12, 7.62s/it, loss=0.0137, acc=0.9719, iter_time=7.92s]
Epoch 0: 7%|▋ | 812/12384 [1:43:37<24:29:00, 7.62s/it, loss=0.0137, acc=0.9719, iter_time=7.92s]
Epoch 0: 7%|▋ | 812/12384 [1:43:45<24:29:00, 7.62s/it, loss=0.0200, acc=0.9688, iter_time=6.11s]
Epoch 0: 7%|▋ | 813/12384 [1:43:45<24:28:13, 7.61s/it, loss=0.0200, acc=0.9688, iter_time=6.11s]
Epoch 0: 7%|▋ | 813/12384 [1:43:53<24:28:13, 7.61s/it, loss=0.0177, acc=0.9663, iter_time=9.11s]
Epoch 0: 7%|▋ | 814/12384 [1:43:53<24:31:41, 7.63s/it, loss=0.0177, acc=0.9663, iter_time=9.11s]
Epoch 0: 7%|▋ | 814/12384 [1:44:00<24:31:41, 7.63s/it, loss=0.0262, acc=0.9547, iter_time=7.69s]
Epoch 0: 7%|▋ | 815/12384 [1:44:00<24:31:52, 7.63s/it, loss=0.0262, acc=0.9547, iter_time=7.69s]
Epoch 0: 7%|▋ | 815/12384 [1:44:08<24:31:52, 7.63s/it, loss=0.0173, acc=0.9666, iter_time=8.01s]
Epoch 0: 7%|▋ | 816/12384 [1:44:08<24:30:53, 7.63s/it, loss=0.0173, acc=0.9666, iter_time=8.01s]
Epoch 0: 7%|▋ | 816/12384 [1:44:16<24:30:53, 7.63s/it, loss=0.0208, acc=0.9611, iter_time=7.25s]
Epoch 0: 7%|▋ | 817/12384 [1:44:16<24:32:36, 7.64s/it, loss=0.0208, acc=0.9611, iter_time=7.25s]
Epoch 0: 7%|▋ | 817/12384 [1:44:23<24:32:36, 7.64s/it, loss=0.0165, acc=0.9687, iter_time=7.67s]
Epoch 0: 7%|▋ | 818/12384 [1:44:23<24:32:21, 7.64s/it, loss=0.0165, acc=0.9687, iter_time=7.67s]
Epoch 0: 7%|▋ | 818/12384 [1:44:31<24:32:21, 7.64s/it, loss=0.0184, acc=0.9669, iter_time=7.34s]
Epoch 0: 7%|▋ | 819/12384 [1:44:31<24:32:55, 7.64s/it, loss=0.0184, acc=0.9669, iter_time=7.34s]
Epoch 0: 7%|▋ | 819/12384 [1:44:38<24:32:55, 7.64s/it, loss=0.0115, acc=0.9805, iter_time=7.94s]
Epoch 0: 7%|▋ | 820/12384 [1:44:38<24:33:14, 7.64s/it, loss=0.0115, acc=0.9805, iter_time=7.94s]
Epoch 0: 7%|▋ | 820/12384 [1:44:46<24:33:14, 7.64s/it, loss=0.0213, acc=0.9653, iter_time=7.65s]
Epoch 0: 7%|▋ | 821/12384 [1:44:46<24:33:30, 7.65s/it, loss=0.0213, acc=0.9653, iter_time=7.65s]
Epoch 0: 7%|▋ | 821/12384 [1:44:54<24:33:30, 7.65s/it, loss=0.0548, acc=0.9306, iter_time=7.63s]
Epoch 0: 7%|▋ | 822/12384 [1:44:54<24:30:32, 7.63s/it, loss=0.0548, acc=0.9306, iter_time=7.63s]
Epoch 0: 7%|▋ | 822/12384 [1:45:01<24:30:32, 7.63s/it, loss=0.0178, acc=0.9735, iter_time=7.62s]
Epoch 0: 7%|▋ | 823/12384 [1:45:01<24:30:45, 7.63s/it, loss=0.0178, acc=0.9735, iter_time=7.62s]
Epoch 0: 7%|▋ | 823/12384 [1:45:09<24:30:45, 7.63s/it, loss=0.0151, acc=0.9684, iter_time=8.33s]
Epoch 0: 7%|▋ | 824/12384 [1:45:09<24:54:14, 7.76s/it, loss=0.0151, acc=0.9684, iter_time=8.33s]
Epoch 0: 7%|▋ | 824/12384 [1:45:17<24:54:14, 7.76s/it, loss=0.0110, acc=0.9790, iter_time=7.35s]
Epoch 0: 7%|▋ | 825/12384 [1:45:17<24:45:43, 7.71s/it, loss=0.0110, acc=0.9790, iter_time=7.35s]
Epoch 0: 7%|▋ | 825/12384 [1:45:25<24:45:43, 7.71s/it, loss=0.0301, acc=0.9566, iter_time=7.61s]
Epoch 0: 7%|▋ | 826/12384 [1:45:25<24:41:51, 7.69s/it, loss=0.0301, acc=0.9566, iter_time=7.61s]
Epoch 0: 7%|▋ | 826/12384 [1:45:32<24:41:51, 7.69s/it, loss=0.0191, acc=0.9618, iter_time=7.65s]
Epoch 0: 7%|▋ | 827/12384 [1:45:32<24:39:56, 7.68s/it, loss=0.0191, acc=0.9618, iter_time=7.65s]
Epoch 0: 7%|▋ | 827/12384 [1:45:40<24:39:56, 7.68s/it, loss=0.0231, acc=0.9660, iter_time=7.66s]
Epoch 0: 7%|▋ | 828/12384 [1:45:40<24:37:35, 7.67s/it, loss=0.0231, acc=0.9660, iter_time=7.66s]
Epoch 0: 7%|▋ | 828/12384 [1:45:48<24:37:35, 7.67s/it, loss=0.0083, acc=0.9900, iter_time=4.25s]
Epoch 0: 7%|▋ | 829/12384 [1:45:48<24:37:24, 7.67s/it, loss=0.0083, acc=0.9900, iter_time=4.25s]
Epoch 0: 7%|▋ | 829/12384 [1:45:55<24:37:24, 7.67s/it, loss=0.0175, acc=0.9750, iter_time=11.07s]
Epoch 0: 7%|▋ | 830/12384 [1:45:55<24:35:23, 7.66s/it, loss=0.0175, acc=0.9750, iter_time=11.07s]
Epoch 0: 7%|▋ | 830/12384 [1:46:03<24:35:23, 7.66s/it, loss=0.0138, acc=0.9700, iter_time=5.81s]
Epoch 0: 7%|▋ | 831/12384 [1:46:03<24:32:21, 7.65s/it, loss=0.0138, acc=0.9700, iter_time=5.81s]
Epoch 0: 7%|▋ | 831/12384 [1:46:10<24:32:21, 7.65s/it, loss=0.0289, acc=0.9414, iter_time=9.79s]
Epoch 0: 7%|▋ | 832/12384 [1:46:10<24:31:03, 7.64s/it, loss=0.0289, acc=0.9414, iter_time=9.79s]
Epoch 0: 7%|▋ | 832/12384 [1:46:18<24:31:03, 7.64s/it, loss=0.0426, acc=0.9357, iter_time=7.28s]
Epoch 0: 7%|▋ | 833/12384 [1:46:18<24:30:12, 7.64s/it, loss=0.0426, acc=0.9357, iter_time=7.28s]
Epoch 0: 7%|▋ | 833/12384 [1:46:26<24:30:12, 7.64s/it, loss=0.0132, acc=0.9743, iter_time=7.62s]
Epoch 0: 7%|▋ | 834/12384 [1:46:26<24:28:12, 7.63s/it, loss=0.0132, acc=0.9743, iter_time=7.62s]
Epoch 0: 7%|▋ | 834/12384 [1:46:33<24:28:12, 7.63s/it, loss=0.0149, acc=0.9719, iter_time=7.60s]
Epoch 0: 7%|▋ | 835/12384 [1:46:33<24:31:57, 7.65s/it, loss=0.0149, acc=0.9719, iter_time=7.60s]
Epoch 0: 7%|▋ | 835/12384 [1:46:41<24:31:57, 7.65s/it, loss=0.0825, acc=0.8881, iter_time=7.70s]
Epoch 0: 7%|▋ | 836/12384 [1:46:41<24:31:48, 7.65s/it, loss=0.0825, acc=0.8881, iter_time=7.70s]
Epoch 0: 7%|▋ | 836/12384 [1:46:49<24:31:48, 7.65s/it, loss=0.0171, acc=0.9772, iter_time=7.65s]
Epoch 0: 7%|▋ | 837/12384 [1:46:49<24:29:26, 7.64s/it, loss=0.0171, acc=0.9772, iter_time=7.65s]
Epoch 0: 7%|▋ | 837/12384 [1:46:56<24:29:26, 7.64s/it, loss=0.0180, acc=0.9716, iter_time=7.30s]
Epoch 0: 7%|▋ | 838/12384 [1:46:56<24:31:59, 7.65s/it, loss=0.0180, acc=0.9716, iter_time=7.30s]
Epoch 0: 7%|▋ | 838/12384 [1:47:04<24:31:59, 7.65s/it, loss=0.0183, acc=0.9586, iter_time=8.00s]
Epoch 0: 7%|▋ | 839/12384 [1:47:04<24:30:42, 7.64s/it, loss=0.0183, acc=0.9586, iter_time=8.00s]
Epoch 0: 7%|▋ | 839/12384 [1:47:12<24:30:42, 7.64s/it, loss=0.0253, acc=0.9593, iter_time=8.01s]
Epoch 0: 7%|▋ | 840/12384 [1:47:12<24:28:48, 7.63s/it, loss=0.0253, acc=0.9593, iter_time=8.01s]
Epoch 0: 7%|▋ | 840/12384 [1:47:19<24:28:48, 7.63s/it, loss=0.0115, acc=0.9781, iter_time=6.90s]
Epoch 0: 7%|▋ | 841/12384 [1:47:19<24:27:11, 7.63s/it, loss=0.0115, acc=0.9781, iter_time=6.90s]
Epoch 0: 7%|▋ | 841/12384 [1:47:27<24:27:11, 7.63s/it, loss=0.0146, acc=0.9697, iter_time=3.73s]
Epoch 0: 7%|▋ | 842/12384 [1:47:27<24:25:26, 7.62s/it, loss=0.0146, acc=0.9697, iter_time=3.73s]
Epoch 0: 7%|▋ | 842/12384 [1:47:34<24:25:26, 7.62s/it, loss=0.0187, acc=0.9620, iter_time=11.78s]
Epoch 0: 7%|▋ | 843/12384 [1:47:34<24:24:37, 7.61s/it, loss=0.0187, acc=0.9620, iter_time=11.78s]
Epoch 0: 7%|▋ | 843/12384 [1:47:42<24:24:37, 7.61s/it, loss=0.0183, acc=0.9614, iter_time=7.62s]
Epoch 0: 7%|▋ | 844/12384 [1:47:42<24:26:51, 7.63s/it, loss=0.0183, acc=0.9614, iter_time=7.62s]
Epoch 0: 7%|▋ | 844/12384 [1:47:50<24:26:51, 7.63s/it, loss=0.0190, acc=0.9616, iter_time=7.65s]
Epoch 0: 7%|▋ | 845/12384 [1:47:50<24:25:37, 7.62s/it, loss=0.0190, acc=0.9616, iter_time=7.65s]
Epoch 0: 7%|▋ | 845/12384 [1:47:57<24:25:37, 7.62s/it, loss=0.0199, acc=0.9600, iter_time=7.62s]
Epoch 0: 7%|▋ | 846/12384 [1:47:57<24:25:50, 7.62s/it, loss=0.0199, acc=0.9600, iter_time=7.62s]
Epoch 0: 7%|▋ | 846/12384 [1:48:05<24:25:50, 7.62s/it, loss=0.0185, acc=0.9690, iter_time=7.63s]
Epoch 0: 7%|▋ | 847/12384 [1:48:05<24:27:53, 7.63s/it, loss=0.0185, acc=0.9690, iter_time=7.63s]
Epoch 0: 7%|▋ | 847/12384 [1:48:13<24:27:53, 7.63s/it, loss=0.0248, acc=0.9542, iter_time=8.02s]
Epoch 0: 7%|▋ | 848/12384 [1:48:13<24:25:41, 7.62s/it, loss=0.0248, acc=0.9542, iter_time=8.02s]
Epoch 0: 7%|▋ | 848/12384 [1:48:20<24:25:41, 7.62s/it, loss=0.0102, acc=0.9843, iter_time=6.91s]
Epoch 0: 7%|▋ | 849/12384 [1:48:20<24:25:20, 7.62s/it, loss=0.0102, acc=0.9843, iter_time=6.91s]
Epoch 0: 7%|▋ | 849/12384 [1:48:28<24:25:20, 7.62s/it, loss=0.0156, acc=0.9599, iter_time=8.69s]
Epoch 0: 7%|▋ | 850/12384 [1:48:28<24:45:13, 7.73s/it, loss=0.0156, acc=0.9599, iter_time=8.69s]
Epoch 0: 7%|▋ | 850/12384 [1:48:36<24:45:13, 7.73s/it, loss=0.0109, acc=0.9779, iter_time=4.39s]
Epoch 0: 7%|▋ | 851/12384 [1:48:36<24:40:36, 7.70s/it, loss=0.0109, acc=0.9779, iter_time=4.39s]
Epoch 0: 7%|▋ | 851/12384 [1:48:43<24:40:36, 7.70s/it, loss=0.0097, acc=0.9877, iter_time=10.13s]
Epoch 0: 7%|▋ | 852/12384 [1:48:43<24:34:49, 7.67s/it, loss=0.0097, acc=0.9877, iter_time=10.13s]
Epoch 0: 7%|▋ | 852/12384 [1:48:51<24:34:49, 7.67s/it, loss=0.0090, acc=0.9889, iter_time=7.93s]
Epoch 0: 7%|▋ | 853/12384 [1:48:51<24:32:00, 7.66s/it, loss=0.0090, acc=0.9889, iter_time=7.93s]
Epoch 0: 7%|▋ | 853/12384 [1:48:59<24:32:00, 7.66s/it, loss=0.0139, acc=0.9684, iter_time=7.64s]
Epoch 0: 7%|▋ | 854/12384 [1:48:59<24:30:48, 7.65s/it, loss=0.0139, acc=0.9684, iter_time=7.64s]
Epoch 0: 7%|▋ | 854/12384 [1:49:06<24:30:48, 7.65s/it, loss=0.0155, acc=0.9751, iter_time=7.05s]
Epoch 0: 7%|▋ | 855/12384 [1:49:06<24:31:08, 7.66s/it, loss=0.0155, acc=0.9751, iter_time=7.05s]
Epoch 0: 7%|▋ | 855/12384 [1:49:14<24:31:08, 7.66s/it, loss=0.0106, acc=0.9826, iter_time=8.23s]
Epoch 0: 7%|▋ | 856/12384 [1:49:14<24:30:33, 7.65s/it, loss=0.0106, acc=0.9826, iter_time=8.23s]
Epoch 0: 7%|▋ | 856/12384 [1:49:22<24:30:33, 7.65s/it, loss=0.0139, acc=0.9761, iter_time=4.62s]
Epoch 0: 7%|▋ | 857/12384 [1:49:22<24:29:09, 7.65s/it, loss=0.0139, acc=0.9761, iter_time=4.62s]
Epoch 0: 7%|▋ | 857/12384 [1:49:29<24:29:09, 7.65s/it, loss=0.0123, acc=0.9790, iter_time=10.65s]
Epoch 0: 7%|▋ | 858/12384 [1:49:29<24:27:52, 7.64s/it, loss=0.0123, acc=0.9790, iter_time=10.65s]
Epoch 0: 7%|▋ | 858/12384 [1:49:37<24:27:52, 7.64s/it, loss=0.0113, acc=0.9809, iter_time=7.63s]
Epoch 0: 7%|▋ | 859/12384 [1:49:37<24:25:10, 7.63s/it, loss=0.0113, acc=0.9809, iter_time=7.63s]
Epoch 0: 7%|▋ | 859/12384 [1:49:44<24:25:10, 7.63s/it, loss=0.0244, acc=0.9623, iter_time=7.63s]
Epoch 0: 7%|▋ | 860/12384 [1:49:44<24:25:51, 7.63s/it, loss=0.0244, acc=0.9623, iter_time=7.63s]
Epoch 0: 7%|▋ | 860/12384 [1:49:52<24:25:51, 7.63s/it, loss=0.0264, acc=0.9585, iter_time=7.64s]
Epoch 0: 7%|▋ | 861/12384 [1:49:52<24:25:31, 7.63s/it, loss=0.0264, acc=0.9585, iter_time=7.64s]
Epoch 0: 7%|▋ | 861/12384 [1:50:00<24:25:31, 7.63s/it, loss=0.0170, acc=0.9770, iter_time=7.30s]
Epoch 0: 7%|▋ | 862/12384 [1:50:00<24:24:35, 7.63s/it, loss=0.0170, acc=0.9770, iter_time=7.30s]
Epoch 0: 7%|▋ | 862/12384 [1:50:07<24:24:35, 7.63s/it, loss=0.0183, acc=0.9607, iter_time=7.92s]
Epoch 0: 7%|▋ | 863/12384 [1:50:07<24:22:44, 7.62s/it, loss=0.0183, acc=0.9607, iter_time=7.92s]
Epoch 0: 7%|▋ | 863/12384 [1:50:15<24:22:44, 7.62s/it, loss=0.0102, acc=0.9789, iter_time=8.00s]
Epoch 0: 7%|▋ | 864/12384 [1:50:15<24:27:43, 7.64s/it, loss=0.0102, acc=0.9789, iter_time=8.00s]
Epoch 0: 7%|▋ | 864/12384 [1:50:23<24:27:43, 7.64s/it, loss=0.0188, acc=0.9524, iter_time=7.31s]
Epoch 0: 7%|▋ | 865/12384 [1:50:23<24:31:50, 7.67s/it, loss=0.0188, acc=0.9524, iter_time=7.31s]
Epoch 0: 7%|▋ | 865/12384 [1:50:30<24:31:50, 7.67s/it, loss=0.0153, acc=0.9746, iter_time=4.41s]
Epoch 0: 7%|▋ | 866/12384 [1:50:30<24:28:25, 7.65s/it, loss=0.0153, acc=0.9746, iter_time=4.41s]
Epoch 0: 7%|▋ | 866/12384 [1:50:38<24:28:25, 7.65s/it, loss=0.0112, acc=0.9766, iter_time=10.92s]
Epoch 0: 7%|▋ | 867/12384 [1:50:38<24:29:13, 7.65s/it, loss=0.0112, acc=0.9766, iter_time=10.92s]
Epoch 0: 7%|▋ | 867/12384 [1:50:46<24:29:13, 7.65s/it, loss=0.0185, acc=0.9797, iter_time=7.67s]
Epoch 0: 7%|▋ | 868/12384 [1:50:46<24:29:22, 7.66s/it, loss=0.0185, acc=0.9797, iter_time=7.67s]
Epoch 0: 7%|▋ | 868/12384 [1:50:53<24:29:22, 7.66s/it, loss=0.0243, acc=0.9345, iter_time=5.87s]
Epoch 0: 7%|▋ | 869/12384 [1:50:53<24:29:02, 7.65s/it, loss=0.0243, acc=0.9345, iter_time=5.87s]
Epoch 0: 7%|▋ | 869/12384 [1:51:01<24:29:02, 7.65s/it, loss=0.0124, acc=0.9805, iter_time=9.45s]
Epoch 0: 7%|▋ | 870/12384 [1:51:01<24:29:59, 7.66s/it, loss=0.0124, acc=0.9805, iter_time=9.45s]
Epoch 0: 7%|▋ | 870/12384 [1:51:09<24:29:59, 7.66s/it, loss=0.0180, acc=0.9692, iter_time=7.66s]
Epoch 0: 7%|▋ | 871/12384 [1:51:09<24:29:34, 7.66s/it, loss=0.0180, acc=0.9692, iter_time=7.66s]
Epoch 0: 7%|▋ | 871/12384 [1:51:16<24:29:34, 7.66s/it, loss=0.0118, acc=0.9705, iter_time=8.04s]
Epoch 0: 7%|▋ | 872/12384 [1:51:16<24:26:10, 7.64s/it, loss=0.0118, acc=0.9705, iter_time=8.04s]
Epoch 0: 7%|▋ | 872/12384 [1:51:24<24:26:10, 7.64s/it, loss=0.0069, acc=0.9855, iter_time=7.21s]
Epoch 0: 7%|▋ | 873/12384 [1:51:24<24:25:22, 7.64s/it, loss=0.0069, acc=0.9855, iter_time=7.21s]
Epoch 0: 7%|▋ | 873/12384 [1:51:32<24:25:22, 7.64s/it, loss=0.0156, acc=0.9652, iter_time=7.65s]
Epoch 0: 7%|▋ | 874/12384 [1:51:32<24:25:17, 7.64s/it, loss=0.0156, acc=0.9652, iter_time=7.65s]
Epoch 0: 7%|▋ | 874/12384 [1:51:39<24:25:17, 7.64s/it, loss=0.0104, acc=0.9822, iter_time=6.18s]
Epoch 0: 7%|▋ | 875/12384 [1:51:39<24:22:57, 7.63s/it, loss=0.0104, acc=0.9822, iter_time=6.18s]
Epoch 0: 7%|▋ | 875/12384 [1:51:47<24:22:57, 7.63s/it, loss=0.0386, acc=0.9483, iter_time=6.50s]
Epoch 0: 7%|▋ | 876/12384 [1:51:47<24:22:17, 7.62s/it, loss=0.0386, acc=0.9483, iter_time=6.50s]
Epoch 0: 7%|▋ | 876/12384 [1:51:55<24:22:17, 7.62s/it, loss=0.0079, acc=0.9851, iter_time=7.63s]
Epoch 0: 7%|▋ | 877/12384 [1:51:55<24:41:25, 7.72s/it, loss=0.0079, acc=0.9851, iter_time=7.63s]
Epoch 0: 7%|▋ | 877/12384 [1:52:02<24:41:25, 7.72s/it, loss=0.0182, acc=0.9646, iter_time=9.54s]
Epoch 0: 7%|▋ | 878/12384 [1:52:02<24:35:23, 7.69s/it, loss=0.0182, acc=0.9646, iter_time=9.54s]
Epoch 0: 7%|▋ | 878/12384 [1:52:10<24:35:23, 7.69s/it, loss=0.0433, acc=0.9516, iter_time=7.45s]
Epoch 0: 7%|▋ | 879/12384 [1:52:10<24:32:25, 7.68s/it, loss=0.0433, acc=0.9516, iter_time=7.45s]
Epoch 0: 7%|▋ | 879/12384 [1:52:18<24:32:25, 7.68s/it, loss=0.0351, acc=0.9565, iter_time=9.15s]
Epoch 0: 7%|▋ | 880/12384 [1:52:18<24:29:23, 7.66s/it, loss=0.0351, acc=0.9565, iter_time=9.15s]
Epoch 0: 7%|▋ | 880/12384 [1:52:25<24:29:23, 7.66s/it, loss=0.0080, acc=0.9885, iter_time=7.25s]
Epoch 0: 7%|▋ | 881/12384 [1:52:25<24:25:23, 7.64s/it, loss=0.0080, acc=0.9885, iter_time=7.25s]
Epoch 0: 7%|▋ | 881/12384 [1:52:33<24:25:23, 7.64s/it, loss=0.0067, acc=0.9919, iter_time=5.03s]
Epoch 0: 7%|▋ | 882/12384 [1:52:33<24:25:18, 7.64s/it, loss=0.0067, acc=0.9919, iter_time=5.03s]
Epoch 0: 7%|▋ | 882/12384 [1:52:41<24:25:18, 7.64s/it, loss=0.0187, acc=0.9653, iter_time=10.24s]
Epoch 0: 7%|▋ | 883/12384 [1:52:41<24:27:27, 7.66s/it, loss=0.0187, acc=0.9653, iter_time=10.24s]
Epoch 0: 7%|▋ | 883/12384 [1:52:48<24:27:27, 7.66s/it, loss=0.0916, acc=0.8901, iter_time=7.66s]
Epoch 0: 7%|▋ | 884/12384 [1:52:48<24:27:57, 7.66s/it, loss=0.0916, acc=0.8901, iter_time=7.66s]
Epoch 0: 7%|▋ | 884/12384 [1:52:56<24:27:57, 7.66s/it, loss=0.0093, acc=0.9872, iter_time=4.27s]
Epoch 0: 7%|▋ | 885/12384 [1:52:56<24:26:06, 7.65s/it, loss=0.0093, acc=0.9872, iter_time=4.27s]
Epoch 0: 7%|▋ | 885/12384 [1:53:03<24:26:06, 7.65s/it, loss=0.0097, acc=0.9795, iter_time=11.03s]
Epoch 0: 7%|▋ | 886/12384 [1:53:03<24:24:13, 7.64s/it, loss=0.0097, acc=0.9795, iter_time=11.03s]
Epoch 0: 7%|▋ | 886/12384 [1:53:11<24:24:13, 7.64s/it, loss=0.0123, acc=0.9842, iter_time=7.60s]
Epoch 0: 7%|▋ | 887/12384 [1:53:11<24:22:34, 7.63s/it, loss=0.0123, acc=0.9842, iter_time=7.60s]
Epoch 0: 7%|▋ | 887/12384 [1:53:19<24:22:34, 7.63s/it, loss=0.0123, acc=0.9846, iter_time=7.74s]
Epoch 0: 7%|▋ | 888/12384 [1:53:19<24:22:31, 7.63s/it, loss=0.0123, acc=0.9846, iter_time=7.74s]
Epoch 0: 7%|▋ | 888/12384 [1:53:26<24:22:31, 7.63s/it, loss=0.0083, acc=0.9848, iter_time=3.98s]
Epoch 0: 7%|▋ | 889/12384 [1:53:26<24:21:08, 7.63s/it, loss=0.0083, acc=0.9848, iter_time=3.98s]
Epoch 0: 7%|▋ | 889/12384 [1:53:34<24:21:08, 7.63s/it, loss=0.0099, acc=0.9743, iter_time=8.59s]
Epoch 0: 7%|▋ | 890/12384 [1:53:34<24:21:46, 7.63s/it, loss=0.0099, acc=0.9743, iter_time=8.59s]
Epoch 0: 7%|▋ | 890/12384 [1:53:42<24:21:46, 7.63s/it, loss=0.0048, acc=0.9982, iter_time=10.18s]
Epoch 0: 7%|▋ | 891/12384 [1:53:42<24:21:03, 7.63s/it, loss=0.0048, acc=0.9982, iter_time=10.18s]
Epoch 0: 7%|▋ | 891/12384 [1:53:49<24:21:03, 7.63s/it, loss=0.0110, acc=0.9736, iter_time=4.82s]
Epoch 0: 7%|▋ | 892/12384 [1:53:49<24:19:20, 7.62s/it, loss=0.0110, acc=0.9736, iter_time=4.82s]
Epoch 0: 7%|▋ | 892/12384 [1:53:57<24:19:20, 7.62s/it, loss=0.0163, acc=0.9813, iter_time=10.40s]
Epoch 0: 7%|▋ | 893/12384 [1:53:57<24:17:30, 7.61s/it, loss=0.0163, acc=0.9813, iter_time=10.40s]
Epoch 0: 7%|▋ | 893/12384 [1:54:04<24:17:30, 7.61s/it, loss=0.0304, acc=0.9713, iter_time=3.85s]
Epoch 0: 7%|▋ | 894/12384 [1:54:04<24:19:22, 7.62s/it, loss=0.0304, acc=0.9713, iter_time=3.85s]
Epoch 0: 7%|▋ | 894/12384 [1:54:12<24:19:22, 7.62s/it, loss=0.0085, acc=0.9878, iter_time=11.38s]
Epoch 0: 7%|▋ | 895/12384 [1:54:12<24:18:12, 7.62s/it, loss=0.0085, acc=0.9878, iter_time=11.38s]
Epoch 0: 7%|▋ | 895/12384 [1:54:20<24:18:12, 7.62s/it, loss=0.0163, acc=0.9603, iter_time=8.03s]
Epoch 0: 7%|▋ | 896/12384 [1:54:20<24:18:28, 7.62s/it, loss=0.0163, acc=0.9603, iter_time=8.03s]
Epoch 0: 7%|▋ | 896/12384 [1:54:27<24:18:28, 7.62s/it, loss=0.0134, acc=0.9753, iter_time=7.22s]
Epoch 0: 7%|▋ | 897/12384 [1:54:27<24:20:59, 7.63s/it, loss=0.0134, acc=0.9753, iter_time=7.22s]
Epoch 0: 7%|▋ | 897/12384 [1:54:35<24:20:59, 7.63s/it, loss=0.0070, acc=0.9910, iter_time=7.17s]
Epoch 0: 7%|▋ | 898/12384 [1:54:35<24:25:03, 7.65s/it, loss=0.0070, acc=0.9910, iter_time=7.17s]
Epoch 0: 7%|▋ | 898/12384 [1:54:43<24:25:03, 7.65s/it, loss=0.0069, acc=0.9903, iter_time=8.19s]
Epoch 0: 7%|▋ | 899/12384 [1:54:43<24:23:12, 7.64s/it, loss=0.0069, acc=0.9903, iter_time=8.19s]
Epoch 0: 7%|▋ | 899/12384 [1:54:50<24:23:12, 7.64s/it, loss=0.0056, acc=0.9915, iter_time=8.05s]
Epoch 0: 7%|▋ | 900/12384 [1:54:50<24:22:19, 7.64s/it, loss=0.0056, acc=0.9915, iter_time=8.05s]
Epoch 0: 7%|▋ | 900/12384 [1:54:58<24:22:19, 7.64s/it, loss=0.0070, acc=0.9881, iter_time=7.21s]
Epoch 0: 7%|▋ | 901/12384 [1:54:58<24:24:29, 7.65s/it, loss=0.0070, acc=0.9881, iter_time=7.21s]
Epoch 0: 7%|▋ | 901/12384 [1:55:06<24:24:29, 7.65s/it, loss=0.0109, acc=0.9777, iter_time=7.67s]
Epoch 0: 7%|▋ | 902/12384 [1:55:06<24:21:26, 7.64s/it, loss=0.0109, acc=0.9777, iter_time=7.67s]
Epoch 0: 7%|▋ | 902/12384 [1:55:13<24:21:26, 7.64s/it, loss=0.0091, acc=0.9803, iter_time=7.94s]
Epoch 0: 7%|▋ | 903/12384 [1:55:13<24:41:11, 7.74s/it, loss=0.0091, acc=0.9803, iter_time=7.94s]
Epoch 0: 7%|▋ | 903/12384 [1:55:21<24:41:11, 7.74s/it, loss=0.0026, acc=0.9954, iter_time=7.63s]
Epoch 0: 7%|▋ | 904/12384 [1:55:21<24:35:18, 7.71s/it, loss=0.0026, acc=0.9954, iter_time=7.63s]
Epoch 0: 7%|▋ | 904/12384 [1:55:29<24:35:18, 7.71s/it, loss=0.0046, acc=0.9914, iter_time=7.64s]
Epoch 0: 7%|▋ | 905/12384 [1:55:29<24:30:44, 7.69s/it, loss=0.0046, acc=0.9914, iter_time=7.64s]
Epoch 0: 7%|▋ | 905/12384 [1:55:36<24:30:44, 7.69s/it, loss=0.0099, acc=0.9801, iter_time=5.55s]
Epoch 0: 7%|▋ | 906/12384 [1:55:36<24:27:25, 7.67s/it, loss=0.0099, acc=0.9801, iter_time=5.55s]
Epoch 0: 7%|▋ | 906/12384 [1:55:44<24:27:25, 7.67s/it, loss=0.0061, acc=0.9900, iter_time=7.19s]
Epoch 0: 7%|▋ | 907/12384 [1:55:44<24:23:42, 7.65s/it, loss=0.0061, acc=0.9900, iter_time=7.19s]
Epoch 0: 7%|▋ | 907/12384 [1:55:52<24:23:42, 7.65s/it, loss=0.0144, acc=0.9691, iter_time=8.66s]
Epoch 0: 7%|▋ | 908/12384 [1:55:52<24:23:25, 7.65s/it, loss=0.0144, acc=0.9691, iter_time=8.66s]
Epoch 0: 7%|▋ | 908/12384 [1:55:59<24:23:25, 7.65s/it, loss=0.0047, acc=0.9894, iter_time=6.57s]
Epoch 0: 7%|▋ | 909/12384 [1:55:59<24:21:01, 7.64s/it, loss=0.0047, acc=0.9894, iter_time=6.57s]
Epoch 0: 7%|▋ | 909/12384 [1:56:07<24:21:01, 7.64s/it, loss=0.0067, acc=0.9882, iter_time=10.20s]
Epoch 0: 7%|▋ | 910/12384 [1:56:07<24:21:33, 7.64s/it, loss=0.0067, acc=0.9882, iter_time=10.20s]
Epoch 0: 7%|▋ | 910/12384 [1:56:15<24:21:33, 7.64s/it, loss=0.0257, acc=0.9608, iter_time=7.64s]
Epoch 0: 7%|▋ | 911/12384 [1:56:15<24:20:38, 7.64s/it, loss=0.0257, acc=0.9608, iter_time=7.64s]
Epoch 0: 7%|▋ | 911/12384 [1:56:22<24:20:38, 7.64s/it, loss=0.0071, acc=0.9838, iter_time=8.03s]
Epoch 0: 7%|▋ | 912/12384 [1:56:22<24:19:40, 7.63s/it, loss=0.0071, acc=0.9838, iter_time=8.03s]
Epoch 0: 7%|▋ | 912/12384 [1:56:30<24:19:40, 7.63s/it, loss=0.0060, acc=0.9953, iter_time=7.23s]
Epoch 0: 7%|▋ | 913/12384 [1:56:30<24:20:15, 7.64s/it, loss=0.0060, acc=0.9953, iter_time=7.23s]
Epoch 0: 7%|▋ | 913/12384 [1:56:37<24:20:15, 7.64s/it, loss=0.0149, acc=0.9700, iter_time=5.56s]
Epoch 0: 7%|▋ | 914/12384 [1:56:37<24:22:47, 7.65s/it, loss=0.0149, acc=0.9700, iter_time=5.56s]
Epoch 0: 7%|▋ | 914/12384 [1:56:45<24:22:47, 7.65s/it, loss=0.0048, acc=0.9880, iter_time=9.76s]
Epoch 0: 7%|▋ | 915/12384 [1:56:45<24:23:39, 7.66s/it, loss=0.0048, acc=0.9880, iter_time=9.76s]
Epoch 0: 7%|▋ | 915/12384 [1:56:53<24:23:39, 7.66s/it, loss=0.0040, acc=0.9897, iter_time=7.67s]
Epoch 0: 7%|▋ | 916/12384 [1:56:53<24:20:39, 7.64s/it, loss=0.0040, acc=0.9897, iter_time=7.67s]
Epoch 0: 7%|▋ | 916/12384 [1:57:00<24:20:39, 7.64s/it, loss=0.0328, acc=0.9407, iter_time=7.62s]
Epoch 0: 7%|▋ | 917/12384 [1:57:00<24:20:57, 7.64s/it, loss=0.0328, acc=0.9407, iter_time=7.62s]
Epoch 0: 7%|▋ | 917/12384 [1:57:08<24:20:57, 7.64s/it, loss=0.0061, acc=0.9846, iter_time=7.63s]
Epoch 0: 7%|▋ | 918/12384 [1:57:08<24:19:24, 7.64s/it, loss=0.0061, acc=0.9846, iter_time=7.63s]
Epoch 0: 7%|▋ | 918/12384 [1:57:16<24:19:24, 7.64s/it, loss=0.0317, acc=0.9741, iter_time=5.08s]
Epoch 0: 7%|▋ | 919/12384 [1:57:16<24:19:35, 7.64s/it, loss=0.0317, acc=0.9741, iter_time=5.08s]
Epoch 0: 7%|▋ | 919/12384 [1:57:23<24:19:35, 7.64s/it, loss=0.0099, acc=0.9790, iter_time=10.11s]
Epoch 0: 7%|▋ | 920/12384 [1:57:23<24:16:38, 7.62s/it, loss=0.0099, acc=0.9790, iter_time=10.11s]
Epoch 0: 7%|▋ | 920/12384 [1:57:31<24:16:38, 7.62s/it, loss=0.0050, acc=0.9933, iter_time=7.04s]
Epoch 0: 7%|▋ | 921/12384 [1:57:31<24:17:59, 7.63s/it, loss=0.0050, acc=0.9933, iter_time=7.04s]
Epoch 0: 7%|▋ | 921/12384 [1:57:39<24:17:59, 7.63s/it, loss=0.0143, acc=0.9628, iter_time=8.27s]
Epoch 0: 7%|▋ | 922/12384 [1:57:39<24:15:17, 7.62s/it, loss=0.0143, acc=0.9628, iter_time=8.27s]
Epoch 0: 7%|▋ | 922/12384 [1:57:46<24:15:17, 7.62s/it, loss=0.0085, acc=0.9817, iter_time=4.23s]
Epoch 0: 7%|▋ | 923/12384 [1:57:46<24:15:32, 7.62s/it, loss=0.0085, acc=0.9817, iter_time=4.23s]
Epoch 0: 7%|▋ | 923/12384 [1:57:54<24:15:32, 7.62s/it, loss=0.0057, acc=0.9899, iter_time=10.97s]
Epoch 0: 7%|▋ | 924/12384 [1:57:54<24:14:32, 7.62s/it, loss=0.0057, acc=0.9899, iter_time=10.97s]
Epoch 0: 7%|▋ | 924/12384 [1:58:01<24:14:32, 7.62s/it, loss=0.0348, acc=0.9716, iter_time=7.62s]
Epoch 0: 7%|▋ | 925/12384 [1:58:01<24:14:53, 7.62s/it, loss=0.0348, acc=0.9716, iter_time=7.62s]
Epoch 0: 7%|▋ | 925/12384 [1:58:09<24:14:53, 7.62s/it, loss=0.0068, acc=0.9897, iter_time=7.64s]
Epoch 0: 7%|▋ | 926/12384 [1:58:09<24:16:13, 7.63s/it, loss=0.0068, acc=0.9897, iter_time=7.64s]
Epoch 0: 7%|▋ | 926/12384 [1:58:17<24:16:13, 7.63s/it, loss=0.0071, acc=0.9885, iter_time=5.51s]
Epoch 0: 7%|▋ | 927/12384 [1:58:17<24:14:21, 7.62s/it, loss=0.0071, acc=0.9885, iter_time=5.51s]
Epoch 0: 7%|▋ | 927/12384 [1:58:24<24:14:21, 7.62s/it, loss=0.0071, acc=0.9841, iter_time=10.09s]
Epoch 0: 7%|▋ | 928/12384 [1:58:24<24:19:26, 7.64s/it, loss=0.0071, acc=0.9841, iter_time=10.09s]
Epoch 0: 7%|▋ | 928/12384 [1:58:32<24:19:26, 7.64s/it, loss=0.0101, acc=0.9736, iter_time=7.65s]
Epoch 0: 8%|▊ | 929/12384 [1:58:32<24:38:19, 7.74s/it, loss=0.0101, acc=0.9736, iter_time=7.65s]
Epoch 0: 8%|▊ | 929/12384 [1:58:40<24:38:19, 7.74s/it, loss=0.0028, acc=0.9978, iter_time=7.65s]
Epoch 0: 8%|▊ | 930/12384 [1:58:40<24:30:26, 7.70s/it, loss=0.0028, acc=0.9978, iter_time=7.65s]
Epoch 0: 8%|▊ | 930/12384 [1:58:48<24:30:26, 7.70s/it, loss=0.0289, acc=0.9722, iter_time=7.62s]
Epoch 0: 8%|▊ | 931/12384 [1:58:48<24:27:47, 7.69s/it, loss=0.0289, acc=0.9722, iter_time=7.62s]
Epoch 0: 8%|▊ | 931/12384 [1:58:55<24:27:47, 7.69s/it, loss=0.0086, acc=0.9780, iter_time=6.47s]
Epoch 0: 8%|▊ | 932/12384 [1:58:55<24:23:26, 7.67s/it, loss=0.0086, acc=0.9780, iter_time=6.47s]
Epoch 0: 8%|▊ | 932/12384 [1:59:03<24:23:26, 7.67s/it, loss=0.0093, acc=0.9876, iter_time=8.81s]
Epoch 0: 8%|▊ | 933/12384 [1:59:03<24:21:39, 7.66s/it, loss=0.0093, acc=0.9876, iter_time=8.81s]
Epoch 0: 8%|▊ | 933/12384 [1:59:10<24:21:39, 7.66s/it, loss=0.0111, acc=0.9763, iter_time=7.62s]
Epoch 0: 8%|▊ | 934/12384 [1:59:10<24:18:29, 7.64s/it, loss=0.0111, acc=0.9763, iter_time=7.62s]
Epoch 0: 8%|▊ | 934/12384 [1:59:18<24:18:29, 7.64s/it, loss=0.0127, acc=0.9751, iter_time=7.61s]
Epoch 0: 8%|▊ | 935/12384 [1:59:18<24:22:24, 7.66s/it, loss=0.0127, acc=0.9751, iter_time=7.61s]
Epoch 0: 8%|▊ | 935/12384 [1:59:26<24:22:24, 7.66s/it, loss=0.0039, acc=0.9964, iter_time=7.69s]
Epoch 0: 8%|▊ | 936/12384 [1:59:26<24:20:33, 7.65s/it, loss=0.0039, acc=0.9964, iter_time=7.69s]
Epoch 0: 8%|▊ | 936/12384 [1:59:33<24:20:33, 7.65s/it, loss=0.0041, acc=0.9931, iter_time=7.65s]
Epoch 0: 8%|▊ | 937/12384 [1:59:33<24:18:13, 7.64s/it, loss=0.0041, acc=0.9931, iter_time=7.65s]
Epoch 0: 8%|▊ | 937/12384 [1:59:41<24:18:13, 7.64s/it, loss=0.0169, acc=0.9569, iter_time=7.64s]
Epoch 0: 8%|▊ | 938/12384 [1:59:41<24:17:14, 7.64s/it, loss=0.0169, acc=0.9569, iter_time=7.64s]
Epoch 0: 8%|▊ | 938/12384 [1:59:49<24:17:14, 7.64s/it, loss=0.0282, acc=0.9559, iter_time=7.33s]
Epoch 0: 8%|▊ | 939/12384 [1:59:49<24:17:52, 7.64s/it, loss=0.0282, acc=0.9559, iter_time=7.33s]
Epoch 0: 8%|▊ | 939/12384 [1:59:56<24:17:52, 7.64s/it, loss=0.0076, acc=0.9813, iter_time=5.94s]
Epoch 0: 8%|▊ | 940/12384 [1:59:56<24:21:19, 7.66s/it, loss=0.0076, acc=0.9813, iter_time=5.94s]
Epoch 0: 8%|▊ | 940/12384 [2:00:04<24:21:19, 7.66s/it, loss=0.0069, acc=0.9862, iter_time=6.89s]
Epoch 0: 8%|▊ | 941/12384 [2:00:04<24:19:46, 7.65s/it, loss=0.0069, acc=0.9862, iter_time=6.89s]
Epoch 0: 8%|▊ | 941/12384 [2:00:12<24:19:46, 7.65s/it, loss=0.0056, acc=0.9913, iter_time=7.31s]
Epoch 0: 8%|▊ | 942/12384 [2:00:12<24:18:49, 7.65s/it, loss=0.0056, acc=0.9913, iter_time=7.31s]
Epoch 0: 8%|▊ | 942/12384 [2:00:19<24:18:49, 7.65s/it, loss=0.0028, acc=0.9981, iter_time=7.23s]
Epoch 0: 8%|▊ | 943/12384 [2:00:19<24:17:59, 7.65s/it, loss=0.0028, acc=0.9981, iter_time=7.23s]
Epoch 0: 8%|▊ | 943/12384 [2:00:27<24:17:59, 7.65s/it, loss=0.0162, acc=0.9659, iter_time=11.58s]
Epoch 0: 8%|▊ | 944/12384 [2:00:27<24:19:31, 7.65s/it, loss=0.0162, acc=0.9659, iter_time=11.58s]
Epoch 0: 8%|▊ | 944/12384 [2:00:35<24:19:31, 7.65s/it, loss=0.0048, acc=0.9966, iter_time=7.27s]
Epoch 0: 8%|▊ | 945/12384 [2:00:35<24:18:15, 7.65s/it, loss=0.0048, acc=0.9966, iter_time=7.27s]
Epoch 0: 8%|▊ | 945/12384 [2:00:42<24:18:15, 7.65s/it, loss=0.0056, acc=0.9894, iter_time=7.64s]
Epoch 0: 8%|▊ | 946/12384 [2:00:42<24:20:59, 7.66s/it, loss=0.0056, acc=0.9894, iter_time=7.64s]
Epoch 0: 8%|▊ | 946/12384 [2:00:50<24:20:59, 7.66s/it, loss=0.0072, acc=0.9839, iter_time=7.69s]
Epoch 0: 8%|▊ | 947/12384 [2:00:50<24:21:03, 7.66s/it, loss=0.0072, acc=0.9839, iter_time=7.69s]
Epoch 0: 8%|▊ | 947/12384 [2:00:58<24:21:03, 7.66s/it, loss=0.0051, acc=0.9963, iter_time=7.37s]
Epoch 0: 8%|▊ | 948/12384 [2:00:58<24:20:27, 7.66s/it, loss=0.0051, acc=0.9963, iter_time=7.37s]
Epoch 0: 8%|▊ | 948/12384 [2:01:05<24:20:27, 7.66s/it, loss=0.0054, acc=0.9898, iter_time=7.96s]
Epoch 0: 8%|▊ | 949/12384 [2:01:05<24:19:33, 7.66s/it, loss=0.0054, acc=0.9898, iter_time=7.96s]
Epoch 0: 8%|▊ | 949/12384 [2:01:13<24:19:33, 7.66s/it, loss=0.0045, acc=0.9898, iter_time=8.10s]
Epoch 0: 8%|▊ | 950/12384 [2:01:13<24:20:07, 7.66s/it, loss=0.0045, acc=0.9898, iter_time=8.10s]
Epoch 0: 8%|▊ | 950/12384 [2:01:21<24:20:07, 7.66s/it, loss=0.0064, acc=0.9899, iter_time=7.21s]
Epoch 0: 8%|▊ | 951/12384 [2:01:21<24:19:20, 7.66s/it, loss=0.0064, acc=0.9899, iter_time=7.21s]
Epoch 0: 8%|▊ | 951/12384 [2:01:28<24:19:20, 7.66s/it, loss=0.0126, acc=0.9777, iter_time=7.60s]
Epoch 0: 8%|▊ | 952/12384 [2:01:28<24:16:31, 7.64s/it, loss=0.0126, acc=0.9777, iter_time=7.60s]
Epoch 0: 8%|▊ | 952/12384 [2:01:36<24:16:31, 7.64s/it, loss=0.0079, acc=0.9837, iter_time=6.18s]
Epoch 0: 8%|▊ | 953/12384 [2:01:36<24:14:29, 7.63s/it, loss=0.0079, acc=0.9837, iter_time=6.18s]
Epoch 0: 8%|▊ | 953/12384 [2:01:43<24:14:29, 7.63s/it, loss=0.0069, acc=0.9834, iter_time=9.07s]
Epoch 0: 8%|▊ | 954/12384 [2:01:43<24:11:46, 7.62s/it, loss=0.0069, acc=0.9834, iter_time=9.07s]
Epoch 0: 8%|▊ | 954/12384 [2:01:51<24:11:46, 7.62s/it, loss=0.0086, acc=0.9863, iter_time=5.14s]
Epoch 0: 8%|▊ | 955/12384 [2:01:51<24:31:54, 7.73s/it, loss=0.0086, acc=0.9863, iter_time=5.14s]
Epoch 0: 8%|▊ | 955/12384 [2:01:59<24:31:54, 7.73s/it, loss=0.0138, acc=0.9684, iter_time=10.44s]
Epoch 0: 8%|▊ | 956/12384 [2:01:59<24:25:35, 7.69s/it, loss=0.0138, acc=0.9684, iter_time=10.44s]
Epoch 0: 8%|▊ | 956/12384 [2:02:07<24:25:35, 7.69s/it, loss=0.0067, acc=0.9871, iter_time=7.62s]
Epoch 0: 8%|▊ | 957/12384 [2:02:07<24:21:12, 7.67s/it, loss=0.0067, acc=0.9871, iter_time=7.62s]
Epoch 0: 8%|▊ | 957/12384 [2:02:14<24:21:12, 7.67s/it, loss=0.0045, acc=0.9881, iter_time=7.62s]
Epoch 0: 8%|▊ | 958/12384 [2:02:14<24:19:15, 7.66s/it, loss=0.0045, acc=0.9881, iter_time=7.62s]
Epoch 0: 8%|▊ | 958/12384 [2:02:22<24:19:15, 7.66s/it, loss=0.0051, acc=0.9858, iter_time=7.65s]
Epoch 0: 8%|▊ | 959/12384 [2:02:22<24:16:33, 7.65s/it, loss=0.0051, acc=0.9858, iter_time=7.65s]
Epoch 0: 8%|▊ | 959/12384 [2:02:29<24:16:33, 7.65s/it, loss=0.0079, acc=0.9799, iter_time=7.53s]
Epoch 0: 8%|▊ | 960/12384 [2:02:29<24:13:12, 7.63s/it, loss=0.0079, acc=0.9799, iter_time=7.53s]
Epoch 0: 8%|▊ | 960/12384 [2:02:37<24:13:12, 7.63s/it, loss=0.0177, acc=0.9659, iter_time=7.65s]
Epoch 0: 8%|▊ | 961/12384 [2:02:37<24:11:44, 7.63s/it, loss=0.0177, acc=0.9659, iter_time=7.65s]
Epoch 0: 8%|▊ | 961/12384 [2:02:45<24:11:44, 7.63s/it, loss=0.0062, acc=0.9867, iter_time=7.65s]
Epoch 0: 8%|▊ | 962/12384 [2:02:45<24:11:46, 7.63s/it, loss=0.0062, acc=0.9867, iter_time=7.65s]
Epoch 0: 8%|▊ | 962/12384 [2:02:52<24:11:46, 7.63s/it, loss=0.0075, acc=0.9800, iter_time=6.66s]
Epoch 0: 8%|▊ | 963/12384 [2:02:52<24:13:43, 7.64s/it, loss=0.0075, acc=0.9800, iter_time=6.66s]
Epoch 0: 8%|▊ | 963/12384 [2:03:00<24:13:43, 7.64s/it, loss=0.0128, acc=0.9723, iter_time=8.61s]
Epoch 0: 8%|▊ | 964/12384 [2:03:00<24:13:56, 7.64s/it, loss=0.0128, acc=0.9723, iter_time=8.61s]
Epoch 0: 8%|▊ | 964/12384 [2:03:08<24:13:56, 7.64s/it, loss=0.0050, acc=0.9939, iter_time=4.50s]
Epoch 0: 8%|▊ | 965/12384 [2:03:08<24:13:56, 7.64s/it, loss=0.0050, acc=0.9939, iter_time=4.50s]
Epoch 0: 8%|▊ | 965/12384 [2:03:15<24:13:56, 7.64s/it, loss=0.0042, acc=0.9962, iter_time=8.47s]
Epoch 0: 8%|▊ | 966/12384 [2:03:15<24:11:58, 7.63s/it, loss=0.0042, acc=0.9962, iter_time=8.47s]
Epoch 0: 8%|▊ | 966/12384 [2:03:23<24:11:58, 7.63s/it, loss=0.0046, acc=0.9878, iter_time=9.32s]
Epoch 0: 8%|▊ | 967/12384 [2:03:23<24:11:51, 7.63s/it, loss=0.0046, acc=0.9878, iter_time=9.32s]
Epoch 0: 8%|▊ | 967/12384 [2:03:31<24:11:51, 7.63s/it, loss=0.0041, acc=0.9892, iter_time=8.64s]
Epoch 0: 8%|▊ | 968/12384 [2:03:31<24:16:11, 7.65s/it, loss=0.0041, acc=0.9892, iter_time=8.64s]
Epoch 0: 8%|▊ | 968/12384 [2:03:38<24:16:11, 7.65s/it, loss=0.0117, acc=0.9770, iter_time=7.31s]
Epoch 0: 8%|▊ | 969/12384 [2:03:38<24:14:42, 7.65s/it, loss=0.0117, acc=0.9770, iter_time=7.31s]
Epoch 0: 8%|▊ | 969/12384 [2:03:46<24:14:42, 7.65s/it, loss=0.0022, acc=0.9920, iter_time=4.27s]
Epoch 0: 8%|▊ | 970/12384 [2:03:46<24:12:02, 7.63s/it, loss=0.0022, acc=0.9920, iter_time=4.27s]
Epoch 0: 8%|▊ | 970/12384 [2:03:53<24:12:02, 7.63s/it, loss=0.0055, acc=0.9921, iter_time=10.98s]
Epoch 0: 8%|▊ | 971/12384 [2:03:53<24:12:16, 7.63s/it, loss=0.0055, acc=0.9921, iter_time=10.98s]
Epoch 0: 8%|▊ | 971/12384 [2:04:01<24:12:16, 7.63s/it, loss=0.0067, acc=0.9879, iter_time=7.62s]
Epoch 0: 8%|▊ | 972/12384 [2:04:01<24:11:08, 7.63s/it, loss=0.0067, acc=0.9879, iter_time=7.62s]
Epoch 0: 8%|▊ | 972/12384 [2:04:09<24:11:08, 7.63s/it, loss=0.0050, acc=0.9938, iter_time=7.65s]
Epoch 0: 8%|▊ | 973/12384 [2:04:09<24:10:53, 7.63s/it, loss=0.0050, acc=0.9938, iter_time=7.65s]
Epoch 0: 8%|▊ | 973/12384 [2:04:16<24:10:53, 7.63s/it, loss=0.0055, acc=0.9927, iter_time=7.61s]
Epoch 0: 8%|▊ | 974/12384 [2:04:16<24:11:04, 7.63s/it, loss=0.0055, acc=0.9927, iter_time=7.61s]
Epoch 0: 8%|▊ | 974/12384 [2:04:24<24:11:04, 7.63s/it, loss=0.0124, acc=0.9897, iter_time=7.66s]
Epoch 0: 8%|▊ | 975/12384 [2:04:24<24:11:32, 7.63s/it, loss=0.0124, acc=0.9897, iter_time=7.66s]
Epoch 0: 8%|▊ | 975/12384 [2:04:32<24:11:32, 7.63s/it, loss=0.0121, acc=0.9766, iter_time=7.99s]
Epoch 0: 8%|▊ | 976/12384 [2:04:32<24:11:18, 7.63s/it, loss=0.0121, acc=0.9766, iter_time=7.99s]
Epoch 0: 8%|▊ | 976/12384 [2:04:39<24:11:18, 7.63s/it, loss=0.0060, acc=0.9853, iter_time=6.04s]
Epoch 0: 8%|▊ | 977/12384 [2:04:39<24:11:24, 7.63s/it, loss=0.0060, acc=0.9853, iter_time=6.04s]
Epoch 0: 8%|▊ | 977/12384 [2:04:47<24:11:24, 7.63s/it, loss=0.0064, acc=0.9838, iter_time=5.56s]
Epoch 0: 8%|▊ | 978/12384 [2:04:47<24:13:29, 7.65s/it, loss=0.0064, acc=0.9838, iter_time=5.56s]
Epoch 0: 8%|▊ | 978/12384 [2:04:55<24:13:29, 7.65s/it, loss=0.0102, acc=0.9818, iter_time=8.17s]
Epoch 0: 8%|▊ | 979/12384 [2:04:55<24:12:27, 7.64s/it, loss=0.0102, acc=0.9818, iter_time=8.17s]
Epoch 0: 8%|▊ | 979/12384 [2:05:02<24:12:27, 7.64s/it, loss=0.0152, acc=0.9760, iter_time=7.64s]
Epoch 0: 8%|▊ | 980/12384 [2:05:02<24:12:53, 7.64s/it, loss=0.0152, acc=0.9760, iter_time=7.64s]
Epoch 0: 8%|▊ | 980/12384 [2:05:10<24:12:53, 7.64s/it, loss=0.0098, acc=0.9809, iter_time=10.72s]
Epoch 0: 8%|▊ | 981/12384 [2:05:10<24:31:40, 7.74s/it, loss=0.0098, acc=0.9809, iter_time=10.72s]
Epoch 0: 8%|▊ | 981/12384 [2:05:18<24:31:40, 7.74s/it, loss=0.0065, acc=0.9818, iter_time=7.70s]
Epoch 0: 8%|▊ | 982/12384 [2:05:18<24:24:43, 7.71s/it, loss=0.0065, acc=0.9818, iter_time=7.70s]
Epoch 0: 8%|▊ | 982/12384 [2:05:25<24:24:43, 7.71s/it, loss=0.0123, acc=0.9675, iter_time=7.61s]
Epoch 0: 8%|▊ | 983/12384 [2:05:25<24:18:41, 7.68s/it, loss=0.0123, acc=0.9675, iter_time=7.61s]
Epoch 0: 8%|▊ | 983/12384 [2:05:33<24:18:41, 7.68s/it, loss=0.0034, acc=0.9942, iter_time=7.54s]
Epoch 0: 8%|▊ | 984/12384 [2:05:33<24:14:16, 7.65s/it, loss=0.0034, acc=0.9942, iter_time=7.54s]
Epoch 0: 8%|▊ | 984/12384 [2:05:41<24:14:16, 7.65s/it, loss=0.0045, acc=0.9879, iter_time=7.66s]
Epoch 0: 8%|▊ | 985/12384 [2:05:41<24:11:22, 7.64s/it, loss=0.0045, acc=0.9879, iter_time=7.66s]
Epoch 0: 8%|▊ | 985/12384 [2:05:48<24:11:22, 7.64s/it, loss=0.0083, acc=0.9807, iter_time=7.59s]
Epoch 0: 8%|▊ | 986/12384 [2:05:48<24:10:31, 7.64s/it, loss=0.0083, acc=0.9807, iter_time=7.59s]
Epoch 0: 8%|▊ | 986/12384 [2:05:56<24:10:31, 7.64s/it, loss=0.0047, acc=0.9907, iter_time=6.71s]
Epoch 0: 8%|▊ | 987/12384 [2:05:56<24:12:32, 7.65s/it, loss=0.0047, acc=0.9907, iter_time=6.71s]
Epoch 0: 8%|▊ | 987/12384 [2:06:04<24:12:32, 7.65s/it, loss=0.0027, acc=0.9948, iter_time=8.61s]
Epoch 0: 8%|▊ | 988/12384 [2:06:04<24:11:33, 7.64s/it, loss=0.0027, acc=0.9948, iter_time=8.61s]
Epoch 0: 8%|▊ | 988/12384 [2:06:11<24:11:33, 7.64s/it, loss=0.0072, acc=0.9799, iter_time=7.62s]
Epoch 0: 8%|▊ | 989/12384 [2:06:11<24:09:29, 7.63s/it, loss=0.0072, acc=0.9799, iter_time=7.62s]
Epoch 0: 8%|▊ | 989/12384 [2:06:19<24:09:29, 7.63s/it, loss=0.0042, acc=0.9847, iter_time=6.97s]
Epoch 0: 8%|▊ | 990/12384 [2:06:19<24:09:25, 7.63s/it, loss=0.0042, acc=0.9847, iter_time=6.97s]
Epoch 0: 8%|▊ | 990/12384 [2:06:26<24:09:25, 7.63s/it, loss=0.0053, acc=0.9882, iter_time=8.28s]
Epoch 0: 8%|▊ | 991/12384 [2:06:26<24:08:06, 7.63s/it, loss=0.0053, acc=0.9882, iter_time=8.28s]
Epoch 0: 8%|▊ | 991/12384 [2:06:34<24:08:06, 7.63s/it, loss=0.0059, acc=0.9857, iter_time=7.55s]
Epoch 0: 8%|▊ | 992/12384 [2:06:34<24:07:14, 7.62s/it, loss=0.0059, acc=0.9857, iter_time=7.55s]
Epoch 0: 8%|▊ | 992/12384 [2:06:42<24:07:14, 7.62s/it, loss=0.0017, acc=0.9995, iter_time=7.65s]
Epoch 0: 8%|▊ | 993/12384 [2:06:42<24:06:18, 7.62s/it, loss=0.0017, acc=0.9995, iter_time=7.65s]
Epoch 0: 8%|▊ | 993/12384 [2:06:49<24:06:18, 7.62s/it, loss=0.0124, acc=0.9837, iter_time=7.60s]
Epoch 0: 8%|▊ | 994/12384 [2:06:49<24:06:58, 7.62s/it, loss=0.0124, acc=0.9837, iter_time=7.60s]
Epoch 0: 8%|▊ | 994/12384 [2:06:57<24:06:58, 7.62s/it, loss=0.0210, acc=0.9684, iter_time=7.68s]
Epoch 0: 8%|▊ | 995/12384 [2:06:57<24:08:26, 7.63s/it, loss=0.0210, acc=0.9684, iter_time=7.68s]
Epoch 0: 8%|▊ | 995/12384 [2:07:04<24:08:26, 7.63s/it, loss=0.0028, acc=0.9942, iter_time=7.61s]
Epoch 0: 8%|▊ | 996/12384 [2:07:04<24:06:30, 7.62s/it, loss=0.0028, acc=0.9942, iter_time=7.61s]
Epoch 0: 8%|▊ | 996/12384 [2:07:12<24:06:30, 7.62s/it, loss=0.0053, acc=0.9909, iter_time=7.62s]
Epoch 0: 8%|▊ | 997/12384 [2:07:12<24:07:22, 7.63s/it, loss=0.0053, acc=0.9909, iter_time=7.62s]
Epoch 0: 8%|▊ | 997/12384 [2:07:20<24:07:22, 7.63s/it, loss=0.0038, acc=0.9914, iter_time=7.63s]
Epoch 0: 8%|▊ | 998/12384 [2:07:20<24:06:39, 7.62s/it, loss=0.0038, acc=0.9914, iter_time=7.63s]
Epoch 0: 8%|▊ | 998/12384 [2:07:27<24:06:39, 7.62s/it, loss=0.0072, acc=0.9869, iter_time=7.59s]
Epoch 0: 8%|▊ | 999/12384 [2:07:27<24:06:45, 7.62s/it, loss=0.0072, acc=0.9869, iter_time=7.59s]
Epoch 0: 8%|▊ | 999/12384 [2:07:35<24:06:45, 7.62s/it, loss=0.0031, acc=0.9893, iter_time=8.08s]
Epoch 0: 8%|▊ | 1000/12384 [2:07:35<24:19:36, 7.69s/it, loss=0.0031, acc=0.9893, iter_time=8.08s]
Epoch 0: 8%|▊ | 1000/12384 [2:07:43<24:19:36, 7.69s/it, loss=0.0037, acc=0.9923, iter_time=7.40s]
Epoch 0: 8%|▊ | 1001/12384 [2:07:43<24:18:34, 7.69s/it, loss=0.0037, acc=0.9923, iter_time=7.40s]
Epoch 0: 8%|▊ | 1001/12384 [2:07:51<24:18:34, 7.69s/it, loss=0.0036, acc=0.9895, iter_time=7.69s]
Epoch 0: 8%|▊ | 1002/12384 [2:07:51<24:14:21, 7.67s/it, loss=0.0036, acc=0.9895, iter_time=7.69s]
Epoch 0: 8%|▊ | 1002/12384 [2:07:58<24:14:21, 7.67s/it, loss=0.0148, acc=0.9791, iter_time=7.61s]
Epoch 0: 8%|▊ | 1003/12384 [2:07:58<24:12:05, 7.66s/it, loss=0.0148, acc=0.9791, iter_time=7.61s]
Epoch 0: 8%|▊ | 1003/12384 [2:08:06<24:12:05, 7.66s/it, loss=0.0058, acc=0.9831, iter_time=7.61s]
Epoch 0: 8%|▊ | 1004/12384 [2:08:06<24:09:25, 7.64s/it, loss=0.0058, acc=0.9831, iter_time=7.61s]
Epoch 0: 8%|▊ | 1004/12384 [2:08:13<24:09:25, 7.64s/it, loss=0.0033, acc=0.9912, iter_time=7.63s]
Epoch 0: 8%|▊ | 1005/12384 [2:08:13<24:10:25, 7.65s/it, loss=0.0033, acc=0.9912, iter_time=7.63s]
Epoch 0: 8%|▊ | 1005/12384 [2:08:21<24:10:25, 7.65s/it, loss=0.0048, acc=0.9879, iter_time=7.95s]
Epoch 0: 8%|▊ | 1006/12384 [2:08:21<24:23:44, 7.72s/it, loss=0.0048, acc=0.9879, iter_time=7.95s]
Epoch 0: 8%|▊ | 1006/12384 [2:08:29<24:23:44, 7.72s/it, loss=0.0050, acc=0.9908, iter_time=5.26s]
Epoch 0: 8%|▊ | 1007/12384 [2:08:29<24:16:39, 7.68s/it, loss=0.0050, acc=0.9908, iter_time=5.26s]
Epoch 0: 8%|▊ | 1007/12384 [2:08:37<24:16:39, 7.68s/it, loss=0.0141, acc=0.9724, iter_time=10.38s]
Epoch 0: 8%|▊ | 1008/12384 [2:08:37<24:31:53, 7.76s/it, loss=0.0141, acc=0.9724, iter_time=10.38s]
Epoch 0: 8%|▊ | 1008/12384 [2:08:45<24:31:53, 7.76s/it, loss=0.0036, acc=0.9910, iter_time=7.51s]
Epoch 0: 8%|▊ | 1009/12384 [2:08:45<24:25:42, 7.73s/it, loss=0.0036, acc=0.9910, iter_time=7.51s]
Epoch 0: 8%|▊ | 1009/12384 [2:08:52<24:25:42, 7.73s/it, loss=0.0130, acc=0.9754, iter_time=7.69s]
Epoch 0: 8%|▊ | 1010/12384 [2:08:52<24:20:05, 7.70s/it, loss=0.0130, acc=0.9754, iter_time=7.69s]
Epoch 0: 8%|▊ | 1010/12384 [2:09:00<24:20:05, 7.70s/it, loss=0.0031, acc=0.9924, iter_time=7.61s]
Epoch 0: 8%|▊ | 1011/12384 [2:09:00<24:14:39, 7.67s/it, loss=0.0031, acc=0.9924, iter_time=7.61s]
Epoch 0: 8%|▊ | 1011/12384 [2:09:07<24:14:39, 7.67s/it, loss=0.0112, acc=0.9841, iter_time=7.61s]
Epoch 0: 8%|▊ | 1012/12384 [2:09:07<24:14:25, 7.67s/it, loss=0.0112, acc=0.9841, iter_time=7.61s]
Epoch 0: 8%|▊ | 1012/12384 [2:09:15<24:14:25, 7.67s/it, loss=0.0066, acc=0.9865, iter_time=7.65s]
Epoch 0: 8%|▊ | 1013/12384 [2:09:15<24:09:50, 7.65s/it, loss=0.0066, acc=0.9865, iter_time=7.65s]
Epoch 0: 8%|▊ | 1013/12384 [2:09:23<24:09:50, 7.65s/it, loss=0.0024, acc=0.9921, iter_time=7.59s]
Epoch 0: 8%|▊ | 1014/12384 [2:09:23<24:08:22, 7.64s/it, loss=0.0024, acc=0.9921, iter_time=7.59s]
Epoch 0: 8%|▊ | 1014/12384 [2:09:30<24:08:22, 7.64s/it, loss=0.0065, acc=0.9930, iter_time=7.64s]
Epoch 0: 8%|▊ | 1015/12384 [2:09:30<24:10:31, 7.66s/it, loss=0.0065, acc=0.9930, iter_time=7.64s]
Epoch 0: 8%|▊ | 1015/12384 [2:09:38<24:10:31, 7.66s/it, loss=0.0042, acc=0.9923, iter_time=8.07s]
Epoch 0: 8%|▊ | 1016/12384 [2:09:38<24:09:48, 7.65s/it, loss=0.0042, acc=0.9923, iter_time=8.07s]
Epoch 0: 8%|▊ | 1016/12384 [2:09:46<24:09:48, 7.65s/it, loss=0.0075, acc=0.9877, iter_time=7.26s]
Epoch 0: 8%|▊ | 1017/12384 [2:09:46<24:08:06, 7.64s/it, loss=0.0075, acc=0.9877, iter_time=7.26s]
Epoch 0: 8%|▊ | 1017/12384 [2:09:53<24:08:06, 7.64s/it, loss=0.0109, acc=0.9815, iter_time=7.62s]
Epoch 0: 8%|▊ | 1018/12384 [2:09:53<24:06:33, 7.64s/it, loss=0.0109, acc=0.9815, iter_time=7.62s]
Epoch 0: 8%|▊ | 1018/12384 [2:10:01<24:06:33, 7.64s/it, loss=0.0056, acc=0.9881, iter_time=5.82s]
Epoch 0: 8%|▊ | 1019/12384 [2:10:01<24:04:06, 7.62s/it, loss=0.0056, acc=0.9881, iter_time=5.82s]
Epoch 0: 8%|▊ | 1019/12384 [2:10:08<24:04:06, 7.62s/it, loss=0.0039, acc=0.9879, iter_time=7.85s]
Epoch 0: 8%|▊ | 1020/12384 [2:10:08<24:02:43, 7.62s/it, loss=0.0039, acc=0.9879, iter_time=7.85s]
Epoch 0: 8%|▊ | 1020/12384 [2:10:16<24:02:43, 7.62s/it, loss=0.0122, acc=0.9763, iter_time=9.13s]
Epoch 0: 8%|▊ | 1021/12384 [2:10:16<24:00:47, 7.61s/it, loss=0.0122, acc=0.9763, iter_time=9.13s]
Epoch 0: 8%|▊ | 1021/12384 [2:10:24<24:00:47, 7.61s/it, loss=0.0047, acc=0.9898, iter_time=7.59s]
Epoch 0: 8%|▊ | 1022/12384 [2:10:24<24:02:24, 7.62s/it, loss=0.0047, acc=0.9898, iter_time=7.59s]
Epoch 0: 8%|▊ | 1022/12384 [2:10:31<24:02:24, 7.62s/it, loss=0.0020, acc=0.9959, iter_time=7.66s]
Epoch 0: 8%|▊ | 1023/12384 [2:10:31<24:05:35, 7.63s/it, loss=0.0020, acc=0.9959, iter_time=7.66s]
Epoch 0: 8%|▊ | 1023/12384 [2:10:39<24:05:35, 7.63s/it, loss=0.0020, acc=0.9976, iter_time=7.65s]
Epoch 0: 8%|▊ | 1024/12384 [2:10:39<24:06:11, 7.64s/it, loss=0.0020, acc=0.9976, iter_time=7.65s]
Epoch 0: 8%|▊ | 1024/12384 [2:10:47<24:06:11, 7.64s/it, loss=0.0025, acc=0.9925, iter_time=7.66s]
Epoch 0: 8%|▊ | 1025/12384 [2:10:47<24:04:54, 7.63s/it, loss=0.0025, acc=0.9925, iter_time=7.66s]
Epoch 0: 8%|▊ | 1025/12384 [2:10:54<24:04:54, 7.63s/it, loss=0.0031, acc=0.9926, iter_time=4.60s]
Epoch 0: 8%|▊ | 1026/12384 [2:10:54<24:06:06, 7.64s/it, loss=0.0031, acc=0.9926, iter_time=4.60s]
Epoch 0: 8%|▊ | 1026/12384 [2:11:02<24:06:06, 7.64s/it, loss=0.0125, acc=0.9719, iter_time=10.68s]
Epoch 0: 8%|▊ | 1027/12384 [2:11:02<24:06:45, 7.64s/it, loss=0.0125, acc=0.9719, iter_time=10.68s]
Epoch 0: 8%|▊ | 1027/12384 [2:11:10<24:06:45, 7.64s/it, loss=0.0014, acc=0.9990, iter_time=7.33s]
Epoch 0: 8%|▊ | 1028/12384 [2:11:10<24:06:24, 7.64s/it, loss=0.0014, acc=0.9990, iter_time=7.33s]
Epoch 0: 8%|▊ | 1028/12384 [2:11:17<24:06:24, 7.64s/it, loss=0.0025, acc=0.9945, iter_time=6.23s]
Epoch 0: 8%|▊ | 1029/12384 [2:11:17<24:06:39, 7.64s/it, loss=0.0025, acc=0.9945, iter_time=6.23s]
Epoch 0: 8%|▊ | 1029/12384 [2:11:25<24:06:39, 7.64s/it, loss=0.0064, acc=0.9901, iter_time=9.37s]
Epoch 0: 8%|▊ | 1030/12384 [2:11:25<24:05:51, 7.64s/it, loss=0.0064, acc=0.9901, iter_time=9.37s]
Epoch 0: 8%|▊ | 1030/12384 [2:11:32<24:05:51, 7.64s/it, loss=0.0037, acc=0.9942, iter_time=7.66s]
Epoch 0: 8%|▊ | 1031/12384 [2:11:32<24:05:45, 7.64s/it, loss=0.0037, acc=0.9942, iter_time=7.66s]
Epoch 0: 8%|▊ | 1031/12384 [2:11:40<24:05:45, 7.64s/it, loss=0.0344, acc=0.9582, iter_time=7.61s]
Epoch 0: 8%|▊ | 1032/12384 [2:11:40<24:06:26, 7.65s/it, loss=0.0344, acc=0.9582, iter_time=7.61s]
Epoch 0: 8%|▊ | 1032/12384 [2:11:48<24:06:26, 7.65s/it, loss=0.0038, acc=0.9897, iter_time=7.96s]
Epoch 0: 8%|▊ | 1033/12384 [2:11:48<24:21:06, 7.72s/it, loss=0.0038, acc=0.9897, iter_time=7.96s]
Epoch 0: 8%|▊ | 1033/12384 [2:11:56<24:21:06, 7.72s/it, loss=0.0090, acc=0.9823, iter_time=6.13s]
Epoch 0: 8%|▊ | 1034/12384 [2:11:56<24:34:01, 7.79s/it, loss=0.0090, acc=0.9823, iter_time=6.13s]
Epoch 0: 8%|▊ | 1034/12384 [2:12:04<24:34:01, 7.79s/it, loss=0.0085, acc=0.9762, iter_time=9.42s]
Epoch 0: 8%|▊ | 1035/12384 [2:12:04<24:22:58, 7.73s/it, loss=0.0085, acc=0.9762, iter_time=9.42s]
Epoch 0: 8%|▊ | 1035/12384 [2:12:11<24:22:58, 7.73s/it, loss=0.0046, acc=0.9904, iter_time=7.66s]
Epoch 0: 8%|▊ | 1036/12384 [2:12:11<24:18:27, 7.71s/it, loss=0.0046, acc=0.9904, iter_time=7.66s]
Epoch 0: 8%|▊ | 1036/12384 [2:12:19<24:18:27, 7.71s/it, loss=0.0035, acc=0.9900, iter_time=5.36s]
Epoch 0: 8%|▊ | 1037/12384 [2:12:19<24:12:10, 7.68s/it, loss=0.0035, acc=0.9900, iter_time=5.36s]
Epoch 0: 8%|▊ | 1037/12384 [2:12:26<24:12:10, 7.68s/it, loss=0.0055, acc=0.9900, iter_time=9.85s]
Epoch 0: 8%|▊ | 1038/12384 [2:12:26<24:09:12, 7.66s/it, loss=0.0055, acc=0.9900, iter_time=9.85s]
Epoch 0: 8%|▊ | 1038/12384 [2:12:34<24:09:12, 7.66s/it, loss=0.0053, acc=0.9886, iter_time=7.61s]
Epoch 0: 8%|▊ | 1039/12384 [2:12:34<24:06:53, 7.65s/it, loss=0.0053, acc=0.9886, iter_time=7.61s]
Epoch 0: 8%|▊ | 1039/12384 [2:12:42<24:06:53, 7.65s/it, loss=0.0073, acc=0.9914, iter_time=8.01s]
Epoch 0: 8%|▊ | 1040/12384 [2:12:42<24:04:31, 7.64s/it, loss=0.0073, acc=0.9914, iter_time=8.01s]
Epoch 0: 8%|▊ | 1040/12384 [2:12:49<24:04:31, 7.64s/it, loss=0.0017, acc=0.9949, iter_time=4.09s]
Epoch 0: 8%|▊ | 1041/12384 [2:12:49<24:05:20, 7.65s/it, loss=0.0017, acc=0.9949, iter_time=4.09s]
Epoch 0: 8%|▊ | 1041/12384 [2:12:57<24:05:20, 7.65s/it, loss=0.5570, acc=0.7423, iter_time=10.50s]
Epoch 0: 8%|▊ | 1042/12384 [2:12:57<24:05:00, 7.64s/it, loss=0.5570, acc=0.7423, iter_time=10.50s]
Epoch 0: 8%|▊ | 1042/12384 [2:13:05<24:05:00, 7.64s/it, loss=0.0054, acc=0.9913, iter_time=7.95s]
Epoch 0: 8%|▊ | 1043/12384 [2:13:05<24:05:05, 7.65s/it, loss=0.0054, acc=0.9913, iter_time=7.95s]
Epoch 0: 8%|▊ | 1043/12384 [2:13:12<24:05:05, 7.65s/it, loss=0.0042, acc=0.9910, iter_time=4.33s]
Epoch 0: 8%|▊ | 1044/12384 [2:13:12<24:01:51, 7.63s/it, loss=0.0042, acc=0.9910, iter_time=4.33s]
Epoch 0: 8%|▊ | 1044/12384 [2:13:20<24:01:51, 7.63s/it, loss=0.0046, acc=0.9945, iter_time=9.17s]
Epoch 0: 8%|▊ | 1045/12384 [2:13:20<23:59:58, 7.62s/it, loss=0.0046, acc=0.9945, iter_time=9.17s]
Epoch 0: 8%|▊ | 1045/12384 [2:13:28<23:59:58, 7.62s/it, loss=0.0008, acc=0.9980, iter_time=7.09s]
Epoch 0: 8%|▊ | 1046/12384 [2:13:28<24:03:00, 7.64s/it, loss=0.0008, acc=0.9980, iter_time=7.09s]
Epoch 0: 8%|▊ | 1046/12384 [2:13:35<24:03:00, 7.64s/it, loss=0.0017, acc=0.9987, iter_time=9.92s]
Epoch 0: 8%|▊ | 1047/12384 [2:13:35<24:02:51, 7.64s/it, loss=0.0017, acc=0.9987, iter_time=9.92s]
Epoch 0: 8%|▊ | 1047/12384 [2:13:43<24:02:51, 7.64s/it, loss=0.0029, acc=0.9876, iter_time=8.03s]
Epoch 0: 8%|▊ | 1048/12384 [2:13:43<24:00:54, 7.63s/it, loss=0.0029, acc=0.9876, iter_time=8.03s]
Epoch 0: 8%|▊ | 1048/12384 [2:13:50<24:00:54, 7.63s/it, loss=0.0029, acc=0.9957, iter_time=7.21s]
Epoch 0: 8%|▊ | 1049/12384 [2:13:50<24:01:35, 7.63s/it, loss=0.0029, acc=0.9957, iter_time=7.21s]
Epoch 0: 8%|▊ | 1049/12384 [2:13:58<24:01:35, 7.63s/it, loss=0.0153, acc=0.9740, iter_time=8.05s]
Epoch 0: 8%|▊ | 1050/12384 [2:13:58<24:00:47, 7.63s/it, loss=0.0153, acc=0.9740, iter_time=8.05s]
Epoch 0: 8%|▊ | 1050/12384 [2:14:06<24:00:47, 7.63s/it, loss=0.0118, acc=0.9700, iter_time=6.61s]
Epoch 0: 8%|▊ | 1051/12384 [2:14:06<23:59:57, 7.62s/it, loss=0.0118, acc=0.9700, iter_time=6.61s]
Epoch 0: 8%|▊ | 1051/12384 [2:14:13<23:59:57, 7.62s/it, loss=0.0067, acc=0.9849, iter_time=8.22s]
Epoch 0: 8%|▊ | 1052/12384 [2:14:13<23:59:57, 7.62s/it, loss=0.0067, acc=0.9849, iter_time=8.22s]
Epoch 0: 8%|▊ | 1052/12384 [2:14:21<23:59:57, 7.62s/it, loss=0.0013, acc=0.9975, iter_time=4.44s]
Epoch 0: 9%|▊ | 1053/12384 [2:14:21<24:05:07, 7.65s/it, loss=0.0013, acc=0.9975, iter_time=4.44s]
Epoch 0: 9%|▊ | 1053/12384 [2:14:29<24:05:07, 7.65s/it, loss=0.0042, acc=0.9887, iter_time=9.14s]
Epoch 0: 9%|▊ | 1054/12384 [2:14:29<24:03:45, 7.65s/it, loss=0.0042, acc=0.9887, iter_time=9.14s]
Epoch 0: 9%|▊ | 1054/12384 [2:14:36<24:03:45, 7.65s/it, loss=0.0031, acc=0.9946, iter_time=9.42s]
Epoch 0: 9%|▊ | 1055/12384 [2:14:36<24:01:44, 7.64s/it, loss=0.0031, acc=0.9946, iter_time=9.42s]
Epoch 0: 9%|▊ | 1055/12384 [2:14:44<24:01:44, 7.64s/it, loss=0.0053, acc=0.9915, iter_time=7.57s]
Epoch 0: 9%|▊ | 1056/12384 [2:14:44<24:00:39, 7.63s/it, loss=0.0053, acc=0.9915, iter_time=7.57s]
Epoch 0: 9%|▊ | 1056/12384 [2:14:51<24:00:39, 7.63s/it, loss=0.0066, acc=0.9869, iter_time=3.90s]
Epoch 0: 9%|▊ | 1057/12384 [2:14:51<23:59:10, 7.62s/it, loss=0.0066, acc=0.9869, iter_time=3.90s]
Epoch 0: 9%|▊ | 1057/12384 [2:14:59<23:59:10, 7.62s/it, loss=0.0075, acc=0.9860, iter_time=11.33s]
Epoch 0: 9%|▊ | 1058/12384 [2:14:59<23:59:28, 7.63s/it, loss=0.0075, acc=0.9860, iter_time=11.33s]
Epoch 0: 9%|▊ | 1058/12384 [2:15:07<23:59:28, 7.63s/it, loss=0.0016, acc=0.9973, iter_time=7.66s]
Epoch 0: 9%|▊ | 1059/12384 [2:15:07<23:58:55, 7.62s/it, loss=0.0016, acc=0.9973, iter_time=7.66s]
Epoch 0: 9%|▊ | 1059/12384 [2:15:15<23:58:55, 7.62s/it, loss=0.0038, acc=0.9930, iter_time=7.91s]
Epoch 0: 9%|▊ | 1060/12384 [2:15:15<24:14:29, 7.71s/it, loss=0.0038, acc=0.9930, iter_time=7.91s]
Epoch 0: 9%|▊ | 1060/12384 [2:15:23<24:14:29, 7.71s/it, loss=0.0093, acc=0.9816, iter_time=7.67s]
Epoch 0: 9%|▊ | 1061/12384 [2:15:23<24:26:31, 7.77s/it, loss=0.0093, acc=0.9816, iter_time=7.67s]
Epoch 0: 9%|▊ | 1061/12384 [2:15:30<24:26:31, 7.77s/it, loss=0.0259, acc=0.9664, iter_time=7.56s]
Epoch 0: 9%|▊ | 1062/12384 [2:15:30<24:18:30, 7.73s/it, loss=0.0259, acc=0.9664, iter_time=7.56s]
Epoch 0: 9%|▊ | 1062/12384 [2:15:38<24:18:30, 7.73s/it, loss=0.0054, acc=0.9909, iter_time=7.93s]
Epoch 0: 9%|▊ | 1063/12384 [2:15:38<24:13:58, 7.71s/it, loss=0.0054, acc=0.9909, iter_time=7.93s]
Epoch 0: 9%|▊ | 1063/12384 [2:15:45<24:13:58, 7.71s/it, loss=0.0047, acc=0.9945, iter_time=8.02s]
Epoch 0: 9%|▊ | 1064/12384 [2:15:45<24:08:51, 7.68s/it, loss=0.0047, acc=0.9945, iter_time=8.02s]
Epoch 0: 9%|▊ | 1064/12384 [2:15:53<24:08:51, 7.68s/it, loss=0.0019, acc=0.9982, iter_time=4.12s]
Epoch 0: 9%|▊ | 1065/12384 [2:15:53<24:05:15, 7.66s/it, loss=0.0019, acc=0.9982, iter_time=4.12s]
Epoch 0: 9%|▊ | 1065/12384 [2:16:01<24:05:15, 7.66s/it, loss=0.0088, acc=0.9754, iter_time=7.00s]
Epoch 0: 9%|▊ | 1066/12384 [2:16:01<24:01:44, 7.64s/it, loss=0.0088, acc=0.9754, iter_time=7.00s]
Epoch 0: 9%|▊ | 1066/12384 [2:16:08<24:01:44, 7.64s/it, loss=0.0053, acc=0.9916, iter_time=11.34s]
Epoch 0: 9%|▊ | 1067/12384 [2:16:08<24:00:59, 7.64s/it, loss=0.0053, acc=0.9916, iter_time=11.34s]
Epoch 0: 9%|▊ | 1067/12384 [2:16:16<24:00:59, 7.64s/it, loss=0.0053, acc=0.9881, iter_time=7.72s]
Epoch 0: 9%|▊ | 1068/12384 [2:16:16<24:03:29, 7.65s/it, loss=0.0053, acc=0.9881, iter_time=7.72s]
Epoch 0: 9%|▊ | 1068/12384 [2:16:24<24:03:29, 7.65s/it, loss=0.0033, acc=0.9901, iter_time=7.61s]
Epoch 0: 9%|▊ | 1069/12384 [2:16:24<24:00:21, 7.64s/it, loss=0.0033, acc=0.9901, iter_time=7.61s]
Epoch 0: 9%|▊ | 1069/12384 [2:16:31<24:00:21, 7.64s/it, loss=0.0090, acc=0.9896, iter_time=7.60s]
Epoch 0: 9%|▊ | 1070/12384 [2:16:31<23:58:48, 7.63s/it, loss=0.0090, acc=0.9896, iter_time=7.60s]
Epoch 0: 9%|▊ | 1070/12384 [2:16:39<23:58:48, 7.63s/it, loss=0.0053, acc=0.9913, iter_time=7.61s]
Epoch 0: 9%|▊ | 1071/12384 [2:16:39<23:57:25, 7.62s/it, loss=0.0053, acc=0.9913, iter_time=7.61s]
Epoch 0: 9%|▊ | 1071/12384 [2:16:46<23:57:25, 7.62s/it, loss=0.0068, acc=0.9760, iter_time=7.65s]
Epoch 0: 9%|▊ | 1072/12384 [2:16:46<24:02:12, 7.65s/it, loss=0.0068, acc=0.9760, iter_time=7.65s]
Epoch 0: 9%|▊ | 1072/12384 [2:16:54<24:02:12, 7.65s/it, loss=0.0065, acc=0.9832, iter_time=7.68s]
Epoch 0: 9%|▊ | 1073/12384 [2:16:54<24:01:02, 7.64s/it, loss=0.0065, acc=0.9832, iter_time=7.68s]
Epoch 0: 9%|▊ | 1073/12384 [2:17:02<24:01:02, 7.64s/it, loss=0.0020, acc=0.9961, iter_time=5.91s]
Epoch 0: 9%|▊ | 1074/12384 [2:17:02<23:58:32, 7.63s/it, loss=0.0020, acc=0.9961, iter_time=5.91s]
Epoch 0: 9%|▊ | 1074/12384 [2:17:09<23:58:32, 7.63s/it, loss=0.0044, acc=0.9916, iter_time=9.32s]
Epoch 0: 9%|▊ | 1075/12384 [2:17:09<24:01:15, 7.65s/it, loss=0.0044, acc=0.9916, iter_time=9.32s]
Epoch 0: 9%|▊ | 1075/12384 [2:17:17<24:01:15, 7.65s/it, loss=0.0024, acc=0.9923, iter_time=7.68s]
Epoch 0: 9%|▊ | 1076/12384 [2:17:17<24:04:15, 7.66s/it, loss=0.0024, acc=0.9923, iter_time=7.68s]
Epoch 0: 9%|▊ | 1076/12384 [2:17:25<24:04:15, 7.66s/it, loss=0.0029, acc=0.9968, iter_time=7.70s]
Epoch 0: 9%|▊ | 1077/12384 [2:17:25<24:02:45, 7.66s/it, loss=0.0029, acc=0.9968, iter_time=7.70s]
Epoch 0: 9%|▊ | 1077/12384 [2:17:32<24:02:45, 7.66s/it, loss=0.0078, acc=0.9792, iter_time=7.63s]
Epoch 0: 9%|▊ | 1078/12384 [2:17:32<24:00:09, 7.64s/it, loss=0.0078, acc=0.9792, iter_time=7.63s]
Epoch 0: 9%|▊ | 1078/12384 [2:17:40<24:00:09, 7.64s/it, loss=0.0087, acc=0.9875, iter_time=7.62s]
Epoch 0: 9%|▊ | 1079/12384 [2:17:40<23:57:41, 7.63s/it, loss=0.0087, acc=0.9875, iter_time=7.62s]
Epoch 0: 9%|▊ | 1079/12384 [2:17:48<23:57:41, 7.63s/it, loss=0.0031, acc=0.9944, iter_time=8.00s]
Epoch 0: 9%|▊ | 1080/12384 [2:17:48<23:56:43, 7.63s/it, loss=0.0031, acc=0.9944, iter_time=8.00s]
Epoch 0: 9%|▊ | 1080/12384 [2:17:55<23:56:43, 7.63s/it, loss=0.0123, acc=0.9817, iter_time=7.24s]
Epoch 0: 9%|▊ | 1081/12384 [2:17:55<24:00:39, 7.65s/it, loss=0.0123, acc=0.9817, iter_time=7.24s]
Epoch 0: 9%|▊ | 1081/12384 [2:18:03<24:00:39, 7.65s/it, loss=0.0037, acc=0.9943, iter_time=7.70s]
Epoch 0: 9%|▊ | 1082/12384 [2:18:03<23:59:20, 7.64s/it, loss=0.0037, acc=0.9943, iter_time=7.70s]
Epoch 0: 9%|▊ | 1082/12384 [2:18:11<23:59:20, 7.64s/it, loss=0.0018, acc=0.9940, iter_time=4.54s]
Epoch 0: 9%|▊ | 1083/12384 [2:18:11<24:00:25, 7.65s/it, loss=0.0018, acc=0.9940, iter_time=4.54s]
Epoch 0: 9%|▊ | 1083/12384 [2:18:18<24:00:25, 7.65s/it, loss=0.0023, acc=0.9947, iter_time=10.72s]
Epoch 0: 9%|▉ | 1084/12384 [2:18:18<23:57:23, 7.63s/it, loss=0.0023, acc=0.9947, iter_time=10.72s]
Epoch 0: 9%|▉ | 1084/12384 [2:18:26<23:57:23, 7.63s/it, loss=0.0039, acc=0.9896, iter_time=7.60s]
Epoch 0: 9%|▉ | 1085/12384 [2:18:26<23:56:25, 7.63s/it, loss=0.0039, acc=0.9896, iter_time=7.60s]
Epoch 0: 9%|▉ | 1085/12384 [2:18:33<23:56:25, 7.63s/it, loss=0.0028, acc=0.9967, iter_time=7.63s]
Epoch 0: 9%|▉ | 1086/12384 [2:18:33<23:55:09, 7.62s/it, loss=0.0028, acc=0.9967, iter_time=7.63s]
Epoch 0: 9%|▉ | 1086/12384 [2:18:41<23:55:09, 7.62s/it, loss=0.0044, acc=0.9905, iter_time=7.89s]
Epoch 0: 9%|▉ | 1087/12384 [2:18:41<24:12:41, 7.72s/it, loss=0.0044, acc=0.9905, iter_time=7.89s]
Epoch 0: 9%|▉ | 1087/12384 [2:18:49<24:12:41, 7.72s/it, loss=0.0036, acc=0.9913, iter_time=7.67s]
Epoch 0: 9%|▉ | 1088/12384 [2:18:49<24:11:52, 7.71s/it, loss=0.0036, acc=0.9913, iter_time=7.67s]
Epoch 0: 9%|▉ | 1088/12384 [2:18:57<24:11:52, 7.71s/it, loss=0.0069, acc=0.9895, iter_time=7.66s]
Epoch 0: 9%|▉ | 1089/12384 [2:18:57<24:11:20, 7.71s/it, loss=0.0069, acc=0.9895, iter_time=7.66s]
Epoch 0: 9%|▉ | 1089/12384 [2:19:04<24:11:20, 7.71s/it, loss=0.0073, acc=0.9904, iter_time=7.71s]
Epoch 0: 9%|▉ | 1090/12384 [2:19:04<24:08:06, 7.69s/it, loss=0.0073, acc=0.9904, iter_time=7.71s]
Epoch 0: 9%|▉ | 1090/12384 [2:19:12<24:08:06, 7.69s/it, loss=0.0017, acc=0.9979, iter_time=7.67s]
Epoch 0: 9%|▉ | 1091/12384 [2:19:12<24:05:08, 7.68s/it, loss=0.0017, acc=0.9979, iter_time=7.67s]
Epoch 0: 9%|▉ | 1091/12384 [2:19:20<24:05:08, 7.68s/it, loss=0.0028, acc=0.9936, iter_time=7.66s]
Epoch 0: 9%|▉ | 1092/12384 [2:19:20<24:01:42, 7.66s/it, loss=0.0028, acc=0.9936, iter_time=7.66s]
Epoch 0: 9%|▉ | 1092/12384 [2:19:27<24:01:42, 7.66s/it, loss=0.0009, acc=0.9965, iter_time=4.29s]
Epoch 0: 9%|▉ | 1093/12384 [2:19:27<23:58:49, 7.65s/it, loss=0.0009, acc=0.9965, iter_time=4.29s]
Epoch 0: 9%|▉ | 1093/12384 [2:19:35<23:58:49, 7.65s/it, loss=0.0037, acc=0.9918, iter_time=10.93s]
Epoch 0: 9%|▉ | 1094/12384 [2:19:35<23:57:22, 7.64s/it, loss=0.0037, acc=0.9918, iter_time=10.93s]
Epoch 0: 9%|▉ | 1094/12384 [2:19:43<23:57:22, 7.64s/it, loss=0.0014, acc=0.9980, iter_time=4.31s]
Epoch 0: 9%|▉ | 1095/12384 [2:19:43<24:02:39, 7.67s/it, loss=0.0014, acc=0.9980, iter_time=4.31s]
Epoch 0: 9%|▉ | 1095/12384 [2:19:50<24:02:39, 7.67s/it, loss=0.0019, acc=0.9985, iter_time=11.44s]
Epoch 0: 9%|▉ | 1096/12384 [2:19:50<24:06:09, 7.69s/it, loss=0.0019, acc=0.9985, iter_time=11.44s]
Epoch 0: 9%|▉ | 1096/12384 [2:19:58<24:06:09, 7.69s/it, loss=0.0028, acc=0.9901, iter_time=7.33s]
Epoch 0: 9%|▉ | 1097/12384 [2:19:58<24:02:16, 7.67s/it, loss=0.0028, acc=0.9901, iter_time=7.33s]
Epoch 0: 9%|▉ | 1097/12384 [2:20:06<24:02:16, 7.67s/it, loss=0.0053, acc=0.9867, iter_time=7.63s]
Epoch 0: 9%|▉ | 1098/12384 [2:20:06<24:00:08, 7.66s/it, loss=0.0053, acc=0.9867, iter_time=7.63s]
Epoch 0: 9%|▉ | 1098/12384 [2:20:13<24:00:08, 7.66s/it, loss=0.0036, acc=0.9950, iter_time=7.64s]
Epoch 0: 9%|▉ | 1099/12384 [2:20:13<23:58:38, 7.65s/it, loss=0.0036, acc=0.9950, iter_time=7.64s]
Epoch 0: 9%|▉ | 1099/12384 [2:20:21<23:58:38, 7.65s/it, loss=0.0021, acc=0.9967, iter_time=8.11s]
Epoch 0: 9%|▉ | 1100/12384 [2:20:21<24:01:07, 7.66s/it, loss=0.0021, acc=0.9967, iter_time=8.11s]
Epoch 0: 9%|▉ | 1100/12384 [2:20:29<24:01:07, 7.66s/it, loss=0.0107, acc=0.9828, iter_time=4.90s]
Epoch 0: 9%|▉ | 1101/12384 [2:20:29<23:58:37, 7.65s/it, loss=0.0107, acc=0.9828, iter_time=4.90s]
Epoch 0: 9%|▉ | 1101/12384 [2:20:36<23:58:37, 7.65s/it, loss=0.0031, acc=0.9938, iter_time=9.92s]
Epoch 0: 9%|▉ | 1102/12384 [2:20:36<23:56:44, 7.64s/it, loss=0.0031, acc=0.9938, iter_time=9.92s]
Epoch 0: 9%|▉ | 1102/12384 [2:20:44<23:56:44, 7.64s/it, loss=0.0047, acc=0.9906, iter_time=7.63s]
Epoch 0: 9%|▉ | 1103/12384 [2:20:44<23:54:59, 7.63s/it, loss=0.0047, acc=0.9906, iter_time=7.63s]
Epoch 0: 9%|▉ | 1103/12384 [2:20:51<23:54:59, 7.63s/it, loss=0.0013, acc=0.9977, iter_time=7.99s]
Epoch 0: 9%|▉ | 1104/12384 [2:20:51<23:52:25, 7.62s/it, loss=0.0013, acc=0.9977, iter_time=7.99s]
Epoch 0: 9%|▉ | 1104/12384 [2:20:59<23:52:25, 7.62s/it, loss=0.0027, acc=0.9968, iter_time=7.21s]
Epoch 0: 9%|▉ | 1105/12384 [2:20:59<23:57:00, 7.64s/it, loss=0.0027, acc=0.9968, iter_time=7.21s]
Epoch 0: 9%|▉ | 1105/12384 [2:21:07<23:57:00, 7.64s/it, loss=0.0031, acc=0.9918, iter_time=7.71s]
Epoch 0: 9%|▉ | 1106/12384 [2:21:07<24:02:02, 7.67s/it, loss=0.0031, acc=0.9918, iter_time=7.71s]
Epoch 0: 9%|▉ | 1106/12384 [2:21:14<24:02:02, 7.67s/it, loss=0.0142, acc=0.9920, iter_time=7.20s]
Epoch 0: 9%|▉ | 1107/12384 [2:21:14<23:59:01, 7.66s/it, loss=0.0142, acc=0.9920, iter_time=7.20s]
Epoch 0: 9%|▉ | 1107/12384 [2:21:22<23:59:01, 7.66s/it, loss=0.0018, acc=0.9979, iter_time=8.15s]
Epoch 0: 9%|▉ | 1108/12384 [2:21:22<23:57:19, 7.65s/it, loss=0.0018, acc=0.9979, iter_time=8.15s]
Epoch 0: 9%|▉ | 1108/12384 [2:21:30<23:57:19, 7.65s/it, loss=0.0028, acc=0.9922, iter_time=7.64s]
Epoch 0: 9%|▉ | 1109/12384 [2:21:30<23:55:40, 7.64s/it, loss=0.0028, acc=0.9922, iter_time=7.64s]
Epoch 0: 9%|▉ | 1109/12384 [2:21:37<23:55:40, 7.64s/it, loss=0.0025, acc=0.9972, iter_time=7.63s]
Epoch 0: 9%|▉ | 1110/12384 [2:21:37<23:56:13, 7.64s/it, loss=0.0025, acc=0.9972, iter_time=7.63s]
Epoch 0: 9%|▉ | 1110/12384 [2:21:45<23:56:13, 7.64s/it, loss=0.0018, acc=0.9967, iter_time=7.63s]
Epoch 0: 9%|▉ | 1111/12384 [2:21:45<23:54:44, 7.64s/it, loss=0.0018, acc=0.9967, iter_time=7.63s]
Epoch 0: 9%|▉ | 1111/12384 [2:21:53<23:54:44, 7.64s/it, loss=0.0011, acc=1.0000, iter_time=8.29s]
Epoch 0: 9%|▉ | 1112/12384 [2:21:53<24:08:41, 7.71s/it, loss=0.0011, acc=1.0000, iter_time=8.29s]
Epoch 0: 9%|▉ | 1112/12384 [2:22:01<24:08:41, 7.71s/it, loss=0.0023, acc=0.9968, iter_time=7.25s]
Epoch 0: 9%|▉ | 1113/12384 [2:22:01<24:23:09, 7.79s/it, loss=0.0023, acc=0.9968, iter_time=7.25s]
Epoch 0: 9%|▉ | 1113/12384 [2:22:08<24:23:09, 7.79s/it, loss=0.0052, acc=0.9896, iter_time=5.64s]
Epoch 0: 9%|▉ | 1114/12384 [2:22:08<24:13:44, 7.74s/it, loss=0.0052, acc=0.9896, iter_time=5.64s]
Epoch 0: 9%|▉ | 1114/12384 [2:22:16<24:13:44, 7.74s/it, loss=0.0067, acc=0.9904, iter_time=9.92s]
Epoch 0: 9%|▉ | 1115/12384 [2:22:16<24:07:04, 7.70s/it, loss=0.0067, acc=0.9904, iter_time=9.92s]
Epoch 0: 9%|▉ | 1115/12384 [2:22:24<24:07:04, 7.70s/it, loss=0.0036, acc=0.9925, iter_time=4.31s]
Epoch 0: 9%|▉ | 1116/12384 [2:22:24<24:00:49, 7.67s/it, loss=0.0036, acc=0.9925, iter_time=4.31s]
Epoch 0: 9%|▉ | 1116/12384 [2:22:31<24:00:49, 7.67s/it, loss=0.0171, acc=0.9720, iter_time=10.90s]
Epoch 0: 9%|▉ | 1117/12384 [2:22:31<24:00:08, 7.67s/it, loss=0.0171, acc=0.9720, iter_time=10.90s]
Epoch 0: 9%|▉ | 1117/12384 [2:22:39<24:00:08, 7.67s/it, loss=0.0036, acc=0.9873, iter_time=7.66s]
Epoch 0: 9%|▉ | 1118/12384 [2:22:39<23:56:26, 7.65s/it, loss=0.0036, acc=0.9873, iter_time=7.66s]
Epoch 0: 9%|▉ | 1118/12384 [2:22:46<23:56:26, 7.65s/it, loss=0.0045, acc=0.9943, iter_time=7.61s]
Epoch 0: 9%|▉ | 1119/12384 [2:22:46<23:53:21, 7.63s/it, loss=0.0045, acc=0.9943, iter_time=7.61s]
Epoch 0: 9%|▉ | 1119/12384 [2:22:54<23:53:21, 7.63s/it, loss=0.0036, acc=0.9881, iter_time=7.55s]
Epoch 0: 9%|▉ | 1120/12384 [2:22:54<23:51:38, 7.63s/it, loss=0.0036, acc=0.9881, iter_time=7.55s]
Epoch 0: 9%|▉ | 1120/12384 [2:23:02<23:51:38, 7.63s/it, loss=0.0032, acc=0.9953, iter_time=7.64s]
Epoch 0: 9%|▉ | 1121/12384 [2:23:02<23:49:49, 7.62s/it, loss=0.0032, acc=0.9953, iter_time=7.64s]
Epoch 0: 9%|▉ | 1121/12384 [2:23:09<23:49:49, 7.62s/it, loss=0.0044, acc=0.9883, iter_time=7.07s]
Epoch 0: 9%|▉ | 1122/12384 [2:23:09<23:49:19, 7.61s/it, loss=0.0044, acc=0.9883, iter_time=7.07s]
Epoch 0: 9%|▉ | 1122/12384 [2:23:17<23:49:19, 7.61s/it, loss=0.0035, acc=0.9950, iter_time=4.42s]
Epoch 0: 9%|▉ | 1123/12384 [2:23:17<23:48:52, 7.61s/it, loss=0.0035, acc=0.9950, iter_time=4.42s]
Epoch 0: 9%|▉ | 1123/12384 [2:23:25<23:48:52, 7.61s/it, loss=0.0019, acc=0.9946, iter_time=11.07s]
Epoch 0: 9%|▉ | 1124/12384 [2:23:25<23:48:19, 7.61s/it, loss=0.0019, acc=0.9946, iter_time=11.07s]
Epoch 0: 9%|▉ | 1124/12384 [2:23:32<23:48:19, 7.61s/it, loss=0.0025, acc=0.9956, iter_time=7.89s]
Epoch 0: 9%|▉ | 1125/12384 [2:23:32<23:49:38, 7.62s/it, loss=0.0025, acc=0.9956, iter_time=7.89s]
Epoch 0: 9%|▉ | 1125/12384 [2:23:40<23:49:38, 7.62s/it, loss=0.0030, acc=0.9933, iter_time=6.18s]
Epoch 0: 9%|▉ | 1126/12384 [2:23:40<23:49:34, 7.62s/it, loss=0.0030, acc=0.9933, iter_time=6.18s]
Epoch 0: 9%|▉ | 1126/12384 [2:23:47<23:49:34, 7.62s/it, loss=0.0015, acc=0.9988, iter_time=9.11s]
Epoch 0: 9%|▉ | 1127/12384 [2:23:47<23:51:16, 7.63s/it, loss=0.0015, acc=0.9988, iter_time=9.11s]
Epoch 0: 9%|▉ | 1127/12384 [2:23:55<23:51:16, 7.63s/it, loss=0.0020, acc=0.9968, iter_time=7.98s]
Epoch 0: 9%|▉ | 1128/12384 [2:23:55<23:50:03, 7.62s/it, loss=0.0020, acc=0.9968, iter_time=7.98s]
Epoch 0: 9%|▉ | 1128/12384 [2:24:03<23:50:03, 7.62s/it, loss=0.0019, acc=0.9998, iter_time=4.21s]
Epoch 0: 9%|▉ | 1129/12384 [2:24:03<23:49:07, 7.62s/it, loss=0.0019, acc=0.9998, iter_time=4.21s]
Epoch 0: 9%|▉ | 1129/12384 [2:24:10<23:49:07, 7.62s/it, loss=0.0021, acc=0.9953, iter_time=9.12s]
Epoch 0: 9%|▉ | 1130/12384 [2:24:10<23:47:01, 7.61s/it, loss=0.0021, acc=0.9953, iter_time=9.12s]
Epoch 0: 9%|▉ | 1130/12384 [2:24:18<23:47:01, 7.61s/it, loss=0.0048, acc=0.9911, iter_time=9.10s]
Epoch 0: 9%|▉ | 1131/12384 [2:24:18<23:48:26, 7.62s/it, loss=0.0048, acc=0.9911, iter_time=9.10s]
Epoch 0: 9%|▉ | 1131/12384 [2:24:25<23:48:26, 7.62s/it, loss=0.0023, acc=0.9956, iter_time=7.65s]
Epoch 0: 9%|▉ | 1132/12384 [2:24:25<23:48:37, 7.62s/it, loss=0.0023, acc=0.9956, iter_time=7.65s]
Epoch 0: 9%|▉ | 1132/12384 [2:24:33<23:48:37, 7.62s/it, loss=0.0060, acc=0.9853, iter_time=7.31s]
Epoch 0: 9%|▉ | 1133/12384 [2:24:33<23:47:08, 7.61s/it, loss=0.0060, acc=0.9853, iter_time=7.31s]
Epoch 0: 9%|▉ | 1133/12384 [2:24:41<23:47:08, 7.61s/it, loss=0.0062, acc=0.9846, iter_time=6.70s]
Epoch 0: 9%|▉ | 1134/12384 [2:24:41<23:48:48, 7.62s/it, loss=0.0062, acc=0.9846, iter_time=6.70s]
Epoch 0: 9%|▉ | 1134/12384 [2:24:48<23:48:48, 7.62s/it, loss=0.0059, acc=0.9877, iter_time=7.89s]
Epoch 0: 9%|▉ | 1135/12384 [2:24:48<23:48:54, 7.62s/it, loss=0.0059, acc=0.9877, iter_time=7.89s]
Epoch 0: 9%|▉ | 1135/12384 [2:24:56<23:48:54, 7.62s/it, loss=0.0018, acc=0.9956, iter_time=8.99s]
Epoch 0: 9%|▉ | 1136/12384 [2:24:56<23:50:35, 7.63s/it, loss=0.0018, acc=0.9956, iter_time=8.99s]
Epoch 0: 9%|▉ | 1136/12384 [2:25:04<23:50:35, 7.63s/it, loss=0.0028, acc=0.9941, iter_time=7.22s]
Epoch 0: 9%|▉ | 1137/12384 [2:25:04<23:48:38, 7.62s/it, loss=0.0028, acc=0.9941, iter_time=7.22s]
Epoch 0: 9%|▉ | 1137/12384 [2:25:11<23:48:38, 7.62s/it, loss=0.0018, acc=0.9974, iter_time=7.88s]
Epoch 0: 9%|▉ | 1138/12384 [2:25:11<24:01:44, 7.69s/it, loss=0.0018, acc=0.9974, iter_time=7.88s]
Epoch 0: 9%|▉ | 1138/12384 [2:25:19<24:01:44, 7.69s/it, loss=0.0086, acc=0.9795, iter_time=7.64s]
Epoch 0: 9%|▉ | 1139/12384 [2:25:19<24:16:45, 7.77s/it, loss=0.0086, acc=0.9795, iter_time=7.64s]
Epoch 0: 9%|▉ | 1139/12384 [2:25:27<24:16:45, 7.77s/it, loss=0.0016, acc=0.9998, iter_time=5.38s]
Epoch 0: 9%|▉ | 1140/12384 [2:25:27<24:11:36, 7.75s/it, loss=0.0016, acc=0.9998, iter_time=5.38s]
Epoch 0: 9%|▉ | 1140/12384 [2:25:35<24:11:36, 7.75s/it, loss=0.0015, acc=0.9978, iter_time=10.24s]
Epoch 0: 9%|▉ | 1141/12384 [2:25:35<24:04:10, 7.71s/it, loss=0.0015, acc=0.9978, iter_time=10.24s]
Epoch 0: 9%|▉ | 1141/12384 [2:25:42<24:04:10, 7.71s/it, loss=0.0026, acc=0.9950, iter_time=5.04s]
Epoch 0: 9%|▉ | 1142/12384 [2:25:42<23:58:32, 7.68s/it, loss=0.0026, acc=0.9950, iter_time=5.04s]
Epoch 0: 9%|▉ | 1142/12384 [2:25:50<23:58:32, 7.68s/it, loss=0.0012, acc=0.9982, iter_time=8.92s]
Epoch 0: 9%|▉ | 1143/12384 [2:25:50<23:55:16, 7.66s/it, loss=0.0012, acc=0.9982, iter_time=8.92s]
Epoch 0: 9%|▉ | 1143/12384 [2:25:58<23:55:16, 7.66s/it, loss=0.0024, acc=0.9909, iter_time=9.26s]
Epoch 0: 9%|▉ | 1144/12384 [2:25:58<23:52:52, 7.65s/it, loss=0.0024, acc=0.9909, iter_time=9.26s]
Epoch 0: 9%|▉ | 1144/12384 [2:26:05<23:52:52, 7.65s/it, loss=0.0043, acc=0.9876, iter_time=7.23s]
Epoch 0: 9%|▉ | 1145/12384 [2:26:05<23:51:03, 7.64s/it, loss=0.0043, acc=0.9876, iter_time=7.23s]
Epoch 0: 9%|▉ | 1145/12384 [2:26:13<23:51:03, 7.64s/it, loss=0.0021, acc=0.9979, iter_time=6.11s]
Epoch 0: 9%|▉ | 1146/12384 [2:26:13<23:50:19, 7.64s/it, loss=0.0021, acc=0.9979, iter_time=6.11s]
Epoch 0: 9%|▉ | 1146/12384 [2:26:21<23:50:19, 7.64s/it, loss=0.0052, acc=0.9965, iter_time=9.14s]
Epoch 0: 9%|▉ | 1147/12384 [2:26:21<23:53:45, 7.66s/it, loss=0.0052, acc=0.9965, iter_time=9.14s]
Epoch 0: 9%|▉ | 1147/12384 [2:26:28<23:53:45, 7.66s/it, loss=0.0020, acc=0.9983, iter_time=4.42s]
Epoch 0: 9%|▉ | 1148/12384 [2:26:28<23:52:12, 7.65s/it, loss=0.0020, acc=0.9983, iter_time=4.42s]
Epoch 0: 9%|▉ | 1148/12384 [2:26:36<23:52:12, 7.65s/it, loss=0.0030, acc=0.9913, iter_time=10.90s]
Epoch 0: 9%|▉ | 1149/12384 [2:26:36<23:50:40, 7.64s/it, loss=0.0030, acc=0.9913, iter_time=10.90s]
Epoch 0: 9%|▉ | 1149/12384 [2:26:43<23:50:40, 7.64s/it, loss=0.0054, acc=0.9857, iter_time=8.03s]
Epoch 0: 9%|▉ | 1150/12384 [2:26:43<23:48:18, 7.63s/it, loss=0.0054, acc=0.9857, iter_time=8.03s]
Epoch 0: 9%|▉ | 1150/12384 [2:26:51<23:48:18, 7.63s/it, loss=0.0021, acc=0.9958, iter_time=7.20s]
Epoch 0: 9%|▉ | 1151/12384 [2:26:51<23:49:47, 7.64s/it, loss=0.0021, acc=0.9958, iter_time=7.20s]
Epoch 0: 9%|▉ | 1151/12384 [2:26:59<23:49:47, 7.64s/it, loss=0.0022, acc=0.9931, iter_time=7.66s]
Epoch 0: 9%|▉ | 1152/12384 [2:26:59<23:50:45, 7.64s/it, loss=0.0022, acc=0.9931, iter_time=7.66s]
Epoch 0: 9%|▉ | 1152/12384 [2:27:06<23:50:45, 7.64s/it, loss=0.0062, acc=0.9890, iter_time=5.65s]
Epoch 0: 9%|▉ | 1153/12384 [2:27:06<23:48:08, 7.63s/it, loss=0.0062, acc=0.9890, iter_time=5.65s]
Epoch 0: 9%|▉ | 1153/12384 [2:27:14<23:48:08, 7.63s/it, loss=0.0012, acc=0.9975, iter_time=5.87s]
Epoch 0: 9%|▉ | 1154/12384 [2:27:14<23:48:53, 7.63s/it, loss=0.0012, acc=0.9975, iter_time=5.87s]
Epoch 0: 9%|▉ | 1154/12384 [2:27:22<23:48:53, 7.63s/it, loss=0.0010, acc=0.9977, iter_time=9.87s]
Epoch 0: 9%|▉ | 1155/12384 [2:27:22<23:45:41, 7.62s/it, loss=0.0010, acc=0.9977, iter_time=9.87s]
Epoch 0: 9%|▉ | 1155/12384 [2:27:29<23:45:41, 7.62s/it, loss=0.0004, acc=1.0000, iter_time=9.08s]
Epoch 0: 9%|▉ | 1156/12384 [2:27:29<23:45:19, 7.62s/it, loss=0.0004, acc=1.0000, iter_time=9.08s]
Epoch 0: 9%|▉ | 1156/12384 [2:27:37<23:45:19, 7.62s/it, loss=0.0033, acc=0.9963, iter_time=4.77s]
Epoch 0: 9%|▉ | 1157/12384 [2:27:37<23:43:56, 7.61s/it, loss=0.0033, acc=0.9963, iter_time=4.77s]
Epoch 0: 9%|▉ | 1157/12384 [2:27:44<23:43:56, 7.61s/it, loss=0.0025, acc=0.9946, iter_time=7.41s]
Epoch 0: 9%|▉ | 1158/12384 [2:27:44<23:45:03, 7.62s/it, loss=0.0025, acc=0.9946, iter_time=7.41s]
Epoch 0: 9%|▉ | 1158/12384 [2:27:52<23:45:03, 7.62s/it, loss=0.0033, acc=0.9901, iter_time=10.68s]
Epoch 0: 9%|▉ | 1159/12384 [2:27:52<23:45:07, 7.62s/it, loss=0.0033, acc=0.9901, iter_time=10.68s]
Epoch 0: 9%|▉ | 1159/12384 [2:28:00<23:45:07, 7.62s/it, loss=0.0082, acc=0.9832, iter_time=8.00s]
Epoch 0: 9%|▉ | 1160/12384 [2:28:00<23:47:15, 7.63s/it, loss=0.0082, acc=0.9832, iter_time=8.00s]
Epoch 0: 9%|▉ | 1160/12384 [2:28:07<23:47:15, 7.63s/it, loss=0.0026, acc=0.9970, iter_time=7.27s]
Epoch 0: 9%|▉ | 1161/12384 [2:28:07<23:46:49, 7.63s/it, loss=0.0026, acc=0.9970, iter_time=7.27s]
Epoch 0: 9%|▉ | 1161/12384 [2:28:15<23:46:49, 7.63s/it, loss=0.0020, acc=0.9977, iter_time=7.62s]
Epoch 0: 9%|▉ | 1162/12384 [2:28:15<23:44:41, 7.62s/it, loss=0.0020, acc=0.9977, iter_time=7.62s]
Epoch 0: 9%|▉ | 1162/12384 [2:28:22<23:44:41, 7.62s/it, loss=0.0059, acc=0.9853, iter_time=7.61s]
Epoch 0: 9%|▉ | 1163/12384 [2:28:22<23:46:09, 7.63s/it, loss=0.0059, acc=0.9853, iter_time=7.61s]
Epoch 0: 9%|▉ | 1163/12384 [2:28:30<23:46:09, 7.63s/it, loss=0.0030, acc=0.9947, iter_time=7.63s]
Epoch 0: 9%|▉ | 1164/12384 [2:28:30<23:47:41, 7.63s/it, loss=0.0030, acc=0.9947, iter_time=7.63s]
Epoch 0: 9%|▉ | 1164/12384 [2:28:38<23:47:41, 7.63s/it, loss=0.0025, acc=0.9942, iter_time=7.94s]
Epoch 0: 9%|▉ | 1165/12384 [2:28:38<24:07:09, 7.74s/it, loss=0.0025, acc=0.9942, iter_time=7.94s]
Epoch 0: 9%|▉ | 1165/12384 [2:28:46<24:07:09, 7.74s/it, loss=0.0023, acc=0.9957, iter_time=5.90s]
Epoch 0: 9%|▉ | 1166/12384 [2:28:46<23:59:38, 7.70s/it, loss=0.0023, acc=0.9957, iter_time=5.90s]
Epoch 0: 9%|▉ | 1166/12384 [2:28:53<23:59:38, 7.70s/it, loss=0.0065, acc=0.9885, iter_time=9.39s]
Epoch 0: 9%|▉ | 1167/12384 [2:28:53<23:56:52, 7.69s/it, loss=0.0065, acc=0.9885, iter_time=9.39s]
Epoch 0: 9%|▉ | 1167/12384 [2:29:01<23:56:52, 7.69s/it, loss=0.0015, acc=0.9978, iter_time=8.06s]
Epoch 0: 9%|▉ | 1168/12384 [2:29:01<23:53:34, 7.67s/it, loss=0.0015, acc=0.9978, iter_time=8.06s]
Epoch 0: 9%|▉ | 1168/12384 [2:29:09<23:53:34, 7.67s/it, loss=0.0033, acc=0.9889, iter_time=7.24s]
Epoch 0: 9%|▉ | 1169/12384 [2:29:09<23:50:38, 7.65s/it, loss=0.0033, acc=0.9889, iter_time=7.24s]
Epoch 0: 9%|▉ | 1169/12384 [2:29:16<23:50:38, 7.65s/it, loss=0.0009, acc=0.9990, iter_time=5.83s]
Epoch 0: 9%|▉ | 1170/12384 [2:29:16<23:50:24, 7.65s/it, loss=0.0009, acc=0.9990, iter_time=5.83s]
Epoch 0: 9%|▉ | 1170/12384 [2:29:24<23:50:24, 7.65s/it, loss=0.0049, acc=0.9915, iter_time=9.44s]
Epoch 0: 9%|▉ | 1171/12384 [2:29:24<23:49:31, 7.65s/it, loss=0.0049, acc=0.9915, iter_time=9.44s]
Epoch 0: 9%|▉ | 1171/12384 [2:29:32<23:49:31, 7.65s/it, loss=0.0081, acc=0.9851, iter_time=7.63s]
Epoch 0: 9%|▉ | 1172/12384 [2:29:32<23:47:50, 7.64s/it, loss=0.0081, acc=0.9851, iter_time=7.63s]
Epoch 0: 9%|▉ | 1172/12384 [2:29:39<23:47:50, 7.64s/it, loss=0.0085, acc=0.9846, iter_time=7.65s]
Epoch 0: 9%|▉ | 1173/12384 [2:29:39<23:47:34, 7.64s/it, loss=0.0085, acc=0.9846, iter_time=7.65s]
Epoch 0: 9%|▉ | 1173/12384 [2:29:47<23:47:34, 7.64s/it, loss=0.0014, acc=0.9965, iter_time=7.62s]
Epoch 0: 9%|▉ | 1174/12384 [2:29:47<23:49:29, 7.65s/it, loss=0.0014, acc=0.9965, iter_time=7.62s]
Epoch 0: 9%|▉ | 1174/12384 [2:29:54<23:49:29, 7.65s/it, loss=0.0007, acc=0.9991, iter_time=5.10s]
Epoch 0: 9%|▉ | 1175/12384 [2:29:54<23:46:52, 7.64s/it, loss=0.0007, acc=0.9991, iter_time=5.10s]
Epoch 0: 9%|▉ | 1175/12384 [2:30:02<23:46:52, 7.64s/it, loss=0.0024, acc=0.9959, iter_time=10.56s]
Epoch 0: 9%|▉ | 1176/12384 [2:30:02<23:46:08, 7.63s/it, loss=0.0024, acc=0.9959, iter_time=10.56s]
Epoch 0: 9%|▉ | 1176/12384 [2:30:10<23:46:08, 7.63s/it, loss=0.0026, acc=0.9958, iter_time=7.25s]
Epoch 0: 10%|▉ | 1177/12384 [2:30:10<23:44:29, 7.63s/it, loss=0.0026, acc=0.9958, iter_time=7.25s]
Epoch 0: 10%|▉ | 1177/12384 [2:30:17<23:44:29, 7.63s/it, loss=0.0034, acc=0.9929, iter_time=7.60s]
Epoch 0: 10%|▉ | 1178/12384 [2:30:17<23:42:15, 7.62s/it, loss=0.0034, acc=0.9929, iter_time=7.60s]
Epoch 0: 10%|▉ | 1178/12384 [2:30:25<23:42:15, 7.62s/it, loss=0.0028, acc=0.9944, iter_time=7.70s]
Epoch 0: 10%|▉ | 1179/12384 [2:30:25<23:49:07, 7.65s/it, loss=0.0028, acc=0.9944, iter_time=7.70s]
Epoch 0: 10%|▉ | 1179/12384 [2:30:33<23:49:07, 7.65s/it, loss=0.0004, acc=1.0000, iter_time=7.64s]
Epoch 0: 10%|▉ | 1180/12384 [2:30:33<23:47:11, 7.64s/it, loss=0.0004, acc=1.0000, iter_time=7.64s]
Epoch 0: 10%|▉ | 1180/12384 [2:30:40<23:47:11, 7.64s/it, loss=0.0013, acc=0.9968, iter_time=6.42s]
Epoch 0: 10%|▉ | 1181/12384 [2:30:40<23:40:29, 7.61s/it, loss=0.0013, acc=0.9968, iter_time=6.42s]
Epoch 0: 10%|▉ | 1181/12384 [2:30:48<23:40:29, 7.61s/it, loss=0.0040, acc=0.9933, iter_time=8.73s]
Epoch 0: 10%|▉ | 1182/12384 [2:30:48<23:40:13, 7.61s/it, loss=0.0040, acc=0.9933, iter_time=8.73s]
Epoch 0: 10%|▉ | 1182/12384 [2:30:55<23:40:13, 7.61s/it, loss=0.0040, acc=0.9918, iter_time=5.55s]
Epoch 0: 10%|▉ | 1183/12384 [2:30:55<23:39:36, 7.60s/it, loss=0.0040, acc=0.9918, iter_time=5.55s]
Epoch 0: 10%|▉ | 1183/12384 [2:31:03<23:39:36, 7.60s/it, loss=0.0035, acc=0.9963, iter_time=9.61s]
Epoch 0: 10%|▉ | 1184/12384 [2:31:03<23:40:11, 7.61s/it, loss=0.0035, acc=0.9963, iter_time=9.61s]
Epoch 0: 10%|▉ | 1184/12384 [2:31:11<23:40:11, 7.61s/it, loss=0.0059, acc=0.9922, iter_time=7.65s]
Epoch 0: 10%|▉ | 1185/12384 [2:31:11<23:39:13, 7.60s/it, loss=0.0059, acc=0.9922, iter_time=7.65s]
Epoch 0: 10%|▉ | 1185/12384 [2:31:18<23:39:13, 7.60s/it, loss=0.0024, acc=0.9944, iter_time=7.61s]
Epoch 0: 10%|▉ | 1186/12384 [2:31:18<23:39:40, 7.61s/it, loss=0.0024, acc=0.9944, iter_time=7.61s]
Epoch 0: 10%|▉ | 1186/12384 [2:31:26<23:39:40, 7.61s/it, loss=0.0068, acc=0.9873, iter_time=7.71s]
Epoch 0: 10%|▉ | 1187/12384 [2:31:26<23:45:23, 7.64s/it, loss=0.0068, acc=0.9873, iter_time=7.71s]
Epoch 0: 10%|▉ | 1187/12384 [2:31:34<23:45:23, 7.64s/it, loss=0.0028, acc=0.9921, iter_time=7.61s]
Epoch 0: 10%|▉ | 1188/12384 [2:31:34<23:44:16, 7.63s/it, loss=0.0028, acc=0.9921, iter_time=7.61s]
Epoch 0: 10%|▉ | 1188/12384 [2:31:41<23:44:16, 7.63s/it, loss=0.0046, acc=0.9948, iter_time=7.62s]
Epoch 0: 10%|▉ | 1189/12384 [2:31:41<23:43:30, 7.63s/it, loss=0.0046, acc=0.9948, iter_time=7.62s]
Epoch 0: 10%|▉ | 1189/12384 [2:31:49<23:43:30, 7.63s/it, loss=0.0006, acc=0.9994, iter_time=5.28s]
Epoch 0: 10%|▉ | 1190/12384 [2:31:49<23:41:11, 7.62s/it, loss=0.0006, acc=0.9994, iter_time=5.28s]
Epoch 0: 10%|▉ | 1190/12384 [2:31:56<23:41:11, 7.62s/it, loss=0.0019, acc=0.9951, iter_time=9.93s]
Epoch 0: 10%|▉ | 1191/12384 [2:31:56<23:41:35, 7.62s/it, loss=0.0019, acc=0.9951, iter_time=9.93s]
Epoch 0: 10%|▉ | 1191/12384 [2:32:04<23:41:35, 7.62s/it, loss=0.0023, acc=0.9951, iter_time=8.10s]
Epoch 0: 10%|▉ | 1192/12384 [2:32:04<24:02:45, 7.73s/it, loss=0.0023, acc=0.9951, iter_time=8.10s]
Epoch 0: 10%|▉ | 1192/12384 [2:32:12<24:02:45, 7.73s/it, loss=0.0045, acc=0.9965, iter_time=6.10s]
Epoch 0: 10%|▉ | 1193/12384 [2:32:12<24:01:59, 7.73s/it, loss=0.0045, acc=0.9965, iter_time=6.10s]
Epoch 0: 10%|▉ | 1193/12384 [2:32:20<24:01:59, 7.73s/it, loss=0.0010, acc=0.9997, iter_time=7.64s]
Epoch 0: 10%|▉ | 1194/12384 [2:32:20<23:55:44, 7.70s/it, loss=0.0010, acc=0.9997, iter_time=7.64s]
Epoch 0: 10%|▉ | 1194/12384 [2:32:27<23:55:44, 7.70s/it, loss=0.0057, acc=0.9928, iter_time=9.12s]
Epoch 0: 10%|▉ | 1195/12384 [2:32:27<23:51:03, 7.67s/it, loss=0.0057, acc=0.9928, iter_time=9.12s]
Epoch 0: 10%|▉ | 1195/12384 [2:32:35<23:51:03, 7.67s/it, loss=0.0006, acc=0.9986, iter_time=4.76s]
Epoch 0: 10%|▉ | 1196/12384 [2:32:35<23:46:32, 7.65s/it, loss=0.0006, acc=0.9986, iter_time=4.76s]
Epoch 0: 10%|▉ | 1196/12384 [2:32:43<23:46:32, 7.65s/it, loss=0.0022, acc=0.9961, iter_time=7.92s]
Epoch 0: 10%|▉ | 1197/12384 [2:32:43<23:44:11, 7.64s/it, loss=0.0022, acc=0.9961, iter_time=7.92s]
Epoch 0: 10%|▉ | 1197/12384 [2:32:50<23:44:11, 7.64s/it, loss=0.0095, acc=0.9842, iter_time=8.41s]
Epoch 0: 10%|▉ | 1198/12384 [2:32:50<23:45:00, 7.64s/it, loss=0.0095, acc=0.9842, iter_time=8.41s]
Epoch 0: 10%|▉ | 1198/12384 [2:32:58<23:45:00, 7.64s/it, loss=0.0017, acc=0.9975, iter_time=9.39s]
Epoch 0: 10%|▉ | 1199/12384 [2:32:58<23:46:09, 7.65s/it, loss=0.0017, acc=0.9975, iter_time=9.39s]
Epoch 0: 10%|▉ | 1199/12384 [2:33:05<23:46:09, 7.65s/it, loss=0.0046, acc=0.9872, iter_time=8.06s]
Epoch 0: 10%|▉ | 1200/12384 [2:33:05<23:43:34, 7.64s/it, loss=0.0046, acc=0.9872, iter_time=8.06s]
Epoch 0: 10%|▉ | 1200/12384 [2:33:13<23:43:34, 7.64s/it, loss=0.0009, acc=0.9962, iter_time=3.01s]
Epoch 0: 10%|▉ | 1201/12384 [2:33:13<23:39:06, 7.61s/it, loss=0.0009, acc=0.9962, iter_time=3.01s]
Epoch 0: 10%|▉ | 1201/12384 [2:33:21<23:39:06, 7.61s/it, loss=0.0045, acc=0.9904, iter_time=8.16s]
Epoch 0: 10%|▉ | 1202/12384 [2:33:21<23:43:19, 7.64s/it, loss=0.0045, acc=0.9904, iter_time=8.16s]
Epoch 0: 10%|▉ | 1202/12384 [2:33:28<23:43:19, 7.64s/it, loss=0.0034, acc=0.9887, iter_time=11.27s]
Epoch 0: 10%|▉ | 1203/12384 [2:33:28<23:42:20, 7.63s/it, loss=0.0034, acc=0.9887, iter_time=11.27s]
Epoch 0: 10%|▉ | 1203/12384 [2:33:36<23:42:20, 7.63s/it, loss=0.0030, acc=0.9949, iter_time=5.35s]
Epoch 0: 10%|▉ | 1204/12384 [2:33:36<23:42:14, 7.63s/it, loss=0.0030, acc=0.9949, iter_time=5.35s]
Epoch 0: 10%|▉ | 1204/12384 [2:33:44<23:42:14, 7.63s/it, loss=0.0010, acc=0.9977, iter_time=7.07s]
Epoch 0: 10%|▉ | 1205/12384 [2:33:44<23:40:59, 7.63s/it, loss=0.0010, acc=0.9977, iter_time=7.07s]
Epoch 0: 10%|▉ | 1205/12384 [2:33:51<23:40:59, 7.63s/it, loss=0.0027, acc=0.9942, iter_time=10.46s]
Epoch 0: 10%|▉ | 1206/12384 [2:33:51<23:41:16, 7.63s/it, loss=0.0027, acc=0.9942, iter_time=10.46s]
Epoch 0: 10%|▉ | 1206/12384 [2:33:59<23:41:16, 7.63s/it, loss=0.0029, acc=0.9945, iter_time=7.65s]
Epoch 0: 10%|▉ | 1207/12384 [2:33:59<23:40:33, 7.63s/it, loss=0.0029, acc=0.9945, iter_time=7.65s]
Epoch 0: 10%|▉ | 1207/12384 [2:34:06<23:40:33, 7.63s/it, loss=0.0035, acc=0.9897, iter_time=7.99s]
Epoch 0: 10%|▉ | 1208/12384 [2:34:06<23:38:34, 7.62s/it, loss=0.0035, acc=0.9897, iter_time=7.99s]
Epoch 0: 10%|▉ | 1208/12384 [2:34:14<23:38:34, 7.62s/it, loss=0.0007, acc=0.9981, iter_time=7.23s]
Epoch 0: 10%|▉ | 1209/12384 [2:34:14<23:40:27, 7.63s/it, loss=0.0007, acc=0.9981, iter_time=7.23s]
Epoch 0: 10%|▉ | 1209/12384 [2:34:22<23:40:27, 7.63s/it, loss=0.0037, acc=0.9939, iter_time=7.63s]
Epoch 0: 10%|▉ | 1210/12384 [2:34:22<23:39:15, 7.62s/it, loss=0.0037, acc=0.9939, iter_time=7.63s]
Epoch 0: 10%|▉ | 1210/12384 [2:34:29<23:39:15, 7.62s/it, loss=0.0051, acc=0.9901, iter_time=7.63s]
Epoch 0: 10%|▉ | 1211/12384 [2:34:29<23:40:00, 7.63s/it, loss=0.0051, acc=0.9901, iter_time=7.63s]
Epoch 0: 10%|▉ | 1211/12384 [2:34:37<23:40:00, 7.63s/it, loss=0.0013, acc=0.9969, iter_time=7.64s]
Epoch 0: 10%|▉ | 1212/12384 [2:34:37<23:39:50, 7.63s/it, loss=0.0013, acc=0.9969, iter_time=7.64s]
Epoch 0: 10%|▉ | 1212/12384 [2:34:45<23:39:50, 7.63s/it, loss=0.0008, acc=0.9986, iter_time=7.63s]
Epoch 0: 10%|▉ | 1213/12384 [2:34:45<23:39:41, 7.63s/it, loss=0.0008, acc=0.9986, iter_time=7.63s]
Epoch 0: 10%|▉ | 1213/12384 [2:34:52<23:39:41, 7.63s/it, loss=0.0086, acc=0.9859, iter_time=4.00s]
Epoch 0: 10%|▉ | 1214/12384 [2:34:52<23:41:25, 7.64s/it, loss=0.0086, acc=0.9859, iter_time=4.00s]
Epoch 0: 10%|▉ | 1214/12384 [2:35:00<23:41:25, 7.64s/it, loss=0.0026, acc=0.9962, iter_time=9.18s]
Epoch 0: 10%|▉ | 1215/12384 [2:35:00<23:41:19, 7.64s/it, loss=0.0026, acc=0.9962, iter_time=9.18s]
Epoch 0: 10%|▉ | 1215/12384 [2:35:08<23:41:19, 7.64s/it, loss=0.0024, acc=0.9972, iter_time=9.87s]
Epoch 0: 10%|▉ | 1216/12384 [2:35:08<23:41:43, 7.64s/it, loss=0.0024, acc=0.9972, iter_time=9.87s]
Epoch 0: 10%|▉ | 1216/12384 [2:35:15<23:41:43, 7.64s/it, loss=0.0049, acc=0.9911, iter_time=5.14s]
Epoch 0: 10%|▉ | 1217/12384 [2:35:15<23:41:31, 7.64s/it, loss=0.0049, acc=0.9911, iter_time=5.14s]
Epoch 0: 10%|▉ | 1217/12384 [2:35:23<23:41:31, 7.64s/it, loss=0.0006, acc=1.0000, iter_time=10.03s]
Epoch 0: 10%|▉ | 1218/12384 [2:35:23<24:01:35, 7.75s/it, loss=0.0006, acc=1.0000, iter_time=10.03s]
Epoch 0: 10%|▉ | 1218/12384 [2:35:31<24:01:35, 7.75s/it, loss=0.0005, acc=0.9992, iter_time=7.95s]
Epoch 0: 10%|▉ | 1219/12384 [2:35:31<23:54:06, 7.71s/it, loss=0.0005, acc=0.9992, iter_time=7.95s]
Epoch 0: 10%|▉ | 1219/12384 [2:35:39<23:54:06, 7.71s/it, loss=0.0037, acc=0.9884, iter_time=5.52s]
Epoch 0: 10%|▉ | 1220/12384 [2:35:39<23:55:08, 7.71s/it, loss=0.0037, acc=0.9884, iter_time=5.52s]
Epoch 0: 10%|▉ | 1220/12384 [2:35:46<23:55:08, 7.71s/it, loss=0.0015, acc=0.9915, iter_time=9.83s]
Epoch 0: 10%|▉ | 1221/12384 [2:35:46<23:50:17, 7.69s/it, loss=0.0015, acc=0.9915, iter_time=9.83s]
Epoch 0: 10%|▉ | 1221/12384 [2:35:54<23:50:17, 7.69s/it, loss=0.0010, acc=0.9999, iter_time=7.63s]
Epoch 0: 10%|▉ | 1222/12384 [2:35:54<23:45:44, 7.66s/it, loss=0.0010, acc=0.9999, iter_time=7.63s]
Epoch 0: 10%|▉ | 1222/12384 [2:36:01<23:45:44, 7.66s/it, loss=0.0045, acc=0.9887, iter_time=5.62s]
Epoch 0: 10%|▉ | 1223/12384 [2:36:01<23:44:23, 7.66s/it, loss=0.0045, acc=0.9887, iter_time=5.62s]
Epoch 0: 10%|▉ | 1223/12384 [2:36:09<23:44:23, 7.66s/it, loss=0.0045, acc=0.9916, iter_time=10.01s]
Epoch 0: 10%|▉ | 1224/12384 [2:36:09<23:41:03, 7.64s/it, loss=0.0045, acc=0.9916, iter_time=10.01s]
Epoch 0: 10%|▉ | 1224/12384 [2:36:17<23:41:03, 7.64s/it, loss=0.0026, acc=0.9983, iter_time=7.25s]
Epoch 0: 10%|▉ | 1225/12384 [2:36:17<23:40:04, 7.64s/it, loss=0.0026, acc=0.9983, iter_time=7.25s]
Epoch 0: 10%|▉ | 1225/12384 [2:36:24<23:40:04, 7.64s/it, loss=0.0013, acc=0.9985, iter_time=7.63s]
Epoch 0: 10%|▉ | 1226/12384 [2:36:24<23:40:03, 7.64s/it, loss=0.0013, acc=0.9985, iter_time=7.63s]
Epoch 0: 10%|▉ | 1226/12384 [2:36:32<23:40:03, 7.64s/it, loss=0.0016, acc=0.9919, iter_time=7.61s]
Epoch 0: 10%|▉ | 1227/12384 [2:36:32<23:38:07, 7.63s/it, loss=0.0016, acc=0.9919, iter_time=7.61s]
Epoch 0: 10%|▉ | 1227/12384 [2:36:40<23:38:07, 7.63s/it, loss=0.0051, acc=0.9953, iter_time=5.78s]
Epoch 0: 10%|▉ | 1228/12384 [2:36:40<23:55:41, 7.72s/it, loss=0.0051, acc=0.9953, iter_time=5.78s]
Epoch 0: 10%|▉ | 1228/12384 [2:36:48<23:55:41, 7.72s/it, loss=0.0035, acc=0.9960, iter_time=8.42s]
Epoch 0: 10%|▉ | 1229/12384 [2:36:48<24:02:12, 7.76s/it, loss=0.0035, acc=0.9960, iter_time=8.42s]
Epoch 0: 10%|▉ | 1229/12384 [2:36:55<24:02:12, 7.76s/it, loss=0.0021, acc=0.9960, iter_time=9.18s]
Epoch 0: 10%|▉ | 1230/12384 [2:36:55<23:53:45, 7.71s/it, loss=0.0021, acc=0.9960, iter_time=9.18s]
Epoch 0: 10%|▉ | 1230/12384 [2:37:03<23:53:45, 7.71s/it, loss=0.0004, acc=1.0000, iter_time=7.67s]
Epoch 0: 10%|▉ | 1231/12384 [2:37:03<23:52:43, 7.71s/it, loss=0.0004, acc=1.0000, iter_time=7.67s]
Epoch 0: 10%|▉ | 1231/12384 [2:37:11<23:52:43, 7.71s/it, loss=0.0009, acc=0.9971, iter_time=8.07s]
Epoch 0: 10%|▉ | 1232/12384 [2:37:11<23:49:13, 7.69s/it, loss=0.0009, acc=0.9971, iter_time=8.07s]
Epoch 0: 10%|▉ | 1232/12384 [2:37:18<23:49:13, 7.69s/it, loss=0.0057, acc=0.9894, iter_time=6.55s]
Epoch 0: 10%|▉ | 1233/12384 [2:37:18<23:44:49, 7.67s/it, loss=0.0057, acc=0.9894, iter_time=6.55s]
Epoch 0: 10%|▉ | 1233/12384 [2:37:26<23:44:49, 7.67s/it, loss=0.0028, acc=0.9957, iter_time=8.29s]
Epoch 0: 10%|▉ | 1234/12384 [2:37:26<23:42:56, 7.66s/it, loss=0.0028, acc=0.9957, iter_time=8.29s]
Epoch 0: 10%|▉ | 1234/12384 [2:37:33<23:42:56, 7.66s/it, loss=0.0017, acc=0.9926, iter_time=7.63s]
Epoch 0: 10%|▉ | 1235/12384 [2:37:33<23:42:50, 7.66s/it, loss=0.0017, acc=0.9926, iter_time=7.63s]
Epoch 0: 10%|▉ | 1235/12384 [2:37:41<23:42:50, 7.66s/it, loss=0.0025, acc=0.9932, iter_time=7.67s]
Epoch 0: 10%|▉ | 1236/12384 [2:37:41<23:41:19, 7.65s/it, loss=0.0025, acc=0.9932, iter_time=7.67s]
Epoch 0: 10%|▉ | 1236/12384 [2:37:49<23:41:19, 7.65s/it, loss=0.0009, acc=0.9973, iter_time=7.62s]
Epoch 0: 10%|▉ | 1237/12384 [2:37:49<23:41:07, 7.65s/it, loss=0.0009, acc=0.9973, iter_time=7.62s]
Epoch 0: 10%|▉ | 1237/12384 [2:37:56<23:41:07, 7.65s/it, loss=0.0013, acc=0.9989, iter_time=7.65s]
Epoch 0: 10%|▉ | 1238/12384 [2:37:56<23:39:52, 7.64s/it, loss=0.0013, acc=0.9989, iter_time=7.65s]
Epoch 0: 10%|▉ | 1238/12384 [2:38:04<23:39:52, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=4.30s]
Epoch 0: 10%|█ | 1239/12384 [2:38:04<23:38:52, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=4.30s]
Epoch 0: 10%|█ | 1239/12384 [2:38:12<23:38:52, 7.64s/it, loss=0.0027, acc=0.9915, iter_time=10.89s]
Epoch 0: 10%|█ | 1240/12384 [2:38:12<23:37:56, 7.63s/it, loss=0.0027, acc=0.9915, iter_time=10.89s]
Epoch 0: 10%|█ | 1240/12384 [2:38:19<23:37:56, 7.63s/it, loss=0.0016, acc=0.9968, iter_time=5.41s]
Epoch 0: 10%|█ | 1241/12384 [2:38:19<23:37:42, 7.63s/it, loss=0.0016, acc=0.9968, iter_time=5.41s]
Epoch 0: 10%|█ | 1241/12384 [2:38:27<23:37:42, 7.63s/it, loss=0.0018, acc=0.9977, iter_time=9.89s]
Epoch 0: 10%|█ | 1242/12384 [2:38:27<23:37:44, 7.63s/it, loss=0.0018, acc=0.9977, iter_time=9.89s]
Epoch 0: 10%|█ | 1242/12384 [2:38:35<23:37:44, 7.63s/it, loss=0.0014, acc=0.9955, iter_time=7.65s]
Epoch 0: 10%|█ | 1243/12384 [2:38:35<23:39:41, 7.65s/it, loss=0.0014, acc=0.9955, iter_time=7.65s]
Epoch 0: 10%|█ | 1243/12384 [2:38:42<23:39:41, 7.65s/it, loss=0.0013, acc=0.9973, iter_time=7.96s]
Epoch 0: 10%|█ | 1244/12384 [2:38:42<23:53:40, 7.72s/it, loss=0.0013, acc=0.9973, iter_time=7.96s]
Epoch 0: 10%|█ | 1244/12384 [2:38:50<23:53:40, 7.72s/it, loss=0.0019, acc=0.9973, iter_time=7.35s]
Epoch 0: 10%|█ | 1245/12384 [2:38:50<24:05:31, 7.79s/it, loss=0.0019, acc=0.9973, iter_time=7.35s]
Epoch 0: 10%|█ | 1245/12384 [2:38:58<24:05:31, 7.79s/it, loss=0.0016, acc=0.9977, iter_time=8.20s]
Epoch 0: 10%|█ | 1246/12384 [2:38:58<23:57:00, 7.74s/it, loss=0.0016, acc=0.9977, iter_time=8.20s]
Epoch 0: 10%|█ | 1246/12384 [2:39:06<23:57:00, 7.74s/it, loss=0.0050, acc=0.9893, iter_time=4.79s]
Epoch 0: 10%|█ | 1247/12384 [2:39:06<23:51:46, 7.71s/it, loss=0.0050, acc=0.9893, iter_time=4.79s]
Epoch 0: 10%|█ | 1247/12384 [2:39:13<23:51:46, 7.71s/it, loss=0.0004, acc=0.9991, iter_time=10.44s]
Epoch 0: 10%|█ | 1248/12384 [2:39:13<23:46:12, 7.68s/it, loss=0.0004, acc=0.9991, iter_time=10.44s]
Epoch 0: 10%|█ | 1248/12384 [2:39:21<23:46:12, 7.68s/it, loss=0.0011, acc=0.9985, iter_time=7.66s]
Epoch 0: 10%|█ | 1249/12384 [2:39:21<23:42:36, 7.67s/it, loss=0.0011, acc=0.9985, iter_time=7.66s]
Epoch 0: 10%|█ | 1249/12384 [2:39:29<23:42:36, 7.67s/it, loss=0.0050, acc=0.9874, iter_time=8.04s]
Epoch 0: 10%|█ | 1250/12384 [2:39:29<23:40:32, 7.66s/it, loss=0.0050, acc=0.9874, iter_time=8.04s]
Epoch 0: 10%|█ | 1250/12384 [2:39:36<23:40:32, 7.66s/it, loss=0.0013, acc=0.9988, iter_time=7.19s]
Epoch 0: 10%|█ | 1251/12384 [2:39:36<23:36:45, 7.64s/it, loss=0.0013, acc=0.9988, iter_time=7.19s]
Epoch 0: 10%|█ | 1251/12384 [2:39:44<23:36:45, 7.64s/it, loss=0.0021, acc=0.9985, iter_time=7.62s]
Epoch 0: 10%|█ | 1252/12384 [2:39:44<23:38:53, 7.65s/it, loss=0.0021, acc=0.9985, iter_time=7.62s]
Epoch 0: 10%|█ | 1252/12384 [2:39:52<23:38:53, 7.65s/it, loss=0.0027, acc=0.9948, iter_time=7.14s]
Epoch 0: 10%|█ | 1253/12384 [2:39:52<23:40:12, 7.66s/it, loss=0.0027, acc=0.9948, iter_time=7.14s]
Epoch 0: 10%|█ | 1253/12384 [2:39:59<23:40:12, 7.66s/it, loss=0.0023, acc=0.9969, iter_time=8.21s]
Epoch 0: 10%|█ | 1254/12384 [2:39:59<23:37:50, 7.64s/it, loss=0.0023, acc=0.9969, iter_time=8.21s]
Epoch 0: 10%|█ | 1254/12384 [2:40:07<23:37:50, 7.64s/it, loss=0.0040, acc=0.9939, iter_time=7.62s]
Epoch 0: 10%|█ | 1255/12384 [2:40:07<23:37:31, 7.64s/it, loss=0.0040, acc=0.9939, iter_time=7.62s]
Epoch 0: 10%|█ | 1255/12384 [2:40:14<23:37:31, 7.64s/it, loss=0.0046, acc=0.9950, iter_time=7.79s]
Epoch 0: 10%|█ | 1256/12384 [2:40:14<23:37:21, 7.64s/it, loss=0.0046, acc=0.9950, iter_time=7.79s]
Epoch 0: 10%|█ | 1256/12384 [2:40:22<23:37:21, 7.64s/it, loss=0.0023, acc=0.9920, iter_time=7.49s]
Epoch 0: 10%|█ | 1257/12384 [2:40:22<23:37:52, 7.65s/it, loss=0.0023, acc=0.9920, iter_time=7.49s]
Epoch 0: 10%|█ | 1257/12384 [2:40:31<23:37:52, 7.65s/it, loss=0.0018, acc=0.9976, iter_time=7.25s]
Epoch 0: 10%|█ | 1258/12384 [2:40:31<24:32:45, 7.94s/it, loss=0.0018, acc=0.9976, iter_time=7.25s]
Epoch 0: 10%|█ | 1258/12384 [2:40:39<24:32:45, 7.94s/it, loss=0.0068, acc=0.9937, iter_time=9.48s]
Epoch 0: 10%|█ | 1259/12384 [2:40:39<24:39:00, 7.98s/it, loss=0.0068, acc=0.9937, iter_time=9.48s]
Epoch 0: 10%|█ | 1259/12384 [2:40:46<24:39:00, 7.98s/it, loss=0.0009, acc=0.9995, iter_time=6.99s]
Epoch 0: 10%|█ | 1260/12384 [2:40:46<24:20:12, 7.88s/it, loss=0.0009, acc=0.9995, iter_time=6.99s]
Epoch 0: 10%|█ | 1260/12384 [2:40:54<24:20:12, 7.88s/it, loss=0.0020, acc=0.9966, iter_time=8.24s]
Epoch 0: 10%|█ | 1261/12384 [2:40:54<24:03:57, 7.79s/it, loss=0.0020, acc=0.9966, iter_time=8.24s]
Epoch 0: 10%|█ | 1261/12384 [2:41:02<24:03:57, 7.79s/it, loss=0.0032, acc=0.9925, iter_time=7.60s]
Epoch 0: 10%|█ | 1262/12384 [2:41:02<23:56:23, 7.75s/it, loss=0.0032, acc=0.9925, iter_time=7.60s]
Epoch 0: 10%|█ | 1262/12384 [2:41:09<23:56:23, 7.75s/it, loss=0.0014, acc=0.9984, iter_time=7.66s]
Epoch 0: 10%|█ | 1263/12384 [2:41:09<23:50:14, 7.72s/it, loss=0.0014, acc=0.9984, iter_time=7.66s]
Epoch 0: 10%|█ | 1263/12384 [2:41:17<23:50:14, 7.72s/it, loss=0.0015, acc=0.9954, iter_time=7.73s]
Epoch 0: 10%|█ | 1264/12384 [2:41:17<23:45:33, 7.69s/it, loss=0.0015, acc=0.9954, iter_time=7.73s]
Epoch 0: 10%|█ | 1264/12384 [2:41:25<23:45:33, 7.69s/it, loss=0.0032, acc=0.9940, iter_time=7.54s]
Epoch 0: 10%|█ | 1265/12384 [2:41:25<23:41:28, 7.67s/it, loss=0.0032, acc=0.9940, iter_time=7.54s]
Epoch 0: 10%|█ | 1265/12384 [2:41:33<23:41:28, 7.67s/it, loss=0.0019, acc=0.9945, iter_time=8.78s]
Epoch 0: 10%|█ | 1266/12384 [2:41:33<24:46:07, 8.02s/it, loss=0.0019, acc=0.9945, iter_time=8.78s]
Epoch 0: 10%|█ | 1266/12384 [2:41:41<24:46:07, 8.02s/it, loss=0.0023, acc=0.9930, iter_time=5.06s]
Epoch 0: 10%|█ | 1267/12384 [2:41:41<24:24:09, 7.90s/it, loss=0.0023, acc=0.9930, iter_time=5.06s]
Epoch 0: 10%|█ | 1267/12384 [2:41:49<24:24:09, 7.90s/it, loss=0.0022, acc=0.9947, iter_time=10.23s]
Epoch 0: 10%|█ | 1268/12384 [2:41:49<24:08:42, 7.82s/it, loss=0.0022, acc=0.9947, iter_time=10.23s]
Epoch 0: 10%|█ | 1268/12384 [2:41:56<24:08:42, 7.82s/it, loss=0.0020, acc=0.9968, iter_time=7.62s]
Epoch 0: 10%|█ | 1269/12384 [2:41:56<23:57:01, 7.76s/it, loss=0.0020, acc=0.9968, iter_time=7.62s]
Epoch 0: 10%|█ | 1269/12384 [2:42:04<23:57:01, 7.76s/it, loss=0.0016, acc=0.9966, iter_time=7.63s]
Epoch 0: 10%|█ | 1270/12384 [2:42:04<23:48:42, 7.71s/it, loss=0.0016, acc=0.9966, iter_time=7.63s]
Epoch 0: 10%|█ | 1270/12384 [2:42:12<23:48:42, 7.71s/it, loss=0.0022, acc=0.9952, iter_time=8.00s]
Epoch 0: 10%|█ | 1271/12384 [2:42:12<24:04:42, 7.80s/it, loss=0.0022, acc=0.9952, iter_time=8.00s]
Epoch 0: 10%|█ | 1271/12384 [2:42:19<24:04:42, 7.80s/it, loss=0.0109, acc=0.9800, iter_time=7.98s]
Epoch 0: 10%|█ | 1272/12384 [2:42:19<23:55:40, 7.75s/it, loss=0.0109, acc=0.9800, iter_time=7.98s]
Epoch 0: 10%|█ | 1272/12384 [2:42:27<23:55:40, 7.75s/it, loss=0.0036, acc=0.9902, iter_time=7.27s]
Epoch 0: 10%|█ | 1273/12384 [2:42:27<23:50:17, 7.72s/it, loss=0.0036, acc=0.9902, iter_time=7.27s]
Epoch 0: 10%|█ | 1273/12384 [2:42:35<23:50:17, 7.72s/it, loss=0.0007, acc=0.9990, iter_time=7.67s]
Epoch 0: 10%|█ | 1274/12384 [2:42:35<23:44:53, 7.70s/it, loss=0.0007, acc=0.9990, iter_time=7.67s]
Epoch 0: 10%|█ | 1274/12384 [2:42:42<23:44:53, 7.70s/it, loss=0.0225, acc=0.9631, iter_time=7.61s]
Epoch 0: 10%|█ | 1275/12384 [2:42:42<23:41:11, 7.68s/it, loss=0.0225, acc=0.9631, iter_time=7.61s]
Epoch 0: 10%|█ | 1275/12384 [2:42:50<23:41:11, 7.68s/it, loss=0.0045, acc=0.9963, iter_time=7.64s]
Epoch 0: 10%|█ | 1276/12384 [2:42:50<23:40:05, 7.67s/it, loss=0.0045, acc=0.9963, iter_time=7.64s]
Epoch 0: 10%|█ | 1276/12384 [2:42:58<23:40:05, 7.67s/it, loss=0.0020, acc=0.9943, iter_time=7.67s]
Epoch 0: 10%|█ | 1277/12384 [2:42:58<23:40:02, 7.67s/it, loss=0.0020, acc=0.9943, iter_time=7.67s]
Epoch 0: 10%|█ | 1277/12384 [2:43:05<23:40:02, 7.67s/it, loss=0.0007, acc=0.9991, iter_time=5.66s]
Epoch 0: 10%|█ | 1278/12384 [2:43:05<23:34:18, 7.64s/it, loss=0.0007, acc=0.9991, iter_time=5.66s]
Epoch 0: 10%|█ | 1278/12384 [2:43:13<23:34:18, 7.64s/it, loss=0.0024, acc=0.9970, iter_time=9.56s]
Epoch 0: 10%|█ | 1279/12384 [2:43:13<23:33:08, 7.64s/it, loss=0.0024, acc=0.9970, iter_time=9.56s]
Epoch 0: 10%|█ | 1279/12384 [2:43:21<23:33:08, 7.64s/it, loss=0.0004, acc=1.0000, iter_time=7.58s]
Epoch 0: 10%|█ | 1280/12384 [2:43:21<23:32:11, 7.63s/it, loss=0.0004, acc=1.0000, iter_time=7.58s]
Epoch 0: 10%|█ | 1280/12384 [2:43:28<23:32:11, 7.63s/it, loss=0.0018, acc=0.9980, iter_time=6.42s]
Epoch 0: 10%|█ | 1281/12384 [2:43:28<23:33:36, 7.64s/it, loss=0.0018, acc=0.9980, iter_time=6.42s]
Epoch 0: 10%|█ | 1281/12384 [2:43:36<23:33:36, 7.64s/it, loss=0.0370, acc=0.9481, iter_time=8.92s]
Epoch 0: 10%|█ | 1282/12384 [2:43:36<23:32:31, 7.63s/it, loss=0.0370, acc=0.9481, iter_time=8.92s]
Epoch 0: 10%|█ | 1282/12384 [2:43:43<23:32:31, 7.63s/it, loss=0.0005, acc=0.9993, iter_time=5.51s]
Epoch 0: 10%|█ | 1283/12384 [2:43:43<23:33:03, 7.64s/it, loss=0.0005, acc=0.9993, iter_time=5.51s]
Epoch 0: 10%|█ | 1283/12384 [2:43:51<23:33:03, 7.64s/it, loss=0.0015, acc=0.9951, iter_time=9.75s]
Epoch 0: 10%|█ | 1284/12384 [2:43:51<23:33:22, 7.64s/it, loss=0.0015, acc=0.9951, iter_time=9.75s]
Epoch 0: 10%|█ | 1284/12384 [2:43:59<23:33:22, 7.64s/it, loss=0.0038, acc=0.9940, iter_time=4.32s]
Epoch 0: 10%|█ | 1285/12384 [2:43:59<23:34:37, 7.65s/it, loss=0.0038, acc=0.9940, iter_time=4.32s]
Epoch 0: 10%|█ | 1285/12384 [2:44:06<23:34:37, 7.65s/it, loss=0.0010, acc=1.0000, iter_time=10.96s]
Epoch 0: 10%|█ | 1286/12384 [2:44:06<23:33:08, 7.64s/it, loss=0.0010, acc=1.0000, iter_time=10.96s]
Epoch 0: 10%|█ | 1286/12384 [2:44:14<23:33:08, 7.64s/it, loss=0.0007, acc=0.9979, iter_time=7.33s]
Epoch 0: 10%|█ | 1287/12384 [2:44:14<23:33:29, 7.64s/it, loss=0.0007, acc=0.9979, iter_time=7.33s]
Epoch 0: 10%|█ | 1287/12384 [2:44:22<23:33:29, 7.64s/it, loss=0.0015, acc=0.9954, iter_time=7.93s]
Epoch 0: 10%|█ | 1288/12384 [2:44:22<23:33:00, 7.64s/it, loss=0.0015, acc=0.9954, iter_time=7.93s]
Epoch 0: 10%|█ | 1288/12384 [2:44:29<23:33:00, 7.64s/it, loss=0.0015, acc=0.9969, iter_time=7.67s]
Epoch 0: 10%|█ | 1289/12384 [2:44:29<23:31:30, 7.63s/it, loss=0.0015, acc=0.9969, iter_time=7.67s]
Epoch 0: 10%|█ | 1289/12384 [2:44:37<23:31:30, 7.63s/it, loss=0.0031, acc=0.9954, iter_time=7.61s]
Epoch 0: 10%|█ | 1290/12384 [2:44:37<23:29:38, 7.62s/it, loss=0.0031, acc=0.9954, iter_time=7.61s]
Epoch 0: 10%|█ | 1290/12384 [2:44:45<23:29:38, 7.62s/it, loss=0.0005, acc=0.9983, iter_time=5.26s]
Epoch 0: 10%|█ | 1291/12384 [2:44:45<23:30:09, 7.63s/it, loss=0.0005, acc=0.9983, iter_time=5.26s]
Epoch 0: 10%|█ | 1291/12384 [2:44:52<23:30:09, 7.63s/it, loss=0.0014, acc=0.9966, iter_time=9.97s]
Epoch 0: 10%|█ | 1292/12384 [2:44:52<23:28:58, 7.62s/it, loss=0.0014, acc=0.9966, iter_time=9.97s]
Epoch 0: 10%|█ | 1292/12384 [2:45:00<23:28:58, 7.62s/it, loss=0.0007, acc=0.9974, iter_time=7.61s]
Epoch 0: 10%|█ | 1293/12384 [2:45:00<23:27:26, 7.61s/it, loss=0.0007, acc=0.9974, iter_time=7.61s]
Epoch 0: 10%|█ | 1293/12384 [2:45:07<23:27:26, 7.61s/it, loss=0.0015, acc=0.9986, iter_time=6.40s]
Epoch 0: 10%|█ | 1294/12384 [2:45:07<23:28:17, 7.62s/it, loss=0.0015, acc=0.9986, iter_time=6.40s]
Epoch 0: 10%|█ | 1294/12384 [2:45:15<23:28:17, 7.62s/it, loss=0.0008, acc=0.9999, iter_time=8.85s]
Epoch 0: 10%|█ | 1295/12384 [2:45:15<23:27:38, 7.62s/it, loss=0.0008, acc=0.9999, iter_time=8.85s]
Epoch 0: 10%|█ | 1295/12384 [2:45:23<23:27:38, 7.62s/it, loss=0.0011, acc=0.9996, iter_time=7.56s]
Epoch 0: 10%|█ | 1296/12384 [2:45:23<23:27:46, 7.62s/it, loss=0.0011, acc=0.9996, iter_time=7.56s]
Epoch 0: 10%|█ | 1296/12384 [2:45:31<23:27:46, 7.62s/it, loss=0.0014, acc=0.9974, iter_time=7.67s]
Epoch 0: 10%|█ | 1297/12384 [2:45:31<23:44:33, 7.71s/it, loss=0.0014, acc=0.9974, iter_time=7.67s]
Epoch 0: 10%|█ | 1297/12384 [2:45:38<23:44:33, 7.71s/it, loss=0.0012, acc=0.9978, iter_time=7.92s]
Epoch 0: 10%|█ | 1298/12384 [2:45:38<23:41:19, 7.69s/it, loss=0.0012, acc=0.9978, iter_time=7.92s]
Epoch 0: 10%|█ | 1298/12384 [2:45:46<23:41:19, 7.69s/it, loss=0.0009, acc=0.9982, iter_time=7.63s]
Epoch 0: 10%|█ | 1299/12384 [2:45:46<23:35:49, 7.66s/it, loss=0.0009, acc=0.9982, iter_time=7.63s]
Epoch 0: 10%|█ | 1299/12384 [2:45:53<23:35:49, 7.66s/it, loss=0.0009, acc=0.9992, iter_time=8.02s]
Epoch 0: 10%|█ | 1300/12384 [2:45:53<23:33:25, 7.65s/it, loss=0.0009, acc=0.9992, iter_time=8.02s]
Epoch 0: 10%|█ | 1300/12384 [2:46:01<23:33:25, 7.65s/it, loss=0.0020, acc=0.9980, iter_time=5.12s]
Epoch 0: 11%|█ | 1301/12384 [2:46:01<23:34:20, 7.66s/it, loss=0.0020, acc=0.9980, iter_time=5.12s]
Epoch 0: 11%|█ | 1301/12384 [2:46:09<23:34:20, 7.66s/it, loss=0.0051, acc=0.9890, iter_time=9.75s]
Epoch 0: 11%|█ | 1302/12384 [2:46:09<23:30:35, 7.64s/it, loss=0.0051, acc=0.9890, iter_time=9.75s]
Epoch 0: 11%|█ | 1302/12384 [2:46:16<23:30:35, 7.64s/it, loss=0.0028, acc=0.9950, iter_time=7.59s]
Epoch 0: 11%|█ | 1303/12384 [2:46:16<23:28:46, 7.63s/it, loss=0.0028, acc=0.9950, iter_time=7.59s]
Epoch 0: 11%|█ | 1303/12384 [2:46:24<23:28:46, 7.63s/it, loss=0.0018, acc=0.9936, iter_time=7.98s]
Epoch 0: 11%|█ | 1304/12384 [2:46:24<23:27:47, 7.62s/it, loss=0.0018, acc=0.9936, iter_time=7.98s]
Epoch 0: 11%|█ | 1304/12384 [2:46:32<23:27:47, 7.62s/it, loss=0.0009, acc=0.9979, iter_time=7.25s]
Epoch 0: 11%|█ | 1305/12384 [2:46:32<23:28:32, 7.63s/it, loss=0.0009, acc=0.9979, iter_time=7.25s]
Epoch 0: 11%|█ | 1305/12384 [2:46:39<23:28:32, 7.63s/it, loss=0.0008, acc=1.0000, iter_time=2.76s]
Epoch 0: 11%|█ | 1306/12384 [2:46:39<23:26:14, 7.62s/it, loss=0.0008, acc=1.0000, iter_time=2.76s]
Epoch 0: 11%|█ | 1306/12384 [2:46:47<23:26:14, 7.62s/it, loss=0.0011, acc=0.9978, iter_time=12.45s]
Epoch 0: 11%|█ | 1307/12384 [2:46:47<23:27:06, 7.62s/it, loss=0.0011, acc=0.9978, iter_time=12.45s]
Epoch 0: 11%|█ | 1307/12384 [2:46:54<23:27:06, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=7.64s]
Epoch 0: 11%|█ | 1308/12384 [2:46:54<23:27:42, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.64s]
Epoch 0: 11%|█ | 1308/12384 [2:47:02<23:27:42, 7.63s/it, loss=0.0026, acc=0.9920, iter_time=7.64s]
Epoch 0: 11%|█ | 1309/12384 [2:47:02<23:31:59, 7.65s/it, loss=0.0026, acc=0.9920, iter_time=7.64s]
Epoch 0: 11%|█ | 1309/12384 [2:47:10<23:31:59, 7.65s/it, loss=0.0018, acc=0.9961, iter_time=7.69s]
Epoch 0: 11%|█ | 1310/12384 [2:47:10<23:29:53, 7.64s/it, loss=0.0018, acc=0.9961, iter_time=7.69s]
Epoch 0: 11%|█ | 1310/12384 [2:47:17<23:29:53, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=7.63s]
Epoch 0: 11%|█ | 1311/12384 [2:47:17<23:27:24, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.63s]
Epoch 0: 11%|█ | 1311/12384 [2:47:25<23:27:24, 7.63s/it, loss=0.0026, acc=0.9940, iter_time=7.61s]
Epoch 0: 11%|█ | 1312/12384 [2:47:25<23:30:48, 7.65s/it, loss=0.0026, acc=0.9940, iter_time=7.61s]
Epoch 0: 11%|█ | 1312/12384 [2:47:33<23:30:48, 7.65s/it, loss=0.0020, acc=0.9969, iter_time=7.67s]
Epoch 0: 11%|█ | 1313/12384 [2:47:33<23:28:25, 7.63s/it, loss=0.0020, acc=0.9969, iter_time=7.67s]
Epoch 0: 11%|█ | 1313/12384 [2:47:40<23:28:25, 7.63s/it, loss=0.0014, acc=0.9957, iter_time=7.61s]
Epoch 0: 11%|█ | 1314/12384 [2:47:40<23:28:52, 7.64s/it, loss=0.0014, acc=0.9957, iter_time=7.61s]
Epoch 0: 11%|█ | 1314/12384 [2:47:48<23:28:52, 7.64s/it, loss=0.0013, acc=0.9971, iter_time=7.64s]
Epoch 0: 11%|█ | 1315/12384 [2:47:48<23:28:22, 7.63s/it, loss=0.0013, acc=0.9971, iter_time=7.64s]
Epoch 0: 11%|█ | 1315/12384 [2:47:56<23:28:22, 7.63s/it, loss=0.0030, acc=0.9924, iter_time=7.64s]
Epoch 0: 11%|█ | 1316/12384 [2:47:56<23:28:28, 7.64s/it, loss=0.0030, acc=0.9924, iter_time=7.64s]
Epoch 0: 11%|█ | 1316/12384 [2:48:03<23:28:28, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=6.68s]
Epoch 0: 11%|█ | 1317/12384 [2:48:03<23:25:45, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=6.68s]
Epoch 0: 11%|█ | 1317/12384 [2:48:11<23:25:45, 7.62s/it, loss=0.0025, acc=0.9951, iter_time=8.53s]
Epoch 0: 11%|█ | 1318/12384 [2:48:11<23:26:19, 7.63s/it, loss=0.0025, acc=0.9951, iter_time=8.53s]
Epoch 0: 11%|█ | 1318/12384 [2:48:18<23:26:19, 7.63s/it, loss=0.0006, acc=0.9979, iter_time=6.12s]
Epoch 0: 11%|█ | 1319/12384 [2:48:18<23:25:14, 7.62s/it, loss=0.0006, acc=0.9979, iter_time=6.12s]
Epoch 0: 11%|█ | 1319/12384 [2:48:26<23:25:14, 7.62s/it, loss=0.0042, acc=0.9955, iter_time=9.51s]
Epoch 0: 11%|█ | 1320/12384 [2:48:26<23:29:52, 7.65s/it, loss=0.0042, acc=0.9955, iter_time=9.51s]
Epoch 0: 11%|█ | 1320/12384 [2:48:34<23:29:52, 7.65s/it, loss=0.0033, acc=0.9970, iter_time=3.02s]
Epoch 0: 11%|█ | 1321/12384 [2:48:34<23:27:46, 7.64s/it, loss=0.0033, acc=0.9970, iter_time=3.02s]
Epoch 0: 11%|█ | 1321/12384 [2:48:41<23:27:46, 7.64s/it, loss=0.0052, acc=0.9919, iter_time=8.65s]
Epoch 0: 11%|█ | 1322/12384 [2:48:41<23:30:44, 7.65s/it, loss=0.0052, acc=0.9919, iter_time=8.65s]
Epoch 0: 11%|█ | 1322/12384 [2:48:49<23:30:44, 7.65s/it, loss=0.0019, acc=0.9965, iter_time=10.98s]
Epoch 0: 11%|█ | 1323/12384 [2:48:49<23:50:43, 7.76s/it, loss=0.0019, acc=0.9965, iter_time=10.98s]
Epoch 0: 11%|█ | 1323/12384 [2:48:57<23:50:43, 7.76s/it, loss=0.0040, acc=0.9948, iter_time=7.96s]
Epoch 0: 11%|█ | 1324/12384 [2:48:57<23:40:56, 7.71s/it, loss=0.0040, acc=0.9948, iter_time=7.96s]
Epoch 0: 11%|█ | 1324/12384 [2:49:05<23:40:56, 7.71s/it, loss=0.0020, acc=0.9962, iter_time=7.07s]
Epoch 0: 11%|█ | 1325/12384 [2:49:05<23:35:45, 7.68s/it, loss=0.0020, acc=0.9962, iter_time=7.07s]
Epoch 0: 11%|█ | 1325/12384 [2:49:12<23:35:45, 7.68s/it, loss=0.0021, acc=0.9964, iter_time=8.15s]
Epoch 0: 11%|█ | 1326/12384 [2:49:12<23:35:09, 7.68s/it, loss=0.0021, acc=0.9964, iter_time=8.15s]
Epoch 0: 11%|█ | 1326/12384 [2:49:20<23:35:09, 7.68s/it, loss=0.0052, acc=0.9894, iter_time=7.69s]
Epoch 0: 11%|█ | 1327/12384 [2:49:20<23:33:00, 7.67s/it, loss=0.0052, acc=0.9894, iter_time=7.69s]
Epoch 0: 11%|█ | 1327/12384 [2:49:27<23:33:00, 7.67s/it, loss=0.0020, acc=0.9931, iter_time=8.02s]
Epoch 0: 11%|█ | 1328/12384 [2:49:27<23:29:15, 7.65s/it, loss=0.0020, acc=0.9931, iter_time=8.02s]
Epoch 0: 11%|█ | 1328/12384 [2:49:35<23:29:15, 7.65s/it, loss=0.0017, acc=0.9981, iter_time=7.22s]
Epoch 0: 11%|█ | 1329/12384 [2:49:35<23:27:27, 7.64s/it, loss=0.0017, acc=0.9981, iter_time=7.22s]
Epoch 0: 11%|█ | 1329/12384 [2:49:43<23:27:27, 7.64s/it, loss=0.0023, acc=0.9969, iter_time=6.39s]
Epoch 0: 11%|█ | 1330/12384 [2:49:43<23:25:25, 7.63s/it, loss=0.0023, acc=0.9969, iter_time=6.39s]
Epoch 0: 11%|█ | 1330/12384 [2:49:50<23:25:25, 7.63s/it, loss=0.0037, acc=0.9956, iter_time=8.81s]
Epoch 0: 11%|█ | 1331/12384 [2:49:50<23:24:30, 7.62s/it, loss=0.0037, acc=0.9956, iter_time=8.81s]
Epoch 0: 11%|█ | 1331/12384 [2:49:58<23:24:30, 7.62s/it, loss=0.0016, acc=0.9969, iter_time=7.08s]
Epoch 0: 11%|█ | 1332/12384 [2:49:58<23:29:17, 7.65s/it, loss=0.0016, acc=0.9969, iter_time=7.08s]
Epoch 0: 11%|█ | 1332/12384 [2:50:06<23:29:17, 7.65s/it, loss=0.0008, acc=0.9974, iter_time=5.41s]
Epoch 0: 11%|█ | 1333/12384 [2:50:06<23:34:26, 7.68s/it, loss=0.0008, acc=0.9974, iter_time=5.41s]
Epoch 0: 11%|█ | 1333/12384 [2:50:13<23:34:26, 7.68s/it, loss=0.0003, acc=1.0000, iter_time=7.74s]
Epoch 0: 11%|█ | 1334/12384 [2:50:13<23:34:02, 7.68s/it, loss=0.0003, acc=1.0000, iter_time=7.74s]
Epoch 0: 11%|█ | 1334/12384 [2:50:21<23:34:02, 7.68s/it, loss=0.0009, acc=0.9973, iter_time=10.53s]
Epoch 0: 11%|█ | 1335/12384 [2:50:21<23:32:08, 7.67s/it, loss=0.0009, acc=0.9973, iter_time=10.53s]
Epoch 0: 11%|█ | 1335/12384 [2:50:29<23:32:08, 7.67s/it, loss=0.0017, acc=0.9960, iter_time=8.02s]
Epoch 0: 11%|█ | 1336/12384 [2:50:29<23:28:59, 7.65s/it, loss=0.0017, acc=0.9960, iter_time=8.02s]
Epoch 0: 11%|█ | 1336/12384 [2:50:36<23:28:59, 7.65s/it, loss=0.0069, acc=0.9884, iter_time=7.24s]
Epoch 0: 11%|█ | 1337/12384 [2:50:36<23:30:32, 7.66s/it, loss=0.0069, acc=0.9884, iter_time=7.24s]
Epoch 0: 11%|█ | 1337/12384 [2:50:44<23:30:32, 7.66s/it, loss=0.0005, acc=1.0000, iter_time=7.69s]
Epoch 0: 11%|█ | 1338/12384 [2:50:44<23:30:14, 7.66s/it, loss=0.0005, acc=1.0000, iter_time=7.69s]
Epoch 0: 11%|█ | 1338/12384 [2:50:52<23:30:14, 7.66s/it, loss=0.0011, acc=0.9988, iter_time=7.66s]
Epoch 0: 11%|█ | 1339/12384 [2:50:52<23:28:57, 7.65s/it, loss=0.0011, acc=0.9988, iter_time=7.66s]
Epoch 0: 11%|█ | 1339/12384 [2:50:59<23:28:57, 7.65s/it, loss=0.0009, acc=0.9997, iter_time=7.61s]
Epoch 0: 11%|█ | 1340/12384 [2:50:59<23:28:07, 7.65s/it, loss=0.0009, acc=0.9997, iter_time=7.61s]
Epoch 0: 11%|█ | 1340/12384 [2:51:07<23:28:07, 7.65s/it, loss=0.0023, acc=0.9950, iter_time=7.65s]
Epoch 0: 11%|█ | 1341/12384 [2:51:07<23:24:54, 7.63s/it, loss=0.0023, acc=0.9950, iter_time=7.65s]
Epoch 0: 11%|█ | 1341/12384 [2:51:15<23:24:54, 7.63s/it, loss=0.0028, acc=0.9939, iter_time=7.58s]
Epoch 0: 11%|█ | 1342/12384 [2:51:15<23:22:27, 7.62s/it, loss=0.0028, acc=0.9939, iter_time=7.58s]
Epoch 0: 11%|█ | 1342/12384 [2:51:22<23:22:27, 7.62s/it, loss=0.0016, acc=0.9969, iter_time=7.61s]
Epoch 0: 11%|█ | 1343/12384 [2:51:22<23:23:32, 7.63s/it, loss=0.0016, acc=0.9969, iter_time=7.61s]
Epoch 0: 11%|█ | 1343/12384 [2:51:30<23:23:32, 7.63s/it, loss=0.0018, acc=0.9928, iter_time=7.61s]
Epoch 0: 11%|█ | 1344/12384 [2:51:30<23:23:42, 7.63s/it, loss=0.0018, acc=0.9928, iter_time=7.61s]
Epoch 0: 11%|█ | 1344/12384 [2:51:37<23:23:42, 7.63s/it, loss=0.0014, acc=0.9959, iter_time=6.44s]
Epoch 0: 11%|█ | 1345/12384 [2:51:37<23:22:20, 7.62s/it, loss=0.0014, acc=0.9959, iter_time=6.44s]
Epoch 0: 11%|█ | 1345/12384 [2:51:45<23:22:20, 7.62s/it, loss=0.0056, acc=0.9839, iter_time=8.83s]
Epoch 0: 11%|█ | 1346/12384 [2:51:45<23:27:06, 7.65s/it, loss=0.0056, acc=0.9839, iter_time=8.83s]
Epoch 0: 11%|█ | 1346/12384 [2:51:53<23:27:06, 7.65s/it, loss=0.0010, acc=0.9984, iter_time=7.11s]
Epoch 0: 11%|█ | 1347/12384 [2:51:53<23:28:31, 7.66s/it, loss=0.0010, acc=0.9984, iter_time=7.11s]
Epoch 0: 11%|█ | 1347/12384 [2:52:00<23:28:31, 7.66s/it, loss=0.0010, acc=0.9986, iter_time=7.09s]
Epoch 0: 11%|█ | 1348/12384 [2:52:00<23:25:39, 7.64s/it, loss=0.0010, acc=0.9986, iter_time=7.09s]
Epoch 0: 11%|█ | 1348/12384 [2:52:08<23:25:39, 7.64s/it, loss=0.0025, acc=0.9925, iter_time=9.09s]
Epoch 0: 11%|█ | 1349/12384 [2:52:08<23:42:32, 7.73s/it, loss=0.0025, acc=0.9925, iter_time=9.09s]
Epoch 0: 11%|█ | 1349/12384 [2:52:16<23:42:32, 7.73s/it, loss=0.0016, acc=0.9970, iter_time=8.05s]
Epoch 0: 11%|█ | 1350/12384 [2:52:16<23:35:11, 7.70s/it, loss=0.0016, acc=0.9970, iter_time=8.05s]
Epoch 0: 11%|█ | 1350/12384 [2:52:24<23:35:11, 7.70s/it, loss=0.0138, acc=0.9784, iter_time=7.22s]
Epoch 0: 11%|█ | 1351/12384 [2:52:24<23:30:48, 7.67s/it, loss=0.0138, acc=0.9784, iter_time=7.22s]
Epoch 0: 11%|█ | 1351/12384 [2:52:31<23:30:48, 7.67s/it, loss=0.0063, acc=0.9920, iter_time=7.60s]
Epoch 0: 11%|█ | 1352/12384 [2:52:31<23:29:17, 7.66s/it, loss=0.0063, acc=0.9920, iter_time=7.60s]
Epoch 0: 11%|█ | 1352/12384 [2:52:39<23:29:17, 7.66s/it, loss=0.0010, acc=0.9994, iter_time=4.52s]
Epoch 0: 11%|█ | 1353/12384 [2:52:39<23:29:04, 7.66s/it, loss=0.0010, acc=0.9994, iter_time=4.52s]
Epoch 0: 11%|█ | 1353/12384 [2:52:47<23:29:04, 7.66s/it, loss=0.0004, acc=1.0000, iter_time=7.77s]
Epoch 0: 11%|█ | 1354/12384 [2:52:47<23:28:17, 7.66s/it, loss=0.0004, acc=1.0000, iter_time=7.77s]
Epoch 0: 11%|█ | 1354/12384 [2:52:54<23:28:17, 7.66s/it, loss=0.0013, acc=0.9980, iter_time=10.67s]
Epoch 0: 11%|█ | 1355/12384 [2:52:54<23:26:51, 7.65s/it, loss=0.0013, acc=0.9980, iter_time=10.67s]
Epoch 0: 11%|█ | 1355/12384 [2:53:02<23:26:51, 7.65s/it, loss=0.0019, acc=0.9979, iter_time=5.56s]
Epoch 0: 11%|█ | 1356/12384 [2:53:02<23:26:20, 7.65s/it, loss=0.0019, acc=0.9979, iter_time=5.56s]
Epoch 0: 11%|█ | 1356/12384 [2:53:09<23:26:20, 7.65s/it, loss=0.0033, acc=0.9935, iter_time=9.72s]
Epoch 0: 11%|█ | 1357/12384 [2:53:09<23:24:06, 7.64s/it, loss=0.0033, acc=0.9935, iter_time=9.72s]
Epoch 0: 11%|█ | 1357/12384 [2:53:17<23:24:06, 7.64s/it, loss=0.0008, acc=0.9971, iter_time=7.63s]
Epoch 0: 11%|█ | 1358/12384 [2:53:17<23:23:38, 7.64s/it, loss=0.0008, acc=0.9971, iter_time=7.63s]
Epoch 0: 11%|█ | 1358/12384 [2:53:25<23:23:38, 7.64s/it, loss=0.0016, acc=0.9977, iter_time=7.63s]
Epoch 0: 11%|█ | 1359/12384 [2:53:25<23:20:57, 7.62s/it, loss=0.0016, acc=0.9977, iter_time=7.63s]
Epoch 0: 11%|█ | 1359/12384 [2:53:32<23:20:57, 7.62s/it, loss=0.0008, acc=0.9981, iter_time=7.98s]
Epoch 0: 11%|█ | 1360/12384 [2:53:32<23:20:22, 7.62s/it, loss=0.0008, acc=0.9981, iter_time=7.98s]
Epoch 0: 11%|█ | 1360/12384 [2:53:40<23:20:22, 7.62s/it, loss=0.0043, acc=0.9899, iter_time=7.23s]
Epoch 0: 11%|█ | 1361/12384 [2:53:40<23:20:19, 7.62s/it, loss=0.0043, acc=0.9899, iter_time=7.23s]
Epoch 0: 11%|█ | 1361/12384 [2:53:48<23:20:19, 7.62s/it, loss=0.0013, acc=0.9979, iter_time=7.63s]
Epoch 0: 11%|█ | 1362/12384 [2:53:48<23:19:55, 7.62s/it, loss=0.0013, acc=0.9979, iter_time=7.63s]
Epoch 0: 11%|█ | 1362/12384 [2:53:55<23:19:55, 7.62s/it, loss=0.0033, acc=0.9928, iter_time=7.37s]
Epoch 0: 11%|█ | 1363/12384 [2:53:55<23:20:20, 7.62s/it, loss=0.0033, acc=0.9928, iter_time=7.37s]
Epoch 0: 11%|█ | 1363/12384 [2:54:03<23:20:20, 7.62s/it, loss=0.0121, acc=0.9796, iter_time=7.87s]
Epoch 0: 11%|█ | 1364/12384 [2:54:03<23:18:55, 7.62s/it, loss=0.0121, acc=0.9796, iter_time=7.87s]
Epoch 0: 11%|█ | 1364/12384 [2:54:10<23:18:55, 7.62s/it, loss=0.0008, acc=0.9981, iter_time=7.61s]
Epoch 0: 11%|█ | 1365/12384 [2:54:10<23:20:06, 7.62s/it, loss=0.0008, acc=0.9981, iter_time=7.61s]
Epoch 0: 11%|█ | 1365/12384 [2:54:18<23:20:06, 7.62s/it, loss=0.0041, acc=0.9914, iter_time=7.72s]
Epoch 0: 11%|█ | 1366/12384 [2:54:18<23:23:20, 7.64s/it, loss=0.0041, acc=0.9914, iter_time=7.72s]
Epoch 0: 11%|█ | 1366/12384 [2:54:26<23:23:20, 7.64s/it, loss=0.0021, acc=0.9929, iter_time=5.82s]
Epoch 0: 11%|█ | 1367/12384 [2:54:26<23:27:25, 7.66s/it, loss=0.0021, acc=0.9929, iter_time=5.82s]
Epoch 0: 11%|█ | 1367/12384 [2:54:33<23:27:25, 7.66s/it, loss=0.0012, acc=0.9947, iter_time=9.90s]
Epoch 0: 11%|█ | 1368/12384 [2:54:33<23:26:38, 7.66s/it, loss=0.0012, acc=0.9947, iter_time=9.90s]
Epoch 0: 11%|█ | 1368/12384 [2:54:41<23:26:38, 7.66s/it, loss=0.0060, acc=0.9860, iter_time=7.27s]
Epoch 0: 11%|█ | 1369/12384 [2:54:41<23:26:07, 7.66s/it, loss=0.0060, acc=0.9860, iter_time=7.27s]
Epoch 0: 11%|█ | 1369/12384 [2:54:49<23:26:07, 7.66s/it, loss=0.0057, acc=0.9873, iter_time=7.63s]
Epoch 0: 11%|█ | 1370/12384 [2:54:49<23:23:50, 7.65s/it, loss=0.0057, acc=0.9873, iter_time=7.63s]
Epoch 0: 11%|█ | 1370/12384 [2:54:56<23:23:50, 7.65s/it, loss=0.0010, acc=0.9993, iter_time=7.64s]
Epoch 0: 11%|█ | 1371/12384 [2:54:56<23:23:21, 7.65s/it, loss=0.0010, acc=0.9993, iter_time=7.64s]
Epoch 0: 11%|█ | 1371/12384 [2:55:04<23:23:21, 7.65s/it, loss=0.0004, acc=0.9988, iter_time=7.63s]
Epoch 0: 11%|█ | 1372/12384 [2:55:04<23:22:13, 7.64s/it, loss=0.0004, acc=0.9988, iter_time=7.63s]
Epoch 0: 11%|█ | 1372/12384 [2:55:12<23:22:13, 7.64s/it, loss=0.0032, acc=0.9937, iter_time=5.56s]
Epoch 0: 11%|█ | 1373/12384 [2:55:12<23:20:45, 7.63s/it, loss=0.0032, acc=0.9937, iter_time=5.56s]
Epoch 0: 11%|█ | 1373/12384 [2:55:19<23:20:45, 7.63s/it, loss=0.0027, acc=0.9947, iter_time=9.92s]
Epoch 0: 11%|█ | 1374/12384 [2:55:19<23:31:56, 7.69s/it, loss=0.0027, acc=0.9947, iter_time=9.92s]
Epoch 0: 11%|█ | 1374/12384 [2:55:27<23:31:56, 7.69s/it, loss=0.0007, acc=0.9998, iter_time=7.58s]
Epoch 0: 11%|█ | 1375/12384 [2:55:27<23:28:09, 7.67s/it, loss=0.0007, acc=0.9998, iter_time=7.58s]
Epoch 0: 11%|█ | 1375/12384 [2:55:35<23:28:09, 7.67s/it, loss=0.0004, acc=1.0000, iter_time=8.12s]
Epoch 0: 11%|█ | 1376/12384 [2:55:35<23:46:18, 7.77s/it, loss=0.0004, acc=1.0000, iter_time=8.12s]
Epoch 0: 11%|█ | 1376/12384 [2:55:43<23:46:18, 7.77s/it, loss=0.0007, acc=0.9998, iter_time=4.93s]
Epoch 0: 11%|█ | 1377/12384 [2:55:43<23:40:00, 7.74s/it, loss=0.0007, acc=0.9998, iter_time=4.93s]
Epoch 0: 11%|█ | 1377/12384 [2:55:50<23:40:00, 7.74s/it, loss=0.0032, acc=0.9939, iter_time=10.27s]
Epoch 0: 11%|█ | 1378/12384 [2:55:50<23:35:33, 7.72s/it, loss=0.0032, acc=0.9939, iter_time=10.27s]
Epoch 0: 11%|█ | 1378/12384 [2:55:58<23:35:33, 7.72s/it, loss=0.0039, acc=0.9865, iter_time=7.67s]
Epoch 0: 11%|█ | 1379/12384 [2:55:58<23:30:03, 7.69s/it, loss=0.0039, acc=0.9865, iter_time=7.67s]
Epoch 0: 11%|█ | 1379/12384 [2:56:06<23:30:03, 7.69s/it, loss=0.0002, acc=1.0000, iter_time=6.68s]
Epoch 0: 11%|█ | 1380/12384 [2:56:06<23:27:23, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=6.68s]
Epoch 0: 11%|█ | 1380/12384 [2:56:13<23:27:23, 7.67s/it, loss=0.0021, acc=0.9973, iter_time=8.59s]
Epoch 0: 11%|█ | 1381/12384 [2:56:13<23:26:17, 7.67s/it, loss=0.0021, acc=0.9973, iter_time=8.59s]
Epoch 0: 11%|█ | 1381/12384 [2:56:21<23:26:17, 7.67s/it, loss=0.0019, acc=0.9953, iter_time=5.34s]
Epoch 0: 11%|█ | 1382/12384 [2:56:21<23:26:31, 7.67s/it, loss=0.0019, acc=0.9953, iter_time=5.34s]
Epoch 0: 11%|█ | 1382/12384 [2:56:29<23:26:31, 7.67s/it, loss=0.0061, acc=0.9972, iter_time=9.72s]
Epoch 0: 11%|█ | 1383/12384 [2:56:29<23:25:36, 7.67s/it, loss=0.0061, acc=0.9972, iter_time=9.72s]
Epoch 0: 11%|█ | 1383/12384 [2:56:36<23:25:36, 7.67s/it, loss=0.0016, acc=0.9940, iter_time=8.27s]
Epoch 0: 11%|█ | 1384/12384 [2:56:36<23:23:08, 7.65s/it, loss=0.0016, acc=0.9940, iter_time=8.27s]
Epoch 0: 11%|█ | 1384/12384 [2:56:44<23:23:08, 7.65s/it, loss=0.0016, acc=0.9941, iter_time=7.24s]
Epoch 0: 11%|█ | 1385/12384 [2:56:44<23:23:42, 7.66s/it, loss=0.0016, acc=0.9941, iter_time=7.24s]
Epoch 0: 11%|█ | 1385/12384 [2:56:52<23:23:42, 7.66s/it, loss=0.0007, acc=1.0000, iter_time=7.68s]
Epoch 0: 11%|█ | 1386/12384 [2:56:52<23:23:45, 7.66s/it, loss=0.0007, acc=1.0000, iter_time=7.68s]
Epoch 0: 11%|█ | 1386/12384 [2:56:59<23:23:45, 7.66s/it, loss=0.0016, acc=0.9959, iter_time=7.67s]
Epoch 0: 11%|█ | 1387/12384 [2:56:59<23:22:35, 7.65s/it, loss=0.0016, acc=0.9959, iter_time=7.67s]
Epoch 0: 11%|█ | 1387/12384 [2:57:07<23:22:35, 7.65s/it, loss=0.0024, acc=0.9940, iter_time=6.70s]
Epoch 0: 11%|█ | 1388/12384 [2:57:07<23:21:27, 7.65s/it, loss=0.0024, acc=0.9940, iter_time=6.70s]
Epoch 0: 11%|█ | 1388/12384 [2:57:15<23:21:27, 7.65s/it, loss=0.0030, acc=0.9943, iter_time=8.58s]
Epoch 0: 11%|█ | 1389/12384 [2:57:15<23:21:08, 7.65s/it, loss=0.0030, acc=0.9943, iter_time=8.58s]
Epoch 0: 11%|█ | 1389/12384 [2:57:22<23:21:08, 7.65s/it, loss=0.0060, acc=0.9835, iter_time=5.33s]
Epoch 0: 11%|█ | 1390/12384 [2:57:22<23:21:16, 7.65s/it, loss=0.0060, acc=0.9835, iter_time=5.33s]
Epoch 0: 11%|█ | 1390/12384 [2:57:30<23:21:16, 7.65s/it, loss=0.0015, acc=0.9946, iter_time=9.97s]
Epoch 0: 11%|█ | 1391/12384 [2:57:30<23:20:13, 7.64s/it, loss=0.0015, acc=0.9946, iter_time=9.97s]
Epoch 0: 11%|█ | 1391/12384 [2:57:37<23:20:13, 7.64s/it, loss=0.0061, acc=0.9859, iter_time=7.57s]
Epoch 0: 11%|█ | 1392/12384 [2:57:37<23:18:32, 7.63s/it, loss=0.0061, acc=0.9859, iter_time=7.57s]
Epoch 0: 11%|█ | 1392/12384 [2:57:45<23:18:32, 7.63s/it, loss=0.0007, acc=0.9968, iter_time=7.64s]
Epoch 0: 11%|█ | 1393/12384 [2:57:45<23:18:39, 7.64s/it, loss=0.0007, acc=0.9968, iter_time=7.64s]
Epoch 0: 11%|█ | 1393/12384 [2:57:53<23:18:39, 7.64s/it, loss=0.0011, acc=0.9962, iter_time=5.86s]
Epoch 0: 11%|█▏ | 1394/12384 [2:57:53<23:18:13, 7.63s/it, loss=0.0011, acc=0.9962, iter_time=5.86s]
Epoch 0: 11%|█▏ | 1394/12384 [2:58:00<23:18:13, 7.63s/it, loss=0.0013, acc=0.9985, iter_time=9.44s]
Epoch 0: 11%|█▏ | 1395/12384 [2:58:00<23:16:59, 7.63s/it, loss=0.0013, acc=0.9985, iter_time=9.44s]
Epoch 0: 11%|█▏ | 1395/12384 [2:58:08<23:16:59, 7.63s/it, loss=0.0034, acc=0.9940, iter_time=7.62s]
Epoch 0: 11%|█▏ | 1396/12384 [2:58:08<23:17:17, 7.63s/it, loss=0.0034, acc=0.9940, iter_time=7.62s]
Epoch 0: 11%|█▏ | 1396/12384 [2:58:16<23:17:17, 7.63s/it, loss=0.0015, acc=0.9980, iter_time=7.61s]
Epoch 0: 11%|█▏ | 1397/12384 [2:58:16<23:15:04, 7.62s/it, loss=0.0015, acc=0.9980, iter_time=7.61s]
Epoch 0: 11%|█▏ | 1397/12384 [2:58:23<23:15:04, 7.62s/it, loss=0.0027, acc=0.9903, iter_time=6.09s]
Epoch 0: 11%|█▏ | 1398/12384 [2:58:23<23:13:33, 7.61s/it, loss=0.0027, acc=0.9903, iter_time=6.09s]
Epoch 0: 11%|█▏ | 1398/12384 [2:58:31<23:13:33, 7.61s/it, loss=0.0011, acc=0.9960, iter_time=9.10s]
Epoch 0: 11%|█▏ | 1399/12384 [2:58:31<23:16:42, 7.63s/it, loss=0.0011, acc=0.9960, iter_time=9.10s]
Epoch 0: 11%|█▏ | 1399/12384 [2:58:38<23:16:42, 7.63s/it, loss=0.0051, acc=0.9938, iter_time=8.07s]
Epoch 0: 11%|█▏ | 1400/12384 [2:58:38<23:15:07, 7.62s/it, loss=0.0051, acc=0.9938, iter_time=8.07s]
Epoch 0: 11%|█▏ | 1400/12384 [2:58:46<23:15:07, 7.62s/it, loss=0.0021, acc=0.9899, iter_time=7.51s]
Epoch 0: 11%|█▏ | 1401/12384 [2:58:46<23:30:28, 7.71s/it, loss=0.0021, acc=0.9899, iter_time=7.51s]
Epoch 0: 11%|█▏ | 1401/12384 [2:58:54<23:30:28, 7.71s/it, loss=0.0022, acc=0.9952, iter_time=7.64s]
Epoch 0: 11%|█▏ | 1402/12384 [2:58:54<23:44:02, 7.78s/it, loss=0.0022, acc=0.9952, iter_time=7.64s]
Epoch 0: 11%|█▏ | 1402/12384 [2:59:02<23:44:02, 7.78s/it, loss=0.0016, acc=0.9975, iter_time=4.63s]
Epoch 0: 11%|█▏ | 1403/12384 [2:59:02<23:33:59, 7.73s/it, loss=0.0016, acc=0.9975, iter_time=4.63s]
Epoch 0: 11%|█▏ | 1403/12384 [2:59:09<23:33:59, 7.73s/it, loss=0.0006, acc=0.9989, iter_time=8.28s]
Epoch 0: 11%|█▏ | 1404/12384 [2:59:09<23:27:31, 7.69s/it, loss=0.0006, acc=0.9989, iter_time=8.28s]
Epoch 0: 11%|█▏ | 1404/12384 [2:59:17<23:27:31, 7.69s/it, loss=0.0010, acc=0.9990, iter_time=9.60s]
Epoch 0: 11%|█▏ | 1405/12384 [2:59:17<23:25:23, 7.68s/it, loss=0.0010, acc=0.9990, iter_time=9.60s]
Epoch 0: 11%|█▏ | 1405/12384 [2:59:25<23:25:23, 7.68s/it, loss=0.0004, acc=0.9985, iter_time=8.27s]
Epoch 0: 11%|█▏ | 1406/12384 [2:59:25<23:23:02, 7.67s/it, loss=0.0004, acc=0.9985, iter_time=8.27s]
Epoch 0: 11%|█▏ | 1406/12384 [2:59:32<23:23:02, 7.67s/it, loss=0.0011, acc=0.9982, iter_time=7.64s]
Epoch 0: 11%|█▏ | 1407/12384 [2:59:32<23:22:28, 7.67s/it, loss=0.0011, acc=0.9982, iter_time=7.64s]
Epoch 0: 11%|█▏ | 1407/12384 [2:59:40<23:22:28, 7.67s/it, loss=0.0006, acc=1.0000, iter_time=8.05s]
Epoch 0: 11%|█▏ | 1408/12384 [2:59:40<23:25:01, 7.68s/it, loss=0.0006, acc=1.0000, iter_time=8.05s]
Epoch 0: 11%|█▏ | 1408/12384 [2:59:48<23:25:01, 7.68s/it, loss=0.0032, acc=0.9934, iter_time=7.33s]
Epoch 0: 11%|█▏ | 1409/12384 [2:59:48<23:21:49, 7.66s/it, loss=0.0032, acc=0.9934, iter_time=7.33s]
Epoch 0: 11%|█▏ | 1409/12384 [2:59:55<23:21:49, 7.66s/it, loss=0.0015, acc=0.9966, iter_time=7.32s]
Epoch 0: 11%|█▏ | 1410/12384 [2:59:55<23:21:03, 7.66s/it, loss=0.0015, acc=0.9966, iter_time=7.32s]
Epoch 0: 11%|█▏ | 1410/12384 [3:00:03<23:21:03, 7.66s/it, loss=0.0012, acc=0.9982, iter_time=7.95s]
Epoch 0: 11%|█▏ | 1411/12384 [3:00:03<23:20:15, 7.66s/it, loss=0.0012, acc=0.9982, iter_time=7.95s]
Epoch 0: 11%|█▏ | 1411/12384 [3:00:11<23:20:15, 7.66s/it, loss=0.0020, acc=0.9994, iter_time=7.64s]
Epoch 0: 11%|█▏ | 1412/12384 [3:00:11<23:18:34, 7.65s/it, loss=0.0020, acc=0.9994, iter_time=7.64s]
Epoch 0: 11%|█▏ | 1412/12384 [3:00:18<23:18:34, 7.65s/it, loss=0.0019, acc=0.9947, iter_time=7.63s]
Epoch 0: 11%|█▏ | 1413/12384 [3:00:18<23:15:54, 7.63s/it, loss=0.0019, acc=0.9947, iter_time=7.63s]
Epoch 0: 11%|█▏ | 1413/12384 [3:00:26<23:15:54, 7.63s/it, loss=0.0021, acc=0.9964, iter_time=4.76s]
Epoch 0: 11%|█▏ | 1414/12384 [3:00:26<23:17:34, 7.64s/it, loss=0.0021, acc=0.9964, iter_time=4.76s]
Epoch 0: 11%|█▏ | 1414/12384 [3:00:34<23:17:34, 7.64s/it, loss=0.0006, acc=0.9998, iter_time=10.50s]
Epoch 0: 11%|█▏ | 1415/12384 [3:00:34<23:18:40, 7.65s/it, loss=0.0006, acc=0.9998, iter_time=10.50s]
Epoch 0: 11%|█▏ | 1415/12384 [3:00:41<23:18:40, 7.65s/it, loss=0.0006, acc=0.9977, iter_time=8.05s]
Epoch 0: 11%|█▏ | 1416/12384 [3:00:41<23:17:56, 7.65s/it, loss=0.0006, acc=0.9977, iter_time=8.05s]
Epoch 0: 11%|█▏ | 1416/12384 [3:00:49<23:17:56, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.26s]
Epoch 0: 11%|█▏ | 1417/12384 [3:00:49<23:16:17, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.26s]
Epoch 0: 11%|█▏ | 1417/12384 [3:00:56<23:16:17, 7.64s/it, loss=0.0051, acc=0.9926, iter_time=5.57s]
Epoch 0: 11%|█▏ | 1418/12384 [3:00:56<23:15:03, 7.63s/it, loss=0.0051, acc=0.9926, iter_time=5.57s]
Epoch 0: 11%|█▏ | 1418/12384 [3:01:04<23:15:03, 7.63s/it, loss=0.0020, acc=0.9930, iter_time=8.49s]
Epoch 0: 11%|█▏ | 1419/12384 [3:01:04<23:15:50, 7.64s/it, loss=0.0020, acc=0.9930, iter_time=8.49s]
Epoch 0: 11%|█▏ | 1419/12384 [3:01:12<23:15:50, 7.64s/it, loss=0.0010, acc=0.9988, iter_time=8.83s]
Epoch 0: 11%|█▏ | 1420/12384 [3:01:12<23:13:23, 7.63s/it, loss=0.0010, acc=0.9988, iter_time=8.83s]
Epoch 0: 11%|█▏ | 1420/12384 [3:01:19<23:13:23, 7.63s/it, loss=0.0003, acc=0.9995, iter_time=7.59s]
Epoch 0: 11%|█▏ | 1421/12384 [3:01:19<23:12:43, 7.62s/it, loss=0.0003, acc=0.9995, iter_time=7.59s]
Epoch 0: 11%|█▏ | 1421/12384 [3:01:27<23:12:43, 7.62s/it, loss=0.0063, acc=0.9903, iter_time=7.62s]
Epoch 0: 11%|█▏ | 1422/12384 [3:01:27<23:14:12, 7.63s/it, loss=0.0063, acc=0.9903, iter_time=7.62s]
Epoch 0: 11%|█▏ | 1422/12384 [3:01:35<23:14:12, 7.63s/it, loss=0.0008, acc=0.9993, iter_time=7.67s]
Epoch 0: 11%|█▏ | 1423/12384 [3:01:35<23:13:05, 7.63s/it, loss=0.0008, acc=0.9993, iter_time=7.67s]
Epoch 0: 11%|█▏ | 1423/12384 [3:01:42<23:13:05, 7.63s/it, loss=0.0028, acc=0.9919, iter_time=7.98s]
Epoch 0: 11%|█▏ | 1424/12384 [3:01:42<23:12:42, 7.62s/it, loss=0.0028, acc=0.9919, iter_time=7.98s]
Epoch 0: 11%|█▏ | 1424/12384 [3:01:50<23:12:42, 7.62s/it, loss=0.0028, acc=0.9949, iter_time=7.24s]
Epoch 0: 12%|█▏ | 1425/12384 [3:01:50<23:11:21, 7.62s/it, loss=0.0028, acc=0.9949, iter_time=7.24s]
Epoch 0: 12%|█▏ | 1425/12384 [3:01:57<23:11:21, 7.62s/it, loss=0.0007, acc=0.9964, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1426/12384 [3:01:57<23:12:19, 7.62s/it, loss=0.0007, acc=0.9964, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1426/12384 [3:02:05<23:12:19, 7.62s/it, loss=0.0003, acc=0.9998, iter_time=6.40s]
Epoch 0: 12%|█▏ | 1427/12384 [3:02:05<23:12:11, 7.62s/it, loss=0.0003, acc=0.9998, iter_time=6.40s]
Epoch 0: 12%|█▏ | 1427/12384 [3:02:13<23:12:11, 7.62s/it, loss=0.0009, acc=0.9981, iter_time=6.83s]
Epoch 0: 12%|█▏ | 1428/12384 [3:02:13<23:11:27, 7.62s/it, loss=0.0009, acc=0.9981, iter_time=6.83s]
Epoch 0: 12%|█▏ | 1428/12384 [3:02:21<23:11:27, 7.62s/it, loss=0.0012, acc=0.9981, iter_time=9.67s]
Epoch 0: 12%|█▏ | 1429/12384 [3:02:21<23:31:37, 7.73s/it, loss=0.0012, acc=0.9981, iter_time=9.67s]
Epoch 0: 12%|█▏ | 1429/12384 [3:02:28<23:31:37, 7.73s/it, loss=0.0014, acc=0.9982, iter_time=7.96s]
Epoch 0: 12%|█▏ | 1430/12384 [3:02:28<23:25:29, 7.70s/it, loss=0.0014, acc=0.9982, iter_time=7.96s]
Epoch 0: 12%|█▏ | 1430/12384 [3:02:36<23:25:29, 7.70s/it, loss=0.0027, acc=0.9930, iter_time=7.63s]
Epoch 0: 12%|█▏ | 1431/12384 [3:02:36<23:21:29, 7.68s/it, loss=0.0027, acc=0.9930, iter_time=7.63s]
Epoch 0: 12%|█▏ | 1431/12384 [3:02:44<23:21:29, 7.68s/it, loss=0.0011, acc=0.9973, iter_time=7.57s]
Epoch 0: 12%|█▏ | 1432/12384 [3:02:44<23:18:01, 7.66s/it, loss=0.0011, acc=0.9973, iter_time=7.57s]
Epoch 0: 12%|█▏ | 1432/12384 [3:02:51<23:18:01, 7.66s/it, loss=0.0040, acc=0.9944, iter_time=7.64s]
Epoch 0: 12%|█▏ | 1433/12384 [3:02:51<23:13:51, 7.64s/it, loss=0.0040, acc=0.9944, iter_time=7.64s]
Epoch 0: 12%|█▏ | 1433/12384 [3:02:59<23:13:51, 7.64s/it, loss=0.0021, acc=0.9966, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1434/12384 [3:02:59<23:15:20, 7.65s/it, loss=0.0021, acc=0.9966, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1434/12384 [3:03:06<23:15:20, 7.65s/it, loss=0.0005, acc=0.9998, iter_time=4.50s]
Epoch 0: 12%|█▏ | 1435/12384 [3:03:06<23:13:16, 7.64s/it, loss=0.0005, acc=0.9998, iter_time=4.50s]
Epoch 0: 12%|█▏ | 1435/12384 [3:03:14<23:13:16, 7.64s/it, loss=0.0005, acc=1.0000, iter_time=10.75s]
Epoch 0: 12%|█▏ | 1436/12384 [3:03:14<23:14:10, 7.64s/it, loss=0.0005, acc=1.0000, iter_time=10.75s]
Epoch 0: 12%|█▏ | 1436/12384 [3:03:22<23:14:10, 7.64s/it, loss=0.0034, acc=0.9931, iter_time=7.65s]
Epoch 0: 12%|█▏ | 1437/12384 [3:03:22<23:12:35, 7.63s/it, loss=0.0034, acc=0.9931, iter_time=7.65s]
Epoch 0: 12%|█▏ | 1437/12384 [3:03:29<23:12:35, 7.63s/it, loss=0.0005, acc=0.9977, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1438/12384 [3:03:29<23:10:44, 7.62s/it, loss=0.0005, acc=0.9977, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1438/12384 [3:03:37<23:10:44, 7.62s/it, loss=0.0027, acc=0.9941, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1439/12384 [3:03:37<23:10:54, 7.62s/it, loss=0.0027, acc=0.9941, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1439/12384 [3:03:45<23:10:54, 7.62s/it, loss=0.0031, acc=0.9954, iter_time=8.01s]
Epoch 0: 12%|█▏ | 1440/12384 [3:03:45<23:10:25, 7.62s/it, loss=0.0031, acc=0.9954, iter_time=8.01s]
Epoch 0: 12%|█▏ | 1440/12384 [3:03:52<23:10:25, 7.62s/it, loss=0.0094, acc=0.9850, iter_time=7.22s]
Epoch 0: 12%|█▏ | 1441/12384 [3:03:52<23:08:47, 7.61s/it, loss=0.0094, acc=0.9850, iter_time=7.22s]
Epoch 0: 12%|█▏ | 1441/12384 [3:04:00<23:08:47, 7.61s/it, loss=0.0019, acc=0.9966, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1442/12384 [3:04:00<23:10:23, 7.62s/it, loss=0.0019, acc=0.9966, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1442/12384 [3:04:07<23:10:23, 7.62s/it, loss=0.0021, acc=0.9978, iter_time=7.64s]
Epoch 0: 12%|█▏ | 1443/12384 [3:04:07<23:10:14, 7.62s/it, loss=0.0021, acc=0.9978, iter_time=7.64s]
Epoch 0: 12%|█▏ | 1443/12384 [3:04:15<23:10:14, 7.62s/it, loss=0.0011, acc=0.9958, iter_time=7.61s]
Epoch 0: 12%|█▏ | 1444/12384 [3:04:15<23:11:39, 7.63s/it, loss=0.0011, acc=0.9958, iter_time=7.61s]
Epoch 0: 12%|█▏ | 1444/12384 [3:04:23<23:11:39, 7.63s/it, loss=0.0011, acc=0.9987, iter_time=6.79s]
Epoch 0: 12%|█▏ | 1445/12384 [3:04:23<23:10:07, 7.62s/it, loss=0.0011, acc=0.9987, iter_time=6.79s]
Epoch 0: 12%|█▏ | 1445/12384 [3:04:30<23:10:07, 7.62s/it, loss=0.0044, acc=0.9944, iter_time=8.46s]
Epoch 0: 12%|█▏ | 1446/12384 [3:04:30<23:13:12, 7.64s/it, loss=0.0044, acc=0.9944, iter_time=8.46s]
Epoch 0: 12%|█▏ | 1446/12384 [3:04:38<23:13:12, 7.64s/it, loss=0.0004, acc=0.9998, iter_time=7.69s]
Epoch 0: 12%|█▏ | 1447/12384 [3:04:38<23:10:50, 7.63s/it, loss=0.0004, acc=0.9998, iter_time=7.69s]
Epoch 0: 12%|█▏ | 1447/12384 [3:04:46<23:10:50, 7.63s/it, loss=0.0019, acc=0.9938, iter_time=7.84s]
Epoch 0: 12%|█▏ | 1448/12384 [3:04:46<23:16:35, 7.66s/it, loss=0.0019, acc=0.9938, iter_time=7.84s]
Epoch 0: 12%|█▏ | 1448/12384 [3:04:53<23:16:35, 7.66s/it, loss=0.0006, acc=0.9987, iter_time=5.50s]
Epoch 0: 12%|█▏ | 1449/12384 [3:04:53<23:15:42, 7.66s/it, loss=0.0006, acc=0.9987, iter_time=5.50s]
Epoch 0: 12%|█▏ | 1449/12384 [3:05:01<23:15:42, 7.66s/it, loss=0.0007, acc=0.9996, iter_time=10.08s]
Epoch 0: 12%|█▏ | 1450/12384 [3:05:01<23:14:28, 7.65s/it, loss=0.0007, acc=0.9996, iter_time=10.08s]
Epoch 0: 12%|█▏ | 1450/12384 [3:05:09<23:14:28, 7.65s/it, loss=0.0008, acc=0.9987, iter_time=7.22s]
Epoch 0: 12%|█▏ | 1451/12384 [3:05:09<23:13:06, 7.65s/it, loss=0.0008, acc=0.9987, iter_time=7.22s]
Epoch 0: 12%|█▏ | 1451/12384 [3:05:16<23:13:06, 7.65s/it, loss=0.0007, acc=0.9985, iter_time=7.63s]
Epoch 0: 12%|█▏ | 1452/12384 [3:05:16<23:11:34, 7.64s/it, loss=0.0007, acc=0.9985, iter_time=7.63s]
Epoch 0: 12%|█▏ | 1452/12384 [3:05:24<23:11:34, 7.64s/it, loss=0.0014, acc=0.9968, iter_time=7.60s]
Epoch 0: 12%|█▏ | 1453/12384 [3:05:24<23:10:29, 7.63s/it, loss=0.0014, acc=0.9968, iter_time=7.60s]
Epoch 0: 12%|█▏ | 1453/12384 [3:05:31<23:10:29, 7.63s/it, loss=0.0010, acc=0.9983, iter_time=6.71s]
Epoch 0: 12%|█▏ | 1454/12384 [3:05:31<23:08:18, 7.62s/it, loss=0.0010, acc=0.9983, iter_time=6.71s]
Epoch 0: 12%|█▏ | 1454/12384 [3:05:39<23:08:18, 7.62s/it, loss=0.0004, acc=0.9981, iter_time=7.68s]
Epoch 0: 12%|█▏ | 1455/12384 [3:05:39<23:29:52, 7.74s/it, loss=0.0004, acc=0.9981, iter_time=7.68s]
Epoch 0: 12%|█▏ | 1455/12384 [3:05:47<23:29:52, 7.74s/it, loss=0.0004, acc=0.9999, iter_time=9.24s]
Epoch 0: 12%|█▏ | 1456/12384 [3:05:47<23:21:42, 7.70s/it, loss=0.0004, acc=0.9999, iter_time=9.24s]
Epoch 0: 12%|█▏ | 1456/12384 [3:05:55<23:21:42, 7.70s/it, loss=0.0004, acc=0.9986, iter_time=6.27s]
Epoch 0: 12%|█▏ | 1457/12384 [3:05:55<23:18:49, 7.68s/it, loss=0.0004, acc=0.9986, iter_time=6.27s]
Epoch 0: 12%|█▏ | 1457/12384 [3:06:02<23:18:49, 7.68s/it, loss=0.0035, acc=0.9884, iter_time=8.58s]
Epoch 0: 12%|█▏ | 1458/12384 [3:06:02<23:15:22, 7.66s/it, loss=0.0035, acc=0.9884, iter_time=8.58s]
Epoch 0: 12%|█▏ | 1458/12384 [3:06:10<23:15:22, 7.66s/it, loss=0.0033, acc=0.9933, iter_time=5.30s]
Epoch 0: 12%|█▏ | 1459/12384 [3:06:10<23:12:52, 7.65s/it, loss=0.0033, acc=0.9933, iter_time=5.30s]
Epoch 0: 12%|█▏ | 1459/12384 [3:06:18<23:12:52, 7.65s/it, loss=0.0028, acc=0.9899, iter_time=9.96s]
Epoch 0: 12%|█▏ | 1460/12384 [3:06:18<23:09:56, 7.63s/it, loss=0.0028, acc=0.9899, iter_time=9.96s]
Epoch 0: 12%|█▏ | 1460/12384 [3:06:25<23:09:56, 7.63s/it, loss=0.0006, acc=0.9972, iter_time=6.10s]
Epoch 0: 12%|█▏ | 1461/12384 [3:06:25<23:08:45, 7.63s/it, loss=0.0006, acc=0.9972, iter_time=6.10s]
Epoch 0: 12%|█▏ | 1461/12384 [3:06:33<23:08:45, 7.63s/it, loss=0.0017, acc=0.9976, iter_time=9.11s]
Epoch 0: 12%|█▏ | 1462/12384 [3:06:33<23:07:25, 7.62s/it, loss=0.0017, acc=0.9976, iter_time=9.11s]
Epoch 0: 12%|█▏ | 1462/12384 [3:06:40<23:07:25, 7.62s/it, loss=0.0008, acc=0.9980, iter_time=7.63s]
Epoch 0: 12%|█▏ | 1463/12384 [3:06:40<23:07:26, 7.62s/it, loss=0.0008, acc=0.9980, iter_time=7.63s]
Epoch 0: 12%|█▏ | 1463/12384 [3:06:48<23:07:26, 7.62s/it, loss=0.0009, acc=0.9993, iter_time=7.54s]
Epoch 0: 12%|█▏ | 1464/12384 [3:06:48<23:05:49, 7.61s/it, loss=0.0009, acc=0.9993, iter_time=7.54s]
Epoch 0: 12%|█▏ | 1464/12384 [3:06:56<23:05:49, 7.61s/it, loss=0.0005, acc=0.9993, iter_time=7.64s]
Epoch 0: 12%|█▏ | 1465/12384 [3:06:56<23:04:37, 7.61s/it, loss=0.0005, acc=0.9993, iter_time=7.64s]
Epoch 0: 12%|█▏ | 1465/12384 [3:07:03<23:04:37, 7.61s/it, loss=0.0023, acc=0.9963, iter_time=7.40s]
Epoch 0: 12%|█▏ | 1466/12384 [3:07:03<23:07:39, 7.63s/it, loss=0.0023, acc=0.9963, iter_time=7.40s]
Epoch 0: 12%|█▏ | 1466/12384 [3:07:11<23:07:39, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.17s]
Epoch 0: 12%|█▏ | 1467/12384 [3:07:11<23:08:13, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.17s]
Epoch 0: 12%|█▏ | 1467/12384 [3:07:19<23:08:13, 7.63s/it, loss=0.0012, acc=0.9984, iter_time=9.43s]
Epoch 0: 12%|█▏ | 1468/12384 [3:07:19<23:14:28, 7.66s/it, loss=0.0012, acc=0.9984, iter_time=9.43s]
Epoch 0: 12%|█▏ | 1468/12384 [3:07:26<23:14:28, 7.66s/it, loss=0.0016, acc=0.9978, iter_time=7.67s]
Epoch 0: 12%|█▏ | 1469/12384 [3:07:26<23:11:32, 7.65s/it, loss=0.0016, acc=0.9978, iter_time=7.67s]
Epoch 0: 12%|█▏ | 1469/12384 [3:07:34<23:11:32, 7.65s/it, loss=0.0013, acc=0.9975, iter_time=5.29s]
Epoch 0: 12%|█▏ | 1470/12384 [3:07:34<23:12:45, 7.66s/it, loss=0.0013, acc=0.9975, iter_time=5.29s]
Epoch 0: 12%|█▏ | 1470/12384 [3:07:42<23:12:45, 7.66s/it, loss=0.0006, acc=0.9992, iter_time=9.99s]
Epoch 0: 12%|█▏ | 1471/12384 [3:07:42<23:10:19, 7.64s/it, loss=0.0006, acc=0.9992, iter_time=9.99s]
Epoch 0: 12%|█▏ | 1471/12384 [3:07:49<23:10:19, 7.64s/it, loss=0.0015, acc=0.9968, iter_time=8.00s]
Epoch 0: 12%|█▏ | 1472/12384 [3:07:49<23:08:20, 7.63s/it, loss=0.0015, acc=0.9968, iter_time=8.00s]
Epoch 0: 12%|█▏ | 1472/12384 [3:07:57<23:08:20, 7.63s/it, loss=0.0008, acc=0.9966, iter_time=7.23s]
Epoch 0: 12%|█▏ | 1473/12384 [3:07:57<23:07:32, 7.63s/it, loss=0.0008, acc=0.9966, iter_time=7.23s]
Epoch 0: 12%|█▏ | 1473/12384 [3:08:04<23:07:32, 7.63s/it, loss=0.0014, acc=0.9954, iter_time=7.64s]
Epoch 0: 12%|█▏ | 1474/12384 [3:08:04<23:07:26, 7.63s/it, loss=0.0014, acc=0.9954, iter_time=7.64s]
Epoch 0: 12%|█▏ | 1474/12384 [3:08:12<23:07:26, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=5.84s]
Epoch 0: 12%|█▏ | 1475/12384 [3:08:12<23:10:48, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=5.84s]
Epoch 0: 12%|█▏ | 1475/12384 [3:08:20<23:10:48, 7.65s/it, loss=0.0021, acc=0.9938, iter_time=9.18s]
Epoch 0: 12%|█▏ | 1476/12384 [3:08:20<23:08:50, 7.64s/it, loss=0.0021, acc=0.9938, iter_time=9.18s]
Epoch 0: 12%|█▏ | 1476/12384 [3:08:27<23:08:50, 7.64s/it, loss=0.0011, acc=0.9961, iter_time=4.68s]
Epoch 0: 12%|█▏ | 1477/12384 [3:08:27<23:10:21, 7.65s/it, loss=0.0011, acc=0.9961, iter_time=4.68s]
Epoch 0: 12%|█▏ | 1477/12384 [3:08:35<23:10:21, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=10.96s]
Epoch 0: 12%|█▏ | 1478/12384 [3:08:35<23:12:34, 7.66s/it, loss=0.0003, acc=1.0000, iter_time=10.96s]
Epoch 0: 12%|█▏ | 1478/12384 [3:08:43<23:12:34, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.65s]
Epoch 0: 12%|█▏ | 1479/12384 [3:08:43<23:09:25, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.65s]
Epoch 0: 12%|█▏ | 1479/12384 [3:08:51<23:09:25, 7.64s/it, loss=0.0020, acc=0.9936, iter_time=8.50s]
Epoch 0: 12%|█▏ | 1480/12384 [3:08:51<23:35:32, 7.79s/it, loss=0.0020, acc=0.9936, iter_time=8.50s]
Epoch 0: 12%|█▏ | 1480/12384 [3:08:59<23:35:32, 7.79s/it, loss=0.0027, acc=0.9929, iter_time=5.77s]
Epoch 0: 12%|█▏ | 1481/12384 [3:08:59<23:44:54, 7.84s/it, loss=0.0027, acc=0.9929, iter_time=5.77s]
Epoch 0: 12%|█▏ | 1481/12384 [3:09:06<23:44:54, 7.84s/it, loss=0.0005, acc=0.9999, iter_time=8.86s]
Epoch 0: 12%|█▏ | 1482/12384 [3:09:06<23:33:27, 7.78s/it, loss=0.0005, acc=0.9999, iter_time=8.86s]
Epoch 0: 12%|█▏ | 1482/12384 [3:09:14<23:33:27, 7.78s/it, loss=0.0023, acc=0.9971, iter_time=6.13s]
Epoch 0: 12%|█▏ | 1483/12384 [3:09:14<23:25:20, 7.74s/it, loss=0.0023, acc=0.9971, iter_time=6.13s]
Epoch 0: 12%|█▏ | 1483/12384 [3:09:22<23:25:20, 7.74s/it, loss=0.0136, acc=0.9805, iter_time=9.65s]
Epoch 0: 12%|█▏ | 1484/12384 [3:09:22<23:21:42, 7.72s/it, loss=0.0136, acc=0.9805, iter_time=9.65s]
Epoch 0: 12%|█▏ | 1484/12384 [3:09:29<23:21:42, 7.72s/it, loss=0.0017, acc=0.9970, iter_time=7.70s]
Epoch 0: 12%|█▏ | 1485/12384 [3:09:29<23:21:54, 7.72s/it, loss=0.0017, acc=0.9970, iter_time=7.70s]
Epoch 0: 12%|█▏ | 1485/12384 [3:09:37<23:21:54, 7.72s/it, loss=0.0021, acc=0.9939, iter_time=4.72s]
Epoch 0: 12%|█▏ | 1486/12384 [3:09:37<23:17:19, 7.69s/it, loss=0.0021, acc=0.9939, iter_time=4.72s]
Epoch 0: 12%|█▏ | 1486/12384 [3:09:45<23:17:19, 7.69s/it, loss=0.0008, acc=0.9964, iter_time=10.64s]
Epoch 0: 12%|█▏ | 1487/12384 [3:09:45<23:13:58, 7.68s/it, loss=0.0008, acc=0.9964, iter_time=10.64s]
Epoch 0: 12%|█▏ | 1487/12384 [3:09:52<23:13:58, 7.68s/it, loss=0.0022, acc=0.9957, iter_time=8.04s]
Epoch 0: 12%|█▏ | 1488/12384 [3:09:52<23:12:30, 7.67s/it, loss=0.0022, acc=0.9957, iter_time=8.04s]
Epoch 0: 12%|█▏ | 1488/12384 [3:10:00<23:12:30, 7.67s/it, loss=0.0035, acc=0.9887, iter_time=7.24s]
Epoch 0: 12%|█▏ | 1489/12384 [3:10:00<23:09:56, 7.65s/it, loss=0.0035, acc=0.9887, iter_time=7.24s]
Epoch 0: 12%|█▏ | 1489/12384 [3:10:08<23:09:56, 7.65s/it, loss=0.0028, acc=0.9943, iter_time=7.66s]
Epoch 0: 12%|█▏ | 1490/12384 [3:10:08<23:09:10, 7.65s/it, loss=0.0028, acc=0.9943, iter_time=7.66s]
Epoch 0: 12%|█▏ | 1490/12384 [3:10:15<23:09:10, 7.65s/it, loss=0.0006, acc=0.9988, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1491/12384 [3:10:15<23:06:42, 7.64s/it, loss=0.0006, acc=0.9988, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1491/12384 [3:10:23<23:06:42, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=7.60s]
Epoch 0: 12%|█▏ | 1492/12384 [3:10:23<23:06:10, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=7.60s]
Epoch 0: 12%|█▏ | 1492/12384 [3:10:31<23:06:10, 7.64s/it, loss=0.0126, acc=0.9808, iter_time=7.37s]
Epoch 0: 12%|█▏ | 1493/12384 [3:10:31<23:07:24, 7.64s/it, loss=0.0126, acc=0.9808, iter_time=7.37s]
Epoch 0: 12%|█▏ | 1493/12384 [3:10:38<23:07:24, 7.64s/it, loss=0.0022, acc=0.9956, iter_time=6.76s]
Epoch 0: 12%|█▏ | 1494/12384 [3:10:38<23:07:30, 7.64s/it, loss=0.0022, acc=0.9956, iter_time=6.76s]
Epoch 0: 12%|█▏ | 1494/12384 [3:10:46<23:07:30, 7.64s/it, loss=0.0007, acc=0.9998, iter_time=5.76s]
Epoch 0: 12%|█▏ | 1495/12384 [3:10:46<23:06:24, 7.64s/it, loss=0.0007, acc=0.9998, iter_time=5.76s]
Epoch 0: 12%|█▏ | 1495/12384 [3:10:53<23:06:24, 7.64s/it, loss=0.0030, acc=0.9960, iter_time=11.09s]
Epoch 0: 12%|█▏ | 1496/12384 [3:10:53<23:06:48, 7.64s/it, loss=0.0030, acc=0.9960, iter_time=11.09s]
Epoch 0: 12%|█▏ | 1496/12384 [3:11:01<23:06:48, 7.64s/it, loss=0.0012, acc=0.9962, iter_time=7.24s]
Epoch 0: 12%|█▏ | 1497/12384 [3:11:01<23:06:21, 7.64s/it, loss=0.0012, acc=0.9962, iter_time=7.24s]
Epoch 0: 12%|█▏ | 1497/12384 [3:11:09<23:06:21, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=6.72s]
Epoch 0: 12%|█▏ | 1498/12384 [3:11:09<23:04:51, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=6.72s]
Epoch 0: 12%|█▏ | 1498/12384 [3:11:16<23:04:51, 7.63s/it, loss=0.0013, acc=0.9961, iter_time=7.33s]
Epoch 0: 12%|█▏ | 1499/12384 [3:11:16<23:05:24, 7.64s/it, loss=0.0013, acc=0.9961, iter_time=7.33s]
Epoch 0: 12%|█▏ | 1499/12384 [3:11:24<23:05:24, 7.64s/it, loss=0.0004, acc=1.0000, iter_time=9.29s]
Epoch 0: 12%|█▏ | 1500/12384 [3:11:24<23:16:06, 7.70s/it, loss=0.0004, acc=1.0000, iter_time=9.29s]
Epoch 0: 12%|█▏ | 1500/12384 [3:11:32<23:16:06, 7.70s/it, loss=0.0019, acc=0.9970, iter_time=5.91s]
Epoch 0: 12%|█▏ | 1501/12384 [3:11:32<23:10:47, 7.67s/it, loss=0.0019, acc=0.9970, iter_time=5.91s]
Epoch 0: 12%|█▏ | 1501/12384 [3:11:39<23:10:47, 7.67s/it, loss=0.0025, acc=0.9960, iter_time=9.13s]
Epoch 0: 12%|█▏ | 1502/12384 [3:11:39<23:12:44, 7.68s/it, loss=0.0025, acc=0.9960, iter_time=9.13s]
Epoch 0: 12%|█▏ | 1502/12384 [3:11:47<23:12:44, 7.68s/it, loss=0.0012, acc=0.9977, iter_time=7.72s]
Epoch 0: 12%|█▏ | 1503/12384 [3:11:47<23:10:18, 7.67s/it, loss=0.0012, acc=0.9977, iter_time=7.72s]
Epoch 0: 12%|█▏ | 1503/12384 [3:11:55<23:10:18, 7.67s/it, loss=0.0003, acc=1.0000, iter_time=7.56s]
Epoch 0: 12%|█▏ | 1504/12384 [3:11:55<23:07:27, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=7.56s]
Epoch 0: 12%|█▏ | 1504/12384 [3:12:02<23:07:27, 7.65s/it, loss=0.0004, acc=1.0000, iter_time=7.67s]
Epoch 0: 12%|█▏ | 1505/12384 [3:12:02<23:08:35, 7.66s/it, loss=0.0004, acc=1.0000, iter_time=7.67s]
Epoch 0: 12%|█▏ | 1505/12384 [3:12:10<23:08:35, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.68s]
Epoch 0: 12%|█▏ | 1506/12384 [3:12:10<23:10:07, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=7.68s]
Epoch 0: 12%|█▏ | 1506/12384 [3:12:18<23:10:07, 7.67s/it, loss=0.0021, acc=0.9969, iter_time=4.86s]
Epoch 0: 12%|█▏ | 1507/12384 [3:12:18<23:25:05, 7.75s/it, loss=0.0021, acc=0.9969, iter_time=4.86s]
Epoch 0: 12%|█▏ | 1507/12384 [3:12:26<23:25:05, 7.75s/it, loss=0.0007, acc=0.9990, iter_time=9.26s]
Epoch 0: 12%|█▏ | 1508/12384 [3:12:26<23:17:48, 7.71s/it, loss=0.0007, acc=0.9990, iter_time=9.26s]
Epoch 0: 12%|█▏ | 1508/12384 [3:12:33<23:17:48, 7.71s/it, loss=0.0008, acc=0.9986, iter_time=9.12s]
Epoch 0: 12%|█▏ | 1509/12384 [3:12:33<23:12:32, 7.68s/it, loss=0.0008, acc=0.9986, iter_time=9.12s]
Epoch 0: 12%|█▏ | 1509/12384 [3:12:41<23:12:32, 7.68s/it, loss=0.0013, acc=0.9969, iter_time=4.76s]
Epoch 0: 12%|█▏ | 1510/12384 [3:12:41<23:09:02, 7.66s/it, loss=0.0013, acc=0.9969, iter_time=4.76s]
Epoch 0: 12%|█▏ | 1510/12384 [3:12:49<23:09:02, 7.66s/it, loss=0.0007, acc=0.9972, iter_time=10.48s]
Epoch 0: 12%|█▏ | 1511/12384 [3:12:49<23:08:10, 7.66s/it, loss=0.0007, acc=0.9972, iter_time=10.48s]
Epoch 0: 12%|█▏ | 1511/12384 [3:12:56<23:08:10, 7.66s/it, loss=0.0009, acc=0.9984, iter_time=8.06s]
Epoch 0: 12%|█▏ | 1512/12384 [3:12:56<23:08:56, 7.67s/it, loss=0.0009, acc=0.9984, iter_time=8.06s]
Epoch 0: 12%|█▏ | 1512/12384 [3:13:04<23:08:56, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=6.16s]
Epoch 0: 12%|█▏ | 1513/12384 [3:13:04<23:07:30, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=6.16s]
Epoch 0: 12%|█▏ | 1513/12384 [3:13:12<23:07:30, 7.66s/it, loss=0.0005, acc=0.9994, iter_time=8.88s]
Epoch 0: 12%|█▏ | 1514/12384 [3:13:12<23:12:22, 7.69s/it, loss=0.0005, acc=0.9994, iter_time=8.88s]
Epoch 0: 12%|█▏ | 1514/12384 [3:13:19<23:12:22, 7.69s/it, loss=0.0022, acc=0.9975, iter_time=7.63s]
Epoch 0: 12%|█▏ | 1515/12384 [3:13:19<23:08:29, 7.66s/it, loss=0.0022, acc=0.9975, iter_time=7.63s]
Epoch 0: 12%|█▏ | 1515/12384 [3:13:27<23:08:29, 7.66s/it, loss=0.0019, acc=0.9969, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1516/12384 [3:13:27<23:06:06, 7.65s/it, loss=0.0019, acc=0.9969, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1516/12384 [3:13:34<23:06:06, 7.65s/it, loss=0.0150, acc=0.9878, iter_time=7.63s]
Epoch 0: 12%|█▏ | 1517/12384 [3:13:34<23:05:12, 7.65s/it, loss=0.0150, acc=0.9878, iter_time=7.63s]
Epoch 0: 12%|█▏ | 1517/12384 [3:13:42<23:05:12, 7.65s/it, loss=0.0009, acc=0.9995, iter_time=4.04s]
Epoch 0: 12%|█▏ | 1518/12384 [3:13:42<23:05:17, 7.65s/it, loss=0.0009, acc=0.9995, iter_time=4.04s]
Epoch 0: 12%|█▏ | 1518/12384 [3:13:50<23:05:17, 7.65s/it, loss=0.0018, acc=0.9972, iter_time=11.22s]
Epoch 0: 12%|█▏ | 1519/12384 [3:13:50<23:03:27, 7.64s/it, loss=0.0018, acc=0.9972, iter_time=11.22s]
Epoch 0: 12%|█▏ | 1519/12384 [3:13:57<23:03:27, 7.64s/it, loss=0.0075, acc=0.9868, iter_time=7.63s]
Epoch 0: 12%|█▏ | 1520/12384 [3:13:57<23:04:11, 7.64s/it, loss=0.0075, acc=0.9868, iter_time=7.63s]
Epoch 0: 12%|█▏ | 1520/12384 [3:14:05<23:04:11, 7.64s/it, loss=0.0009, acc=0.9977, iter_time=7.66s]
Epoch 0: 12%|█▏ | 1521/12384 [3:14:05<23:06:29, 7.66s/it, loss=0.0009, acc=0.9977, iter_time=7.66s]
Epoch 0: 12%|█▏ | 1521/12384 [3:14:13<23:06:29, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.73s]
Epoch 0: 12%|█▏ | 1522/12384 [3:14:13<23:04:56, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.73s]
Epoch 0: 12%|█▏ | 1522/12384 [3:14:20<23:04:56, 7.65s/it, loss=0.0009, acc=0.9973, iter_time=7.64s]
Epoch 0: 12%|█▏ | 1523/12384 [3:14:20<23:04:30, 7.65s/it, loss=0.0009, acc=0.9973, iter_time=7.64s]
Epoch 0: 12%|█▏ | 1523/12384 [3:14:28<23:04:30, 7.65s/it, loss=0.0015, acc=0.9973, iter_time=5.06s]
Epoch 0: 12%|█▏ | 1524/12384 [3:14:28<23:02:57, 7.64s/it, loss=0.0015, acc=0.9973, iter_time=5.06s]
Epoch 0: 12%|█▏ | 1524/12384 [3:14:36<23:02:57, 7.64s/it, loss=0.0007, acc=0.9992, iter_time=10.18s]
Epoch 0: 12%|█▏ | 1525/12384 [3:14:36<23:03:16, 7.64s/it, loss=0.0007, acc=0.9992, iter_time=10.18s]
Epoch 0: 12%|█▏ | 1525/12384 [3:14:43<23:03:16, 7.64s/it, loss=0.0009, acc=0.9974, iter_time=7.64s]
Epoch 0: 12%|█▏ | 1526/12384 [3:14:43<23:04:36, 7.65s/it, loss=0.0009, acc=0.9974, iter_time=7.64s]
Epoch 0: 12%|█▏ | 1526/12384 [3:14:51<23:04:36, 7.65s/it, loss=0.0006, acc=1.0000, iter_time=7.67s]
Epoch 0: 12%|█▏ | 1527/12384 [3:14:51<23:02:04, 7.64s/it, loss=0.0006, acc=1.0000, iter_time=7.67s]
Epoch 0: 12%|█▏ | 1527/12384 [3:14:59<23:02:04, 7.64s/it, loss=0.0004, acc=1.0000, iter_time=8.00s]
Epoch 0: 12%|█▏ | 1528/12384 [3:14:59<23:00:12, 7.63s/it, loss=0.0004, acc=1.0000, iter_time=8.00s]
Epoch 0: 12%|█▏ | 1528/12384 [3:15:06<23:00:12, 7.63s/it, loss=0.0005, acc=0.9997, iter_time=5.68s]
Epoch 0: 12%|█▏ | 1529/12384 [3:15:06<22:58:58, 7.62s/it, loss=0.0005, acc=0.9997, iter_time=5.68s]
Epoch 0: 12%|█▏ | 1529/12384 [3:15:14<22:58:58, 7.62s/it, loss=0.0013, acc=0.9963, iter_time=7.34s]
Epoch 0: 12%|█▏ | 1530/12384 [3:15:14<23:00:16, 7.63s/it, loss=0.0013, acc=0.9963, iter_time=7.34s]
Epoch 0: 12%|█▏ | 1530/12384 [3:15:21<23:00:16, 7.63s/it, loss=0.0008, acc=0.9983, iter_time=9.45s]
Epoch 0: 12%|█▏ | 1531/12384 [3:15:21<23:02:13, 7.64s/it, loss=0.0008, acc=0.9983, iter_time=9.45s]
Epoch 0: 12%|█▏ | 1531/12384 [3:15:29<23:02:13, 7.64s/it, loss=0.0010, acc=0.9979, iter_time=5.89s]
Epoch 0: 12%|█▏ | 1532/12384 [3:15:29<23:00:17, 7.63s/it, loss=0.0010, acc=0.9979, iter_time=5.89s]
Epoch 0: 12%|█▏ | 1532/12384 [3:15:37<23:00:17, 7.63s/it, loss=0.0004, acc=0.9985, iter_time=9.64s]
Epoch 0: 12%|█▏ | 1533/12384 [3:15:37<23:17:42, 7.73s/it, loss=0.0004, acc=0.9985, iter_time=9.64s]
Epoch 0: 12%|█▏ | 1533/12384 [3:15:45<23:17:42, 7.73s/it, loss=0.0029, acc=0.9919, iter_time=7.68s]
Epoch 0: 12%|█▏ | 1534/12384 [3:15:45<23:10:12, 7.69s/it, loss=0.0029, acc=0.9919, iter_time=7.68s]
Epoch 0: 12%|█▏ | 1534/12384 [3:15:52<23:10:12, 7.69s/it, loss=0.0009, acc=0.9962, iter_time=6.68s]
Epoch 0: 12%|█▏ | 1535/12384 [3:15:52<23:05:38, 7.66s/it, loss=0.0009, acc=0.9962, iter_time=6.68s]
Epoch 0: 12%|█▏ | 1535/12384 [3:16:00<23:05:38, 7.66s/it, loss=0.0023, acc=0.9937, iter_time=8.92s]
Epoch 0: 12%|█▏ | 1536/12384 [3:16:00<23:03:56, 7.65s/it, loss=0.0023, acc=0.9937, iter_time=8.92s]
Epoch 0: 12%|█▏ | 1536/12384 [3:16:07<23:03:56, 7.65s/it, loss=0.0012, acc=1.0000, iter_time=7.24s]
Epoch 0: 12%|█▏ | 1537/12384 [3:16:07<23:03:24, 7.65s/it, loss=0.0012, acc=1.0000, iter_time=7.24s]
Epoch 0: 12%|█▏ | 1537/12384 [3:16:15<23:03:24, 7.65s/it, loss=0.0012, acc=0.9967, iter_time=7.35s]
Epoch 0: 12%|█▏ | 1538/12384 [3:16:15<23:00:34, 7.64s/it, loss=0.0012, acc=0.9967, iter_time=7.35s]
Epoch 0: 12%|█▏ | 1538/12384 [3:16:23<23:00:34, 7.64s/it, loss=0.0006, acc=0.9982, iter_time=7.90s]
Epoch 0: 12%|█▏ | 1539/12384 [3:16:23<22:59:31, 7.63s/it, loss=0.0006, acc=0.9982, iter_time=7.90s]
Epoch 0: 12%|█▏ | 1539/12384 [3:16:30<22:59:31, 7.63s/it, loss=0.0005, acc=1.0000, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1540/12384 [3:16:30<22:58:35, 7.63s/it, loss=0.0005, acc=1.0000, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1540/12384 [3:16:38<22:58:35, 7.63s/it, loss=0.0024, acc=0.9947, iter_time=7.61s]
Epoch 0: 12%|█▏ | 1541/12384 [3:16:38<22:56:39, 7.62s/it, loss=0.0024, acc=0.9947, iter_time=7.61s]
Epoch 0: 12%|█▏ | 1541/12384 [3:16:46<22:56:39, 7.62s/it, loss=0.0049, acc=0.9881, iter_time=7.60s]
Epoch 0: 12%|█▏ | 1542/12384 [3:16:46<22:56:55, 7.62s/it, loss=0.0049, acc=0.9881, iter_time=7.60s]
Epoch 0: 12%|█▏ | 1542/12384 [3:16:53<22:56:55, 7.62s/it, loss=0.0007, acc=0.9980, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1543/12384 [3:16:53<22:56:57, 7.62s/it, loss=0.0007, acc=0.9980, iter_time=7.62s]
Epoch 0: 12%|█▏ | 1543/12384 [3:17:01<22:56:57, 7.62s/it, loss=0.0010, acc=0.9980, iter_time=8.13s]
Epoch 0: 12%|█▏ | 1544/12384 [3:17:01<23:02:32, 7.65s/it, loss=0.0010, acc=0.9980, iter_time=8.13s]
Epoch 0: 12%|█▏ | 1544/12384 [3:17:09<23:02:32, 7.65s/it, loss=0.0014, acc=0.9992, iter_time=7.23s]
Epoch 0: 12%|█▏ | 1545/12384 [3:17:09<23:02:22, 7.65s/it, loss=0.0014, acc=0.9992, iter_time=7.23s]
Epoch 0: 12%|█▏ | 1545/12384 [3:17:16<23:02:22, 7.65s/it, loss=0.0048, acc=0.9919, iter_time=7.66s]
Epoch 0: 12%|█▏ | 1546/12384 [3:17:16<23:02:57, 7.66s/it, loss=0.0048, acc=0.9919, iter_time=7.66s]
Epoch 0: 12%|█▏ | 1546/12384 [3:17:24<23:02:57, 7.66s/it, loss=0.0003, acc=0.9997, iter_time=6.71s]
Epoch 0: 12%|█▏ | 1547/12384 [3:17:24<23:01:48, 7.65s/it, loss=0.0003, acc=0.9997, iter_time=6.71s]
Epoch 0: 12%|█▏ | 1547/12384 [3:17:31<23:01:48, 7.65s/it, loss=0.0013, acc=0.9988, iter_time=8.60s]
Epoch 0: 12%|█▎ | 1548/12384 [3:17:31<23:01:00, 7.65s/it, loss=0.0013, acc=0.9988, iter_time=8.60s]
Epoch 0: 12%|█▎ | 1548/12384 [3:17:39<23:01:00, 7.65s/it, loss=0.0007, acc=0.9980, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1549/12384 [3:17:39<22:59:30, 7.64s/it, loss=0.0007, acc=0.9980, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1549/12384 [3:17:47<22:59:30, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=8.09s]
Epoch 0: 13%|█▎ | 1550/12384 [3:17:47<23:01:30, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=8.09s]
Epoch 0: 13%|█▎ | 1550/12384 [3:17:54<23:01:30, 7.65s/it, loss=0.0006, acc=0.9977, iter_time=4.15s]
Epoch 0: 13%|█▎ | 1551/12384 [3:17:54<23:01:58, 7.65s/it, loss=0.0006, acc=0.9977, iter_time=4.15s]
Epoch 0: 13%|█▎ | 1551/12384 [3:18:02<23:01:58, 7.65s/it, loss=0.0007, acc=0.9989, iter_time=11.10s]
Epoch 0: 13%|█▎ | 1552/12384 [3:18:02<23:00:29, 7.65s/it, loss=0.0007, acc=0.9989, iter_time=11.10s]
Epoch 0: 13%|█▎ | 1552/12384 [3:18:10<23:00:29, 7.65s/it, loss=0.0006, acc=0.9980, iter_time=4.62s]
Epoch 0: 13%|█▎ | 1553/12384 [3:18:10<23:00:36, 7.65s/it, loss=0.0006, acc=0.9980, iter_time=4.62s]
Epoch 0: 13%|█▎ | 1553/12384 [3:18:17<23:00:36, 7.65s/it, loss=0.0007, acc=0.9998, iter_time=7.69s]
Epoch 0: 13%|█▎ | 1554/12384 [3:18:17<23:01:50, 7.66s/it, loss=0.0007, acc=0.9998, iter_time=7.69s]
Epoch 0: 13%|█▎ | 1554/12384 [3:18:25<23:01:50, 7.66s/it, loss=0.0211, acc=0.9780, iter_time=8.81s]
Epoch 0: 13%|█▎ | 1555/12384 [3:18:25<22:59:00, 7.64s/it, loss=0.0211, acc=0.9780, iter_time=8.81s]
Epoch 0: 13%|█▎ | 1555/12384 [3:18:33<22:59:00, 7.64s/it, loss=0.0010, acc=0.9978, iter_time=9.05s]
Epoch 0: 13%|█▎ | 1556/12384 [3:18:33<22:57:38, 7.63s/it, loss=0.0010, acc=0.9978, iter_time=9.05s]
Epoch 0: 13%|█▎ | 1556/12384 [3:18:40<22:57:38, 7.63s/it, loss=0.0010, acc=0.9950, iter_time=4.84s]
Epoch 0: 13%|█▎ | 1557/12384 [3:18:40<22:55:52, 7.62s/it, loss=0.0010, acc=0.9950, iter_time=4.84s]
Epoch 0: 13%|█▎ | 1557/12384 [3:18:48<22:55:52, 7.62s/it, loss=0.0012, acc=0.9998, iter_time=7.08s]
Epoch 0: 13%|█▎ | 1558/12384 [3:18:48<22:55:40, 7.62s/it, loss=0.0012, acc=0.9998, iter_time=7.08s]
Epoch 0: 13%|█▎ | 1558/12384 [3:18:55<22:55:40, 7.62s/it, loss=0.0007, acc=0.9967, iter_time=7.53s]
Epoch 0: 13%|█▎ | 1559/12384 [3:18:55<22:56:06, 7.63s/it, loss=0.0007, acc=0.9967, iter_time=7.53s]
Epoch 0: 13%|█▎ | 1559/12384 [3:19:03<22:56:06, 7.63s/it, loss=0.0005, acc=0.9983, iter_time=11.71s]
Epoch 0: 13%|█▎ | 1560/12384 [3:19:03<23:11:11, 7.71s/it, loss=0.0005, acc=0.9983, iter_time=11.71s]
Epoch 0: 13%|█▎ | 1560/12384 [3:19:11<23:11:11, 7.71s/it, loss=0.0009, acc=0.9979, iter_time=7.21s]
Epoch 0: 13%|█▎ | 1561/12384 [3:19:11<23:06:16, 7.69s/it, loss=0.0009, acc=0.9979, iter_time=7.21s]
Epoch 0: 13%|█▎ | 1561/12384 [3:19:19<23:06:16, 7.69s/it, loss=0.0013, acc=0.9957, iter_time=5.10s]
Epoch 0: 13%|█▎ | 1562/12384 [3:19:19<23:01:29, 7.66s/it, loss=0.0013, acc=0.9957, iter_time=5.10s]
Epoch 0: 13%|█▎ | 1562/12384 [3:19:26<23:01:29, 7.66s/it, loss=0.0006, acc=0.9981, iter_time=10.14s]
Epoch 0: 13%|█▎ | 1563/12384 [3:19:26<22:59:33, 7.65s/it, loss=0.0006, acc=0.9981, iter_time=10.14s]
Epoch 0: 13%|█▎ | 1563/12384 [3:19:34<22:59:33, 7.65s/it, loss=0.0033, acc=0.9926, iter_time=4.61s]
Epoch 0: 13%|█▎ | 1564/12384 [3:19:34<22:58:37, 7.64s/it, loss=0.0033, acc=0.9926, iter_time=4.61s]
Epoch 0: 13%|█▎ | 1564/12384 [3:19:41<22:58:37, 7.64s/it, loss=0.0080, acc=0.9841, iter_time=10.64s]
Epoch 0: 13%|█▎ | 1565/12384 [3:19:41<22:56:46, 7.64s/it, loss=0.0080, acc=0.9841, iter_time=10.64s]
Epoch 0: 13%|█▎ | 1565/12384 [3:19:49<22:56:46, 7.64s/it, loss=0.0042, acc=0.9969, iter_time=7.63s]
Epoch 0: 13%|█▎ | 1566/12384 [3:19:49<22:56:44, 7.64s/it, loss=0.0042, acc=0.9969, iter_time=7.63s]
Epoch 0: 13%|█▎ | 1566/12384 [3:19:57<22:56:44, 7.64s/it, loss=0.0015, acc=0.9952, iter_time=5.84s]
Epoch 0: 13%|█▎ | 1567/12384 [3:19:57<22:55:26, 7.63s/it, loss=0.0015, acc=0.9952, iter_time=5.84s]
Epoch 0: 13%|█▎ | 1567/12384 [3:20:04<22:55:26, 7.63s/it, loss=0.0007, acc=0.9999, iter_time=9.78s]
Epoch 0: 13%|█▎ | 1568/12384 [3:20:04<22:53:18, 7.62s/it, loss=0.0007, acc=0.9999, iter_time=9.78s]
Epoch 0: 13%|█▎ | 1568/12384 [3:20:12<22:53:18, 7.62s/it, loss=0.0009, acc=0.9978, iter_time=3.86s]
Epoch 0: 13%|█▎ | 1569/12384 [3:20:12<22:56:36, 7.64s/it, loss=0.0009, acc=0.9978, iter_time=3.86s]
Epoch 0: 13%|█▎ | 1569/12384 [3:20:20<22:56:36, 7.64s/it, loss=0.0008, acc=0.9954, iter_time=9.60s]
Epoch 0: 13%|█▎ | 1570/12384 [3:20:20<22:57:19, 7.64s/it, loss=0.0008, acc=0.9954, iter_time=9.60s]
Epoch 0: 13%|█▎ | 1570/12384 [3:20:27<22:57:19, 7.64s/it, loss=0.0051, acc=0.9882, iter_time=7.57s]
Epoch 0: 13%|█▎ | 1571/12384 [3:20:27<22:57:35, 7.64s/it, loss=0.0051, acc=0.9882, iter_time=7.57s]
Epoch 0: 13%|█▎ | 1571/12384 [3:20:35<22:57:35, 7.64s/it, loss=0.0013, acc=0.9959, iter_time=9.16s]
Epoch 0: 13%|█▎ | 1572/12384 [3:20:35<22:55:31, 7.63s/it, loss=0.0013, acc=0.9959, iter_time=9.16s]
Epoch 0: 13%|█▎ | 1572/12384 [3:20:43<22:55:31, 7.63s/it, loss=0.0010, acc=0.9984, iter_time=7.62s]
Epoch 0: 13%|█▎ | 1573/12384 [3:20:43<22:53:17, 7.62s/it, loss=0.0010, acc=0.9984, iter_time=7.62s]
Epoch 0: 13%|█▎ | 1573/12384 [3:20:50<22:53:17, 7.62s/it, loss=0.0005, acc=0.9993, iter_time=4.76s]
Epoch 0: 13%|█▎ | 1574/12384 [3:20:50<22:53:55, 7.63s/it, loss=0.0005, acc=0.9993, iter_time=4.76s]
Epoch 0: 13%|█▎ | 1574/12384 [3:20:58<22:53:55, 7.63s/it, loss=0.0005, acc=0.9997, iter_time=10.49s]
Epoch 0: 13%|█▎ | 1575/12384 [3:20:58<22:56:57, 7.64s/it, loss=0.0005, acc=0.9997, iter_time=10.49s]
Epoch 0: 13%|█▎ | 1575/12384 [3:21:05<22:56:57, 7.64s/it, loss=0.0028, acc=0.9960, iter_time=8.08s]
Epoch 0: 13%|█▎ | 1576/12384 [3:21:05<22:56:33, 7.64s/it, loss=0.0028, acc=0.9960, iter_time=8.08s]
Epoch 0: 13%|█▎ | 1576/12384 [3:21:13<22:56:33, 7.64s/it, loss=0.0037, acc=0.9941, iter_time=7.23s]
Epoch 0: 13%|█▎ | 1577/12384 [3:21:13<22:56:12, 7.64s/it, loss=0.0037, acc=0.9941, iter_time=7.23s]
Epoch 0: 13%|█▎ | 1577/12384 [3:21:21<22:56:12, 7.64s/it, loss=0.0005, acc=0.9979, iter_time=7.63s]
Epoch 0: 13%|█▎ | 1578/12384 [3:21:21<22:54:41, 7.63s/it, loss=0.0005, acc=0.9979, iter_time=7.63s]
Epoch 0: 13%|█▎ | 1578/12384 [3:21:28<22:54:41, 7.63s/it, loss=0.0009, acc=0.9978, iter_time=6.66s]
Epoch 0: 13%|█▎ | 1579/12384 [3:21:28<22:53:32, 7.63s/it, loss=0.0009, acc=0.9978, iter_time=6.66s]
Epoch 0: 13%|█▎ | 1579/12384 [3:21:36<22:53:32, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=8.27s]
Epoch 0: 13%|█▎ | 1580/12384 [3:21:36<22:51:45, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=8.27s]
Epoch 0: 13%|█▎ | 1580/12384 [3:21:44<22:51:45, 7.62s/it, loss=0.0041, acc=0.9935, iter_time=6.18s]
Epoch 0: 13%|█▎ | 1581/12384 [3:21:44<22:50:30, 7.61s/it, loss=0.0041, acc=0.9935, iter_time=6.18s]
Epoch 0: 13%|█▎ | 1581/12384 [3:21:51<22:50:30, 7.61s/it, loss=0.0013, acc=0.9954, iter_time=9.33s]
Epoch 0: 13%|█▎ | 1582/12384 [3:21:51<22:51:13, 7.62s/it, loss=0.0013, acc=0.9954, iter_time=9.33s]
Epoch 0: 13%|█▎ | 1582/12384 [3:21:59<22:51:13, 7.62s/it, loss=0.0008, acc=0.9990, iter_time=7.63s]
Epoch 0: 13%|█▎ | 1583/12384 [3:21:59<22:51:47, 7.62s/it, loss=0.0008, acc=0.9990, iter_time=7.63s]
Epoch 0: 13%|█▎ | 1583/12384 [3:22:06<22:51:47, 7.62s/it, loss=0.0012, acc=0.9966, iter_time=8.01s]
Epoch 0: 13%|█▎ | 1584/12384 [3:22:06<22:52:57, 7.63s/it, loss=0.0012, acc=0.9966, iter_time=8.01s]
Epoch 0: 13%|█▎ | 1584/12384 [3:22:14<22:52:57, 7.63s/it, loss=0.0004, acc=1.0000, iter_time=7.29s]
Epoch 0: 13%|█▎ | 1585/12384 [3:22:14<22:54:10, 7.63s/it, loss=0.0004, acc=1.0000, iter_time=7.29s]
Epoch 0: 13%|█▎ | 1585/12384 [3:22:22<22:54:10, 7.63s/it, loss=0.0015, acc=0.9975, iter_time=5.60s]
Epoch 0: 13%|█▎ | 1586/12384 [3:22:22<23:11:30, 7.73s/it, loss=0.0015, acc=0.9975, iter_time=5.60s]
Epoch 0: 13%|█▎ | 1586/12384 [3:22:30<23:11:30, 7.73s/it, loss=0.0004, acc=0.9998, iter_time=9.96s]
Epoch 0: 13%|█▎ | 1587/12384 [3:22:30<23:05:37, 7.70s/it, loss=0.0004, acc=0.9998, iter_time=9.96s]
Epoch 0: 13%|█▎ | 1587/12384 [3:22:37<23:05:37, 7.70s/it, loss=0.0005, acc=0.9980, iter_time=7.70s]
Epoch 0: 13%|█▎ | 1588/12384 [3:22:37<23:04:33, 7.69s/it, loss=0.0005, acc=0.9980, iter_time=7.70s]
Epoch 0: 13%|█▎ | 1588/12384 [3:22:45<23:04:33, 7.69s/it, loss=0.0005, acc=0.9972, iter_time=6.11s]
Epoch 0: 13%|█▎ | 1589/12384 [3:22:45<23:02:00, 7.68s/it, loss=0.0005, acc=0.9972, iter_time=6.11s]
Epoch 0: 13%|█▎ | 1589/12384 [3:22:53<23:02:00, 7.68s/it, loss=0.0051, acc=0.9887, iter_time=9.14s]
Epoch 0: 13%|█▎ | 1590/12384 [3:22:53<22:57:25, 7.66s/it, loss=0.0051, acc=0.9887, iter_time=9.14s]
Epoch 0: 13%|█▎ | 1590/12384 [3:23:00<22:57:25, 7.66s/it, loss=0.0006, acc=0.9992, iter_time=7.62s]
Epoch 0: 13%|█▎ | 1591/12384 [3:23:00<23:00:08, 7.67s/it, loss=0.0006, acc=0.9992, iter_time=7.62s]
Epoch 0: 13%|█▎ | 1591/12384 [3:23:08<23:00:08, 7.67s/it, loss=0.0019, acc=0.9985, iter_time=7.65s]
Epoch 0: 13%|█▎ | 1592/12384 [3:23:08<22:57:23, 7.66s/it, loss=0.0019, acc=0.9985, iter_time=7.65s]
Epoch 0: 13%|█▎ | 1592/12384 [3:23:16<22:57:23, 7.66s/it, loss=0.0057, acc=0.9909, iter_time=7.66s]
Epoch 0: 13%|█▎ | 1593/12384 [3:23:16<22:56:01, 7.65s/it, loss=0.0057, acc=0.9909, iter_time=7.66s]
Epoch 0: 13%|█▎ | 1593/12384 [3:23:23<22:56:01, 7.65s/it, loss=0.0022, acc=0.9970, iter_time=7.64s]
Epoch 0: 13%|█▎ | 1594/12384 [3:23:23<22:54:34, 7.64s/it, loss=0.0022, acc=0.9970, iter_time=7.64s]
Epoch 0: 13%|█▎ | 1594/12384 [3:23:31<22:54:34, 7.64s/it, loss=0.0005, acc=0.9996, iter_time=5.52s]
Epoch 0: 13%|█▎ | 1595/12384 [3:23:31<22:56:24, 7.65s/it, loss=0.0005, acc=0.9996, iter_time=5.52s]
Epoch 0: 13%|█▎ | 1595/12384 [3:23:39<22:56:24, 7.65s/it, loss=0.0004, acc=1.0000, iter_time=9.78s]
Epoch 0: 13%|█▎ | 1596/12384 [3:23:39<22:54:38, 7.65s/it, loss=0.0004, acc=1.0000, iter_time=9.78s]
Epoch 0: 13%|█▎ | 1596/12384 [3:23:46<22:54:38, 7.65s/it, loss=0.0013, acc=0.9976, iter_time=7.62s]
Epoch 0: 13%|█▎ | 1597/12384 [3:23:46<22:54:46, 7.65s/it, loss=0.0013, acc=0.9976, iter_time=7.62s]
Epoch 0: 13%|█▎ | 1597/12384 [3:23:54<22:54:46, 7.65s/it, loss=0.0027, acc=0.9962, iter_time=5.05s]
Epoch 0: 13%|█▎ | 1598/12384 [3:23:54<22:52:44, 7.64s/it, loss=0.0027, acc=0.9962, iter_time=5.05s]
Epoch 0: 13%|█▎ | 1598/12384 [3:24:01<22:52:44, 7.64s/it, loss=0.0005, acc=0.9994, iter_time=7.71s]
Epoch 0: 13%|█▎ | 1599/12384 [3:24:01<22:54:51, 7.65s/it, loss=0.0005, acc=0.9994, iter_time=7.71s]
Epoch 0: 13%|█▎ | 1599/12384 [3:24:09<22:54:51, 7.65s/it, loss=0.0029, acc=0.9943, iter_time=10.60s]
Epoch 0: 13%|█▎ | 1600/12384 [3:24:09<22:53:36, 7.64s/it, loss=0.0029, acc=0.9943, iter_time=10.60s]
Epoch 0: 13%|█▎ | 1600/12384 [3:24:17<22:53:36, 7.64s/it, loss=0.0007, acc=0.9980, iter_time=7.20s]
Epoch 0: 13%|█▎ | 1601/12384 [3:24:17<22:50:58, 7.63s/it, loss=0.0007, acc=0.9980, iter_time=7.20s]
Epoch 0: 13%|█▎ | 1601/12384 [3:24:24<22:50:58, 7.63s/it, loss=0.0022, acc=0.9979, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1602/12384 [3:24:24<22:50:03, 7.62s/it, loss=0.0022, acc=0.9979, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1602/12384 [3:24:32<22:50:03, 7.62s/it, loss=0.0007, acc=0.9977, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1603/12384 [3:24:32<22:50:23, 7.63s/it, loss=0.0007, acc=0.9977, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1603/12384 [3:24:40<22:50:23, 7.63s/it, loss=0.0016, acc=0.9905, iter_time=4.61s]
Epoch 0: 13%|█▎ | 1604/12384 [3:24:40<22:59:01, 7.68s/it, loss=0.0016, acc=0.9905, iter_time=4.61s]
Epoch 0: 13%|█▎ | 1604/12384 [3:24:47<22:59:01, 7.68s/it, loss=0.0010, acc=0.9991, iter_time=10.81s]
Epoch 0: 13%|█▎ | 1605/12384 [3:24:47<22:59:29, 7.68s/it, loss=0.0010, acc=0.9991, iter_time=10.81s]
Epoch 0: 13%|█▎ | 1605/12384 [3:24:55<22:59:29, 7.68s/it, loss=0.0037, acc=0.9920, iter_time=7.69s]
Epoch 0: 13%|█▎ | 1606/12384 [3:24:55<22:58:01, 7.67s/it, loss=0.0037, acc=0.9920, iter_time=7.69s]
Epoch 0: 13%|█▎ | 1606/12384 [3:25:03<22:58:01, 7.67s/it, loss=0.0025, acc=0.9956, iter_time=7.66s]
Epoch 0: 13%|█▎ | 1607/12384 [3:25:03<22:56:18, 7.66s/it, loss=0.0025, acc=0.9956, iter_time=7.66s]
Epoch 0: 13%|█▎ | 1607/12384 [3:25:10<22:56:18, 7.66s/it, loss=0.0010, acc=0.9992, iter_time=8.02s]
Epoch 0: 13%|█▎ | 1608/12384 [3:25:10<22:55:38, 7.66s/it, loss=0.0010, acc=0.9992, iter_time=8.02s]
Epoch 0: 13%|█▎ | 1608/12384 [3:25:18<22:55:38, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.26s]
Epoch 0: 13%|█▎ | 1609/12384 [3:25:18<22:54:02, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.26s]
Epoch 0: 13%|█▎ | 1609/12384 [3:25:26<22:54:02, 7.65s/it, loss=0.0033, acc=0.9928, iter_time=7.64s]
Epoch 0: 13%|█▎ | 1610/12384 [3:25:26<22:52:26, 7.64s/it, loss=0.0033, acc=0.9928, iter_time=7.64s]
Epoch 0: 13%|█▎ | 1610/12384 [3:25:33<22:52:26, 7.64s/it, loss=0.0009, acc=0.9998, iter_time=4.09s]
Epoch 0: 13%|█▎ | 1611/12384 [3:25:33<22:52:51, 7.65s/it, loss=0.0009, acc=0.9998, iter_time=4.09s]
Epoch 0: 13%|█▎ | 1611/12384 [3:25:41<22:52:51, 7.65s/it, loss=0.0007, acc=0.9997, iter_time=11.18s]
Epoch 0: 13%|█▎ | 1612/12384 [3:25:41<22:51:08, 7.64s/it, loss=0.0007, acc=0.9997, iter_time=11.18s]
Epoch 0: 13%|█▎ | 1612/12384 [3:25:49<22:51:08, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=7.94s]
Epoch 0: 13%|█▎ | 1613/12384 [3:25:49<23:12:34, 7.76s/it, loss=0.0003, acc=1.0000, iter_time=7.94s]
Epoch 0: 13%|█▎ | 1613/12384 [3:25:57<23:12:34, 7.76s/it, loss=0.0050, acc=0.9920, iter_time=7.71s]
Epoch 0: 13%|█▎ | 1614/12384 [3:25:57<23:05:10, 7.72s/it, loss=0.0050, acc=0.9920, iter_time=7.71s]
Epoch 0: 13%|█▎ | 1614/12384 [3:26:04<23:05:10, 7.72s/it, loss=0.0006, acc=0.9984, iter_time=7.62s]
Epoch 0: 13%|█▎ | 1615/12384 [3:26:04<22:59:45, 7.69s/it, loss=0.0006, acc=0.9984, iter_time=7.62s]
Epoch 0: 13%|█▎ | 1615/12384 [3:26:12<22:59:45, 7.69s/it, loss=0.0011, acc=0.9966, iter_time=7.99s]
Epoch 0: 13%|█▎ | 1616/12384 [3:26:12<22:55:11, 7.66s/it, loss=0.0011, acc=0.9966, iter_time=7.99s]
Epoch 0: 13%|█▎ | 1616/12384 [3:26:19<22:55:11, 7.66s/it, loss=0.0033, acc=0.9960, iter_time=7.23s]
Epoch 0: 13%|█▎ | 1617/12384 [3:26:19<22:53:37, 7.65s/it, loss=0.0033, acc=0.9960, iter_time=7.23s]
Epoch 0: 13%|█▎ | 1617/12384 [3:26:27<22:53:37, 7.65s/it, loss=0.0006, acc=0.9975, iter_time=7.64s]
Epoch 0: 13%|█▎ | 1618/12384 [3:26:27<22:55:24, 7.67s/it, loss=0.0006, acc=0.9975, iter_time=7.64s]
Epoch 0: 13%|█▎ | 1618/12384 [3:26:35<22:55:24, 7.67s/it, loss=0.0003, acc=1.0000, iter_time=4.83s]
Epoch 0: 13%|█▎ | 1619/12384 [3:26:35<22:53:44, 7.66s/it, loss=0.0003, acc=1.0000, iter_time=4.83s]
Epoch 0: 13%|█▎ | 1619/12384 [3:26:42<22:53:44, 7.66s/it, loss=0.0040, acc=0.9900, iter_time=10.22s]
Epoch 0: 13%|█▎ | 1620/12384 [3:26:42<22:53:00, 7.65s/it, loss=0.0040, acc=0.9900, iter_time=10.22s]
Epoch 0: 13%|█▎ | 1620/12384 [3:26:50<22:53:00, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=4.39s]
Epoch 0: 13%|█▎ | 1621/12384 [3:26:50<22:52:43, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=4.39s]
Epoch 0: 13%|█▎ | 1621/12384 [3:26:58<22:52:43, 7.65s/it, loss=0.0013, acc=0.9965, iter_time=7.15s]
Epoch 0: 13%|█▎ | 1622/12384 [3:26:58<22:51:56, 7.65s/it, loss=0.0013, acc=0.9965, iter_time=7.15s]
Epoch 0: 13%|█▎ | 1622/12384 [3:27:05<22:51:56, 7.65s/it, loss=0.0041, acc=0.9894, iter_time=8.60s]
Epoch 0: 13%|█▎ | 1623/12384 [3:27:05<22:50:39, 7.64s/it, loss=0.0041, acc=0.9894, iter_time=8.60s]
Epoch 0: 13%|█▎ | 1623/12384 [3:27:13<22:50:39, 7.64s/it, loss=0.0009, acc=0.9983, iter_time=10.73s]
Epoch 0: 13%|█▎ | 1624/12384 [3:27:13<22:53:37, 7.66s/it, loss=0.0009, acc=0.9983, iter_time=10.73s]
Epoch 0: 13%|█▎ | 1624/12384 [3:27:21<22:53:37, 7.66s/it, loss=0.0004, acc=0.9989, iter_time=5.31s]
Epoch 0: 13%|█▎ | 1625/12384 [3:27:21<22:50:47, 7.64s/it, loss=0.0004, acc=0.9989, iter_time=5.31s]
Epoch 0: 13%|█▎ | 1625/12384 [3:27:28<22:50:47, 7.64s/it, loss=0.0005, acc=0.9993, iter_time=9.95s]
Epoch 0: 13%|█▎ | 1626/12384 [3:27:28<22:49:14, 7.64s/it, loss=0.0005, acc=0.9993, iter_time=9.95s]
Epoch 0: 13%|█▎ | 1626/12384 [3:27:36<22:49:14, 7.64s/it, loss=0.0032, acc=0.9947, iter_time=6.50s]
Epoch 0: 13%|█▎ | 1627/12384 [3:27:36<22:47:16, 7.63s/it, loss=0.0032, acc=0.9947, iter_time=6.50s]
Epoch 0: 13%|█▎ | 1627/12384 [3:27:43<22:47:16, 7.63s/it, loss=0.0011, acc=0.9979, iter_time=8.73s]
Epoch 0: 13%|█▎ | 1628/12384 [3:27:43<22:45:29, 7.62s/it, loss=0.0011, acc=0.9979, iter_time=8.73s]
Epoch 0: 13%|█▎ | 1628/12384 [3:27:51<22:45:29, 7.62s/it, loss=0.0011, acc=0.9975, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1629/12384 [3:27:51<22:44:32, 7.61s/it, loss=0.0011, acc=0.9975, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1629/12384 [3:27:59<22:44:32, 7.61s/it, loss=0.0002, acc=0.9999, iter_time=7.59s]
Epoch 0: 13%|█▎ | 1630/12384 [3:27:59<22:45:03, 7.62s/it, loss=0.0002, acc=0.9999, iter_time=7.59s]
Epoch 0: 13%|█▎ | 1630/12384 [3:28:06<22:45:03, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 13%|█▎ | 1631/12384 [3:28:06<22:45:05, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 13%|█▎ | 1631/12384 [3:28:14<22:45:05, 7.62s/it, loss=0.0061, acc=0.9873, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1632/12384 [3:28:14<22:46:33, 7.63s/it, loss=0.0061, acc=0.9873, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1632/12384 [3:28:22<22:46:33, 7.63s/it, loss=0.0006, acc=0.9977, iter_time=5.04s]
Epoch 0: 13%|█▎ | 1633/12384 [3:28:22<22:46:23, 7.63s/it, loss=0.0006, acc=0.9977, iter_time=5.04s]
Epoch 0: 13%|█▎ | 1633/12384 [3:28:29<22:46:23, 7.63s/it, loss=0.0004, acc=0.9996, iter_time=10.24s]
Epoch 0: 13%|█▎ | 1634/12384 [3:28:29<22:46:01, 7.62s/it, loss=0.0004, acc=0.9996, iter_time=10.24s]
Epoch 0: 13%|█▎ | 1634/12384 [3:28:37<22:46:01, 7.62s/it, loss=0.0006, acc=0.9991, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1635/12384 [3:28:37<22:45:36, 7.62s/it, loss=0.0006, acc=0.9991, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1635/12384 [3:28:44<22:45:36, 7.62s/it, loss=0.0010, acc=0.9962, iter_time=5.55s]
Epoch 0: 13%|█▎ | 1636/12384 [3:28:44<22:45:11, 7.62s/it, loss=0.0010, acc=0.9962, iter_time=5.55s]
Epoch 0: 13%|█▎ | 1636/12384 [3:28:52<22:45:11, 7.62s/it, loss=0.0028, acc=0.9894, iter_time=9.70s]
Epoch 0: 13%|█▎ | 1637/12384 [3:28:52<22:44:03, 7.62s/it, loss=0.0028, acc=0.9894, iter_time=9.70s]
Epoch 0: 13%|█▎ | 1637/12384 [3:29:00<22:44:03, 7.62s/it, loss=0.0014, acc=0.9971, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1638/12384 [3:29:00<22:44:45, 7.62s/it, loss=0.0014, acc=0.9971, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1638/12384 [3:29:08<22:44:45, 7.62s/it, loss=0.0010, acc=0.9967, iter_time=7.96s]
Epoch 0: 13%|█▎ | 1639/12384 [3:29:08<23:04:34, 7.73s/it, loss=0.0010, acc=0.9967, iter_time=7.96s]
Epoch 0: 13%|█▎ | 1639/12384 [3:29:15<23:04:34, 7.73s/it, loss=0.0004, acc=0.9998, iter_time=8.03s]
Epoch 0: 13%|█▎ | 1640/12384 [3:29:15<23:00:18, 7.71s/it, loss=0.0004, acc=0.9998, iter_time=8.03s]
Epoch 0: 13%|█▎ | 1640/12384 [3:29:23<23:00:18, 7.71s/it, loss=0.0013, acc=0.9970, iter_time=6.33s]
Epoch 0: 13%|█▎ | 1641/12384 [3:29:23<22:53:58, 7.67s/it, loss=0.0013, acc=0.9970, iter_time=6.33s]
Epoch 0: 13%|█▎ | 1641/12384 [3:29:30<22:53:58, 7.67s/it, loss=0.0004, acc=0.9979, iter_time=6.73s]
Epoch 0: 13%|█▎ | 1642/12384 [3:29:30<22:49:37, 7.65s/it, loss=0.0004, acc=0.9979, iter_time=6.73s]
Epoch 0: 13%|█▎ | 1642/12384 [3:29:38<22:49:37, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.34s]
Epoch 0: 13%|█▎ | 1643/12384 [3:29:38<22:47:35, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.34s]
Epoch 0: 13%|█▎ | 1643/12384 [3:29:46<22:47:35, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=5.84s]
Epoch 0: 13%|█▎ | 1644/12384 [3:29:46<22:47:35, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=5.84s]
Epoch 0: 13%|█▎ | 1644/12384 [3:29:53<22:47:35, 7.64s/it, loss=0.0009, acc=0.9970, iter_time=9.22s]
Epoch 0: 13%|█▎ | 1645/12384 [3:29:53<22:47:55, 7.64s/it, loss=0.0009, acc=0.9970, iter_time=9.22s]
Epoch 0: 13%|█▎ | 1645/12384 [3:30:01<22:47:55, 7.64s/it, loss=0.0016, acc=0.9929, iter_time=6.84s]
Epoch 0: 13%|█▎ | 1646/12384 [3:30:01<22:47:12, 7.64s/it, loss=0.0016, acc=0.9929, iter_time=6.84s]
Epoch 0: 13%|█▎ | 1646/12384 [3:30:09<22:47:12, 7.64s/it, loss=0.0028, acc=0.9952, iter_time=9.76s]
Epoch 0: 13%|█▎ | 1647/12384 [3:30:09<22:46:32, 7.64s/it, loss=0.0028, acc=0.9952, iter_time=9.76s]
Epoch 0: 13%|█▎ | 1647/12384 [3:30:16<22:46:32, 7.64s/it, loss=0.0043, acc=0.9931, iter_time=8.54s]
Epoch 0: 13%|█▎ | 1648/12384 [3:30:16<22:45:12, 7.63s/it, loss=0.0043, acc=0.9931, iter_time=8.54s]
Epoch 0: 13%|█▎ | 1648/12384 [3:30:24<22:45:12, 7.63s/it, loss=0.0085, acc=0.9804, iter_time=4.62s]
Epoch 0: 13%|█▎ | 1649/12384 [3:30:24<22:48:40, 7.65s/it, loss=0.0085, acc=0.9804, iter_time=4.62s]
Epoch 0: 13%|█▎ | 1649/12384 [3:30:32<22:48:40, 7.65s/it, loss=0.0005, acc=0.9961, iter_time=11.15s]
Epoch 0: 13%|█▎ | 1650/12384 [3:30:32<22:47:24, 7.64s/it, loss=0.0005, acc=0.9961, iter_time=11.15s]
Epoch 0: 13%|█▎ | 1650/12384 [3:30:39<22:47:24, 7.64s/it, loss=0.0027, acc=0.9919, iter_time=7.20s]
Epoch 0: 13%|█▎ | 1651/12384 [3:30:39<22:46:08, 7.64s/it, loss=0.0027, acc=0.9919, iter_time=7.20s]
Epoch 0: 13%|█▎ | 1651/12384 [3:30:47<22:46:08, 7.64s/it, loss=0.0033, acc=0.9895, iter_time=7.63s]
Epoch 0: 13%|█▎ | 1652/12384 [3:30:47<22:49:42, 7.66s/it, loss=0.0033, acc=0.9895, iter_time=7.63s]
Epoch 0: 13%|█▎ | 1652/12384 [3:30:55<22:49:42, 7.66s/it, loss=0.0012, acc=0.9998, iter_time=5.12s]
Epoch 0: 13%|█▎ | 1653/12384 [3:30:55<22:47:25, 7.65s/it, loss=0.0012, acc=0.9998, iter_time=5.12s]
Epoch 0: 13%|█▎ | 1653/12384 [3:31:02<22:47:25, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=8.16s]
Epoch 0: 13%|█▎ | 1654/12384 [3:31:02<22:45:15, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=8.16s]
Epoch 0: 13%|█▎ | 1654/12384 [3:31:10<22:45:15, 7.63s/it, loss=0.0006, acc=0.9980, iter_time=8.72s]
Epoch 0: 13%|█▎ | 1655/12384 [3:31:10<22:45:43, 7.64s/it, loss=0.0006, acc=0.9980, iter_time=8.72s]
Epoch 0: 13%|█▎ | 1655/12384 [3:31:17<22:45:43, 7.64s/it, loss=0.0014, acc=0.9987, iter_time=9.02s]
Epoch 0: 13%|█▎ | 1656/12384 [3:31:17<22:47:03, 7.65s/it, loss=0.0014, acc=0.9987, iter_time=9.02s]
Epoch 0: 13%|█▎ | 1656/12384 [3:31:25<22:47:03, 7.65s/it, loss=0.0010, acc=0.9989, iter_time=7.24s]
Epoch 0: 13%|█▎ | 1657/12384 [3:31:25<22:45:31, 7.64s/it, loss=0.0010, acc=0.9989, iter_time=7.24s]
Epoch 0: 13%|█▎ | 1657/12384 [3:31:33<22:45:31, 7.64s/it, loss=0.0026, acc=0.9958, iter_time=4.31s]
Epoch 0: 13%|█▎ | 1658/12384 [3:31:33<22:45:51, 7.64s/it, loss=0.0026, acc=0.9958, iter_time=4.31s]
Epoch 0: 13%|█▎ | 1658/12384 [3:31:40<22:45:51, 7.64s/it, loss=0.0015, acc=0.9970, iter_time=9.70s]
Epoch 0: 13%|█▎ | 1659/12384 [3:31:40<22:45:10, 7.64s/it, loss=0.0015, acc=0.9970, iter_time=9.70s]
Epoch 0: 13%|█▎ | 1659/12384 [3:31:48<22:45:10, 7.64s/it, loss=0.0010, acc=0.9990, iter_time=8.92s]
Epoch 0: 13%|█▎ | 1660/12384 [3:31:48<22:45:49, 7.64s/it, loss=0.0010, acc=0.9990, iter_time=8.92s]
Epoch 0: 13%|█▎ | 1660/12384 [3:31:56<22:45:49, 7.64s/it, loss=0.0003, acc=0.9995, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1661/12384 [3:31:56<22:45:47, 7.64s/it, loss=0.0003, acc=0.9995, iter_time=7.61s]
Epoch 0: 13%|█▎ | 1661/12384 [3:32:03<22:45:47, 7.64s/it, loss=0.0023, acc=0.9972, iter_time=7.63s]
Epoch 0: 13%|█▎ | 1662/12384 [3:32:03<22:44:21, 7.63s/it, loss=0.0023, acc=0.9972, iter_time=7.63s]
Epoch 0: 13%|█▎ | 1662/12384 [3:32:11<22:44:21, 7.63s/it, loss=0.0004, acc=0.9986, iter_time=7.63s]
Epoch 0: 13%|█▎ | 1663/12384 [3:32:11<22:43:25, 7.63s/it, loss=0.0004, acc=0.9986, iter_time=7.63s]
Epoch 0: 13%|█▎ | 1663/12384 [3:32:18<22:43:25, 7.63s/it, loss=0.0030, acc=0.9895, iter_time=8.00s]
Epoch 0: 13%|█▎ | 1664/12384 [3:32:18<22:42:33, 7.63s/it, loss=0.0030, acc=0.9895, iter_time=8.00s]
Epoch 0: 13%|█▎ | 1664/12384 [3:32:26<22:42:33, 7.63s/it, loss=0.0007, acc=0.9980, iter_time=6.28s]
Epoch 0: 13%|█▎ | 1665/12384 [3:32:26<23:03:26, 7.74s/it, loss=0.0007, acc=0.9980, iter_time=6.28s]
Epoch 0: 13%|█▎ | 1665/12384 [3:32:34<23:03:26, 7.74s/it, loss=0.0078, acc=0.9933, iter_time=8.98s]
Epoch 0: 13%|█▎ | 1666/12384 [3:32:34<22:57:53, 7.71s/it, loss=0.0078, acc=0.9933, iter_time=8.98s]
Epoch 0: 13%|█▎ | 1666/12384 [3:32:42<22:57:53, 7.71s/it, loss=0.0013, acc=0.9975, iter_time=7.62s]
Epoch 0: 13%|█▎ | 1667/12384 [3:32:42<22:53:18, 7.69s/it, loss=0.0013, acc=0.9975, iter_time=7.62s]
Epoch 0: 13%|█▎ | 1667/12384 [3:32:49<22:53:18, 7.69s/it, loss=0.0013, acc=0.9971, iter_time=7.64s]
Epoch 0: 13%|█▎ | 1668/12384 [3:32:49<22:48:25, 7.66s/it, loss=0.0013, acc=0.9971, iter_time=7.64s]
Epoch 0: 13%|█▎ | 1668/12384 [3:32:57<22:48:25, 7.66s/it, loss=0.0027, acc=0.9915, iter_time=7.60s]
Epoch 0: 13%|█▎ | 1669/12384 [3:32:57<22:46:03, 7.65s/it, loss=0.0027, acc=0.9915, iter_time=7.60s]
Epoch 0: 13%|█▎ | 1669/12384 [3:33:05<22:46:03, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=7.63s]
Epoch 0: 13%|█▎ | 1670/12384 [3:33:05<22:43:52, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=7.63s]
Epoch 0: 13%|█▎ | 1670/12384 [3:33:12<22:43:52, 7.64s/it, loss=0.0015, acc=0.9982, iter_time=5.26s]
Epoch 0: 13%|█▎ | 1671/12384 [3:33:12<22:44:01, 7.64s/it, loss=0.0015, acc=0.9982, iter_time=5.26s]
Epoch 0: 13%|█▎ | 1671/12384 [3:33:20<22:44:01, 7.64s/it, loss=0.0023, acc=0.9957, iter_time=10.36s]
Epoch 0: 14%|█▎ | 1672/12384 [3:33:20<22:43:54, 7.64s/it, loss=0.0023, acc=0.9957, iter_time=10.36s]
Epoch 0: 14%|█▎ | 1672/12384 [3:33:27<22:43:54, 7.64s/it, loss=0.0003, acc=0.9998, iter_time=7.24s]
Epoch 0: 14%|█▎ | 1673/12384 [3:33:27<22:42:38, 7.63s/it, loss=0.0003, acc=0.9998, iter_time=7.24s]
Epoch 0: 14%|█▎ | 1673/12384 [3:33:35<22:42:38, 7.63s/it, loss=0.0028, acc=0.9923, iter_time=7.63s]
Epoch 0: 14%|█▎ | 1674/12384 [3:33:35<22:41:35, 7.63s/it, loss=0.0028, acc=0.9923, iter_time=7.63s]
Epoch 0: 14%|█▎ | 1674/12384 [3:33:43<22:41:35, 7.63s/it, loss=0.0018, acc=0.9952, iter_time=3.87s]
Epoch 0: 14%|█▎ | 1675/12384 [3:33:43<22:42:51, 7.64s/it, loss=0.0018, acc=0.9952, iter_time=3.87s]
Epoch 0: 14%|█▎ | 1675/12384 [3:33:50<22:42:51, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=8.10s]
Epoch 0: 14%|█▎ | 1676/12384 [3:33:50<22:42:13, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=8.10s]
Epoch 0: 14%|█▎ | 1676/12384 [3:33:58<22:42:13, 7.63s/it, loss=0.0006, acc=0.9981, iter_time=9.72s]
Epoch 0: 14%|█▎ | 1677/12384 [3:33:58<22:40:57, 7.63s/it, loss=0.0006, acc=0.9981, iter_time=9.72s]
Epoch 0: 14%|█▎ | 1677/12384 [3:34:06<22:40:57, 7.63s/it, loss=0.0133, acc=0.9850, iter_time=8.82s]
Epoch 0: 14%|█▎ | 1678/12384 [3:34:06<22:39:33, 7.62s/it, loss=0.0133, acc=0.9850, iter_time=8.82s]
Epoch 0: 14%|█▎ | 1678/12384 [3:34:13<22:39:33, 7.62s/it, loss=0.0004, acc=0.9999, iter_time=7.62s]
Epoch 0: 14%|█▎ | 1679/12384 [3:34:13<22:40:00, 7.62s/it, loss=0.0004, acc=0.9999, iter_time=7.62s]
Epoch 0: 14%|█▎ | 1679/12384 [3:34:21<22:40:00, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=8.02s]
Epoch 0: 14%|█▎ | 1680/12384 [3:34:21<22:40:23, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=8.02s]
Epoch 0: 14%|█▎ | 1680/12384 [3:34:28<22:40:23, 7.63s/it, loss=0.0015, acc=0.9982, iter_time=6.12s]
Epoch 0: 14%|█▎ | 1681/12384 [3:34:28<22:40:11, 7.63s/it, loss=0.0015, acc=0.9982, iter_time=6.12s]
Epoch 0: 14%|█▎ | 1681/12384 [3:34:36<22:40:11, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=8.74s]
Epoch 0: 14%|█▎ | 1682/12384 [3:34:36<22:40:36, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=8.74s]
Epoch 0: 14%|█▎ | 1682/12384 [3:34:44<22:40:36, 7.63s/it, loss=0.0003, acc=0.9987, iter_time=7.63s]
Epoch 0: 14%|█▎ | 1683/12384 [3:34:44<22:39:50, 7.62s/it, loss=0.0003, acc=0.9987, iter_time=7.63s]
Epoch 0: 14%|█▎ | 1683/12384 [3:34:51<22:39:50, 7.62s/it, loss=0.0031, acc=0.9975, iter_time=7.63s]
Epoch 0: 14%|█▎ | 1684/12384 [3:34:51<22:40:31, 7.63s/it, loss=0.0031, acc=0.9975, iter_time=7.63s]
Epoch 0: 14%|█▎ | 1684/12384 [3:34:59<22:40:31, 7.63s/it, loss=0.0008, acc=0.9973, iter_time=6.47s]
Epoch 0: 14%|█▎ | 1685/12384 [3:34:59<22:40:01, 7.63s/it, loss=0.0008, acc=0.9973, iter_time=6.47s]
Epoch 0: 14%|█▎ | 1685/12384 [3:35:07<22:40:01, 7.63s/it, loss=0.0004, acc=1.0000, iter_time=8.78s]
Epoch 0: 14%|█▎ | 1686/12384 [3:35:07<22:39:20, 7.62s/it, loss=0.0004, acc=1.0000, iter_time=8.78s]
Epoch 0: 14%|█▎ | 1686/12384 [3:35:14<22:39:20, 7.62s/it, loss=0.0015, acc=0.9972, iter_time=7.08s]
Epoch 0: 14%|█▎ | 1687/12384 [3:35:14<22:40:44, 7.63s/it, loss=0.0015, acc=0.9972, iter_time=7.08s]
Epoch 0: 14%|█▎ | 1687/12384 [3:35:22<22:40:44, 7.63s/it, loss=0.0020, acc=0.9973, iter_time=8.55s]
Epoch 0: 14%|█▎ | 1688/12384 [3:35:22<22:38:06, 7.62s/it, loss=0.0020, acc=0.9973, iter_time=8.55s]
Epoch 0: 14%|█▎ | 1688/12384 [3:35:29<22:38:06, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.22s]
Epoch 0: 14%|█▎ | 1689/12384 [3:35:29<22:37:41, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.22s]
Epoch 0: 14%|█▎ | 1689/12384 [3:35:37<22:37:41, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 14%|█▎ | 1690/12384 [3:35:37<22:39:35, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 14%|█▎ | 1690/12384 [3:35:45<22:39:35, 7.63s/it, loss=0.0016, acc=0.9976, iter_time=7.97s]
Epoch 0: 14%|█▎ | 1691/12384 [3:35:45<22:58:02, 7.73s/it, loss=0.0016, acc=0.9976, iter_time=7.97s]
Epoch 0: 14%|█▎ | 1691/12384 [3:35:53<22:58:02, 7.73s/it, loss=0.0008, acc=0.9981, iter_time=7.68s]
Epoch 0: 14%|█▎ | 1692/12384 [3:35:53<22:52:25, 7.70s/it, loss=0.0008, acc=0.9981, iter_time=7.68s]
Epoch 0: 14%|█▎ | 1692/12384 [3:36:00<22:52:25, 7.70s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 14%|█▎ | 1693/12384 [3:36:00<22:49:08, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 14%|█▎ | 1693/12384 [3:36:08<22:49:08, 7.68s/it, loss=0.0006, acc=0.9978, iter_time=7.66s]
Epoch 0: 14%|█▎ | 1694/12384 [3:36:08<22:46:06, 7.67s/it, loss=0.0006, acc=0.9978, iter_time=7.66s]
Epoch 0: 14%|█▎ | 1694/12384 [3:36:16<22:46:06, 7.67s/it, loss=0.0032, acc=0.9913, iter_time=6.12s]
Epoch 0: 14%|█▎ | 1695/12384 [3:36:16<22:45:08, 7.66s/it, loss=0.0032, acc=0.9913, iter_time=6.12s]
Epoch 0: 14%|█▎ | 1695/12384 [3:36:23<22:45:08, 7.66s/it, loss=0.0004, acc=1.0000, iter_time=9.52s]
Epoch 0: 14%|█▎ | 1696/12384 [3:36:23<22:42:45, 7.65s/it, loss=0.0004, acc=1.0000, iter_time=9.52s]
Epoch 0: 14%|█▎ | 1696/12384 [3:36:31<22:42:45, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=6.32s]
Epoch 0: 14%|█▎ | 1697/12384 [3:36:31<22:45:55, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=6.32s]
Epoch 0: 14%|█▎ | 1697/12384 [3:36:39<22:45:55, 7.67s/it, loss=0.0022, acc=0.9965, iter_time=8.32s]
Epoch 0: 14%|█▎ | 1698/12384 [3:36:39<22:42:35, 7.65s/it, loss=0.0022, acc=0.9965, iter_time=8.32s]
Epoch 0: 14%|█▎ | 1698/12384 [3:36:46<22:42:35, 7.65s/it, loss=0.0006, acc=0.9975, iter_time=7.91s]
Epoch 0: 14%|█▎ | 1699/12384 [3:36:46<22:39:54, 7.64s/it, loss=0.0006, acc=0.9975, iter_time=7.91s]
Epoch 0: 14%|█▎ | 1699/12384 [3:36:54<22:39:54, 7.64s/it, loss=0.0003, acc=0.9982, iter_time=8.03s]
Epoch 0: 14%|█▎ | 1700/12384 [3:36:54<22:39:20, 7.63s/it, loss=0.0003, acc=0.9982, iter_time=8.03s]
Epoch 0: 14%|█▎ | 1700/12384 [3:37:01<22:39:20, 7.63s/it, loss=0.0024, acc=0.9943, iter_time=7.21s]
Epoch 0: 14%|█▎ | 1701/12384 [3:37:01<22:39:27, 7.64s/it, loss=0.0024, acc=0.9943, iter_time=7.21s]
Epoch 0: 14%|█▎ | 1701/12384 [3:37:09<22:39:27, 7.64s/it, loss=0.0011, acc=0.9969, iter_time=7.66s]
Epoch 0: 14%|█▎ | 1702/12384 [3:37:09<22:39:32, 7.64s/it, loss=0.0011, acc=0.9969, iter_time=7.66s]
Epoch 0: 14%|█▎ | 1702/12384 [3:37:17<22:39:32, 7.64s/it, loss=0.0010, acc=0.9969, iter_time=7.63s]
Epoch 0: 14%|█▍ | 1703/12384 [3:37:17<22:38:23, 7.63s/it, loss=0.0010, acc=0.9969, iter_time=7.63s]
Epoch 0: 14%|█▍ | 1703/12384 [3:37:24<22:38:23, 7.63s/it, loss=0.0017, acc=0.9983, iter_time=7.57s]
Epoch 0: 14%|█▍ | 1704/12384 [3:37:24<22:37:54, 7.63s/it, loss=0.0017, acc=0.9983, iter_time=7.57s]
Epoch 0: 14%|█▍ | 1704/12384 [3:37:32<22:37:54, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.13s]
Epoch 0: 14%|█▍ | 1705/12384 [3:37:32<22:37:02, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=7.13s]
Epoch 0: 14%|█▍ | 1705/12384 [3:37:40<22:37:02, 7.62s/it, loss=0.0007, acc=0.9984, iter_time=8.16s]
Epoch 0: 14%|█▍ | 1706/12384 [3:37:40<22:35:50, 7.62s/it, loss=0.0007, acc=0.9984, iter_time=8.16s]
Epoch 0: 14%|█▍ | 1706/12384 [3:37:47<22:35:50, 7.62s/it, loss=0.0011, acc=0.9977, iter_time=7.60s]
Epoch 0: 14%|█▍ | 1707/12384 [3:37:47<22:36:40, 7.62s/it, loss=0.0011, acc=0.9977, iter_time=7.60s]
Epoch 0: 14%|█▍ | 1707/12384 [3:37:55<22:36:40, 7.62s/it, loss=0.0027, acc=0.9970, iter_time=6.14s]
Epoch 0: 14%|█▍ | 1708/12384 [3:37:55<22:34:27, 7.61s/it, loss=0.0027, acc=0.9970, iter_time=6.14s]
Epoch 0: 14%|█▍ | 1708/12384 [3:38:02<22:34:27, 7.61s/it, loss=0.0005, acc=0.9982, iter_time=7.56s]
Epoch 0: 14%|█▍ | 1709/12384 [3:38:02<22:34:25, 7.61s/it, loss=0.0005, acc=0.9982, iter_time=7.56s]
Epoch 0: 14%|█▍ | 1709/12384 [3:38:10<22:34:25, 7.61s/it, loss=0.0014, acc=0.9979, iter_time=7.70s]
Epoch 0: 14%|█▍ | 1710/12384 [3:38:10<22:39:47, 7.64s/it, loss=0.0014, acc=0.9979, iter_time=7.70s]
Epoch 0: 14%|█▍ | 1710/12384 [3:38:18<22:39:47, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=7.37s]
Epoch 0: 14%|█▍ | 1711/12384 [3:38:18<22:37:40, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.37s]
Epoch 0: 14%|█▍ | 1711/12384 [3:38:25<22:37:40, 7.63s/it, loss=0.0045, acc=0.9931, iter_time=9.78s]
Epoch 0: 14%|█▍ | 1712/12384 [3:38:25<22:41:04, 7.65s/it, loss=0.0045, acc=0.9931, iter_time=9.78s]
Epoch 0: 14%|█▍ | 1712/12384 [3:38:33<22:41:04, 7.65s/it, loss=0.0008, acc=0.9988, iter_time=7.29s]
Epoch 0: 14%|█▍ | 1713/12384 [3:38:33<22:38:24, 7.64s/it, loss=0.0008, acc=0.9988, iter_time=7.29s]
Epoch 0: 14%|█▍ | 1713/12384 [3:38:41<22:38:24, 7.64s/it, loss=0.0005, acc=0.9997, iter_time=5.36s]
Epoch 0: 14%|█▍ | 1714/12384 [3:38:41<22:39:52, 7.65s/it, loss=0.0005, acc=0.9997, iter_time=5.36s]
Epoch 0: 14%|█▍ | 1714/12384 [3:38:48<22:39:52, 7.65s/it, loss=0.0007, acc=0.9960, iter_time=9.93s]
Epoch 0: 14%|█▍ | 1715/12384 [3:38:48<22:39:56, 7.65s/it, loss=0.0007, acc=0.9960, iter_time=9.93s]
Epoch 0: 14%|█▍ | 1715/12384 [3:38:56<22:39:56, 7.65s/it, loss=0.0005, acc=0.9988, iter_time=6.22s]
Epoch 0: 14%|█▍ | 1716/12384 [3:38:56<22:40:25, 7.65s/it, loss=0.0005, acc=0.9988, iter_time=6.22s]
Epoch 0: 14%|█▍ | 1716/12384 [3:39:04<22:40:25, 7.65s/it, loss=0.0004, acc=1.0000, iter_time=9.39s]
Epoch 0: 14%|█▍ | 1717/12384 [3:39:04<22:59:14, 7.76s/it, loss=0.0004, acc=1.0000, iter_time=9.39s]
Epoch 0: 14%|█▍ | 1717/12384 [3:39:12<22:59:14, 7.76s/it, loss=0.0009, acc=0.9999, iter_time=7.71s]
Epoch 0: 14%|█▍ | 1718/12384 [3:39:12<22:52:20, 7.72s/it, loss=0.0009, acc=0.9999, iter_time=7.71s]
Epoch 0: 14%|█▍ | 1718/12384 [3:39:19<22:52:20, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=4.34s]
Epoch 0: 14%|█▍ | 1719/12384 [3:39:19<22:46:00, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=4.34s]
Epoch 0: 14%|█▍ | 1719/12384 [3:39:27<22:46:00, 7.68s/it, loss=0.0013, acc=0.9983, iter_time=11.28s]
Epoch 0: 14%|█▍ | 1720/12384 [3:39:27<22:43:02, 7.67s/it, loss=0.0013, acc=0.9983, iter_time=11.28s]
Epoch 0: 14%|█▍ | 1720/12384 [3:39:34<22:43:02, 7.67s/it, loss=0.0039, acc=0.9931, iter_time=3.73s]
Epoch 0: 14%|█▍ | 1721/12384 [3:39:34<22:40:36, 7.66s/it, loss=0.0039, acc=0.9931, iter_time=3.73s]
Epoch 0: 14%|█▍ | 1721/12384 [3:39:42<22:40:36, 7.66s/it, loss=0.0003, acc=0.9998, iter_time=9.96s]
Epoch 0: 14%|█▍ | 1722/12384 [3:39:42<22:38:37, 7.65s/it, loss=0.0003, acc=0.9998, iter_time=9.96s]
Epoch 0: 14%|█▍ | 1722/12384 [3:39:50<22:38:37, 7.65s/it, loss=0.0128, acc=0.9713, iter_time=8.82s]
Epoch 0: 14%|█▍ | 1723/12384 [3:39:50<22:38:43, 7.65s/it, loss=0.0128, acc=0.9713, iter_time=8.82s]
Epoch 0: 14%|█▍ | 1723/12384 [3:39:57<22:38:43, 7.65s/it, loss=0.0003, acc=0.9998, iter_time=7.09s]
Epoch 0: 14%|█▍ | 1724/12384 [3:39:57<22:38:47, 7.65s/it, loss=0.0003, acc=0.9998, iter_time=7.09s]
Epoch 0: 14%|█▍ | 1724/12384 [3:40:05<22:38:47, 7.65s/it, loss=0.0010, acc=1.0000, iter_time=8.19s]
Epoch 0: 14%|█▍ | 1725/12384 [3:40:05<22:36:52, 7.64s/it, loss=0.0010, acc=1.0000, iter_time=8.19s]
Epoch 0: 14%|█▍ | 1725/12384 [3:40:13<22:36:52, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=5.31s]
Epoch 0: 14%|█▍ | 1726/12384 [3:40:13<22:36:05, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=5.31s]
Epoch 0: 14%|█▍ | 1726/12384 [3:40:20<22:36:05, 7.63s/it, loss=0.0012, acc=0.9972, iter_time=10.10s]
Epoch 0: 14%|█▍ | 1727/12384 [3:40:20<22:44:06, 7.68s/it, loss=0.0012, acc=0.9972, iter_time=10.10s]
Epoch 0: 14%|█▍ | 1727/12384 [3:40:28<22:44:06, 7.68s/it, loss=0.0022, acc=0.9962, iter_time=7.84s]
Epoch 0: 14%|█▍ | 1728/12384 [3:40:28<22:54:03, 7.74s/it, loss=0.0022, acc=0.9962, iter_time=7.84s]
Epoch 0: 14%|█▍ | 1728/12384 [3:40:36<22:54:03, 7.74s/it, loss=0.0008, acc=0.9980, iter_time=5.70s]
Epoch 0: 14%|█▍ | 1729/12384 [3:40:36<22:55:51, 7.75s/it, loss=0.0008, acc=0.9980, iter_time=5.70s]
Epoch 0: 14%|█▍ | 1729/12384 [3:40:44<22:55:51, 7.75s/it, loss=0.0006, acc=0.9994, iter_time=9.84s]
Epoch 0: 14%|█▍ | 1730/12384 [3:40:44<22:54:17, 7.74s/it, loss=0.0006, acc=0.9994, iter_time=9.84s]
Epoch 0: 14%|█▍ | 1730/12384 [3:40:52<22:54:17, 7.74s/it, loss=0.0007, acc=0.9983, iter_time=7.76s]
Epoch 0: 14%|█▍ | 1731/12384 [3:40:52<22:56:12, 7.75s/it, loss=0.0007, acc=0.9983, iter_time=7.76s]
Epoch 0: 14%|█▍ | 1731/12384 [3:40:59<22:56:12, 7.75s/it, loss=0.0012, acc=0.9969, iter_time=7.76s]
Epoch 0: 14%|█▍ | 1732/12384 [3:40:59<22:58:46, 7.77s/it, loss=0.0012, acc=0.9969, iter_time=7.76s]
Epoch 0: 14%|█▍ | 1732/12384 [3:41:07<22:58:46, 7.77s/it, loss=0.0001, acc=1.0000, iter_time=7.16s]
Epoch 0: 14%|█▍ | 1733/12384 [3:41:07<23:00:06, 7.77s/it, loss=0.0001, acc=1.0000, iter_time=7.16s]
Epoch 0: 14%|█▍ | 1733/12384 [3:41:15<23:00:06, 7.77s/it, loss=0.0001, acc=0.9998, iter_time=5.34s]
Epoch 0: 14%|█▍ | 1734/12384 [3:41:15<23:01:20, 7.78s/it, loss=0.0001, acc=0.9998, iter_time=5.34s]
Epoch 0: 14%|█▍ | 1734/12384 [3:41:23<23:01:20, 7.78s/it, loss=0.0016, acc=0.9975, iter_time=8.05s]
Epoch 0: 14%|█▍ | 1735/12384 [3:41:23<23:02:09, 7.79s/it, loss=0.0016, acc=0.9975, iter_time=8.05s]
Epoch 0: 14%|█▍ | 1735/12384 [3:41:31<23:02:09, 7.79s/it, loss=0.0017, acc=0.9965, iter_time=10.99s]
Epoch 0: 14%|█▍ | 1736/12384 [3:41:31<23:01:56, 7.79s/it, loss=0.0017, acc=0.9965, iter_time=10.99s]
Epoch 0: 14%|█▍ | 1736/12384 [3:41:38<23:01:56, 7.79s/it, loss=0.0003, acc=0.9999, iter_time=7.50s]
Epoch 0: 14%|█▍ | 1737/12384 [3:41:38<23:03:27, 7.80s/it, loss=0.0003, acc=0.9999, iter_time=7.50s]
Epoch 0: 14%|█▍ | 1737/12384 [3:41:46<23:03:27, 7.80s/it, loss=0.0001, acc=1.0000, iter_time=7.75s]
Epoch 0: 14%|█▍ | 1738/12384 [3:41:46<23:04:52, 7.81s/it, loss=0.0001, acc=1.0000, iter_time=7.75s]
Epoch 0: 14%|█▍ | 1738/12384 [3:41:54<23:04:52, 7.81s/it, loss=0.0006, acc=0.9982, iter_time=7.54s]
Epoch 0: 14%|█▍ | 1739/12384 [3:41:54<23:02:54, 7.79s/it, loss=0.0006, acc=0.9982, iter_time=7.54s]
Epoch 0: 14%|█▍ | 1739/12384 [3:42:02<23:02:54, 7.79s/it, loss=0.0007, acc=0.9994, iter_time=8.07s]
Epoch 0: 14%|█▍ | 1740/12384 [3:42:02<23:03:58, 7.80s/it, loss=0.0007, acc=0.9994, iter_time=8.07s]
Epoch 0: 14%|█▍ | 1740/12384 [3:42:10<23:03:58, 7.80s/it, loss=0.0002, acc=0.9998, iter_time=7.85s]
Epoch 0: 14%|█▍ | 1741/12384 [3:42:10<23:05:46, 7.81s/it, loss=0.0002, acc=0.9998, iter_time=7.85s]
Epoch 0: 14%|█▍ | 1741/12384 [3:42:17<23:05:46, 7.81s/it, loss=0.0039, acc=0.9914, iter_time=4.48s]
Epoch 0: 14%|█▍ | 1742/12384 [3:42:17<23:02:34, 7.80s/it, loss=0.0039, acc=0.9914, iter_time=4.48s]
Epoch 0: 14%|█▍ | 1742/12384 [3:42:25<23:02:34, 7.80s/it, loss=0.0001, acc=1.0000, iter_time=9.76s]
Epoch 0: 14%|█▍ | 1743/12384 [3:42:25<23:03:44, 7.80s/it, loss=0.0001, acc=1.0000, iter_time=9.76s]
Epoch 0: 14%|█▍ | 1743/12384 [3:42:33<23:03:44, 7.80s/it, loss=0.0023, acc=0.9954, iter_time=9.54s]
Epoch 0: 14%|█▍ | 1744/12384 [3:42:33<23:25:28, 7.93s/it, loss=0.0023, acc=0.9954, iter_time=9.54s]
Epoch 0: 14%|█▍ | 1744/12384 [3:42:41<23:25:28, 7.93s/it, loss=0.0022, acc=0.9948, iter_time=7.75s]
Epoch 0: 14%|█▍ | 1745/12384 [3:42:41<23:16:25, 7.88s/it, loss=0.0022, acc=0.9948, iter_time=7.75s]
Epoch 0: 14%|█▍ | 1745/12384 [3:42:49<23:16:25, 7.88s/it, loss=0.0006, acc=0.9994, iter_time=7.85s]
Epoch 0: 14%|█▍ | 1746/12384 [3:42:49<23:12:17, 7.85s/it, loss=0.0006, acc=0.9994, iter_time=7.85s]
Epoch 0: 14%|█▍ | 1746/12384 [3:42:57<23:12:17, 7.85s/it, loss=0.0018, acc=0.9937, iter_time=7.75s]
Epoch 0: 14%|█▍ | 1747/12384 [3:42:57<23:09:45, 7.84s/it, loss=0.0018, acc=0.9937, iter_time=7.75s]
Epoch 0: 14%|█▍ | 1747/12384 [3:43:05<23:09:45, 7.84s/it, loss=0.0006, acc=0.9974, iter_time=7.83s]
Epoch 0: 14%|█▍ | 1748/12384 [3:43:05<23:08:43, 7.83s/it, loss=0.0006, acc=0.9974, iter_time=7.83s]
Epoch 0: 14%|█▍ | 1748/12384 [3:43:12<23:08:43, 7.83s/it, loss=0.0024, acc=0.9947, iter_time=7.81s]
Epoch 0: 14%|█▍ | 1749/12384 [3:43:12<23:06:45, 7.82s/it, loss=0.0024, acc=0.9947, iter_time=7.81s]
Epoch 0: 14%|█▍ | 1749/12384 [3:43:20<23:06:45, 7.82s/it, loss=0.0003, acc=0.9999, iter_time=8.27s]
Epoch 0: 14%|█▍ | 1750/12384 [3:43:20<23:06:22, 7.82s/it, loss=0.0003, acc=0.9999, iter_time=8.27s]
Epoch 0: 14%|█▍ | 1750/12384 [3:43:28<23:06:22, 7.82s/it, loss=0.0006, acc=0.9997, iter_time=7.42s]
Epoch 0: 14%|█▍ | 1751/12384 [3:43:28<23:07:47, 7.83s/it, loss=0.0006, acc=0.9997, iter_time=7.42s]
Epoch 0: 14%|█▍ | 1751/12384 [3:43:36<23:07:47, 7.83s/it, loss=0.0003, acc=0.9993, iter_time=7.79s]
Epoch 0: 14%|█▍ | 1752/12384 [3:43:36<23:06:34, 7.82s/it, loss=0.0003, acc=0.9993, iter_time=7.79s]
Epoch 0: 14%|█▍ | 1752/12384 [3:43:44<23:06:34, 7.82s/it, loss=0.0001, acc=1.0000, iter_time=7.90s]
Epoch 0: 14%|█▍ | 1753/12384 [3:43:44<23:11:13, 7.85s/it, loss=0.0001, acc=1.0000, iter_time=7.90s]
Epoch 0: 14%|█▍ | 1753/12384 [3:43:52<23:11:13, 7.85s/it, loss=0.0024, acc=0.9939, iter_time=6.94s]
Epoch 0: 14%|█▍ | 1754/12384 [3:43:52<23:28:14, 7.95s/it, loss=0.0024, acc=0.9939, iter_time=6.94s]
Epoch 0: 14%|█▍ | 1754/12384 [3:44:00<23:28:14, 7.95s/it, loss=0.0014, acc=0.9977, iter_time=8.44s]
Epoch 0: 14%|█▍ | 1755/12384 [3:44:00<23:20:30, 7.91s/it, loss=0.0014, acc=0.9977, iter_time=8.44s]
Epoch 0: 14%|█▍ | 1755/12384 [3:44:08<23:20:30, 7.91s/it, loss=0.0008, acc=0.9980, iter_time=7.78s]
Epoch 0: 14%|█▍ | 1756/12384 [3:44:08<23:14:59, 7.88s/it, loss=0.0008, acc=0.9980, iter_time=7.78s]
Epoch 0: 14%|█▍ | 1756/12384 [3:44:16<23:14:59, 7.88s/it, loss=0.0001, acc=1.0000, iter_time=8.54s]
Epoch 0: 14%|█▍ | 1757/12384 [3:44:16<23:16:59, 7.89s/it, loss=0.0001, acc=1.0000, iter_time=8.54s]
Epoch 0: 14%|█▍ | 1757/12384 [3:44:23<23:16:59, 7.89s/it, loss=0.0002, acc=1.0000, iter_time=7.28s]
Epoch 0: 14%|█▍ | 1758/12384 [3:44:23<23:12:50, 7.86s/it, loss=0.0002, acc=1.0000, iter_time=7.28s]
Epoch 0: 14%|█▍ | 1758/12384 [3:44:31<23:12:50, 7.86s/it, loss=0.0007, acc=0.9974, iter_time=8.09s]
Epoch 0: 14%|█▍ | 1759/12384 [3:44:31<23:12:35, 7.86s/it, loss=0.0007, acc=0.9974, iter_time=8.09s]
Epoch 0: 14%|█▍ | 1759/12384 [3:44:39<23:12:35, 7.86s/it, loss=0.0018, acc=0.9956, iter_time=8.11s]
Epoch 0: 14%|█▍ | 1760/12384 [3:44:39<23:09:14, 7.85s/it, loss=0.0018, acc=0.9956, iter_time=8.11s]
Epoch 0: 14%|█▍ | 1760/12384 [3:44:47<23:09:14, 7.85s/it, loss=0.0004, acc=0.9991, iter_time=5.90s]
Epoch 0: 14%|█▍ | 1761/12384 [3:44:47<23:19:35, 7.91s/it, loss=0.0004, acc=0.9991, iter_time=5.90s]
Epoch 0: 14%|█▍ | 1761/12384 [3:44:55<23:19:35, 7.91s/it, loss=0.0005, acc=0.9976, iter_time=8.25s]
Epoch 0: 14%|█▍ | 1762/12384 [3:44:55<23:12:07, 7.86s/it, loss=0.0005, acc=0.9976, iter_time=8.25s]
Epoch 0: 14%|█▍ | 1762/12384 [3:45:03<23:12:07, 7.86s/it, loss=0.0002, acc=1.0000, iter_time=9.50s]
Epoch 0: 14%|█▍ | 1763/12384 [3:45:03<23:09:11, 7.85s/it, loss=0.0002, acc=1.0000, iter_time=9.50s]
Epoch 0: 14%|█▍ | 1763/12384 [3:45:10<23:09:11, 7.85s/it, loss=0.0007, acc=0.9982, iter_time=4.94s]
Epoch 0: 14%|█▍ | 1764/12384 [3:45:10<23:08:14, 7.84s/it, loss=0.0007, acc=0.9982, iter_time=4.94s]
Epoch 0: 14%|█▍ | 1764/12384 [3:45:18<23:08:14, 7.84s/it, loss=0.0006, acc=0.9982, iter_time=10.69s]
Epoch 0: 14%|█▍ | 1765/12384 [3:45:18<23:08:06, 7.84s/it, loss=0.0006, acc=0.9982, iter_time=10.69s]
Epoch 0: 14%|█▍ | 1765/12384 [3:45:26<23:08:06, 7.84s/it, loss=0.0001, acc=1.0000, iter_time=5.71s]
Epoch 0: 14%|█▍ | 1766/12384 [3:45:26<23:06:33, 7.84s/it, loss=0.0001, acc=1.0000, iter_time=5.71s]
Epoch 0: 14%|█▍ | 1766/12384 [3:45:34<23:06:33, 7.84s/it, loss=0.0002, acc=0.9998, iter_time=9.05s]
Epoch 0: 14%|█▍ | 1767/12384 [3:45:34<23:05:36, 7.83s/it, loss=0.0002, acc=0.9998, iter_time=9.05s]
Epoch 0: 14%|█▍ | 1767/12384 [3:45:42<23:05:36, 7.83s/it, loss=0.0001, acc=1.0000, iter_time=9.10s]
Epoch 0: 14%|█▍ | 1768/12384 [3:45:42<23:08:10, 7.85s/it, loss=0.0001, acc=1.0000, iter_time=9.10s]
Epoch 0: 14%|█▍ | 1768/12384 [3:45:50<23:08:10, 7.85s/it, loss=0.0003, acc=0.9994, iter_time=6.85s]
Epoch 0: 14%|█▍ | 1769/12384 [3:45:50<23:04:41, 7.83s/it, loss=0.0003, acc=0.9994, iter_time=6.85s]
Epoch 0: 14%|█▍ | 1769/12384 [3:45:58<23:04:41, 7.83s/it, loss=0.0004, acc=0.9997, iter_time=8.80s]
Epoch 0: 14%|█▍ | 1770/12384 [3:45:58<23:24:37, 7.94s/it, loss=0.0004, acc=0.9997, iter_time=8.80s]
Epoch 0: 14%|█▍ | 1770/12384 [3:46:06<23:24:37, 7.94s/it, loss=0.0004, acc=0.9998, iter_time=7.86s]
Epoch 0: 14%|█▍ | 1771/12384 [3:46:06<23:16:48, 7.90s/it, loss=0.0004, acc=0.9998, iter_time=7.86s]
Epoch 0: 14%|█▍ | 1771/12384 [3:46:13<23:16:48, 7.90s/it, loss=0.0007, acc=0.9953, iter_time=7.87s]
Epoch 0: 14%|█▍ | 1772/12384 [3:46:13<23:17:09, 7.90s/it, loss=0.0007, acc=0.9953, iter_time=7.87s]
Epoch 0: 14%|█▍ | 1772/12384 [3:46:21<23:17:09, 7.90s/it, loss=0.0025, acc=0.9956, iter_time=7.79s]
Epoch 0: 14%|█▍ | 1773/12384 [3:46:21<23:16:44, 7.90s/it, loss=0.0025, acc=0.9956, iter_time=7.79s]
Epoch 0: 14%|█▍ | 1773/12384 [3:46:29<23:16:44, 7.90s/it, loss=0.0004, acc=1.0000, iter_time=7.95s]
Epoch 0: 14%|█▍ | 1774/12384 [3:46:29<23:12:54, 7.88s/it, loss=0.0004, acc=1.0000, iter_time=7.95s]
Epoch 0: 14%|█▍ | 1774/12384 [3:46:37<23:12:54, 7.88s/it, loss=0.0030, acc=0.9984, iter_time=6.09s]
Epoch 0: 14%|█▍ | 1775/12384 [3:46:37<23:08:46, 7.85s/it, loss=0.0030, acc=0.9984, iter_time=6.09s]
Epoch 0: 14%|█▍ | 1775/12384 [3:46:45<23:08:46, 7.85s/it, loss=0.0011, acc=0.9989, iter_time=9.50s]
Epoch 0: 14%|█▍ | 1776/12384 [3:46:45<23:07:33, 7.85s/it, loss=0.0011, acc=0.9989, iter_time=9.50s]
Epoch 0: 14%|█▍ | 1776/12384 [3:46:53<23:07:33, 7.85s/it, loss=0.0014, acc=0.9959, iter_time=7.89s]
Epoch 0: 14%|█▍ | 1777/12384 [3:46:53<23:06:48, 7.84s/it, loss=0.0014, acc=0.9959, iter_time=7.89s]
Epoch 0: 14%|█▍ | 1777/12384 [3:47:01<23:06:48, 7.84s/it, loss=0.0004, acc=1.0000, iter_time=7.80s]
Epoch 0: 14%|█▍ | 1778/12384 [3:47:01<23:08:36, 7.86s/it, loss=0.0004, acc=1.0000, iter_time=7.80s]
Epoch 0: 14%|█▍ | 1778/12384 [3:47:08<23:08:36, 7.86s/it, loss=0.0004, acc=0.9999, iter_time=7.94s]
Epoch 0: 14%|█▍ | 1779/12384 [3:47:08<23:09:00, 7.86s/it, loss=0.0004, acc=0.9999, iter_time=7.94s]
Epoch 0: 14%|█▍ | 1779/12384 [3:47:16<23:09:00, 7.86s/it, loss=0.0003, acc=0.9998, iter_time=7.16s]
Epoch 0: 14%|█▍ | 1780/12384 [3:47:16<23:04:48, 7.84s/it, loss=0.0003, acc=0.9998, iter_time=7.16s]
Epoch 0: 14%|█▍ | 1780/12384 [3:47:24<23:04:48, 7.84s/it, loss=0.0029, acc=0.9959, iter_time=8.36s]
Epoch 0: 14%|█▍ | 1781/12384 [3:47:24<23:02:08, 7.82s/it, loss=0.0029, acc=0.9959, iter_time=8.36s]
Epoch 0: 14%|█▍ | 1781/12384 [3:47:32<23:02:08, 7.82s/it, loss=0.0003, acc=0.9996, iter_time=7.17s]
Epoch 0: 14%|█▍ | 1782/12384 [3:47:32<23:00:41, 7.81s/it, loss=0.0003, acc=0.9996, iter_time=7.17s]
Epoch 0: 14%|█▍ | 1782/12384 [3:47:40<23:00:41, 7.81s/it, loss=0.0002, acc=0.9990, iter_time=8.58s]
Epoch 0: 14%|█▍ | 1783/12384 [3:47:40<23:04:46, 7.84s/it, loss=0.0002, acc=0.9990, iter_time=8.58s]
Epoch 0: 14%|█▍ | 1783/12384 [3:47:47<23:04:46, 7.84s/it, loss=0.0015, acc=0.9984, iter_time=7.61s]
Epoch 0: 14%|█▍ | 1784/12384 [3:47:47<22:55:30, 7.79s/it, loss=0.0015, acc=0.9984, iter_time=7.61s]
Epoch 0: 14%|█▍ | 1784/12384 [3:47:55<22:55:30, 7.79s/it, loss=0.0077, acc=0.9807, iter_time=7.64s]
Epoch 0: 14%|█▍ | 1785/12384 [3:47:55<22:46:32, 7.74s/it, loss=0.0077, acc=0.9807, iter_time=7.64s]
Epoch 0: 14%|█▍ | 1785/12384 [3:48:03<22:46:32, 7.74s/it, loss=0.0001, acc=1.0000, iter_time=6.46s]
Epoch 0: 14%|█▍ | 1786/12384 [3:48:03<22:41:12, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=6.46s]
Epoch 0: 14%|█▍ | 1786/12384 [3:48:10<22:41:12, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=5.22s]
Epoch 0: 14%|█▍ | 1787/12384 [3:48:10<22:38:02, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=5.22s]
Epoch 0: 14%|█▍ | 1787/12384 [3:48:18<22:38:02, 7.69s/it, loss=0.0005, acc=0.9996, iter_time=10.07s]
Epoch 0: 14%|█▍ | 1788/12384 [3:48:18<22:35:55, 7.68s/it, loss=0.0005, acc=0.9996, iter_time=10.07s]
Epoch 0: 14%|█▍ | 1788/12384 [3:48:26<22:35:55, 7.68s/it, loss=0.0015, acc=0.9947, iter_time=8.82s]
Epoch 0: 14%|█▍ | 1789/12384 [3:48:26<22:31:41, 7.65s/it, loss=0.0015, acc=0.9947, iter_time=8.82s]
Epoch 0: 14%|█▍ | 1789/12384 [3:48:33<22:31:41, 7.65s/it, loss=0.0004, acc=1.0000, iter_time=7.62s]
Epoch 0: 14%|█▍ | 1790/12384 [3:48:33<22:30:12, 7.65s/it, loss=0.0004, acc=1.0000, iter_time=7.62s]
Epoch 0: 14%|█▍ | 1790/12384 [3:48:41<22:30:12, 7.65s/it, loss=0.0006, acc=0.9992, iter_time=7.64s]
Epoch 0: 14%|█▍ | 1791/12384 [3:48:41<22:29:33, 7.64s/it, loss=0.0006, acc=0.9992, iter_time=7.64s]
Epoch 0: 14%|█▍ | 1791/12384 [3:48:48<22:29:33, 7.64s/it, loss=0.0028, acc=0.9943, iter_time=8.02s]
Epoch 0: 14%|█▍ | 1792/12384 [3:48:48<22:33:12, 7.67s/it, loss=0.0028, acc=0.9943, iter_time=8.02s]
Epoch 0: 14%|█▍ | 1792/12384 [3:48:56<22:33:12, 7.67s/it, loss=0.0006, acc=0.9999, iter_time=7.32s]
Epoch 0: 14%|█▍ | 1793/12384 [3:48:56<22:30:13, 7.65s/it, loss=0.0006, acc=0.9999, iter_time=7.32s]
Epoch 0: 14%|█▍ | 1793/12384 [3:49:04<22:30:13, 7.65s/it, loss=0.0009, acc=0.9980, iter_time=5.63s]
Epoch 0: 14%|█▍ | 1794/12384 [3:49:04<22:31:36, 7.66s/it, loss=0.0009, acc=0.9980, iter_time=5.63s]
Epoch 0: 14%|█▍ | 1794/12384 [3:49:12<22:31:36, 7.66s/it, loss=0.0004, acc=0.9986, iter_time=9.79s]
Epoch 0: 14%|█▍ | 1795/12384 [3:49:12<22:35:26, 7.68s/it, loss=0.0004, acc=0.9986, iter_time=9.79s]
Epoch 0: 14%|█▍ | 1795/12384 [3:49:19<22:35:26, 7.68s/it, loss=0.0036, acc=0.9935, iter_time=7.61s]
Epoch 0: 15%|█▍ | 1796/12384 [3:49:19<22:31:52, 7.66s/it, loss=0.0036, acc=0.9935, iter_time=7.61s]
Epoch 0: 15%|█▍ | 1796/12384 [3:49:27<22:31:52, 7.66s/it, loss=0.0019, acc=0.9972, iter_time=6.20s]
Epoch 0: 15%|█▍ | 1797/12384 [3:49:27<22:52:26, 7.78s/it, loss=0.0019, acc=0.9972, iter_time=6.20s]
Epoch 0: 15%|█▍ | 1797/12384 [3:49:35<22:52:26, 7.78s/it, loss=0.0027, acc=0.9931, iter_time=7.16s]
Epoch 0: 15%|█▍ | 1798/12384 [3:49:35<22:45:24, 7.74s/it, loss=0.0027, acc=0.9931, iter_time=7.16s]
Epoch 0: 15%|█▍ | 1798/12384 [3:49:42<22:45:24, 7.74s/it, loss=0.0003, acc=1.0000, iter_time=8.44s]
Epoch 0: 15%|█▍ | 1799/12384 [3:49:42<22:39:07, 7.70s/it, loss=0.0003, acc=1.0000, iter_time=8.44s]
Epoch 0: 15%|█▍ | 1799/12384 [3:49:50<22:39:07, 7.70s/it, loss=0.0003, acc=1.0000, iter_time=9.64s]
Epoch 0: 15%|█▍ | 1800/12384 [3:49:50<22:40:22, 7.71s/it, loss=0.0003, acc=1.0000, iter_time=9.64s]
Epoch 0: 15%|█▍ | 1800/12384 [3:49:58<22:40:22, 7.71s/it, loss=0.0003, acc=0.9998, iter_time=7.23s]
Epoch 0: 15%|█▍ | 1801/12384 [3:49:58<22:41:26, 7.72s/it, loss=0.0003, acc=0.9998, iter_time=7.23s]
Epoch 0: 15%|█▍ | 1801/12384 [3:50:06<22:41:26, 7.72s/it, loss=0.0002, acc=0.9978, iter_time=6.78s]
Epoch 0: 15%|█▍ | 1802/12384 [3:50:06<22:36:15, 7.69s/it, loss=0.0002, acc=0.9978, iter_time=6.78s]
Epoch 0: 15%|█▍ | 1802/12384 [3:50:13<22:36:15, 7.69s/it, loss=0.0006, acc=0.9969, iter_time=7.07s]
Epoch 0: 15%|█▍ | 1803/12384 [3:50:13<22:35:02, 7.68s/it, loss=0.0006, acc=0.9969, iter_time=7.07s]
Epoch 0: 15%|█▍ | 1803/12384 [3:50:21<22:35:02, 7.68s/it, loss=0.0010, acc=0.9975, iter_time=9.16s]
Epoch 0: 15%|█▍ | 1804/12384 [3:50:21<22:33:40, 7.68s/it, loss=0.0010, acc=0.9975, iter_time=9.16s]
Epoch 0: 15%|█▍ | 1804/12384 [3:50:28<22:33:40, 7.68s/it, loss=0.0005, acc=0.9983, iter_time=7.37s]
Epoch 0: 15%|█▍ | 1805/12384 [3:50:28<22:30:29, 7.66s/it, loss=0.0005, acc=0.9983, iter_time=7.37s]
Epoch 0: 15%|█▍ | 1805/12384 [3:50:36<22:30:29, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 15%|█▍ | 1806/12384 [3:50:36<22:30:26, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 15%|█▍ | 1806/12384 [3:50:44<22:30:26, 7.66s/it, loss=0.0006, acc=0.9973, iter_time=8.08s]
Epoch 0: 15%|█▍ | 1807/12384 [3:50:44<22:36:42, 7.70s/it, loss=0.0006, acc=0.9973, iter_time=8.08s]
Epoch 0: 15%|█▍ | 1807/12384 [3:50:52<22:36:42, 7.70s/it, loss=0.0022, acc=0.9913, iter_time=8.05s]
Epoch 0: 15%|█▍ | 1808/12384 [3:50:52<22:33:57, 7.68s/it, loss=0.0022, acc=0.9913, iter_time=8.05s]
Epoch 0: 15%|█▍ | 1808/12384 [3:50:59<22:33:57, 7.68s/it, loss=0.0011, acc=0.9975, iter_time=7.30s]
Epoch 0: 15%|█▍ | 1809/12384 [3:50:59<22:32:59, 7.68s/it, loss=0.0011, acc=0.9975, iter_time=7.30s]
Epoch 0: 15%|█▍ | 1809/12384 [3:51:07<22:32:59, 7.68s/it, loss=0.0002, acc=0.9998, iter_time=7.61s]
Epoch 0: 15%|█▍ | 1810/12384 [3:51:07<22:29:42, 7.66s/it, loss=0.0002, acc=0.9998, iter_time=7.61s]
Epoch 0: 15%|█▍ | 1810/12384 [3:51:14<22:29:42, 7.66s/it, loss=0.0033, acc=0.9906, iter_time=7.63s]
Epoch 0: 15%|█▍ | 1811/12384 [3:51:14<22:28:04, 7.65s/it, loss=0.0033, acc=0.9906, iter_time=7.63s]
Epoch 0: 15%|█▍ | 1811/12384 [3:51:22<22:28:04, 7.65s/it, loss=0.0009, acc=0.9976, iter_time=7.66s]
Epoch 0: 15%|█▍ | 1812/12384 [3:51:22<22:27:44, 7.65s/it, loss=0.0009, acc=0.9976, iter_time=7.66s]
Epoch 0: 15%|█▍ | 1812/12384 [3:51:30<22:27:44, 7.65s/it, loss=0.0002, acc=0.9999, iter_time=7.63s]
Epoch 0: 15%|█▍ | 1813/12384 [3:51:30<22:27:28, 7.65s/it, loss=0.0002, acc=0.9999, iter_time=7.63s]
Epoch 0: 15%|█▍ | 1813/12384 [3:51:37<22:27:28, 7.65s/it, loss=0.0015, acc=1.0000, iter_time=7.62s]
Epoch 0: 15%|█▍ | 1814/12384 [3:51:37<22:25:19, 7.64s/it, loss=0.0015, acc=1.0000, iter_time=7.62s]
Epoch 0: 15%|█▍ | 1814/12384 [3:51:45<22:25:19, 7.64s/it, loss=0.0005, acc=0.9999, iter_time=7.72s]
Epoch 0: 15%|█▍ | 1815/12384 [3:51:45<22:33:20, 7.68s/it, loss=0.0005, acc=0.9999, iter_time=7.72s]
Epoch 0: 15%|█▍ | 1815/12384 [3:51:53<22:33:20, 7.68s/it, loss=0.0013, acc=0.9975, iter_time=8.07s]
Epoch 0: 15%|█▍ | 1816/12384 [3:51:53<22:29:58, 7.66s/it, loss=0.0013, acc=0.9975, iter_time=8.07s]
Epoch 0: 15%|█▍ | 1816/12384 [3:52:00<22:29:58, 7.66s/it, loss=0.0018, acc=0.9935, iter_time=7.23s]
Epoch 0: 15%|█▍ | 1817/12384 [3:52:00<22:27:13, 7.65s/it, loss=0.0018, acc=0.9935, iter_time=7.23s]
Epoch 0: 15%|█▍ | 1817/12384 [3:52:08<22:27:13, 7.65s/it, loss=0.0002, acc=0.9998, iter_time=7.63s]
Epoch 0: 15%|█▍ | 1818/12384 [3:52:08<22:26:06, 7.64s/it, loss=0.0002, acc=0.9998, iter_time=7.63s]
Epoch 0: 15%|█▍ | 1818/12384 [3:52:16<22:26:06, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.39s]
Epoch 0: 15%|█▍ | 1819/12384 [3:52:16<22:24:22, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.39s]
Epoch 0: 15%|█▍ | 1819/12384 [3:52:23<22:24:22, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.86s]
Epoch 0: 15%|█▍ | 1820/12384 [3:52:23<22:23:22, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.86s]
Epoch 0: 15%|█▍ | 1820/12384 [3:52:31<22:23:22, 7.63s/it, loss=0.0008, acc=0.9997, iter_time=7.63s]
Epoch 0: 15%|█▍ | 1821/12384 [3:52:31<22:25:28, 7.64s/it, loss=0.0008, acc=0.9997, iter_time=7.63s]
Epoch 0: 15%|█▍ | 1821/12384 [3:52:39<22:25:28, 7.64s/it, loss=0.0005, acc=0.9979, iter_time=7.67s]
Epoch 0: 15%|█▍ | 1822/12384 [3:52:39<22:25:30, 7.64s/it, loss=0.0005, acc=0.9979, iter_time=7.67s]
Epoch 0: 15%|█▍ | 1822/12384 [3:52:47<22:25:30, 7.64s/it, loss=0.0032, acc=0.9905, iter_time=7.32s]
Epoch 0: 15%|█▍ | 1823/12384 [3:52:47<22:45:21, 7.76s/it, loss=0.0032, acc=0.9905, iter_time=7.32s]
Epoch 0: 15%|█▍ | 1823/12384 [3:52:54<22:45:21, 7.76s/it, loss=0.0001, acc=1.0000, iter_time=8.71s]
Epoch 0: 15%|█▍ | 1824/12384 [3:52:54<22:42:28, 7.74s/it, loss=0.0001, acc=1.0000, iter_time=8.71s]
Epoch 0: 15%|█▍ | 1824/12384 [3:53:02<22:42:28, 7.74s/it, loss=0.0006, acc=0.9988, iter_time=7.32s]
Epoch 0: 15%|█▍ | 1825/12384 [3:53:02<22:36:33, 7.71s/it, loss=0.0006, acc=0.9988, iter_time=7.32s]
Epoch 0: 15%|█▍ | 1825/12384 [3:53:10<22:36:33, 7.71s/it, loss=0.0020, acc=0.9928, iter_time=7.64s]
Epoch 0: 15%|█▍ | 1826/12384 [3:53:10<22:31:40, 7.68s/it, loss=0.0020, acc=0.9928, iter_time=7.64s]
Epoch 0: 15%|█▍ | 1826/12384 [3:53:17<22:31:40, 7.68s/it, loss=0.0028, acc=0.9947, iter_time=7.61s]
Epoch 0: 15%|█▍ | 1827/12384 [3:53:17<22:29:02, 7.67s/it, loss=0.0028, acc=0.9947, iter_time=7.61s]
Epoch 0: 15%|█▍ | 1827/12384 [3:53:25<22:29:02, 7.67s/it, loss=0.0008, acc=0.9974, iter_time=5.63s]
Epoch 0: 15%|█▍ | 1828/12384 [3:53:25<22:31:10, 7.68s/it, loss=0.0008, acc=0.9974, iter_time=5.63s]
Epoch 0: 15%|█▍ | 1828/12384 [3:53:33<22:31:10, 7.68s/it, loss=0.0004, acc=0.9997, iter_time=9.71s]
Epoch 0: 15%|█▍ | 1829/12384 [3:53:33<22:28:01, 7.66s/it, loss=0.0004, acc=0.9997, iter_time=9.71s]
Epoch 0: 15%|█▍ | 1829/12384 [3:53:40<22:28:01, 7.66s/it, loss=0.0006, acc=1.0000, iter_time=6.44s]
Epoch 0: 15%|█▍ | 1830/12384 [3:53:40<22:27:40, 7.66s/it, loss=0.0006, acc=1.0000, iter_time=6.44s]
Epoch 0: 15%|█▍ | 1830/12384 [3:53:48<22:27:40, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=8.96s]
Epoch 0: 15%|█▍ | 1831/12384 [3:53:48<22:30:49, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=8.96s]
Epoch 0: 15%|█▍ | 1831/12384 [3:53:56<22:30:49, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=7.57s]
Epoch 0: 15%|█▍ | 1832/12384 [3:53:56<22:27:57, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.57s]
Epoch 0: 15%|█▍ | 1832/12384 [3:54:03<22:27:57, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=6.47s]
Epoch 0: 15%|█▍ | 1833/12384 [3:54:03<22:26:22, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=6.47s]
Epoch 0: 15%|█▍ | 1833/12384 [3:54:11<22:26:22, 7.66s/it, loss=0.0003, acc=0.9999, iter_time=8.85s]
Epoch 0: 15%|█▍ | 1834/12384 [3:54:11<22:24:13, 7.64s/it, loss=0.0003, acc=0.9999, iter_time=8.85s]
Epoch 0: 15%|█▍ | 1834/12384 [3:54:18<22:24:13, 7.64s/it, loss=0.0005, acc=0.9994, iter_time=6.38s]
Epoch 0: 15%|█▍ | 1835/12384 [3:54:18<22:23:38, 7.64s/it, loss=0.0005, acc=0.9994, iter_time=6.38s]
Epoch 0: 15%|█▍ | 1835/12384 [3:54:26<22:23:38, 7.64s/it, loss=0.0016, acc=0.9992, iter_time=8.55s]
Epoch 0: 15%|█▍ | 1836/12384 [3:54:26<22:19:57, 7.62s/it, loss=0.0016, acc=0.9992, iter_time=8.55s]
Epoch 0: 15%|█▍ | 1836/12384 [3:54:34<22:19:57, 7.62s/it, loss=0.0005, acc=1.0000, iter_time=7.97s]
Epoch 0: 15%|█▍ | 1837/12384 [3:54:34<22:23:53, 7.65s/it, loss=0.0005, acc=1.0000, iter_time=7.97s]
Epoch 0: 15%|█▍ | 1837/12384 [3:54:41<22:23:53, 7.65s/it, loss=0.0013, acc=0.9972, iter_time=7.60s]
Epoch 0: 15%|█▍ | 1838/12384 [3:54:41<22:22:03, 7.64s/it, loss=0.0013, acc=0.9972, iter_time=7.60s]
Epoch 0: 15%|█▍ | 1838/12384 [3:54:49<22:22:03, 7.64s/it, loss=0.0014, acc=0.9968, iter_time=5.35s]
Epoch 0: 15%|█▍ | 1839/12384 [3:54:49<22:20:34, 7.63s/it, loss=0.0014, acc=0.9968, iter_time=5.35s]
Epoch 0: 15%|█▍ | 1839/12384 [3:54:57<22:20:34, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=9.87s]
Epoch 0: 15%|█▍ | 1840/12384 [3:54:57<22:21:24, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=9.87s]
Epoch 0: 15%|█▍ | 1840/12384 [3:55:04<22:21:24, 7.63s/it, loss=0.0005, acc=0.9995, iter_time=6.70s]
Epoch 0: 15%|█▍ | 1841/12384 [3:55:04<22:21:49, 7.64s/it, loss=0.0005, acc=0.9995, iter_time=6.70s]
Epoch 0: 15%|█▍ | 1841/12384 [3:55:12<22:21:49, 7.64s/it, loss=0.0005, acc=0.9996, iter_time=8.60s]
Epoch 0: 15%|█▍ | 1842/12384 [3:55:12<22:19:42, 7.62s/it, loss=0.0005, acc=0.9996, iter_time=8.60s]
Epoch 0: 15%|█▍ | 1842/12384 [3:55:19<22:19:42, 7.62s/it, loss=0.0021, acc=0.9944, iter_time=5.26s]
Epoch 0: 15%|█▍ | 1843/12384 [3:55:19<22:20:46, 7.63s/it, loss=0.0021, acc=0.9944, iter_time=5.26s]
Epoch 0: 15%|█▍ | 1843/12384 [3:55:27<22:20:46, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.13s]
Epoch 0: 15%|█▍ | 1844/12384 [3:55:27<22:21:45, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.13s]
Epoch 0: 15%|█▍ | 1844/12384 [3:55:35<22:21:45, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=8.42s]
Epoch 0: 15%|█▍ | 1845/12384 [3:55:35<22:20:19, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=8.42s]
Epoch 0: 15%|█▍ | 1845/12384 [3:55:44<22:20:19, 7.63s/it, loss=0.0006, acc=0.9985, iter_time=7.97s]
Epoch 0: 15%|█▍ | 1846/12384 [3:55:44<23:25:11, 8.00s/it, loss=0.0006, acc=0.9985, iter_time=7.97s]
Epoch 0: 15%|█▍ | 1846/12384 [3:55:51<23:25:11, 8.00s/it, loss=0.0019, acc=0.9927, iter_time=10.60s]
Epoch 0: 15%|█▍ | 1847/12384 [3:55:51<23:06:42, 7.90s/it, loss=0.0019, acc=0.9927, iter_time=10.60s]
Epoch 0: 15%|█▍ | 1847/12384 [3:55:59<23:06:42, 7.90s/it, loss=0.0001, acc=1.0000, iter_time=8.58s]
Epoch 0: 15%|█▍ | 1848/12384 [3:55:59<23:18:52, 7.97s/it, loss=0.0001, acc=1.0000, iter_time=8.58s]
Epoch 0: 15%|█▍ | 1848/12384 [3:56:07<23:18:52, 7.97s/it, loss=0.0002, acc=1.0000, iter_time=7.57s]
Epoch 0: 15%|█▍ | 1849/12384 [3:56:07<23:24:22, 8.00s/it, loss=0.0002, acc=1.0000, iter_time=7.57s]
Epoch 0: 15%|█▍ | 1849/12384 [3:56:15<23:24:22, 8.00s/it, loss=0.0013, acc=0.9980, iter_time=8.12s]
Epoch 0: 15%|█▍ | 1850/12384 [3:56:15<23:04:17, 7.88s/it, loss=0.0013, acc=0.9980, iter_time=8.12s]
Epoch 0: 15%|█▍ | 1850/12384 [3:56:23<23:04:17, 7.88s/it, loss=0.0005, acc=0.9987, iter_time=7.22s]
Epoch 0: 15%|█▍ | 1851/12384 [3:56:23<22:50:11, 7.81s/it, loss=0.0005, acc=0.9987, iter_time=7.22s]
Epoch 0: 15%|█▍ | 1851/12384 [3:56:30<22:50:11, 7.81s/it, loss=0.0088, acc=0.9897, iter_time=7.70s]
Epoch 0: 15%|█▍ | 1852/12384 [3:56:30<22:43:38, 7.77s/it, loss=0.0088, acc=0.9897, iter_time=7.70s]
Epoch 0: 15%|█▍ | 1852/12384 [3:56:38<22:43:38, 7.77s/it, loss=0.0016, acc=0.9961, iter_time=7.72s]
Epoch 0: 15%|█▍ | 1853/12384 [3:56:38<22:41:01, 7.75s/it, loss=0.0016, acc=0.9961, iter_time=7.72s]
Epoch 0: 15%|█▍ | 1853/12384 [3:56:46<22:41:01, 7.75s/it, loss=0.0006, acc=0.9979, iter_time=7.71s]
Epoch 0: 15%|█▍ | 1854/12384 [3:56:46<22:38:31, 7.74s/it, loss=0.0006, acc=0.9979, iter_time=7.71s]
Epoch 0: 15%|█▍ | 1854/12384 [3:56:53<22:38:31, 7.74s/it, loss=0.0009, acc=0.9983, iter_time=5.69s]
Epoch 0: 15%|█▍ | 1855/12384 [3:56:53<22:32:16, 7.71s/it, loss=0.0009, acc=0.9983, iter_time=5.69s]
Epoch 0: 15%|█▍ | 1855/12384 [3:57:01<22:32:16, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=9.47s]
Epoch 0: 15%|█▍ | 1856/12384 [3:57:01<22:26:12, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=9.47s]
Epoch 0: 15%|█▍ | 1856/12384 [3:57:09<22:26:12, 7.67s/it, loss=0.0005, acc=0.9979, iter_time=7.65s]
Epoch 0: 15%|█▍ | 1857/12384 [3:57:09<22:23:42, 7.66s/it, loss=0.0005, acc=0.9979, iter_time=7.65s]
Epoch 0: 15%|█▍ | 1857/12384 [3:57:16<22:23:42, 7.66s/it, loss=0.0003, acc=0.9993, iter_time=5.30s]
Epoch 0: 15%|█▌ | 1858/12384 [3:57:16<22:22:01, 7.65s/it, loss=0.0003, acc=0.9993, iter_time=5.30s]
Epoch 0: 15%|█▌ | 1858/12384 [3:57:24<22:22:01, 7.65s/it, loss=0.0005, acc=0.9974, iter_time=9.66s]
Epoch 0: 15%|█▌ | 1859/12384 [3:57:24<22:20:52, 7.64s/it, loss=0.0005, acc=0.9974, iter_time=9.66s]
Epoch 0: 15%|█▌ | 1859/12384 [3:57:32<22:20:52, 7.64s/it, loss=0.0010, acc=0.9964, iter_time=7.62s]
Epoch 0: 15%|█▌ | 1860/12384 [3:57:32<22:18:57, 7.63s/it, loss=0.0010, acc=0.9964, iter_time=7.62s]
Epoch 0: 15%|█▌ | 1860/12384 [3:57:39<22:18:57, 7.63s/it, loss=0.0005, acc=0.9997, iter_time=6.70s]
Epoch 0: 15%|█▌ | 1861/12384 [3:57:39<22:18:08, 7.63s/it, loss=0.0005, acc=0.9997, iter_time=6.70s]
Epoch 0: 15%|█▌ | 1861/12384 [3:57:47<22:18:08, 7.63s/it, loss=0.0065, acc=0.9889, iter_time=8.84s]
Epoch 0: 15%|█▌ | 1862/12384 [3:57:47<22:17:40, 7.63s/it, loss=0.0065, acc=0.9889, iter_time=8.84s]
Epoch 0: 15%|█▌ | 1862/12384 [3:57:54<22:17:40, 7.63s/it, loss=0.0028, acc=0.9897, iter_time=7.04s]
Epoch 0: 15%|█▌ | 1863/12384 [3:57:54<22:17:08, 7.63s/it, loss=0.0028, acc=0.9897, iter_time=7.04s]
Epoch 0: 15%|█▌ | 1863/12384 [3:58:02<22:17:08, 7.63s/it, loss=0.0004, acc=0.9998, iter_time=8.16s]
Epoch 0: 15%|█▌ | 1864/12384 [3:58:02<22:16:13, 7.62s/it, loss=0.0004, acc=0.9998, iter_time=8.16s]
Epoch 0: 15%|█▌ | 1864/12384 [3:58:10<22:16:13, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=7.76s]
Epoch 0: 15%|█▌ | 1865/12384 [3:58:10<22:20:10, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=7.76s]
Epoch 0: 15%|█▌ | 1865/12384 [3:58:17<22:20:10, 7.64s/it, loss=0.0011, acc=0.9965, iter_time=7.68s]
Epoch 0: 15%|█▌ | 1866/12384 [3:58:17<22:21:24, 7.65s/it, loss=0.0011, acc=0.9965, iter_time=7.68s]
Epoch 0: 15%|█▌ | 1866/12384 [3:58:25<22:21:24, 7.65s/it, loss=0.0008, acc=0.9974, iter_time=7.72s]
Epoch 0: 15%|█▌ | 1867/12384 [3:58:25<22:24:40, 7.67s/it, loss=0.0008, acc=0.9974, iter_time=7.72s]
Epoch 0: 15%|█▌ | 1867/12384 [3:58:33<22:24:40, 7.67s/it, loss=0.0056, acc=0.9869, iter_time=4.66s]
Epoch 0: 15%|█▌ | 1868/12384 [3:58:33<22:24:17, 7.67s/it, loss=0.0056, acc=0.9869, iter_time=4.66s]
Epoch 0: 15%|█▌ | 1868/12384 [3:58:41<22:24:17, 7.67s/it, loss=0.0013, acc=0.9977, iter_time=10.81s]
Epoch 0: 15%|█▌ | 1869/12384 [3:58:41<22:31:24, 7.71s/it, loss=0.0013, acc=0.9977, iter_time=10.81s]
Epoch 0: 15%|█▌ | 1869/12384 [3:58:48<22:31:24, 7.71s/it, loss=0.0009, acc=0.9983, iter_time=7.69s]
Epoch 0: 15%|█▌ | 1870/12384 [3:58:48<22:33:55, 7.73s/it, loss=0.0009, acc=0.9983, iter_time=7.69s]
Epoch 0: 15%|█▌ | 1870/12384 [3:58:56<22:33:55, 7.73s/it, loss=0.0006, acc=0.9995, iter_time=6.27s]
Epoch 0: 15%|█▌ | 1871/12384 [3:58:56<22:27:42, 7.69s/it, loss=0.0006, acc=0.9995, iter_time=6.27s]
Epoch 0: 15%|█▌ | 1871/12384 [3:59:04<22:27:42, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=9.53s]
Epoch 0: 15%|█▌ | 1872/12384 [3:59:04<22:29:30, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=9.53s]
Epoch 0: 15%|█▌ | 1872/12384 [3:59:11<22:29:30, 7.70s/it, loss=0.0003, acc=0.9987, iter_time=4.37s]
Epoch 0: 15%|█▌ | 1873/12384 [3:59:11<22:27:31, 7.69s/it, loss=0.0003, acc=0.9987, iter_time=4.37s]
Epoch 0: 15%|█▌ | 1873/12384 [3:59:19<22:27:31, 7.69s/it, loss=0.0008, acc=0.9980, iter_time=10.50s]
Epoch 0: 15%|█▌ | 1874/12384 [3:59:19<22:24:08, 7.67s/it, loss=0.0008, acc=0.9980, iter_time=10.50s]
Epoch 0: 15%|█▌ | 1874/12384 [3:59:27<22:24:08, 7.67s/it, loss=0.0005, acc=0.9998, iter_time=7.75s]
Epoch 0: 15%|█▌ | 1875/12384 [3:59:27<22:41:02, 7.77s/it, loss=0.0005, acc=0.9998, iter_time=7.75s]
Epoch 0: 15%|█▌ | 1875/12384 [3:59:35<22:41:02, 7.77s/it, loss=0.0013, acc=0.9948, iter_time=8.00s]
Epoch 0: 15%|█▌ | 1876/12384 [3:59:35<22:38:26, 7.76s/it, loss=0.0013, acc=0.9948, iter_time=8.00s]
Epoch 0: 15%|█▌ | 1876/12384 [3:59:42<22:38:26, 7.76s/it, loss=0.0009, acc=0.9979, iter_time=7.61s]
Epoch 0: 15%|█▌ | 1877/12384 [3:59:42<22:30:41, 7.71s/it, loss=0.0009, acc=0.9979, iter_time=7.61s]
Epoch 0: 15%|█▌ | 1877/12384 [3:59:50<22:30:41, 7.71s/it, loss=0.0002, acc=1.0000, iter_time=6.42s]
Epoch 0: 15%|█▌ | 1878/12384 [3:59:50<22:29:09, 7.71s/it, loss=0.0002, acc=1.0000, iter_time=6.42s]
Epoch 0: 15%|█▌ | 1878/12384 [3:59:58<22:29:09, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=8.87s]
Epoch 0: 15%|█▌ | 1879/12384 [3:59:58<22:26:05, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=8.87s]
Epoch 0: 15%|█▌ | 1879/12384 [4:00:05<22:26:05, 7.69s/it, loss=0.0003, acc=1.0000, iter_time=8.03s]
Epoch 0: 15%|█▌ | 1880/12384 [4:00:05<22:22:04, 7.67s/it, loss=0.0003, acc=1.0000, iter_time=8.03s]
Epoch 0: 15%|█▌ | 1880/12384 [4:00:13<22:22:04, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=7.22s]
Epoch 0: 15%|█▌ | 1881/12384 [4:00:13<22:19:20, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.22s]
Epoch 0: 15%|█▌ | 1881/12384 [4:00:20<22:19:20, 7.65s/it, loss=0.0010, acc=0.9985, iter_time=6.42s]
Epoch 0: 15%|█▌ | 1882/12384 [4:00:20<22:17:42, 7.64s/it, loss=0.0010, acc=0.9985, iter_time=6.42s]
Epoch 0: 15%|█▌ | 1882/12384 [4:00:28<22:17:42, 7.64s/it, loss=0.0019, acc=0.9958, iter_time=8.83s]
Epoch 0: 15%|█▌ | 1883/12384 [4:00:28<22:17:15, 7.64s/it, loss=0.0019, acc=0.9958, iter_time=8.83s]
Epoch 0: 15%|█▌ | 1883/12384 [4:00:36<22:17:15, 7.64s/it, loss=0.0006, acc=0.9999, iter_time=7.64s]
Epoch 0: 15%|█▌ | 1884/12384 [4:00:36<22:15:04, 7.63s/it, loss=0.0006, acc=0.9999, iter_time=7.64s]
Epoch 0: 15%|█▌ | 1884/12384 [4:00:43<22:15:04, 7.63s/it, loss=0.0012, acc=0.9973, iter_time=7.59s]
Epoch 0: 15%|█▌ | 1885/12384 [4:00:43<22:14:50, 7.63s/it, loss=0.0012, acc=0.9973, iter_time=7.59s]
Epoch 0: 15%|█▌ | 1885/12384 [4:00:51<22:14:50, 7.63s/it, loss=0.0010, acc=0.9984, iter_time=7.63s]
Epoch 0: 15%|█▌ | 1886/12384 [4:00:51<22:17:48, 7.65s/it, loss=0.0010, acc=0.9984, iter_time=7.63s]
Epoch 0: 15%|█▌ | 1886/12384 [4:00:59<22:17:48, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.80s]
Epoch 0: 15%|█▌ | 1887/12384 [4:00:59<22:26:22, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.80s]
Epoch 0: 15%|█▌ | 1887/12384 [4:01:06<22:26:22, 7.70s/it, loss=0.0003, acc=1.0000, iter_time=8.08s]
Epoch 0: 15%|█▌ | 1888/12384 [4:01:06<22:22:04, 7.67s/it, loss=0.0003, acc=1.0000, iter_time=8.08s]
Epoch 0: 15%|█▌ | 1888/12384 [4:01:14<22:22:04, 7.67s/it, loss=0.0005, acc=0.9999, iter_time=6.92s]
Epoch 0: 15%|█▌ | 1889/12384 [4:01:14<22:21:10, 7.67s/it, loss=0.0005, acc=0.9999, iter_time=6.92s]
Epoch 0: 15%|█▌ | 1889/12384 [4:01:22<22:21:10, 7.67s/it, loss=0.0008, acc=0.9991, iter_time=7.99s]
Epoch 0: 15%|█▌ | 1890/12384 [4:01:22<22:18:31, 7.65s/it, loss=0.0008, acc=0.9991, iter_time=7.99s]
Epoch 0: 15%|█▌ | 1890/12384 [4:01:29<22:18:31, 7.65s/it, loss=0.0002, acc=0.9993, iter_time=6.49s]
Epoch 0: 15%|█▌ | 1891/12384 [4:01:29<22:15:38, 7.64s/it, loss=0.0002, acc=0.9993, iter_time=6.49s]
Epoch 0: 15%|█▌ | 1891/12384 [4:01:37<22:15:38, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.69s]
Epoch 0: 15%|█▌ | 1892/12384 [4:01:37<22:15:05, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.69s]
Epoch 0: 15%|█▌ | 1892/12384 [4:01:45<22:15:05, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=6.74s]
Epoch 0: 15%|█▌ | 1893/12384 [4:01:45<22:22:16, 7.68s/it, loss=0.0003, acc=1.0000, iter_time=6.74s]
Epoch 0: 15%|█▌ | 1893/12384 [4:01:52<22:22:16, 7.68s/it, loss=0.0003, acc=0.9998, iter_time=10.67s]
Epoch 0: 15%|█▌ | 1894/12384 [4:01:52<22:18:47, 7.66s/it, loss=0.0003, acc=0.9998, iter_time=10.67s]
Epoch 0: 15%|█▌ | 1894/12384 [4:02:00<22:18:47, 7.66s/it, loss=0.0005, acc=0.9984, iter_time=7.63s]
Epoch 0: 15%|█▌ | 1895/12384 [4:02:00<22:17:55, 7.65s/it, loss=0.0005, acc=0.9984, iter_time=7.63s]
Epoch 0: 15%|█▌ | 1895/12384 [4:02:08<22:17:55, 7.65s/it, loss=0.0008, acc=0.9979, iter_time=8.05s]
Epoch 0: 15%|█▌ | 1896/12384 [4:02:08<22:18:01, 7.65s/it, loss=0.0008, acc=0.9979, iter_time=8.05s]
Epoch 0: 15%|█▌ | 1896/12384 [4:02:15<22:18:01, 7.65s/it, loss=0.0007, acc=0.9965, iter_time=7.25s]
Epoch 0: 15%|█▌ | 1897/12384 [4:02:15<22:17:06, 7.65s/it, loss=0.0007, acc=0.9965, iter_time=7.25s]
Epoch 0: 15%|█▌ | 1897/12384 [4:02:23<22:17:06, 7.65s/it, loss=0.0055, acc=0.9911, iter_time=4.79s]
Epoch 0: 15%|█▌ | 1898/12384 [4:02:23<22:14:52, 7.64s/it, loss=0.0055, acc=0.9911, iter_time=4.79s]
Epoch 0: 15%|█▌ | 1898/12384 [4:02:31<22:14:52, 7.64s/it, loss=0.0006, acc=1.0000, iter_time=8.96s]
Epoch 0: 15%|█▌ | 1899/12384 [4:02:31<22:16:15, 7.65s/it, loss=0.0006, acc=1.0000, iter_time=8.96s]
Epoch 0: 15%|█▌ | 1899/12384 [4:02:38<22:16:15, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=9.63s]
Epoch 0: 15%|█▌ | 1900/12384 [4:02:38<22:17:22, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=9.63s]
Epoch 0: 15%|█▌ | 1900/12384 [4:02:46<22:17:22, 7.65s/it, loss=0.0002, acc=0.9998, iter_time=7.48s]
Epoch 0: 15%|█▌ | 1901/12384 [4:02:46<22:32:45, 7.74s/it, loss=0.0002, acc=0.9998, iter_time=7.48s]
Epoch 0: 15%|█▌ | 1901/12384 [4:02:54<22:32:45, 7.74s/it, loss=0.0009, acc=0.9982, iter_time=4.90s]
Epoch 0: 15%|█▌ | 1902/12384 [4:02:54<22:27:06, 7.71s/it, loss=0.0009, acc=0.9982, iter_time=4.90s]
Epoch 0: 15%|█▌ | 1902/12384 [4:03:02<22:27:06, 7.71s/it, loss=0.0058, acc=0.9907, iter_time=10.42s]
Epoch 0: 15%|█▌ | 1903/12384 [4:03:02<22:25:23, 7.70s/it, loss=0.0058, acc=0.9907, iter_time=10.42s]
Epoch 0: 15%|█▌ | 1903/12384 [4:03:09<22:25:23, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=8.06s]
Epoch 0: 15%|█▌ | 1904/12384 [4:03:09<22:20:17, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=8.06s]
Epoch 0: 15%|█▌ | 1904/12384 [4:03:17<22:20:17, 7.67s/it, loss=0.0003, acc=1.0000, iter_time=7.20s]
Epoch 0: 15%|█▌ | 1905/12384 [4:03:17<22:14:56, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=7.20s]
Epoch 0: 15%|█▌ | 1905/12384 [4:03:24<22:14:56, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 15%|█▌ | 1906/12384 [4:03:24<22:13:10, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 15%|█▌ | 1906/12384 [4:03:32<22:13:10, 7.63s/it, loss=0.0033, acc=0.9937, iter_time=4.75s]
Epoch 0: 15%|█▌ | 1907/12384 [4:03:32<22:14:40, 7.64s/it, loss=0.0033, acc=0.9937, iter_time=4.75s]
Epoch 0: 15%|█▌ | 1907/12384 [4:03:40<22:14:40, 7.64s/it, loss=0.0009, acc=0.9985, iter_time=10.53s]
Epoch 0: 15%|█▌ | 1908/12384 [4:03:40<22:13:16, 7.64s/it, loss=0.0009, acc=0.9985, iter_time=10.53s]
Epoch 0: 15%|█▌ | 1908/12384 [4:03:47<22:13:16, 7.64s/it, loss=0.0089, acc=0.9913, iter_time=7.62s]
Epoch 0: 15%|█▌ | 1909/12384 [4:03:47<22:13:31, 7.64s/it, loss=0.0089, acc=0.9913, iter_time=7.62s]
Epoch 0: 15%|█▌ | 1909/12384 [4:03:55<22:13:31, 7.64s/it, loss=0.0002, acc=0.9995, iter_time=4.78s]
Epoch 0: 15%|█▌ | 1910/12384 [4:03:55<22:12:21, 7.63s/it, loss=0.0002, acc=0.9995, iter_time=4.78s]
Epoch 0: 15%|█▌ | 1910/12384 [4:04:03<22:12:21, 7.63s/it, loss=0.0007, acc=0.9994, iter_time=10.51s]
Epoch 0: 15%|█▌ | 1911/12384 [4:04:03<22:12:55, 7.64s/it, loss=0.0007, acc=0.9994, iter_time=10.51s]
Epoch 0: 15%|█▌ | 1911/12384 [4:04:10<22:12:55, 7.64s/it, loss=0.0006, acc=0.9993, iter_time=7.57s]
Epoch 0: 15%|█▌ | 1912/12384 [4:04:10<22:12:22, 7.63s/it, loss=0.0006, acc=0.9993, iter_time=7.57s]
Epoch 0: 15%|█▌ | 1912/12384 [4:04:18<22:12:22, 7.63s/it, loss=0.0007, acc=0.9965, iter_time=4.14s]
Epoch 0: 15%|█▌ | 1913/12384 [4:04:18<22:13:53, 7.64s/it, loss=0.0007, acc=0.9965, iter_time=4.14s]
Epoch 0: 15%|█▌ | 1913/12384 [4:04:25<22:13:53, 7.64s/it, loss=0.0011, acc=0.9995, iter_time=9.97s]
Epoch 0: 15%|█▌ | 1914/12384 [4:04:25<22:14:11, 7.65s/it, loss=0.0011, acc=0.9995, iter_time=9.97s]
Epoch 0: 15%|█▌ | 1914/12384 [4:04:33<22:14:11, 7.65s/it, loss=0.0031, acc=0.9896, iter_time=8.87s]
Epoch 0: 15%|█▌ | 1915/12384 [4:04:33<22:12:03, 7.63s/it, loss=0.0031, acc=0.9896, iter_time=8.87s]
Epoch 0: 15%|█▌ | 1915/12384 [4:04:41<22:12:03, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 15%|█▌ | 1916/12384 [4:04:41<22:15:18, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 15%|█▌ | 1916/12384 [4:04:48<22:15:18, 7.65s/it, loss=0.0006, acc=0.9999, iter_time=7.72s]
Epoch 0: 15%|█▌ | 1917/12384 [4:04:48<22:13:26, 7.64s/it, loss=0.0006, acc=0.9999, iter_time=7.72s]
Epoch 0: 15%|█▌ | 1917/12384 [4:04:56<22:13:26, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.12s]
Epoch 0: 15%|█▌ | 1918/12384 [4:04:56<22:11:57, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.12s]
Epoch 0: 15%|█▌ | 1918/12384 [4:05:04<22:11:57, 7.64s/it, loss=0.0014, acc=0.9978, iter_time=9.21s]
Epoch 0: 15%|█▌ | 1919/12384 [4:05:04<22:18:12, 7.67s/it, loss=0.0014, acc=0.9978, iter_time=9.21s]
Epoch 0: 15%|█▌ | 1919/12384 [4:05:11<22:18:12, 7.67s/it, loss=0.0009, acc=0.9955, iter_time=8.03s]
Epoch 0: 16%|█▌ | 1920/12384 [4:05:11<22:16:31, 7.66s/it, loss=0.0009, acc=0.9955, iter_time=8.03s]
Epoch 0: 16%|█▌ | 1920/12384 [4:05:19<22:16:31, 7.66s/it, loss=0.0006, acc=0.9974, iter_time=7.35s]
Epoch 0: 16%|█▌ | 1921/12384 [4:05:19<22:18:38, 7.68s/it, loss=0.0006, acc=0.9974, iter_time=7.35s]
Epoch 0: 16%|█▌ | 1921/12384 [4:05:27<22:18:38, 7.68s/it, loss=0.0004, acc=0.9984, iter_time=7.65s]
Epoch 0: 16%|█▌ | 1922/12384 [4:05:27<22:16:31, 7.67s/it, loss=0.0004, acc=0.9984, iter_time=7.65s]
Epoch 0: 16%|█▌ | 1922/12384 [4:05:34<22:16:31, 7.67s/it, loss=0.0010, acc=0.9977, iter_time=7.62s]
Epoch 0: 16%|█▌ | 1923/12384 [4:05:34<22:14:41, 7.66s/it, loss=0.0010, acc=0.9977, iter_time=7.62s]
Epoch 0: 16%|█▌ | 1923/12384 [4:05:42<22:14:41, 7.66s/it, loss=0.0015, acc=0.9953, iter_time=3.81s]
Epoch 0: 16%|█▌ | 1924/12384 [4:05:42<22:14:22, 7.65s/it, loss=0.0015, acc=0.9953, iter_time=3.81s]
Epoch 0: 16%|█▌ | 1924/12384 [4:05:50<22:14:22, 7.65s/it, loss=0.0015, acc=0.9976, iter_time=11.48s]
Epoch 0: 16%|█▌ | 1925/12384 [4:05:50<22:19:12, 7.68s/it, loss=0.0015, acc=0.9976, iter_time=11.48s]
Epoch 0: 16%|█▌ | 1925/12384 [4:05:57<22:19:12, 7.68s/it, loss=0.0018, acc=0.9983, iter_time=7.74s]
Epoch 0: 16%|█▌ | 1926/12384 [4:05:57<22:17:39, 7.67s/it, loss=0.0018, acc=0.9983, iter_time=7.74s]
Epoch 0: 16%|█▌ | 1926/12384 [4:06:05<22:17:39, 7.67s/it, loss=0.0007, acc=0.9996, iter_time=4.61s]
Epoch 0: 16%|█▌ | 1927/12384 [4:06:05<22:16:06, 7.67s/it, loss=0.0007, acc=0.9996, iter_time=4.61s]
Epoch 0: 16%|█▌ | 1927/12384 [4:06:13<22:16:06, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=11.38s]
Epoch 0: 16%|█▌ | 1928/12384 [4:06:13<22:30:39, 7.75s/it, loss=0.0002, acc=1.0000, iter_time=11.38s]
Epoch 0: 16%|█▌ | 1928/12384 [4:06:21<22:30:39, 7.75s/it, loss=0.0020, acc=0.9942, iter_time=7.23s]
Epoch 0: 16%|█▌ | 1929/12384 [4:06:21<22:23:05, 7.71s/it, loss=0.0020, acc=0.9942, iter_time=7.23s]
Epoch 0: 16%|█▌ | 1929/12384 [4:06:28<22:23:05, 7.71s/it, loss=0.0022, acc=0.9954, iter_time=7.64s]
Epoch 0: 16%|█▌ | 1930/12384 [4:06:28<22:19:33, 7.69s/it, loss=0.0022, acc=0.9954, iter_time=7.64s]
Epoch 0: 16%|█▌ | 1930/12384 [4:06:36<22:19:33, 7.69s/it, loss=0.0006, acc=0.9994, iter_time=7.63s]
Epoch 0: 16%|█▌ | 1931/12384 [4:06:36<22:17:43, 7.68s/it, loss=0.0006, acc=0.9994, iter_time=7.63s]
Epoch 0: 16%|█▌ | 1931/12384 [4:06:44<22:17:43, 7.68s/it, loss=0.0006, acc=0.9998, iter_time=7.35s]
Epoch 0: 16%|█▌ | 1932/12384 [4:06:44<22:14:33, 7.66s/it, loss=0.0006, acc=0.9998, iter_time=7.35s]
Epoch 0: 16%|█▌ | 1932/12384 [4:06:51<22:14:33, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.93s]
Epoch 0: 16%|█▌ | 1933/12384 [4:06:51<22:13:47, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.93s]
Epoch 0: 16%|█▌ | 1933/12384 [4:06:59<22:13:47, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.65s]
Epoch 0: 16%|█▌ | 1934/12384 [4:06:59<22:14:58, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.65s]
Epoch 0: 16%|█▌ | 1934/12384 [4:07:07<22:14:58, 7.66s/it, loss=0.0009, acc=0.9995, iter_time=7.07s]
Epoch 0: 16%|█▌ | 1935/12384 [4:07:07<22:13:37, 7.66s/it, loss=0.0009, acc=0.9995, iter_time=7.07s]
Epoch 0: 16%|█▌ | 1935/12384 [4:07:14<22:13:37, 7.66s/it, loss=0.0005, acc=1.0000, iter_time=8.62s]
Epoch 0: 16%|█▌ | 1936/12384 [4:07:14<22:15:40, 7.67s/it, loss=0.0005, acc=1.0000, iter_time=8.62s]
Epoch 0: 16%|█▌ | 1936/12384 [4:07:22<22:15:40, 7.67s/it, loss=0.0006, acc=0.9981, iter_time=6.11s]
Epoch 0: 16%|█▌ | 1937/12384 [4:07:22<22:11:57, 7.65s/it, loss=0.0006, acc=0.9981, iter_time=6.11s]
Epoch 0: 16%|█▌ | 1937/12384 [4:07:29<22:11:57, 7.65s/it, loss=0.0001, acc=0.9998, iter_time=7.60s]
Epoch 0: 16%|█▌ | 1938/12384 [4:07:29<22:10:10, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=7.60s]
Epoch 0: 16%|█▌ | 1938/12384 [4:07:37<22:10:10, 7.64s/it, loss=0.0016, acc=0.9985, iter_time=8.87s]
Epoch 0: 16%|█▌ | 1939/12384 [4:07:37<22:08:42, 7.63s/it, loss=0.0016, acc=0.9985, iter_time=8.87s]
Epoch 0: 16%|█▌ | 1939/12384 [4:07:45<22:08:42, 7.63s/it, loss=0.0006, acc=0.9991, iter_time=7.63s]
Epoch 0: 16%|█▌ | 1940/12384 [4:07:45<22:10:12, 7.64s/it, loss=0.0006, acc=0.9991, iter_time=7.63s]
Epoch 0: 16%|█▌ | 1940/12384 [4:07:52<22:10:12, 7.64s/it, loss=0.0003, acc=0.9998, iter_time=6.40s]
Epoch 0: 16%|█▌ | 1941/12384 [4:07:52<22:09:36, 7.64s/it, loss=0.0003, acc=0.9998, iter_time=6.40s]
Epoch 0: 16%|█▌ | 1941/12384 [4:08:00<22:09:36, 7.64s/it, loss=0.0019, acc=0.9960, iter_time=8.83s]
Epoch 0: 16%|█▌ | 1942/12384 [4:08:00<22:08:45, 7.64s/it, loss=0.0019, acc=0.9960, iter_time=8.83s]
Epoch 0: 16%|█▌ | 1942/12384 [4:08:08<22:08:45, 7.64s/it, loss=0.0012, acc=0.9983, iter_time=7.64s]
Epoch 0: 16%|█▌ | 1943/12384 [4:08:08<22:08:28, 7.63s/it, loss=0.0012, acc=0.9983, iter_time=7.64s]
Epoch 0: 16%|█▌ | 1943/12384 [4:08:15<22:08:28, 7.63s/it, loss=0.0018, acc=0.9950, iter_time=7.61s]
Epoch 0: 16%|█▌ | 1944/12384 [4:08:15<22:09:24, 7.64s/it, loss=0.0018, acc=0.9950, iter_time=7.61s]
Epoch 0: 16%|█▌ | 1944/12384 [4:08:23<22:09:24, 7.64s/it, loss=0.0006, acc=0.9975, iter_time=4.80s]
Epoch 0: 16%|█▌ | 1945/12384 [4:08:23<22:11:04, 7.65s/it, loss=0.0006, acc=0.9975, iter_time=4.80s]
Epoch 0: 16%|█▌ | 1945/12384 [4:08:31<22:11:04, 7.65s/it, loss=0.0016, acc=0.9941, iter_time=8.20s]
Epoch 0: 16%|█▌ | 1946/12384 [4:08:31<22:09:29, 7.64s/it, loss=0.0016, acc=0.9941, iter_time=8.20s]
Epoch 0: 16%|█▌ | 1946/12384 [4:08:38<22:09:29, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=9.94s]
Epoch 0: 16%|█▌ | 1947/12384 [4:08:38<22:08:00, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.94s]
Epoch 0: 16%|█▌ | 1947/12384 [4:08:46<22:08:00, 7.63s/it, loss=0.0028, acc=0.9932, iter_time=7.64s]
Epoch 0: 16%|█▌ | 1948/12384 [4:08:46<22:08:19, 7.64s/it, loss=0.0028, acc=0.9932, iter_time=7.64s]
Epoch 0: 16%|█▌ | 1948/12384 [4:08:53<22:08:19, 7.64s/it, loss=0.0011, acc=0.9975, iter_time=6.44s]
Epoch 0: 16%|█▌ | 1949/12384 [4:08:53<22:07:14, 7.63s/it, loss=0.0011, acc=0.9975, iter_time=6.44s]
Epoch 0: 16%|█▌ | 1949/12384 [4:09:01<22:07:14, 7.63s/it, loss=0.0010, acc=0.9976, iter_time=9.22s]
Epoch 0: 16%|█▌ | 1950/12384 [4:09:01<22:06:02, 7.63s/it, loss=0.0010, acc=0.9976, iter_time=9.22s]
Epoch 0: 16%|█▌ | 1950/12384 [4:09:09<22:06:02, 7.63s/it, loss=0.0012, acc=0.9975, iter_time=7.21s]
Epoch 0: 16%|█▌ | 1951/12384 [4:09:09<22:05:53, 7.63s/it, loss=0.0012, acc=0.9975, iter_time=7.21s]
Epoch 0: 16%|█▌ | 1951/12384 [4:09:16<22:05:53, 7.63s/it, loss=0.0020, acc=0.9984, iter_time=8.02s]
Epoch 0: 16%|█▌ | 1952/12384 [4:09:16<22:05:05, 7.62s/it, loss=0.0020, acc=0.9984, iter_time=8.02s]
Epoch 0: 16%|█▌ | 1952/12384 [4:09:24<22:05:05, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.23s]
Epoch 0: 16%|█▌ | 1953/12384 [4:09:24<22:10:12, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.23s]
Epoch 0: 16%|█▌ | 1953/12384 [4:09:32<22:10:12, 7.65s/it, loss=0.0006, acc=0.9966, iter_time=6.84s]
Epoch 0: 16%|█▌ | 1954/12384 [4:09:32<22:27:12, 7.75s/it, loss=0.0006, acc=0.9966, iter_time=6.84s]
Epoch 0: 16%|█▌ | 1954/12384 [4:09:40<22:27:12, 7.75s/it, loss=0.0016, acc=0.9979, iter_time=7.73s]
Epoch 0: 16%|█▌ | 1955/12384 [4:09:40<22:21:00, 7.72s/it, loss=0.0016, acc=0.9979, iter_time=7.73s]
Epoch 0: 16%|█▌ | 1955/12384 [4:09:47<22:21:00, 7.72s/it, loss=0.0001, acc=0.9998, iter_time=5.24s]
Epoch 0: 16%|█▌ | 1956/12384 [4:09:47<22:20:44, 7.71s/it, loss=0.0001, acc=0.9998, iter_time=5.24s]
Epoch 0: 16%|█▌ | 1956/12384 [4:09:55<22:20:44, 7.71s/it, loss=0.0005, acc=0.9980, iter_time=8.93s]
Epoch 0: 16%|█▌ | 1957/12384 [4:09:55<22:19:44, 7.71s/it, loss=0.0005, acc=0.9980, iter_time=8.93s]
Epoch 0: 16%|█▌ | 1957/12384 [4:10:03<22:19:44, 7.71s/it, loss=0.0009, acc=0.9999, iter_time=9.39s]
Epoch 0: 16%|█▌ | 1958/12384 [4:10:03<22:13:21, 7.67s/it, loss=0.0009, acc=0.9999, iter_time=9.39s]
Epoch 0: 16%|█▌ | 1958/12384 [4:10:10<22:13:21, 7.67s/it, loss=0.0110, acc=0.9852, iter_time=6.98s]
Epoch 0: 16%|█▌ | 1959/12384 [4:10:10<22:09:47, 7.65s/it, loss=0.0110, acc=0.9852, iter_time=6.98s]
Epoch 0: 16%|█▌ | 1959/12384 [4:10:18<22:09:47, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=8.80s]
Epoch 0: 16%|█▌ | 1960/12384 [4:10:18<22:09:09, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=8.80s]
Epoch 0: 16%|█▌ | 1960/12384 [4:10:26<22:09:09, 7.65s/it, loss=0.0004, acc=0.9988, iter_time=7.65s]
Epoch 0: 16%|█▌ | 1961/12384 [4:10:26<22:11:04, 7.66s/it, loss=0.0004, acc=0.9988, iter_time=7.65s]
Epoch 0: 16%|█▌ | 1961/12384 [4:10:33<22:11:04, 7.66s/it, loss=0.0009, acc=0.9980, iter_time=6.77s]
Epoch 0: 16%|█▌ | 1962/12384 [4:10:33<22:10:19, 7.66s/it, loss=0.0009, acc=0.9980, iter_time=6.77s]
Epoch 0: 16%|█▌ | 1962/12384 [4:10:41<22:10:19, 7.66s/it, loss=0.0237, acc=0.9555, iter_time=8.60s]
Epoch 0: 16%|█▌ | 1963/12384 [4:10:41<22:09:29, 7.65s/it, loss=0.0237, acc=0.9555, iter_time=8.60s]
Epoch 0: 16%|█▌ | 1963/12384 [4:10:49<22:09:29, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=4.85s]
Epoch 0: 16%|█▌ | 1964/12384 [4:10:49<22:09:08, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=4.85s]
Epoch 0: 16%|█▌ | 1964/12384 [4:10:56<22:09:08, 7.65s/it, loss=0.0012, acc=0.9981, iter_time=10.44s]
Epoch 0: 16%|█▌ | 1965/12384 [4:10:56<22:08:21, 7.65s/it, loss=0.0012, acc=0.9981, iter_time=10.44s]
Epoch 0: 16%|█▌ | 1965/12384 [4:11:04<22:08:21, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.70s]
Epoch 0: 16%|█▌ | 1966/12384 [4:11:04<22:12:08, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=7.70s]
Epoch 0: 16%|█▌ | 1966/12384 [4:11:12<22:12:08, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 16%|█▌ | 1967/12384 [4:11:12<22:13:45, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 16%|█▌ | 1967/12384 [4:11:19<22:13:45, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.74s]
Epoch 0: 16%|█▌ | 1968/12384 [4:11:19<22:13:45, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.74s]
Epoch 0: 16%|█▌ | 1968/12384 [4:11:27<22:13:45, 7.68s/it, loss=0.0007, acc=0.9980, iter_time=7.66s]
Epoch 0: 16%|█▌ | 1969/12384 [4:11:27<22:10:42, 7.67s/it, loss=0.0007, acc=0.9980, iter_time=7.66s]
Epoch 0: 16%|█▌ | 1969/12384 [4:11:35<22:10:42, 7.67s/it, loss=0.0019, acc=0.9948, iter_time=7.64s]
Epoch 0: 16%|█▌ | 1970/12384 [4:11:35<22:08:00, 7.65s/it, loss=0.0019, acc=0.9948, iter_time=7.64s]
Epoch 0: 16%|█▌ | 1970/12384 [4:11:42<22:08:00, 7.65s/it, loss=0.0022, acc=0.9961, iter_time=4.32s]
Epoch 0: 16%|█▌ | 1971/12384 [4:11:42<22:05:39, 7.64s/it, loss=0.0022, acc=0.9961, iter_time=4.32s]
Epoch 0: 16%|█▌ | 1971/12384 [4:11:50<22:05:39, 7.64s/it, loss=0.0010, acc=0.9983, iter_time=10.90s]
Epoch 0: 16%|█▌ | 1972/12384 [4:11:50<22:04:31, 7.63s/it, loss=0.0010, acc=0.9983, iter_time=10.90s]
Epoch 0: 16%|█▌ | 1972/12384 [4:11:57<22:04:31, 7.63s/it, loss=0.0008, acc=0.9980, iter_time=7.33s]
Epoch 0: 16%|█▌ | 1973/12384 [4:11:57<22:02:45, 7.62s/it, loss=0.0008, acc=0.9980, iter_time=7.33s]
Epoch 0: 16%|█▌ | 1973/12384 [4:12:05<22:02:45, 7.62s/it, loss=0.0005, acc=0.9998, iter_time=7.88s]
Epoch 0: 16%|█▌ | 1974/12384 [4:12:05<22:02:15, 7.62s/it, loss=0.0005, acc=0.9998, iter_time=7.88s]
Epoch 0: 16%|█▌ | 1974/12384 [4:12:13<22:02:15, 7.62s/it, loss=0.0036, acc=0.9948, iter_time=6.69s]
Epoch 0: 16%|█▌ | 1975/12384 [4:12:13<22:03:26, 7.63s/it, loss=0.0036, acc=0.9948, iter_time=6.69s]
Epoch 0: 16%|█▌ | 1975/12384 [4:12:20<22:03:26, 7.63s/it, loss=0.0004, acc=0.9984, iter_time=8.97s]
Epoch 0: 16%|█▌ | 1976/12384 [4:12:20<22:05:14, 7.64s/it, loss=0.0004, acc=0.9984, iter_time=8.97s]
Epoch 0: 16%|█▌ | 1976/12384 [4:12:28<22:05:14, 7.64s/it, loss=0.0004, acc=0.9994, iter_time=6.97s]
Epoch 0: 16%|█▌ | 1977/12384 [4:12:28<22:04:47, 7.64s/it, loss=0.0004, acc=0.9994, iter_time=6.97s]
Epoch 0: 16%|█▌ | 1977/12384 [4:12:36<22:04:47, 7.64s/it, loss=0.0004, acc=0.9996, iter_time=7.95s]
Epoch 0: 16%|█▌ | 1978/12384 [4:12:36<22:03:52, 7.63s/it, loss=0.0004, acc=0.9996, iter_time=7.95s]
Epoch 0: 16%|█▌ | 1978/12384 [4:12:43<22:03:52, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 16%|█▌ | 1979/12384 [4:12:43<22:03:04, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 16%|█▌ | 1979/12384 [4:12:51<22:03:04, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.61s]
Epoch 0: 16%|█▌ | 1980/12384 [4:12:51<22:04:35, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=7.61s]
Epoch 0: 16%|█▌ | 1980/12384 [4:12:59<22:04:35, 7.64s/it, loss=0.0006, acc=0.9991, iter_time=7.98s]
Epoch 0: 16%|█▌ | 1981/12384 [4:12:59<22:24:27, 7.75s/it, loss=0.0006, acc=0.9991, iter_time=7.98s]
Epoch 0: 16%|█▌ | 1981/12384 [4:13:07<22:24:27, 7.75s/it, loss=0.0004, acc=0.9991, iter_time=7.76s]
Epoch 0: 16%|█▌ | 1982/12384 [4:13:07<22:20:20, 7.73s/it, loss=0.0004, acc=0.9991, iter_time=7.76s]
Epoch 0: 16%|█▌ | 1982/12384 [4:13:14<22:20:20, 7.73s/it, loss=0.0002, acc=1.0000, iter_time=7.61s]
Epoch 0: 16%|█▌ | 1983/12384 [4:13:14<22:13:17, 7.69s/it, loss=0.0002, acc=1.0000, iter_time=7.61s]
Epoch 0: 16%|█▌ | 1983/12384 [4:13:22<22:13:17, 7.69s/it, loss=0.0002, acc=0.9998, iter_time=8.10s]
Epoch 0: 16%|█▌ | 1984/12384 [4:13:22<22:14:39, 7.70s/it, loss=0.0002, acc=0.9998, iter_time=8.10s]
Epoch 0: 16%|█▌ | 1984/12384 [4:13:29<22:14:39, 7.70s/it, loss=0.0007, acc=0.9972, iter_time=6.29s]
Epoch 0: 16%|█▌ | 1985/12384 [4:13:29<22:10:48, 7.68s/it, loss=0.0007, acc=0.9972, iter_time=6.29s]
Epoch 0: 16%|█▌ | 1985/12384 [4:13:37<22:10:48, 7.68s/it, loss=0.0004, acc=0.9997, iter_time=8.55s]
Epoch 0: 16%|█▌ | 1986/12384 [4:13:37<22:06:18, 7.65s/it, loss=0.0004, acc=0.9997, iter_time=8.55s]
Epoch 0: 16%|█▌ | 1986/12384 [4:13:45<22:06:18, 7.65s/it, loss=0.0003, acc=0.9997, iter_time=7.31s]
Epoch 0: 16%|█▌ | 1987/12384 [4:13:45<22:06:29, 7.66s/it, loss=0.0003, acc=0.9997, iter_time=7.31s]
Epoch 0: 16%|█▌ | 1987/12384 [4:13:52<22:06:29, 7.66s/it, loss=0.0005, acc=1.0000, iter_time=7.96s]
Epoch 0: 16%|█▌ | 1988/12384 [4:13:52<22:05:58, 7.65s/it, loss=0.0005, acc=1.0000, iter_time=7.96s]
Epoch 0: 16%|█▌ | 1988/12384 [4:14:00<22:05:58, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=3.67s]
Epoch 0: 16%|█▌ | 1989/12384 [4:14:00<22:05:35, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=3.67s]
Epoch 0: 16%|█▌ | 1989/12384 [4:14:08<22:05:35, 7.65s/it, loss=0.0003, acc=0.9998, iter_time=11.65s]
Epoch 0: 16%|█▌ | 1990/12384 [4:14:08<22:06:24, 7.66s/it, loss=0.0003, acc=0.9998, iter_time=11.65s]
Epoch 0: 16%|█▌ | 1990/12384 [4:14:15<22:06:24, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=6.23s]
Epoch 0: 16%|█▌ | 1991/12384 [4:14:15<22:07:12, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=6.23s]
Epoch 0: 16%|█▌ | 1991/12384 [4:14:23<22:07:12, 7.66s/it, loss=0.0002, acc=0.9998, iter_time=9.47s]
Epoch 0: 16%|█▌ | 1992/12384 [4:14:23<22:06:01, 7.66s/it, loss=0.0002, acc=0.9998, iter_time=9.47s]
Epoch 0: 16%|█▌ | 1992/12384 [4:14:31<22:06:01, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=4.13s]
Epoch 0: 16%|█▌ | 1993/12384 [4:14:31<22:04:59, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=4.13s]
Epoch 0: 16%|█▌ | 1993/12384 [4:14:38<22:04:59, 7.65s/it, loss=0.0002, acc=0.9998, iter_time=8.47s]
Epoch 0: 16%|█▌ | 1994/12384 [4:14:38<22:05:31, 7.65s/it, loss=0.0002, acc=0.9998, iter_time=8.47s]
Epoch 0: 16%|█▌ | 1994/12384 [4:14:46<22:05:31, 7.65s/it, loss=0.0002, acc=0.9998, iter_time=9.99s]
Epoch 0: 16%|█▌ | 1995/12384 [4:14:46<22:05:20, 7.65s/it, loss=0.0002, acc=0.9998, iter_time=9.99s]
Epoch 0: 16%|█▌ | 1995/12384 [4:14:54<22:05:20, 7.65s/it, loss=0.0005, acc=1.0000, iter_time=7.60s]
Epoch 0: 16%|█▌ | 1996/12384 [4:14:54<22:01:50, 7.63s/it, loss=0.0005, acc=1.0000, iter_time=7.60s]
Epoch 0: 16%|█▌ | 1996/12384 [4:15:01<22:01:50, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.64s]
Epoch 0: 16%|█▌ | 1997/12384 [4:15:01<22:01:59, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.64s]
Epoch 0: 16%|█▌ | 1997/12384 [4:15:09<22:01:59, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=4.57s]
Epoch 0: 16%|█▌ | 1998/12384 [4:15:09<22:03:39, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=4.57s]
Epoch 0: 16%|█▌ | 1998/12384 [4:15:16<22:03:39, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=10.70s]
Epoch 0: 16%|█▌ | 1999/12384 [4:15:16<22:00:35, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=10.70s]
Epoch 0: 16%|█▌ | 1999/12384 [4:15:24<22:00:35, 7.63s/it, loss=0.0004, acc=0.9998, iter_time=8.03s]
Epoch 0: 16%|█▌ | 2000/12384 [4:15:24<22:10:48, 7.69s/it, loss=0.0004, acc=0.9998, iter_time=8.03s]
Epoch 0: 16%|█▌ | 2000/12384 [4:15:32<22:10:48, 7.69s/it, loss=0.0011, acc=0.9961, iter_time=7.11s]
Epoch 0: 16%|█▌ | 2001/12384 [4:15:32<22:08:41, 7.68s/it, loss=0.0011, acc=0.9961, iter_time=7.11s]
Epoch 0: 16%|█▌ | 2001/12384 [4:15:40<22:08:41, 7.68s/it, loss=0.0001, acc=0.9998, iter_time=7.41s]
Epoch 0: 16%|█▌ | 2002/12384 [4:15:40<22:07:36, 7.67s/it, loss=0.0001, acc=0.9998, iter_time=7.41s]
Epoch 0: 16%|█▌ | 2002/12384 [4:15:47<22:07:36, 7.67s/it, loss=0.0008, acc=0.9977, iter_time=8.22s]
Epoch 0: 16%|█▌ | 2003/12384 [4:15:47<22:05:49, 7.66s/it, loss=0.0008, acc=0.9977, iter_time=8.22s]
Epoch 0: 16%|█▌ | 2003/12384 [4:15:55<22:05:49, 7.66s/it, loss=0.0028, acc=0.9974, iter_time=7.63s]
Epoch 0: 16%|█▌ | 2004/12384 [4:15:55<22:03:53, 7.65s/it, loss=0.0028, acc=0.9974, iter_time=7.63s]
Epoch 0: 16%|█▌ | 2004/12384 [4:16:02<22:03:53, 7.65s/it, loss=0.0013, acc=0.9964, iter_time=7.61s]
Epoch 0: 16%|█▌ | 2005/12384 [4:16:02<22:01:33, 7.64s/it, loss=0.0013, acc=0.9964, iter_time=7.61s]
Epoch 0: 16%|█▌ | 2005/12384 [4:16:10<22:01:33, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.89s]
Epoch 0: 16%|█▌ | 2006/12384 [4:16:10<22:13:24, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.89s]
Epoch 0: 16%|█▌ | 2006/12384 [4:16:18<22:13:24, 7.71s/it, loss=0.0004, acc=0.9995, iter_time=7.66s]
Epoch 0: 16%|█▌ | 2007/12384 [4:16:18<22:27:46, 7.79s/it, loss=0.0004, acc=0.9995, iter_time=7.66s]
Epoch 0: 16%|█▌ | 2007/12384 [4:16:26<22:27:46, 7.79s/it, loss=0.0003, acc=1.0000, iter_time=8.30s]
Epoch 0: 16%|█▌ | 2008/12384 [4:16:26<22:19:24, 7.75s/it, loss=0.0003, acc=1.0000, iter_time=8.30s]
Epoch 0: 16%|█▌ | 2008/12384 [4:16:34<22:19:24, 7.75s/it, loss=0.0008, acc=0.9988, iter_time=7.26s]
Epoch 0: 16%|█▌ | 2009/12384 [4:16:34<22:12:16, 7.70s/it, loss=0.0008, acc=0.9988, iter_time=7.26s]
Epoch 0: 16%|█▌ | 2009/12384 [4:16:41<22:12:16, 7.70s/it, loss=0.0106, acc=0.9933, iter_time=4.32s]
Epoch 0: 16%|█▌ | 2010/12384 [4:16:41<22:09:06, 7.69s/it, loss=0.0106, acc=0.9933, iter_time=4.32s]
Epoch 0: 16%|█▌ | 2010/12384 [4:16:49<22:09:06, 7.69s/it, loss=0.0006, acc=0.9983, iter_time=10.94s]
Epoch 0: 16%|█▌ | 2011/12384 [4:16:49<22:04:38, 7.66s/it, loss=0.0006, acc=0.9983, iter_time=10.94s]
Epoch 0: 16%|█▌ | 2011/12384 [4:16:56<22:04:38, 7.66s/it, loss=0.0019, acc=0.9972, iter_time=7.60s]
Epoch 0: 16%|█▌ | 2012/12384 [4:16:56<22:02:41, 7.65s/it, loss=0.0019, acc=0.9972, iter_time=7.60s]
Epoch 0: 16%|█▌ | 2012/12384 [4:17:04<22:02:41, 7.65s/it, loss=0.0006, acc=0.9987, iter_time=6.43s]
Epoch 0: 16%|█▋ | 2013/12384 [4:17:04<22:03:10, 7.66s/it, loss=0.0006, acc=0.9987, iter_time=6.43s]
Epoch 0: 16%|█▋ | 2013/12384 [4:17:12<22:03:10, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=6.24s]
Epoch 0: 16%|█▋ | 2014/12384 [4:17:12<22:01:19, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=6.24s]
Epoch 0: 16%|█▋ | 2014/12384 [4:17:19<22:01:19, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=10.40s]
Epoch 0: 16%|█▋ | 2015/12384 [4:17:19<22:07:21, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=10.40s]
Epoch 0: 16%|█▋ | 2015/12384 [4:17:27<22:07:21, 7.68s/it, loss=0.0017, acc=0.9963, iter_time=7.65s]
Epoch 0: 16%|█▋ | 2016/12384 [4:17:27<22:07:43, 7.68s/it, loss=0.0017, acc=0.9963, iter_time=7.65s]
Epoch 0: 16%|█▋ | 2016/12384 [4:17:35<22:07:43, 7.68s/it, loss=0.0007, acc=0.9967, iter_time=7.34s]
Epoch 0: 16%|█▋ | 2017/12384 [4:17:35<22:04:46, 7.67s/it, loss=0.0007, acc=0.9967, iter_time=7.34s]
Epoch 0: 16%|█▋ | 2017/12384 [4:17:42<22:04:46, 7.67s/it, loss=0.0003, acc=1.0000, iter_time=7.00s]
Epoch 0: 16%|█▋ | 2018/12384 [4:17:42<22:04:33, 7.67s/it, loss=0.0003, acc=1.0000, iter_time=7.00s]
Epoch 0: 16%|█▋ | 2018/12384 [4:17:50<22:04:33, 7.67s/it, loss=0.0019, acc=0.9958, iter_time=8.63s]
Epoch 0: 16%|█▋ | 2019/12384 [4:17:50<22:04:42, 7.67s/it, loss=0.0019, acc=0.9958, iter_time=8.63s]
Epoch 0: 16%|█▋ | 2019/12384 [4:17:58<22:04:42, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=7.64s]
Epoch 0: 16%|█▋ | 2020/12384 [4:17:58<22:04:45, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=7.64s]
Epoch 0: 16%|█▋ | 2020/12384 [4:18:05<22:04:45, 7.67s/it, loss=0.0004, acc=1.0000, iter_time=7.68s]
Epoch 0: 16%|█▋ | 2021/12384 [4:18:05<22:01:19, 7.65s/it, loss=0.0004, acc=1.0000, iter_time=7.68s]
Epoch 0: 16%|█▋ | 2021/12384 [4:18:13<22:01:19, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=4.76s]
Epoch 0: 16%|█▋ | 2022/12384 [4:18:13<22:01:05, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=4.76s]
Epoch 0: 16%|█▋ | 2022/12384 [4:18:21<22:01:05, 7.65s/it, loss=0.0002, acc=0.9990, iter_time=10.50s]
Epoch 0: 16%|█▋ | 2023/12384 [4:18:21<22:00:32, 7.65s/it, loss=0.0002, acc=0.9990, iter_time=10.50s]
Epoch 0: 16%|█▋ | 2023/12384 [4:18:28<22:00:32, 7.65s/it, loss=0.0016, acc=0.9940, iter_time=8.04s]
Epoch 0: 16%|█▋ | 2024/12384 [4:18:28<22:00:13, 7.65s/it, loss=0.0016, acc=0.9940, iter_time=8.04s]
Epoch 0: 16%|█▋ | 2024/12384 [4:18:36<22:00:13, 7.65s/it, loss=0.0006, acc=0.9985, iter_time=7.27s]
Epoch 0: 16%|█▋ | 2025/12384 [4:18:36<22:04:21, 7.67s/it, loss=0.0006, acc=0.9985, iter_time=7.27s]
Epoch 0: 16%|█▋ | 2025/12384 [4:18:44<22:04:21, 7.67s/it, loss=0.0017, acc=0.9965, iter_time=7.72s]
Epoch 0: 16%|█▋ | 2026/12384 [4:18:44<22:04:00, 7.67s/it, loss=0.0017, acc=0.9965, iter_time=7.72s]
Epoch 0: 16%|█▋ | 2026/12384 [4:18:51<22:04:00, 7.67s/it, loss=0.0033, acc=0.9953, iter_time=7.66s]
Epoch 0: 16%|█▋ | 2027/12384 [4:18:51<22:03:18, 7.67s/it, loss=0.0033, acc=0.9953, iter_time=7.66s]
Epoch 0: 16%|█▋ | 2027/12384 [4:18:59<22:03:18, 7.67s/it, loss=0.0007, acc=0.9979, iter_time=7.68s]
Epoch 0: 16%|█▋ | 2028/12384 [4:18:59<22:02:29, 7.66s/it, loss=0.0007, acc=0.9979, iter_time=7.68s]
Epoch 0: 16%|█▋ | 2028/12384 [4:19:07<22:02:29, 7.66s/it, loss=0.0007, acc=0.9980, iter_time=7.65s]
Epoch 0: 16%|█▋ | 2029/12384 [4:19:07<22:02:47, 7.66s/it, loss=0.0007, acc=0.9980, iter_time=7.65s]
Epoch 0: 16%|█▋ | 2029/12384 [4:19:14<22:02:47, 7.66s/it, loss=0.0022, acc=0.9895, iter_time=7.66s]
Epoch 0: 16%|█▋ | 2030/12384 [4:19:14<21:59:39, 7.65s/it, loss=0.0022, acc=0.9895, iter_time=7.66s]
Epoch 0: 16%|█▋ | 2030/12384 [4:19:22<21:59:39, 7.65s/it, loss=0.0003, acc=0.9979, iter_time=7.60s]
Epoch 0: 16%|█▋ | 2031/12384 [4:19:22<21:57:51, 7.64s/it, loss=0.0003, acc=0.9979, iter_time=7.60s]
Epoch 0: 16%|█▋ | 2031/12384 [4:19:30<21:57:51, 7.64s/it, loss=0.0012, acc=0.9958, iter_time=8.33s]
Epoch 0: 16%|█▋ | 2032/12384 [4:19:30<22:12:37, 7.72s/it, loss=0.0012, acc=0.9958, iter_time=8.33s]
Epoch 0: 16%|█▋ | 2032/12384 [4:19:38<22:12:37, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=3.68s]
Epoch 0: 16%|█▋ | 2033/12384 [4:19:38<22:26:28, 7.80s/it, loss=0.0001, acc=1.0000, iter_time=3.68s]
Epoch 0: 16%|█▋ | 2033/12384 [4:19:46<22:26:28, 7.80s/it, loss=0.0003, acc=0.9998, iter_time=9.83s]
Epoch 0: 16%|█▋ | 2034/12384 [4:19:46<22:19:54, 7.77s/it, loss=0.0003, acc=0.9998, iter_time=9.83s]
Epoch 0: 16%|█▋ | 2034/12384 [4:19:53<22:19:54, 7.77s/it, loss=0.0080, acc=0.9892, iter_time=9.38s]
Epoch 0: 16%|█▋ | 2035/12384 [4:19:53<22:12:00, 7.72s/it, loss=0.0080, acc=0.9892, iter_time=9.38s]
Epoch 0: 16%|█▋ | 2035/12384 [4:20:01<22:12:00, 7.72s/it, loss=0.0016, acc=0.9959, iter_time=7.31s]
Epoch 0: 16%|█▋ | 2036/12384 [4:20:01<22:08:40, 7.70s/it, loss=0.0016, acc=0.9959, iter_time=7.31s]
Epoch 0: 16%|█▋ | 2036/12384 [4:20:09<22:08:40, 7.70s/it, loss=0.0002, acc=1.0000, iter_time=6.52s]
Epoch 0: 16%|█▋ | 2037/12384 [4:20:09<22:07:42, 7.70s/it, loss=0.0002, acc=1.0000, iter_time=6.52s]
Epoch 0: 16%|█▋ | 2037/12384 [4:20:16<22:07:42, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=6.10s]
Epoch 0: 16%|█▋ | 2038/12384 [4:20:16<22:04:05, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=6.10s]
Epoch 0: 16%|█▋ | 2038/12384 [4:20:24<22:04:05, 7.68s/it, loss=0.0006, acc=0.9980, iter_time=10.83s]
Epoch 0: 16%|█▋ | 2039/12384 [4:20:24<22:09:00, 7.71s/it, loss=0.0006, acc=0.9980, iter_time=10.83s]
Epoch 0: 16%|█▋ | 2039/12384 [4:20:32<22:09:00, 7.71s/it, loss=0.0002, acc=1.0000, iter_time=7.99s]
Epoch 0: 16%|█▋ | 2040/12384 [4:20:32<22:03:05, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=7.99s]
Epoch 0: 16%|█▋ | 2040/12384 [4:20:39<22:03:05, 7.67s/it, loss=0.0014, acc=0.9969, iter_time=7.20s]
Epoch 0: 16%|█▋ | 2041/12384 [4:20:39<22:01:32, 7.67s/it, loss=0.0014, acc=0.9969, iter_time=7.20s]
Epoch 0: 16%|█▋ | 2041/12384 [4:20:47<22:01:32, 7.67s/it, loss=0.0009, acc=0.9990, iter_time=6.79s]
Epoch 0: 16%|█▋ | 2042/12384 [4:20:47<21:59:26, 7.65s/it, loss=0.0009, acc=0.9990, iter_time=6.79s]
Epoch 0: 16%|█▋ | 2042/12384 [4:20:54<21:59:26, 7.65s/it, loss=0.0007, acc=0.9980, iter_time=8.49s]
Epoch 0: 16%|█▋ | 2043/12384 [4:20:54<21:56:41, 7.64s/it, loss=0.0007, acc=0.9980, iter_time=8.49s]
Epoch 0: 16%|█▋ | 2043/12384 [4:21:02<21:56:41, 7.64s/it, loss=0.0015, acc=0.9952, iter_time=7.59s]
Epoch 0: 17%|█▋ | 2044/12384 [4:21:02<21:55:31, 7.63s/it, loss=0.0015, acc=0.9952, iter_time=7.59s]
Epoch 0: 17%|█▋ | 2044/12384 [4:21:10<21:55:31, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.34s]
Epoch 0: 17%|█▋ | 2045/12384 [4:21:10<21:57:28, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=7.34s]
Epoch 0: 17%|█▋ | 2045/12384 [4:21:17<21:57:28, 7.65s/it, loss=0.0004, acc=0.9998, iter_time=5.98s]
Epoch 0: 17%|█▋ | 2046/12384 [4:21:17<21:55:06, 7.63s/it, loss=0.0004, acc=0.9998, iter_time=5.98s]
Epoch 0: 17%|█▋ | 2046/12384 [4:21:25<21:55:06, 7.63s/it, loss=0.0002, acc=0.9986, iter_time=9.59s]
Epoch 0: 17%|█▋ | 2047/12384 [4:21:25<21:55:26, 7.64s/it, loss=0.0002, acc=0.9986, iter_time=9.59s]
Epoch 0: 17%|█▋ | 2047/12384 [4:21:33<21:55:26, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.02s]
Epoch 0: 17%|█▋ | 2048/12384 [4:21:33<21:53:39, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.02s]
Epoch 0: 17%|█▋ | 2048/12384 [4:21:40<21:53:39, 7.63s/it, loss=0.0020, acc=0.9946, iter_time=7.24s]
Epoch 0: 17%|█▋ | 2049/12384 [4:21:40<21:55:14, 7.64s/it, loss=0.0020, acc=0.9946, iter_time=7.24s]
Epoch 0: 17%|█▋ | 2049/12384 [4:21:48<21:55:14, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.11s]
Epoch 0: 17%|█▋ | 2050/12384 [4:21:48<21:57:11, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.11s]
Epoch 0: 17%|█▋ | 2050/12384 [4:21:56<21:57:11, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 0: 17%|█▋ | 2051/12384 [4:21:56<21:56:52, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.21s]
Epoch 0: 17%|█▋ | 2051/12384 [4:22:03<21:56:52, 7.65s/it, loss=0.0006, acc=0.9985, iter_time=7.75s]
Epoch 0: 17%|█▋ | 2052/12384 [4:22:03<22:06:01, 7.70s/it, loss=0.0006, acc=0.9985, iter_time=7.75s]
Epoch 0: 17%|█▋ | 2052/12384 [4:22:11<22:06:01, 7.70s/it, loss=0.0001, acc=0.9995, iter_time=7.75s]
Epoch 0: 17%|█▋ | 2053/12384 [4:22:11<22:05:49, 7.70s/it, loss=0.0001, acc=0.9995, iter_time=7.75s]
Epoch 0: 17%|█▋ | 2053/12384 [4:22:19<22:05:49, 7.70s/it, loss=0.0018, acc=0.9981, iter_time=7.70s]
Epoch 0: 17%|█▋ | 2054/12384 [4:22:19<22:03:20, 7.69s/it, loss=0.0018, acc=0.9981, iter_time=7.70s]
Epoch 0: 17%|█▋ | 2054/12384 [4:22:26<22:03:20, 7.69s/it, loss=0.0010, acc=0.9964, iter_time=4.82s]
Epoch 0: 17%|█▋ | 2055/12384 [4:22:26<22:01:18, 7.68s/it, loss=0.0010, acc=0.9964, iter_time=4.82s]
Epoch 0: 17%|█▋ | 2055/12384 [4:22:34<22:01:18, 7.68s/it, loss=0.0008, acc=0.9981, iter_time=10.84s]
Epoch 0: 17%|█▋ | 2056/12384 [4:22:34<21:57:53, 7.66s/it, loss=0.0008, acc=0.9981, iter_time=10.84s]
Epoch 0: 17%|█▋ | 2056/12384 [4:22:42<21:57:53, 7.66s/it, loss=0.0001, acc=0.9999, iter_time=7.22s]
Epoch 0: 17%|█▋ | 2057/12384 [4:22:42<21:55:39, 7.64s/it, loss=0.0001, acc=0.9999, iter_time=7.22s]
Epoch 0: 17%|█▋ | 2057/12384 [4:22:49<21:55:39, 7.64s/it, loss=0.0003, acc=0.9999, iter_time=7.61s]
Epoch 0: 17%|█▋ | 2058/12384 [4:22:49<21:54:56, 7.64s/it, loss=0.0003, acc=0.9999, iter_time=7.61s]
Epoch 0: 17%|█▋ | 2058/12384 [4:22:57<21:54:56, 7.64s/it, loss=0.0124, acc=0.9792, iter_time=7.95s]
Epoch 0: 17%|█▋ | 2059/12384 [4:22:57<22:13:56, 7.75s/it, loss=0.0124, acc=0.9792, iter_time=7.95s]
Epoch 0: 17%|█▋ | 2059/12384 [4:23:05<22:13:56, 7.75s/it, loss=0.0002, acc=1.0000, iter_time=6.21s]
Epoch 0: 17%|█▋ | 2060/12384 [4:23:05<22:06:13, 7.71s/it, loss=0.0002, acc=1.0000, iter_time=6.21s]
Epoch 0: 17%|█▋ | 2060/12384 [4:23:12<22:06:13, 7.71s/it, loss=0.0168, acc=0.9786, iter_time=9.10s]
Epoch 0: 17%|█▋ | 2061/12384 [4:23:12<22:02:27, 7.69s/it, loss=0.0168, acc=0.9786, iter_time=9.10s]
Epoch 0: 17%|█▋ | 2061/12384 [4:23:20<22:02:27, 7.69s/it, loss=0.0002, acc=1.0000, iter_time=7.66s]
Epoch 0: 17%|█▋ | 2062/12384 [4:23:20<22:00:58, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=7.66s]
Epoch 0: 17%|█▋ | 2062/12384 [4:23:28<22:00:58, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 17%|█▋ | 2063/12384 [4:23:28<21:57:34, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 17%|█▋ | 2063/12384 [4:23:35<21:57:34, 7.66s/it, loss=0.0004, acc=0.9998, iter_time=7.99s]
Epoch 0: 17%|█▋ | 2064/12384 [4:23:35<21:59:06, 7.67s/it, loss=0.0004, acc=0.9998, iter_time=7.99s]
Epoch 0: 17%|█▋ | 2064/12384 [4:23:43<21:59:06, 7.67s/it, loss=0.0017, acc=0.9990, iter_time=7.31s]
Epoch 0: 17%|█▋ | 2065/12384 [4:23:43<21:56:02, 7.65s/it, loss=0.0017, acc=0.9990, iter_time=7.31s]
Epoch 0: 17%|█▋ | 2065/12384 [4:23:51<21:56:02, 7.65s/it, loss=0.0009, acc=0.9958, iter_time=7.63s]
Epoch 0: 17%|█▋ | 2066/12384 [4:23:51<21:55:53, 7.65s/it, loss=0.0009, acc=0.9958, iter_time=7.63s]
Epoch 0: 17%|█▋ | 2066/12384 [4:23:58<21:55:53, 7.65s/it, loss=0.0006, acc=0.9994, iter_time=7.64s]
Epoch 0: 17%|█▋ | 2067/12384 [4:23:58<21:54:21, 7.64s/it, loss=0.0006, acc=0.9994, iter_time=7.64s]
Epoch 0: 17%|█▋ | 2067/12384 [4:24:06<21:54:21, 7.64s/it, loss=0.0020, acc=0.9943, iter_time=7.63s]
Epoch 0: 17%|█▋ | 2068/12384 [4:24:06<21:52:42, 7.63s/it, loss=0.0020, acc=0.9943, iter_time=7.63s]
Epoch 0: 17%|█▋ | 2068/12384 [4:24:14<21:52:42, 7.63s/it, loss=0.0008, acc=0.9972, iter_time=7.61s]
Epoch 0: 17%|█▋ | 2069/12384 [4:24:14<21:52:45, 7.64s/it, loss=0.0008, acc=0.9972, iter_time=7.61s]
Epoch 0: 17%|█▋ | 2069/12384 [4:24:21<21:52:45, 7.64s/it, loss=0.0008, acc=0.9986, iter_time=7.66s]
Epoch 0: 17%|█▋ | 2070/12384 [4:24:21<21:52:55, 7.64s/it, loss=0.0008, acc=0.9986, iter_time=7.66s]
Epoch 0: 17%|█▋ | 2070/12384 [4:24:29<21:52:55, 7.64s/it, loss=0.0005, acc=0.9963, iter_time=6.70s]
Epoch 0: 17%|█▋ | 2071/12384 [4:24:29<21:52:46, 7.64s/it, loss=0.0005, acc=0.9963, iter_time=6.70s]
Epoch 0: 17%|█▋ | 2071/12384 [4:24:36<21:52:46, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.95s]
Epoch 0: 17%|█▋ | 2072/12384 [4:24:36<21:51:37, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.95s]
Epoch 0: 17%|█▋ | 2072/12384 [4:24:44<21:51:37, 7.63s/it, loss=0.0007, acc=0.9979, iter_time=7.24s]
Epoch 0: 17%|█▋ | 2073/12384 [4:24:44<21:52:08, 7.64s/it, loss=0.0007, acc=0.9979, iter_time=7.24s]
Epoch 0: 17%|█▋ | 2073/12384 [4:24:52<21:52:08, 7.64s/it, loss=0.0004, acc=1.0000, iter_time=7.63s]
Epoch 0: 17%|█▋ | 2074/12384 [4:24:52<21:50:30, 7.63s/it, loss=0.0004, acc=1.0000, iter_time=7.63s]
Epoch 0: 17%|█▋ | 2074/12384 [4:24:59<21:50:30, 7.63s/it, loss=0.0010, acc=0.9999, iter_time=7.62s]
Epoch 0: 17%|█▋ | 2075/12384 [4:24:59<21:50:29, 7.63s/it, loss=0.0010, acc=0.9999, iter_time=7.62s]
Epoch 0: 17%|█▋ | 2075/12384 [4:25:07<21:50:29, 7.63s/it, loss=0.0004, acc=1.0000, iter_time=7.63s]
Epoch 0: 17%|█▋ | 2076/12384 [4:25:07<21:49:31, 7.62s/it, loss=0.0004, acc=1.0000, iter_time=7.63s]
Epoch 0: 17%|█▋ | 2076/12384 [4:25:15<21:49:31, 7.62s/it, loss=0.0005, acc=0.9984, iter_time=7.64s]
Epoch 0: 17%|█▋ | 2077/12384 [4:25:15<21:50:56, 7.63s/it, loss=0.0005, acc=0.9984, iter_time=7.64s]
Epoch 0: 17%|█▋ | 2077/12384 [4:25:22<21:50:56, 7.63s/it, loss=0.0011, acc=0.9990, iter_time=7.62s]
Epoch 0: 17%|█▋ | 2078/12384 [4:25:22<21:49:58, 7.63s/it, loss=0.0011, acc=0.9990, iter_time=7.62s]
Epoch 0: 17%|█▋ | 2078/12384 [4:25:30<21:49:58, 7.63s/it, loss=0.0018, acc=0.9956, iter_time=7.63s]
Epoch 0: 17%|█▋ | 2079/12384 [4:25:30<21:52:03, 7.64s/it, loss=0.0018, acc=0.9956, iter_time=7.63s]
Epoch 0: 17%|█▋ | 2079/12384 [4:25:37<21:52:03, 7.64s/it, loss=0.0004, acc=1.0000, iter_time=8.04s]
Epoch 0: 17%|█▋ | 2080/12384 [4:25:37<21:50:24, 7.63s/it, loss=0.0004, acc=1.0000, iter_time=8.04s]
Epoch 0: 17%|█▋ | 2080/12384 [4:25:45<21:50:24, 7.63s/it, loss=0.0006, acc=0.9966, iter_time=7.21s]
Epoch 0: 17%|█▋ | 2081/12384 [4:25:45<21:54:14, 7.65s/it, loss=0.0006, acc=0.9966, iter_time=7.21s]
Epoch 0: 17%|█▋ | 2081/12384 [4:25:53<21:54:14, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=6.17s]
Epoch 0: 17%|█▋ | 2082/12384 [4:25:53<21:52:49, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=6.17s]
Epoch 0: 17%|█▋ | 2082/12384 [4:26:00<21:52:49, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=9.15s]
Epoch 0: 17%|█▋ | 2083/12384 [4:26:00<21:53:07, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=9.15s]
Epoch 0: 17%|█▋ | 2083/12384 [4:26:08<21:53:07, 7.65s/it, loss=0.0006, acc=0.9991, iter_time=7.68s]
Epoch 0: 17%|█▋ | 2084/12384 [4:26:08<21:53:54, 7.65s/it, loss=0.0006, acc=0.9991, iter_time=7.68s]
Epoch 0: 17%|█▋ | 2084/12384 [4:26:16<21:53:54, 7.65s/it, loss=0.0054, acc=0.9774, iter_time=6.48s]
Epoch 0: 17%|█▋ | 2085/12384 [4:26:16<22:10:00, 7.75s/it, loss=0.0054, acc=0.9774, iter_time=6.48s]
Epoch 0: 17%|█▋ | 2085/12384 [4:26:24<22:10:00, 7.75s/it, loss=0.0002, acc=0.9998, iter_time=8.55s]
Epoch 0: 17%|█▋ | 2086/12384 [4:26:24<22:01:45, 7.70s/it, loss=0.0002, acc=0.9998, iter_time=8.55s]
Epoch 0: 17%|█▋ | 2086/12384 [4:26:31<22:01:45, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=8.18s]
Epoch 0: 17%|█▋ | 2087/12384 [4:26:31<21:59:05, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=8.18s]
Epoch 0: 17%|█▋ | 2087/12384 [4:26:39<21:59:05, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 0: 17%|█▋ | 2088/12384 [4:26:39<21:57:50, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 0: 17%|█▋ | 2088/12384 [4:26:47<21:57:50, 7.68s/it, loss=0.0004, acc=0.9984, iter_time=7.05s]
Epoch 0: 17%|█▋ | 2089/12384 [4:26:47<21:55:16, 7.67s/it, loss=0.0004, acc=0.9984, iter_time=7.05s]
Epoch 0: 17%|█▋ | 2089/12384 [4:26:54<21:55:16, 7.67s/it, loss=0.0004, acc=0.9984, iter_time=8.25s]
Epoch 0: 17%|█▋ | 2090/12384 [4:26:54<21:54:53, 7.66s/it, loss=0.0004, acc=0.9984, iter_time=8.25s]
Epoch 0: 17%|█▋ | 2090/12384 [4:27:02<21:54:53, 7.66s/it, loss=0.0007, acc=0.9988, iter_time=4.59s]
Epoch 0: 17%|█▋ | 2091/12384 [4:27:02<21:52:36, 7.65s/it, loss=0.0007, acc=0.9988, iter_time=4.59s]
Epoch 0: 17%|█▋ | 2091/12384 [4:27:10<21:52:36, 7.65s/it, loss=0.0008, acc=0.9981, iter_time=7.64s]
Epoch 0: 17%|█▋ | 2092/12384 [4:27:10<21:54:39, 7.66s/it, loss=0.0008, acc=0.9981, iter_time=7.64s]
Epoch 0: 17%|█▋ | 2092/12384 [4:27:17<21:54:39, 7.66s/it, loss=0.0010, acc=0.9992, iter_time=10.51s]
Epoch 0: 17%|█▋ | 2093/12384 [4:27:17<21:53:19, 7.66s/it, loss=0.0010, acc=0.9992, iter_time=10.51s]
Epoch 0: 17%|█▋ | 2093/12384 [4:27:25<21:53:19, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.86s]
Epoch 0: 17%|█▋ | 2094/12384 [4:27:25<21:50:49, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.86s]
Epoch 0: 17%|█▋ | 2094/12384 [4:27:33<21:50:49, 7.64s/it, loss=0.0001, acc=0.9998, iter_time=5.83s]
Epoch 0: 17%|█▋ | 2095/12384 [4:27:33<21:51:15, 7.65s/it, loss=0.0001, acc=0.9998, iter_time=5.83s]
Epoch 0: 17%|█▋ | 2095/12384 [4:27:40<21:51:15, 7.65s/it, loss=0.0012, acc=0.9955, iter_time=9.43s]
Epoch 0: 17%|█▋ | 2096/12384 [4:27:40<21:51:13, 7.65s/it, loss=0.0012, acc=0.9955, iter_time=9.43s]
Epoch 0: 17%|█▋ | 2096/12384 [4:27:48<21:51:13, 7.65s/it, loss=0.0053, acc=0.9871, iter_time=7.65s]
Epoch 0: 17%|█▋ | 2097/12384 [4:27:48<21:48:55, 7.63s/it, loss=0.0053, acc=0.9871, iter_time=7.65s]
Epoch 0: 17%|█▋ | 2097/12384 [4:27:55<21:48:55, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.01s]
Epoch 0: 17%|█▋ | 2098/12384 [4:27:55<21:49:28, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=5.01s]
Epoch 0: 17%|█▋ | 2098/12384 [4:28:03<21:49:28, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=10.26s]
Epoch 0: 17%|█▋ | 2099/12384 [4:28:03<21:48:05, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=10.26s]
Epoch 0: 17%|█▋ | 2099/12384 [4:28:11<21:48:05, 7.63s/it, loss=0.0025, acc=0.9951, iter_time=8.00s]
Epoch 0: 17%|█▋ | 2100/12384 [4:28:11<21:46:24, 7.62s/it, loss=0.0025, acc=0.9951, iter_time=8.00s]
Epoch 0: 17%|█▋ | 2100/12384 [4:28:18<21:46:24, 7.62s/it, loss=0.0016, acc=0.9949, iter_time=7.22s]
Epoch 0: 17%|█▋ | 2101/12384 [4:28:18<21:47:21, 7.63s/it, loss=0.0016, acc=0.9949, iter_time=7.22s]
Epoch 0: 17%|█▋ | 2101/12384 [4:28:26<21:47:21, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 17%|█▋ | 2102/12384 [4:28:26<21:47:15, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 17%|█▋ | 2102/12384 [4:28:34<21:47:15, 7.63s/it, loss=0.0004, acc=0.9988, iter_time=7.62s]
Epoch 0: 17%|█▋ | 2103/12384 [4:28:34<21:47:19, 7.63s/it, loss=0.0004, acc=0.9988, iter_time=7.62s]
Epoch 0: 17%|█▋ | 2103/12384 [4:28:41<21:47:19, 7.63s/it, loss=0.0020, acc=0.9977, iter_time=7.62s]
Epoch 0: 17%|█▋ | 2104/12384 [4:28:41<21:48:25, 7.64s/it, loss=0.0020, acc=0.9977, iter_time=7.62s]
Epoch 0: 17%|█▋ | 2104/12384 [4:28:49<21:48:25, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.01s]
Epoch 0: 17%|█▋ | 2105/12384 [4:28:49<21:46:15, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.01s]
Epoch 0: 17%|█▋ | 2105/12384 [4:28:56<21:46:15, 7.62s/it, loss=0.0004, acc=0.9997, iter_time=8.24s]
Epoch 0: 17%|█▋ | 2106/12384 [4:28:56<21:45:51, 7.62s/it, loss=0.0004, acc=0.9997, iter_time=8.24s]
Epoch 0: 17%|█▋ | 2106/12384 [4:29:04<21:45:51, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 17%|█▋ | 2107/12384 [4:29:04<21:46:43, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 17%|█▋ | 2107/12384 [4:29:12<21:46:43, 7.63s/it, loss=0.0007, acc=0.9978, iter_time=7.67s]
Epoch 0: 17%|█▋ | 2108/12384 [4:29:12<21:48:01, 7.64s/it, loss=0.0007, acc=0.9978, iter_time=7.67s]
Epoch 0: 17%|█▋ | 2108/12384 [4:29:19<21:48:01, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.39s]
Epoch 0: 17%|█▋ | 2109/12384 [4:29:19<21:49:49, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.39s]
Epoch 0: 17%|█▋ | 2109/12384 [4:29:27<21:49:49, 7.65s/it, loss=0.0010, acc=0.9992, iter_time=6.73s]
Epoch 0: 17%|█▋ | 2110/12384 [4:29:27<21:47:58, 7.64s/it, loss=0.0010, acc=0.9992, iter_time=6.73s]
Epoch 0: 17%|█▋ | 2110/12384 [4:29:35<21:47:58, 7.64s/it, loss=0.0007, acc=0.9998, iter_time=6.99s]
Epoch 0: 17%|█▋ | 2111/12384 [4:29:35<21:46:22, 7.63s/it, loss=0.0007, acc=0.9998, iter_time=6.99s]
Epoch 0: 17%|█▋ | 2111/12384 [4:29:43<21:46:22, 7.63s/it, loss=0.0005, acc=0.9983, iter_time=9.87s]
Epoch 0: 17%|█▋ | 2112/12384 [4:29:43<22:04:32, 7.74s/it, loss=0.0005, acc=0.9983, iter_time=9.87s]
Epoch 0: 17%|█▋ | 2112/12384 [4:29:50<22:04:32, 7.74s/it, loss=0.0002, acc=1.0000, iter_time=7.53s]
Epoch 0: 17%|█▋ | 2113/12384 [4:29:50<21:58:25, 7.70s/it, loss=0.0002, acc=1.0000, iter_time=7.53s]
Epoch 0: 17%|█▋ | 2113/12384 [4:29:58<21:58:25, 7.70s/it, loss=0.0001, acc=0.9999, iter_time=7.65s]
Epoch 0: 17%|█▋ | 2114/12384 [4:29:58<21:56:59, 7.69s/it, loss=0.0001, acc=0.9999, iter_time=7.65s]
Epoch 0: 17%|█▋ | 2114/12384 [4:30:06<21:56:59, 7.69s/it, loss=0.0002, acc=0.9983, iter_time=7.46s]
Epoch 0: 17%|█▋ | 2115/12384 [4:30:06<21:54:41, 7.68s/it, loss=0.0002, acc=0.9983, iter_time=7.46s]
Epoch 0: 17%|█▋ | 2115/12384 [4:30:13<21:54:41, 7.68s/it, loss=0.0002, acc=0.9999, iter_time=7.96s]
Epoch 0: 17%|█▋ | 2116/12384 [4:30:13<21:55:33, 7.69s/it, loss=0.0002, acc=0.9999, iter_time=7.96s]
Epoch 0: 17%|█▋ | 2116/12384 [4:30:21<21:55:33, 7.69s/it, loss=0.0005, acc=0.9994, iter_time=5.71s]
Epoch 0: 17%|█▋ | 2117/12384 [4:30:21<21:52:44, 7.67s/it, loss=0.0005, acc=0.9994, iter_time=5.71s]
Epoch 0: 17%|█▋ | 2117/12384 [4:30:29<21:52:44, 7.67s/it, loss=0.0022, acc=0.9939, iter_time=9.58s]
Epoch 0: 17%|█▋ | 2118/12384 [4:30:29<21:51:47, 7.67s/it, loss=0.0022, acc=0.9939, iter_time=9.58s]
Epoch 0: 17%|█▋ | 2118/12384 [4:30:36<21:51:47, 7.67s/it, loss=0.0004, acc=0.9987, iter_time=5.66s]
Epoch 0: 17%|█▋ | 2119/12384 [4:30:36<21:49:33, 7.65s/it, loss=0.0004, acc=0.9987, iter_time=5.66s]
Epoch 0: 17%|█▋ | 2119/12384 [4:30:44<21:49:33, 7.65s/it, loss=0.0003, acc=0.9986, iter_time=9.53s]
Epoch 0: 17%|█▋ | 2120/12384 [4:30:44<21:47:46, 7.64s/it, loss=0.0003, acc=0.9986, iter_time=9.53s]
Epoch 0: 17%|█▋ | 2120/12384 [4:30:52<21:47:46, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.77s]
Epoch 0: 17%|█▋ | 2121/12384 [4:30:52<21:50:59, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.77s]
Epoch 0: 17%|█▋ | 2121/12384 [4:30:59<21:50:59, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 17%|█▋ | 2122/12384 [4:30:59<21:48:18, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.60s]
Epoch 0: 17%|█▋ | 2122/12384 [4:31:07<21:48:18, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 17%|█▋ | 2123/12384 [4:31:07<21:47:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 17%|█▋ | 2123/12384 [4:31:14<21:47:19, 7.64s/it, loss=0.0005, acc=0.9995, iter_time=5.65s]
Epoch 0: 17%|█▋ | 2124/12384 [4:31:14<21:46:57, 7.64s/it, loss=0.0005, acc=0.9995, iter_time=5.65s]
Epoch 0: 17%|█▋ | 2124/12384 [4:31:22<21:46:57, 7.64s/it, loss=0.0008, acc=0.9982, iter_time=9.69s]
Epoch 0: 17%|█▋ | 2125/12384 [4:31:22<21:47:46, 7.65s/it, loss=0.0008, acc=0.9982, iter_time=9.69s]
Epoch 0: 17%|█▋ | 2125/12384 [4:31:30<21:47:46, 7.65s/it, loss=0.0004, acc=0.9972, iter_time=7.69s]
Epoch 0: 17%|█▋ | 2126/12384 [4:31:30<21:50:25, 7.66s/it, loss=0.0004, acc=0.9972, iter_time=7.69s]
Epoch 0: 17%|█▋ | 2126/12384 [4:31:37<21:50:25, 7.66s/it, loss=0.0022, acc=0.9934, iter_time=7.72s]
Epoch 0: 17%|█▋ | 2127/12384 [4:31:37<21:50:50, 7.67s/it, loss=0.0022, acc=0.9934, iter_time=7.72s]
Epoch 0: 17%|█▋ | 2127/12384 [4:31:45<21:50:50, 7.67s/it, loss=0.0006, acc=0.9980, iter_time=8.14s]
Epoch 0: 17%|█▋ | 2128/12384 [4:31:45<21:56:56, 7.70s/it, loss=0.0006, acc=0.9980, iter_time=8.14s]
Epoch 0: 17%|█▋ | 2128/12384 [4:31:53<21:56:56, 7.70s/it, loss=0.0002, acc=1.0000, iter_time=7.32s]
Epoch 0: 17%|█▋ | 2129/12384 [4:31:53<21:57:06, 7.71s/it, loss=0.0002, acc=1.0000, iter_time=7.32s]
Epoch 0: 17%|█▋ | 2129/12384 [4:32:01<21:57:06, 7.71s/it, loss=0.0002, acc=1.0000, iter_time=7.72s]
Epoch 0: 17%|█▋ | 2130/12384 [4:32:01<21:57:19, 7.71s/it, loss=0.0002, acc=1.0000, iter_time=7.72s]
Epoch 0: 17%|█▋ | 2130/12384 [4:32:08<21:57:19, 7.71s/it, loss=0.0002, acc=1.0000, iter_time=7.73s]
Epoch 0: 17%|█▋ | 2131/12384 [4:32:08<21:58:32, 7.72s/it, loss=0.0002, acc=1.0000, iter_time=7.73s]
Epoch 0: 17%|█▋ | 2131/12384 [4:32:16<21:58:32, 7.72s/it, loss=0.0020, acc=0.9962, iter_time=7.69s]
Epoch 0: 17%|█▋ | 2132/12384 [4:32:16<21:56:54, 7.71s/it, loss=0.0020, acc=0.9962, iter_time=7.69s]
Epoch 0: 17%|█▋ | 2132/12384 [4:32:24<21:56:54, 7.71s/it, loss=0.0003, acc=0.9997, iter_time=7.72s]
Epoch 0: 17%|█▋ | 2133/12384 [4:32:24<21:57:27, 7.71s/it, loss=0.0003, acc=0.9997, iter_time=7.72s]
Epoch 0: 17%|█▋ | 2133/12384 [4:32:31<21:57:27, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=6.48s]
Epoch 0: 17%|█▋ | 2134/12384 [4:32:31<21:54:34, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=6.48s]
Epoch 0: 17%|█▋ | 2134/12384 [4:32:39<21:54:34, 7.70s/it, loss=0.0013, acc=0.9968, iter_time=8.85s]
Epoch 0: 17%|█▋ | 2135/12384 [4:32:39<21:53:44, 7.69s/it, loss=0.0013, acc=0.9968, iter_time=8.85s]
Epoch 0: 17%|█▋ | 2135/12384 [4:32:47<21:53:44, 7.69s/it, loss=0.0007, acc=0.9997, iter_time=7.56s]
Epoch 0: 17%|█▋ | 2136/12384 [4:32:47<21:49:32, 7.67s/it, loss=0.0007, acc=0.9997, iter_time=7.56s]
Epoch 0: 17%|█▋ | 2136/12384 [4:32:54<21:49:32, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=5.86s]
Epoch 0: 17%|█▋ | 2137/12384 [4:32:54<21:47:18, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=5.86s]
Epoch 0: 17%|█▋ | 2137/12384 [4:33:02<21:47:18, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=9.75s]
Epoch 0: 17%|█▋ | 2138/12384 [4:33:02<22:05:33, 7.76s/it, loss=0.0002, acc=1.0000, iter_time=9.75s]
Epoch 0: 17%|█▋ | 2138/12384 [4:33:10<22:05:33, 7.76s/it, loss=0.0002, acc=0.9996, iter_time=4.08s]
Epoch 0: 17%|█▋ | 2139/12384 [4:33:10<22:00:06, 7.73s/it, loss=0.0002, acc=0.9996, iter_time=4.08s]
Epoch 0: 17%|█▋ | 2139/12384 [4:33:18<22:00:06, 7.73s/it, loss=0.0002, acc=1.0000, iter_time=11.35s]
Epoch 0: 17%|█▋ | 2140/12384 [4:33:18<21:57:12, 7.72s/it, loss=0.0002, acc=1.0000, iter_time=11.35s]
Epoch 0: 17%|█▋ | 2140/12384 [4:33:25<21:57:12, 7.72s/it, loss=0.0003, acc=0.9999, iter_time=7.74s]
Epoch 0: 17%|█▋ | 2141/12384 [4:33:25<21:58:41, 7.72s/it, loss=0.0003, acc=0.9999, iter_time=7.74s]
Epoch 0: 17%|█▋ | 2141/12384 [4:33:33<21:58:41, 7.72s/it, loss=0.0023, acc=0.9967, iter_time=7.72s]
Epoch 0: 17%|█▋ | 2142/12384 [4:33:33<21:58:18, 7.72s/it, loss=0.0023, acc=0.9967, iter_time=7.72s]
Epoch 0: 17%|█▋ | 2142/12384 [4:33:41<21:58:18, 7.72s/it, loss=0.0001, acc=0.9998, iter_time=4.81s]
Epoch 0: 17%|█▋ | 2143/12384 [4:33:41<21:53:26, 7.70s/it, loss=0.0001, acc=0.9998, iter_time=4.81s]
Epoch 0: 17%|█▋ | 2143/12384 [4:33:49<21:53:26, 7.70s/it, loss=0.0003, acc=0.9989, iter_time=10.90s]
Epoch 0: 17%|█▋ | 2144/12384 [4:33:49<21:53:16, 7.69s/it, loss=0.0003, acc=0.9989, iter_time=10.90s]
Epoch 0: 17%|█▋ | 2144/12384 [4:33:56<21:53:16, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=4.18s]
Epoch 0: 17%|█▋ | 2145/12384 [4:33:56<21:48:31, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=4.18s]
Epoch 0: 17%|█▋ | 2145/12384 [4:34:04<21:48:31, 7.67s/it, loss=0.0027, acc=0.9913, iter_time=10.71s]
Epoch 0: 17%|█▋ | 2146/12384 [4:34:04<21:48:30, 7.67s/it, loss=0.0027, acc=0.9913, iter_time=10.71s]
Epoch 0: 17%|█▋ | 2146/12384 [4:34:11<21:48:30, 7.67s/it, loss=0.0004, acc=0.9996, iter_time=7.61s]
Epoch 0: 17%|█▋ | 2147/12384 [4:34:11<21:45:39, 7.65s/it, loss=0.0004, acc=0.9996, iter_time=7.61s]
Epoch 0: 17%|█▋ | 2147/12384 [4:34:19<21:45:39, 7.65s/it, loss=0.0005, acc=0.9993, iter_time=7.61s]
Epoch 0: 17%|█▋ | 2148/12384 [4:34:19<21:43:07, 7.64s/it, loss=0.0005, acc=0.9993, iter_time=7.61s]
Epoch 0: 17%|█▋ | 2148/12384 [4:34:27<21:43:07, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.58s]
Epoch 0: 17%|█▋ | 2149/12384 [4:34:27<21:42:26, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.58s]
Epoch 0: 17%|█▋ | 2149/12384 [4:34:34<21:42:26, 7.64s/it, loss=0.0005, acc=0.9998, iter_time=8.09s]
Epoch 0: 17%|█▋ | 2150/12384 [4:34:34<21:43:07, 7.64s/it, loss=0.0005, acc=0.9998, iter_time=8.09s]
Epoch 0: 17%|█▋ | 2150/12384 [4:34:42<21:43:07, 7.64s/it, loss=0.0004, acc=0.9994, iter_time=7.21s]
Epoch 0: 17%|█▋ | 2151/12384 [4:34:42<21:42:54, 7.64s/it, loss=0.0004, acc=0.9994, iter_time=7.21s]
Epoch 0: 17%|█▋ | 2151/12384 [4:34:50<21:42:54, 7.64s/it, loss=0.0005, acc=0.9976, iter_time=7.60s]
Epoch 0: 17%|█▋ | 2152/12384 [4:34:50<21:41:46, 7.63s/it, loss=0.0005, acc=0.9976, iter_time=7.60s]
Epoch 0: 17%|█▋ | 2152/12384 [4:34:57<21:41:46, 7.63s/it, loss=0.0013, acc=0.9983, iter_time=7.65s]
Epoch 0: 17%|█▋ | 2153/12384 [4:34:57<21:41:52, 7.63s/it, loss=0.0013, acc=0.9983, iter_time=7.65s]
Epoch 0: 17%|█▋ | 2153/12384 [4:35:05<21:41:52, 7.63s/it, loss=0.0007, acc=0.9977, iter_time=6.48s]
Epoch 0: 17%|█▋ | 2154/12384 [4:35:05<21:41:19, 7.63s/it, loss=0.0007, acc=0.9977, iter_time=6.48s]
Epoch 0: 17%|█▋ | 2154/12384 [4:35:12<21:41:19, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=6.78s]
Epoch 0: 17%|█▋ | 2155/12384 [4:35:12<21:40:52, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=6.78s]
Epoch 0: 17%|█▋ | 2155/12384 [4:35:20<21:40:52, 7.63s/it, loss=0.0007, acc=0.9982, iter_time=9.82s]
Epoch 0: 17%|█▋ | 2156/12384 [4:35:20<21:48:46, 7.68s/it, loss=0.0007, acc=0.9982, iter_time=9.82s]
Epoch 0: 17%|█▋ | 2156/12384 [4:35:28<21:48:46, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.70s]
Epoch 0: 17%|█▋ | 2157/12384 [4:35:28<21:50:02, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.70s]
Epoch 0: 17%|█▋ | 2157/12384 [4:35:36<21:50:02, 7.69s/it, loss=0.0007, acc=0.9963, iter_time=7.71s]
Epoch 0: 17%|█▋ | 2158/12384 [4:35:36<21:50:40, 7.69s/it, loss=0.0007, acc=0.9963, iter_time=7.71s]
Epoch 0: 17%|█▋ | 2158/12384 [4:35:43<21:50:40, 7.69s/it, loss=0.0032, acc=0.9922, iter_time=7.67s]
Epoch 0: 17%|█▋ | 2159/12384 [4:35:43<21:49:26, 7.68s/it, loss=0.0032, acc=0.9922, iter_time=7.67s]
Epoch 0: 17%|█▋ | 2159/12384 [4:35:51<21:49:26, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=8.17s]
Epoch 0: 17%|█▋ | 2160/12384 [4:35:51<21:54:20, 7.71s/it, loss=0.0002, acc=1.0000, iter_time=8.17s]
Epoch 0: 17%|█▋ | 2160/12384 [4:35:59<21:54:20, 7.71s/it, loss=0.0006, acc=0.9963, iter_time=7.34s]
Epoch 0: 17%|█▋ | 2161/12384 [4:35:59<21:55:04, 7.72s/it, loss=0.0006, acc=0.9963, iter_time=7.34s]
Epoch 0: 17%|█▋ | 2161/12384 [4:36:07<21:55:04, 7.72s/it, loss=0.0006, acc=0.9978, iter_time=7.71s]
Epoch 0: 17%|█▋ | 2162/12384 [4:36:07<21:54:00, 7.71s/it, loss=0.0006, acc=0.9978, iter_time=7.71s]
Epoch 0: 17%|█▋ | 2162/12384 [4:36:14<21:54:00, 7.71s/it, loss=0.0021, acc=0.9954, iter_time=6.98s]
Epoch 0: 17%|█▋ | 2163/12384 [4:36:14<21:55:18, 7.72s/it, loss=0.0021, acc=0.9954, iter_time=6.98s]
Epoch 0: 17%|█▋ | 2163/12384 [4:36:22<21:55:18, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=8.35s]
Epoch 0: 17%|█▋ | 2164/12384 [4:36:22<21:51:15, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=8.35s]
Epoch 0: 17%|█▋ | 2164/12384 [4:36:30<21:51:15, 7.70s/it, loss=0.0004, acc=1.0000, iter_time=7.68s]
Epoch 0: 17%|█▋ | 2165/12384 [4:36:30<22:05:42, 7.78s/it, loss=0.0004, acc=1.0000, iter_time=7.68s]
Epoch 0: 17%|█▋ | 2165/12384 [4:36:38<22:05:42, 7.78s/it, loss=0.0001, acc=1.0000, iter_time=8.06s]
Epoch 0: 17%|█▋ | 2166/12384 [4:36:38<22:03:57, 7.77s/it, loss=0.0001, acc=1.0000, iter_time=8.06s]
Epoch 0: 17%|█▋ | 2166/12384 [4:36:45<22:03:57, 7.77s/it, loss=0.0001, acc=1.0000, iter_time=7.82s]
Epoch 0: 17%|█▋ | 2167/12384 [4:36:45<22:03:38, 7.77s/it, loss=0.0001, acc=1.0000, iter_time=7.82s]
Epoch 0: 17%|█▋ | 2167/12384 [4:36:53<22:03:38, 7.77s/it, loss=0.0005, acc=0.9996, iter_time=7.57s]
Epoch 0: 18%|█▊ | 2168/12384 [4:36:53<21:56:24, 7.73s/it, loss=0.0005, acc=0.9996, iter_time=7.57s]
Epoch 0: 18%|█▊ | 2168/12384 [4:37:01<21:56:24, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 0: 18%|█▊ | 2169/12384 [4:37:01<21:51:14, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 0: 18%|█▊ | 2169/12384 [4:37:08<21:51:14, 7.70s/it, loss=0.0004, acc=0.9979, iter_time=8.27s]
Epoch 0: 18%|█▊ | 2170/12384 [4:37:08<21:48:22, 7.69s/it, loss=0.0004, acc=0.9979, iter_time=8.27s]
Epoch 0: 18%|█▊ | 2170/12384 [4:37:16<21:48:22, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 18%|█▊ | 2171/12384 [4:37:16<21:44:58, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 18%|█▊ | 2171/12384 [4:37:24<21:44:58, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=5.87s]
Epoch 0: 18%|█▊ | 2172/12384 [4:37:24<21:44:49, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=5.87s]
Epoch 0: 18%|█▊ | 2172/12384 [4:37:31<21:44:49, 7.67s/it, loss=0.0012, acc=0.9960, iter_time=9.09s]
Epoch 0: 18%|█▊ | 2173/12384 [4:37:31<21:44:14, 7.66s/it, loss=0.0012, acc=0.9960, iter_time=9.09s]
Epoch 0: 18%|█▊ | 2173/12384 [4:37:39<21:44:14, 7.66s/it, loss=0.0015, acc=0.9965, iter_time=7.96s]
Epoch 0: 18%|█▊ | 2174/12384 [4:37:39<21:40:47, 7.64s/it, loss=0.0015, acc=0.9965, iter_time=7.96s]
Epoch 0: 18%|█▊ | 2174/12384 [4:37:46<21:40:47, 7.64s/it, loss=0.0004, acc=0.9998, iter_time=4.82s]
Epoch 0: 18%|█▊ | 2175/12384 [4:37:46<21:38:52, 7.63s/it, loss=0.0004, acc=0.9998, iter_time=4.82s]
Epoch 0: 18%|█▊ | 2175/12384 [4:37:54<21:38:52, 7.63s/it, loss=0.0006, acc=0.9989, iter_time=10.78s]
Epoch 0: 18%|█▊ | 2176/12384 [4:37:54<21:42:44, 7.66s/it, loss=0.0006, acc=0.9989, iter_time=10.78s]
Epoch 0: 18%|█▊ | 2176/12384 [4:38:02<21:42:44, 7.66s/it, loss=0.0002, acc=0.9999, iter_time=7.33s]
Epoch 0: 18%|█▊ | 2177/12384 [4:38:02<21:46:22, 7.68s/it, loss=0.0002, acc=0.9999, iter_time=7.33s]
Epoch 0: 18%|█▊ | 2177/12384 [4:38:10<21:46:22, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=7.74s]
Epoch 0: 18%|█▊ | 2178/12384 [4:38:10<21:50:10, 7.70s/it, loss=0.0002, acc=1.0000, iter_time=7.74s]
Epoch 0: 18%|█▊ | 2178/12384 [4:38:17<21:50:10, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=6.53s]
Epoch 0: 18%|█▊ | 2179/12384 [4:38:17<21:47:28, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=6.53s]
Epoch 0: 18%|█▊ | 2179/12384 [4:38:25<21:47:28, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=8.56s]
Epoch 0: 18%|█▊ | 2180/12384 [4:38:25<21:43:43, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=8.56s]
Epoch 0: 18%|█▊ | 2180/12384 [4:38:33<21:43:43, 7.67s/it, loss=0.0001, acc=0.9993, iter_time=6.42s]
Epoch 0: 18%|█▊ | 2181/12384 [4:38:33<21:43:53, 7.67s/it, loss=0.0001, acc=0.9993, iter_time=6.42s]
Epoch 0: 18%|█▊ | 2181/12384 [4:38:40<21:43:53, 7.67s/it, loss=0.0004, acc=0.9977, iter_time=9.15s]
Epoch 0: 18%|█▊ | 2182/12384 [4:38:40<21:39:51, 7.64s/it, loss=0.0004, acc=0.9977, iter_time=9.15s]
Epoch 0: 18%|█▊ | 2182/12384 [4:38:48<21:39:51, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 18%|█▊ | 2183/12384 [4:38:48<21:39:58, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 18%|█▊ | 2183/12384 [4:38:55<21:39:58, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 18%|█▊ | 2184/12384 [4:38:55<21:38:03, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.60s]
Epoch 0: 18%|█▊ | 2184/12384 [4:39:03<21:38:03, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=4.28s]
Epoch 0: 18%|█▊ | 2185/12384 [4:39:03<21:40:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=4.28s]
Epoch 0: 18%|█▊ | 2185/12384 [4:39:11<21:40:46, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.07s]
Epoch 0: 18%|█▊ | 2186/12384 [4:39:11<21:40:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=11.07s]
Epoch 0: 18%|█▊ | 2186/12384 [4:39:18<21:40:27, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.68s]
Epoch 0: 18%|█▊ | 2187/12384 [4:39:18<21:40:42, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.68s]
Epoch 0: 18%|█▊ | 2187/12384 [4:39:26<21:40:42, 7.65s/it, loss=0.0001, acc=0.9999, iter_time=7.34s]
Epoch 0: 18%|█▊ | 2188/12384 [4:39:26<21:37:58, 7.64s/it, loss=0.0001, acc=0.9999, iter_time=7.34s]
Epoch 0: 18%|█▊ | 2188/12384 [4:39:34<21:37:58, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=7.93s]
Epoch 0: 18%|█▊ | 2189/12384 [4:39:34<21:38:05, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=7.93s]
Epoch 0: 18%|█▊ | 2189/12384 [4:39:42<21:38:05, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 18%|█▊ | 2190/12384 [4:39:42<21:54:50, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=7.98s]
Epoch 0: 18%|█▊ | 2190/12384 [4:39:50<21:54:50, 7.74s/it, loss=0.0004, acc=0.9997, iter_time=7.70s]
Epoch 0: 18%|█▊ | 2191/12384 [4:39:50<22:08:02, 7.82s/it, loss=0.0004, acc=0.9997, iter_time=7.70s]
Epoch 0: 18%|█▊ | 2191/12384 [4:39:57<22:08:02, 7.82s/it, loss=0.0001, acc=1.0000, iter_time=8.30s]
Epoch 0: 18%|█▊ | 2192/12384 [4:39:57<21:57:58, 7.76s/it, loss=0.0001, acc=1.0000, iter_time=8.30s]
Epoch 0: 18%|█▊ | 2192/12384 [4:40:05<21:57:58, 7.76s/it, loss=0.0007, acc=0.9980, iter_time=7.22s]
Epoch 0: 18%|█▊ | 2193/12384 [4:40:05<21:50:08, 7.71s/it, loss=0.0007, acc=0.9980, iter_time=7.22s]
Epoch 0: 18%|█▊ | 2193/12384 [4:40:13<21:50:08, 7.71s/it, loss=0.0011, acc=0.9981, iter_time=7.73s]
Epoch 0: 18%|█▊ | 2194/12384 [4:40:13<21:50:29, 7.72s/it, loss=0.0011, acc=0.9981, iter_time=7.73s]
Epoch 0: 18%|█▊ | 2194/12384 [4:40:20<21:50:29, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=7.37s]
Epoch 0: 18%|█▊ | 2195/12384 [4:40:20<21:46:19, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.37s]
Epoch 0: 18%|█▊ | 2195/12384 [4:40:28<21:46:19, 7.69s/it, loss=0.0003, acc=0.9998, iter_time=8.00s]
Epoch 0: 18%|█▊ | 2196/12384 [4:40:28<21:48:29, 7.71s/it, loss=0.0003, acc=0.9998, iter_time=8.00s]
Epoch 0: 18%|█▊ | 2196/12384 [4:40:36<21:48:29, 7.71s/it, loss=0.0006, acc=0.9979, iter_time=7.38s]
Epoch 0: 18%|█▊ | 2197/12384 [4:40:36<21:46:45, 7.70s/it, loss=0.0006, acc=0.9979, iter_time=7.38s]
Epoch 0: 18%|█▊ | 2197/12384 [4:40:43<21:46:45, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 0: 18%|█▊ | 2198/12384 [4:40:43<21:43:46, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=6.17s]
Epoch 0: 18%|█▊ | 2198/12384 [4:40:51<21:43:46, 7.68s/it, loss=0.0016, acc=0.9944, iter_time=9.44s]
Epoch 0: 18%|█▊ | 2199/12384 [4:40:51<21:43:20, 7.68s/it, loss=0.0016, acc=0.9944, iter_time=9.44s]
Epoch 0: 18%|█▊ | 2199/12384 [4:40:59<21:43:20, 7.68s/it, loss=0.0012, acc=0.9976, iter_time=8.11s]
Epoch 0: 18%|█▊ | 2200/12384 [4:40:59<21:44:59, 7.69s/it, loss=0.0012, acc=0.9976, iter_time=8.11s]
Epoch 0: 18%|█▊ | 2200/12384 [4:41:06<21:44:59, 7.69s/it, loss=0.0014, acc=0.9973, iter_time=7.21s]
Epoch 0: 18%|█▊ | 2201/12384 [4:41:06<21:44:30, 7.69s/it, loss=0.0014, acc=0.9973, iter_time=7.21s]
Epoch 0: 18%|█▊ | 2201/12384 [4:41:14<21:44:30, 7.69s/it, loss=0.0003, acc=1.0000, iter_time=6.56s]
Epoch 0: 18%|█▊ | 2202/12384 [4:41:14<21:39:51, 7.66s/it, loss=0.0003, acc=1.0000, iter_time=6.56s]
Epoch 0: 18%|█▊ | 2202/12384 [4:41:22<21:39:51, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 0: 18%|█▊ | 2203/12384 [4:41:22<21:39:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 0: 18%|█▊ | 2203/12384 [4:41:29<21:39:16, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 18%|█▊ | 2204/12384 [4:41:29<21:39:33, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.89s]
Epoch 0: 18%|█▊ | 2204/12384 [4:41:37<21:39:33, 7.66s/it, loss=0.0005, acc=0.9973, iter_time=9.95s]
Epoch 0: 18%|█▊ | 2205/12384 [4:41:37<21:35:58, 7.64s/it, loss=0.0005, acc=0.9973, iter_time=9.95s]
Epoch 0: 18%|█▊ | 2205/12384 [4:41:45<21:35:58, 7.64s/it, loss=0.0030, acc=0.9909, iter_time=7.67s]
Epoch 0: 18%|█▊ | 2206/12384 [4:41:45<21:37:03, 7.65s/it, loss=0.0030, acc=0.9909, iter_time=7.67s]
Epoch 0: 18%|█▊ | 2206/12384 [4:41:52<21:37:03, 7.65s/it, loss=0.0005, acc=0.9997, iter_time=7.60s]
Epoch 0: 18%|█▊ | 2207/12384 [4:41:52<21:40:48, 7.67s/it, loss=0.0005, acc=0.9997, iter_time=7.60s]
Epoch 0: 18%|█▊ | 2207/12384 [4:42:00<21:40:48, 7.67s/it, loss=0.0014, acc=0.9955, iter_time=8.14s]
Epoch 0: 18%|█▊ | 2208/12384 [4:42:00<21:40:57, 7.67s/it, loss=0.0014, acc=0.9955, iter_time=8.14s]
Epoch 0: 18%|█▊ | 2208/12384 [4:42:08<21:40:57, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=5.47s]
Epoch 0: 18%|█▊ | 2209/12384 [4:42:08<21:36:39, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=5.47s]
Epoch 0: 18%|█▊ | 2209/12384 [4:42:15<21:36:39, 7.65s/it, loss=0.0006, acc=0.9974, iter_time=6.36s]
Epoch 0: 18%|█▊ | 2210/12384 [4:42:15<21:36:30, 7.65s/it, loss=0.0006, acc=0.9974, iter_time=6.36s]
Epoch 0: 18%|█▊ | 2210/12384 [4:42:23<21:36:30, 7.65s/it, loss=0.0007, acc=0.9986, iter_time=10.68s]
Epoch 0: 18%|█▊ | 2211/12384 [4:42:23<21:36:44, 7.65s/it, loss=0.0007, acc=0.9986, iter_time=10.68s]
Epoch 0: 18%|█▊ | 2211/12384 [4:42:31<21:36:44, 7.65s/it, loss=0.0003, acc=0.9997, iter_time=7.63s]
Epoch 0: 18%|█▊ | 2212/12384 [4:42:31<21:37:47, 7.66s/it, loss=0.0003, acc=0.9997, iter_time=7.63s]
Epoch 0: 18%|█▊ | 2212/12384 [4:42:38<21:37:47, 7.66s/it, loss=0.0005, acc=0.9996, iter_time=7.71s]
Epoch 0: 18%|█▊ | 2213/12384 [4:42:38<21:36:29, 7.65s/it, loss=0.0005, acc=0.9996, iter_time=7.71s]
Epoch 0: 18%|█▊ | 2213/12384 [4:42:46<21:36:29, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=6.67s]
Epoch 0: 18%|█▊ | 2214/12384 [4:42:46<21:34:42, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=6.67s]
Epoch 0: 18%|█▊ | 2214/12384 [4:42:54<21:34:42, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.88s]
Epoch 0: 18%|█▊ | 2215/12384 [4:42:54<21:49:18, 7.73s/it, loss=0.0001, acc=1.0000, iter_time=8.88s]
Epoch 0: 18%|█▊ | 2215/12384 [4:43:01<21:49:18, 7.73s/it, loss=0.0009, acc=0.9983, iter_time=8.01s]
Epoch 0: 18%|█▊ | 2216/12384 [4:43:01<21:44:36, 7.70s/it, loss=0.0009, acc=0.9983, iter_time=8.01s]
Epoch 0: 18%|█▊ | 2216/12384 [4:43:09<21:44:36, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=6.32s]
Epoch 0: 18%|█▊ | 2217/12384 [4:43:09<21:55:17, 7.76s/it, loss=0.0001, acc=1.0000, iter_time=6.32s]
Epoch 0: 18%|█▊ | 2217/12384 [4:43:17<21:55:17, 7.76s/it, loss=0.0009, acc=0.9967, iter_time=6.73s]
Epoch 0: 18%|█▊ | 2218/12384 [4:43:17<21:48:50, 7.72s/it, loss=0.0009, acc=0.9967, iter_time=6.73s]
Epoch 0: 18%|█▊ | 2218/12384 [4:43:25<21:48:50, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=8.77s]
Epoch 0: 18%|█▊ | 2219/12384 [4:43:25<21:44:53, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=8.77s]
Epoch 0: 18%|█▊ | 2219/12384 [4:43:32<21:44:53, 7.70s/it, loss=0.0004, acc=1.0000, iter_time=5.84s]
Epoch 0: 18%|█▊ | 2220/12384 [4:43:32<21:40:11, 7.68s/it, loss=0.0004, acc=1.0000, iter_time=5.84s]
Epoch 0: 18%|█▊ | 2220/12384 [4:43:40<21:40:11, 7.68s/it, loss=0.0004, acc=0.9984, iter_time=7.37s]
Epoch 0: 18%|█▊ | 2221/12384 [4:43:40<21:39:00, 7.67s/it, loss=0.0004, acc=0.9984, iter_time=7.37s]
Epoch 0: 18%|█▊ | 2221/12384 [4:43:47<21:39:00, 7.67s/it, loss=0.0001, acc=0.9998, iter_time=8.32s]
Epoch 0: 18%|█▊ | 2222/12384 [4:43:47<21:35:13, 7.65s/it, loss=0.0001, acc=0.9998, iter_time=8.32s]
Epoch 0: 18%|█▊ | 2222/12384 [4:43:55<21:35:13, 7.65s/it, loss=0.0007, acc=0.9979, iter_time=9.00s]
Epoch 0: 18%|█▊ | 2223/12384 [4:43:55<21:34:17, 7.64s/it, loss=0.0007, acc=0.9979, iter_time=9.00s]
Epoch 0: 18%|█▊ | 2223/12384 [4:44:03<21:34:17, 7.64s/it, loss=0.0005, acc=1.0000, iter_time=8.93s]
Epoch 0: 18%|█▊ | 2224/12384 [4:44:03<21:32:19, 7.63s/it, loss=0.0005, acc=1.0000, iter_time=8.93s]
Epoch 0: 18%|█▊ | 2224/12384 [4:44:10<21:32:19, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.24s]
Epoch 0: 18%|█▊ | 2225/12384 [4:44:10<21:30:39, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=7.24s]
Epoch 0: 18%|█▊ | 2225/12384 [4:44:18<21:30:39, 7.62s/it, loss=0.0005, acc=0.9984, iter_time=6.77s]
Epoch 0: 18%|█▊ | 2226/12384 [4:44:18<21:31:37, 7.63s/it, loss=0.0005, acc=0.9984, iter_time=6.77s]
Epoch 0: 18%|█▊ | 2226/12384 [4:44:26<21:31:37, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.51s]
Epoch 0: 18%|█▊ | 2227/12384 [4:44:26<21:32:23, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.51s]
Epoch 0: 18%|█▊ | 2227/12384 [4:44:33<21:32:23, 7.63s/it, loss=0.0003, acc=0.9998, iter_time=6.41s]
Epoch 0: 18%|█▊ | 2228/12384 [4:44:33<21:30:06, 7.62s/it, loss=0.0003, acc=0.9998, iter_time=6.41s]
Epoch 0: 18%|█▊ | 2228/12384 [4:44:41<21:30:06, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.43s]
Epoch 0: 18%|█▊ | 2229/12384 [4:44:41<21:32:32, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=5.43s]
Epoch 0: 18%|█▊ | 2229/12384 [4:44:48<21:32:32, 7.64s/it, loss=0.0005, acc=0.9975, iter_time=7.29s]
Epoch 0: 18%|█▊ | 2230/12384 [4:44:48<21:30:19, 7.62s/it, loss=0.0005, acc=0.9975, iter_time=7.29s]
Epoch 0: 18%|█▊ | 2230/12384 [4:44:56<21:30:19, 7.62s/it, loss=0.0006, acc=0.9988, iter_time=11.35s]
Epoch 0: 18%|█▊ | 2231/12384 [4:44:56<21:29:02, 7.62s/it, loss=0.0006, acc=0.9988, iter_time=11.35s]
Epoch 0: 18%|█▊ | 2231/12384 [4:45:04<21:29:02, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.56s]
Epoch 0: 18%|█▊ | 2232/12384 [4:45:04<21:29:15, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.56s]
Epoch 0: 18%|█▊ | 2232/12384 [4:45:11<21:29:15, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 18%|█▊ | 2233/12384 [4:45:11<21:30:28, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 18%|█▊ | 2233/12384 [4:45:19<21:30:28, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.22s]
Epoch 0: 18%|█▊ | 2234/12384 [4:45:19<21:31:07, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.22s]
Epoch 0: 18%|█▊ | 2234/12384 [4:45:26<21:31:07, 7.63s/it, loss=0.0007, acc=0.9986, iter_time=9.10s]
Epoch 0: 18%|█▊ | 2235/12384 [4:45:26<21:29:50, 7.63s/it, loss=0.0007, acc=0.9986, iter_time=9.10s]
Epoch 0: 18%|█▊ | 2235/12384 [4:45:34<21:29:50, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.10s]
Epoch 0: 18%|█▊ | 2236/12384 [4:45:34<21:29:50, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.10s]
Epoch 0: 18%|█▊ | 2236/12384 [4:45:42<21:29:50, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.12s]
Epoch 0: 18%|█▊ | 2237/12384 [4:45:42<21:29:56, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.12s]
Epoch 0: 18%|█▊ | 2237/12384 [4:45:49<21:29:56, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 18%|█▊ | 2238/12384 [4:45:49<21:28:40, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 18%|█▊ | 2238/12384 [4:45:57<21:28:40, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 18%|█▊ | 2239/12384 [4:45:57<21:30:23, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 18%|█▊ | 2239/12384 [4:46:05<21:30:23, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=8.07s]
Epoch 0: 18%|█▊ | 2240/12384 [4:46:05<21:33:58, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=8.07s]
Epoch 0: 18%|█▊ | 2240/12384 [4:46:13<21:33:58, 7.65s/it, loss=0.0004, acc=0.9985, iter_time=7.55s]
Epoch 0: 18%|█▊ | 2241/12384 [4:46:13<21:44:06, 7.71s/it, loss=0.0004, acc=0.9985, iter_time=7.55s]
Epoch 0: 18%|█▊ | 2241/12384 [4:46:20<21:44:06, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 18%|█▊ | 2242/12384 [4:46:20<21:39:20, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 18%|█▊ | 2242/12384 [4:46:28<21:39:20, 7.69s/it, loss=0.0002, acc=1.0000, iter_time=4.26s]
Epoch 0: 18%|█▊ | 2243/12384 [4:46:28<21:54:36, 7.78s/it, loss=0.0002, acc=1.0000, iter_time=4.26s]
Epoch 0: 18%|█▊ | 2243/12384 [4:46:36<21:54:36, 7.78s/it, loss=0.0005, acc=0.9990, iter_time=8.81s]
Epoch 0: 18%|█▊ | 2244/12384 [4:46:36<21:48:11, 7.74s/it, loss=0.0005, acc=0.9990, iter_time=8.81s]
Epoch 0: 18%|█▊ | 2244/12384 [4:46:43<21:48:11, 7.74s/it, loss=0.0002, acc=1.0000, iter_time=7.64s]
Epoch 0: 18%|█▊ | 2245/12384 [4:46:43<21:41:26, 7.70s/it, loss=0.0002, acc=1.0000, iter_time=7.64s]
Epoch 0: 18%|█▊ | 2245/12384 [4:46:51<21:41:26, 7.70s/it, loss=0.0001, acc=0.9998, iter_time=10.15s]
Epoch 0: 18%|█▊ | 2246/12384 [4:46:51<21:37:38, 7.68s/it, loss=0.0001, acc=0.9998, iter_time=10.15s]
Epoch 0: 18%|█▊ | 2246/12384 [4:46:59<21:37:38, 7.68s/it, loss=0.0066, acc=0.9912, iter_time=5.38s]
Epoch 0: 18%|█▊ | 2247/12384 [4:46:59<21:32:38, 7.65s/it, loss=0.0066, acc=0.9912, iter_time=5.38s]
Epoch 0: 18%|█▊ | 2247/12384 [4:47:06<21:32:38, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=9.81s]
Epoch 0: 18%|█▊ | 2248/12384 [4:47:06<21:31:43, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=9.81s]
Epoch 0: 18%|█▊ | 2248/12384 [4:47:14<21:31:43, 7.65s/it, loss=0.0009, acc=0.9975, iter_time=5.89s]
Epoch 0: 18%|█▊ | 2249/12384 [4:47:14<21:28:42, 7.63s/it, loss=0.0009, acc=0.9975, iter_time=5.89s]
Epoch 0: 18%|█▊ | 2249/12384 [4:47:22<21:28:42, 7.63s/it, loss=0.0020, acc=0.9934, iter_time=9.76s]
Epoch 0: 18%|█▊ | 2250/12384 [4:47:22<21:27:40, 7.62s/it, loss=0.0020, acc=0.9934, iter_time=9.76s]
Epoch 0: 18%|█▊ | 2250/12384 [4:47:29<21:27:40, 7.62s/it, loss=0.0006, acc=0.9995, iter_time=7.20s]
Epoch 0: 18%|█▊ | 2251/12384 [4:47:29<21:26:48, 7.62s/it, loss=0.0006, acc=0.9995, iter_time=7.20s]
Epoch 0: 18%|█▊ | 2251/12384 [4:47:37<21:26:48, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.50s]
Epoch 0: 18%|█▊ | 2252/12384 [4:47:37<21:26:24, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.50s]
Epoch 0: 18%|█▊ | 2252/12384 [4:47:44<21:26:24, 7.62s/it, loss=0.0002, acc=0.9983, iter_time=7.16s]
Epoch 0: 18%|█▊ | 2253/12384 [4:47:44<21:28:18, 7.63s/it, loss=0.0002, acc=0.9983, iter_time=7.16s]
Epoch 0: 18%|█▊ | 2253/12384 [4:47:52<21:28:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.23s]
Epoch 0: 18%|█▊ | 2254/12384 [4:47:52<21:28:44, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.23s]
Epoch 0: 18%|█▊ | 2254/12384 [4:48:00<21:28:44, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 18%|█▊ | 2255/12384 [4:48:00<21:29:32, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 18%|█▊ | 2255/12384 [4:48:07<21:29:32, 7.64s/it, loss=0.0003, acc=0.9988, iter_time=7.63s]
Epoch 0: 18%|█▊ | 2256/12384 [4:48:07<21:29:38, 7.64s/it, loss=0.0003, acc=0.9988, iter_time=7.63s]
Epoch 0: 18%|█▊ | 2256/12384 [4:48:15<21:29:38, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.67s]
Epoch 0: 18%|█▊ | 2257/12384 [4:48:15<21:29:50, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.67s]
Epoch 0: 18%|█▊ | 2257/12384 [4:48:23<21:29:50, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=5.60s]
Epoch 0: 18%|█▊ | 2258/12384 [4:48:23<21:29:59, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=5.60s]
Epoch 0: 18%|█▊ | 2258/12384 [4:48:30<21:29:59, 7.64s/it, loss=0.0007, acc=0.9986, iter_time=8.48s]
Epoch 0: 18%|█▊ | 2259/12384 [4:48:30<21:29:52, 7.64s/it, loss=0.0007, acc=0.9986, iter_time=8.48s]
Epoch 0: 18%|█▊ | 2259/12384 [4:48:38<21:29:52, 7.64s/it, loss=0.0001, acc=0.9999, iter_time=8.86s]
Epoch 0: 18%|█▊ | 2260/12384 [4:48:38<21:32:33, 7.66s/it, loss=0.0001, acc=0.9999, iter_time=8.86s]
Epoch 0: 18%|█▊ | 2260/12384 [4:48:46<21:32:33, 7.66s/it, loss=0.0004, acc=0.9980, iter_time=7.10s]
Epoch 0: 18%|█▊ | 2261/12384 [4:48:46<21:29:07, 7.64s/it, loss=0.0004, acc=0.9980, iter_time=7.10s]
Epoch 0: 18%|█▊ | 2261/12384 [4:48:53<21:29:07, 7.64s/it, loss=0.0016, acc=0.9958, iter_time=8.20s]
Epoch 0: 18%|█▊ | 2262/12384 [4:48:53<21:30:14, 7.65s/it, loss=0.0016, acc=0.9958, iter_time=8.20s]
Epoch 0: 18%|█▊ | 2262/12384 [4:49:01<21:30:14, 7.65s/it, loss=0.0007, acc=0.9979, iter_time=7.67s]
Epoch 0: 18%|█▊ | 2263/12384 [4:49:01<21:28:34, 7.64s/it, loss=0.0007, acc=0.9979, iter_time=7.67s]
Epoch 0: 18%|█▊ | 2263/12384 [4:49:09<21:28:34, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 18%|█▊ | 2264/12384 [4:49:09<21:30:08, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 18%|█▊ | 2264/12384 [4:49:16<21:30:08, 7.65s/it, loss=0.0011, acc=0.9992, iter_time=7.64s]
Epoch 0: 18%|█▊ | 2265/12384 [4:49:16<21:29:26, 7.65s/it, loss=0.0011, acc=0.9992, iter_time=7.64s]
Epoch 0: 18%|█▊ | 2265/12384 [4:49:24<21:29:26, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.79s]
Epoch 0: 18%|█▊ | 2266/12384 [4:49:24<21:36:01, 7.69s/it, loss=0.0002, acc=1.0000, iter_time=7.79s]
Epoch 0: 18%|█▊ | 2266/12384 [4:49:32<21:36:01, 7.69s/it, loss=0.0004, acc=1.0000, iter_time=7.97s]
Epoch 0: 18%|█▊ | 2267/12384 [4:49:32<21:47:48, 7.76s/it, loss=0.0004, acc=1.0000, iter_time=7.97s]
Epoch 0: 18%|█▊ | 2267/12384 [4:49:40<21:47:48, 7.76s/it, loss=0.0003, acc=0.9999, iter_time=7.63s]
Epoch 0: 18%|█▊ | 2268/12384 [4:49:40<21:42:53, 7.73s/it, loss=0.0003, acc=0.9999, iter_time=7.63s]
Epoch 0: 18%|█▊ | 2268/12384 [4:49:47<21:42:53, 7.73s/it, loss=0.0001, acc=1.0000, iter_time=7.67s]
Epoch 0: 18%|█▊ | 2269/12384 [4:49:47<21:55:18, 7.80s/it, loss=0.0001, acc=1.0000, iter_time=7.67s]
Epoch 0: 18%|█▊ | 2269/12384 [4:49:55<21:55:18, 7.80s/it, loss=0.0002, acc=1.0000, iter_time=7.97s]
Epoch 0: 18%|█▊ | 2270/12384 [4:49:55<21:47:44, 7.76s/it, loss=0.0002, acc=1.0000, iter_time=7.97s]
Epoch 0: 18%|█▊ | 2270/12384 [4:50:03<21:47:44, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 18%|█▊ | 2271/12384 [4:50:03<21:42:31, 7.73s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 18%|█▊ | 2271/12384 [4:50:11<21:42:31, 7.73s/it, loss=0.0003, acc=0.9994, iter_time=8.14s]
Epoch 0: 18%|█▊ | 2272/12384 [4:50:11<21:42:18, 7.73s/it, loss=0.0003, acc=0.9994, iter_time=8.14s]
Epoch 0: 18%|█▊ | 2272/12384 [4:50:18<21:42:18, 7.73s/it, loss=0.0004, acc=0.9979, iter_time=5.46s]
Epoch 0: 18%|█▊ | 2273/12384 [4:50:18<21:38:59, 7.71s/it, loss=0.0004, acc=0.9979, iter_time=5.46s]
Epoch 0: 18%|█▊ | 2273/12384 [4:50:26<21:38:59, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=9.45s]
Epoch 0: 18%|█▊ | 2274/12384 [4:50:26<21:34:56, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=9.45s]
Epoch 0: 18%|█▊ | 2274/12384 [4:50:33<21:34:56, 7.69s/it, loss=0.0010, acc=0.9974, iter_time=7.64s]
Epoch 0: 18%|█▊ | 2275/12384 [4:50:33<21:33:07, 7.68s/it, loss=0.0010, acc=0.9974, iter_time=7.64s]
Epoch 0: 18%|█▊ | 2275/12384 [4:50:41<21:33:07, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.68s]
Epoch 0: 18%|█▊ | 2276/12384 [4:50:41<21:31:07, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.68s]
Epoch 0: 18%|█▊ | 2276/12384 [4:50:49<21:31:07, 7.66s/it, loss=0.0016, acc=0.9981, iter_time=7.63s]
Epoch 0: 18%|█▊ | 2277/12384 [4:50:49<21:29:50, 7.66s/it, loss=0.0016, acc=0.9981, iter_time=7.63s]
Epoch 0: 18%|█▊ | 2277/12384 [4:50:56<21:29:50, 7.66s/it, loss=0.0013, acc=0.9951, iter_time=7.61s]
Epoch 0: 18%|█▊ | 2278/12384 [4:50:56<21:34:00, 7.68s/it, loss=0.0013, acc=0.9951, iter_time=7.61s]
Epoch 0: 18%|█▊ | 2278/12384 [4:51:04<21:34:00, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=4.68s]
Epoch 0: 18%|█▊ | 2279/12384 [4:51:04<21:29:43, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=4.68s]
Epoch 0: 18%|█▊ | 2279/12384 [4:51:12<21:29:43, 7.66s/it, loss=0.0035, acc=0.9906, iter_time=11.05s]
Epoch 0: 18%|█▊ | 2280/12384 [4:51:12<21:29:42, 7.66s/it, loss=0.0035, acc=0.9906, iter_time=11.05s]
Epoch 0: 18%|█▊ | 2280/12384 [4:51:19<21:29:42, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=5.82s]
Epoch 0: 18%|█▊ | 2281/12384 [4:51:19<21:27:37, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=5.82s]
Epoch 0: 18%|█▊ | 2281/12384 [4:51:27<21:27:37, 7.65s/it, loss=0.0004, acc=0.9998, iter_time=9.15s]
Epoch 0: 18%|█▊ | 2282/12384 [4:51:27<21:28:55, 7.66s/it, loss=0.0004, acc=0.9998, iter_time=9.15s]
Epoch 0: 18%|█▊ | 2282/12384 [4:51:35<21:28:55, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=6.68s]
Epoch 0: 18%|█▊ | 2283/12384 [4:51:35<21:27:38, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=6.68s]
Epoch 0: 18%|█▊ | 2283/12384 [4:51:42<21:27:38, 7.65s/it, loss=0.0005, acc=0.9997, iter_time=8.57s]
Epoch 0: 18%|█▊ | 2284/12384 [4:51:42<21:26:06, 7.64s/it, loss=0.0005, acc=0.9997, iter_time=8.57s]
Epoch 0: 18%|█▊ | 2284/12384 [4:51:50<21:26:06, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 18%|█▊ | 2285/12384 [4:51:50<21:24:48, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.62s]
Epoch 0: 18%|█▊ | 2285/12384 [4:51:58<21:24:48, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 18%|█▊ | 2286/12384 [4:51:58<21:23:37, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 18%|█▊ | 2286/12384 [4:52:05<21:23:37, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 18%|█▊ | 2287/12384 [4:52:05<21:23:10, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 18%|█▊ | 2287/12384 [4:52:13<21:23:10, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=8.00s]
Epoch 0: 18%|█▊ | 2288/12384 [4:52:13<21:27:05, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=8.00s]
Epoch 0: 18%|█▊ | 2288/12384 [4:52:20<21:27:05, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.32s]
Epoch 0: 18%|█▊ | 2289/12384 [4:52:20<21:25:36, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.32s]
Epoch 0: 18%|█▊ | 2289/12384 [4:52:28<21:25:36, 7.64s/it, loss=0.0002, acc=0.9998, iter_time=7.62s]
Epoch 0: 18%|█▊ | 2290/12384 [4:52:28<21:26:02, 7.64s/it, loss=0.0002, acc=0.9998, iter_time=7.62s]
Epoch 0: 18%|█▊ | 2290/12384 [4:52:36<21:26:02, 7.64s/it, loss=0.0002, acc=0.9984, iter_time=7.65s]
Epoch 0: 18%|█▊ | 2291/12384 [4:52:36<21:24:03, 7.63s/it, loss=0.0002, acc=0.9984, iter_time=7.65s]
Epoch 0: 18%|█▊ | 2291/12384 [4:52:43<21:24:03, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 19%|█▊ | 2292/12384 [4:52:43<21:25:58, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.62s]
Epoch 0: 19%|█▊ | 2292/12384 [4:52:51<21:25:58, 7.65s/it, loss=0.0006, acc=0.9990, iter_time=7.93s]
Epoch 0: 19%|█▊ | 2293/12384 [4:52:51<21:36:59, 7.71s/it, loss=0.0006, acc=0.9990, iter_time=7.93s]
Epoch 0: 19%|█▊ | 2293/12384 [4:52:59<21:36:59, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=5.29s]
Epoch 0: 19%|█▊ | 2294/12384 [4:52:59<21:33:13, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=5.29s]
Epoch 0: 19%|█▊ | 2294/12384 [4:53:07<21:33:13, 7.69s/it, loss=0.0012, acc=0.9977, iter_time=7.86s]
Epoch 0: 19%|█▊ | 2295/12384 [4:53:07<21:30:13, 7.67s/it, loss=0.0012, acc=0.9977, iter_time=7.86s]
Epoch 0: 19%|█▊ | 2295/12384 [4:53:15<21:30:13, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=10.01s]
Epoch 0: 19%|█▊ | 2296/12384 [4:53:15<21:44:10, 7.76s/it, loss=0.0001, acc=1.0000, iter_time=10.01s]
Epoch 0: 19%|█▊ | 2296/12384 [4:53:22<21:44:10, 7.76s/it, loss=0.0015, acc=0.9934, iter_time=5.40s]
Epoch 0: 19%|█▊ | 2297/12384 [4:53:22<21:43:18, 7.75s/it, loss=0.0015, acc=0.9934, iter_time=5.40s]
Epoch 0: 19%|█▊ | 2297/12384 [4:53:30<21:43:18, 7.75s/it, loss=0.0018, acc=0.9982, iter_time=10.10s]
Epoch 0: 19%|█▊ | 2298/12384 [4:53:30<21:40:11, 7.73s/it, loss=0.0018, acc=0.9982, iter_time=10.10s]
Epoch 0: 19%|█▊ | 2298/12384 [4:53:38<21:40:11, 7.73s/it, loss=0.0024, acc=0.9969, iter_time=7.60s]
Epoch 0: 19%|█▊ | 2299/12384 [4:53:38<21:33:48, 7.70s/it, loss=0.0024, acc=0.9969, iter_time=7.60s]
Epoch 0: 19%|█▊ | 2299/12384 [4:53:45<21:33:48, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=8.08s]
Epoch 0: 19%|█▊ | 2300/12384 [4:53:45<21:33:06, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=8.08s]
Epoch 0: 19%|█▊ | 2300/12384 [4:53:53<21:33:06, 7.69s/it, loss=0.0001, acc=0.9999, iter_time=7.22s]
Epoch 0: 19%|█▊ | 2301/12384 [4:53:53<21:29:27, 7.67s/it, loss=0.0001, acc=0.9999, iter_time=7.22s]
Epoch 0: 19%|█▊ | 2301/12384 [4:54:00<21:29:27, 7.67s/it, loss=0.0015, acc=0.9954, iter_time=7.63s]
Epoch 0: 19%|█▊ | 2302/12384 [4:54:00<21:27:41, 7.66s/it, loss=0.0015, acc=0.9954, iter_time=7.63s]
Epoch 0: 19%|█▊ | 2302/12384 [4:54:08<21:27:41, 7.66s/it, loss=0.0020, acc=0.9975, iter_time=5.92s]
Epoch 0: 19%|█▊ | 2303/12384 [4:54:08<21:27:25, 7.66s/it, loss=0.0020, acc=0.9975, iter_time=5.92s]
Epoch 0: 19%|█▊ | 2303/12384 [4:54:16<21:27:25, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=9.34s]
Epoch 0: 19%|█▊ | 2304/12384 [4:54:16<21:25:57, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=9.34s]
Epoch 0: 19%|█▊ | 2304/12384 [4:54:23<21:25:57, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=5.61s]
Epoch 0: 19%|█▊ | 2305/12384 [4:54:23<21:25:43, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=5.61s]
Epoch 0: 19%|█▊ | 2305/12384 [4:54:31<21:25:43, 7.65s/it, loss=0.0004, acc=0.9980, iter_time=9.09s]
Epoch 0: 19%|█▊ | 2306/12384 [4:54:31<21:25:05, 7.65s/it, loss=0.0004, acc=0.9980, iter_time=9.09s]
Epoch 0: 19%|█▊ | 2306/12384 [4:54:39<21:25:05, 7.65s/it, loss=0.0006, acc=0.9979, iter_time=5.26s]
Epoch 0: 19%|█▊ | 2307/12384 [4:54:39<21:24:44, 7.65s/it, loss=0.0006, acc=0.9979, iter_time=5.26s]
Epoch 0: 19%|█▊ | 2307/12384 [4:54:46<21:24:44, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.35s]
Epoch 0: 19%|█▊ | 2308/12384 [4:54:46<21:22:42, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.35s]
Epoch 0: 19%|█▊ | 2308/12384 [4:54:54<21:22:42, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=10.90s]
Epoch 0: 19%|█▊ | 2309/12384 [4:54:54<21:27:07, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=10.90s]
Epoch 0: 19%|█▊ | 2309/12384 [4:55:02<21:27:07, 7.67s/it, loss=0.0016, acc=0.9974, iter_time=6.88s]
Epoch 0: 19%|█▊ | 2310/12384 [4:55:02<21:25:48, 7.66s/it, loss=0.0016, acc=0.9974, iter_time=6.88s]
Epoch 0: 19%|█▊ | 2310/12384 [4:55:09<21:25:48, 7.66s/it, loss=0.0003, acc=1.0000, iter_time=8.61s]
Epoch 0: 19%|█▊ | 2311/12384 [4:55:09<21:31:32, 7.69s/it, loss=0.0003, acc=1.0000, iter_time=8.61s]
Epoch 0: 19%|█▊ | 2311/12384 [4:55:17<21:31:32, 7.69s/it, loss=0.0003, acc=1.0000, iter_time=8.12s]
Epoch 0: 19%|█▊ | 2312/12384 [4:55:17<21:30:30, 7.69s/it, loss=0.0003, acc=1.0000, iter_time=8.12s]
Epoch 0: 19%|█▊ | 2312/12384 [4:55:25<21:30:30, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.35s]
Epoch 0: 19%|█▊ | 2313/12384 [4:55:25<21:33:02, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.35s]
Epoch 0: 19%|█▊ | 2313/12384 [4:55:33<21:33:02, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=6.77s]
Epoch 0: 19%|█▊ | 2314/12384 [4:55:33<21:28:22, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=6.77s]
Epoch 0: 19%|█▊ | 2314/12384 [4:55:40<21:28:22, 7.68s/it, loss=0.0019, acc=0.9907, iter_time=7.54s]
Epoch 0: 19%|█▊ | 2315/12384 [4:55:40<21:25:45, 7.66s/it, loss=0.0019, acc=0.9907, iter_time=7.54s]
Epoch 0: 19%|█▊ | 2315/12384 [4:55:48<21:25:45, 7.66s/it, loss=0.0008, acc=0.9979, iter_time=6.53s]
Epoch 0: 19%|█▊ | 2316/12384 [4:55:48<21:24:27, 7.65s/it, loss=0.0008, acc=0.9979, iter_time=6.53s]
Epoch 0: 19%|█▊ | 2316/12384 [4:55:55<21:24:27, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 19%|█▊ | 2317/12384 [4:55:55<21:24:17, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 19%|█▊ | 2317/12384 [4:56:03<21:24:17, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=6.51s]
Epoch 0: 19%|█▊ | 2318/12384 [4:56:03<21:23:30, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=6.51s]
Epoch 0: 19%|█▊ | 2318/12384 [4:56:11<21:23:30, 7.65s/it, loss=0.0004, acc=0.9988, iter_time=7.80s]
Epoch 0: 19%|█▊ | 2319/12384 [4:56:11<21:24:04, 7.65s/it, loss=0.0004, acc=0.9988, iter_time=7.80s]
Epoch 0: 19%|█▊ | 2319/12384 [4:56:18<21:24:04, 7.65s/it, loss=0.0008, acc=0.9978, iter_time=10.66s]
Epoch 0: 19%|█▊ | 2320/12384 [4:56:18<21:22:23, 7.65s/it, loss=0.0008, acc=0.9978, iter_time=10.66s]
Epoch 0: 19%|█▊ | 2320/12384 [4:56:26<21:22:23, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 19%|█▊ | 2321/12384 [4:56:26<21:19:55, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.65s]
Epoch 0: 19%|█▊ | 2321/12384 [4:56:34<21:19:55, 7.63s/it, loss=0.0013, acc=0.9958, iter_time=7.65s]
Epoch 0: 19%|█▉ | 2322/12384 [4:56:34<21:37:44, 7.74s/it, loss=0.0013, acc=0.9958, iter_time=7.65s]
Epoch 0: 19%|█▉ | 2322/12384 [4:56:42<21:37:44, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 0: 19%|█▉ | 2323/12384 [4:56:42<21:33:08, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=5.87s]
Epoch 0: 19%|█▉ | 2323/12384 [4:56:49<21:33:08, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=9.71s]
Epoch 0: 19%|█▉ | 2324/12384 [4:56:49<21:28:52, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=9.71s]
Epoch 0: 19%|█▉ | 2324/12384 [4:56:57<21:28:52, 7.69s/it, loss=0.0005, acc=0.9998, iter_time=7.65s]
Epoch 0: 19%|█▉ | 2325/12384 [4:56:57<21:27:37, 7.68s/it, loss=0.0005, acc=0.9998, iter_time=7.65s]
Epoch 0: 19%|█▉ | 2325/12384 [4:57:05<21:27:37, 7.68s/it, loss=0.0008, acc=0.9973, iter_time=7.64s]
Epoch 0: 19%|█▉ | 2326/12384 [4:57:05<21:24:47, 7.66s/it, loss=0.0008, acc=0.9973, iter_time=7.64s]
Epoch 0: 19%|█▉ | 2326/12384 [4:57:12<21:24:47, 7.66s/it, loss=0.0002, acc=0.9998, iter_time=7.64s]
Epoch 0: 19%|█▉ | 2327/12384 [4:57:12<21:23:06, 7.66s/it, loss=0.0002, acc=0.9998, iter_time=7.64s]
Epoch 0: 19%|█▉ | 2327/12384 [4:57:20<21:23:06, 7.66s/it, loss=0.0011, acc=0.9985, iter_time=8.04s]
Epoch 0: 19%|█▉ | 2328/12384 [4:57:20<21:21:41, 7.65s/it, loss=0.0011, acc=0.9985, iter_time=8.04s]
Epoch 0: 19%|█▉ | 2328/12384 [4:57:27<21:21:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.74s]
Epoch 0: 19%|█▉ | 2329/12384 [4:57:27<21:19:25, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=5.74s]
Epoch 0: 19%|█▉ | 2329/12384 [4:57:35<21:19:25, 7.63s/it, loss=0.0002, acc=0.9999, iter_time=9.09s]
Epoch 0: 19%|█▉ | 2330/12384 [4:57:35<21:19:03, 7.63s/it, loss=0.0002, acc=0.9999, iter_time=9.09s]
Epoch 0: 19%|█▉ | 2330/12384 [4:57:43<21:19:03, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 19%|█▉ | 2331/12384 [4:57:43<21:20:29, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 19%|█▉ | 2331/12384 [4:57:50<21:20:29, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 19%|█▉ | 2332/12384 [4:57:50<21:19:35, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 19%|█▉ | 2332/12384 [4:57:58<21:19:35, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.71s]
Epoch 0: 19%|█▉ | 2333/12384 [4:57:58<21:17:19, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.71s]
Epoch 0: 19%|█▉ | 2333/12384 [4:58:06<21:17:19, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=6.44s]
Epoch 0: 19%|█▉ | 2334/12384 [4:58:06<21:17:23, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=6.44s]
Epoch 0: 19%|█▉ | 2334/12384 [4:58:13<21:17:23, 7.63s/it, loss=0.0017, acc=0.9957, iter_time=9.73s]
Epoch 0: 19%|█▉ | 2335/12384 [4:58:13<21:18:50, 7.64s/it, loss=0.0017, acc=0.9957, iter_time=9.73s]
Epoch 0: 19%|█▉ | 2335/12384 [4:58:21<21:18:50, 7.64s/it, loss=0.0010, acc=0.9963, iter_time=8.04s]
Epoch 0: 19%|█▉ | 2336/12384 [4:58:21<21:17:24, 7.63s/it, loss=0.0010, acc=0.9963, iter_time=8.04s]
Epoch 0: 19%|█▉ | 2336/12384 [4:58:28<21:17:24, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=4.90s]
Epoch 0: 19%|█▉ | 2337/12384 [4:58:28<21:16:46, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=4.90s]
Epoch 0: 19%|█▉ | 2337/12384 [4:58:36<21:16:46, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 0: 19%|█▉ | 2338/12384 [4:58:36<21:15:05, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=9.91s]
Epoch 0: 19%|█▉ | 2338/12384 [4:58:44<21:15:05, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 19%|█▉ | 2339/12384 [4:58:44<21:15:33, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 19%|█▉ | 2339/12384 [4:58:51<21:15:33, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=7.66s]
Epoch 0: 19%|█▉ | 2340/12384 [4:58:51<21:19:30, 7.64s/it, loss=0.0002, acc=0.9998, iter_time=7.66s]
Epoch 0: 19%|█▉ | 2340/12384 [4:58:59<21:19:30, 7.64s/it, loss=0.0006, acc=0.9978, iter_time=5.57s]
Epoch 0: 19%|█▉ | 2341/12384 [4:58:59<21:18:57, 7.64s/it, loss=0.0006, acc=0.9978, iter_time=5.57s]
Epoch 0: 19%|█▉ | 2341/12384 [4:59:07<21:18:57, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.20s]
Epoch 0: 19%|█▉ | 2342/12384 [4:59:07<21:18:42, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.20s]
Epoch 0: 19%|█▉ | 2342/12384 [4:59:14<21:18:42, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=11.16s]
Epoch 0: 19%|█▉ | 2343/12384 [4:59:14<21:18:15, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=11.16s]
Epoch 0: 19%|█▉ | 2343/12384 [4:59:22<21:18:15, 7.64s/it, loss=0.0004, acc=0.9991, iter_time=7.74s]
Epoch 0: 19%|█▉ | 2344/12384 [4:59:22<21:16:49, 7.63s/it, loss=0.0004, acc=0.9991, iter_time=7.74s]
Epoch 0: 19%|█▉ | 2344/12384 [4:59:30<21:16:49, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.51s]
Epoch 0: 19%|█▉ | 2345/12384 [4:59:30<21:17:13, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.51s]
Epoch 0: 19%|█▉ | 2345/12384 [4:59:37<21:17:13, 7.63s/it, loss=0.0011, acc=0.9975, iter_time=5.13s]
Epoch 0: 19%|█▉ | 2346/12384 [4:59:37<21:19:06, 7.65s/it, loss=0.0011, acc=0.9975, iter_time=5.13s]
Epoch 0: 19%|█▉ | 2346/12384 [4:59:45<21:19:06, 7.65s/it, loss=0.0004, acc=0.9974, iter_time=9.63s]
Epoch 0: 19%|█▉ | 2347/12384 [4:59:45<21:19:09, 7.65s/it, loss=0.0004, acc=0.9974, iter_time=9.63s]
Epoch 0: 19%|█▉ | 2347/12384 [4:59:53<21:19:09, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 0: 19%|█▉ | 2348/12384 [4:59:53<21:21:40, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.30s]
Epoch 0: 19%|█▉ | 2348/12384 [5:00:00<21:21:40, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.67s]
Epoch 0: 19%|█▉ | 2349/12384 [5:00:00<21:36:16, 7.75s/it, loss=0.0002, acc=1.0000, iter_time=7.67s]
Epoch 0: 19%|█▉ | 2349/12384 [5:00:08<21:36:16, 7.75s/it, loss=0.0005, acc=0.9976, iter_time=8.32s]
Epoch 0: 19%|█▉ | 2350/12384 [5:00:08<21:30:21, 7.72s/it, loss=0.0005, acc=0.9976, iter_time=8.32s]
Epoch 0: 19%|█▉ | 2350/12384 [5:00:16<21:30:21, 7.72s/it, loss=0.0011, acc=0.9984, iter_time=7.22s]
Epoch 0: 19%|█▉ | 2351/12384 [5:00:16<21:28:06, 7.70s/it, loss=0.0011, acc=0.9984, iter_time=7.22s]
Epoch 0: 19%|█▉ | 2351/12384 [5:00:23<21:28:06, 7.70s/it, loss=0.0005, acc=0.9995, iter_time=8.07s]
Epoch 0: 19%|█▉ | 2352/12384 [5:00:23<21:25:13, 7.69s/it, loss=0.0005, acc=0.9995, iter_time=8.07s]
Epoch 0: 19%|█▉ | 2352/12384 [5:00:31<21:25:13, 7.69s/it, loss=0.0004, acc=0.9984, iter_time=3.07s]
Epoch 0: 19%|█▉ | 2353/12384 [5:00:31<21:21:58, 7.67s/it, loss=0.0004, acc=0.9984, iter_time=3.07s]
Epoch 0: 19%|█▉ | 2353/12384 [5:00:39<21:21:58, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=11.81s]
Epoch 0: 19%|█▉ | 2354/12384 [5:00:39<21:20:24, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=11.81s]
Epoch 0: 19%|█▉ | 2354/12384 [5:00:46<21:20:24, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 19%|█▉ | 2355/12384 [5:00:46<21:18:20, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 19%|█▉ | 2355/12384 [5:00:54<21:18:20, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 19%|█▉ | 2356/12384 [5:00:54<21:18:51, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 19%|█▉ | 2356/12384 [5:01:02<21:18:51, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.67s]
Epoch 0: 19%|█▉ | 2357/12384 [5:01:02<21:19:08, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.67s]
Epoch 0: 19%|█▉ | 2357/12384 [5:01:09<21:19:08, 7.65s/it, loss=0.0001, acc=0.9998, iter_time=4.61s]
Epoch 0: 19%|█▉ | 2358/12384 [5:01:09<21:18:45, 7.65s/it, loss=0.0001, acc=0.9998, iter_time=4.61s]
Epoch 0: 19%|█▉ | 2358/12384 [5:01:17<21:18:45, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 0: 19%|█▉ | 2359/12384 [5:01:17<21:17:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.69s]
Epoch 0: 19%|█▉ | 2359/12384 [5:01:25<21:17:27, 7.65s/it, loss=0.0005, acc=0.9979, iter_time=7.60s]
Epoch 0: 19%|█▉ | 2360/12384 [5:01:25<21:16:47, 7.64s/it, loss=0.0005, acc=0.9979, iter_time=7.60s]
Epoch 0: 19%|█▉ | 2360/12384 [5:01:32<21:16:47, 7.64s/it, loss=0.0011, acc=0.9974, iter_time=7.65s]
Epoch 0: 19%|█▉ | 2361/12384 [5:01:32<21:16:42, 7.64s/it, loss=0.0011, acc=0.9974, iter_time=7.65s]
Epoch 0: 19%|█▉ | 2361/12384 [5:01:40<21:16:42, 7.64s/it, loss=0.0004, acc=1.0000, iter_time=7.65s]
Epoch 0: 19%|█▉ | 2362/12384 [5:01:40<21:16:44, 7.64s/it, loss=0.0004, acc=1.0000, iter_time=7.65s]
Epoch 0: 19%|█▉ | 2362/12384 [5:01:48<21:16:44, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 19%|█▉ | 2363/12384 [5:01:48<21:17:19, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 19%|█▉ | 2363/12384 [5:01:55<21:17:19, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.06s]
Epoch 0: 19%|█▉ | 2364/12384 [5:01:55<21:15:27, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.06s]
Epoch 0: 19%|█▉ | 2364/12384 [5:02:03<21:15:27, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.21s]
Epoch 0: 19%|█▉ | 2365/12384 [5:02:03<21:13:19, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.21s]
Epoch 0: 19%|█▉ | 2365/12384 [5:02:10<21:13:19, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 19%|█▉ | 2366/12384 [5:02:10<21:12:07, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.61s]
Epoch 0: 19%|█▉ | 2366/12384 [5:02:18<21:12:07, 7.62s/it, loss=0.0003, acc=0.9982, iter_time=4.48s]
Epoch 0: 19%|█▉ | 2367/12384 [5:02:18<21:12:28, 7.62s/it, loss=0.0003, acc=0.9982, iter_time=4.48s]
Epoch 0: 19%|█▉ | 2367/12384 [5:02:26<21:12:28, 7.62s/it, loss=0.0005, acc=0.9990, iter_time=11.14s]
Epoch 0: 19%|█▉ | 2368/12384 [5:02:26<21:12:17, 7.62s/it, loss=0.0005, acc=0.9990, iter_time=11.14s]
Epoch 0: 19%|█▉ | 2368/12384 [5:02:33<21:12:17, 7.62s/it, loss=0.0020, acc=0.9976, iter_time=7.25s]
Epoch 0: 19%|█▉ | 2369/12384 [5:02:33<21:12:20, 7.62s/it, loss=0.0020, acc=0.9976, iter_time=7.25s]
Epoch 0: 19%|█▉ | 2369/12384 [5:02:41<21:12:20, 7.62s/it, loss=0.0001, acc=0.9997, iter_time=7.64s]
Epoch 0: 19%|█▉ | 2370/12384 [5:02:41<21:14:17, 7.64s/it, loss=0.0001, acc=0.9997, iter_time=7.64s]
Epoch 0: 19%|█▉ | 2370/12384 [5:02:49<21:14:17, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 19%|█▉ | 2371/12384 [5:02:49<21:14:42, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 19%|█▉ | 2371/12384 [5:02:56<21:14:42, 7.64s/it, loss=0.0007, acc=0.9982, iter_time=5.65s]
Epoch 0: 19%|█▉ | 2372/12384 [5:02:56<21:13:50, 7.63s/it, loss=0.0007, acc=0.9982, iter_time=5.65s]
Epoch 0: 19%|█▉ | 2372/12384 [5:03:04<21:13:50, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=9.93s]
Epoch 0: 19%|█▉ | 2373/12384 [5:03:04<21:27:51, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=9.93s]
Epoch 0: 19%|█▉ | 2373/12384 [5:03:12<21:27:51, 7.72s/it, loss=0.0003, acc=1.0000, iter_time=7.63s]
Epoch 0: 19%|█▉ | 2374/12384 [5:03:12<21:25:48, 7.71s/it, loss=0.0003, acc=1.0000, iter_time=7.63s]
Epoch 0: 19%|█▉ | 2374/12384 [5:03:20<21:25:48, 7.71s/it, loss=0.0001, acc=0.9999, iter_time=6.51s]
Epoch 0: 19%|█▉ | 2375/12384 [5:03:20<21:41:27, 7.80s/it, loss=0.0001, acc=0.9999, iter_time=6.51s]
Epoch 0: 19%|█▉ | 2375/12384 [5:03:27<21:41:27, 7.80s/it, loss=0.0003, acc=1.0000, iter_time=9.15s]
Epoch 0: 19%|█▉ | 2376/12384 [5:03:27<21:33:40, 7.76s/it, loss=0.0003, acc=1.0000, iter_time=9.15s]
Epoch 0: 19%|█▉ | 2376/12384 [5:03:35<21:33:40, 7.76s/it, loss=0.0012, acc=0.9973, iter_time=5.66s]
Epoch 0: 19%|█▉ | 2377/12384 [5:03:35<21:28:43, 7.73s/it, loss=0.0012, acc=0.9973, iter_time=5.66s]
Epoch 0: 19%|█▉ | 2377/12384 [5:03:43<21:28:43, 7.73s/it, loss=0.0004, acc=0.9995, iter_time=9.66s]
Epoch 0: 19%|█▉ | 2378/12384 [5:03:43<21:25:21, 7.71s/it, loss=0.0004, acc=0.9995, iter_time=9.66s]
Epoch 0: 19%|█▉ | 2378/12384 [5:03:50<21:25:21, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 0: 19%|█▉ | 2379/12384 [5:03:50<21:25:01, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 0: 19%|█▉ | 2379/12384 [5:03:58<21:25:01, 7.71s/it, loss=0.0003, acc=0.9986, iter_time=6.77s]
Epoch 0: 19%|█▉ | 2380/12384 [5:03:58<21:21:22, 7.69s/it, loss=0.0003, acc=0.9986, iter_time=6.77s]
Epoch 0: 19%|█▉ | 2380/12384 [5:04:06<21:21:22, 7.69s/it, loss=0.0003, acc=0.9997, iter_time=8.58s]
Epoch 0: 19%|█▉ | 2381/12384 [5:04:06<21:19:21, 7.67s/it, loss=0.0003, acc=0.9997, iter_time=8.58s]
Epoch 0: 19%|█▉ | 2381/12384 [5:04:13<21:19:21, 7.67s/it, loss=0.0001, acc=0.9998, iter_time=6.43s]
Epoch 0: 19%|█▉ | 2382/12384 [5:04:13<21:17:16, 7.66s/it, loss=0.0001, acc=0.9998, iter_time=6.43s]
Epoch 0: 19%|█▉ | 2382/12384 [5:04:21<21:17:16, 7.66s/it, loss=0.0006, acc=0.9998, iter_time=8.84s]
Epoch 0: 19%|█▉ | 2383/12384 [5:04:21<21:19:30, 7.68s/it, loss=0.0006, acc=0.9998, iter_time=8.84s]
Epoch 0: 19%|█▉ | 2383/12384 [5:04:29<21:19:30, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 0: 19%|█▉ | 2384/12384 [5:04:29<21:17:18, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.11s]
Epoch 0: 19%|█▉ | 2384/12384 [5:04:36<21:17:18, 7.66s/it, loss=0.0006, acc=0.9991, iter_time=5.70s]
Epoch 0: 19%|█▉ | 2385/12384 [5:04:36<21:16:13, 7.66s/it, loss=0.0006, acc=0.9991, iter_time=5.70s]
Epoch 0: 19%|█▉ | 2385/12384 [5:04:44<21:16:13, 7.66s/it, loss=0.0002, acc=0.9998, iter_time=9.16s]
Epoch 0: 19%|█▉ | 2386/12384 [5:04:44<21:17:23, 7.67s/it, loss=0.0002, acc=0.9998, iter_time=9.16s]
Epoch 0: 19%|█▉ | 2386/12384 [5:04:52<21:17:23, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.72s]
Epoch 0: 19%|█▉ | 2387/12384 [5:04:52<21:15:19, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.72s]
Epoch 0: 19%|█▉ | 2387/12384 [5:04:59<21:15:19, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 19%|█▉ | 2388/12384 [5:04:59<21:17:02, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 19%|█▉ | 2388/12384 [5:05:07<21:17:02, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=4.89s]
Epoch 0: 19%|█▉ | 2389/12384 [5:05:07<21:17:19, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=4.89s]
Epoch 0: 19%|█▉ | 2389/12384 [5:05:15<21:17:19, 7.67s/it, loss=0.0002, acc=0.9992, iter_time=10.45s]
Epoch 0: 19%|█▉ | 2390/12384 [5:05:15<21:15:34, 7.66s/it, loss=0.0002, acc=0.9992, iter_time=10.45s]
Epoch 0: 19%|█▉ | 2390/12384 [5:05:22<21:15:34, 7.66s/it, loss=0.0031, acc=0.9921, iter_time=7.65s]
Epoch 0: 19%|█▉ | 2391/12384 [5:05:22<21:14:20, 7.65s/it, loss=0.0031, acc=0.9921, iter_time=7.65s]
Epoch 0: 19%|█▉ | 2391/12384 [5:05:30<21:14:20, 7.65s/it, loss=0.0002, acc=0.9998, iter_time=8.01s]
Epoch 0: 19%|█▉ | 2392/12384 [5:05:30<21:14:03, 7.65s/it, loss=0.0002, acc=0.9998, iter_time=8.01s]
Epoch 0: 19%|█▉ | 2392/12384 [5:05:38<21:14:03, 7.65s/it, loss=0.0006, acc=0.9998, iter_time=7.26s]
Epoch 0: 19%|█▉ | 2393/12384 [5:05:38<21:12:35, 7.64s/it, loss=0.0006, acc=0.9998, iter_time=7.26s]
Epoch 0: 19%|█▉ | 2393/12384 [5:05:45<21:12:35, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 19%|█▉ | 2394/12384 [5:05:45<21:12:33, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 19%|█▉ | 2394/12384 [5:05:53<21:12:33, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 19%|█▉ | 2395/12384 [5:05:53<21:12:25, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 19%|█▉ | 2395/12384 [5:06:00<21:12:25, 7.64s/it, loss=0.0002, acc=0.9995, iter_time=7.64s]
Epoch 0: 19%|█▉ | 2396/12384 [5:06:00<21:09:57, 7.63s/it, loss=0.0002, acc=0.9995, iter_time=7.64s]
Epoch 0: 19%|█▉ | 2396/12384 [5:06:08<21:09:57, 7.63s/it, loss=0.0004, acc=0.9988, iter_time=7.61s]
Epoch 0: 19%|█▉ | 2397/12384 [5:06:08<21:13:30, 7.65s/it, loss=0.0004, acc=0.9988, iter_time=7.61s]
Epoch 0: 19%|█▉ | 2397/12384 [5:06:16<21:13:30, 7.65s/it, loss=0.0006, acc=0.9976, iter_time=7.70s]
Epoch 0: 19%|█▉ | 2398/12384 [5:06:16<21:11:57, 7.64s/it, loss=0.0006, acc=0.9976, iter_time=7.70s]
Epoch 0: 19%|█▉ | 2398/12384 [5:06:24<21:11:57, 7.64s/it, loss=0.0002, acc=0.9995, iter_time=7.93s]
Epoch 0: 19%|█▉ | 2399/12384 [5:06:24<21:25:51, 7.73s/it, loss=0.0002, acc=0.9995, iter_time=7.93s]
Epoch 0: 19%|█▉ | 2399/12384 [5:06:31<21:25:51, 7.73s/it, loss=0.0007, acc=0.9974, iter_time=8.05s]
Epoch 0: 19%|█▉ | 2400/12384 [5:06:31<21:21:59, 7.70s/it, loss=0.0007, acc=0.9974, iter_time=8.05s]
Epoch 0: 19%|█▉ | 2400/12384 [5:06:39<21:21:59, 7.70s/it, loss=0.0004, acc=0.9981, iter_time=7.24s]
Epoch 0: 19%|█▉ | 2401/12384 [5:06:39<21:31:55, 7.76s/it, loss=0.0004, acc=0.9981, iter_time=7.24s]
Epoch 0: 19%|█▉ | 2401/12384 [5:06:47<21:31:55, 7.76s/it, loss=0.0009, acc=0.9955, iter_time=7.88s]
Epoch 0: 19%|█▉ | 2402/12384 [5:06:47<21:25:44, 7.73s/it, loss=0.0009, acc=0.9955, iter_time=7.88s]
Epoch 0: 19%|█▉ | 2402/12384 [5:06:55<21:25:44, 7.73s/it, loss=0.0007, acc=0.9995, iter_time=7.71s]
Epoch 0: 19%|█▉ | 2403/12384 [5:06:55<21:23:01, 7.71s/it, loss=0.0007, acc=0.9995, iter_time=7.71s]
Epoch 0: 19%|█▉ | 2403/12384 [5:07:02<21:23:01, 7.71s/it, loss=0.0003, acc=0.9994, iter_time=7.64s]
Epoch 0: 19%|█▉ | 2404/12384 [5:07:02<21:19:19, 7.69s/it, loss=0.0003, acc=0.9994, iter_time=7.64s]
Epoch 0: 19%|█▉ | 2404/12384 [5:07:10<21:19:19, 7.69s/it, loss=0.0005, acc=0.9985, iter_time=7.62s]
Epoch 0: 19%|█▉ | 2405/12384 [5:07:10<21:17:47, 7.68s/it, loss=0.0005, acc=0.9985, iter_time=7.62s]
Epoch 0: 19%|█▉ | 2405/12384 [5:07:18<21:17:47, 7.68s/it, loss=0.0001, acc=0.9999, iter_time=7.77s]
Epoch 0: 19%|█▉ | 2406/12384 [5:07:18<21:19:30, 7.69s/it, loss=0.0001, acc=0.9999, iter_time=7.77s]
Epoch 0: 19%|█▉ | 2406/12384 [5:07:25<21:19:30, 7.69s/it, loss=0.0004, acc=0.9978, iter_time=7.61s]
Epoch 0: 19%|█▉ | 2407/12384 [5:07:25<21:16:22, 7.68s/it, loss=0.0004, acc=0.9978, iter_time=7.61s]
Epoch 0: 19%|█▉ | 2407/12384 [5:07:33<21:16:22, 7.68s/it, loss=0.0013, acc=0.9973, iter_time=7.61s]
Epoch 0: 19%|█▉ | 2408/12384 [5:07:33<21:14:15, 7.66s/it, loss=0.0013, acc=0.9973, iter_time=7.61s]
Epoch 0: 19%|█▉ | 2408/12384 [5:07:40<21:14:15, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 19%|█▉ | 2409/12384 [5:07:40<21:11:45, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 19%|█▉ | 2409/12384 [5:07:48<21:11:45, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=4.05s]
Epoch 0: 19%|█▉ | 2410/12384 [5:07:48<21:09:10, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=4.05s]
Epoch 0: 19%|█▉ | 2410/12384 [5:07:56<21:09:10, 7.63s/it, loss=0.0008, acc=0.9971, iter_time=9.10s]
Epoch 0: 19%|█▉ | 2411/12384 [5:07:56<21:09:24, 7.64s/it, loss=0.0008, acc=0.9971, iter_time=9.10s]
Epoch 0: 19%|█▉ | 2411/12384 [5:08:03<21:09:24, 7.64s/it, loss=0.0008, acc=0.9982, iter_time=9.72s]
Epoch 0: 19%|█▉ | 2412/12384 [5:08:03<21:08:46, 7.63s/it, loss=0.0008, acc=0.9982, iter_time=9.72s]
Epoch 0: 19%|█▉ | 2412/12384 [5:08:11<21:08:46, 7.63s/it, loss=0.0010, acc=0.9971, iter_time=7.65s]
Epoch 0: 19%|█▉ | 2413/12384 [5:08:11<21:10:42, 7.65s/it, loss=0.0010, acc=0.9971, iter_time=7.65s]
Epoch 0: 19%|█▉ | 2413/12384 [5:08:19<21:10:42, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 0: 19%|█▉ | 2414/12384 [5:08:19<21:10:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.03s]
Epoch 0: 19%|█▉ | 2414/12384 [5:08:26<21:10:11, 7.64s/it, loss=0.0004, acc=0.9998, iter_time=8.28s]
Epoch 0: 20%|█▉ | 2415/12384 [5:08:26<21:08:49, 7.64s/it, loss=0.0004, acc=0.9998, iter_time=8.28s]
Epoch 0: 20%|█▉ | 2415/12384 [5:08:34<21:08:49, 7.64s/it, loss=0.0007, acc=0.9951, iter_time=8.02s]
Epoch 0: 20%|█▉ | 2416/12384 [5:08:34<21:10:04, 7.64s/it, loss=0.0007, acc=0.9951, iter_time=8.02s]
Epoch 0: 20%|█▉ | 2416/12384 [5:08:42<21:10:04, 7.64s/it, loss=0.0003, acc=0.9987, iter_time=7.27s]
Epoch 0: 20%|█▉ | 2417/12384 [5:08:42<21:09:44, 7.64s/it, loss=0.0003, acc=0.9987, iter_time=7.27s]
Epoch 0: 20%|█▉ | 2417/12384 [5:08:49<21:09:44, 7.64s/it, loss=0.0006, acc=0.9966, iter_time=7.65s]
Epoch 0: 20%|█▉ | 2418/12384 [5:08:49<21:08:45, 7.64s/it, loss=0.0006, acc=0.9966, iter_time=7.65s]
Epoch 0: 20%|█▉ | 2418/12384 [5:08:57<21:08:45, 7.64s/it, loss=0.0004, acc=0.9995, iter_time=7.63s]
Epoch 0: 20%|█▉ | 2419/12384 [5:08:57<21:08:47, 7.64s/it, loss=0.0004, acc=0.9995, iter_time=7.63s]
Epoch 0: 20%|█▉ | 2419/12384 [5:09:04<21:08:47, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 20%|█▉ | 2420/12384 [5:09:04<21:08:52, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 20%|█▉ | 2420/12384 [5:09:12<21:08:52, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 0: 20%|█▉ | 2421/12384 [5:09:12<21:07:05, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.00s]
Epoch 0: 20%|█▉ | 2421/12384 [5:09:20<21:07:05, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=8.24s]
Epoch 0: 20%|█▉ | 2422/12384 [5:09:20<21:06:08, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=8.24s]
Epoch 0: 20%|█▉ | 2422/12384 [5:09:27<21:06:08, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.61s]
Epoch 0: 20%|█▉ | 2423/12384 [5:09:27<21:06:18, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=4.61s]
Epoch 0: 20%|█▉ | 2423/12384 [5:09:35<21:06:18, 7.63s/it, loss=0.0008, acc=0.9979, iter_time=10.62s]
Epoch 0: 20%|█▉ | 2424/12384 [5:09:35<21:06:42, 7.63s/it, loss=0.0008, acc=0.9979, iter_time=10.62s]
Epoch 0: 20%|█▉ | 2424/12384 [5:09:43<21:06:42, 7.63s/it, loss=0.0018, acc=0.9978, iter_time=7.94s]
Epoch 0: 20%|█▉ | 2425/12384 [5:09:43<21:18:53, 7.70s/it, loss=0.0018, acc=0.9978, iter_time=7.94s]
Epoch 0: 20%|█▉ | 2425/12384 [5:09:51<21:18:53, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 20%|█▉ | 2426/12384 [5:09:51<21:16:04, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 20%|█▉ | 2426/12384 [5:09:58<21:16:04, 7.69s/it, loss=0.0006, acc=0.9998, iter_time=7.67s]
Epoch 0: 20%|█▉ | 2427/12384 [5:09:58<21:27:08, 7.76s/it, loss=0.0006, acc=0.9998, iter_time=7.67s]
Epoch 0: 20%|█▉ | 2427/12384 [5:10:06<21:27:08, 7.76s/it, loss=0.0023, acc=0.9939, iter_time=4.86s]
Epoch 0: 20%|█▉ | 2428/12384 [5:10:06<21:20:31, 7.72s/it, loss=0.0023, acc=0.9939, iter_time=4.86s]
Epoch 0: 20%|█▉ | 2428/12384 [5:10:14<21:20:31, 7.72s/it, loss=0.0001, acc=0.9999, iter_time=10.63s]
Epoch 0: 20%|█▉ | 2429/12384 [5:10:14<21:15:59, 7.69s/it, loss=0.0001, acc=0.9999, iter_time=10.63s]
Epoch 0: 20%|█▉ | 2429/12384 [5:10:21<21:15:59, 7.69s/it, loss=0.0003, acc=0.9980, iter_time=7.64s]
Epoch 0: 20%|█▉ | 2430/12384 [5:10:21<21:11:56, 7.67s/it, loss=0.0003, acc=0.9980, iter_time=7.64s]
Epoch 0: 20%|█▉ | 2430/12384 [5:10:29<21:11:56, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 20%|█▉ | 2431/12384 [5:10:29<21:12:05, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 20%|█▉ | 2431/12384 [5:10:37<21:12:05, 7.67s/it, loss=0.0079, acc=0.9976, iter_time=7.66s]
Epoch 0: 20%|█▉ | 2432/12384 [5:10:37<21:12:10, 7.67s/it, loss=0.0079, acc=0.9976, iter_time=7.66s]
Epoch 0: 20%|█▉ | 2432/12384 [5:10:44<21:12:10, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 20%|█▉ | 2433/12384 [5:10:44<21:09:26, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 20%|█▉ | 2433/12384 [5:10:52<21:09:26, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.65s]
Epoch 0: 20%|█▉ | 2434/12384 [5:10:52<21:07:02, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.65s]
Epoch 0: 20%|█▉ | 2434/12384 [5:11:00<21:07:02, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.61s]
Epoch 0: 20%|█▉ | 2435/12384 [5:11:00<21:07:01, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.61s]
Epoch 0: 20%|█▉ | 2435/12384 [5:11:07<21:07:01, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=7.63s]
Epoch 0: 20%|█▉ | 2436/12384 [5:11:07<21:06:38, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=7.63s]
Epoch 0: 20%|█▉ | 2436/12384 [5:11:15<21:06:38, 7.64s/it, loss=0.0007, acc=0.9977, iter_time=7.67s]
Epoch 0: 20%|█▉ | 2437/12384 [5:11:15<21:07:45, 7.65s/it, loss=0.0007, acc=0.9977, iter_time=7.67s]
Epoch 0: 20%|█▉ | 2437/12384 [5:11:22<21:07:45, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 20%|█▉ | 2438/12384 [5:11:22<21:06:35, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.64s]
Epoch 0: 20%|█▉ | 2438/12384 [5:11:30<21:06:35, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 20%|█▉ | 2439/12384 [5:11:30<21:10:38, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 20%|█▉ | 2439/12384 [5:11:38<21:10:38, 7.67s/it, loss=0.0003, acc=1.0000, iter_time=7.68s]
Epoch 0: 20%|█▉ | 2440/12384 [5:11:38<21:08:08, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=7.68s]
Epoch 0: 20%|█▉ | 2440/12384 [5:11:45<21:08:08, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 20%|█▉ | 2441/12384 [5:11:45<21:06:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.66s]
Epoch 0: 20%|█▉ | 2441/12384 [5:11:53<21:06:24, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 0: 20%|█▉ | 2442/12384 [5:11:53<21:03:53, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.01s]
Epoch 0: 20%|█▉ | 2442/12384 [5:12:01<21:03:53, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=6.43s]
Epoch 0: 20%|█▉ | 2443/12384 [5:12:01<21:05:43, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=6.43s]
Epoch 0: 20%|█▉ | 2443/12384 [5:12:08<21:05:43, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=9.44s]
Epoch 0: 20%|█▉ | 2444/12384 [5:12:08<21:04:25, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=9.44s]
Epoch 0: 20%|█▉ | 2444/12384 [5:12:16<21:04:25, 7.63s/it, loss=0.0002, acc=0.9998, iter_time=7.63s]
Epoch 0: 20%|█▉ | 2445/12384 [5:12:16<21:04:14, 7.63s/it, loss=0.0002, acc=0.9998, iter_time=7.63s]
Epoch 0: 20%|█▉ | 2445/12384 [5:12:24<21:04:14, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 20%|█▉ | 2446/12384 [5:12:24<21:05:38, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 20%|█▉ | 2446/12384 [5:12:31<21:05:38, 7.64s/it, loss=0.0006, acc=0.9975, iter_time=6.82s]
Epoch 0: 20%|█▉ | 2447/12384 [5:12:31<21:06:19, 7.65s/it, loss=0.0006, acc=0.9975, iter_time=6.82s]
Epoch 0: 20%|█▉ | 2447/12384 [5:12:39<21:06:19, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=8.86s]
Epoch 0: 20%|█▉ | 2448/12384 [5:12:39<21:05:14, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=8.86s]
Epoch 0: 20%|█▉ | 2448/12384 [5:12:46<21:05:14, 7.64s/it, loss=0.0003, acc=0.9990, iter_time=7.25s]
Epoch 0: 20%|█▉ | 2449/12384 [5:12:46<21:03:58, 7.63s/it, loss=0.0003, acc=0.9990, iter_time=7.25s]
Epoch 0: 20%|█▉ | 2449/12384 [5:12:54<21:03:58, 7.63s/it, loss=0.0042, acc=0.9888, iter_time=8.03s]
Epoch 0: 20%|█▉ | 2450/12384 [5:12:54<21:04:11, 7.64s/it, loss=0.0042, acc=0.9888, iter_time=8.03s]
Epoch 0: 20%|█▉ | 2450/12384 [5:13:02<21:04:11, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.51s]
Epoch 0: 20%|█▉ | 2451/12384 [5:13:02<21:17:09, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.51s]
Epoch 0: 20%|█▉ | 2451/12384 [5:13:10<21:17:09, 7.71s/it, loss=0.0007, acc=0.9985, iter_time=5.50s]
Epoch 0: 20%|█▉ | 2452/12384 [5:13:10<21:13:46, 7.69s/it, loss=0.0007, acc=0.9985, iter_time=5.50s]
Epoch 0: 20%|█▉ | 2452/12384 [5:13:18<21:13:46, 7.69s/it, loss=0.0003, acc=1.0000, iter_time=9.18s]
Epoch 0: 20%|█▉ | 2453/12384 [5:13:18<21:29:35, 7.79s/it, loss=0.0003, acc=1.0000, iter_time=9.18s]
Epoch 0: 20%|█▉ | 2453/12384 [5:13:25<21:29:35, 7.79s/it, loss=0.0001, acc=1.0000, iter_time=8.60s]
Epoch 0: 20%|█▉ | 2454/12384 [5:13:25<21:21:05, 7.74s/it, loss=0.0001, acc=1.0000, iter_time=8.60s]
Epoch 0: 20%|█▉ | 2454/12384 [5:13:33<21:21:05, 7.74s/it, loss=0.0007, acc=0.9981, iter_time=5.55s]
Epoch 0: 20%|█▉ | 2455/12384 [5:13:33<21:16:27, 7.71s/it, loss=0.0007, acc=0.9981, iter_time=5.55s]
Epoch 0: 20%|█▉ | 2455/12384 [5:13:41<21:16:27, 7.71s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 0: 20%|█▉ | 2456/12384 [5:13:41<21:13:46, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=9.71s]
Epoch 0: 20%|█▉ | 2456/12384 [5:13:48<21:13:46, 7.70s/it, loss=0.0002, acc=1.0000, iter_time=7.68s]
Epoch 0: 20%|█▉ | 2457/12384 [5:13:48<21:11:05, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=7.68s]
Epoch 0: 20%|█▉ | 2457/12384 [5:13:56<21:11:05, 7.68s/it, loss=0.0009, acc=0.9953, iter_time=5.84s]
Epoch 0: 20%|█▉ | 2458/12384 [5:13:56<21:09:59, 7.68s/it, loss=0.0009, acc=0.9953, iter_time=5.84s]
Epoch 0: 20%|█▉ | 2458/12384 [5:14:04<21:09:59, 7.68s/it, loss=0.0002, acc=0.9987, iter_time=9.48s]
Epoch 0: 20%|█▉ | 2459/12384 [5:14:04<21:08:29, 7.67s/it, loss=0.0002, acc=0.9987, iter_time=9.48s]
Epoch 0: 20%|█▉ | 2459/12384 [5:14:11<21:08:29, 7.67s/it, loss=0.0002, acc=0.9998, iter_time=7.68s]
Epoch 0: 20%|█▉ | 2460/12384 [5:14:11<21:08:24, 7.67s/it, loss=0.0002, acc=0.9998, iter_time=7.68s]
Epoch 0: 20%|█▉ | 2460/12384 [5:14:19<21:08:24, 7.67s/it, loss=0.0001, acc=0.9996, iter_time=7.64s]
Epoch 0: 20%|█▉ | 2461/12384 [5:14:19<21:06:19, 7.66s/it, loss=0.0001, acc=0.9996, iter_time=7.64s]
Epoch 0: 20%|█▉ | 2461/12384 [5:14:27<21:06:19, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 20%|█▉ | 2462/12384 [5:14:27<21:09:18, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 20%|█▉ | 2462/12384 [5:14:34<21:09:18, 7.68s/it, loss=0.0013, acc=0.9985, iter_time=7.41s]
Epoch 0: 20%|█▉ | 2463/12384 [5:14:34<21:07:06, 7.66s/it, loss=0.0013, acc=0.9985, iter_time=7.41s]
Epoch 0: 20%|█▉ | 2463/12384 [5:14:42<21:07:06, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.94s]
Epoch 0: 20%|█▉ | 2464/12384 [5:14:42<21:07:27, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.94s]
Epoch 0: 20%|█▉ | 2464/12384 [5:14:50<21:07:27, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=5.86s]
Epoch 0: 20%|█▉ | 2465/12384 [5:14:50<21:05:24, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=5.86s]
Epoch 0: 20%|█▉ | 2465/12384 [5:14:57<21:05:24, 7.65s/it, loss=0.0003, acc=0.9985, iter_time=9.44s]
Epoch 0: 20%|█▉ | 2466/12384 [5:14:57<21:05:20, 7.65s/it, loss=0.0003, acc=0.9985, iter_time=9.44s]
Epoch 0: 20%|█▉ | 2466/12384 [5:15:05<21:05:20, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=4.60s]
Epoch 0: 20%|█▉ | 2467/12384 [5:15:05<21:05:36, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=4.60s]
Epoch 0: 20%|█▉ | 2467/12384 [5:15:12<21:05:36, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.95s]
Epoch 0: 20%|█▉ | 2468/12384 [5:15:12<21:05:46, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.95s]
Epoch 0: 20%|█▉ | 2468/12384 [5:15:20<21:05:46, 7.66s/it, loss=0.0003, acc=1.0000, iter_time=9.42s]
Epoch 0: 20%|█▉ | 2469/12384 [5:15:20<21:03:07, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=9.42s]
Epoch 0: 20%|█▉ | 2469/12384 [5:15:28<21:03:07, 7.64s/it, loss=0.0004, acc=0.9992, iter_time=7.70s]
Epoch 0: 20%|█▉ | 2470/12384 [5:15:28<21:05:39, 7.66s/it, loss=0.0004, acc=0.9992, iter_time=7.70s]
Epoch 0: 20%|█▉ | 2470/12384 [5:15:35<21:05:39, 7.66s/it, loss=0.0005, acc=0.9977, iter_time=7.61s]
Epoch 0: 20%|█▉ | 2471/12384 [5:15:35<21:04:22, 7.65s/it, loss=0.0005, acc=0.9977, iter_time=7.61s]
Epoch 0: 20%|█▉ | 2471/12384 [5:15:43<21:04:22, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.01s]
Epoch 0: 20%|█▉ | 2472/12384 [5:15:43<21:03:46, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.01s]
Epoch 0: 20%|█▉ | 2472/12384 [5:15:51<21:03:46, 7.65s/it, loss=0.0004, acc=1.0000, iter_time=7.27s]
Epoch 0: 20%|█▉ | 2473/12384 [5:15:51<21:02:11, 7.64s/it, loss=0.0004, acc=1.0000, iter_time=7.27s]
Epoch 0: 20%|█▉ | 2473/12384 [5:15:58<21:02:11, 7.64s/it, loss=0.0009, acc=0.9980, iter_time=7.62s]
Epoch 0: 20%|█▉ | 2474/12384 [5:15:58<21:01:32, 7.64s/it, loss=0.0009, acc=0.9980, iter_time=7.62s]
Epoch 0: 20%|█▉ | 2474/12384 [5:16:06<21:01:32, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 0: 20%|█▉ | 2475/12384 [5:16:06<21:02:21, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=6.10s]
Epoch 0: 20%|█▉ | 2475/12384 [5:16:14<21:02:21, 7.64s/it, loss=0.0001, acc=0.9995, iter_time=9.18s]
Epoch 0: 20%|█▉ | 2476/12384 [5:16:14<21:04:05, 7.65s/it, loss=0.0001, acc=0.9995, iter_time=9.18s]
Epoch 0: 20%|█▉ | 2476/12384 [5:16:21<21:04:05, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.69s]
Epoch 0: 20%|██ | 2477/12384 [5:16:21<21:07:01, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=7.69s]
Epoch 0: 20%|██ | 2477/12384 [5:16:29<21:07:01, 7.67s/it, loss=0.0003, acc=1.0000, iter_time=4.68s]
Epoch 0: 20%|██ | 2478/12384 [5:16:29<21:05:01, 7.66s/it, loss=0.0003, acc=1.0000, iter_time=4.68s]
Epoch 0: 20%|██ | 2478/12384 [5:16:37<21:05:01, 7.66s/it, loss=0.0011, acc=0.9960, iter_time=10.66s]
Epoch 0: 20%|██ | 2479/12384 [5:16:37<21:03:07, 7.65s/it, loss=0.0011, acc=0.9960, iter_time=10.66s]
Epoch 0: 20%|██ | 2479/12384 [5:16:45<21:03:07, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=8.11s]
Epoch 0: 20%|██ | 2480/12384 [5:16:45<21:22:33, 7.77s/it, loss=0.0003, acc=1.0000, iter_time=8.11s]
Epoch 0: 20%|██ | 2480/12384 [5:16:52<21:22:33, 7.77s/it, loss=0.0006, acc=0.9970, iter_time=7.60s]
Epoch 0: 20%|██ | 2481/12384 [5:16:52<21:19:33, 7.75s/it, loss=0.0006, acc=0.9970, iter_time=7.60s]
Epoch 0: 20%|██ | 2481/12384 [5:17:00<21:19:33, 7.75s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 20%|██ | 2482/12384 [5:17:00<21:14:43, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=7.70s]
Epoch 0: 20%|██ | 2482/12384 [5:17:08<21:14:43, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=4.30s]
Epoch 0: 20%|██ | 2483/12384 [5:17:08<21:11:58, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=4.30s]
Epoch 0: 20%|██ | 2483/12384 [5:17:15<21:11:58, 7.71s/it, loss=0.0051, acc=0.9972, iter_time=10.43s]
Epoch 0: 20%|██ | 2484/12384 [5:17:15<21:12:11, 7.71s/it, loss=0.0051, acc=0.9972, iter_time=10.43s]
Epoch 0: 20%|██ | 2484/12384 [5:17:23<21:12:11, 7.71s/it, loss=0.0002, acc=1.0000, iter_time=5.54s]
Epoch 0: 20%|██ | 2485/12384 [5:17:23<21:07:36, 7.68s/it, loss=0.0002, acc=1.0000, iter_time=5.54s]
Epoch 0: 20%|██ | 2485/12384 [5:17:31<21:07:36, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=10.40s]
Epoch 0: 20%|██ | 2486/12384 [5:17:31<21:04:14, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=10.40s]
Epoch 0: 20%|██ | 2486/12384 [5:17:38<21:04:14, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 20%|██ | 2487/12384 [5:17:38<21:02:04, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.61s]
Epoch 0: 20%|██ | 2487/12384 [5:17:46<21:02:04, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 20%|██ | 2488/12384 [5:17:46<21:00:35, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.59s]
Epoch 0: 20%|██ | 2488/12384 [5:17:54<21:00:35, 7.64s/it, loss=0.0003, acc=0.9991, iter_time=7.66s]
Epoch 0: 20%|██ | 2489/12384 [5:17:54<21:02:02, 7.65s/it, loss=0.0003, acc=0.9991, iter_time=7.66s]
Epoch 0: 20%|██ | 2489/12384 [5:18:01<21:02:02, 7.65s/it, loss=0.0012, acc=0.9982, iter_time=6.48s]
Epoch 0: 20%|██ | 2490/12384 [5:18:01<21:00:49, 7.65s/it, loss=0.0012, acc=0.9982, iter_time=6.48s]
Epoch 0: 20%|██ | 2490/12384 [5:18:09<21:00:49, 7.65s/it, loss=0.0002, acc=0.9992, iter_time=8.83s]
Epoch 0: 20%|██ | 2491/12384 [5:18:09<21:04:05, 7.67s/it, loss=0.0002, acc=0.9992, iter_time=8.83s]
Epoch 0: 20%|██ | 2491/12384 [5:18:17<21:04:05, 7.67s/it, loss=0.0001, acc=0.9998, iter_time=7.71s]
Epoch 0: 20%|██ | 2492/12384 [5:18:17<21:01:27, 7.65s/it, loss=0.0001, acc=0.9998, iter_time=7.71s]
Epoch 0: 20%|██ | 2492/12384 [5:18:24<21:01:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 20%|██ | 2493/12384 [5:18:24<20:59:40, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.63s]
Epoch 0: 20%|██ | 2493/12384 [5:18:32<20:59:40, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=5.81s]
Epoch 0: 20%|██ | 2494/12384 [5:18:32<20:59:40, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=5.81s]
Epoch 0: 20%|██ | 2494/12384 [5:18:39<20:59:40, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=9.45s]
Epoch 0: 20%|██ | 2495/12384 [5:18:39<20:59:16, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=9.45s]
Epoch 0: 20%|██ | 2495/12384 [5:18:47<20:59:16, 7.64s/it, loss=0.0004, acc=0.9982, iter_time=8.03s]
Epoch 0: 20%|██ | 2496/12384 [5:18:47<20:58:48, 7.64s/it, loss=0.0004, acc=0.9982, iter_time=8.03s]
Epoch 0: 20%|██ | 2496/12384 [5:18:55<20:58:48, 7.64s/it, loss=0.0005, acc=0.9987, iter_time=7.23s]
Epoch 0: 20%|██ | 2497/12384 [5:18:55<20:58:25, 7.64s/it, loss=0.0005, acc=0.9987, iter_time=7.23s]
Epoch 0: 20%|██ | 2497/12384 [5:19:02<20:58:25, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=4.32s]
Epoch 0: 20%|██ | 2498/12384 [5:19:02<20:58:05, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=4.32s]
Epoch 0: 20%|██ | 2498/12384 [5:19:10<20:58:05, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=9.15s]
Epoch 0: 20%|██ | 2499/12384 [5:19:10<20:56:45, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=9.15s]
Epoch 0: 20%|██ | 2499/12384 [5:19:18<20:56:45, 7.63s/it, loss=0.0012, acc=0.9991, iter_time=9.83s]
Epoch 0: 20%|██ | 2500/12384 [5:19:18<21:06:46, 7.69s/it, loss=0.0012, acc=0.9991, iter_time=9.83s]
Epoch 0: 20%|██ | 2500/12384 [5:19:25<21:06:46, 7.69s/it, loss=0.0013, acc=0.9951, iter_time=5.15s]
Epoch 0: 20%|██ | 2501/12384 [5:19:25<21:04:06, 7.67s/it, loss=0.0013, acc=0.9951, iter_time=5.15s]
Epoch 0: 20%|██ | 2501/12384 [5:19:33<21:04:06, 7.67s/it, loss=0.0009, acc=1.0000, iter_time=9.89s]
Epoch 0: 20%|██ | 2502/12384 [5:19:33<21:01:38, 7.66s/it, loss=0.0009, acc=1.0000, iter_time=9.89s]
Epoch 0: 20%|██ | 2502/12384 [5:19:41<21:01:38, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.66s]
Epoch 0: 20%|██ | 2503/12384 [5:19:41<21:02:29, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=7.66s]
Epoch 0: 20%|██ | 2503/12384 [5:19:48<21:02:29, 7.67s/it, loss=0.0005, acc=0.9997, iter_time=8.02s]
Epoch 0: 20%|██ | 2504/12384 [5:19:48<21:01:25, 7.66s/it, loss=0.0005, acc=0.9997, iter_time=8.02s]
Epoch 0: 20%|██ | 2504/12384 [5:19:56<21:01:25, 7.66s/it, loss=0.0008, acc=0.9976, iter_time=7.25s]
Epoch 0: 20%|██ | 2505/12384 [5:19:56<20:58:29, 7.64s/it, loss=0.0008, acc=0.9976, iter_time=7.25s]
Epoch 0: 20%|██ | 2505/12384 [5:20:04<20:58:29, 7.64s/it, loss=0.0004, acc=0.9990, iter_time=7.04s]
Epoch 0: 20%|██ | 2506/12384 [5:20:04<21:14:29, 7.74s/it, loss=0.0004, acc=0.9990, iter_time=7.04s]
Epoch 0: 20%|██ | 2506/12384 [5:20:12<21:14:29, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 0: 20%|██ | 2507/12384 [5:20:12<21:08:20, 7.70s/it, loss=0.0000, acc=1.0000, iter_time=8.55s]
Epoch 0: 20%|██ | 2507/12384 [5:20:19<21:08:20, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=6.99s]
Epoch 0: 20%|██ | 2508/12384 [5:20:19<21:09:16, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=6.99s]
Epoch 0: 20%|██ | 2508/12384 [5:20:27<21:09:16, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=8.38s]
Epoch 0: 20%|██ | 2509/12384 [5:20:27<21:05:24, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=8.38s]
Epoch 0: 20%|██ | 2509/12384 [5:20:35<21:05:24, 7.69s/it, loss=0.0048, acc=0.9965, iter_time=7.61s]
Epoch 0: 20%|██ | 2510/12384 [5:20:35<21:01:22, 7.66s/it, loss=0.0048, acc=0.9965, iter_time=7.61s]
Epoch 0: 20%|██ | 2510/12384 [5:20:42<21:01:22, 7.66s/it, loss=0.0004, acc=0.9995, iter_time=4.75s]
Epoch 0: 20%|██ | 2511/12384 [5:20:42<21:00:02, 7.66s/it, loss=0.0004, acc=0.9995, iter_time=4.75s]
Epoch 0: 20%|██ | 2511/12384 [5:20:50<21:00:02, 7.66s/it, loss=0.0002, acc=0.9997, iter_time=10.56s]
Epoch 0: 20%|██ | 2512/12384 [5:20:50<21:03:11, 7.68s/it, loss=0.0002, acc=0.9997, iter_time=10.56s]
Epoch 0: 20%|██ | 2512/12384 [5:20:58<21:03:11, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.68s]
Epoch 0: 20%|██ | 2513/12384 [5:20:58<20:59:57, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.68s]
Epoch 0: 20%|██ | 2513/12384 [5:21:05<20:59:57, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=4.55s]
Epoch 0: 20%|██ | 2514/12384 [5:21:05<20:54:06, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=4.55s]
Epoch 0: 20%|██ | 2514/12384 [5:21:13<20:54:06, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=10.62s]
Epoch 0: 20%|██ | 2515/12384 [5:21:13<20:54:14, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.62s]
Epoch 0: 20%|██ | 2515/12384 [5:21:20<20:54:14, 7.63s/it, loss=0.0003, acc=0.9997, iter_time=6.72s]
Epoch 0: 20%|██ | 2516/12384 [5:21:20<20:53:12, 7.62s/it, loss=0.0003, acc=0.9997, iter_time=6.72s]
Epoch 0: 20%|██ | 2516/12384 [5:21:28<20:53:12, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.50s]
Epoch 0: 20%|██ | 2517/12384 [5:21:28<20:52:26, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=8.50s]
Epoch 0: 20%|██ | 2517/12384 [5:21:36<20:52:26, 7.62s/it, loss=0.0010, acc=0.9984, iter_time=7.62s]
Epoch 0: 20%|██ | 2518/12384 [5:21:36<20:52:20, 7.62s/it, loss=0.0010, acc=0.9984, iter_time=7.62s]
Epoch 0: 20%|██ | 2518/12384 [5:21:43<20:52:20, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 20%|██ | 2519/12384 [5:21:43<20:52:57, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 20%|██ | 2519/12384 [5:21:51<20:52:57, 7.62s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 0: 20%|██ | 2520/12384 [5:21:51<20:55:25, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.04s]
Epoch 0: 20%|██ | 2520/12384 [5:21:58<20:55:25, 7.64s/it, loss=0.0003, acc=0.9986, iter_time=7.27s]
Epoch 0: 20%|██ | 2521/12384 [5:21:58<20:55:17, 7.64s/it, loss=0.0003, acc=0.9986, iter_time=7.27s]
Epoch 0: 20%|██ | 2521/12384 [5:22:06<20:55:17, 7.64s/it, loss=0.0004, acc=1.0000, iter_time=7.62s]
Epoch 0: 20%|██ | 2522/12384 [5:22:06<20:54:50, 7.63s/it, loss=0.0004, acc=1.0000, iter_time=7.62s]
Epoch 0: 20%|██ | 2522/12384 [5:22:14<20:54:50, 7.63s/it, loss=0.0043, acc=0.9953, iter_time=7.64s]
Epoch 0: 20%|██ | 2523/12384 [5:22:14<20:54:26, 7.63s/it, loss=0.0043, acc=0.9953, iter_time=7.64s]
Epoch 0: 20%|██ | 2523/12384 [5:22:21<20:54:26, 7.63s/it, loss=0.0003, acc=0.9990, iter_time=7.62s]
Epoch 0: 20%|██ | 2524/12384 [5:22:21<20:54:32, 7.63s/it, loss=0.0003, acc=0.9990, iter_time=7.62s]
Epoch 0: 20%|██ | 2524/12384 [5:22:29<20:54:32, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 20%|██ | 2525/12384 [5:22:29<20:54:18, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.63s]
Epoch 0: 20%|██ | 2525/12384 [5:22:37<20:54:18, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=4.25s]
Epoch 0: 20%|██ | 2526/12384 [5:22:37<20:55:08, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=4.25s]
Epoch 0: 20%|██ | 2526/12384 [5:22:44<20:55:08, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=11.04s]
Epoch 0: 20%|██ | 2527/12384 [5:22:44<20:54:59, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=11.04s]
Epoch 0: 20%|██ | 2527/12384 [5:22:52<20:54:59, 7.64s/it, loss=0.0002, acc=0.9998, iter_time=8.03s]
Epoch 0: 20%|██ | 2528/12384 [5:22:52<20:55:31, 7.64s/it, loss=0.0002, acc=0.9998, iter_time=8.03s]
Epoch 0: 20%|██ | 2528/12384 [5:23:00<20:55:31, 7.64s/it, loss=0.0057, acc=0.9915, iter_time=3.24s]
Epoch 0: 20%|██ | 2529/12384 [5:23:00<20:57:11, 7.65s/it, loss=0.0057, acc=0.9915, iter_time=3.24s]
Epoch 0: 20%|██ | 2529/12384 [5:23:07<20:57:11, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=8.43s]
Epoch 0: 20%|██ | 2530/12384 [5:23:07<20:55:18, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=8.43s]
Epoch 0: 20%|██ | 2530/12384 [5:23:15<20:55:18, 7.64s/it, loss=0.0011, acc=0.9967, iter_time=10.90s]
Epoch 0: 20%|██ | 2531/12384 [5:23:15<20:57:22, 7.66s/it, loss=0.0011, acc=0.9967, iter_time=10.90s]
Epoch 0: 20%|██ | 2531/12384 [5:23:23<20:57:22, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.68s]
Epoch 0: 20%|██ | 2532/12384 [5:23:23<20:56:03, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.68s]
Epoch 0: 20%|██ | 2532/12384 [5:23:31<20:56:03, 7.65s/it, loss=0.0019, acc=0.9966, iter_time=4.54s]
Epoch 0: 20%|██ | 2533/12384 [5:23:31<21:13:13, 7.75s/it, loss=0.0019, acc=0.9966, iter_time=4.54s]
Epoch 0: 20%|██ | 2533/12384 [5:23:38<21:13:13, 7.75s/it, loss=0.0002, acc=1.0000, iter_time=11.09s]
Epoch 0: 20%|██ | 2534/12384 [5:23:38<21:05:53, 7.71s/it, loss=0.0002, acc=1.0000, iter_time=11.09s]
Epoch 0: 20%|██ | 2534/12384 [5:23:46<21:05:53, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=5.30s]
Epoch 0: 20%|██ | 2535/12384 [5:23:46<21:02:10, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=5.30s]
Epoch 0: 20%|██ | 2535/12384 [5:23:54<21:02:10, 7.69s/it, loss=0.0024, acc=0.9950, iter_time=10.35s]
Epoch 0: 20%|██ | 2536/12384 [5:23:54<21:00:53, 7.68s/it, loss=0.0024, acc=0.9950, iter_time=10.35s]
Epoch 0: 20%|██ | 2536/12384 [5:24:01<21:00:53, 7.68s/it, loss=0.0005, acc=0.9998, iter_time=6.69s]
Epoch 0: 20%|██ | 2537/12384 [5:24:01<20:58:51, 7.67s/it, loss=0.0005, acc=0.9998, iter_time=6.69s]
Epoch 0: 20%|██ | 2537/12384 [5:24:09<20:58:51, 7.67s/it, loss=0.0003, acc=0.9999, iter_time=8.21s]
Epoch 0: 20%|██ | 2538/12384 [5:24:09<20:55:14, 7.65s/it, loss=0.0003, acc=0.9999, iter_time=8.21s]
Epoch 0: 20%|██ | 2538/12384 [5:24:16<20:55:14, 7.65s/it, loss=0.0007, acc=0.9980, iter_time=5.36s]
Epoch 0: 21%|██ | 2539/12384 [5:24:16<20:53:43, 7.64s/it, loss=0.0007, acc=0.9980, iter_time=5.36s]
Epoch 0: 21%|██ | 2539/12384 [5:24:24<20:53:43, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=9.59s]
Epoch 0: 21%|██ | 2540/12384 [5:24:24<20:54:15, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=9.59s]
Epoch 0: 21%|██ | 2540/12384 [5:24:32<20:54:15, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.95s]
Epoch 0: 21%|██ | 2541/12384 [5:24:32<20:52:28, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.95s]
Epoch 0: 21%|██ | 2541/12384 [5:24:39<20:52:28, 7.63s/it, loss=0.0005, acc=0.9985, iter_time=7.67s]
Epoch 0: 21%|██ | 2542/12384 [5:24:39<20:56:55, 7.66s/it, loss=0.0005, acc=0.9985, iter_time=7.67s]
Epoch 0: 21%|██ | 2542/12384 [5:24:47<20:56:55, 7.66s/it, loss=0.0006, acc=0.9998, iter_time=7.70s]
Epoch 0: 21%|██ | 2543/12384 [5:24:47<20:56:32, 7.66s/it, loss=0.0006, acc=0.9998, iter_time=7.70s]
Epoch 0: 21%|██ | 2543/12384 [5:24:55<20:56:32, 7.66s/it, loss=0.0021, acc=0.9942, iter_time=7.57s]
Epoch 0: 21%|██ | 2544/12384 [5:24:55<20:54:25, 7.65s/it, loss=0.0021, acc=0.9942, iter_time=7.57s]
Epoch 0: 21%|██ | 2544/12384 [5:25:02<20:54:25, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 21%|██ | 2545/12384 [5:25:02<20:54:17, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 21%|██ | 2545/12384 [5:25:10<20:54:17, 7.65s/it, loss=0.0066, acc=0.9922, iter_time=6.14s]
Epoch 0: 21%|██ | 2546/12384 [5:25:10<20:52:14, 7.64s/it, loss=0.0066, acc=0.9922, iter_time=6.14s]
Epoch 0: 21%|██ | 2546/12384 [5:25:18<20:52:14, 7.64s/it, loss=0.0003, acc=0.9986, iter_time=9.14s]
Epoch 0: 21%|██ | 2547/12384 [5:25:18<20:51:21, 7.63s/it, loss=0.0003, acc=0.9986, iter_time=9.14s]
Epoch 0: 21%|██ | 2547/12384 [5:25:25<20:51:21, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.58s]
Epoch 0: 21%|██ | 2548/12384 [5:25:25<20:51:04, 7.63s/it, loss=0.0003, acc=1.0000, iter_time=7.58s]
Epoch 0: 21%|██ | 2548/12384 [5:25:33<20:51:04, 7.63s/it, loss=0.0015, acc=0.9976, iter_time=7.66s]
Epoch 0: 21%|██ | 2549/12384 [5:25:33<20:52:19, 7.64s/it, loss=0.0015, acc=0.9976, iter_time=7.66s]
Epoch 0: 21%|██ | 2549/12384 [5:25:40<20:52:19, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 0: 21%|██ | 2550/12384 [5:25:40<20:51:45, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.08s]
Epoch 0: 21%|██ | 2550/12384 [5:25:48<20:51:45, 7.64s/it, loss=0.0002, acc=0.9997, iter_time=7.22s]
Epoch 0: 21%|██ | 2551/12384 [5:25:48<20:52:42, 7.64s/it, loss=0.0002, acc=0.9997, iter_time=7.22s]
Epoch 0: 21%|██ | 2551/12384 [5:25:56<20:52:42, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.03s]
Epoch 0: 21%|██ | 2552/12384 [5:25:56<20:50:03, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=8.03s]
Epoch 0: 21%|██ | 2552/12384 [5:26:03<20:50:03, 7.63s/it, loss=0.0004, acc=0.9994, iter_time=6.04s]
Epoch 0: 21%|██ | 2553/12384 [5:26:03<20:54:59, 7.66s/it, loss=0.0004, acc=0.9994, iter_time=6.04s]
Epoch 0: 21%|██ | 2553/12384 [5:26:11<20:54:59, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=7.97s]
Epoch 0: 21%|██ | 2554/12384 [5:26:11<20:52:48, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.97s]
Epoch 0: 21%|██ | 2554/12384 [5:26:19<20:52:48, 7.65s/it, loss=0.0009, acc=0.9967, iter_time=8.57s]
Epoch 0: 21%|██ | 2555/12384 [5:26:19<20:55:17, 7.66s/it, loss=0.0009, acc=0.9967, iter_time=8.57s]
Epoch 0: 21%|██ | 2555/12384 [5:26:26<20:55:17, 7.66s/it, loss=0.0003, acc=1.0000, iter_time=7.40s]
Epoch 0: 21%|██ | 2556/12384 [5:26:26<20:52:11, 7.64s/it, loss=0.0003, acc=1.0000, iter_time=7.40s]
Epoch 0: 21%|██ | 2556/12384 [5:26:34<20:52:11, 7.64s/it, loss=0.0003, acc=0.9986, iter_time=7.88s]
Epoch 0: 21%|██ | 2557/12384 [5:26:34<20:49:48, 7.63s/it, loss=0.0003, acc=0.9986, iter_time=7.88s]
Epoch 0: 21%|██ | 2557/12384 [5:26:42<20:49:48, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.66s]
Epoch 0: 21%|██ | 2558/12384 [5:26:42<20:51:44, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.66s]
Epoch 0: 21%|██ | 2558/12384 [5:26:50<20:51:44, 7.64s/it, loss=0.0003, acc=0.9987, iter_time=7.65s]
Epoch 0: 21%|██ | 2559/12384 [5:26:50<21:08:22, 7.75s/it, loss=0.0003, acc=0.9987, iter_time=7.65s]
Epoch 0: 21%|██ | 2559/12384 [5:26:57<21:08:22, 7.75s/it, loss=0.0001, acc=1.0000, iter_time=7.89s]
Epoch 0: 21%|██ | 2560/12384 [5:26:57<21:01:44, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.89s]
Epoch 0: 21%|██ | 2560/12384 [5:27:05<21:01:44, 7.71s/it, loss=0.0012, acc=0.9972, iter_time=7.66s]
Epoch 0: 21%|██ | 2561/12384 [5:27:05<20:59:56, 7.70s/it, loss=0.0012, acc=0.9972, iter_time=7.66s]
Epoch 0: 21%|██ | 2561/12384 [5:27:12<20:59:56, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 0: 21%|██ | 2562/12384 [5:27:12<20:54:37, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 0: 21%|██ | 2562/12384 [5:27:20<20:54:37, 7.66s/it, loss=0.0006, acc=0.9979, iter_time=7.01s]
Epoch 0: 21%|██ | 2563/12384 [5:27:20<20:53:33, 7.66s/it, loss=0.0006, acc=0.9979, iter_time=7.01s]
Epoch 0: 21%|██ | 2563/12384 [5:27:28<20:53:33, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=8.24s]
Epoch 0: 21%|██ | 2564/12384 [5:27:28<20:52:31, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=8.24s]
Epoch 0: 21%|██ | 2564/12384 [5:27:35<20:52:31, 7.65s/it, loss=0.0009, acc=0.9979, iter_time=7.31s]
Epoch 0: 21%|██ | 2565/12384 [5:27:35<20:51:49, 7.65s/it, loss=0.0009, acc=0.9979, iter_time=7.31s]
Epoch 0: 21%|██ | 2565/12384 [5:27:43<20:51:49, 7.65s/it, loss=0.0021, acc=0.9964, iter_time=7.97s]
Epoch 0: 21%|██ | 2566/12384 [5:27:43<20:49:39, 7.64s/it, loss=0.0021, acc=0.9964, iter_time=7.97s]
Epoch 0: 21%|██ | 2566/12384 [5:27:51<20:49:39, 7.64s/it, loss=0.0001, acc=0.9999, iter_time=7.62s]
Epoch 0: 21%|██ | 2567/12384 [5:27:51<20:49:13, 7.64s/it, loss=0.0001, acc=0.9999, iter_time=7.62s]
Epoch 0: 21%|██ | 2567/12384 [5:27:58<20:49:13, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.03s]
Epoch 0: 21%|██ | 2568/12384 [5:27:58<20:52:32, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=8.03s]
Epoch 0: 21%|██ | 2568/12384 [5:28:06<20:52:32, 7.66s/it, loss=0.0002, acc=0.9998, iter_time=7.28s]
Epoch 0: 21%|██ | 2569/12384 [5:28:06<20:51:19, 7.65s/it, loss=0.0002, acc=0.9998, iter_time=7.28s]
Epoch 0: 21%|██ | 2569/12384 [5:28:14<20:51:19, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=6.17s]
Epoch 0: 21%|██ | 2570/12384 [5:28:14<20:53:56, 7.67s/it, loss=0.0002, acc=1.0000, iter_time=6.17s]
Epoch 0: 21%|██ | 2570/12384 [5:28:21<20:53:56, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=8.24s]
Epoch 0: 21%|██ | 2571/12384 [5:28:21<20:51:54, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.24s]
Epoch 0: 21%|██ | 2571/12384 [5:28:29<20:51:54, 7.65s/it, loss=0.0003, acc=0.9998, iter_time=7.36s]
Epoch 0: 21%|██ | 2572/12384 [5:28:29<20:52:06, 7.66s/it, loss=0.0003, acc=0.9998, iter_time=7.36s]
Epoch 0: 21%|██ | 2572/12384 [5:28:37<20:52:06, 7.66s/it, loss=0.0004, acc=0.9994, iter_time=8.86s]
Epoch 0: 21%|██ | 2573/12384 [5:28:37<20:48:37, 7.64s/it, loss=0.0004, acc=0.9994, iter_time=8.86s]
Epoch 0: 21%|██ | 2573/12384 [5:28:44<20:48:37, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 21%|██ | 2574/12384 [5:28:44<20:49:43, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 21%|██ | 2574/12384 [5:28:52<20:49:43, 7.64s/it, loss=0.0316, acc=0.9499, iter_time=7.64s]
Epoch 0: 21%|██ | 2575/12384 [5:28:52<20:48:15, 7.64s/it, loss=0.0316, acc=0.9499, iter_time=7.64s]
Epoch 0: 21%|██ | 2575/12384 [5:28:59<20:48:15, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.00s]
Epoch 0: 21%|██ | 2576/12384 [5:28:59<20:48:45, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=8.00s]
Epoch 0: 21%|██ | 2576/12384 [5:29:07<20:48:45, 7.64s/it, loss=0.0002, acc=0.9987, iter_time=7.00s]
Epoch 0: 21%|██ | 2577/12384 [5:29:07<20:51:46, 7.66s/it, loss=0.0002, acc=0.9987, iter_time=7.00s]
Epoch 0: 21%|██ | 2577/12384 [5:29:15<20:51:46, 7.66s/it, loss=0.0002, acc=0.9990, iter_time=7.96s]
Epoch 0: 21%|██ | 2578/12384 [5:29:15<20:50:48, 7.65s/it, loss=0.0002, acc=0.9990, iter_time=7.96s]
Epoch 0: 21%|██ | 2578/12384 [5:29:22<20:50:48, 7.65s/it, loss=0.0003, acc=0.9986, iter_time=7.64s]
Epoch 0: 21%|██ | 2579/12384 [5:29:22<20:48:32, 7.64s/it, loss=0.0003, acc=0.9986, iter_time=7.64s]
Epoch 0: 21%|██ | 2579/12384 [5:29:30<20:48:32, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 21%|██ | 2580/12384 [5:29:30<20:48:54, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 21%|██ | 2580/12384 [5:29:38<20:48:54, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 0: 21%|██ | 2581/12384 [5:29:38<20:49:10, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.85s]
Epoch 0: 21%|██ | 2581/12384 [5:29:45<20:49:10, 7.65s/it, loss=0.0001, acc=0.9999, iter_time=9.44s]
Epoch 0: 21%|██ | 2582/12384 [5:29:45<20:48:38, 7.64s/it, loss=0.0001, acc=0.9999, iter_time=9.44s]
Epoch 0: 21%|██ | 2582/12384 [5:29:53<20:48:38, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.08s]
Epoch 0: 21%|██ | 2583/12384 [5:29:53<20:50:22, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.08s]
Epoch 0: 21%|██ | 2583/12384 [5:30:01<20:50:22, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=8.64s]
Epoch 0: 21%|██ | 2584/12384 [5:30:01<20:51:37, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=8.64s]
Epoch 0: 21%|██ | 2584/12384 [5:30:09<20:51:37, 7.66s/it, loss=0.0051, acc=0.9949, iter_time=7.32s]
Epoch 0: 21%|██ | 2585/12384 [5:30:09<21:07:25, 7.76s/it, loss=0.0051, acc=0.9949, iter_time=7.32s]
Epoch 0: 21%|██ | 2585/12384 [5:30:16<21:07:25, 7.76s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 0: 21%|██ | 2586/12384 [5:30:16<20:59:52, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=6.18s]
Epoch 0: 21%|██ | 2586/12384 [5:30:24<20:59:52, 7.72s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 0: 21%|██ | 2587/12384 [5:30:24<20:55:41, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=9.39s]
Epoch 0: 21%|██ | 2587/12384 [5:30:32<20:55:41, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 21%|██ | 2588/12384 [5:30:32<20:54:36, 7.68s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 21%|██ | 2588/12384 [5:30:39<20:54:36, 7.68s/it, loss=0.0016, acc=0.9970, iter_time=7.67s]
Epoch 0: 21%|██ | 2589/12384 [5:30:39<20:52:42, 7.67s/it, loss=0.0016, acc=0.9970, iter_time=7.67s]
Epoch 0: 21%|██ | 2589/12384 [5:30:47<20:52:42, 7.67s/it, loss=0.0000, acc=1.0000, iter_time=7.41s]
Epoch 0: 21%|██ | 2590/12384 [5:30:47<20:48:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.41s]
Epoch 0: 21%|██ | 2590/12384 [5:30:55<20:48:22, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.86s]
Epoch 0: 21%|██ | 2591/12384 [5:30:55<20:47:50, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=7.86s]
Epoch 0: 21%|██ | 2591/12384 [5:31:02<20:47:50, 7.65s/it, loss=0.0003, acc=0.9997, iter_time=8.01s]
Epoch 0: 21%|██ | 2592/12384 [5:31:02<20:47:17, 7.64s/it, loss=0.0003, acc=0.9997, iter_time=8.01s]
Epoch 0: 21%|██ | 2592/12384 [5:31:10<20:47:17, 7.64s/it, loss=0.0005, acc=0.9989, iter_time=7.25s]
Epoch 0: 21%|██ | 2593/12384 [5:31:10<20:47:45, 7.65s/it, loss=0.0005, acc=0.9989, iter_time=7.25s]
Epoch 0: 21%|██ | 2593/12384 [5:31:17<20:47:45, 7.65s/it, loss=0.0004, acc=0.9995, iter_time=7.65s]
Epoch 0: 21%|██ | 2594/12384 [5:31:17<20:49:26, 7.66s/it, loss=0.0004, acc=0.9995, iter_time=7.65s]
Epoch 0: 21%|██ | 2594/12384 [5:31:25<20:49:26, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=3.83s]
Epoch 0: 21%|██ | 2595/12384 [5:31:25<20:49:45, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=3.83s]
Epoch 0: 21%|██ | 2595/12384 [5:31:33<20:49:45, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=10.01s]
Epoch 0: 21%|██ | 2596/12384 [5:31:33<20:49:14, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=10.01s]
Epoch 0: 21%|██ | 2596/12384 [5:31:40<20:49:14, 7.66s/it, loss=0.0005, acc=0.9974, iter_time=7.37s]
Epoch 0: 21%|██ | 2597/12384 [5:31:40<20:48:47, 7.66s/it, loss=0.0005, acc=0.9974, iter_time=7.37s]
Epoch 0: 21%|██ | 2597/12384 [5:31:48<20:48:47, 7.66s/it, loss=0.0004, acc=0.9977, iter_time=9.43s]
Epoch 0: 21%|██ | 2598/12384 [5:31:48<20:51:00, 7.67s/it, loss=0.0004, acc=0.9977, iter_time=9.43s]
Epoch 0: 21%|██ | 2598/12384 [5:31:56<20:51:00, 7.67s/it, loss=0.0007, acc=0.9971, iter_time=7.71s]
Epoch 0: 21%|██ | 2599/12384 [5:31:56<20:49:39, 7.66s/it, loss=0.0007, acc=0.9971, iter_time=7.71s]
Epoch 0: 21%|██ | 2599/12384 [5:32:03<20:49:39, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=8.07s]
Epoch 0: 21%|██ | 2600/12384 [5:32:03<20:48:37, 7.66s/it, loss=0.0002, acc=1.0000, iter_time=8.07s]
Epoch 0: 21%|██ | 2600/12384 [5:32:11<20:48:37, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=6.35s]
Epoch 0: 21%|██ | 2601/12384 [5:32:11<20:47:43, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=6.35s]
Epoch 0: 21%|██ | 2601/12384 [5:32:19<20:47:43, 7.65s/it, loss=0.0006, acc=0.9975, iter_time=8.49s]
Epoch 0: 21%|██ | 2602/12384 [5:32:19<20:50:00, 7.67s/it, loss=0.0006, acc=0.9975, iter_time=8.49s]
Epoch 0: 21%|██ | 2602/12384 [5:32:26<20:50:00, 7.67s/it, loss=0.0021, acc=0.9964, iter_time=7.71s]
Epoch 0: 21%|██ | 2603/12384 [5:32:26<20:46:27, 7.65s/it, loss=0.0021, acc=0.9964, iter_time=7.71s]
Epoch 0: 21%|██ | 2603/12384 [5:32:34<20:46:27, 7.65s/it, loss=0.0008, acc=0.9979, iter_time=7.62s]
Epoch 0: 21%|██ | 2604/12384 [5:32:34<20:48:24, 7.66s/it, loss=0.0008, acc=0.9979, iter_time=7.62s]
Epoch 0: 21%|██ | 2604/12384 [5:32:42<20:48:24, 7.66s/it, loss=0.0002, acc=0.9991, iter_time=7.67s]
Epoch 0: 21%|██ | 2605/12384 [5:32:42<20:47:33, 7.65s/it, loss=0.0002, acc=0.9991, iter_time=7.67s]
Epoch 0: 21%|██ | 2605/12384 [5:32:49<20:47:33, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 21%|██ | 2606/12384 [5:32:49<20:44:43, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.64s]
Epoch 0: 21%|██ | 2606/12384 [5:32:57<20:44:43, 7.64s/it, loss=0.0004, acc=0.9998, iter_time=7.62s]
Epoch 0: 21%|██ | 2607/12384 [5:32:57<20:44:52, 7.64s/it, loss=0.0004, acc=0.9998, iter_time=7.62s]
Epoch 0: 21%|██ | 2607/12384 [5:33:05<20:44:52, 7.64s/it, loss=0.0005, acc=0.9983, iter_time=8.05s]
Epoch 0: 21%|██ | 2608/12384 [5:33:05<20:45:16, 7.64s/it, loss=0.0005, acc=0.9983, iter_time=8.05s]
Epoch 0: 21%|██ | 2608/12384 [5:33:12<20:45:16, 7.64s/it, loss=0.0017, acc=0.9954, iter_time=5.96s]
Epoch 0: 21%|██ | 2609/12384 [5:33:12<20:43:21, 7.63s/it, loss=0.0017, acc=0.9954, iter_time=5.96s]
Epoch 0: 21%|██ | 2609/12384 [5:33:20<20:43:21, 7.63s/it, loss=0.0006, acc=0.9992, iter_time=8.87s]
Epoch 0: 21%|██ | 2610/12384 [5:33:20<20:42:49, 7.63s/it, loss=0.0006, acc=0.9992, iter_time=8.87s]
Epoch 0: 21%|██ | 2610/12384 [5:33:28<20:42:49, 7.63s/it, loss=0.0001, acc=0.9998, iter_time=5.64s]
Epoch 0: 21%|██ | 2611/12384 [5:33:28<20:58:12, 7.72s/it, loss=0.0001, acc=0.9998, iter_time=5.64s]
Epoch 0: 21%|██ | 2611/12384 [5:33:35<20:58:12, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=9.93s]
Epoch 0: 21%|██ | 2612/12384 [5:33:35<20:53:25, 7.70s/it, loss=0.0001, acc=1.0000, iter_time=9.93s]
Epoch 0: 21%|██ | 2612/12384 [5:33:43<20:53:25, 7.70s/it, loss=0.0006, acc=0.9986, iter_time=7.63s]
Epoch 0: 21%|██ | 2613/12384 [5:33:43<20:48:39, 7.67s/it, loss=0.0006, acc=0.9986, iter_time=7.63s]
Epoch 0: 21%|██ | 2613/12384 [5:33:51<20:48:39, 7.67s/it, loss=0.0001, acc=0.9998, iter_time=7.29s]
Epoch 0: 21%|██ | 2614/12384 [5:33:51<20:46:16, 7.65s/it, loss=0.0001, acc=0.9998, iter_time=7.29s]
Epoch 0: 21%|██ | 2614/12384 [5:33:58<20:46:16, 7.65s/it, loss=0.0001, acc=0.9998, iter_time=7.94s]
Epoch 0: 21%|██ | 2615/12384 [5:33:58<20:45:22, 7.65s/it, loss=0.0001, acc=0.9998, iter_time=7.94s]
Epoch 0: 21%|██ | 2615/12384 [5:34:06<20:45:22, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 21%|██ | 2616/12384 [5:34:06<20:47:09, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=8.02s]
Epoch 0: 21%|██ | 2616/12384 [5:34:14<20:47:09, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.30s]
Epoch 0: 21%|██ | 2617/12384 [5:34:14<20:46:16, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.30s]
Epoch 0: 21%|██ | 2617/12384 [5:34:21<20:46:16, 7.66s/it, loss=0.0006, acc=0.9983, iter_time=5.57s]
Epoch 0: 21%|██ | 2618/12384 [5:34:21<20:45:22, 7.65s/it, loss=0.0006, acc=0.9983, iter_time=5.57s]
Epoch 0: 21%|██ | 2618/12384 [5:34:29<20:45:22, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=9.71s]
Epoch 0: 21%|██ | 2619/12384 [5:34:29<20:45:30, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=9.71s]
Epoch 0: 21%|██ | 2619/12384 [5:34:37<20:45:30, 7.65s/it, loss=0.0024, acc=0.9961, iter_time=7.66s]
Epoch 0: 21%|██ | 2620/12384 [5:34:37<20:43:49, 7.64s/it, loss=0.0024, acc=0.9961, iter_time=7.66s]
Epoch 0: 21%|██ | 2620/12384 [5:34:44<20:43:49, 7.64s/it, loss=0.0013, acc=0.9957, iter_time=7.67s]
Epoch 0: 21%|██ | 2621/12384 [5:34:44<20:44:01, 7.65s/it, loss=0.0013, acc=0.9957, iter_time=7.67s]
Epoch 0: 21%|██ | 2621/12384 [5:34:52<20:44:01, 7.65s/it, loss=0.0006, acc=0.9996, iter_time=7.59s]
Epoch 0: 21%|██ | 2622/12384 [5:34:52<20:43:45, 7.64s/it, loss=0.0006, acc=0.9996, iter_time=7.59s]
Epoch 0: 21%|██ | 2622/12384 [5:35:00<20:43:45, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.75s]
Epoch 0: 21%|██ | 2623/12384 [5:35:00<20:46:10, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.75s]
Epoch 0: 21%|██ | 2623/12384 [5:35:07<20:46:10, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=8.06s]
Epoch 0: 21%|██ | 2624/12384 [5:35:07<20:46:39, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=8.06s]
Epoch 0: 21%|██ | 2624/12384 [5:35:15<20:46:39, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=5.50s]
Epoch 0: 21%|██ | 2625/12384 [5:35:15<20:43:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.50s]
Epoch 0: 21%|██ | 2625/12384 [5:35:22<20:43:47, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 0: 21%|██ | 2626/12384 [5:35:22<20:43:49, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=5.88s]
Epoch 0: 21%|██ | 2626/12384 [5:35:30<20:43:49, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=10.55s]
Epoch 0: 21%|██ | 2627/12384 [5:35:30<20:44:17, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=10.55s]
Epoch 0: 21%|██ | 2627/12384 [5:35:38<20:44:17, 7.65s/it, loss=0.0001, acc=0.9998, iter_time=7.30s]
Epoch 0: 21%|██ | 2628/12384 [5:35:38<20:44:52, 7.66s/it, loss=0.0001, acc=0.9998, iter_time=7.30s]
Epoch 0: 21%|██ | 2628/12384 [5:35:45<20:44:52, 7.66s/it, loss=0.0003, acc=1.0000, iter_time=5.80s]
Epoch 0: 21%|██ | 2629/12384 [5:35:45<20:44:23, 7.65s/it, loss=0.0003, acc=1.0000, iter_time=5.80s]
Epoch 0: 21%|██ | 2629/12384 [5:35:53<20:44:23, 7.65s/it, loss=0.0006, acc=0.9990, iter_time=10.39s]
Epoch 0: 21%|██ | 2630/12384 [5:35:53<20:41:27, 7.64s/it, loss=0.0006, acc=0.9990, iter_time=10.39s]
Epoch 0: 21%|██ | 2630/12384 [5:36:01<20:41:27, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 21%|██ | 2631/12384 [5:36:01<20:41:00, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.62s]
Epoch 0: 21%|██ | 2631/12384 [5:36:08<20:41:00, 7.63s/it, loss=0.0009, acc=0.9979, iter_time=7.61s]
Epoch 0: 21%|██▏ | 2632/12384 [5:36:08<20:41:45, 7.64s/it, loss=0.0009, acc=0.9979, iter_time=7.61s]
Epoch 0: 21%|██▏ | 2632/12384 [5:36:16<20:41:45, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.33s]
Epoch 0: 21%|██▏ | 2633/12384 [5:36:16<20:39:26, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.33s]
Epoch 0: 21%|██▏ | 2633/12384 [5:36:24<20:39:26, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.29s]
Epoch 0: 21%|██▏ | 2634/12384 [5:36:24<20:42:11, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.29s]
Epoch 0: 21%|██▏ | 2634/12384 [5:36:31<20:42:11, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 0: 21%|██▏ | 2635/12384 [5:36:31<20:42:15, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.32s]
Epoch 0: 21%|██▏ | 2635/12384 [5:36:39<20:42:15, 7.65s/it, loss=0.0039, acc=0.9901, iter_time=7.95s]
Epoch 0: 21%|██▏ | 2636/12384 [5:36:39<20:54:16, 7.72s/it, loss=0.0039, acc=0.9901, iter_time=7.95s]
Epoch 0: 21%|██▏ | 2636/12384 [5:36:47<20:54:16, 7.72s/it, loss=0.0008, acc=0.9986, iter_time=7.64s]
Epoch 0: 21%|██▏ | 2637/12384 [5:36:47<21:05:35, 7.79s/it, loss=0.0008, acc=0.9986, iter_time=7.64s]
Epoch 0: 21%|██▏ | 2637/12384 [5:36:55<21:05:35, 7.79s/it, loss=0.0009, acc=0.9998, iter_time=6.10s]
Epoch 0: 21%|██▏ | 2638/12384 [5:36:55<20:56:44, 7.74s/it, loss=0.0009, acc=0.9998, iter_time=6.10s]
Epoch 0: 21%|██▏ | 2638/12384 [5:37:02<20:56:44, 7.74s/it, loss=0.0081, acc=0.9851, iter_time=9.43s]
Epoch 0: 21%|██▏ | 2639/12384 [5:37:02<20:52:45, 7.71s/it, loss=0.0081, acc=0.9851, iter_time=9.43s]
Epoch 0: 21%|██▏ | 2639/12384 [5:37:10<20:52:45, 7.71s/it, loss=0.0010, acc=0.9975, iter_time=8.04s]
Epoch 0: 21%|██▏ | 2640/12384 [5:37:10<20:48:40, 7.69s/it, loss=0.0010, acc=0.9975, iter_time=8.04s]
Epoch 0: 21%|██▏ | 2640/12384 [5:37:16<20:48:40, 7.69s/it, loss=0.0029, acc=0.9933, iter_time=4.04s]
Epoch 0: 21%|██▏ | 2641/12384 [5:37:16<19:39:46, 7.27s/it, loss=0.0029, acc=0.9933, iter_time=4.04s]
Epoch 0: 21%|██▏ | 2641/12384 [5:37:24<19:39:46, 7.27s/it, loss=0.0002, acc=0.9999, iter_time=9.51s]
Epoch 0: 21%|██▏ | 2642/12384 [5:37:24<20:00:36, 7.39s/it, loss=0.0002, acc=0.9999, iter_time=9.51s]
Epoch 0: 21%|██▏ | 2642/12384 [5:37:32<20:00:36, 7.39s/it, loss=0.0053, acc=0.9917, iter_time=7.68s]
Epoch 0: 21%|██▏ | 2643/12384 [5:37:32<20:11:03, 7.46s/it, loss=0.0053, acc=0.9917, iter_time=7.68s]
Epoch 0: 21%|██▏ | 2643/12384 [5:37:39<20:11:03, 7.46s/it, loss=0.0003, acc=0.9998, iter_time=4.99s]
Epoch 0: 21%|██▏ | 2644/12384 [5:37:39<20:22:37, 7.53s/it, loss=0.0003, acc=0.9998, iter_time=4.99s]
Epoch 0: 21%|██▏ | 2644/12384 [5:37:47<20:22:37, 7.53s/it, loss=0.0003, acc=1.0000, iter_time=10.31s]
Epoch 0: 21%|██▏ | 2645/12384 [5:37:47<20:32:35, 7.59s/it, loss=0.0003, acc=1.0000, iter_time=10.31s]
Epoch 0: 21%|██▏ | 2645/12384 [5:37:55<20:32:35, 7.59s/it, loss=0.0003, acc=1.0000, iter_time=7.75s]
Epoch 0: 21%|██▏ | 2646/12384 [5:37:55<20:35:56, 7.62s/it, loss=0.0003, acc=1.0000, iter_time=7.75s]
Epoch 0: 21%|██▏ | 2646/12384 [5:38:02<20:35:56, 7.62s/it, loss=0.0002, acc=1.0000, iter_time=7.67s]
Epoch 0: 21%|██▏ | 2647/12384 [5:38:02<20:35:31, 7.61s/it, loss=0.0002, acc=1.0000, iter_time=7.67s]
Epoch 0: 21%|██▏ | 2647/12384 [5:38:10<20:35:31, 7.61s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 0: 21%|██▏ | 2648/12384 [5:38:10<20:35:53, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=7.99s]
Epoch 0: 21%|██▏ | 2648/12384 [5:38:18<20:35:53, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=5.46s]
Epoch 0: 21%|██▏ | 2649/12384 [5:38:18<20:36:42, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=5.46s]
Epoch 0: 21%|██▏ | 2649/12384 [5:38:25<20:36:42, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=9.87s]
Epoch 0: 21%|██▏ | 2650/12384 [5:38:25<20:38:40, 7.64s/it, loss=0.0002, acc=0.9998, iter_time=9.87s]
Epoch 0: 21%|██▏ | 2650/12384 [5:38:33<20:38:40, 7.64s/it, loss=0.0002, acc=0.9988, iter_time=7.21s]
Epoch 0: 21%|██▏ | 2651/12384 [5:38:33<20:39:33, 7.64s/it, loss=0.0002, acc=0.9988, iter_time=7.21s]
Epoch 0: 21%|██▏ | 2651/12384 [5:38:41<20:39:33, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 0: 21%|██▏ | 2652/12384 [5:38:41<20:40:24, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 0: 21%|██▏ | 2652/12384 [5:38:48<20:40:24, 7.65s/it, loss=0.0005, acc=0.9992, iter_time=4.52s]
Epoch 0: 21%|██▏ | 2653/12384 [5:38:48<20:42:17, 7.66s/it, loss=0.0005, acc=0.9992, iter_time=4.52s]
Epoch 0: 21%|██▏ | 2653/12384 [5:38:56<20:42:17, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 0: 21%|██▏ | 2654/12384 [5:38:56<20:41:53, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=9.89s]
Epoch 0: 21%|██▏ | 2654/12384 [5:39:04<20:41:53, 7.66s/it, loss=0.0010, acc=0.9981, iter_time=8.59s]
Epoch 0: 21%|██▏ | 2655/12384 [5:39:04<20:44:28, 7.67s/it, loss=0.0010, acc=0.9981, iter_time=8.59s]
Epoch 0: 21%|██▏ | 2655/12384 [5:39:11<20:44:28, 7.67s/it, loss=0.0005, acc=0.9998, iter_time=8.10s]
Epoch 0: 21%|██▏ | 2656/12384 [5:39:11<20:44:17, 7.67s/it, loss=0.0005, acc=0.9998, iter_time=8.10s]
Epoch 0: 21%|██▏ | 2656/12384 [5:39:19<20:44:17, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.30s]
Epoch 0: 21%|██▏ | 2657/12384 [5:39:19<20:43:01, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=7.30s]
Epoch 0: 21%|██▏ | 2657/12384 [5:39:27<20:43:01, 7.67s/it, loss=0.0008, acc=0.9978, iter_time=7.63s]
Epoch 0: 21%|██▏ | 2658/12384 [5:39:27<20:39:27, 7.65s/it, loss=0.0008, acc=0.9978, iter_time=7.63s]
Epoch 0: 21%|██▏ | 2658/12384 [5:39:34<20:39:27, 7.65s/it, loss=0.0001, acc=0.9997, iter_time=7.60s]
Epoch 0: 21%|██▏ | 2659/12384 [5:39:34<20:36:36, 7.63s/it, loss=0.0001, acc=0.9997, iter_time=7.60s]
Epoch 0: 21%|██▏ | 2659/12384 [5:39:42<20:36:36, 7.63s/it, loss=0.0024, acc=0.9961, iter_time=7.60s]
Epoch 0: 21%|██▏ | 2660/12384 [5:39:42<20:36:01, 7.63s/it, loss=0.0024, acc=0.9961, iter_time=7.60s]
Epoch 0: 21%|██▏ | 2660/12384 [5:39:49<20:36:01, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=7.63s]
Epoch 0: 21%|██▏ | 2661/12384 [5:39:49<20:37:34, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.63s]
Epoch 0: 21%|██▏ | 2661/12384 [5:39:57<20:37:34, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.68s]
Epoch 0: 21%|██▏ | 2662/12384 [5:39:57<20:37:24, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.68s]
Epoch 0: 21%|██▏ | 2662/12384 [5:40:05<20:37:24, 7.64s/it, loss=0.0002, acc=0.9993, iter_time=5.26s]
Epoch 0: 22%|██▏ | 2663/12384 [5:40:05<20:36:35, 7.63s/it, loss=0.0002, acc=0.9993, iter_time=5.26s]
Epoch 0: 22%|██▏ | 2663/12384 [5:40:13<20:36:35, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=10.30s]
Epoch 0: 22%|██▏ | 2664/12384 [5:40:13<20:54:06, 7.74s/it, loss=0.0000, acc=1.0000, iter_time=10.30s]
Epoch 0: 22%|██▏ | 2664/12384 [5:40:20<20:54:06, 7.74s/it, loss=0.0003, acc=0.9996, iter_time=7.66s]
Epoch 0: 22%|██▏ | 2665/12384 [5:40:20<20:47:29, 7.70s/it, loss=0.0003, acc=0.9996, iter_time=7.66s]
Epoch 0: 22%|██▏ | 2665/12384 [5:40:28<20:47:29, 7.70s/it, loss=0.0001, acc=0.9993, iter_time=7.62s]
Epoch 0: 22%|██▏ | 2666/12384 [5:40:28<20:42:43, 7.67s/it, loss=0.0001, acc=0.9993, iter_time=7.62s]
Epoch 0: 22%|██▏ | 2666/12384 [5:40:35<20:42:43, 7.67s/it, loss=0.0012, acc=0.9973, iter_time=7.58s]
Epoch 0: 22%|██▏ | 2667/12384 [5:40:35<20:38:59, 7.65s/it, loss=0.0012, acc=0.9973, iter_time=7.58s]
Epoch 0: 22%|██▏ | 2667/12384 [5:40:43<20:38:59, 7.65s/it, loss=0.0001, acc=0.9999, iter_time=7.63s]
Epoch 0: 22%|██▏ | 2668/12384 [5:40:43<20:38:26, 7.65s/it, loss=0.0001, acc=0.9999, iter_time=7.63s]
Epoch 0: 22%|██▏ | 2668/12384 [5:40:51<20:38:26, 7.65s/it, loss=0.0020, acc=0.9934, iter_time=7.62s]
Epoch 0: 22%|██▏ | 2669/12384 [5:40:51<20:36:01, 7.63s/it, loss=0.0020, acc=0.9934, iter_time=7.62s]
Epoch 0: 22%|██▏ | 2669/12384 [5:40:58<20:36:01, 7.63s/it, loss=0.0002, acc=0.9998, iter_time=7.60s]
Epoch 0: 22%|██▏ | 2670/12384 [5:40:58<20:34:17, 7.62s/it, loss=0.0002, acc=0.9998, iter_time=7.60s]
Epoch 0: 22%|██▏ | 2670/12384 [5:41:06<20:34:17, 7.62s/it, loss=0.0001, acc=1.0000, iter_time=5.88s]
Epoch 0: 22%|██▏ | 2671/12384 [5:41:06<20:35:20, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.88s]
Epoch 0: 22%|██▏ | 2671/12384 [5:41:14<20:35:20, 7.63s/it, loss=0.0002, acc=1.0000, iter_time=9.77s]
Epoch 0: 22%|██▏ | 2672/12384 [5:41:14<20:36:50, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=9.77s]
Epoch 0: 22%|██▏ | 2672/12384 [5:41:21<20:36:50, 7.64s/it, loss=0.0005, acc=1.0000, iter_time=5.47s]
Epoch 0: 22%|██▏ | 2673/12384 [5:41:21<20:36:02, 7.64s/it, loss=0.0005, acc=1.0000, iter_time=5.47s]
Epoch 0: 22%|██▏ | 2673/12384 [5:41:29<20:36:02, 7.64s/it, loss=0.0002, acc=0.9995, iter_time=8.49s]
Epoch 0: 22%|██▏ | 2674/12384 [5:41:29<20:35:32, 7.63s/it, loss=0.0002, acc=0.9995, iter_time=8.49s]
Epoch 0: 22%|██▏ | 2674/12384 [5:41:36<20:35:32, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 0: 22%|██▏ | 2675/12384 [5:41:36<20:34:13, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.56s]
Epoch 0: 22%|██▏ | 2675/12384 [5:41:44<20:34:13, 7.63s/it, loss=0.0004, acc=0.9971, iter_time=4.80s]
Epoch 0: 22%|██▏ | 2676/12384 [5:41:44<20:37:23, 7.65s/it, loss=0.0004, acc=0.9971, iter_time=4.80s]
Epoch 0: 22%|██▏ | 2676/12384 [5:41:52<20:37:23, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=9.57s]
Epoch 0: 22%|██▏ | 2677/12384 [5:41:52<20:36:33, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=9.57s]
Epoch 0: 22%|██▏ | 2677/12384 [5:41:59<20:36:33, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=5.80s]
Epoch 0: 22%|██▏ | 2678/12384 [5:41:59<20:34:50, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=5.80s]
Epoch 0: 22%|██▏ | 2678/12384 [5:42:07<20:34:50, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 0: 22%|██▏ | 2679/12384 [5:42:07<20:36:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=8.05s]
Epoch 0: 22%|██▏ | 2679/12384 [5:42:15<20:36:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 0: 22%|██▏ | 2680/12384 [5:42:15<20:36:27, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.40s]
Epoch 0: 22%|██▏ | 2680/12384 [5:42:22<20:36:27, 7.65s/it, loss=0.0022, acc=0.9950, iter_time=7.25s]
Epoch 0: 22%|██▏ | 2681/12384 [5:42:22<20:34:18, 7.63s/it, loss=0.0022, acc=0.9950, iter_time=7.25s]
Epoch 0: 22%|██▏ | 2681/12384 [5:42:30<20:34:18, 7.63s/it, loss=0.0006, acc=0.9991, iter_time=6.68s]
Epoch 0: 22%|██▏ | 2682/12384 [5:42:30<20:34:02, 7.63s/it, loss=0.0006, acc=0.9991, iter_time=6.68s]
Epoch 0: 22%|██▏ | 2682/12384 [5:42:38<20:34:02, 7.63s/it, loss=0.0002, acc=0.9996, iter_time=8.56s]
Epoch 0: 22%|██▏ | 2683/12384 [5:42:38<20:34:19, 7.63s/it, loss=0.0002, acc=0.9996, iter_time=8.56s]
Epoch 0: 22%|██▏ | 2683/12384 [5:42:45<20:34:19, 7.63s/it, loss=0.0001, acc=1.0000, iter_time=7.73s]
Epoch 0: 22%|██▏ | 2684/12384 [5:42:45<20:37:28, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.73s]
Epoch 0: 22%|██▏ | 2684/12384 [5:42:53<20:37:28, 7.65s/it, loss=0.0001, acc=0.9999, iter_time=7.03s]
Epoch 0: 22%|██▏ | 2685/12384 [5:42:53<20:39:17, 7.67s/it, loss=0.0001, acc=0.9999, iter_time=7.03s]
Epoch 0: 22%|██▏ | 2685/12384 [5:43:01<20:39:17, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=8.27s]
Epoch 0: 22%|██▏ | 2686/12384 [5:43:01<20:38:04, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=8.27s]
Epoch 0: 22%|██▏ | 2686/12384 [5:43:08<20:38:04, 7.66s/it, loss=0.0005, acc=0.9985, iter_time=7.68s]
Epoch 0: 22%|██▏ | 2687/12384 [5:43:08<20:38:29, 7.66s/it, loss=0.0005, acc=0.9985, iter_time=7.68s]
Epoch 0: 22%|██▏ | 2687/12384 [5:43:16<20:38:29, 7.66s/it, loss=0.0007, acc=0.9991, iter_time=7.63s]
Epoch 0: 22%|██▏ | 2688/12384 [5:43:16<20:37:55, 7.66s/it, loss=0.0007, acc=0.9991, iter_time=7.63s]
Epoch 0: 22%|██▏ | 2688/12384 [5:43:24<20:37:55, 7.66s/it, loss=0.0002, acc=0.9998, iter_time=7.64s]
Epoch 0: 22%|██▏ | 2689/12384 [5:43:24<20:35:14, 7.64s/it, loss=0.0002, acc=0.9998, iter_time=7.64s]
Epoch 0: 22%|██▏ | 2689/12384 [5:43:32<20:35:14, 7.64s/it, loss=0.0004, acc=0.9998, iter_time=5.11s]
Epoch 0: 22%|██▏ | 2690/12384 [5:43:32<20:51:44, 7.75s/it, loss=0.0004, acc=0.9998, iter_time=5.11s]
Epoch 0: 22%|██▏ | 2690/12384 [5:43:39<20:51:44, 7.75s/it, loss=0.0001, acc=1.0000, iter_time=6.53s]
Epoch 0: 22%|██▏ | 2691/12384 [5:43:39<20:47:21, 7.72s/it, loss=0.0001, acc=1.0000, iter_time=6.53s]
Epoch 0: 22%|██▏ | 2691/12384 [5:43:47<20:47:21, 7.72s/it, loss=0.0022, acc=0.9954, iter_time=11.64s]
Epoch 0: 22%|██▏ | 2692/12384 [5:43:47<20:41:36, 7.69s/it, loss=0.0022, acc=0.9954, iter_time=11.64s]
Epoch 0: 22%|██▏ | 2692/12384 [5:43:55<20:41:36, 7.69s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 22%|██▏ | 2693/12384 [5:43:55<20:40:58, 7.68s/it, loss=0.0000, acc=1.0000, iter_time=7.60s]
Epoch 0: 22%|██▏ | 2693/12384 [5:44:02<20:40:58, 7.68s/it, loss=0.0002, acc=0.9998, iter_time=6.82s]
Epoch 0: 22%|██▏ | 2694/12384 [5:44:02<20:38:19, 7.67s/it, loss=0.0002, acc=0.9998, iter_time=6.82s]
Epoch 0: 22%|██▏ | 2694/12384 [5:44:10<20:38:19, 7.67s/it, loss=0.0003, acc=0.9998, iter_time=7.93s]
Epoch 0: 22%|██▏ | 2695/12384 [5:44:10<20:35:11, 7.65s/it, loss=0.0003, acc=0.9998, iter_time=7.93s]
Epoch 0: 22%|██▏ | 2695/12384 [5:44:17<20:35:11, 7.65s/it, loss=0.0004, acc=0.9991, iter_time=8.55s]
Epoch 0: 22%|██▏ | 2696/12384 [5:44:17<20:35:01, 7.65s/it, loss=0.0004, acc=0.9991, iter_time=8.55s]
Epoch 0: 22%|██▏ | 2696/12384 [5:44:25<20:35:01, 7.65s/it, loss=0.0002, acc=1.0000, iter_time=4.00s]
Epoch 0: 22%|██▏ | 2697/12384 [5:44:25<20:33:10, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=4.00s]
Epoch 0: 22%|██▏ | 2697/12384 [5:44:33<20:33:10, 7.64s/it, loss=0.0003, acc=0.9998, iter_time=8.09s]
Epoch 0: 22%|██▏ | 2698/12384 [5:44:33<20:35:25, 7.65s/it, loss=0.0003, acc=0.9998, iter_time=8.09s]
Epoch 0: 22%|██▏ | 2698/12384 [5:44:40<20:35:25, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.93s]
Epoch 0: 22%|██▏ | 2699/12384 [5:44:40<20:33:51, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.93s]
Epoch 0: 22%|██▏ | 2699/12384 [5:44:48<20:33:51, 7.64s/it, loss=0.0048, acc=0.9951, iter_time=10.57s]
Epoch 0: 22%|██▏ | 2700/12384 [5:44:48<20:32:35, 7.64s/it, loss=0.0048, acc=0.9951, iter_time=10.57s]
Epoch 0: 22%|██▏ | 2700/12384 [5:44:56<20:32:35, 7.64s/it, loss=0.0002, acc=0.9996, iter_time=7.21s]
Epoch 0: 22%|██▏ | 2701/12384 [5:44:56<20:32:01, 7.63s/it, loss=0.0002, acc=0.9996, iter_time=7.21s]
Epoch 0: 22%|██▏ | 2701/12384 [5:45:03<20:32:01, 7.63s/it, loss=0.0002, acc=0.9999, iter_time=7.64s]
Epoch 0: 22%|██▏ | 2702/12384 [5:45:03<20:32:50, 7.64s/it, loss=0.0002, acc=0.9999, iter_time=7.64s]
Epoch 0: 22%|██▏ | 2702/12384 [5:45:11<20:32:50, 7.64s/it, loss=0.0000, acc=1.0000, iter_time=7.42s]
Epoch 0: 22%|██▏ | 2703/12384 [5:45:11<20:30:38, 7.63s/it, loss=0.0000, acc=1.0000, iter_time=7.42s]
Epoch 0: 22%|██▏ | 2703/12384 [5:45:18<20:30:38, 7.63s/it, loss=0.0015, acc=0.9963, iter_time=7.82s]
Epoch 0: 22%|██▏ | 2704/12384 [5:45:18<20:32:14, 7.64s/it, loss=0.0015, acc=0.9963, iter_time=7.82s]
Epoch 0: 22%|██▏ | 2704/12384 [5:45:26<20:32:14, 7.64s/it, loss=0.0001, acc=0.9988, iter_time=4.81s]
Epoch 0: 22%|██▏ | 2705/12384 [5:45:26<20:32:37, 7.64s/it, loss=0.0001, acc=0.9988, iter_time=4.81s]
Epoch 0: 22%|██▏ | 2705/12384 [5:45:34<20:32:37, 7.64s/it, loss=0.0008, acc=1.0000, iter_time=10.48s]
Epoch 0: 22%|██▏ | 2706/12384 [5:45:34<20:31:07, 7.63s/it, loss=0.0008, acc=1.0000, iter_time=10.48s]
Epoch 0: 22%|██▏ | 2706/12384 [5:45:41<20:31:07, 7.63s/it, loss=0.0004, acc=0.9990, iter_time=7.64s]
Epoch 0: 22%|██▏ | 2707/12384 [5:45:41<20:31:50, 7.64s/it, loss=0.0004, acc=0.9990, iter_time=7.64s]
Epoch 0: 22%|██▏ | 2707/12384 [5:45:49<20:31:50, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.65s]
Epoch 0: 22%|██▏ | 2708/12384 [5:45:49<20:32:40, 7.64s/it, loss=0.0002, acc=1.0000, iter_time=7.65s]
Epoch 0: 22%|██▏ | 2708/12384 [5:45:57<20:32:40, 7.64s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 0: 22%|██▏ | 2709/12384 [5:45:57<20:32:49, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.66s]
Epoch 0: 22%|██▏ | 2709/12384 [5:46:04<20:32:49, 7.65s/it, loss=0.0002, acc=0.9992, iter_time=7.12s]
Epoch 0: 22%|██▏ | 2710/12384 [5:46:04<20:32:08, 7.64s/it, loss=0.0002, acc=0.9992, iter_time=7.12s]
Epoch 0: 22%|██▏ | 2710/12384 [5:46:12<20:32:08, 7.64s/it, loss=0.0063, acc=0.9969, iter_time=5.11s]
Epoch 0: 22%|██▏ | 2711/12384 [5:46:12<20:34:46, 7.66s/it, loss=0.0063, acc=0.9969, iter_time=5.11s]
Epoch 0: 22%|██▏ | 2711/12384 [5:46:20<20:34:46, 7.66s/it, loss=0.0000, acc=1.0000, iter_time=10.85s]
Epoch 0: 22%|██▏ | 2712/12384 [5:46:20<20:32:41, 7.65s/it, loss=0.0000, acc=1.0000, iter_time=10.85s]
Epoch 0: 22%|██▏ | 2712/12384 [5:46:27<20:32:41, 7.65s/it, loss=0.0001, acc=0.9998, iter_time=5.30s]
Epoch 0: 22%|██▏ | 2713/12384 [5:46:27<20:38:36, 7.68s/it, loss=0.0001, acc=0.9998, iter_time=5.30s]
Epoch 0: 22%|██▏ | 2713/12384 [5:46:35<20:38:36, 7.68s/it, loss=0.0005, acc=0.9962, iter_time=6.73s]
Epoch 0: 22%|██▏ | 2714/12384 [5:46:35<20:36:39, 7.67s/it, loss=0.0005, acc=0.9962, iter_time=6.73s]
Epoch 0: 22%|██▏ | 2714/12384 [5:46:43<20:36:39, 7.67s/it, loss=0.0001, acc=1.0000, iter_time=10.89s]
Epoch 0: 22%|██▏ | 2715/12384 [5:46:43<20:34:54, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=10.89s]
Epoch 0: 22%|██▏ | 2715/12384 [5:46:50<20:34:54, 7.66s/it, loss=0.0001, acc=1.0000, iter_time=7.12s]
Epoch 0: 22%|██▏ | 2716/12384 [5:46:50<20:32:41, 7.65s/it, loss=0.0001, acc=1.0000, iter_time=7.12s]
Epoch 0: 22%|██▏ | 2716/12384 [5:46:58<20:32:41, 7.65s/it, loss=0.0003, acc=0.9999, iter_time=7.33s]
Epoch 0: 22%|██▏ | 2717/12384 [5:46:58<20:47:40, 7.74s/it, loss=0.0003, acc=0.9999, iter_time=7.33s]
Epoch 0: 22%|██▏ | 2717/12384 [5:47:06<20:47:40, 7.74s/it, loss=0.0003, acc=0.9991, iter_time=8.79s]
Epoch 0: 22%|██▏ | 2718/12384 [5:47:06<20:42:23, 7.71s/it, loss=0.0003, acc=0.9991, iter_time=8.79s]
Epoch 0: 22%|██▏ | 2718/12384 [5:47:14<20:42:23, 7.71s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 22%|██▏ | 2719/12384 [5:47:14<20:38:47, 7.69s/it, loss=0.0001, acc=1.0000, iter_time=7.65s]
Epoch 0: 22%|██▏ | 2719/12384 [5:47:21<20:38:47, 7.69s/it, loss=0.0004, acc=0.9978, iter_time=8.03s]
Epoch 0: 22%|██▏ | 2720/12384 [5:47:21<20:36:57, 7.68s/it, loss=0.0004, acc=0.9978, iter_time=8.03s]W0310 14:09:33.982000 62051 site-packages/torch/distributed/elastic/agent/server/api.py:725] Received 15 death signal, shutting down workers
+W0310 14:09:33.986000 62051 site-packages/torch/distributed/elastic/multiprocessing/api.py:908] Sending process 62184 closing signal SIGTERM
+W0310 14:09:33.987000 62051 site-packages/torch/distributed/elastic/multiprocessing/api.py:908] Sending process 62185 closing signal SIGTERM
+W0310 14:09:33.987000 62051 site-packages/torch/distributed/elastic/multiprocessing/api.py:908] Sending process 62186 closing signal SIGTERM
+W0310 14:09:33.987000 62051 site-packages/torch/distributed/elastic/multiprocessing/api.py:908] Sending process 62187 closing signal SIGTERM
+W0310 14:09:33.987000 62051 site-packages/torch/distributed/elastic/multiprocessing/api.py:908] Sending process 62188 closing signal SIGTERM
+W0310 14:09:33.988000 62051 site-packages/torch/distributed/elastic/multiprocessing/api.py:908] Sending process 62189 closing signal SIGTERM
+W0310 14:09:33.988000 62051 site-packages/torch/distributed/elastic/multiprocessing/api.py:908] Sending process 62190 closing signal SIGTERM
+W0310 14:09:33.988000 62051 site-packages/torch/distributed/elastic/multiprocessing/api.py:908] Sending process 62191 closing signal SIGTERM
+Traceback (most recent call last):
+ File "", line 198, in _run_module_as_main
+ File "", line 88, in _run_code
+ File "/workspace/hanrui/specforge/lib/python3.11/site-packages/torch/distributed/run.py", line 940, in
+ main()
+ File "/workspace/hanrui/specforge/lib/python3.11/site-packages/torch/distributed/elastic/multiprocessing/errors/__init__.py", line 357, in wrapper
+ return f(*args, **kwargs)
+ ^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/specforge/lib/python3.11/site-packages/torch/distributed/run.py", line 936, in main
+ run(args)
+ File "/workspace/hanrui/specforge/lib/python3.11/site-packages/torch/distributed/run.py", line 927, in run
+ elastic_launch(
+ File "/workspace/hanrui/specforge/lib/python3.11/site-packages/torch/distributed/launcher/api.py", line 156, in __call__
+ return launch_agent(self._config, self._entrypoint, list(args))
+ ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/specforge/lib/python3.11/site-packages/torch/distributed/launcher/api.py", line 284, in launch_agent
+ result = agent.run()
+ ^^^^^^^^^^^
+ File "/workspace/hanrui/specforge/lib/python3.11/site-packages/torch/distributed/elastic/metrics/api.py", line 138, in wrapper
+ result = f(*args, **kwargs)
+ ^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/specforge/lib/python3.11/site-packages/torch/distributed/elastic/agent/server/api.py", line 717, in run
+ result = self._invoke_run(role)
+ ^^^^^^^^^^^^^^^^^^^^^^
+ File "/workspace/hanrui/specforge/lib/python3.11/site-packages/torch/distributed/elastic/agent/server/api.py", line 881, in _invoke_run
+ time.sleep(monitor_interval)
+ File "/workspace/hanrui/specforge/lib/python3.11/site-packages/torch/distributed/elastic/multiprocessing/api.py", line 85, in _terminate_process_handler
+ raise SignalException(f"Process {os.getpid()} got signal: {sigval}", sigval=sigval)
+torch.distributed.elastic.multiprocessing.api.SignalException: Process 62051 got signal: 15
diff --git a/test/merge_lora.py b/test/merge_lora.py
new file mode 100644
index 0000000000000000000000000000000000000000..a0a17509a2455d5ae624a392490e753e1e325632
--- /dev/null
+++ b/test/merge_lora.py
@@ -0,0 +1,91 @@
+"""
+Step 1: Merge DFlash-LoRA adapter into base model.
+
+Usage:
+    conda activate sglang
+    python3 merge_lora.py
+    python3 merge_lora.py --ckpt epoch_2_step_15000 --force  # evaluate another checkpoint
+
+The merged model is written to --merged-path, which defaults to the same
+directory for every checkpoint. An existing output is kept (and the merge
+skipped) unless --force is passed.
+"""
+import argparse
+import os
+
+import torch
+from peft import PeftModel
+from transformers import AutoModelForCausalLM, AutoTokenizer
+
+BASE_MODEL = "/workspace/models/Qwen3-8B"
+OUTPUT_ROOT = "/workspace/hanrui/syxin_old/Specforge/outputs/qwen3-8b-sft-32gpu-v2"
+MERGE_ROOT = "/workspace/hanrui/syxin_old/Specforge/outputs/qwen3-8b-sft-32gpu-v2-merged"
+
+
+def parse_args():
+    """Parse the command-line options of the merge script."""
+    parser = argparse.ArgumentParser()
+    parser.add_argument(
+        "--ckpt",
+        default="epoch_0_step_3000",
+        help="Checkpoint folder name under OUTPUT_ROOT",
+    )
+    parser.add_argument(
+        "--merged-path",
+        default=MERGE_ROOT,
+        help="Where to save the merged model",
+    )
+    parser.add_argument(
+        "--force",
+        action="store_true",
+        help="Re-merge and overwrite even if --merged-path already exists",
+    )
+    return parser.parse_args()
+
+
+def main():
+    """Merge the selected LoRA checkpoint into BASE_MODEL and save it."""
+    args = parse_args()
+    adapter_path = os.path.join(OUTPUT_ROOT, args.ckpt)
+    merged_path = args.merged_path
+
+    # The output path does not depend on --ckpt, so an existing directory may
+    # hold a different checkpoint; say so instead of skipping silently.
+    if os.path.exists(merged_path) and not args.force:
+        print(f"[skip] Merged model already exists: {merged_path}")
+        print("       Pass --force to re-merge and overwrite it.")
+        return
+
+    # Explicit raise instead of assert: asserts are stripped under `python -O`.
+    if not os.path.isdir(adapter_path):
+        raise FileNotFoundError(f"Adapter not found: {adapter_path}")
+
+    print(f"Base model : {BASE_MODEL}")
+    print(f"Adapter : {adapter_path}")
+    print(f"Output : {merged_path}")
+    print()
+
+    print("[1/4] Loading base model to CPU ...")
+    model = AutoModelForCausalLM.from_pretrained(
+        BASE_MODEL,
+        torch_dtype=torch.bfloat16,
+        device_map="cpu",
+    )
+
+    print("[2/4] Loading LoRA adapter ...")
+    model = PeftModel.from_pretrained(model, adapter_path)
+
+    print("[3/4] Merging weights ...")
+    model = model.merge_and_unload()
+
+    print("[4/4] Saving merged model ...")
+    os.makedirs(merged_path, exist_ok=True)
+    model.save_pretrained(merged_path, safe_serialization=True)
+    # Save the base model's tokenizer alongside the merged weights.
+    AutoTokenizer.from_pretrained(BASE_MODEL).save_pretrained(merged_path)
+
+    print(f"\nDone. Merged model saved to: {merged_path}")
+
+
+if __name__ == "__main__":
+    main()
diff --git a/test/run_bench.sh b/test/run_bench.sh
new file mode 100644
index 0000000000000000000000000000000000000000..dbafc807d13b20adc67ebf004c2a71b0d40226b1
--- /dev/null
+++ b/test/run_bench.sh
@@ -0,0 +1,75 @@
+#!/bin/bash
+# Step 3: Run HumanEval / MT-Bench / GSM8K benchmarks.
+# Run AFTER start_server.sh is up.
+# Usage:
+#   bash run_bench.sh                 # all three benches, full dataset
+#   bash run_bench.sh humaneval       # only humaneval
+#   bash run_bench.sh mtbench gsm8k   # pick any subset
+
+# pipefail: otherwise the "python3 ... | tee" pipeline below reports tee's
+# exit status and a failed benchmark run would look successful.
+set -eo pipefail
+
+INTRANET_IP=10.1.1.72
+PORT=30000
+BASE_MODEL=/workspace/models/Qwen3-8B
+MERGED=/workspace/hanrui/syxin_old/Specforge/outputs/qwen3-8b-sft-32gpu-v2-merged
+BENCH_DIR=/workspace/hanrui/syxin_old/Specforge/benchmarks
+RESULT_DIR=$BENCH_DIR/results
+
+# ---- sanity check ----
+echo "Checking server at http://$INTRANET_IP:$PORT ..."
+curl -sf "http://$INTRANET_IP:$PORT/v1/models" > /dev/null || {
+    echo "[ERROR] Server not reachable. Start it first: bash start_server.sh"
+    exit 1
+}
+echo "Server OK."
+
+mkdir -p "$RESULT_DIR"
+cd "$BENCH_DIR"
+# Only append the previous PYTHONPATH when it is set, to avoid a dangling ":".
+export PYTHONPATH="/workspace/hanrui/syxin_old/Specforge${PYTHONPATH:+:$PYTHONPATH}"
+
+# ---- decide which benches to run ----
+TARGETS=("$@")
+if [ ${#TARGETS[@]} -eq 0 ]; then
+    TARGETS=(humaneval mtbench gsm8k)
+fi
+
+# Collected as an array so each bench spec is passed as its own argument
+# without relying on word splitting.
+BENCH_ARGS=()
+for t in "${TARGETS[@]}"; do
+    case $t in
+        humaneval) BENCH_ARGS+=("humaneval:164") ;;
+        mtbench)   BENCH_ARGS+=("mtbench:80") ;;
+        gsm8k)     BENCH_ARGS+=("gsm8k:1319") ;;
+        *)
+            echo "[ERROR] Unknown bench: $t (choices: humaneval mtbench gsm8k)"
+            exit 1
+            ;;
+    esac
+done
+
+TIMESTAMP=$(date +%Y%m%d_%H%M%S)
+echo "Running: ${BENCH_ARGS[*]}"
+echo "Results -> $RESULT_DIR"
+echo ""
+
+python3 bench_eagle3.py \
+    --model-path "$BASE_MODEL" \
+    --speculative-draft-model-path "$MERGED" \
+    --host "$INTRANET_IP" \
+    --port "$PORT" \
+    --config-list "16,4,1,4" \
+    --benchmark-list "${BENCH_ARGS[@]}" \
+    --output-dir "$RESULT_DIR" \
+    --name "dflash_lora_${TIMESTAMP}" \
+    --skip-launch-server \
+    2>&1 | tee "$RESULT_DIR/bench_${TIMESTAMP}.log"
+
+echo ""
+echo "Done. Latest result files:"
+# Best-effort listing: under "set -e" + pipefail a missing *.jsonl (ls fails)
+# must not turn a successful run into a failing exit status.
+ls -lht "$RESULT_DIR"/*.jsonl 2>/dev/null | head -5 || true
diff --git a/test/run_bench_dflash.sh b/test/run_bench_dflash.sh
new file mode 100644
index 0000000000000000000000000000000000000000..1c8f0d6d8d11b8db0a56cb9369a2ac633b74998c
--- /dev/null
+++ b/test/run_bench_dflash.sh
@@ -0,0 +1,75 @@
+#!/bin/bash
+# Run HumanEval / MT-Bench / GSM8K benchmarks for DFLASH speculative decoding.
+# Run AFTER start_server_dflash.sh is up.
+# Usage:
+#   bash run_bench_dflash.sh                 # all three benches, full dataset
+#   bash run_bench_dflash.sh humaneval       # only humaneval
+#   bash run_bench_dflash.sh mtbench gsm8k   # pick any subset
+
+# pipefail: otherwise the "python3 ... | tee" pipeline below reports tee's
+# exit status and a failed benchmark run would look successful.
+set -eo pipefail
+
+INTRANET_IP=10.1.1.22
+PORT=30000
+BASE_MODEL=/workspace/models/Qwen3-8B
+DRAFT_MODEL=/workspace/models/Qwen3-8B-DFlash-b16
+BENCH_DIR=/workspace/hanrui/syxin_old/Specforge/benchmarks
+RESULT_DIR=$BENCH_DIR/results
+
+# ---- sanity check ----
+echo "Checking server at http://$INTRANET_IP:$PORT ..."
+curl -sf "http://$INTRANET_IP:$PORT/v1/models" > /dev/null || {
+    echo "[ERROR] Server not reachable. Start it first: bash start_server_dflash.sh"
+    exit 1
+}
+echo "Server OK."
+
+mkdir -p "$RESULT_DIR"
+cd "$BENCH_DIR"
+# Only append the previous PYTHONPATH when it is set, to avoid a dangling ":".
+export PYTHONPATH="/workspace/hanrui/syxin_old/Specforge${PYTHONPATH:+:$PYTHONPATH}"
+
+# ---- decide which benches to run ----
+TARGETS=("$@")
+if [ ${#TARGETS[@]} -eq 0 ]; then
+    TARGETS=(humaneval mtbench gsm8k)
+fi
+
+# Collected as an array so each bench spec is passed as its own argument
+# without relying on word splitting.
+BENCH_ARGS=()
+for t in "${TARGETS[@]}"; do
+    case $t in
+        humaneval) BENCH_ARGS+=("humaneval:164") ;;
+        mtbench)   BENCH_ARGS+=("mtbench:80") ;;
+        gsm8k)     BENCH_ARGS+=("gsm8k:1319") ;;
+        *)
+            echo "[ERROR] Unknown bench: $t (choices: humaneval mtbench gsm8k)"
+            exit 1
+            ;;
+    esac
+done
+
+TIMESTAMP=$(date +%Y%m%d_%H%M%S)
+echo "Running: ${BENCH_ARGS[*]}"
+echo "Results -> $RESULT_DIR"
+echo ""
+
+/workspace/miniconda3/envs/dflash/bin/python3 bench_eagle3.py \
+    --model-path "$BASE_MODEL" \
+    --speculative-draft-model-path "$DRAFT_MODEL" \
+    --host "$INTRANET_IP" \
+    --port "$PORT" \
+    --config-list "16,4,1,4" \
+    --benchmark-list "${BENCH_ARGS[@]}" \
+    --output-dir "$RESULT_DIR" \
+    --name "dflash_b16_${TIMESTAMP}" \
+    --skip-launch-server \
+    2>&1 | tee "$RESULT_DIR/bench_dflash_b16_${TIMESTAMP}.log"
+
+echo ""
+echo "Done. Latest result files:"
+# Best-effort listing: under "set -e" + pipefail a missing *.jsonl (ls fails)
+# must not turn a successful run into a failing exit status.
+ls -lht "$RESULT_DIR"/*.jsonl 2>/dev/null | head -5 || true
diff --git a/test/start_server.sh b/test/start_server.sh
new file mode 100644
index 0000000000000000000000000000000000000000..657f8b018f7b31ef0d877ba41cc16a8c6df72198
--- /dev/null
+++ b/test/start_server.sh
@@ -0,0 +1,53 @@
+#!/bin/bash
+# Step 2: Launch SGLang server with STANDALONE speculative decoding.
+# Usage:
+#   bash start_server.sh
+#   bash start_server.sh 8   # use tp=8
+
+set -e
+
+# Tensor-parallel size; first positional argument, default 2.
+TP=${1:-2}
+
+BASE_MODEL=/workspace/models/Qwen3-8B
+MERGED=/workspace/hanrui/syxin_old/Specforge/outputs/qwen3-8b-sft-32gpu-v2-merged
+INTRANET_IP=10.1.1.72
+PORT=30000
+
+# Reject a malformed tp value here instead of failing later during server startup.
+case $TP in
+    ''|0|*[!0-9]*)
+        echo "[ERROR] tp must be a positive integer, got: '$TP'"
+        exit 1
+        ;;
+esac
+
+if [ ! -d "$MERGED" ]; then
+    echo "[ERROR] Merged model not found: $MERGED"
+    echo " Run: conda activate sglang && python3 merge_lora.py"
+    exit 1
+fi
+
+echo "============================================"
+echo " SGLang STANDALONE Speculative Decoding"
+echo " target : $BASE_MODEL"
+echo " draft : $MERGED"
+echo " host : $INTRANET_IP:$PORT"
+echo " tp : $TP"
+echo "============================================"
+
+# exec replaces this shell with the server process, so signals sent to the
+# script (Ctrl-C, kill) reach the server directly.
+exec /workspace/miniconda3/envs/sglang/bin/python3 -m sglang.launch_server \
+    --model-path "$BASE_MODEL" \
+    --speculative-algorithm STANDALONE \
+    --speculative-draft-model-path "$MERGED" \
+    --speculative-num-steps 4 \
+    --speculative-eagle-topk 1 \
+    --speculative-num-draft-tokens 4 \
+    --tp-size "$TP" \
+    --mem-fraction-static 0.30 \
+    --trust-remote-code \
+    --host "$INTRANET_IP" \
+    --port "$PORT" \
+    --dtype bfloat16
diff --git a/test/start_server_dflash.sh b/test/start_server_dflash.sh
new file mode 100644
index 0000000000000000000000000000000000000000..084fb826ed7bd25a2061d24b59daae5deb74db84
--- /dev/null
+++ b/test/start_server_dflash.sh
@@ -0,0 +1,53 @@
+#!/bin/bash
+# Launch SGLang server with DFLASH speculative decoding.
+# Usage:
+#   bash start_server_dflash.sh
+#   bash start_server_dflash.sh 4   # use tp=4
+
+set -e
+
+# Tensor-parallel size; first positional argument, default 2.
+TP=${1:-2}
+
+BASE_MODEL=/workspace/models/Qwen3-8B
+DRAFT_MODEL=/workspace/models/Qwen3-8B-DFlash-b16
+INTRANET_IP=10.1.1.22
+PORT=30000
+
+# Reject a malformed tp value here instead of failing later during server startup.
+case $TP in
+    ''|0|*[!0-9]*)
+        echo "[ERROR] tp must be a positive integer, got: '$TP'"
+        exit 1
+        ;;
+esac
+
+# Fail early with a clear message when the draft model directory is missing.
+if [ ! -d "$DRAFT_MODEL" ]; then
+    echo "[ERROR] Draft model not found: $DRAFT_MODEL"
+    exit 1
+fi
+
+echo "============================================"
+echo " SGLang DFLASH Speculative Decoding"
+echo " target : $BASE_MODEL"
+echo " draft : $DRAFT_MODEL"
+echo " host : $INTRANET_IP:$PORT"
+echo " tp : $TP"
+echo "============================================"
+
+export SGLANG_ALLOW_OVERWRITE_LONGER_CONTEXT_LEN=1
+
+# exec replaces this shell with the server process, so signals sent to the
+# script (Ctrl-C, kill) reach the server directly.
+exec /workspace/miniconda3/envs/dflash/bin/python -m sglang.launch_server \
+    --model-path "$BASE_MODEL" \
+    --speculative-algorithm DFLASH \
+    --speculative-draft-model-path "$DRAFT_MODEL" \
+    --tp-size "$TP" \
+    --dtype bfloat16 \
+    --attention-backend fa3 \
+    --mem-fraction-static 0.30 \
+    --trust-remote-code \
+    --host "$INTRANET_IP" \
+    --port "$PORT"